diff --git "a/wandb/run-20220228_204859-8xn2plkx/files/wandb-summary.json" "b/wandb/run-20220228_204859-8xn2plkx/files/wandb-summary.json" --- "a/wandb/run-20220228_204859-8xn2plkx/files/wandb-summary.json" +++ "b/wandb/run-20220228_204859-8xn2plkx/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.5598, "train/learning_rate": 5.92e-06, "train/epoch": 1.0, "train/global_step": 297, "_runtime": 4778, "_timestamp": 1646086117, "_step": 297, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 18.0, 136.0, 307.0, 339.0, 165.0, 40.0, 8.0, 3.0], "bins": [-198.99710083007812, -195.63198852539062, -192.26686096191406, -188.90174865722656, -185.53662109375, -182.1715087890625, -178.80638122558594, -175.44126892089844, -172.07614135742188, -168.71102905273438, -165.3459014892578, -161.9807891845703, -158.61566162109375, -155.25054931640625, -151.8854217529297, -148.5203094482422, -145.15518188476562, -141.79006958007812, -138.42494201660156, -135.05982971191406, -131.6947021484375, -128.32958984375, -124.96446228027344, -121.5993423461914, -118.2342300415039, -114.86911010742188, -111.50399017333984, -108.13887023925781, -104.77375030517578, -101.40863037109375, -98.04351043701172, -94.67839050292969, -91.31327056884766, -87.94815063476562, -84.5830307006836, -81.21791076660156, -77.85279083251953, -74.4876708984375, -71.12255096435547, -67.75743103027344, -64.3923110961914, -61.027191162109375, -57.662071228027344, -54.29695129394531, -50.93183135986328, -47.56671142578125, -44.20159149169922, -40.83647155761719, -37.47135543823242, -34.10623550415039, -30.74111557006836, -27.375995635986328, -24.010875701904297, -20.6457576751709, -17.280637741088867, -13.915517807006836, -10.550397872924805, -7.185277938842773, -3.8201584815979004, -0.45503902435302734, 2.910080909729004, 6.275199890136719, 9.64031982421875, 13.005439758300781, 16.370559692382812]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 7.0, 12.0, 9.0, 18.0, 17.0, 20.0, 20.0, 29.0, 35.0, 31.0, 40.0, 38.0, 43.0, 50.0, 42.0, 31.0, 38.0, 44.0, 42.0, 45.0, 48.0, 45.0, 39.0, 37.0, 19.0, 26.0, 26.0, 19.0, 16.0, 20.0, 11.0, 13.0, 11.0, 9.0, 11.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.525508880615234, -47.09046173095703, -45.65541458129883, -44.22036361694336, -42.785316467285156, -41.35026931762695, -39.91522216796875, -38.48017120361328, -37.04512405395508, -35.610076904296875, -34.17502975463867, -32.7399787902832, -31.304931640625, -29.869884490966797, -28.434837341308594, -26.999788284301758, -25.564741134643555, -24.12969398498535, -22.694644927978516, -21.259597778320312, -19.824548721313477, -18.389501571655273, -16.954452514648438, -15.519405364990234, -14.084357261657715, -12.649309158325195, -11.214261054992676, -9.779212951660156, -8.344165802001953, -6.909117221832275, -5.474069595336914, -4.0390214920043945, -2.603973388671875, -1.168925404548645, 0.26612257957458496, 1.7011704444885254, 3.136218547821045, 4.5712666511535645, 6.006314277648926, 7.441362380981445, 8.876410484313965, 10.311458587646484, 11.746506690979004, 13.181554794311523, 14.616601943969727, 16.051651000976562, 17.486698150634766, 18.92174530029297, 20.356794357299805, 21.791841506958008, 23.226890563964844, 24.661937713623047, 26.096986770629883, 27.532033920288086, 28.967082977294922, 30.402130126953125, 31.837177276611328, 33.27222442626953, 34.707271575927734, 36.1423225402832, 37.577369689941406, 39.01241683959961, 40.44746398925781, 41.88251495361328, 43.317562103271484]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 1.0, 6.0, 5.0, 16.0, 11.0, 22.0, 14.0, 19.0, 24.0, 27.0, 25.0, 34.0, 47.0, 43.0, 51.0, 56.0, 46.0, 41.0, 54.0, 57.0, 35.0, 44.0, 46.0, 30.0, 37.0, 32.0, 32.0, 28.0, 17.0, 15.0, 21.0, 16.0, 9.0, 11.0, 4.0, 4.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.906402587890625, -2.80303955078125, -2.699676513671875, -2.5963134765625, -2.492950439453125, -2.38958740234375, -2.286224365234375, -2.182861328125, -2.079498291015625, -1.97613525390625, -1.872772216796875, -1.7694091796875, -1.666046142578125, -1.56268310546875, -1.459320068359375, -1.35595703125, -1.252593994140625, -1.14923095703125, -1.045867919921875, -0.9425048828125, -0.839141845703125, -0.73577880859375, -0.632415771484375, -0.529052734375, -0.425689697265625, -0.32232666015625, -0.218963623046875, -0.1156005859375, -0.012237548828125, 0.09112548828125, 0.194488525390625, 0.2978515625, 0.401214599609375, 0.50457763671875, 0.607940673828125, 0.7113037109375, 0.814666748046875, 0.91802978515625, 1.021392822265625, 1.124755859375, 1.228118896484375, 1.33148193359375, 1.434844970703125, 1.5382080078125, 1.641571044921875, 1.74493408203125, 1.848297119140625, 1.95166015625, 2.055023193359375, 2.15838623046875, 2.261749267578125, 2.3651123046875, 2.468475341796875, 2.57183837890625, 2.675201416015625, 2.778564453125, 2.881927490234375, 2.98529052734375, 3.088653564453125, 3.1920166015625, 3.295379638671875, 3.39874267578125, 3.502105712890625, 3.60546875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 11.0, 16.0, 23.0, 45.0, 77.0, 101.0, 196.0, 245.0, 457.0, 802.0, 1606.0, 3407.0, 10055.0, 47288.0, 504506.0, 2939452.0, 612538.0, 54358.0, 11380.0, 3863.0, 1744.0, 862.0, 478.0, 267.0, 203.0, 107.0, 72.0, 45.0, 35.0, 16.0, 13.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2421875, -12.889404296875, -12.53662109375, -12.183837890625, -11.8310546875, -11.478271484375, -11.12548828125, -10.772705078125, -10.419921875, -10.067138671875, -9.71435546875, -9.361572265625, -9.0087890625, -8.656005859375, -8.30322265625, -7.950439453125, -7.59765625, -7.244873046875, -6.89208984375, -6.539306640625, -6.1865234375, -5.833740234375, -5.48095703125, -5.128173828125, -4.775390625, -4.422607421875, -4.06982421875, -3.717041015625, -3.3642578125, -3.011474609375, -2.65869140625, -2.305908203125, -1.953125, -1.600341796875, -1.24755859375, -0.894775390625, -0.5419921875, -0.189208984375, 0.16357421875, 0.516357421875, 0.869140625, 1.221923828125, 1.57470703125, 1.927490234375, 2.2802734375, 2.633056640625, 2.98583984375, 3.338623046875, 3.69140625, 4.044189453125, 4.39697265625, 4.749755859375, 5.1025390625, 5.455322265625, 5.80810546875, 6.160888671875, 6.513671875, 6.866455078125, 7.21923828125, 7.572021484375, 7.9248046875, 8.277587890625, 8.63037109375, 8.983154296875, 9.3359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 17.0, 16.0, 20.0, 36.0, 40.0, 53.0, 75.0, 136.0, 162.0, 249.0, 364.0, 529.0, 570.0, 520.0, 368.0, 282.0, 203.0, 123.0, 94.0, 61.0, 41.0, 25.0, 21.0, 18.0, 8.0, 5.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.515625, -13.111328125, -12.70703125, -12.302734375, -11.8984375, -11.494140625, -11.08984375, -10.685546875, -10.28125, -9.876953125, -9.47265625, -9.068359375, -8.6640625, -8.259765625, -7.85546875, -7.451171875, -7.046875, -6.642578125, -6.23828125, -5.833984375, -5.4296875, -5.025390625, -4.62109375, -4.216796875, -3.8125, -3.408203125, -3.00390625, -2.599609375, -2.1953125, -1.791015625, -1.38671875, -0.982421875, -0.578125, -0.173828125, 0.23046875, 0.634765625, 1.0390625, 1.443359375, 1.84765625, 2.251953125, 2.65625, 3.060546875, 3.46484375, 3.869140625, 4.2734375, 4.677734375, 5.08203125, 5.486328125, 5.890625, 6.294921875, 6.69921875, 7.103515625, 7.5078125, 7.912109375, 8.31640625, 8.720703125, 9.125, 9.529296875, 9.93359375, 10.337890625, 10.7421875, 11.146484375, 11.55078125, 11.955078125, 12.359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 11.0, 11.0, 17.0, 37.0, 49.0, 53.0, 101.0, 154.0, 271.0, 461.0, 957.0, 2154.0, 9341.0, 857523.0, 3298325.0, 19224.0, 3053.0, 1146.0, 591.0, 283.0, 182.0, 102.0, 69.0, 43.0, 32.0, 26.0, 15.0, 8.0, 7.0, 6.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.46875, -40.04541015625, -38.6220703125, -37.19873046875, -35.775390625, -34.35205078125, -32.9287109375, -31.50537109375, -30.08203125, -28.65869140625, -27.2353515625, -25.81201171875, -24.388671875, -22.96533203125, -21.5419921875, -20.11865234375, -18.6953125, -17.27197265625, -15.8486328125, -14.42529296875, -13.001953125, -11.57861328125, -10.1552734375, -8.73193359375, -7.30859375, -5.88525390625, -4.4619140625, -3.03857421875, -1.615234375, -0.19189453125, 1.2314453125, 2.65478515625, 4.078125, 5.50146484375, 6.9248046875, 8.34814453125, 9.771484375, 11.19482421875, 12.6181640625, 14.04150390625, 15.46484375, 16.88818359375, 18.3115234375, 19.73486328125, 21.158203125, 22.58154296875, 24.0048828125, 25.42822265625, 26.8515625, 28.27490234375, 29.6982421875, 31.12158203125, 32.544921875, 33.96826171875, 35.3916015625, 36.81494140625, 38.23828125, 39.66162109375, 41.0849609375, 42.50830078125, 43.931640625, 45.35498046875, 46.7783203125, 48.20166015625, 49.625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 42.0, 245.0, 426.0, 241.0, 41.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.0782012939453, -156.39073181152344, -152.70327758789062, -149.01580810546875, -145.32833862304688, -141.640869140625, -137.9534149169922, -134.2659454345703, -130.57847595214844, -126.8910140991211, -123.20354461669922, -119.51608276367188, -115.82861328125, -112.14115142822266, -108.45368957519531, -104.76622009277344, -101.0787582397461, -97.39129638671875, -93.70382690429688, -90.01636505126953, -86.32889556884766, -82.64143371582031, -78.95396423339844, -75.2665023803711, -71.57904052734375, -67.8915786743164, -64.20410919189453, -60.51664733886719, -56.82917785644531, -53.14171600341797, -49.45425033569336, -45.76678466796875, -42.079315185546875, -38.391849517822266, -34.704383850097656, -31.01692008972168, -27.32945442199707, -23.64198875427246, -19.954524993896484, -16.267059326171875, -12.579593658447266, -8.892127990722656, -5.204663276672363, -1.5171985626220703, 2.170267105102539, 5.857732772827148, 9.545196533203125, 13.232662200927734, 16.920127868652344, 20.607593536376953, 24.295059204101562, 27.98252296447754, 31.66998863220215, 35.357452392578125, 39.044918060302734, 42.732383728027344, 46.41984939575195, 50.10731506347656, 53.79478073120117, 57.48224639892578, 61.169708251953125, 64.857177734375, 68.54463958740234, 72.23210144042969, 75.91957092285156]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 7.0, 4.0, 3.0, 7.0, 7.0, 14.0, 12.0, 8.0, 11.0, 15.0, 13.0, 14.0, 27.0, 25.0, 30.0, 30.0, 35.0, 33.0, 29.0, 32.0, 38.0, 31.0, 32.0, 33.0, 38.0, 43.0, 30.0, 35.0, 38.0, 26.0, 39.0, 29.0, 34.0, 26.0, 22.0, 32.0, 16.0, 20.0, 15.0, 15.0, 13.0, 13.0, 7.0, 7.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.028709411621094, -33.95008850097656, -32.8714714050293, -31.7928524017334, -30.7142333984375, -29.6356143951416, -28.556995391845703, -27.478376388549805, -26.399757385253906, -25.321138381958008, -24.24251937866211, -23.16390037536621, -22.085281372070312, -21.006662368774414, -19.928043365478516, -18.849424362182617, -17.77080535888672, -16.69218635559082, -15.613567352294922, -14.534948348999023, -13.456329345703125, -12.377710342407227, -11.299091339111328, -10.22047233581543, -9.141853332519531, -8.063234329223633, -6.984615325927734, -5.905996322631836, -4.8273773193359375, -3.748758316040039, -2.6701393127441406, -1.5915203094482422, -0.5129051208496094, 0.5657138824462891, 1.6443328857421875, 2.722951889038086, 3.8015708923339844, 4.880189895629883, 5.958808898925781, 7.03742790222168, 8.116046905517578, 9.194665908813477, 10.273284912109375, 11.351903915405273, 12.430522918701172, 13.50914192199707, 14.587760925292969, 15.666379928588867, 16.744998931884766, 17.823617935180664, 18.902236938476562, 19.98085594177246, 21.05947494506836, 22.138093948364258, 23.216712951660156, 24.295331954956055, 25.373950958251953, 26.45256996154785, 27.53118896484375, 28.60980796813965, 29.688426971435547, 30.767045974731445, 31.845664978027344, 32.924285888671875, 34.00290298461914]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 2.0, 3.0, 9.0, 9.0, 4.0, 15.0, 19.0, 24.0, 24.0, 21.0, 26.0, 21.0, 30.0, 38.0, 39.0, 24.0, 42.0, 50.0, 46.0, 58.0, 41.0, 39.0, 35.0, 41.0, 37.0, 33.0, 35.0, 26.0, 28.0, 22.0, 20.0, 32.0, 11.0, 27.0, 10.0, 11.0, 14.0, 7.0, 3.0, 4.0, 5.0, 3.0, 4.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.333984375, -3.230377197265625, -3.12677001953125, -3.023162841796875, -2.9195556640625, -2.815948486328125, -2.71234130859375, -2.608734130859375, -2.505126953125, -2.401519775390625, -2.29791259765625, -2.194305419921875, -2.0906982421875, -1.987091064453125, -1.88348388671875, -1.779876708984375, -1.67626953125, -1.572662353515625, -1.46905517578125, -1.365447998046875, -1.2618408203125, -1.158233642578125, -1.05462646484375, -0.951019287109375, -0.847412109375, -0.743804931640625, -0.64019775390625, -0.536590576171875, -0.4329833984375, -0.329376220703125, -0.22576904296875, -0.122161865234375, -0.0185546875, 0.085052490234375, 0.18865966796875, 0.292266845703125, 0.3958740234375, 0.499481201171875, 0.60308837890625, 0.706695556640625, 0.810302734375, 0.913909912109375, 1.01751708984375, 1.121124267578125, 1.2247314453125, 1.328338623046875, 1.43194580078125, 1.535552978515625, 1.63916015625, 1.742767333984375, 1.84637451171875, 1.949981689453125, 2.0535888671875, 2.157196044921875, 2.26080322265625, 2.364410400390625, 2.468017578125, 2.571624755859375, 2.67523193359375, 2.778839111328125, 2.8824462890625, 2.986053466796875, 3.08966064453125, 3.193267822265625, 3.296875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 10.0, 18.0, 19.0, 25.0, 61.0, 62.0, 94.0, 120.0, 178.0, 277.0, 385.0, 589.0, 847.0, 1214.0, 1797.0, 2721.0, 4127.0, 6333.0, 9428.0, 14927.0, 22528.0, 35128.0, 55721.0, 94655.0, 192169.0, 302736.0, 117237.0, 66796.0, 41349.0, 26443.0, 17349.0, 11065.0, 7401.0, 4896.0, 3089.0, 2174.0, 1434.0, 955.0, 693.0, 471.0, 299.0, 211.0, 158.0, 98.0, 85.0, 58.0, 28.0, 33.0, 24.0, 10.0, 3.0, 9.0, 4.0, 3.0, 5.0, 0.0, 2.0], "bins": [-0.85986328125, -0.8331451416015625, -0.806427001953125, -0.7797088623046875, -0.75299072265625, -0.7262725830078125, -0.699554443359375, -0.6728363037109375, -0.6461181640625, -0.6194000244140625, -0.592681884765625, -0.5659637451171875, -0.53924560546875, -0.5125274658203125, -0.485809326171875, -0.4590911865234375, -0.432373046875, -0.4056549072265625, -0.378936767578125, -0.3522186279296875, -0.32550048828125, -0.2987823486328125, -0.272064208984375, -0.2453460693359375, -0.2186279296875, -0.1919097900390625, -0.165191650390625, -0.1384735107421875, -0.11175537109375, -0.0850372314453125, -0.058319091796875, -0.0316009521484375, -0.0048828125, 0.0218353271484375, 0.048553466796875, 0.0752716064453125, 0.10198974609375, 0.1287078857421875, 0.155426025390625, 0.1821441650390625, 0.2088623046875, 0.2355804443359375, 0.262298583984375, 0.2890167236328125, 0.31573486328125, 0.3424530029296875, 0.369171142578125, 0.3958892822265625, 0.422607421875, 0.4493255615234375, 0.476043701171875, 0.5027618408203125, 0.52947998046875, 0.5561981201171875, 0.582916259765625, 0.6096343994140625, 0.6363525390625, 0.6630706787109375, 0.689788818359375, 0.7165069580078125, 0.74322509765625, 0.7699432373046875, 0.796661376953125, 0.8233795166015625, 0.85009765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 5.0, 4.0, 6.0, 10.0, 9.0, 13.0, 16.0, 12.0, 22.0, 21.0, 14.0, 27.0, 24.0, 28.0, 42.0, 27.0, 42.0, 38.0, 44.0, 40.0, 38.0, 1060.0, 40.0, 37.0, 37.0, 31.0, 36.0, 30.0, 33.0, 33.0, 31.0, 20.0, 24.0, 27.0, 15.0, 12.0, 13.0, 7.0, 14.0, 9.0, 5.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9912109375, -1.9278717041015625, -1.864532470703125, -1.8011932373046875, -1.73785400390625, -1.6745147705078125, -1.611175537109375, -1.5478363037109375, -1.4844970703125, -1.4211578369140625, -1.357818603515625, -1.2944793701171875, -1.23114013671875, -1.1678009033203125, -1.104461669921875, -1.0411224365234375, -0.977783203125, -0.9144439697265625, -0.851104736328125, -0.7877655029296875, -0.72442626953125, -0.6610870361328125, -0.597747802734375, -0.5344085693359375, -0.4710693359375, -0.4077301025390625, -0.344390869140625, -0.2810516357421875, -0.21771240234375, -0.1543731689453125, -0.091033935546875, -0.0276947021484375, 0.03564453125, 0.0989837646484375, 0.162322998046875, 0.2256622314453125, 0.28900146484375, 0.3523406982421875, 0.415679931640625, 0.4790191650390625, 0.5423583984375, 0.6056976318359375, 0.669036865234375, 0.7323760986328125, 0.79571533203125, 0.8590545654296875, 0.922393798828125, 0.9857330322265625, 1.049072265625, 1.1124114990234375, 1.175750732421875, 1.2390899658203125, 1.30242919921875, 1.3657684326171875, 1.429107666015625, 1.4924468994140625, 1.5557861328125, 1.6191253662109375, 1.682464599609375, 1.7458038330078125, 1.80914306640625, 1.8724822998046875, 1.935821533203125, 1.9991607666015625, 2.0625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 6.0, 6.0, 19.0, 11.0, 24.0, 34.0, 59.0, 68.0, 114.0, 204.0, 272.0, 328.0, 533.0, 825.0, 1191.0, 1688.0, 2309.0, 3432.0, 4891.0, 7135.0, 10551.0, 15548.0, 23368.0, 35620.0, 54642.0, 86991.0, 156070.0, 1343173.0, 127896.0, 75728.0, 48120.0, 31549.0, 20589.0, 14036.0, 9282.0, 6342.0, 4438.0, 3083.0, 2188.0, 1493.0, 967.0, 751.0, 536.0, 344.0, 231.0, 155.0, 103.0, 76.0, 40.0, 38.0, 19.0, 9.0, 7.0, 5.0, 2.0, 7.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.74755859375, -0.7237167358398438, -0.6998748779296875, -0.6760330200195312, -0.652191162109375, -0.6283493041992188, -0.6045074462890625, -0.5806655883789062, -0.55682373046875, -0.5329818725585938, -0.5091400146484375, -0.48529815673828125, -0.461456298828125, -0.43761444091796875, -0.4137725830078125, -0.38993072509765625, -0.3660888671875, -0.34224700927734375, -0.3184051513671875, -0.29456329345703125, -0.270721435546875, -0.24687957763671875, -0.2230377197265625, -0.19919586181640625, -0.17535400390625, -0.15151214599609375, -0.1276702880859375, -0.10382843017578125, -0.079986572265625, -0.05614471435546875, -0.0323028564453125, -0.00846099853515625, 0.015380859375, 0.03922271728515625, 0.0630645751953125, 0.08690643310546875, 0.110748291015625, 0.13459014892578125, 0.1584320068359375, 0.18227386474609375, 0.20611572265625, 0.22995758056640625, 0.2537994384765625, 0.27764129638671875, 0.301483154296875, 0.32532501220703125, 0.3491668701171875, 0.37300872802734375, 0.3968505859375, 0.42069244384765625, 0.4445343017578125, 0.46837615966796875, 0.492218017578125, 0.5160598754882812, 0.5399017333984375, 0.5637435913085938, 0.58758544921875, 0.6114273071289062, 0.6352691650390625, 0.6591110229492188, 0.682952880859375, 0.7067947387695312, 0.7306365966796875, 0.7544784545898438, 0.7783203125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 7.0, 10.0, 12.0, 15.0, 16.0, 23.0, 18.0, 38.0, 29.0, 38.0, 62.0, 66.0, 62.0, 69.0, 81.0, 60.0, 55.0, 51.0, 48.0, 36.0, 30.0, 27.0, 15.0, 15.0, 15.0, 17.0, 17.0, 6.0, 5.0, 7.0, 5.0, 1.0, 7.0, 5.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011390447616577148, -0.00011033192276954651, -0.00010675936937332153, -0.00010318681597709656, -9.961426258087158e-05, -9.60417091846466e-05, -9.246915578842163e-05, -8.889660239219666e-05, -8.532404899597168e-05, -8.17514955997467e-05, -7.817894220352173e-05, -7.460638880729675e-05, -7.103383541107178e-05, -6.74612820148468e-05, -6.388872861862183e-05, -6.031617522239685e-05, -5.6743621826171875e-05, -5.31710684299469e-05, -4.9598515033721924e-05, -4.602596163749695e-05, -4.245340824127197e-05, -3.8880854845047e-05, -3.530830144882202e-05, -3.1735748052597046e-05, -2.816319465637207e-05, -2.4590641260147095e-05, -2.101808786392212e-05, -1.7445534467697144e-05, -1.3872981071472168e-05, -1.0300427675247192e-05, -6.727874279022217e-06, -3.155320882797241e-06, 4.172325134277344e-07, 3.98978590965271e-06, 7.5623393058776855e-06, 1.1134892702102661e-05, 1.4707446098327637e-05, 1.8279999494552612e-05, 2.1852552890777588e-05, 2.5425106287002563e-05, 2.899765968322754e-05, 3.2570213079452515e-05, 3.614276647567749e-05, 3.9715319871902466e-05, 4.328787326812744e-05, 4.686042666435242e-05, 5.043298006057739e-05, 5.400553345680237e-05, 5.7578086853027344e-05, 6.115064024925232e-05, 6.47231936454773e-05, 6.829574704170227e-05, 7.186830043792725e-05, 7.544085383415222e-05, 7.90134072303772e-05, 8.258596062660217e-05, 8.615851402282715e-05, 8.973106741905212e-05, 9.33036208152771e-05, 9.687617421150208e-05, 0.00010044872760772705, 0.00010402128100395203, 0.000107593834400177, 0.00011116638779640198, 0.00011473894119262695]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 10.0, 11.0, 6.0, 10.0, 8.0, 15.0, 17.0, 30.0, 31.0, 32.0, 42.0, 53.0, 94.0, 78.0, 127.0, 147.0, 200.0, 306.0, 443.0, 717.0, 3361.0, 1032620.0, 7675.0, 736.0, 470.0, 326.0, 211.0, 179.0, 126.0, 89.0, 61.0, 80.0, 44.0, 40.0, 31.0, 16.0, 20.0, 10.0, 11.0, 19.0, 10.0, 9.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0018186569213867188, -0.001759156584739685, -0.0016996562480926514, -0.0016401559114456177, -0.001580655574798584, -0.0015211552381515503, -0.0014616549015045166, -0.001402154564857483, -0.0013426542282104492, -0.0012831538915634155, -0.0012236535549163818, -0.0011641532182693481, -0.0011046528816223145, -0.0010451525449752808, -0.000985652208328247, -0.0009261518716812134, -0.0008666515350341797, -0.000807151198387146, -0.0007476508617401123, -0.0006881505250930786, -0.0006286501884460449, -0.0005691498517990112, -0.0005096495151519775, -0.00045014917850494385, -0.00039064884185791016, -0.00033114850521087646, -0.0002716481685638428, -0.00021214783191680908, -0.0001526474952697754, -9.31471586227417e-05, -3.364682197570801e-05, 2.5853514671325684e-05, 8.535385131835938e-05, 0.00014485418796539307, 0.00020435452461242676, 0.00026385486125946045, 0.00032335519790649414, 0.00038285553455352783, 0.0004423558712005615, 0.0005018562078475952, 0.0005613565444946289, 0.0006208568811416626, 0.0006803572177886963, 0.00073985755443573, 0.0007993578910827637, 0.0008588582277297974, 0.0009183585643768311, 0.0009778589010238647, 0.0010373592376708984, 0.0010968595743179321, 0.0011563599109649658, 0.0012158602476119995, 0.0012753605842590332, 0.001334860920906067, 0.0013943612575531006, 0.0014538615942001343, 0.001513361930847168, 0.0015728622674942017, 0.0016323626041412354, 0.001691862940788269, 0.0017513632774353027, 0.0018108636140823364, 0.0018703639507293701, 0.0019298642873764038, 0.0019893646240234375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 727.0, 289.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007530585280619562, -0.0007320598233491182, -0.0007110611186362803, -0.0006900624139234424, -0.0006690637674182653, -0.0006480650627054274, -0.0006270663579925895, -0.0006060676532797515, -0.0005850689485669136, -0.0005640702438540757, -0.0005430715391412377, -0.0005220728926360607, -0.0005010741879232228, -0.00048007548321038485, -0.0004590767784975469, -0.000438078073784709, -0.00041707942727953196, -0.000396080722566694, -0.00037508204695768654, -0.0003540833422448486, -0.00033308466663584113, -0.0003120859619230032, -0.00029108725721016526, -0.00027008855249732733, -0.00024908987688831985, -0.00022809118672739714, -0.00020709249656647444, -0.0001860937918536365, -0.0001650951016927138, -0.0001440964115317911, -0.00012309770681895316, -0.00010209901665803045, -8.110032649710774e-05, -6.010163269820623e-05, -3.910293889930472e-05, -1.8104241462424397e-05, 2.8944486984983087e-06, 2.3893138859421015e-05, 4.489184357225895e-05, 6.589053373318166e-05, 8.688922389410436e-05, 0.00010788791405502707, 0.00012888660421594977, 0.0001498853089287877, 0.00017088399908971041, 0.00019188268925063312, 0.00021288139396347106, 0.00023388008412439376, 0.00025487877428531647, 0.0002758774789981544, 0.0002968761546071619, 0.0003178748593199998, 0.0003388735349290073, 0.0003598722396418452, 0.00038087094435468316, 0.0004018696490675211, 0.0004228683246765286, 0.0004438670293893665, 0.000464865704998374, 0.0004858644097112119, 0.0005068631144240499, 0.0005278617609292269, 0.0005488605238497257, 0.0005698591703549027, 0.0005908578750677407]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 12.0, 5.0, 12.0, 9.0, 17.0, 12.0, 15.0, 18.0, 25.0, 30.0, 31.0, 29.0, 22.0, 36.0, 43.0, 30.0, 50.0, 38.0, 29.0, 51.0, 42.0, 31.0, 39.0, 41.0, 39.0, 30.0, 32.0, 29.0, 29.0, 17.0, 19.0, 19.0, 19.0, 17.0, 8.0, 10.0, 11.0, 10.0, 7.0, 9.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.358457565307617e-05, -5.179643630981445e-05, -5.0008296966552734e-05, -4.8220157623291016e-05, -4.64320182800293e-05, -4.464387893676758e-05, -4.285573959350586e-05, -4.106760025024414e-05, -3.927946090698242e-05, -3.74913215637207e-05, -3.5703182220458984e-05, -3.3915042877197266e-05, -3.212690353393555e-05, -3.0338764190673828e-05, -2.855062484741211e-05, -2.676248550415039e-05, -2.4974346160888672e-05, -2.3186206817626953e-05, -2.1398067474365234e-05, -1.9609928131103516e-05, -1.7821788787841797e-05, -1.6033649444580078e-05, -1.424551010131836e-05, -1.245737075805664e-05, -1.0669231414794922e-05, -8.881092071533203e-06, -7.092952728271484e-06, -5.304813385009766e-06, -3.516674041748047e-06, -1.7285346984863281e-06, 5.960464477539063e-08, 1.8477439880371094e-06, 3.635883331298828e-06, 5.424022674560547e-06, 7.212162017822266e-06, 9.000301361083984e-06, 1.0788440704345703e-05, 1.2576580047607422e-05, 1.436471939086914e-05, 1.615285873413086e-05, 1.7940998077392578e-05, 1.9729137420654297e-05, 2.1517276763916016e-05, 2.3305416107177734e-05, 2.5093555450439453e-05, 2.6881694793701172e-05, 2.866983413696289e-05, 3.045797348022461e-05, 3.224611282348633e-05, 3.403425216674805e-05, 3.5822391510009766e-05, 3.7610530853271484e-05, 3.93986701965332e-05, 4.118680953979492e-05, 4.297494888305664e-05, 4.476308822631836e-05, 4.655122756958008e-05, 4.83393669128418e-05, 5.0127506256103516e-05, 5.1915645599365234e-05, 5.370378494262695e-05, 5.549192428588867e-05, 5.728006362915039e-05, 5.906820297241211e-05, 6.085634231567383e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 2.0, 3.0, 9.0, 9.0, 4.0, 15.0, 19.0, 24.0, 24.0, 21.0, 26.0, 21.0, 30.0, 38.0, 39.0, 24.0, 42.0, 50.0, 46.0, 58.0, 41.0, 39.0, 35.0, 41.0, 37.0, 33.0, 35.0, 26.0, 28.0, 22.0, 20.0, 32.0, 11.0, 27.0, 10.0, 11.0, 14.0, 7.0, 3.0, 4.0, 5.0, 3.0, 4.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.333984375, -3.230377197265625, -3.12677001953125, -3.023162841796875, -2.9195556640625, -2.815948486328125, -2.71234130859375, -2.608734130859375, -2.505126953125, -2.401519775390625, -2.29791259765625, -2.194305419921875, -2.0906982421875, -1.987091064453125, -1.88348388671875, -1.779876708984375, -1.67626953125, -1.572662353515625, -1.46905517578125, -1.365447998046875, -1.2618408203125, -1.158233642578125, -1.05462646484375, -0.951019287109375, -0.847412109375, -0.743804931640625, -0.64019775390625, -0.536590576171875, -0.4329833984375, -0.329376220703125, -0.22576904296875, -0.122161865234375, -0.0185546875, 0.085052490234375, 0.18865966796875, 0.292266845703125, 0.3958740234375, 0.499481201171875, 0.60308837890625, 0.706695556640625, 0.810302734375, 0.913909912109375, 1.01751708984375, 1.121124267578125, 1.2247314453125, 1.328338623046875, 1.43194580078125, 1.535552978515625, 1.63916015625, 1.742767333984375, 1.84637451171875, 1.949981689453125, 2.0535888671875, 2.157196044921875, 2.26080322265625, 2.364410400390625, 2.468017578125, 2.571624755859375, 2.67523193359375, 2.778839111328125, 2.8824462890625, 2.986053466796875, 3.08966064453125, 3.193267822265625, 3.296875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 15.0, 15.0, 19.0, 15.0, 39.0, 41.0, 68.0, 56.0, 91.0, 126.0, 162.0, 221.0, 298.0, 387.0, 503.0, 673.0, 995.0, 1241.0, 1882.0, 2874.0, 4343.0, 7787.0, 16292.0, 59243.0, 560990.0, 320525.0, 37650.0, 12833.0, 6636.0, 3788.0, 2428.0, 1682.0, 1184.0, 895.0, 666.0, 453.0, 351.0, 263.0, 200.0, 145.0, 114.0, 92.0, 65.0, 48.0, 39.0, 26.0, 24.0, 15.0, 13.0, 11.0, 8.0, 8.0, 5.0, 1.0, 1.0, 3.0, 3.0], "bins": [-15.1171875, -14.6427001953125, -14.168212890625, -13.6937255859375, -13.21923828125, -12.7447509765625, -12.270263671875, -11.7957763671875, -11.3212890625, -10.8468017578125, -10.372314453125, -9.8978271484375, -9.42333984375, -8.9488525390625, -8.474365234375, -7.9998779296875, -7.525390625, -7.0509033203125, -6.576416015625, -6.1019287109375, -5.62744140625, -5.1529541015625, -4.678466796875, -4.2039794921875, -3.7294921875, -3.2550048828125, -2.780517578125, -2.3060302734375, -1.83154296875, -1.3570556640625, -0.882568359375, -0.4080810546875, 0.06640625, 0.5408935546875, 1.015380859375, 1.4898681640625, 1.96435546875, 2.4388427734375, 2.913330078125, 3.3878173828125, 3.8623046875, 4.3367919921875, 4.811279296875, 5.2857666015625, 5.76025390625, 6.2347412109375, 6.709228515625, 7.1837158203125, 7.658203125, 8.1326904296875, 8.607177734375, 9.0816650390625, 9.55615234375, 10.0306396484375, 10.505126953125, 10.9796142578125, 11.4541015625, 11.9285888671875, 12.403076171875, 12.8775634765625, 13.35205078125, 13.8265380859375, 14.301025390625, 14.7755126953125, 15.25]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 1.0, 6.0, 6.0, 12.0, 6.0, 12.0, 9.0, 18.0, 17.0, 14.0, 26.0, 19.0, 23.0, 37.0, 32.0, 26.0, 36.0, 52.0, 79.0, 119.0, 214.0, 1337.0, 301.0, 165.0, 83.0, 64.0, 43.0, 38.0, 34.0, 34.0, 34.0, 37.0, 23.0, 16.0, 6.0, 14.0, 10.0, 8.0, 7.0, 5.0, 2.0, 11.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.6875, -11.370849609375, -11.05419921875, -10.737548828125, -10.4208984375, -10.104248046875, -9.78759765625, -9.470947265625, -9.154296875, -8.837646484375, -8.52099609375, -8.204345703125, -7.8876953125, -7.571044921875, -7.25439453125, -6.937744140625, -6.62109375, -6.304443359375, -5.98779296875, -5.671142578125, -5.3544921875, -5.037841796875, -4.72119140625, -4.404541015625, -4.087890625, -3.771240234375, -3.45458984375, -3.137939453125, -2.8212890625, -2.504638671875, -2.18798828125, -1.871337890625, -1.5546875, -1.238037109375, -0.92138671875, -0.604736328125, -0.2880859375, 0.028564453125, 0.34521484375, 0.661865234375, 0.978515625, 1.295166015625, 1.61181640625, 1.928466796875, 2.2451171875, 2.561767578125, 2.87841796875, 3.195068359375, 3.51171875, 3.828369140625, 4.14501953125, 4.461669921875, 4.7783203125, 5.094970703125, 5.41162109375, 5.728271484375, 6.044921875, 6.361572265625, 6.67822265625, 6.994873046875, 7.3115234375, 7.628173828125, 7.94482421875, 8.261474609375, 8.578125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 5.0, 3.0, 3.0, 10.0, 4.0, 12.0, 11.0, 7.0, 13.0, 23.0, 23.0, 40.0, 38.0, 47.0, 50.0, 112.0, 170.0, 495.0, 1884.0, 261235.0, 2876437.0, 3566.0, 751.0, 282.0, 123.0, 69.0, 59.0, 31.0, 31.0, 32.0, 24.0, 24.0, 14.0, 19.0, 12.0, 7.0, 7.0, 7.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.28125, -36.92138671875, -35.5615234375, -34.20166015625, -32.841796875, -31.48193359375, -30.1220703125, -28.76220703125, -27.40234375, -26.04248046875, -24.6826171875, -23.32275390625, -21.962890625, -20.60302734375, -19.2431640625, -17.88330078125, -16.5234375, -15.16357421875, -13.8037109375, -12.44384765625, -11.083984375, -9.72412109375, -8.3642578125, -7.00439453125, -5.64453125, -4.28466796875, -2.9248046875, -1.56494140625, -0.205078125, 1.15478515625, 2.5146484375, 3.87451171875, 5.234375, 6.59423828125, 7.9541015625, 9.31396484375, 10.673828125, 12.03369140625, 13.3935546875, 14.75341796875, 16.11328125, 17.47314453125, 18.8330078125, 20.19287109375, 21.552734375, 22.91259765625, 24.2724609375, 25.63232421875, 26.9921875, 28.35205078125, 29.7119140625, 31.07177734375, 32.431640625, 33.79150390625, 35.1513671875, 36.51123046875, 37.87109375, 39.23095703125, 40.5908203125, 41.95068359375, 43.310546875, 44.67041015625, 46.0302734375, 47.39013671875, 48.75]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 36.0, 978.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.64373779296875, -133.6239013671875, -120.60406494140625, -107.584228515625, -94.56439208984375, -81.54454803466797, -68.52471160888672, -55.50487518310547, -42.48503875732422, -29.46520233154297, -16.445363998413086, -3.425525665283203, 9.594310760498047, 22.614151000976562, 35.63398742675781, 48.65382385253906, 61.67366027832031, 74.69349670410156, 87.71333312988281, 100.73316955566406, 113.75300598144531, 126.7728500366211, 139.79269409179688, 152.81253051757812, 165.83236694335938, 178.85220336914062, 191.87203979492188, 204.89187622070312, 217.91171264648438, 230.93154907226562, 243.95138549804688, 256.9712219238281, 269.9910583496094, 283.0108947753906, 296.0307312011719, 309.0505676269531, 322.0704040527344, 335.0902404785156, 348.1100769042969, 361.1299133300781, 374.1497497558594, 387.1695861816406, 400.1894226074219, 413.2092590332031, 426.2290954589844, 439.2489318847656, 452.2687683105469, 465.2886047363281, 478.3084716796875, 491.32830810546875, 504.34814453125, 517.3679809570312, 530.3878173828125, 543.4076538085938, 556.427490234375, 569.4473266601562, 582.4671630859375, 595.4869995117188, 608.5068359375, 621.5266723632812, 634.5465087890625, 647.5663452148438, 660.586181640625, 673.6060180664062, 686.6258544921875]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 1.0, 11.0, 6.0, 6.0, 8.0, 11.0, 15.0, 15.0, 22.0, 19.0, 15.0, 14.0, 30.0, 25.0, 26.0, 23.0, 40.0, 31.0, 40.0, 38.0, 42.0, 42.0, 40.0, 36.0, 36.0, 38.0, 45.0, 37.0, 33.0, 31.0, 25.0, 21.0, 27.0, 16.0, 21.0, 15.0, 15.0, 16.0, 15.0, 11.0, 7.0, 13.0, 5.0, 7.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.29164695739746, -30.18182373046875, -29.071998596191406, -27.962175369262695, -26.852352142333984, -25.74252700805664, -24.63270378112793, -23.52288055419922, -22.413055419921875, -21.303232192993164, -20.19340705871582, -19.08358383178711, -17.973758697509766, -16.863935470581055, -15.754112243652344, -14.644288063049316, -13.534463882446289, -12.424639701843262, -11.314815521240234, -10.204992294311523, -9.095168113708496, -7.985343933105469, -6.8755202293396, -5.7656965255737305, -4.655872344970703, -3.546048402786255, -2.4362244606018066, -1.3264005184173584, -0.21657657623291016, 0.8932476043701172, 2.0030713081359863, 3.1128950119018555, 4.222721099853516, 5.332545280456543, 6.442368984222412, 7.552192687988281, 8.662016868591309, 9.771841049194336, 10.881664276123047, 11.991488456726074, 13.101312637329102, 14.211136817932129, 15.320960998535156, 16.430784225463867, 17.540607452392578, 18.650432586669922, 19.760255813598633, 20.870079040527344, 21.979904174804688, 23.0897274017334, 24.199552536010742, 25.309375762939453, 26.419200897216797, 27.529024124145508, 28.63884735107422, 29.748672485351562, 30.858495712280273, 31.968318939208984, 33.07814407348633, 34.18796920776367, 35.29779052734375, 36.407615661621094, 37.51744079589844, 38.627262115478516, 39.73708724975586]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 8.0, 5.0, 8.0, 10.0, 15.0, 20.0, 25.0, 12.0, 27.0, 36.0, 19.0, 20.0, 31.0, 50.0, 44.0, 41.0, 43.0, 49.0, 58.0, 35.0, 27.0, 40.0, 37.0, 36.0, 26.0, 33.0, 35.0, 33.0, 24.0, 21.0, 21.0, 17.0, 17.0, 11.0, 7.0, 12.0, 12.0, 4.0, 5.0, 7.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.298828125, -3.188140869140625, -3.07745361328125, -2.966766357421875, -2.8560791015625, -2.745391845703125, -2.63470458984375, -2.524017333984375, -2.413330078125, -2.302642822265625, -2.19195556640625, -2.081268310546875, -1.9705810546875, -1.859893798828125, -1.74920654296875, -1.638519287109375, -1.52783203125, -1.417144775390625, -1.30645751953125, -1.195770263671875, -1.0850830078125, -0.974395751953125, -0.86370849609375, -0.753021240234375, -0.642333984375, -0.531646728515625, -0.42095947265625, -0.310272216796875, -0.1995849609375, -0.088897705078125, 0.02178955078125, 0.132476806640625, 0.2431640625, 0.353851318359375, 0.46453857421875, 0.575225830078125, 0.6859130859375, 0.796600341796875, 0.90728759765625, 1.017974853515625, 1.128662109375, 1.239349365234375, 1.35003662109375, 1.460723876953125, 1.5714111328125, 1.682098388671875, 1.79278564453125, 1.903472900390625, 2.01416015625, 2.124847412109375, 2.23553466796875, 2.346221923828125, 2.4569091796875, 2.567596435546875, 2.67828369140625, 2.788970947265625, 2.899658203125, 3.010345458984375, 3.12103271484375, 3.231719970703125, 3.3424072265625, 3.453094482421875, 3.56378173828125, 3.674468994140625, 3.78515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 11.0, 11.0, 9.0, 30.0, 22.0, 38.0, 44.0, 70.0, 71.0, 138.0, 165.0, 318.0, 481.0, 772.0, 1411.0, 2662.0, 5556.0, 12726.0, 38588.0, 278339.0, 2982182.0, 770815.0, 66083.0, 18015.0, 7503.0, 3554.0, 1839.0, 1039.0, 584.0, 365.0, 247.0, 174.0, 111.0, 71.0, 50.0, 50.0, 31.0, 24.0, 18.0, 16.0, 14.0, 7.0, 9.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-15.4296875, -14.9425048828125, -14.455322265625, -13.9681396484375, -13.48095703125, -12.9937744140625, -12.506591796875, -12.0194091796875, -11.5322265625, -11.0450439453125, -10.557861328125, -10.0706787109375, -9.58349609375, -9.0963134765625, -8.609130859375, -8.1219482421875, -7.634765625, -7.1475830078125, -6.660400390625, -6.1732177734375, -5.68603515625, -5.1988525390625, -4.711669921875, -4.2244873046875, -3.7373046875, -3.2501220703125, -2.762939453125, -2.2757568359375, -1.78857421875, -1.3013916015625, -0.814208984375, -0.3270263671875, 0.16015625, 0.6473388671875, 1.134521484375, 1.6217041015625, 2.10888671875, 2.5960693359375, 3.083251953125, 3.5704345703125, 4.0576171875, 4.5447998046875, 5.031982421875, 5.5191650390625, 6.00634765625, 6.4935302734375, 6.980712890625, 7.4678955078125, 7.955078125, 8.4422607421875, 8.929443359375, 9.4166259765625, 9.90380859375, 10.3909912109375, 10.878173828125, 11.3653564453125, 11.8525390625, 12.3397216796875, 12.826904296875, 13.3140869140625, 13.80126953125, 14.2884521484375, 14.775634765625, 15.2628173828125, 15.75]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 9.0, 10.0, 16.0, 22.0, 31.0, 41.0, 53.0, 82.0, 117.0, 143.0, 256.0, 337.0, 469.0, 555.0, 528.0, 439.0, 323.0, 194.0, 126.0, 110.0, 62.0, 49.0, 28.0, 22.0, 15.0, 15.0, 8.0, 8.0, 1.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.40625, -20.86962890625, -20.3330078125, -19.79638671875, -19.259765625, -18.72314453125, -18.1865234375, -17.64990234375, -17.11328125, -16.57666015625, -16.0400390625, -15.50341796875, -14.966796875, -14.43017578125, -13.8935546875, -13.35693359375, -12.8203125, -12.28369140625, -11.7470703125, -11.21044921875, -10.673828125, -10.13720703125, -9.6005859375, -9.06396484375, -8.52734375, -7.99072265625, -7.4541015625, -6.91748046875, -6.380859375, -5.84423828125, -5.3076171875, -4.77099609375, -4.234375, -3.69775390625, -3.1611328125, -2.62451171875, -2.087890625, -1.55126953125, -1.0146484375, -0.47802734375, 0.05859375, 0.59521484375, 1.1318359375, 1.66845703125, 2.205078125, 2.74169921875, 3.2783203125, 3.81494140625, 4.3515625, 4.88818359375, 5.4248046875, 5.96142578125, 6.498046875, 7.03466796875, 7.5712890625, 8.10791015625, 8.64453125, 9.18115234375, 9.7177734375, 10.25439453125, 10.791015625, 11.32763671875, 11.8642578125, 12.40087890625, 12.9375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 11.0, 7.0, 11.0, 12.0, 19.0, 27.0, 33.0, 34.0, 61.0, 64.0, 115.0, 182.0, 285.0, 854.0, 6765.0, 3666562.0, 515396.0, 2512.0, 542.0, 271.0, 162.0, 118.0, 67.0, 52.0, 30.0, 30.0, 13.0, 10.0, 12.0, 8.0, 4.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.78125, -43.68505859375, -41.5888671875, -39.49267578125, -37.396484375, -35.30029296875, -33.2041015625, -31.10791015625, -29.01171875, -26.91552734375, -24.8193359375, -22.72314453125, -20.626953125, -18.53076171875, -16.4345703125, -14.33837890625, -12.2421875, -10.14599609375, -8.0498046875, -5.95361328125, -3.857421875, -1.76123046875, 0.3349609375, 2.43115234375, 4.52734375, 6.62353515625, 8.7197265625, 10.81591796875, 12.912109375, 15.00830078125, 17.1044921875, 19.20068359375, 21.296875, 23.39306640625, 25.4892578125, 27.58544921875, 29.681640625, 31.77783203125, 33.8740234375, 35.97021484375, 38.06640625, 40.16259765625, 42.2587890625, 44.35498046875, 46.451171875, 48.54736328125, 50.6435546875, 52.73974609375, 54.8359375, 56.93212890625, 59.0283203125, 61.12451171875, 63.220703125, 65.31689453125, 67.4130859375, 69.50927734375, 71.60546875, 73.70166015625, 75.7978515625, 77.89404296875, 79.990234375, 82.08642578125, 84.1826171875, 86.27880859375, 88.375]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 64.0, 780.0, 169.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.50341033935547, -53.95943069458008, -44.41545104980469, -34.87147521972656, -25.327495574951172, -15.783515930175781, -6.239540100097656, 3.304443359375, 12.848419189453125, 22.392398834228516, 31.936376571655273, 41.48035430908203, 51.02433395385742, 60.56831359863281, 70.11228942871094, 79.6562728881836, 89.20024871826172, 98.74422454833984, 108.2882080078125, 117.83218383789062, 127.37615966796875, 136.92013549804688, 146.464111328125, 156.0081024169922, 165.5520782470703, 175.09605407714844, 184.64002990722656, 194.18402099609375, 203.72799682617188, 213.27197265625, 222.81594848632812, 232.35992431640625, 241.90390014648438, 251.4478759765625, 260.9918518066406, 270.53582763671875, 280.0798034667969, 289.623779296875, 299.16778564453125, 308.7117614746094, 318.2557373046875, 327.7997131347656, 337.34368896484375, 346.8876647949219, 356.431640625, 365.97564697265625, 375.51959228515625, 385.0635986328125, 394.6075439453125, 404.1515197753906, 413.69549560546875, 423.2394714355469, 432.783447265625, 442.32745361328125, 451.87139892578125, 461.4154052734375, 470.9593811035156, 480.50335693359375, 490.0473327636719, 499.59130859375, 509.1352844238281, 518.6792602539062, 528.2232666015625, 537.7672119140625, 547.3112182617188]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 7.0, 4.0, 10.0, 8.0, 10.0, 11.0, 11.0, 20.0, 18.0, 15.0, 19.0, 29.0, 36.0, 24.0, 35.0, 31.0, 35.0, 34.0, 22.0, 40.0, 42.0, 29.0, 45.0, 33.0, 34.0, 31.0, 38.0, 30.0, 33.0, 31.0, 28.0, 16.0, 22.0, 22.0, 20.0, 15.0, 22.0, 10.0, 19.0, 7.0, 6.0, 2.0, 9.0, 6.0, 3.0, 9.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-42.270423889160156, -40.95475387573242, -39.63908386230469, -38.32341384887695, -37.00774383544922, -35.692073822021484, -34.37640380859375, -33.06072998046875, -31.74506187438965, -30.429391860961914, -29.11372184753418, -27.798051834106445, -26.482379913330078, -25.166709899902344, -23.85103988647461, -22.535369873046875, -21.21969985961914, -19.904029846191406, -18.588359832763672, -17.272689819335938, -15.957018852233887, -14.641348838806152, -13.325677871704102, -12.010007858276367, -10.694337844848633, -9.378667831420898, -8.062997817993164, -6.747326850891113, -5.431656837463379, -4.1159868240356445, -2.800316333770752, -1.4846458435058594, -0.168975830078125, 1.1466944217681885, 2.462364673614502, 3.7780349254608154, 5.093705177307129, 6.409375190734863, 7.725045680999756, 9.040716171264648, 10.356386184692383, 11.672056198120117, 12.987726211547852, 14.303397178649902, 15.619067192077637, 16.934738159179688, 18.250408172607422, 19.566078186035156, 20.88174819946289, 22.197418212890625, 23.51308822631836, 24.828758239746094, 26.144428253173828, 27.460098266601562, 28.77577018737793, 30.091440200805664, 31.4071102142334, 32.722782135009766, 34.0384521484375, 35.354122161865234, 36.66979217529297, 37.9854621887207, 39.30113220214844, 40.61680221557617, 41.932472229003906]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 6.0, 2.0, 2.0, 16.0, 15.0, 13.0, 23.0, 18.0, 6.0, 18.0, 24.0, 20.0, 27.0, 31.0, 30.0, 31.0, 44.0, 37.0, 43.0, 44.0, 34.0, 39.0, 52.0, 25.0, 32.0, 31.0, 30.0, 29.0, 24.0, 24.0, 30.0, 23.0, 32.0, 20.0, 19.0, 14.0, 11.0, 9.0, 12.0, 6.0, 8.0, 10.0, 8.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.25, -3.14715576171875, -3.0443115234375, -2.94146728515625, -2.838623046875, -2.73577880859375, -2.6329345703125, -2.53009033203125, -2.42724609375, -2.32440185546875, -2.2215576171875, -2.11871337890625, -2.015869140625, -1.91302490234375, -1.8101806640625, -1.70733642578125, -1.6044921875, -1.50164794921875, -1.3988037109375, -1.29595947265625, -1.193115234375, -1.09027099609375, -0.9874267578125, -0.88458251953125, -0.78173828125, -0.67889404296875, -0.5760498046875, -0.47320556640625, -0.370361328125, -0.26751708984375, -0.1646728515625, -0.06182861328125, 0.041015625, 0.14385986328125, 0.2467041015625, 0.34954833984375, 0.452392578125, 0.55523681640625, 0.6580810546875, 0.76092529296875, 0.86376953125, 0.96661376953125, 1.0694580078125, 1.17230224609375, 1.275146484375, 1.37799072265625, 1.4808349609375, 1.58367919921875, 1.6865234375, 1.78936767578125, 1.8922119140625, 1.99505615234375, 2.097900390625, 2.20074462890625, 2.3035888671875, 2.40643310546875, 2.50927734375, 2.61212158203125, 2.7149658203125, 2.81781005859375, 2.920654296875, 3.02349853515625, 3.1263427734375, 3.22918701171875, 3.33203125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 2.0, 5.0, 4.0, 12.0, 18.0, 36.0, 33.0, 38.0, 66.0, 122.0, 116.0, 172.0, 264.0, 380.0, 512.0, 698.0, 994.0, 1296.0, 1743.0, 2424.0, 3374.0, 4762.0, 6478.0, 9266.0, 13340.0, 18666.0, 27201.0, 41229.0, 64518.0, 107018.0, 256166.0, 203177.0, 98931.0, 59962.0, 38630.0, 25858.0, 17721.0, 12247.0, 8490.0, 6252.0, 4581.0, 3313.0, 2344.0, 1711.0, 1232.0, 931.0, 639.0, 453.0, 353.0, 220.0, 153.0, 129.0, 93.0, 50.0, 44.0, 34.0, 26.0, 17.0, 8.0, 7.0, 5.0, 2.0, 4.0], "bins": [-0.7900390625, -0.765289306640625, -0.74053955078125, -0.715789794921875, -0.6910400390625, -0.666290283203125, -0.64154052734375, -0.616790771484375, -0.592041015625, -0.567291259765625, -0.54254150390625, -0.517791748046875, -0.4930419921875, -0.468292236328125, -0.44354248046875, -0.418792724609375, -0.39404296875, -0.369293212890625, -0.34454345703125, -0.319793701171875, -0.2950439453125, -0.270294189453125, -0.24554443359375, -0.220794677734375, -0.196044921875, -0.171295166015625, -0.14654541015625, -0.121795654296875, -0.0970458984375, -0.072296142578125, -0.04754638671875, -0.022796630859375, 0.001953125, 0.026702880859375, 0.05145263671875, 0.076202392578125, 0.1009521484375, 0.125701904296875, 0.15045166015625, 0.175201416015625, 0.199951171875, 0.224700927734375, 0.24945068359375, 0.274200439453125, 0.2989501953125, 0.323699951171875, 0.34844970703125, 0.373199462890625, 0.39794921875, 0.422698974609375, 0.44744873046875, 0.472198486328125, 0.4969482421875, 0.521697998046875, 0.54644775390625, 0.571197509765625, 0.595947265625, 0.620697021484375, 0.64544677734375, 0.670196533203125, 0.6949462890625, 0.719696044921875, 0.74444580078125, 0.769195556640625, 0.7939453125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 10.0, 7.0, 8.0, 7.0, 6.0, 15.0, 18.0, 16.0, 20.0, 24.0, 27.0, 25.0, 26.0, 36.0, 42.0, 47.0, 54.0, 39.0, 44.0, 1060.0, 32.0, 42.0, 42.0, 34.0, 32.0, 23.0, 35.0, 30.0, 25.0, 28.0, 22.0, 23.0, 20.0, 19.0, 17.0, 16.0, 12.0, 11.0, 6.0, 5.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.23828125, -2.163482666015625, -2.08868408203125, -2.013885498046875, -1.9390869140625, -1.864288330078125, -1.78948974609375, -1.714691162109375, -1.639892578125, -1.565093994140625, -1.49029541015625, -1.415496826171875, -1.3406982421875, -1.265899658203125, -1.19110107421875, -1.116302490234375, -1.04150390625, -0.966705322265625, -0.89190673828125, -0.817108154296875, -0.7423095703125, -0.667510986328125, -0.59271240234375, -0.517913818359375, -0.443115234375, -0.368316650390625, -0.29351806640625, -0.218719482421875, -0.1439208984375, -0.069122314453125, 0.00567626953125, 0.080474853515625, 0.1552734375, 0.230072021484375, 0.30487060546875, 0.379669189453125, 0.4544677734375, 0.529266357421875, 0.60406494140625, 0.678863525390625, 0.753662109375, 0.828460693359375, 0.90325927734375, 0.978057861328125, 1.0528564453125, 1.127655029296875, 1.20245361328125, 1.277252197265625, 1.35205078125, 1.426849365234375, 1.50164794921875, 1.576446533203125, 1.6512451171875, 1.726043701171875, 1.80084228515625, 1.875640869140625, 1.950439453125, 2.025238037109375, 2.10003662109375, 2.174835205078125, 2.2496337890625, 2.324432373046875, 2.39923095703125, 2.474029541015625, 2.548828125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 0.0, 4.0, 4.0, 7.0, 8.0, 14.0, 20.0, 44.0, 38.0, 66.0, 97.0, 119.0, 212.0, 299.0, 457.0, 647.0, 1020.0, 1495.0, 2223.0, 3179.0, 4570.0, 6797.0, 10323.0, 15437.0, 23050.0, 35779.0, 55869.0, 91366.0, 174691.0, 1341643.0, 123395.0, 71856.0, 45241.0, 29295.0, 19148.0, 12478.0, 8482.0, 5762.0, 3910.0, 2559.0, 1819.0, 1209.0, 822.0, 536.0, 382.0, 241.0, 180.0, 122.0, 88.0, 46.0, 30.0, 23.0, 18.0, 8.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.86328125, -0.8347549438476562, -0.8062286376953125, -0.7777023315429688, -0.749176025390625, -0.7206497192382812, -0.6921234130859375, -0.6635971069335938, -0.63507080078125, -0.6065444946289062, -0.5780181884765625, -0.5494918823242188, -0.520965576171875, -0.49243927001953125, -0.4639129638671875, -0.43538665771484375, -0.4068603515625, -0.37833404541015625, -0.3498077392578125, -0.32128143310546875, -0.292755126953125, -0.26422882080078125, -0.2357025146484375, -0.20717620849609375, -0.17864990234375, -0.15012359619140625, -0.1215972900390625, -0.09307098388671875, -0.064544677734375, -0.03601837158203125, -0.0074920654296875, 0.02103424072265625, 0.049560546875, 0.07808685302734375, 0.1066131591796875, 0.13513946533203125, 0.163665771484375, 0.19219207763671875, 0.2207183837890625, 0.24924468994140625, 0.27777099609375, 0.30629730224609375, 0.3348236083984375, 0.36334991455078125, 0.391876220703125, 0.42040252685546875, 0.4489288330078125, 0.47745513916015625, 0.5059814453125, 0.5345077514648438, 0.5630340576171875, 0.5915603637695312, 0.620086669921875, 0.6486129760742188, 0.6771392822265625, 0.7056655883789062, 0.73419189453125, 0.7627182006835938, 0.7912445068359375, 0.8197708129882812, 0.848297119140625, 0.8768234252929688, 0.9053497314453125, 0.9338760375976562, 0.96240234375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 12.0, 15.0, 20.0, 30.0, 24.0, 27.0, 38.0, 39.0, 46.0, 57.0, 63.0, 73.0, 61.0, 75.0, 57.0, 49.0, 49.0, 44.0, 24.0, 29.0, 19.0, 12.0, 27.0, 18.0, 11.0, 12.0, 13.0, 3.0, 6.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00011473894119262695, -0.00011072959750890732, -0.00010672025382518768, -0.00010271091014146805, -9.870156645774841e-05, -9.469222277402878e-05, -9.068287909030914e-05, -8.667353540658951e-05, -8.266419172286987e-05, -7.865484803915024e-05, -7.46455043554306e-05, -7.063616067171097e-05, -6.662681698799133e-05, -6.26174733042717e-05, -5.860812962055206e-05, -5.459878593683243e-05, -5.058944225311279e-05, -4.658009856939316e-05, -4.257075488567352e-05, -3.856141120195389e-05, -3.455206751823425e-05, -3.054272383451462e-05, -2.6533380150794983e-05, -2.2524036467075348e-05, -1.8514692783355713e-05, -1.4505349099636078e-05, -1.0496005415916443e-05, -6.486661732196808e-06, -2.477318048477173e-06, 1.5320256352424622e-06, 5.541369318962097e-06, 9.550713002681732e-06, 1.3560056686401367e-05, 1.7569400370121002e-05, 2.1578744053840637e-05, 2.5588087737560272e-05, 2.9597431421279907e-05, 3.360677510499954e-05, 3.761611878871918e-05, 4.162546247243881e-05, 4.563480615615845e-05, 4.964414983987808e-05, 5.365349352359772e-05, 5.766283720731735e-05, 6.167218089103699e-05, 6.568152457475662e-05, 6.969086825847626e-05, 7.370021194219589e-05, 7.770955562591553e-05, 8.171889930963516e-05, 8.57282429933548e-05, 8.973758667707443e-05, 9.374693036079407e-05, 9.77562740445137e-05, 0.00010176561772823334, 0.00010577496141195297, 0.00010978430509567261, 0.00011379364877939224, 0.00011780299246311188, 0.00012181233614683151, 0.00012582167983055115, 0.00012983102351427078, 0.00013384036719799042, 0.00013784971088171005, 0.0001418590545654297]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 9.0, 16.0, 16.0, 21.0, 15.0, 28.0, 43.0, 59.0, 65.0, 104.0, 106.0, 169.0, 254.0, 549.0, 1401.0, 994990.0, 48751.0, 764.0, 388.0, 213.0, 142.0, 115.0, 98.0, 57.0, 43.0, 33.0, 14.0, 14.0, 12.0, 9.0, 10.0, 7.0, 6.0, 5.0, 5.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0030956268310546875, -0.003004014492034912, -0.0029124021530151367, -0.0028207898139953613, -0.002729177474975586, -0.0026375651359558105, -0.002545952796936035, -0.0024543404579162598, -0.0023627281188964844, -0.002271115779876709, -0.0021795034408569336, -0.002087891101837158, -0.001996278762817383, -0.0019046664237976074, -0.001813054084777832, -0.0017214417457580566, -0.0016298294067382812, -0.0015382170677185059, -0.0014466047286987305, -0.001354992389678955, -0.0012633800506591797, -0.0011717677116394043, -0.001080155372619629, -0.0009885430335998535, -0.0008969306945800781, -0.0008053183555603027, -0.0007137060165405273, -0.000622093677520752, -0.0005304813385009766, -0.00043886899948120117, -0.0003472566604614258, -0.0002556443214416504, -0.000164031982421875, -7.241964340209961e-05, 1.919269561767578e-05, 0.00011080503463745117, 0.00020241737365722656, 0.00029402971267700195, 0.00038564205169677734, 0.00047725439071655273, 0.0005688667297363281, 0.0006604790687561035, 0.0007520914077758789, 0.0008437037467956543, 0.0009353160858154297, 0.001026928424835205, 0.0011185407638549805, 0.0012101531028747559, 0.0013017654418945312, 0.0013933777809143066, 0.001484990119934082, 0.0015766024589538574, 0.0016682147979736328, 0.0017598271369934082, 0.0018514394760131836, 0.001943051815032959, 0.0020346641540527344, 0.0021262764930725098, 0.002217888832092285, 0.0023095011711120605, 0.002401113510131836, 0.0024927258491516113, 0.0025843381881713867, 0.002675950527191162, 0.0027675628662109375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 9.0, 44.0, 146.0, 341.0, 295.0, 145.0, 29.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.087855869438499e-05, -8.47978371893987e-05, -7.871711568441242e-05, -7.263638690346852e-05, -6.655566539848223e-05, -6.047494389349595e-05, -5.4394218750530854e-05, -4.831349360756576e-05, -4.2232772102579474e-05, -3.615205059759319e-05, -3.0071325454628095e-05, -2.3990602130652405e-05, -1.7909878806676716e-05, -1.1829155482701026e-05, -5.748432158725336e-06, 3.3229298423975706e-07, 6.413014489226043e-06, 1.2493737813201733e-05, 1.8574461137177423e-05, 2.4655184461153112e-05, 3.07359077851288e-05, 3.681662929011509e-05, 4.289735443308018e-05, 4.8978079576045275e-05, 5.505880108103156e-05, 6.113952258601785e-05, 6.722024409100413e-05, 7.330097287194803e-05, 7.938169437693432e-05, 8.54624158819206e-05, 9.15431446628645e-05, 9.762386616785079e-05, 0.00010370457312092185, 0.00010978529462590814, 0.00011586601613089442, 0.00012194674491183832, 0.000128027459140867, 0.0001341081951977685, 0.0001401889167027548, 0.00014626963820774108, 0.00015235035971272737, 0.00015843108121771365, 0.00016451180272269994, 0.00017059252422768623, 0.00017667326028458774, 0.00018275398178957403, 0.0001888347032945603, 0.0001949154247995466, 0.00020099614630453289, 0.00020707686780951917, 0.00021315758931450546, 0.00021923831081949174, 0.00022531903232447803, 0.00023139976838137954, 0.00023748048988636583, 0.00024356121139135212, 0.00024964194744825363, 0.0002557226689532399, 0.0002618033904582262, 0.0002678841119632125, 0.0002739648334681988, 0.00028004555497318506, 0.00028612627647817135, 0.00029220699798315763, 0.0002982877194881439]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 8.0, 4.0, 4.0, 3.0, 8.0, 13.0, 10.0, 7.0, 10.0, 21.0, 19.0, 28.0, 21.0, 25.0, 27.0, 41.0, 46.0, 33.0, 35.0, 50.0, 41.0, 50.0, 33.0, 37.0, 31.0, 27.0, 44.0, 31.0, 33.0, 26.0, 35.0, 35.0, 16.0, 22.0, 22.0, 16.0, 17.0, 14.0, 13.0, 11.0, 6.0, 6.0, 2.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.878376007080078e-05, -6.67748972773552e-05, -6.476603448390961e-05, -6.275717169046402e-05, -6.074830889701843e-05, -5.8739446103572845e-05, -5.673058331012726e-05, -5.472172051668167e-05, -5.2712857723236084e-05, -5.07039949297905e-05, -4.869513213634491e-05, -4.668626934289932e-05, -4.4677406549453735e-05, -4.266854375600815e-05, -4.065968096256256e-05, -3.8650818169116974e-05, -3.664195537567139e-05, -3.46330925822258e-05, -3.262422978878021e-05, -3.0615366995334625e-05, -2.8606504201889038e-05, -2.659764140844345e-05, -2.4588778614997864e-05, -2.2579915821552277e-05, -2.057105302810669e-05, -1.8562190234661102e-05, -1.6553327441215515e-05, -1.4544464647769928e-05, -1.253560185432434e-05, -1.0526739060878754e-05, -8.517876267433167e-06, -6.509013473987579e-06, -4.500150680541992e-06, -2.491287887096405e-06, -4.824250936508179e-07, 1.5264376997947693e-06, 3.5353004932403564e-06, 5.544163286685944e-06, 7.553026080131531e-06, 9.561888873577118e-06, 1.1570751667022705e-05, 1.3579614460468292e-05, 1.558847725391388e-05, 1.7597340047359467e-05, 1.9606202840805054e-05, 2.161506563425064e-05, 2.3623928427696228e-05, 2.5632791221141815e-05, 2.7641654014587402e-05, 2.965051680803299e-05, 3.165937960147858e-05, 3.3668242394924164e-05, 3.567710518836975e-05, 3.768596798181534e-05, 3.9694830775260925e-05, 4.170369356870651e-05, 4.37125563621521e-05, 4.572141915559769e-05, 4.7730281949043274e-05, 4.973914474248886e-05, 5.174800753593445e-05, 5.3756870329380035e-05, 5.576573312282562e-05, 5.777459591627121e-05, 5.97834587097168e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 6.0, 2.0, 2.0, 16.0, 15.0, 13.0, 23.0, 18.0, 6.0, 18.0, 24.0, 20.0, 27.0, 31.0, 30.0, 31.0, 44.0, 37.0, 43.0, 44.0, 34.0, 39.0, 52.0, 25.0, 32.0, 31.0, 30.0, 29.0, 24.0, 24.0, 30.0, 23.0, 32.0, 20.0, 19.0, 14.0, 11.0, 9.0, 12.0, 6.0, 8.0, 10.0, 8.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.25, -3.14715576171875, -3.0443115234375, -2.94146728515625, -2.838623046875, -2.73577880859375, -2.6329345703125, -2.53009033203125, -2.42724609375, -2.32440185546875, -2.2215576171875, -2.11871337890625, -2.015869140625, -1.91302490234375, -1.8101806640625, -1.70733642578125, -1.6044921875, -1.50164794921875, -1.3988037109375, -1.29595947265625, -1.193115234375, -1.09027099609375, -0.9874267578125, -0.88458251953125, -0.78173828125, -0.67889404296875, -0.5760498046875, -0.47320556640625, -0.370361328125, -0.26751708984375, -0.1646728515625, -0.06182861328125, 0.041015625, 0.14385986328125, 0.2467041015625, 0.34954833984375, 0.452392578125, 0.55523681640625, 0.6580810546875, 0.76092529296875, 0.86376953125, 0.96661376953125, 1.0694580078125, 1.17230224609375, 1.275146484375, 1.37799072265625, 1.4808349609375, 1.58367919921875, 1.6865234375, 1.78936767578125, 1.8922119140625, 1.99505615234375, 2.097900390625, 2.20074462890625, 2.3035888671875, 2.40643310546875, 2.50927734375, 2.61212158203125, 2.7149658203125, 2.81781005859375, 2.920654296875, 3.02349853515625, 3.1263427734375, 3.22918701171875, 3.33203125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 10.0, 11.0, 7.0, 11.0, 17.0, 33.0, 45.0, 48.0, 76.0, 97.0, 106.0, 193.0, 240.0, 382.0, 536.0, 958.0, 1571.0, 2864.0, 5414.0, 11324.0, 25337.0, 60278.0, 144792.0, 276952.0, 272063.0, 139933.0, 57820.0, 24250.0, 10893.0, 5277.0, 2753.0, 1478.0, 927.0, 550.0, 391.0, 248.0, 186.0, 126.0, 98.0, 69.0, 50.0, 40.0, 26.0, 19.0, 16.0, 9.0, 9.0, 7.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.921875, -3.802947998046875, -3.68402099609375, -3.565093994140625, -3.4461669921875, -3.327239990234375, -3.20831298828125, -3.089385986328125, -2.970458984375, -2.851531982421875, -2.73260498046875, -2.613677978515625, -2.4947509765625, -2.375823974609375, -2.25689697265625, -2.137969970703125, -2.01904296875, -1.900115966796875, -1.78118896484375, -1.662261962890625, -1.5433349609375, -1.424407958984375, -1.30548095703125, -1.186553955078125, -1.067626953125, -0.948699951171875, -0.82977294921875, -0.710845947265625, -0.5919189453125, -0.472991943359375, -0.35406494140625, -0.235137939453125, -0.1162109375, 0.002716064453125, 0.12164306640625, 0.240570068359375, 0.3594970703125, 0.478424072265625, 0.59735107421875, 0.716278076171875, 0.835205078125, 0.954132080078125, 1.07305908203125, 1.191986083984375, 1.3109130859375, 1.429840087890625, 1.54876708984375, 1.667694091796875, 1.78662109375, 1.905548095703125, 2.02447509765625, 2.143402099609375, 2.2623291015625, 2.381256103515625, 2.50018310546875, 2.619110107421875, 2.738037109375, 2.856964111328125, 2.97589111328125, 3.094818115234375, 3.2137451171875, 3.332672119140625, 3.45159912109375, 3.570526123046875, 3.689453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 9.0, 4.0, 5.0, 11.0, 19.0, 10.0, 11.0, 9.0, 22.0, 20.0, 31.0, 27.0, 29.0, 29.0, 30.0, 49.0, 36.0, 76.0, 114.0, 257.0, 1425.0, 243.0, 105.0, 75.0, 60.0, 44.0, 45.0, 40.0, 32.0, 22.0, 21.0, 18.0, 17.0, 18.0, 17.0, 17.0, 12.0, 15.0, 3.0, 4.0, 12.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.875, -13.483642578125, -13.09228515625, -12.700927734375, -12.3095703125, -11.918212890625, -11.52685546875, -11.135498046875, -10.744140625, -10.352783203125, -9.96142578125, -9.570068359375, -9.1787109375, -8.787353515625, -8.39599609375, -8.004638671875, -7.61328125, -7.221923828125, -6.83056640625, -6.439208984375, -6.0478515625, -5.656494140625, -5.26513671875, -4.873779296875, -4.482421875, -4.091064453125, -3.69970703125, -3.308349609375, -2.9169921875, -2.525634765625, -2.13427734375, -1.742919921875, -1.3515625, -0.960205078125, -0.56884765625, -0.177490234375, 0.2138671875, 0.605224609375, 0.99658203125, 1.387939453125, 1.779296875, 2.170654296875, 2.56201171875, 2.953369140625, 3.3447265625, 3.736083984375, 4.12744140625, 4.518798828125, 4.91015625, 5.301513671875, 5.69287109375, 6.084228515625, 6.4755859375, 6.866943359375, 7.25830078125, 7.649658203125, 8.041015625, 8.432373046875, 8.82373046875, 9.215087890625, 9.6064453125, 9.997802734375, 10.38916015625, 10.780517578125, 11.171875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 0.0, 4.0, 4.0, 5.0, 12.0, 7.0, 8.0, 15.0, 15.0, 16.0, 15.0, 21.0, 27.0, 34.0, 29.0, 48.0, 71.0, 102.0, 160.0, 295.0, 643.0, 2562.0, 115445.0, 2995505.0, 27837.0, 1603.0, 504.0, 210.0, 138.0, 91.0, 49.0, 44.0, 30.0, 36.0, 13.0, 21.0, 11.0, 11.0, 19.0, 15.0, 6.0, 7.0, 8.0, 7.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.703125, -21.87353515625, -21.0439453125, -20.21435546875, -19.384765625, -18.55517578125, -17.7255859375, -16.89599609375, -16.06640625, -15.23681640625, -14.4072265625, -13.57763671875, -12.748046875, -11.91845703125, -11.0888671875, -10.25927734375, -9.4296875, -8.60009765625, -7.7705078125, -6.94091796875, -6.111328125, -5.28173828125, -4.4521484375, -3.62255859375, -2.79296875, -1.96337890625, -1.1337890625, -0.30419921875, 0.525390625, 1.35498046875, 2.1845703125, 3.01416015625, 3.84375, 4.67333984375, 5.5029296875, 6.33251953125, 7.162109375, 7.99169921875, 8.8212890625, 9.65087890625, 10.48046875, 11.31005859375, 12.1396484375, 12.96923828125, 13.798828125, 14.62841796875, 15.4580078125, 16.28759765625, 17.1171875, 17.94677734375, 18.7763671875, 19.60595703125, 20.435546875, 21.26513671875, 22.0947265625, 22.92431640625, 23.75390625, 24.58349609375, 25.4130859375, 26.24267578125, 27.072265625, 27.90185546875, 28.7314453125, 29.56103515625, 30.390625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 42.0, 949.0, 25.0, 0.0, 1.0], "bins": [-371.7919006347656, -365.6394348144531, -359.48699951171875, -353.33453369140625, -347.1820983886719, -341.0296325683594, -334.877197265625, -328.7247314453125, -322.5722961425781, -316.4198303222656, -310.26739501953125, -304.11492919921875, -297.9624938964844, -291.8100280761719, -285.6575927734375, -279.505126953125, -273.3526916503906, -267.2002258300781, -261.04779052734375, -254.8953399658203, -248.74288940429688, -242.59043884277344, -236.43798828125, -230.28553771972656, -224.13307189941406, -217.98062133789062, -211.8281707763672, -205.67572021484375, -199.5232696533203, -193.37081909179688, -187.21836853027344, -181.06591796875, -174.91348266601562, -168.7610321044922, -162.60858154296875, -156.4561309814453, -150.30368041992188, -144.15122985839844, -137.998779296875, -131.84632873535156, -125.6938705444336, -119.54141998291016, -113.38896942138672, -107.23651885986328, -101.08406829833984, -94.9316177368164, -88.77915954589844, -82.626708984375, -76.47425842285156, -70.32180786132812, -64.16935729980469, -58.01690673828125, -51.86445617675781, -45.712005615234375, -39.55955123901367, -33.407100677490234, -27.25465202331543, -21.102201461791992, -14.949749946594238, -8.797298431396484, -2.644847869873047, 3.5076026916503906, 9.660055160522461, 15.812505722045898, 21.964956283569336]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 4.0, 4.0, 7.0, 5.0, 10.0, 12.0, 23.0, 17.0, 14.0, 21.0, 28.0, 20.0, 29.0, 35.0, 31.0, 36.0, 38.0, 48.0, 39.0, 48.0, 39.0, 36.0, 44.0, 46.0, 32.0, 39.0, 44.0, 27.0, 27.0, 26.0, 22.0, 15.0, 29.0, 17.0, 12.0, 15.0, 15.0, 8.0, 4.0, 7.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.935726165771484, -38.70370864868164, -37.4716911315918, -36.23966979980469, -35.007652282714844, -33.775634765625, -32.543617248535156, -31.311599731445312, -30.079580307006836, -28.847562789916992, -27.615543365478516, -26.383525848388672, -25.151508331298828, -23.91948890686035, -22.687471389770508, -21.45545196533203, -20.223434448242188, -18.991416931152344, -17.759397506713867, -16.527379989624023, -15.295361518859863, -14.063343048095703, -12.83132553100586, -11.5993070602417, -10.367288589477539, -9.135270118713379, -7.903252124786377, -6.671234130859375, -5.439215660095215, -4.207197189331055, -2.9751791954040527, -1.7431612014770508, -0.5111465454101562, 0.7208716869354248, 1.9528899192810059, 3.184908151626587, 4.416926383972168, 5.648944854736328, 6.88096284866333, 8.112980842590332, 9.344999313354492, 10.577017784118652, 11.809036254882812, 13.041053771972656, 14.273072242736816, 15.505090713500977, 16.73710823059082, 17.969127655029297, 19.20114517211914, 20.433162689208984, 21.66518211364746, 22.897199630737305, 24.12921905517578, 25.361236572265625, 26.59325408935547, 27.825271606445312, 29.05729103088379, 30.289308547973633, 31.52132797241211, 32.75334548950195, 33.9853630065918, 35.217384338378906, 36.44940185546875, 37.681419372558594, 38.91343688964844]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 9.0, 12.0, 13.0, 16.0, 14.0, 15.0, 19.0, 15.0, 18.0, 23.0, 28.0, 19.0, 34.0, 27.0, 29.0, 47.0, 39.0, 39.0, 37.0, 35.0, 49.0, 45.0, 29.0, 33.0, 34.0, 31.0, 22.0, 32.0, 25.0, 29.0, 13.0, 24.0, 24.0, 21.0, 15.0, 10.0, 8.0, 8.0, 9.0, 8.0, 7.0, 7.0, 7.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.33984375, -3.23284912109375, -3.1258544921875, -3.01885986328125, -2.911865234375, -2.80487060546875, -2.6978759765625, -2.59088134765625, -2.48388671875, -2.37689208984375, -2.2698974609375, -2.16290283203125, -2.055908203125, -1.94891357421875, -1.8419189453125, -1.73492431640625, -1.6279296875, -1.52093505859375, -1.4139404296875, -1.30694580078125, -1.199951171875, -1.09295654296875, -0.9859619140625, -0.87896728515625, -0.77197265625, -0.66497802734375, -0.5579833984375, -0.45098876953125, -0.343994140625, -0.23699951171875, -0.1300048828125, -0.02301025390625, 0.083984375, 0.19097900390625, 0.2979736328125, 0.40496826171875, 0.511962890625, 0.61895751953125, 0.7259521484375, 0.83294677734375, 0.93994140625, 1.04693603515625, 1.1539306640625, 1.26092529296875, 1.367919921875, 1.47491455078125, 1.5819091796875, 1.68890380859375, 1.7958984375, 1.90289306640625, 2.0098876953125, 2.11688232421875, 2.223876953125, 2.33087158203125, 2.4378662109375, 2.54486083984375, 2.65185546875, 2.75885009765625, 2.8658447265625, 2.97283935546875, 3.079833984375, 3.18682861328125, 3.2938232421875, 3.40081787109375, 3.5078125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 4.0, 8.0, 7.0, 8.0, 11.0, 22.0, 24.0, 27.0, 37.0, 39.0, 52.0, 66.0, 109.0, 171.0, 334.0, 781.0, 2591.0, 16538.0, 289811.0, 2990276.0, 848806.0, 38028.0, 4293.0, 1102.0, 412.0, 223.0, 94.0, 87.0, 67.0, 49.0, 54.0, 24.0, 24.0, 15.0, 17.0, 11.0, 12.0, 6.0, 5.0, 3.0, 10.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-13.9296875, -13.5032958984375, -13.076904296875, -12.6505126953125, -12.22412109375, -11.7977294921875, -11.371337890625, -10.9449462890625, -10.5185546875, -10.0921630859375, -9.665771484375, -9.2393798828125, -8.81298828125, -8.3865966796875, -7.960205078125, -7.5338134765625, -7.107421875, -6.6810302734375, -6.254638671875, -5.8282470703125, -5.40185546875, -4.9754638671875, -4.549072265625, -4.1226806640625, -3.6962890625, -3.2698974609375, -2.843505859375, -2.4171142578125, -1.99072265625, -1.5643310546875, -1.137939453125, -0.7115478515625, -0.28515625, 0.1412353515625, 0.567626953125, 0.9940185546875, 1.42041015625, 1.8468017578125, 2.273193359375, 2.6995849609375, 3.1259765625, 3.5523681640625, 3.978759765625, 4.4051513671875, 4.83154296875, 5.2579345703125, 5.684326171875, 6.1107177734375, 6.537109375, 6.9635009765625, 7.389892578125, 7.8162841796875, 8.24267578125, 8.6690673828125, 9.095458984375, 9.5218505859375, 9.9482421875, 10.3746337890625, 10.801025390625, 11.2274169921875, 11.65380859375, 12.0802001953125, 12.506591796875, 12.9329833984375, 13.359375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 4.0, 10.0, 14.0, 18.0, 26.0, 40.0, 60.0, 81.0, 131.0, 168.0, 221.0, 316.0, 444.0, 506.0, 541.0, 433.0, 293.0, 232.0, 155.0, 118.0, 75.0, 63.0, 36.0, 35.0, 16.0, 9.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.585693359375, -16.12451171875, -15.663330078125, -15.2021484375, -14.740966796875, -14.27978515625, -13.818603515625, -13.357421875, -12.896240234375, -12.43505859375, -11.973876953125, -11.5126953125, -11.051513671875, -10.59033203125, -10.129150390625, -9.66796875, -9.206787109375, -8.74560546875, -8.284423828125, -7.8232421875, -7.362060546875, -6.90087890625, -6.439697265625, -5.978515625, -5.517333984375, -5.05615234375, -4.594970703125, -4.1337890625, -3.672607421875, -3.21142578125, -2.750244140625, -2.2890625, -1.827880859375, -1.36669921875, -0.905517578125, -0.4443359375, 0.016845703125, 0.47802734375, 0.939208984375, 1.400390625, 1.861572265625, 2.32275390625, 2.783935546875, 3.2451171875, 3.706298828125, 4.16748046875, 4.628662109375, 5.08984375, 5.551025390625, 6.01220703125, 6.473388671875, 6.9345703125, 7.395751953125, 7.85693359375, 8.318115234375, 8.779296875, 9.240478515625, 9.70166015625, 10.162841796875, 10.6240234375, 11.085205078125, 11.54638671875, 12.007568359375, 12.46875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 13.0, 21.0, 25.0, 34.0, 65.0, 106.0, 160.0, 305.0, 703.0, 2678.0, 114570.0, 4006486.0, 65466.0, 2268.0, 624.0, 280.0, 163.0, 110.0, 65.0, 46.0, 17.0, 23.0, 11.0, 10.0, 8.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.9375, -29.4248046875, -27.912109375, -26.3994140625, -24.88671875, -23.3740234375, -21.861328125, -20.3486328125, -18.8359375, -17.3232421875, -15.810546875, -14.2978515625, -12.78515625, -11.2724609375, -9.759765625, -8.2470703125, -6.734375, -5.2216796875, -3.708984375, -2.1962890625, -0.68359375, 0.8291015625, 2.341796875, 3.8544921875, 5.3671875, 6.8798828125, 8.392578125, 9.9052734375, 11.41796875, 12.9306640625, 14.443359375, 15.9560546875, 17.46875, 18.9814453125, 20.494140625, 22.0068359375, 23.51953125, 25.0322265625, 26.544921875, 28.0576171875, 29.5703125, 31.0830078125, 32.595703125, 34.1083984375, 35.62109375, 37.1337890625, 38.646484375, 40.1591796875, 41.671875, 43.1845703125, 44.697265625, 46.2099609375, 47.72265625, 49.2353515625, 50.748046875, 52.2607421875, 53.7734375, 55.2861328125, 56.798828125, 58.3115234375, 59.82421875, 61.3369140625, 62.849609375, 64.3623046875, 65.875]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 19.0, 14.0, 24.0, 42.0, 42.0, 60.0, 91.0, 88.0, 96.0, 80.0, 99.0, 82.0, 81.0, 56.0, 48.0, 41.0, 15.0, 12.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.902835845947266, -35.79629898071289, -34.68975830078125, -33.583221435546875, -32.476680755615234, -31.370141983032227, -30.26360321044922, -29.157066345214844, -28.050525665283203, -26.943986892700195, -25.837448120117188, -24.73090934753418, -23.624370574951172, -22.517831802368164, -21.411293029785156, -20.30475616455078, -19.198217391967773, -18.091678619384766, -16.985139846801758, -15.87860107421875, -14.772062301635742, -13.665523529052734, -12.558985710144043, -11.452446937561035, -10.345908164978027, -9.23936939239502, -8.132830619812012, -7.026292324066162, -5.919753551483154, -4.8132147789001465, -3.706676483154297, -2.600137710571289, -1.4935989379882812, -0.387060284614563, 0.7194783687591553, 1.826016902923584, 2.932555675506592, 4.0390944480896, 5.145632743835449, 6.252171516418457, 7.358710289001465, 8.465249061584473, 9.57178783416748, 10.678325653076172, 11.78486442565918, 12.891403198242188, 13.997941970825195, 15.104480743408203, 16.21101951599121, 17.31755828857422, 18.424097061157227, 19.530635833740234, 20.637174606323242, 21.74371337890625, 22.850250244140625, 23.956790924072266, 25.06332778930664, 26.16986656188965, 27.276405334472656, 28.382944107055664, 29.489482879638672, 30.59602165222168, 31.702560424804688, 32.80909729003906, 33.9156379699707]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 8.0, 3.0, 6.0, 10.0, 8.0, 18.0, 20.0, 21.0, 16.0, 26.0, 25.0, 25.0, 38.0, 31.0, 32.0, 26.0, 40.0, 46.0, 44.0, 41.0, 54.0, 37.0, 35.0, 34.0, 37.0, 43.0, 28.0, 38.0, 35.0, 27.0, 30.0, 25.0, 14.0, 21.0, 12.0, 7.0, 9.0, 16.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.34829330444336, -39.93910598754883, -38.5299186706543, -37.120731353759766, -35.711544036865234, -34.3023567199707, -32.893165588378906, -31.483980178833008, -30.074792861938477, -28.665605545043945, -27.256418228149414, -25.84722900390625, -24.43804168701172, -23.028854370117188, -21.619667053222656, -20.210479736328125, -18.801292419433594, -17.392105102539062, -15.982917785644531, -14.573729515075684, -13.164542198181152, -11.755354881286621, -10.346166610717773, -8.936979293823242, -7.527791976928711, -6.11860466003418, -4.70941686630249, -3.300229072570801, -1.8910417556762695, -0.4818544387817383, 0.9273338317871094, 2.3365211486816406, 3.7457122802734375, 5.154899597167969, 6.564087390899658, 7.973275184631348, 9.382462501525879, 10.79164981842041, 12.200838088989258, 13.610025405883789, 15.01921272277832, 16.42840003967285, 17.837587356567383, 19.246776580810547, 20.655963897705078, 22.06515121459961, 23.47433853149414, 24.883525848388672, 26.292713165283203, 27.701900482177734, 29.111087799072266, 30.520275115966797, 31.929462432861328, 33.33864974975586, 34.747840881347656, 36.15702819824219, 37.56621551513672, 38.97540283203125, 40.38459014892578, 41.79377746582031, 43.202964782714844, 44.612152099609375, 46.021339416503906, 47.43052673339844, 48.83971405029297]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 9.0, 4.0, 10.0, 8.0, 10.0, 8.0, 13.0, 7.0, 12.0, 23.0, 18.0, 12.0, 32.0, 23.0, 25.0, 35.0, 29.0, 35.0, 46.0, 50.0, 38.0, 33.0, 46.0, 35.0, 37.0, 35.0, 35.0, 38.0, 35.0, 25.0, 25.0, 31.0, 23.0, 26.0, 10.0, 23.0, 19.0, 15.0, 14.0, 8.0, 8.0, 6.0, 3.0, 8.0, 6.0, 4.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.740234375, -3.625640869140625, -3.51104736328125, -3.396453857421875, -3.2818603515625, -3.167266845703125, -3.05267333984375, -2.938079833984375, -2.823486328125, -2.708892822265625, -2.59429931640625, -2.479705810546875, -2.3651123046875, -2.250518798828125, -2.13592529296875, -2.021331787109375, -1.90673828125, -1.792144775390625, -1.67755126953125, -1.562957763671875, -1.4483642578125, -1.333770751953125, -1.21917724609375, -1.104583740234375, -0.989990234375, -0.875396728515625, -0.76080322265625, -0.646209716796875, -0.5316162109375, -0.417022705078125, -0.30242919921875, -0.187835693359375, -0.0732421875, 0.041351318359375, 0.15594482421875, 0.270538330078125, 0.3851318359375, 0.499725341796875, 0.61431884765625, 0.728912353515625, 0.843505859375, 0.958099365234375, 1.07269287109375, 1.187286376953125, 1.3018798828125, 1.416473388671875, 1.53106689453125, 1.645660400390625, 1.76025390625, 1.874847412109375, 1.98944091796875, 2.104034423828125, 2.2186279296875, 2.333221435546875, 2.44781494140625, 2.562408447265625, 2.677001953125, 2.791595458984375, 2.90618896484375, 3.020782470703125, 3.1353759765625, 3.249969482421875, 3.36456298828125, 3.479156494140625, 3.59375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 5.0, 10.0, 18.0, 21.0, 40.0, 47.0, 71.0, 90.0, 153.0, 208.0, 311.0, 384.0, 528.0, 769.0, 1046.0, 1504.0, 2107.0, 2929.0, 4087.0, 5725.0, 7937.0, 11207.0, 16164.0, 23541.0, 33897.0, 51865.0, 84670.0, 153878.0, 291938.0, 130878.0, 73617.0, 46370.0, 30945.0, 20790.0, 14718.0, 10530.0, 7288.0, 5183.0, 3692.0, 2696.0, 1919.0, 1363.0, 964.0, 707.0, 502.0, 381.0, 266.0, 191.0, 127.0, 98.0, 65.0, 46.0, 22.0, 21.0, 17.0, 10.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.87646484375, -0.8485260009765625, -0.820587158203125, -0.7926483154296875, -0.76470947265625, -0.7367706298828125, -0.708831787109375, -0.6808929443359375, -0.6529541015625, -0.6250152587890625, -0.597076416015625, -0.5691375732421875, -0.54119873046875, -0.5132598876953125, -0.485321044921875, -0.4573822021484375, -0.429443359375, -0.4015045166015625, -0.373565673828125, -0.3456268310546875, -0.31768798828125, -0.2897491455078125, -0.261810302734375, -0.2338714599609375, -0.2059326171875, -0.1779937744140625, -0.150054931640625, -0.1221160888671875, -0.09417724609375, -0.0662384033203125, -0.038299560546875, -0.0103607177734375, 0.017578125, 0.0455169677734375, 0.073455810546875, 0.1013946533203125, 0.12933349609375, 0.1572723388671875, 0.185211181640625, 0.2131500244140625, 0.2410888671875, 0.2690277099609375, 0.296966552734375, 0.3249053955078125, 0.35284423828125, 0.3807830810546875, 0.408721923828125, 0.4366607666015625, 0.464599609375, 0.4925384521484375, 0.520477294921875, 0.5484161376953125, 0.57635498046875, 0.6042938232421875, 0.632232666015625, 0.6601715087890625, 0.6881103515625, 0.7160491943359375, 0.743988037109375, 0.7719268798828125, 0.79986572265625, 0.8278045654296875, 0.855743408203125, 0.8836822509765625, 0.91162109375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 7.0, 8.0, 3.0, 13.0, 14.0, 15.0, 20.0, 20.0, 21.0, 22.0, 29.0, 31.0, 35.0, 39.0, 39.0, 44.0, 57.0, 37.0, 1052.0, 39.0, 51.0, 50.0, 46.0, 48.0, 29.0, 40.0, 28.0, 29.0, 18.0, 19.0, 24.0, 19.0, 10.0, 13.0, 10.0, 9.0, 6.0, 6.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.453125, -2.37060546875, -2.2880859375, -2.20556640625, -2.123046875, -2.04052734375, -1.9580078125, -1.87548828125, -1.79296875, -1.71044921875, -1.6279296875, -1.54541015625, -1.462890625, -1.38037109375, -1.2978515625, -1.21533203125, -1.1328125, -1.05029296875, -0.9677734375, -0.88525390625, -0.802734375, -0.72021484375, -0.6376953125, -0.55517578125, -0.47265625, -0.39013671875, -0.3076171875, -0.22509765625, -0.142578125, -0.06005859375, 0.0224609375, 0.10498046875, 0.1875, 0.27001953125, 0.3525390625, 0.43505859375, 0.517578125, 0.60009765625, 0.6826171875, 0.76513671875, 0.84765625, 0.93017578125, 1.0126953125, 1.09521484375, 1.177734375, 1.26025390625, 1.3427734375, 1.42529296875, 1.5078125, 1.59033203125, 1.6728515625, 1.75537109375, 1.837890625, 1.92041015625, 2.0029296875, 2.08544921875, 2.16796875, 2.25048828125, 2.3330078125, 2.41552734375, 2.498046875, 2.58056640625, 2.6630859375, 2.74560546875, 2.828125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 3.0, 8.0, 5.0, 15.0, 22.0, 20.0, 54.0, 57.0, 106.0, 151.0, 247.0, 350.0, 576.0, 788.0, 1168.0, 1673.0, 2618.0, 3694.0, 5801.0, 8552.0, 13183.0, 20213.0, 32419.0, 52329.0, 89079.0, 175469.0, 1358702.0, 134339.0, 73282.0, 43702.0, 27561.0, 17211.0, 11290.0, 7447.0, 4923.0, 3258.0, 2170.0, 1557.0, 1058.0, 671.0, 466.0, 300.0, 199.0, 136.0, 98.0, 63.0, 39.0, 27.0, 16.0, 13.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95751953125, -0.9259414672851562, -0.8943634033203125, -0.8627853393554688, -0.831207275390625, -0.7996292114257812, -0.7680511474609375, -0.7364730834960938, -0.70489501953125, -0.6733169555664062, -0.6417388916015625, -0.6101608276367188, -0.578582763671875, -0.5470046997070312, -0.5154266357421875, -0.48384857177734375, -0.4522705078125, -0.42069244384765625, -0.3891143798828125, -0.35753631591796875, -0.325958251953125, -0.29438018798828125, -0.2628021240234375, -0.23122406005859375, -0.19964599609375, -0.16806793212890625, -0.1364898681640625, -0.10491180419921875, -0.073333740234375, -0.04175567626953125, -0.0101776123046875, 0.02140045166015625, 0.052978515625, 0.08455657958984375, 0.1161346435546875, 0.14771270751953125, 0.179290771484375, 0.21086883544921875, 0.2424468994140625, 0.27402496337890625, 0.30560302734375, 0.33718109130859375, 0.3687591552734375, 0.40033721923828125, 0.431915283203125, 0.46349334716796875, 0.4950714111328125, 0.5266494750976562, 0.5582275390625, 0.5898056030273438, 0.6213836669921875, 0.6529617309570312, 0.684539794921875, 0.7161178588867188, 0.7476959228515625, 0.7792739868164062, 0.81085205078125, 0.8424301147460938, 0.8740081787109375, 0.9055862426757812, 0.937164306640625, 0.9687423706054688, 1.0003204345703125, 1.0318984985351562, 1.0634765625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 11.0, 7.0, 9.0, 6.0, 9.0, 23.0, 20.0, 17.0, 29.0, 36.0, 27.0, 41.0, 32.0, 37.0, 48.0, 64.0, 68.0, 67.0, 52.0, 64.0, 55.0, 37.0, 37.0, 29.0, 34.0, 19.0, 21.0, 23.0, 22.0, 10.0, 6.0, 4.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00016391277313232422, -0.0001583937555551529, -0.00015287473797798157, -0.00014735572040081024, -0.00014183670282363892, -0.0001363176852464676, -0.00013079866766929626, -0.00012527965009212494, -0.00011976063251495361, -0.00011424161493778229, -0.00010872259736061096, -0.00010320357978343964, -9.768456220626831e-05, -9.216554462909698e-05, -8.664652705192566e-05, -8.112750947475433e-05, -7.560849189758301e-05, -7.008947432041168e-05, -6.457045674324036e-05, -5.905143916606903e-05, -5.3532421588897705e-05, -4.801340401172638e-05, -4.2494386434555054e-05, -3.697536885738373e-05, -3.14563512802124e-05, -2.5937333703041077e-05, -2.041831612586975e-05, -1.4899298548698425e-05, -9.3802809715271e-06, -3.861263394355774e-06, 1.6577541828155518e-06, 7.1767717599868774e-06, 1.2695789337158203e-05, 1.821480691432953e-05, 2.3733824491500854e-05, 2.925284206867218e-05, 3.4771859645843506e-05, 4.029087722301483e-05, 4.580989480018616e-05, 5.132891237735748e-05, 5.684792995452881e-05, 6.236694753170013e-05, 6.788596510887146e-05, 7.340498268604279e-05, 7.892400026321411e-05, 8.444301784038544e-05, 8.996203541755676e-05, 9.548105299472809e-05, 0.00010100007057189941, 0.00010651908814907074, 0.00011203810572624207, 0.00011755712330341339, 0.00012307614088058472, 0.00012859515845775604, 0.00013411417603492737, 0.0001396331936120987, 0.00014515221118927002, 0.00015067122876644135, 0.00015619024634361267, 0.000161709263920784, 0.00016722828149795532, 0.00017274729907512665, 0.00017826631665229797, 0.0001837853342294693, 0.00018930435180664062]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 5.0, 6.0, 13.0, 16.0, 17.0, 30.0, 37.0, 57.0, 62.0, 81.0, 103.0, 169.0, 236.0, 449.0, 1205.0, 1001830.0, 42440.0, 694.0, 323.0, 228.0, 146.0, 119.0, 61.0, 52.0, 40.0, 28.0, 23.0, 13.0, 11.0, 14.0, 5.0, 8.0, 8.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0044403076171875, -0.004316240549087524, -0.004192173480987549, -0.004068106412887573, -0.003944039344787598, -0.003819972276687622, -0.0036959052085876465, -0.003571838140487671, -0.0034477710723876953, -0.0033237040042877197, -0.003199636936187744, -0.0030755698680877686, -0.002951502799987793, -0.0028274357318878174, -0.002703368663787842, -0.002579301595687866, -0.0024552345275878906, -0.002331167459487915, -0.0022071003913879395, -0.002083033323287964, -0.0019589662551879883, -0.0018348991870880127, -0.0017108321189880371, -0.0015867650508880615, -0.001462697982788086, -0.0013386309146881104, -0.0012145638465881348, -0.0010904967784881592, -0.0009664297103881836, -0.000842362642288208, -0.0007182955741882324, -0.0005942285060882568, -0.00047016143798828125, -0.00034609436988830566, -0.00022202730178833008, -9.796023368835449e-05, 2.6106834411621094e-05, 0.00015017390251159668, 0.00027424097061157227, 0.00039830803871154785, 0.0005223751068115234, 0.000646442174911499, 0.0007705092430114746, 0.0008945763111114502, 0.0010186433792114258, 0.0011427104473114014, 0.001266777515411377, 0.0013908445835113525, 0.0015149116516113281, 0.0016389787197113037, 0.0017630457878112793, 0.0018871128559112549, 0.0020111799240112305, 0.002135246992111206, 0.0022593140602111816, 0.0023833811283111572, 0.002507448196411133, 0.0026315152645111084, 0.002755582332611084, 0.0028796494007110596, 0.003003716468811035, 0.0031277835369110107, 0.0032518506050109863, 0.003375917673110962, 0.0034999847412109375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 88.0, 563.0, 331.0, 29.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003600680211093277, -0.0003455566184129566, -0.000331045244820416, -0.0003165338421240449, -0.0003020224685315043, -0.0002875110658351332, -0.0002729996922425926, -0.0002584882895462215, -0.00024397690140176564, -0.0002294655132573098, -0.00021495412511285394, -0.0002004427369683981, -0.00018593133427202702, -0.0001714199606794864, -0.00015690855798311532, -0.00014239716983865947, -0.00012788578169420362, -0.00011337439354974777, -9.886300540529191e-05, -8.435160998487845e-05, -6.98402218404226e-05, -5.532883369596675e-05, -4.0817438275553286e-05, -2.6306050131097436e-05, -1.1794661986641586e-05, 2.716727976803668e-06, 1.722811794024892e-05, 3.173950972268358e-05, 4.625089786713943e-05, 6.076228601159528e-05, 7.527368143200874e-05, 8.97850695764646e-05, 0.0001042964868247509, 0.00011880787496920675, 0.0001333192631136626, 0.00014783066581003368, 0.0001623420394025743, 0.00017685344209894538, 0.00019136483024340123, 0.00020587621838785708, 0.00022038760653231293, 0.00023489899467676878, 0.00024941039737313986, 0.0002639217709656805, 0.00027843317366205156, 0.0002929445472545922, 0.00030745594995096326, 0.00032196735264733434, 0.00033647872623987496, 0.00035099012893624604, 0.00036550150252878666, 0.00038001290522515774, 0.00039452427881769836, 0.00040903568151406944, 0.00042354705510661006, 0.00043805845780298114, 0.0004525698604993522, 0.0004670812631957233, 0.0004815926367882639, 0.0004961040103808045, 0.0005106154130771756, 0.0005251268157735467, 0.0005396382184699178, 0.0005541496211662889, 0.000568660965654999]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 6.0, 14.0, 15.0, 12.0, 16.0, 17.0, 19.0, 22.0, 15.0, 32.0, 24.0, 25.0, 30.0, 37.0, 39.0, 39.0, 41.0, 27.0, 36.0, 39.0, 40.0, 43.0, 32.0, 38.0, 33.0, 35.0, 25.0, 33.0, 21.0, 25.0, 26.0, 20.0, 15.0, 20.0, 11.0, 7.0, 9.0, 14.0, 3.0, 3.0, 8.0, 2.0, 2.0, 8.0, 0.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-8.505582809448242e-05, -8.240249007940292e-05, -7.974915206432343e-05, -7.709581404924393e-05, -7.444247603416443e-05, -7.178913801908493e-05, -6.913580000400543e-05, -6.648246198892593e-05, -6.382912397384644e-05, -6.117578595876694e-05, -5.852244794368744e-05, -5.586910992860794e-05, -5.321577191352844e-05, -5.0562433898448944e-05, -4.7909095883369446e-05, -4.525575786828995e-05, -4.260241985321045e-05, -3.994908183813095e-05, -3.729574382305145e-05, -3.4642405807971954e-05, -3.1989067792892456e-05, -2.9335729777812958e-05, -2.668239176273346e-05, -2.402905374765396e-05, -2.1375715732574463e-05, -1.8722377717494965e-05, -1.6069039702415466e-05, -1.3415701687335968e-05, -1.076236367225647e-05, -8.109025657176971e-06, -5.455687642097473e-06, -2.802349627017975e-06, -1.4901161193847656e-07, 2.5043264031410217e-06, 5.15766441822052e-06, 7.811002433300018e-06, 1.0464340448379517e-05, 1.3117678463459015e-05, 1.5771016478538513e-05, 1.842435449361801e-05, 2.107769250869751e-05, 2.3731030523777008e-05, 2.6384368538856506e-05, 2.9037706553936005e-05, 3.16910445690155e-05, 3.4344382584095e-05, 3.69977205991745e-05, 3.9651058614254e-05, 4.2304396629333496e-05, 4.4957734644412994e-05, 4.761107265949249e-05, 5.026441067457199e-05, 5.291774868965149e-05, 5.557108670473099e-05, 5.8224424719810486e-05, 6.0877762734889984e-05, 6.353110074996948e-05, 6.618443876504898e-05, 6.883777678012848e-05, 7.149111479520798e-05, 7.414445281028748e-05, 7.679779082536697e-05, 7.945112884044647e-05, 8.210446685552597e-05, 8.475780487060547e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 9.0, 4.0, 10.0, 8.0, 10.0, 8.0, 13.0, 7.0, 12.0, 23.0, 18.0, 12.0, 31.0, 24.0, 25.0, 35.0, 29.0, 35.0, 46.0, 50.0, 38.0, 33.0, 46.0, 35.0, 37.0, 35.0, 35.0, 38.0, 35.0, 25.0, 25.0, 31.0, 23.0, 26.0, 10.0, 23.0, 19.0, 15.0, 14.0, 8.0, 8.0, 6.0, 3.0, 8.0, 6.0, 4.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.740234375, -3.625640869140625, -3.51104736328125, -3.396453857421875, -3.2818603515625, -3.167266845703125, -3.05267333984375, -2.938079833984375, -2.823486328125, -2.708892822265625, -2.59429931640625, -2.479705810546875, -2.3651123046875, -2.250518798828125, -2.13592529296875, -2.021331787109375, -1.90673828125, -1.792144775390625, -1.67755126953125, -1.562957763671875, -1.4483642578125, -1.333770751953125, -1.21917724609375, -1.104583740234375, -0.989990234375, -0.875396728515625, -0.76080322265625, -0.646209716796875, -0.5316162109375, -0.417022705078125, -0.30242919921875, -0.187835693359375, -0.0732421875, 0.041351318359375, 0.15594482421875, 0.270538330078125, 0.3851318359375, 0.499725341796875, 0.61431884765625, 0.728912353515625, 0.843505859375, 0.958099365234375, 1.07269287109375, 1.187286376953125, 1.3018798828125, 1.416473388671875, 1.53106689453125, 1.645660400390625, 1.76025390625, 1.874847412109375, 1.98944091796875, 2.104034423828125, 2.2186279296875, 2.333221435546875, 2.44781494140625, 2.562408447265625, 2.677001953125, 2.791595458984375, 2.90618896484375, 3.020782470703125, 3.1353759765625, 3.249969482421875, 3.36456298828125, 3.479156494140625, 3.59375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 12.0, 13.0, 13.0, 16.0, 36.0, 33.0, 61.0, 100.0, 131.0, 143.0, 221.0, 309.0, 455.0, 765.0, 1187.0, 2145.0, 4054.0, 7966.0, 17579.0, 43229.0, 123231.0, 351894.0, 316682.0, 107639.0, 38341.0, 15848.0, 7404.0, 3717.0, 2017.0, 1129.0, 672.0, 441.0, 286.0, 233.0, 152.0, 120.0, 81.0, 56.0, 37.0, 29.0, 28.0, 19.0, 13.0, 7.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.078125, -3.950439453125, -3.82275390625, -3.695068359375, -3.5673828125, -3.439697265625, -3.31201171875, -3.184326171875, -3.056640625, -2.928955078125, -2.80126953125, -2.673583984375, -2.5458984375, -2.418212890625, -2.29052734375, -2.162841796875, -2.03515625, -1.907470703125, -1.77978515625, -1.652099609375, -1.5244140625, -1.396728515625, -1.26904296875, -1.141357421875, -1.013671875, -0.885986328125, -0.75830078125, -0.630615234375, -0.5029296875, -0.375244140625, -0.24755859375, -0.119873046875, 0.0078125, 0.135498046875, 0.26318359375, 0.390869140625, 0.5185546875, 0.646240234375, 0.77392578125, 0.901611328125, 1.029296875, 1.156982421875, 1.28466796875, 1.412353515625, 1.5400390625, 1.667724609375, 1.79541015625, 1.923095703125, 2.05078125, 2.178466796875, 2.30615234375, 2.433837890625, 2.5615234375, 2.689208984375, 2.81689453125, 2.944580078125, 3.072265625, 3.199951171875, 3.32763671875, 3.455322265625, 3.5830078125, 3.710693359375, 3.83837890625, 3.966064453125, 4.09375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 3.0, 6.0, 12.0, 17.0, 13.0, 22.0, 16.0, 22.0, 25.0, 34.0, 46.0, 36.0, 36.0, 49.0, 54.0, 98.0, 309.0, 1660.0, 157.0, 58.0, 57.0, 50.0, 39.0, 41.0, 31.0, 31.0, 20.0, 15.0, 21.0, 14.0, 14.0, 15.0, 6.0, 10.0, 6.0, 8.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6328125, -14.1151123046875, -13.597412109375, -13.0797119140625, -12.56201171875, -12.0443115234375, -11.526611328125, -11.0089111328125, -10.4912109375, -9.9735107421875, -9.455810546875, -8.9381103515625, -8.42041015625, -7.9027099609375, -7.385009765625, -6.8673095703125, -6.349609375, -5.8319091796875, -5.314208984375, -4.7965087890625, -4.27880859375, -3.7611083984375, -3.243408203125, -2.7257080078125, -2.2080078125, -1.6903076171875, -1.172607421875, -0.6549072265625, -0.13720703125, 0.3804931640625, 0.898193359375, 1.4158935546875, 1.93359375, 2.4512939453125, 2.968994140625, 3.4866943359375, 4.00439453125, 4.5220947265625, 5.039794921875, 5.5574951171875, 6.0751953125, 6.5928955078125, 7.110595703125, 7.6282958984375, 8.14599609375, 8.6636962890625, 9.181396484375, 9.6990966796875, 10.216796875, 10.7344970703125, 11.252197265625, 11.7698974609375, 12.28759765625, 12.8052978515625, 13.322998046875, 13.8406982421875, 14.3583984375, 14.8760986328125, 15.393798828125, 15.9114990234375, 16.42919921875, 16.9468994140625, 17.464599609375, 17.9822998046875, 18.5]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 8.0, 11.0, 9.0, 21.0, 16.0, 25.0, 19.0, 32.0, 29.0, 36.0, 62.0, 104.0, 134.0, 248.0, 493.0, 1911.0, 26974.0, 2978397.0, 131574.0, 3925.0, 801.0, 293.0, 158.0, 106.0, 65.0, 51.0, 43.0, 32.0, 27.0, 24.0, 16.0, 14.0, 14.0, 9.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.21875, -27.380859375, -26.54296875, -25.705078125, -24.8671875, -24.029296875, -23.19140625, -22.353515625, -21.515625, -20.677734375, -19.83984375, -19.001953125, -18.1640625, -17.326171875, -16.48828125, -15.650390625, -14.8125, -13.974609375, -13.13671875, -12.298828125, -11.4609375, -10.623046875, -9.78515625, -8.947265625, -8.109375, -7.271484375, -6.43359375, -5.595703125, -4.7578125, -3.919921875, -3.08203125, -2.244140625, -1.40625, -0.568359375, 0.26953125, 1.107421875, 1.9453125, 2.783203125, 3.62109375, 4.458984375, 5.296875, 6.134765625, 6.97265625, 7.810546875, 8.6484375, 9.486328125, 10.32421875, 11.162109375, 12.0, 12.837890625, 13.67578125, 14.513671875, 15.3515625, 16.189453125, 17.02734375, 17.865234375, 18.703125, 19.541015625, 20.37890625, 21.216796875, 22.0546875, 22.892578125, 23.73046875, 24.568359375, 25.40625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 30.0, 91.0, 196.0, 262.0, 243.0, 114.0, 45.0, 10.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.3444709777832, -31.17164421081543, -29.998817443847656, -28.825990676879883, -27.65316390991211, -26.480337142944336, -25.307510375976562, -24.13468360900879, -22.961856842041016, -21.789030075073242, -20.61620330810547, -19.443376541137695, -18.270549774169922, -17.09772300720215, -15.924896240234375, -14.752069473266602, -13.579242706298828, -12.406415939331055, -11.233589172363281, -10.060762405395508, -8.887935638427734, -7.715108871459961, -6.5422821044921875, -5.369455337524414, -4.196628570556641, -3.023801803588867, -1.8509750366210938, -0.6781482696533203, 0.4946784973144531, 1.6675052642822266, 2.84033203125, 4.013158798217773, 5.185985565185547, 6.35881233215332, 7.531639099121094, 8.704465866088867, 9.87729263305664, 11.050119400024414, 12.222946166992188, 13.395772933959961, 14.568599700927734, 15.741426467895508, 16.91425323486328, 18.087080001831055, 19.259906768798828, 20.4327335357666, 21.605560302734375, 22.77838706970215, 23.951213836669922, 25.124040603637695, 26.29686737060547, 27.469694137573242, 28.642520904541016, 29.81534767150879, 30.988174438476562, 32.16100311279297, 33.33382797241211, 34.50665283203125, 35.679481506347656, 36.85231018066406, 38.0251350402832, 39.197959899902344, 40.37078857421875, 41.543617248535156, 42.7164421081543]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 11.0, 2.0, 13.0, 9.0, 12.0, 19.0, 12.0, 22.0, 18.0, 31.0, 35.0, 33.0, 45.0, 35.0, 32.0, 48.0, 30.0, 46.0, 36.0, 38.0, 46.0, 36.0, 43.0, 40.0, 30.0, 50.0, 26.0, 33.0, 27.0, 14.0, 23.0, 23.0, 19.0, 11.0, 10.0, 5.0, 10.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.25399398803711, -45.81037139892578, -44.36674499511719, -42.92312240600586, -41.479496002197266, -40.03587341308594, -38.592247009277344, -37.148624420166016, -35.70500183105469, -34.26137924194336, -32.817752838134766, -31.374130249023438, -29.930503845214844, -28.486881256103516, -27.043256759643555, -25.599632263183594, -24.156005859375, -22.71238136291504, -21.268756866455078, -19.82513427734375, -18.381507873535156, -16.937885284423828, -15.494260787963867, -14.050636291503906, -12.607011795043945, -11.163387298583984, -9.719762802124023, -8.276139259338379, -6.832514762878418, -5.388890266418457, -3.9452667236328125, -2.5016422271728516, -1.0580215454101562, 0.3856027126312256, 1.8292269706726074, 3.27285099029541, 4.716475486755371, 6.160099983215332, 7.603723526000977, 9.047348022460938, 10.490972518920898, 11.93459701538086, 13.37822151184082, 14.821845054626465, 16.26546859741211, 17.709095001220703, 19.15271759033203, 20.596342086791992, 22.039966583251953, 23.483591079711914, 24.927215576171875, 26.370838165283203, 27.814464569091797, 29.258087158203125, 30.701711654663086, 32.14533615112305, 33.588958740234375, 35.0325813293457, 36.4762077331543, 37.919830322265625, 39.36345672607422, 40.80707931518555, 42.250701904296875, 43.69432830810547, 45.13795471191406]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 11.0, 7.0, 12.0, 14.0, 11.0, 7.0, 11.0, 14.0, 21.0, 20.0, 23.0, 25.0, 38.0, 24.0, 32.0, 41.0, 47.0, 42.0, 36.0, 44.0, 46.0, 44.0, 41.0, 33.0, 45.0, 29.0, 35.0, 31.0, 34.0, 23.0, 27.0, 12.0, 26.0, 22.0, 17.0, 5.0, 9.0, 9.0, 6.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.15234375, -4.02435302734375, -3.8963623046875, -3.76837158203125, -3.640380859375, -3.51239013671875, -3.3843994140625, -3.25640869140625, -3.12841796875, -3.00042724609375, -2.8724365234375, -2.74444580078125, -2.616455078125, -2.48846435546875, -2.3604736328125, -2.23248291015625, -2.1044921875, -1.97650146484375, -1.8485107421875, -1.72052001953125, -1.592529296875, -1.46453857421875, -1.3365478515625, -1.20855712890625, -1.08056640625, -0.95257568359375, -0.8245849609375, -0.69659423828125, -0.568603515625, -0.44061279296875, -0.3126220703125, -0.18463134765625, -0.056640625, 0.07135009765625, 0.1993408203125, 0.32733154296875, 0.455322265625, 0.58331298828125, 0.7113037109375, 0.83929443359375, 0.96728515625, 1.09527587890625, 1.2232666015625, 1.35125732421875, 1.479248046875, 1.60723876953125, 1.7352294921875, 1.86322021484375, 1.9912109375, 2.11920166015625, 2.2471923828125, 2.37518310546875, 2.503173828125, 2.63116455078125, 2.7591552734375, 2.88714599609375, 3.01513671875, 3.14312744140625, 3.2711181640625, 3.39910888671875, 3.527099609375, 3.65509033203125, 3.7830810546875, 3.91107177734375, 4.0390625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 9.0, 5.0, 7.0, 7.0, 6.0, 9.0, 15.0, 6.0, 14.0, 21.0, 19.0, 25.0, 20.0, 24.0, 39.0, 34.0, 49.0, 64.0, 148.0, 503.0, 3762.0, 132521.0, 3683712.0, 365488.0, 6481.0, 750.0, 158.0, 71.0, 33.0, 39.0, 31.0, 18.0, 24.0, 27.0, 16.0, 22.0, 11.0, 16.0, 10.0, 11.0, 11.0, 8.0, 7.0, 4.0, 7.0, 4.0, 3.0, 7.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-20.53125, -19.8603515625, -19.189453125, -18.5185546875, -17.84765625, -17.1767578125, -16.505859375, -15.8349609375, -15.1640625, -14.4931640625, -13.822265625, -13.1513671875, -12.48046875, -11.8095703125, -11.138671875, -10.4677734375, -9.796875, -9.1259765625, -8.455078125, -7.7841796875, -7.11328125, -6.4423828125, -5.771484375, -5.1005859375, -4.4296875, -3.7587890625, -3.087890625, -2.4169921875, -1.74609375, -1.0751953125, -0.404296875, 0.2666015625, 0.9375, 1.6083984375, 2.279296875, 2.9501953125, 3.62109375, 4.2919921875, 4.962890625, 5.6337890625, 6.3046875, 6.9755859375, 7.646484375, 8.3173828125, 8.98828125, 9.6591796875, 10.330078125, 11.0009765625, 11.671875, 12.3427734375, 13.013671875, 13.6845703125, 14.35546875, 15.0263671875, 15.697265625, 16.3681640625, 17.0390625, 17.7099609375, 18.380859375, 19.0517578125, 19.72265625, 20.3935546875, 21.064453125, 21.7353515625, 22.40625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 2.0, 4.0, 7.0, 4.0, 9.0, 8.0, 24.0, 25.0, 34.0, 46.0, 76.0, 95.0, 143.0, 159.0, 252.0, 380.0, 477.0, 475.0, 461.0, 364.0, 285.0, 233.0, 146.0, 93.0, 72.0, 56.0, 49.0, 34.0, 16.0, 17.0, 12.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.9765625, -15.5733642578125, -15.170166015625, -14.7669677734375, -14.36376953125, -13.9605712890625, -13.557373046875, -13.1541748046875, -12.7509765625, -12.3477783203125, -11.944580078125, -11.5413818359375, -11.13818359375, -10.7349853515625, -10.331787109375, -9.9285888671875, -9.525390625, -9.1221923828125, -8.718994140625, -8.3157958984375, -7.91259765625, -7.5093994140625, -7.106201171875, -6.7030029296875, -6.2998046875, -5.8966064453125, -5.493408203125, -5.0902099609375, -4.68701171875, -4.2838134765625, -3.880615234375, -3.4774169921875, -3.07421875, -2.6710205078125, -2.267822265625, -1.8646240234375, -1.46142578125, -1.0582275390625, -0.655029296875, -0.2518310546875, 0.1513671875, 0.5545654296875, 0.957763671875, 1.3609619140625, 1.76416015625, 2.1673583984375, 2.570556640625, 2.9737548828125, 3.376953125, 3.7801513671875, 4.183349609375, 4.5865478515625, 4.98974609375, 5.3929443359375, 5.796142578125, 6.1993408203125, 6.6025390625, 7.0057373046875, 7.408935546875, 7.8121337890625, 8.21533203125, 8.6185302734375, 9.021728515625, 9.4249267578125, 9.828125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 12.0, 7.0, 20.0, 23.0, 44.0, 77.0, 107.0, 187.0, 307.0, 801.0, 10213.0, 3796067.0, 382954.0, 2372.0, 458.0, 223.0, 156.0, 94.0, 61.0, 46.0, 13.0, 9.0, 6.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.5, -44.6240234375, -42.748046875, -40.8720703125, -38.99609375, -37.1201171875, -35.244140625, -33.3681640625, -31.4921875, -29.6162109375, -27.740234375, -25.8642578125, -23.98828125, -22.1123046875, -20.236328125, -18.3603515625, -16.484375, -14.6083984375, -12.732421875, -10.8564453125, -8.98046875, -7.1044921875, -5.228515625, -3.3525390625, -1.4765625, 0.3994140625, 2.275390625, 4.1513671875, 6.02734375, 7.9033203125, 9.779296875, 11.6552734375, 13.53125, 15.4072265625, 17.283203125, 19.1591796875, 21.03515625, 22.9111328125, 24.787109375, 26.6630859375, 28.5390625, 30.4150390625, 32.291015625, 34.1669921875, 36.04296875, 37.9189453125, 39.794921875, 41.6708984375, 43.546875, 45.4228515625, 47.298828125, 49.1748046875, 51.05078125, 52.9267578125, 54.802734375, 56.6787109375, 58.5546875, 60.4306640625, 62.306640625, 64.1826171875, 66.05859375, 67.9345703125, 69.810546875, 71.6865234375, 73.5625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 8.0, 105.0, 377.0, 403.0, 118.0, 5.0, 1.0], "bins": [-367.355224609375, -361.2361755371094, -355.1170959472656, -348.998046875, -342.87896728515625, -336.7599182128906, -330.640869140625, -324.52178955078125, -318.4027404785156, -312.28369140625, -306.16461181640625, -300.0455627441406, -293.9264831542969, -287.80743408203125, -281.6883544921875, -275.5693054199219, -269.45025634765625, -263.3312072753906, -257.2121276855469, -251.09307861328125, -244.97401428222656, -238.85494995117188, -232.7358856201172, -226.6168212890625, -220.49774169921875, -214.37867736816406, -208.25961303710938, -202.14056396484375, -196.02149963378906, -189.90243530273438, -183.7833709716797, -177.664306640625, -171.54525756835938, -165.4261932373047, -159.30712890625, -153.18807983398438, -147.0690155029297, -140.949951171875, -134.8308868408203, -128.71182250976562, -122.59275817871094, -116.47369384765625, -110.3546371459961, -104.2355728149414, -98.11651611328125, -91.99745178222656, -85.87838745117188, -79.75932312011719, -73.64026641845703, -67.52120208740234, -61.40214538574219, -55.2830810546875, -49.16402053833008, -43.044960021972656, -36.92589569091797, -30.806835174560547, -24.687776565551758, -18.568714141845703, -12.449653625488281, -6.330591201782227, -0.2115306854248047, 5.907529830932617, 12.026594161987305, 18.145654678344727, 24.26471519470215]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 8.0, 3.0, 7.0, 7.0, 15.0, 11.0, 19.0, 18.0, 15.0, 23.0, 24.0, 22.0, 29.0, 38.0, 41.0, 31.0, 32.0, 41.0, 33.0, 32.0, 52.0, 54.0, 53.0, 39.0, 50.0, 37.0, 32.0, 26.0, 31.0, 33.0, 31.0, 20.0, 16.0, 19.0, 12.0, 7.0, 18.0, 6.0, 4.0, 1.0, 5.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.64929962158203, -40.31341552734375, -38.97753143310547, -37.64164733886719, -36.305763244628906, -34.969879150390625, -33.633995056152344, -32.2981071472168, -30.962223052978516, -29.626338958740234, -28.290454864501953, -26.954570770263672, -25.618684768676758, -24.282800674438477, -22.946916580200195, -21.61103057861328, -20.275148391723633, -18.93926429748535, -17.60338020324707, -16.267494201660156, -14.931610107421875, -13.595726013183594, -12.259841918945312, -10.923956871032715, -9.588072776794434, -8.252188682556152, -6.916303634643555, -5.580419540405273, -4.244534969329834, -2.9086503982543945, -1.5727663040161133, -0.23688125610351562, 1.0990028381347656, 2.434887409210205, 3.7707717418670654, 5.106656074523926, 6.442540645599365, 7.778425216674805, 9.114309310913086, 10.450194358825684, 11.786078453063965, 13.121962547302246, 14.457847595214844, 15.793731689453125, 17.129615783691406, 18.465499877929688, 19.80138397216797, 21.137269973754883, 22.473154067993164, 23.809038162231445, 25.144922256469727, 26.48080825805664, 27.816692352294922, 29.152576446533203, 30.488460540771484, 31.824344635009766, 33.16022872924805, 34.49611282348633, 35.83199691772461, 37.16788101196289, 38.50376510620117, 39.83965301513672, 41.175537109375, 42.51142120361328, 43.84730529785156]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 6.0, 9.0, 14.0, 12.0, 15.0, 19.0, 9.0, 20.0, 29.0, 30.0, 34.0, 35.0, 37.0, 33.0, 40.0, 46.0, 54.0, 40.0, 54.0, 44.0, 45.0, 29.0, 37.0, 32.0, 42.0, 29.0, 37.0, 23.0, 20.0, 21.0, 17.0, 12.0, 11.0, 11.0, 10.0, 9.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.4609375, -4.3212890625, -4.181640625, -4.0419921875, -3.90234375, -3.7626953125, -3.623046875, -3.4833984375, -3.34375, -3.2041015625, -3.064453125, -2.9248046875, -2.78515625, -2.6455078125, -2.505859375, -2.3662109375, -2.2265625, -2.0869140625, -1.947265625, -1.8076171875, -1.66796875, -1.5283203125, -1.388671875, -1.2490234375, -1.109375, -0.9697265625, -0.830078125, -0.6904296875, -0.55078125, -0.4111328125, -0.271484375, -0.1318359375, 0.0078125, 0.1474609375, 0.287109375, 0.4267578125, 0.56640625, 0.7060546875, 0.845703125, 0.9853515625, 1.125, 1.2646484375, 1.404296875, 1.5439453125, 1.68359375, 1.8232421875, 1.962890625, 2.1025390625, 2.2421875, 2.3818359375, 2.521484375, 2.6611328125, 2.80078125, 2.9404296875, 3.080078125, 3.2197265625, 3.359375, 3.4990234375, 3.638671875, 3.7783203125, 3.91796875, 4.0576171875, 4.197265625, 4.3369140625, 4.4765625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 7.0, 12.0, 8.0, 10.0, 23.0, 26.0, 38.0, 47.0, 67.0, 110.0, 149.0, 213.0, 288.0, 407.0, 563.0, 782.0, 1263.0, 1637.0, 2417.0, 3477.0, 5134.0, 7222.0, 11024.0, 16826.0, 25656.0, 39433.0, 63233.0, 107331.0, 275627.0, 218528.0, 98133.0, 58873.0, 37028.0, 24209.0, 15780.0, 10280.0, 7029.0, 4762.0, 3247.0, 2263.0, 1617.0, 1123.0, 763.0, 540.0, 368.0, 287.0, 202.0, 157.0, 98.0, 81.0, 49.0, 28.0, 27.0, 19.0, 13.0, 11.0, 7.0, 4.0, 4.0, 5.0, 2.0], "bins": [-1.060546875, -1.0273284912109375, -0.994110107421875, -0.9608917236328125, -0.92767333984375, -0.8944549560546875, -0.861236572265625, -0.8280181884765625, -0.7947998046875, -0.7615814208984375, -0.728363037109375, -0.6951446533203125, -0.66192626953125, -0.6287078857421875, -0.595489501953125, -0.5622711181640625, -0.529052734375, -0.4958343505859375, -0.462615966796875, -0.4293975830078125, -0.39617919921875, -0.3629608154296875, -0.329742431640625, -0.2965240478515625, -0.2633056640625, -0.2300872802734375, -0.196868896484375, -0.1636505126953125, -0.13043212890625, -0.0972137451171875, -0.063995361328125, -0.0307769775390625, 0.00244140625, 0.0356597900390625, 0.068878173828125, 0.1020965576171875, 0.13531494140625, 0.1685333251953125, 0.201751708984375, 0.2349700927734375, 0.2681884765625, 0.3014068603515625, 0.334625244140625, 0.3678436279296875, 0.40106201171875, 0.4342803955078125, 0.467498779296875, 0.5007171630859375, 0.533935546875, 0.5671539306640625, 0.600372314453125, 0.6335906982421875, 0.66680908203125, 0.7000274658203125, 0.733245849609375, 0.7664642333984375, 0.7996826171875, 0.8329010009765625, 0.866119384765625, 0.8993377685546875, 0.93255615234375, 0.9657745361328125, 0.998992919921875, 1.0322113037109375, 1.0654296875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 7.0, 7.0, 15.0, 14.0, 22.0, 18.0, 27.0, 19.0, 25.0, 38.0, 35.0, 35.0, 34.0, 38.0, 53.0, 40.0, 40.0, 1074.0, 41.0, 38.0, 45.0, 41.0, 35.0, 56.0, 35.0, 27.0, 27.0, 28.0, 22.0, 26.0, 16.0, 8.0, 9.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.111328125, -3.011627197265625, -2.91192626953125, -2.812225341796875, -2.7125244140625, -2.612823486328125, -2.51312255859375, -2.413421630859375, -2.313720703125, -2.214019775390625, -2.11431884765625, -2.014617919921875, -1.9149169921875, -1.815216064453125, -1.71551513671875, -1.615814208984375, -1.51611328125, -1.416412353515625, -1.31671142578125, -1.217010498046875, -1.1173095703125, -1.017608642578125, -0.91790771484375, -0.818206787109375, -0.718505859375, -0.618804931640625, -0.51910400390625, -0.419403076171875, -0.3197021484375, -0.220001220703125, -0.12030029296875, -0.020599365234375, 0.0791015625, 0.178802490234375, 0.27850341796875, 0.378204345703125, 0.4779052734375, 0.577606201171875, 0.67730712890625, 0.777008056640625, 0.876708984375, 0.976409912109375, 1.07611083984375, 1.175811767578125, 1.2755126953125, 1.375213623046875, 1.47491455078125, 1.574615478515625, 1.67431640625, 1.774017333984375, 1.87371826171875, 1.973419189453125, 2.0731201171875, 2.172821044921875, 2.27252197265625, 2.372222900390625, 2.471923828125, 2.571624755859375, 2.67132568359375, 2.771026611328125, 2.8707275390625, 2.970428466796875, 3.07012939453125, 3.169830322265625, 3.26953125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 9.0, 4.0, 3.0, 23.0, 28.0, 32.0, 47.0, 69.0, 119.0, 148.0, 267.0, 356.0, 524.0, 864.0, 1427.0, 2235.0, 3483.0, 5524.0, 8604.0, 13629.0, 22037.0, 36267.0, 59150.0, 98070.0, 192716.0, 1350466.0, 118615.0, 70058.0, 42998.0, 25796.0, 15841.0, 10043.0, 6442.0, 4032.0, 2566.0, 1654.0, 1003.0, 707.0, 439.0, 244.0, 189.0, 125.0, 93.0, 74.0, 30.0, 30.0, 17.0, 21.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1708984375, -1.133331298828125, -1.09576416015625, -1.058197021484375, -1.0206298828125, -0.983062744140625, -0.94549560546875, -0.907928466796875, -0.870361328125, -0.832794189453125, -0.79522705078125, -0.757659912109375, -0.7200927734375, -0.682525634765625, -0.64495849609375, -0.607391357421875, -0.56982421875, -0.532257080078125, -0.49468994140625, -0.457122802734375, -0.4195556640625, -0.381988525390625, -0.34442138671875, -0.306854248046875, -0.269287109375, -0.231719970703125, -0.19415283203125, -0.156585693359375, -0.1190185546875, -0.081451416015625, -0.04388427734375, -0.006317138671875, 0.03125, 0.068817138671875, 0.10638427734375, 0.143951416015625, 0.1815185546875, 0.219085693359375, 0.25665283203125, 0.294219970703125, 0.331787109375, 0.369354248046875, 0.40692138671875, 0.444488525390625, 0.4820556640625, 0.519622802734375, 0.55718994140625, 0.594757080078125, 0.63232421875, 0.669891357421875, 0.70745849609375, 0.745025634765625, 0.7825927734375, 0.820159912109375, 0.85772705078125, 0.895294189453125, 0.932861328125, 0.970428466796875, 1.00799560546875, 1.045562744140625, 1.0831298828125, 1.120697021484375, 1.15826416015625, 1.195831298828125, 1.2333984375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 10.0, 7.0, 13.0, 9.0, 14.0, 11.0, 18.0, 33.0, 28.0, 41.0, 61.0, 65.0, 78.0, 66.0, 86.0, 73.0, 80.0, 65.0, 57.0, 41.0, 26.0, 22.0, 16.0, 14.0, 12.0, 10.0, 7.0, 6.0, 8.0, 3.0, 4.0, 6.0, 7.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00024437904357910156, -0.0002376846969127655, -0.00023099035024642944, -0.00022429600358009338, -0.00021760165691375732, -0.00021090731024742126, -0.0002042129635810852, -0.00019751861691474915, -0.00019082427024841309, -0.00018412992358207703, -0.00017743557691574097, -0.0001707412302494049, -0.00016404688358306885, -0.0001573525369167328, -0.00015065819025039673, -0.00014396384358406067, -0.0001372694969177246, -0.00013057515025138855, -0.0001238808035850525, -0.00011718645691871643, -0.00011049211025238037, -0.00010379776358604431, -9.710341691970825e-05, -9.040907025337219e-05, -8.371472358703613e-05, -7.702037692070007e-05, -7.032603025436401e-05, -6.363168358802795e-05, -5.6937336921691895e-05, -5.0242990255355835e-05, -4.3548643589019775e-05, -3.6854296922683716e-05, -3.0159950256347656e-05, -2.3465603590011597e-05, -1.6771256923675537e-05, -1.0076910257339478e-05, -3.382563591003418e-06, 3.3117830753326416e-06, 1.0006129741668701e-05, 1.670047640800476e-05, 2.339482307434082e-05, 3.008916974067688e-05, 3.678351640701294e-05, 4.3477863073349e-05, 5.017220973968506e-05, 5.686655640602112e-05, 6.356090307235718e-05, 7.025524973869324e-05, 7.69495964050293e-05, 8.364394307136536e-05, 9.033828973770142e-05, 9.703263640403748e-05, 0.00010372698307037354, 0.0001104213297367096, 0.00011711567640304565, 0.00012381002306938171, 0.00013050436973571777, 0.00013719871640205383, 0.0001438930630683899, 0.00015058740973472595, 0.000157281756401062, 0.00016397610306739807, 0.00017067044973373413, 0.0001773647964000702, 0.00018405914306640625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 5.0, 15.0, 9.0, 11.0, 13.0, 27.0, 35.0, 43.0, 75.0, 104.0, 192.0, 322.0, 608.0, 22483.0, 1022206.0, 1301.0, 411.0, 231.0, 172.0, 77.0, 58.0, 32.0, 40.0, 17.0, 19.0, 9.0, 5.0, 6.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0047454833984375, -0.0045937299728393555, -0.004441976547241211, -0.004290223121643066, -0.004138469696044922, -0.003986716270446777, -0.003834962844848633, -0.0036832094192504883, -0.0035314559936523438, -0.0033797025680541992, -0.0032279491424560547, -0.00307619571685791, -0.0029244422912597656, -0.002772688865661621, -0.0026209354400634766, -0.002469182014465332, -0.0023174285888671875, -0.002165675163269043, -0.0020139217376708984, -0.001862168312072754, -0.0017104148864746094, -0.0015586614608764648, -0.0014069080352783203, -0.0012551546096801758, -0.0011034011840820312, -0.0009516477584838867, -0.0007998943328857422, -0.0006481409072875977, -0.0004963874816894531, -0.0003446340560913086, -0.00019288063049316406, -4.112720489501953e-05, 0.000110626220703125, 0.00026237964630126953, 0.00041413307189941406, 0.0005658864974975586, 0.0007176399230957031, 0.0008693933486938477, 0.0010211467742919922, 0.0011729001998901367, 0.0013246536254882812, 0.0014764070510864258, 0.0016281604766845703, 0.0017799139022827148, 0.0019316673278808594, 0.002083420753479004, 0.0022351741790771484, 0.002386927604675293, 0.0025386810302734375, 0.002690434455871582, 0.0028421878814697266, 0.002993941307067871, 0.0031456947326660156, 0.00329744815826416, 0.0034492015838623047, 0.0036009550094604492, 0.0037527084350585938, 0.0039044618606567383, 0.004056215286254883, 0.004207968711853027, 0.004359722137451172, 0.004511475563049316, 0.004663228988647461, 0.0048149824142456055, 0.00496673583984375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 20.0, 61.0, 258.0, 405.0, 197.0, 62.0, 12.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004406581283546984, -0.0004297544073779136, -0.0004188506572972983, -0.0004079469363205135, -0.00039704321534372866, -0.00038613949436694384, -0.00037523574428632855, -0.00036433202330954373, -0.0003534283023327589, -0.0003425245813559741, -0.0003316208312753588, -0.00032071711029857397, -0.00030981338932178915, -0.0002989096683450043, -0.00028800591826438904, -0.0002771021972876042, -0.00026619844720698893, -0.0002552947262302041, -0.0002443909761495888, -0.000233487255172804, -0.00022258353419601917, -0.00021167979866731912, -0.00020077606313861907, -0.00018987234216183424, -0.00017896860663313419, -0.00016806487110443413, -0.0001571611501276493, -0.00014625741459894925, -0.0001353536790702492, -0.00012444995809346437, -0.00011354622256476432, -0.00010264249431202188, -9.173873695544899e-05, -8.083500870270655e-05, -6.99312804499641e-05, -5.902754492126405e-05, -4.812381666852161e-05, -3.722008841577917e-05, -2.631635288707912e-05, -1.541262463433668e-05, -4.508896381594241e-06, 6.394833690137602e-06, 1.7298563761869445e-05, 2.8202295652590692e-05, 3.910602390533313e-05, 5.000975215807557e-05, 6.0913487686775625e-05, 7.181721593951806e-05, 8.27209441922605e-05, 9.362467244500294e-05, 0.00010452840069774538, 0.00011543213622644544, 0.00012633585720323026, 0.00013723959273193032, 0.00014814332826063037, 0.0001590470492374152, 0.00016995078476611525, 0.0001808545202948153, 0.00019175824127160013, 0.00020266197680030018, 0.00021356571232900023, 0.00022446943330578506, 0.00023537316883448511, 0.00024627690436318517, 0.00025718062533997]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 0.0, 7.0, 6.0, 3.0, 5.0, 5.0, 14.0, 8.0, 15.0, 15.0, 12.0, 15.0, 21.0, 28.0, 29.0, 23.0, 32.0, 26.0, 33.0, 27.0, 32.0, 37.0, 38.0, 41.0, 37.0, 41.0, 36.0, 33.0, 33.0, 36.0, 29.0, 28.0, 32.0, 42.0, 25.0, 21.0, 20.0, 23.0, 12.0, 18.0, 16.0, 6.0, 6.0, 11.0, 7.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.147954940795898e-05, -7.885601371526718e-05, -7.623247802257538e-05, -7.360894232988358e-05, -7.098540663719177e-05, -6.836187094449997e-05, -6.573833525180817e-05, -6.311479955911636e-05, -6.049126386642456e-05, -5.786772817373276e-05, -5.5244192481040955e-05, -5.262065678834915e-05, -4.999712109565735e-05, -4.7373585402965546e-05, -4.475004971027374e-05, -4.212651401758194e-05, -3.950297832489014e-05, -3.6879442632198334e-05, -3.425590693950653e-05, -3.163237124681473e-05, -2.9008835554122925e-05, -2.6385299861431122e-05, -2.376176416873932e-05, -2.1138228476047516e-05, -1.8514692783355713e-05, -1.589115709066391e-05, -1.3267621397972107e-05, -1.0644085705280304e-05, -8.020550012588501e-06, -5.397014319896698e-06, -2.773478627204895e-06, -1.4994293451309204e-07, 2.473592758178711e-06, 5.097128450870514e-06, 7.720664143562317e-06, 1.034419983625412e-05, 1.2967735528945923e-05, 1.5591271221637726e-05, 1.821480691432953e-05, 2.0838342607021332e-05, 2.3461878299713135e-05, 2.6085413992404938e-05, 2.870894968509674e-05, 3.1332485377788544e-05, 3.395602107048035e-05, 3.657955676317215e-05, 3.920309245586395e-05, 4.1826628148555756e-05, 4.445016384124756e-05, 4.707369953393936e-05, 4.9697235226631165e-05, 5.232077091932297e-05, 5.494430661201477e-05, 5.7567842304706573e-05, 6.0191377997398376e-05, 6.281491369009018e-05, 6.543844938278198e-05, 6.806198507547379e-05, 7.068552076816559e-05, 7.330905646085739e-05, 7.59325921535492e-05, 7.8556127846241e-05, 8.11796635389328e-05, 8.38031992316246e-05, 8.64267349243164e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 6.0, 9.0, 14.0, 12.0, 15.0, 19.0, 9.0, 20.0, 29.0, 30.0, 34.0, 35.0, 37.0, 33.0, 40.0, 46.0, 54.0, 40.0, 54.0, 44.0, 45.0, 29.0, 37.0, 32.0, 42.0, 29.0, 37.0, 23.0, 20.0, 21.0, 17.0, 12.0, 11.0, 11.0, 10.0, 9.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.4609375, -4.3212890625, -4.181640625, -4.0419921875, -3.90234375, -3.7626953125, -3.623046875, -3.4833984375, -3.34375, -3.2041015625, -3.064453125, -2.9248046875, -2.78515625, -2.6455078125, -2.505859375, -2.3662109375, -2.2265625, -2.0869140625, -1.947265625, -1.8076171875, -1.66796875, -1.5283203125, -1.388671875, -1.2490234375, -1.109375, -0.9697265625, -0.830078125, -0.6904296875, -0.55078125, -0.4111328125, -0.271484375, -0.1318359375, 0.0078125, 0.1474609375, 0.287109375, 0.4267578125, 0.56640625, 0.7060546875, 0.845703125, 0.9853515625, 1.125, 1.2646484375, 1.404296875, 1.5439453125, 1.68359375, 1.8232421875, 1.962890625, 2.1025390625, 2.2421875, 2.3818359375, 2.521484375, 2.6611328125, 2.80078125, 2.9404296875, 3.080078125, 3.2197265625, 3.359375, 3.4990234375, 3.638671875, 3.7783203125, 3.91796875, 4.0576171875, 4.197265625, 4.3369140625, 4.4765625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 10.0, 19.0, 20.0, 15.0, 33.0, 46.0, 58.0, 62.0, 119.0, 185.0, 226.0, 373.0, 626.0, 1044.0, 1964.0, 4041.0, 9956.0, 27780.0, 110545.0, 456058.0, 329090.0, 70941.0, 20447.0, 7600.0, 3197.0, 1577.0, 896.0, 534.0, 355.0, 227.0, 133.0, 106.0, 74.0, 61.0, 35.0, 21.0, 18.0, 13.0, 9.0, 12.0, 8.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16796875, -5.0057373046875, -4.843505859375, -4.6812744140625, -4.51904296875, -4.3568115234375, -4.194580078125, -4.0323486328125, -3.8701171875, -3.7078857421875, -3.545654296875, -3.3834228515625, -3.22119140625, -3.0589599609375, -2.896728515625, -2.7344970703125, -2.572265625, -2.4100341796875, -2.247802734375, -2.0855712890625, -1.92333984375, -1.7611083984375, -1.598876953125, -1.4366455078125, -1.2744140625, -1.1121826171875, -0.949951171875, -0.7877197265625, -0.62548828125, -0.4632568359375, -0.301025390625, -0.1387939453125, 0.0234375, 0.1856689453125, 0.347900390625, 0.5101318359375, 0.67236328125, 0.8345947265625, 0.996826171875, 1.1590576171875, 1.3212890625, 1.4835205078125, 1.645751953125, 1.8079833984375, 1.97021484375, 2.1324462890625, 2.294677734375, 2.4569091796875, 2.619140625, 2.7813720703125, 2.943603515625, 3.1058349609375, 3.26806640625, 3.4302978515625, 3.592529296875, 3.7547607421875, 3.9169921875, 4.0792236328125, 4.241455078125, 4.4036865234375, 4.56591796875, 4.7281494140625, 4.890380859375, 5.0526123046875, 5.21484375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 4.0, 9.0, 5.0, 11.0, 10.0, 17.0, 13.0, 25.0, 19.0, 39.0, 38.0, 46.0, 40.0, 53.0, 68.0, 115.0, 1657.0, 383.0, 91.0, 66.0, 54.0, 60.0, 36.0, 37.0, 33.0, 26.0, 16.0, 20.0, 22.0, 16.0, 9.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.984375, -21.35400390625, -20.7236328125, -20.09326171875, -19.462890625, -18.83251953125, -18.2021484375, -17.57177734375, -16.94140625, -16.31103515625, -15.6806640625, -15.05029296875, -14.419921875, -13.78955078125, -13.1591796875, -12.52880859375, -11.8984375, -11.26806640625, -10.6376953125, -10.00732421875, -9.376953125, -8.74658203125, -8.1162109375, -7.48583984375, -6.85546875, -6.22509765625, -5.5947265625, -4.96435546875, -4.333984375, -3.70361328125, -3.0732421875, -2.44287109375, -1.8125, -1.18212890625, -0.5517578125, 0.07861328125, 0.708984375, 1.33935546875, 1.9697265625, 2.60009765625, 3.23046875, 3.86083984375, 4.4912109375, 5.12158203125, 5.751953125, 6.38232421875, 7.0126953125, 7.64306640625, 8.2734375, 8.90380859375, 9.5341796875, 10.16455078125, 10.794921875, 11.42529296875, 12.0556640625, 12.68603515625, 13.31640625, 13.94677734375, 14.5771484375, 15.20751953125, 15.837890625, 16.46826171875, 17.0986328125, 17.72900390625, 18.359375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 4.0, 5.0, 12.0, 14.0, 15.0, 19.0, 21.0, 22.0, 31.0, 37.0, 60.0, 76.0, 124.0, 184.0, 398.0, 1204.0, 10614.0, 2760720.0, 365540.0, 4932.0, 800.0, 320.0, 170.0, 91.0, 70.0, 47.0, 37.0, 25.0, 24.0, 12.0, 20.0, 11.0, 12.0, 6.0, 7.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.234375, -22.336181640625, -21.43798828125, -20.539794921875, -19.6416015625, -18.743408203125, -17.84521484375, -16.947021484375, -16.048828125, -15.150634765625, -14.25244140625, -13.354248046875, -12.4560546875, -11.557861328125, -10.65966796875, -9.761474609375, -8.86328125, -7.965087890625, -7.06689453125, -6.168701171875, -5.2705078125, -4.372314453125, -3.47412109375, -2.575927734375, -1.677734375, -0.779541015625, 0.11865234375, 1.016845703125, 1.9150390625, 2.813232421875, 3.71142578125, 4.609619140625, 5.5078125, 6.406005859375, 7.30419921875, 8.202392578125, 9.1005859375, 9.998779296875, 10.89697265625, 11.795166015625, 12.693359375, 13.591552734375, 14.48974609375, 15.387939453125, 16.2861328125, 17.184326171875, 18.08251953125, 18.980712890625, 19.87890625, 20.777099609375, 21.67529296875, 22.573486328125, 23.4716796875, 24.369873046875, 25.26806640625, 26.166259765625, 27.064453125, 27.962646484375, 28.86083984375, 29.759033203125, 30.6572265625, 31.555419921875, 32.45361328125, 33.351806640625, 34.25]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 12.0, 159.0, 634.0, 205.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.68896484375, -126.63888549804688, -123.58880615234375, -120.53873443603516, -117.48865509033203, -114.4385757446289, -111.38850402832031, -108.33842468261719, -105.28834533691406, -102.23826599121094, -99.18818664550781, -96.13811492919922, -93.0880355834961, -90.03795623779297, -86.98788452148438, -83.93780517578125, -80.88772583007812, -77.837646484375, -74.78756713867188, -71.73749542236328, -68.68741607666016, -65.63733673095703, -62.58726119995117, -59.53718566894531, -56.48710632324219, -53.43702697753906, -50.3869514465332, -47.336875915527344, -44.28679656982422, -41.236717224121094, -38.186641693115234, -35.136566162109375, -32.08648681640625, -29.036409378051758, -25.986331939697266, -22.936254501342773, -19.88617706298828, -16.83609962463379, -13.786022186279297, -10.735944747924805, -7.6858673095703125, -4.63578987121582, -1.5857124328613281, 1.464365005493164, 4.514442443847656, 7.564519882202148, 10.61459732055664, 13.664674758911133, 16.714752197265625, 19.764829635620117, 22.81490707397461, 25.8649845123291, 28.915061950683594, 31.965139389038086, 35.01521682739258, 38.06529235839844, 41.11537170410156, 44.16545104980469, 47.21552658081055, 50.265602111816406, 53.31568145751953, 56.365760803222656, 59.415836334228516, 62.465911865234375, 65.5159912109375]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 2.0, 10.0, 8.0, 9.0, 8.0, 13.0, 20.0, 18.0, 24.0, 24.0, 32.0, 32.0, 33.0, 46.0, 34.0, 46.0, 43.0, 53.0, 43.0, 39.0, 52.0, 32.0, 51.0, 43.0, 42.0, 28.0, 27.0, 20.0, 33.0, 20.0, 14.0, 17.0, 17.0, 10.0, 5.0, 12.0, 5.0, 9.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.86970901489258, -51.22285079956055, -49.575992584228516, -47.929134368896484, -46.28227615356445, -44.63541793823242, -42.988563537597656, -41.341705322265625, -39.694847106933594, -38.04798889160156, -36.40113067626953, -34.7542724609375, -33.10741424560547, -31.460556030273438, -29.81369972229004, -28.166841506958008, -26.519981384277344, -24.873123168945312, -23.22626495361328, -21.57940673828125, -19.93254852294922, -18.285690307617188, -16.63883399963379, -14.991975784301758, -13.345117568969727, -11.698259353637695, -10.051401138305664, -8.40454387664795, -6.757685661315918, -5.110827445983887, -3.463970184326172, -1.8171119689941406, -0.170257568359375, 1.4766004085540771, 3.1234583854675293, 4.770316123962402, 6.417174339294434, 8.064032554626465, 9.71088981628418, 11.357748031616211, 13.004606246948242, 14.651464462280273, 16.298322677612305, 17.945178985595703, 19.592037200927734, 21.238895416259766, 22.885753631591797, 24.532611846923828, 26.17947006225586, 27.82632827758789, 29.473186492919922, 31.120044708251953, 32.766902923583984, 34.413761138916016, 36.06061553955078, 37.70747375488281, 39.354331970214844, 41.001190185546875, 42.648048400878906, 44.29490661621094, 45.94176483154297, 47.588623046875, 49.23548126220703, 50.88233947753906, 52.529197692871094]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 14.0, 10.0, 9.0, 9.0, 13.0, 19.0, 20.0, 25.0, 15.0, 29.0, 27.0, 31.0, 43.0, 43.0, 43.0, 40.0, 40.0, 49.0, 52.0, 45.0, 35.0, 35.0, 35.0, 30.0, 54.0, 37.0, 23.0, 24.0, 24.0, 14.0, 21.0, 17.0, 10.0, 14.0, 3.0, 10.0, 14.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.47265625, -4.3291015625, -4.185546875, -4.0419921875, -3.8984375, -3.7548828125, -3.611328125, -3.4677734375, -3.32421875, -3.1806640625, -3.037109375, -2.8935546875, -2.75, -2.6064453125, -2.462890625, -2.3193359375, -2.17578125, -2.0322265625, -1.888671875, -1.7451171875, -1.6015625, -1.4580078125, -1.314453125, -1.1708984375, -1.02734375, -0.8837890625, -0.740234375, -0.5966796875, -0.453125, -0.3095703125, -0.166015625, -0.0224609375, 0.12109375, 0.2646484375, 0.408203125, 0.5517578125, 0.6953125, 0.8388671875, 0.982421875, 1.1259765625, 1.26953125, 1.4130859375, 1.556640625, 1.7001953125, 1.84375, 1.9873046875, 2.130859375, 2.2744140625, 2.41796875, 2.5615234375, 2.705078125, 2.8486328125, 2.9921875, 3.1357421875, 3.279296875, 3.4228515625, 3.56640625, 3.7099609375, 3.853515625, 3.9970703125, 4.140625, 4.2841796875, 4.427734375, 4.5712890625, 4.71484375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 7.0, 10.0, 7.0, 11.0, 12.0, 12.0, 17.0, 19.0, 25.0, 45.0, 51.0, 82.0, 148.0, 231.0, 516.0, 1293.0, 3907.0, 16092.0, 96723.0, 717160.0, 2234878.0, 962300.0, 132323.0, 20904.0, 4796.0, 1496.0, 510.0, 265.0, 129.0, 69.0, 49.0, 36.0, 30.0, 30.0, 17.0, 16.0, 13.0, 5.0, 9.0, 10.0, 5.0, 7.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.2296142578125, -7.951416015625, -7.6732177734375, -7.39501953125, -7.1168212890625, -6.838623046875, -6.5604248046875, -6.2822265625, -6.0040283203125, -5.725830078125, -5.4476318359375, -5.16943359375, -4.8912353515625, -4.613037109375, -4.3348388671875, -4.056640625, -3.7784423828125, -3.500244140625, -3.2220458984375, -2.94384765625, -2.6656494140625, -2.387451171875, -2.1092529296875, -1.8310546875, -1.5528564453125, -1.274658203125, -0.9964599609375, -0.71826171875, -0.4400634765625, -0.161865234375, 0.1163330078125, 0.39453125, 0.6727294921875, 0.950927734375, 1.2291259765625, 1.50732421875, 1.7855224609375, 2.063720703125, 2.3419189453125, 2.6201171875, 2.8983154296875, 3.176513671875, 3.4547119140625, 3.73291015625, 4.0111083984375, 4.289306640625, 4.5675048828125, 4.845703125, 5.1239013671875, 5.402099609375, 5.6802978515625, 5.95849609375, 6.2366943359375, 6.514892578125, 6.7930908203125, 7.0712890625, 7.3494873046875, 7.627685546875, 7.9058837890625, 8.18408203125, 8.4622802734375, 8.740478515625, 9.0186767578125, 9.296875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 1.0, 10.0, 5.0, 19.0, 26.0, 36.0, 55.0, 97.0, 131.0, 166.0, 256.0, 336.0, 460.0, 517.0, 526.0, 433.0, 296.0, 207.0, 174.0, 90.0, 77.0, 68.0, 23.0, 19.0, 18.0, 12.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5390625, -13.085693359375, -12.63232421875, -12.178955078125, -11.7255859375, -11.272216796875, -10.81884765625, -10.365478515625, -9.912109375, -9.458740234375, -9.00537109375, -8.552001953125, -8.0986328125, -7.645263671875, -7.19189453125, -6.738525390625, -6.28515625, -5.831787109375, -5.37841796875, -4.925048828125, -4.4716796875, -4.018310546875, -3.56494140625, -3.111572265625, -2.658203125, -2.204833984375, -1.75146484375, -1.298095703125, -0.8447265625, -0.391357421875, 0.06201171875, 0.515380859375, 0.96875, 1.422119140625, 1.87548828125, 2.328857421875, 2.7822265625, 3.235595703125, 3.68896484375, 4.142333984375, 4.595703125, 5.049072265625, 5.50244140625, 5.955810546875, 6.4091796875, 6.862548828125, 7.31591796875, 7.769287109375, 8.22265625, 8.676025390625, 9.12939453125, 9.582763671875, 10.0361328125, 10.489501953125, 10.94287109375, 11.396240234375, 11.849609375, 12.302978515625, 12.75634765625, 13.209716796875, 13.6630859375, 14.116455078125, 14.56982421875, 15.023193359375, 15.4765625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 16.0, 12.0, 26.0, 34.0, 44.0, 80.0, 132.0, 224.0, 568.0, 2617.0, 385589.0, 3788994.0, 14177.0, 955.0, 340.0, 182.0, 91.0, 56.0, 50.0, 30.0, 19.0, 17.0, 11.0, 5.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.8125, -56.07275390625, -54.3330078125, -52.59326171875, -50.853515625, -49.11376953125, -47.3740234375, -45.63427734375, -43.89453125, -42.15478515625, -40.4150390625, -38.67529296875, -36.935546875, -35.19580078125, -33.4560546875, -31.71630859375, -29.9765625, -28.23681640625, -26.4970703125, -24.75732421875, -23.017578125, -21.27783203125, -19.5380859375, -17.79833984375, -16.05859375, -14.31884765625, -12.5791015625, -10.83935546875, -9.099609375, -7.35986328125, -5.6201171875, -3.88037109375, -2.140625, -0.40087890625, 1.3388671875, 3.07861328125, 4.818359375, 6.55810546875, 8.2978515625, 10.03759765625, 11.77734375, 13.51708984375, 15.2568359375, 16.99658203125, 18.736328125, 20.47607421875, 22.2158203125, 23.95556640625, 25.6953125, 27.43505859375, 29.1748046875, 30.91455078125, 32.654296875, 34.39404296875, 36.1337890625, 37.87353515625, 39.61328125, 41.35302734375, 43.0927734375, 44.83251953125, 46.572265625, 48.31201171875, 50.0517578125, 51.79150390625, 53.53125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 111.0, 378.0, 402.0, 113.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-282.3742370605469, -275.4939880371094, -268.6137390136719, -261.7334899902344, -254.85325622558594, -247.97300720214844, -241.0927734375, -234.2125244140625, -227.332275390625, -220.4520263671875, -213.57177734375, -206.69154357910156, -199.81129455566406, -192.93104553222656, -186.05081176757812, -179.17056274414062, -172.29031372070312, -165.41006469726562, -158.52981567382812, -151.6495819091797, -144.7693328857422, -137.8890838623047, -131.00885009765625, -124.12860107421875, -117.24835205078125, -110.36810302734375, -103.48786163330078, -96.60762023925781, -89.72737121582031, -82.84712219238281, -75.96688079833984, -69.08663940429688, -62.20637512207031, -55.32612991333008, -48.445884704589844, -41.56563949584961, -34.685394287109375, -27.80514907836914, -20.924903869628906, -14.044658660888672, -7.1644134521484375, -0.2841682434082031, 6.596076965332031, 13.476322174072266, 20.3565673828125, 27.236812591552734, 34.11705780029297, 40.9973030090332, 47.87754821777344, 54.75779342651367, 61.638038635253906, 68.51828002929688, 75.39852905273438, 82.27877807617188, 89.15901947021484, 96.03926086425781, 102.91950988769531, 109.79975891113281, 116.68000030517578, 123.56024169921875, 130.44049072265625, 137.32073974609375, 144.20098876953125, 151.0812225341797, 157.9614715576172]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 3.0, 8.0, 9.0, 12.0, 13.0, 8.0, 20.0, 21.0, 19.0, 23.0, 27.0, 19.0, 35.0, 37.0, 26.0, 41.0, 41.0, 49.0, 39.0, 46.0, 40.0, 40.0, 31.0, 25.0, 42.0, 29.0, 44.0, 38.0, 40.0, 24.0, 24.0, 12.0, 15.0, 16.0, 10.0, 16.0, 9.0, 14.0, 7.0, 10.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.73896408081055, -39.46942138671875, -38.19987869262695, -36.930335998535156, -35.66079330444336, -34.39125061035156, -33.121707916259766, -31.85216522216797, -30.582622528076172, -29.313079833984375, -28.043537139892578, -26.77399444580078, -25.504451751708984, -24.234909057617188, -22.96536636352539, -21.695823669433594, -20.426280975341797, -19.15673828125, -17.887195587158203, -16.617652893066406, -15.34811019897461, -14.078567504882812, -12.809024810791016, -11.539482116699219, -10.269939422607422, -9.000396728515625, -7.730854034423828, -6.461311340332031, -5.191768646240234, -3.9222259521484375, -2.6526832580566406, -1.3831405639648438, -0.1136016845703125, 1.1559410095214844, 2.4254837036132812, 3.695026397705078, 4.964569091796875, 6.234111785888672, 7.503654479980469, 8.773197174072266, 10.042739868164062, 11.31228256225586, 12.581825256347656, 13.851367950439453, 15.12091064453125, 16.390453338623047, 17.659996032714844, 18.92953872680664, 20.199081420898438, 21.468624114990234, 22.73816680908203, 24.007709503173828, 25.277252197265625, 26.546794891357422, 27.81633758544922, 29.085880279541016, 30.355422973632812, 31.62496566772461, 32.894508361816406, 34.1640510559082, 35.43359375, 36.7031364440918, 37.972679138183594, 39.24222183227539, 40.51176452636719]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 10.0, 9.0, 8.0, 5.0, 14.0, 9.0, 13.0, 20.0, 21.0, 22.0, 21.0, 27.0, 31.0, 40.0, 41.0, 42.0, 38.0, 39.0, 42.0, 34.0, 50.0, 49.0, 43.0, 34.0, 45.0, 31.0, 35.0, 30.0, 28.0, 28.0, 25.0, 20.0, 12.0, 25.0, 14.0, 13.0, 8.0, 5.0, 2.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.60546875, -4.4609375, -4.31640625, -4.171875, -4.02734375, -3.8828125, -3.73828125, -3.59375, -3.44921875, -3.3046875, -3.16015625, -3.015625, -2.87109375, -2.7265625, -2.58203125, -2.4375, -2.29296875, -2.1484375, -2.00390625, -1.859375, -1.71484375, -1.5703125, -1.42578125, -1.28125, -1.13671875, -0.9921875, -0.84765625, -0.703125, -0.55859375, -0.4140625, -0.26953125, -0.125, 0.01953125, 0.1640625, 0.30859375, 0.453125, 0.59765625, 0.7421875, 0.88671875, 1.03125, 1.17578125, 1.3203125, 1.46484375, 1.609375, 1.75390625, 1.8984375, 2.04296875, 2.1875, 2.33203125, 2.4765625, 2.62109375, 2.765625, 2.91015625, 3.0546875, 3.19921875, 3.34375, 3.48828125, 3.6328125, 3.77734375, 3.921875, 4.06640625, 4.2109375, 4.35546875, 4.5, 4.64453125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 2.0, 3.0, 9.0, 6.0, 7.0, 9.0, 27.0, 38.0, 47.0, 76.0, 100.0, 140.0, 186.0, 260.0, 393.0, 550.0, 935.0, 1324.0, 1816.0, 2910.0, 4409.0, 6682.0, 10136.0, 15556.0, 24445.0, 39063.0, 65111.0, 116630.0, 292731.0, 211639.0, 99001.0, 56776.0, 34774.0, 21770.0, 13975.0, 9166.0, 5763.0, 4006.0, 2610.0, 1761.0, 1145.0, 822.0, 542.0, 393.0, 252.0, 179.0, 130.0, 77.0, 58.0, 32.0, 28.0, 15.0, 16.0, 11.0, 11.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.2177734375, -1.1795654296875, -1.141357421875, -1.1031494140625, -1.06494140625, -1.0267333984375, -0.988525390625, -0.9503173828125, -0.912109375, -0.8739013671875, -0.835693359375, -0.7974853515625, -0.75927734375, -0.7210693359375, -0.682861328125, -0.6446533203125, -0.6064453125, -0.5682373046875, -0.530029296875, -0.4918212890625, -0.45361328125, -0.4154052734375, -0.377197265625, -0.3389892578125, -0.30078125, -0.2625732421875, -0.224365234375, -0.1861572265625, -0.14794921875, -0.1097412109375, -0.071533203125, -0.0333251953125, 0.0048828125, 0.0430908203125, 0.081298828125, 0.1195068359375, 0.15771484375, 0.1959228515625, 0.234130859375, 0.2723388671875, 0.310546875, 0.3487548828125, 0.386962890625, 0.4251708984375, 0.46337890625, 0.5015869140625, 0.539794921875, 0.5780029296875, 0.6162109375, 0.6544189453125, 0.692626953125, 0.7308349609375, 0.76904296875, 0.8072509765625, 0.845458984375, 0.8836669921875, 0.921875, 0.9600830078125, 0.998291015625, 1.0364990234375, 1.07470703125, 1.1129150390625, 1.151123046875, 1.1893310546875, 1.2275390625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 13.0, 4.0, 7.0, 10.0, 8.0, 21.0, 14.0, 12.0, 9.0, 15.0, 27.0, 28.0, 28.0, 30.0, 33.0, 35.0, 36.0, 36.0, 41.0, 52.0, 44.0, 1061.0, 27.0, 45.0, 48.0, 37.0, 34.0, 41.0, 30.0, 20.0, 23.0, 25.0, 13.0, 17.0, 10.0, 13.0, 12.0, 12.0, 11.0, 6.0, 8.0, 6.0, 2.0, 7.0, 2.0, 2.0, 3.0, 5.0], "bins": [-3.224609375, -3.138519287109375, -3.05242919921875, -2.966339111328125, -2.8802490234375, -2.794158935546875, -2.70806884765625, -2.621978759765625, -2.535888671875, -2.449798583984375, -2.36370849609375, -2.277618408203125, -2.1915283203125, -2.105438232421875, -2.01934814453125, -1.933258056640625, -1.84716796875, -1.761077880859375, -1.67498779296875, -1.588897705078125, -1.5028076171875, -1.416717529296875, -1.33062744140625, -1.244537353515625, -1.158447265625, -1.072357177734375, -0.98626708984375, -0.900177001953125, -0.8140869140625, -0.727996826171875, -0.64190673828125, -0.555816650390625, -0.4697265625, -0.383636474609375, -0.29754638671875, -0.211456298828125, -0.1253662109375, -0.039276123046875, 0.04681396484375, 0.132904052734375, 0.218994140625, 0.305084228515625, 0.39117431640625, 0.477264404296875, 0.5633544921875, 0.649444580078125, 0.73553466796875, 0.821624755859375, 0.90771484375, 0.993804931640625, 1.07989501953125, 1.165985107421875, 1.2520751953125, 1.338165283203125, 1.42425537109375, 1.510345458984375, 1.596435546875, 1.682525634765625, 1.76861572265625, 1.854705810546875, 1.9407958984375, 2.026885986328125, 2.11297607421875, 2.199066162109375, 2.28515625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 9.0, 10.0, 29.0, 27.0, 56.0, 89.0, 123.0, 172.0, 328.0, 453.0, 700.0, 1106.0, 1740.0, 2517.0, 3534.0, 5161.0, 7542.0, 11625.0, 18031.0, 28001.0, 44346.0, 73368.0, 135262.0, 1373899.0, 164981.0, 83852.0, 49797.0, 30991.0, 20323.0, 12779.0, 8577.0, 5611.0, 3962.0, 2644.0, 1838.0, 1261.0, 915.0, 517.0, 342.0, 219.0, 140.0, 89.0, 48.0, 46.0, 23.0, 15.0, 16.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-1.212890625, -1.17681884765625, -1.1407470703125, -1.10467529296875, -1.068603515625, -1.03253173828125, -0.9964599609375, -0.96038818359375, -0.92431640625, -0.88824462890625, -0.8521728515625, -0.81610107421875, -0.780029296875, -0.74395751953125, -0.7078857421875, -0.67181396484375, -0.6357421875, -0.59967041015625, -0.5635986328125, -0.52752685546875, -0.491455078125, -0.45538330078125, -0.4193115234375, -0.38323974609375, -0.34716796875, -0.31109619140625, -0.2750244140625, -0.23895263671875, -0.202880859375, -0.16680908203125, -0.1307373046875, -0.09466552734375, -0.05859375, -0.02252197265625, 0.0135498046875, 0.04962158203125, 0.085693359375, 0.12176513671875, 0.1578369140625, 0.19390869140625, 0.22998046875, 0.26605224609375, 0.3021240234375, 0.33819580078125, 0.374267578125, 0.41033935546875, 0.4464111328125, 0.48248291015625, 0.5185546875, 0.55462646484375, 0.5906982421875, 0.62677001953125, 0.662841796875, 0.69891357421875, 0.7349853515625, 0.77105712890625, 0.80712890625, 0.84320068359375, 0.8792724609375, 0.91534423828125, 0.951416015625, 0.98748779296875, 1.0235595703125, 1.05963134765625, 1.095703125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 6.0, 8.0, 9.0, 15.0, 16.0, 19.0, 21.0, 15.0, 20.0, 18.0, 43.0, 44.0, 44.0, 71.0, 82.0, 84.0, 82.0, 60.0, 47.0, 65.0, 38.0, 31.0, 37.0, 22.0, 20.0, 19.0, 7.0, 14.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00020885467529296875, -0.0002026595175266266, -0.00019646435976028442, -0.00019026920199394226, -0.0001840740442276001, -0.00017787888646125793, -0.00017168372869491577, -0.0001654885709285736, -0.00015929341316223145, -0.00015309825539588928, -0.00014690309762954712, -0.00014070793986320496, -0.0001345127820968628, -0.00012831762433052063, -0.00012212246656417847, -0.0001159273087978363, -0.00010973215103149414, -0.00010353699326515198, -9.734183549880981e-05, -9.114667773246765e-05, -8.495151996612549e-05, -7.875636219978333e-05, -7.256120443344116e-05, -6.6366046667099e-05, -6.0170888900756836e-05, -5.397573113441467e-05, -4.778057336807251e-05, -4.158541560173035e-05, -3.5390257835388184e-05, -2.919510006904602e-05, -2.2999942302703857e-05, -1.6804784536361694e-05, -1.0609626770019531e-05, -4.414469003677368e-06, 1.780688762664795e-06, 7.975846529006958e-06, 1.4171004295349121e-05, 2.0366162061691284e-05, 2.6561319828033447e-05, 3.275647759437561e-05, 3.8951635360717773e-05, 4.5146793127059937e-05, 5.13419508934021e-05, 5.753710865974426e-05, 6.373226642608643e-05, 6.992742419242859e-05, 7.612258195877075e-05, 8.231773972511292e-05, 8.851289749145508e-05, 9.470805525779724e-05, 0.0001009032130241394, 0.00010709837079048157, 0.00011329352855682373, 0.0001194886863231659, 0.00012568384408950806, 0.00013187900185585022, 0.00013807415962219238, 0.00014426931738853455, 0.0001504644751548767, 0.00015665963292121887, 0.00016285479068756104, 0.0001690499484539032, 0.00017524510622024536, 0.00018144026398658752, 0.0001876354217529297]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 18.0, 12.0, 19.0, 28.0, 29.0, 44.0, 70.0, 98.0, 136.0, 185.0, 260.0, 437.0, 1432.0, 798005.0, 245391.0, 1048.0, 461.0, 296.0, 179.0, 109.0, 72.0, 56.0, 40.0, 41.0, 28.0, 9.0, 13.0, 6.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0040283203125, -0.003898024559020996, -0.003767728805541992, -0.0036374330520629883, -0.0035071372985839844, -0.0033768415451049805, -0.0032465457916259766, -0.0031162500381469727, -0.0029859542846679688, -0.002855658531188965, -0.002725362777709961, -0.002595067024230957, -0.002464771270751953, -0.0023344755172729492, -0.0022041797637939453, -0.0020738840103149414, -0.0019435882568359375, -0.0018132925033569336, -0.0016829967498779297, -0.0015527009963989258, -0.0014224052429199219, -0.001292109489440918, -0.001161813735961914, -0.0010315179824829102, -0.0009012222290039062, -0.0007709264755249023, -0.0006406307220458984, -0.0005103349685668945, -0.0003800392150878906, -0.0002497434616088867, -0.00011944770812988281, 1.0848045349121094e-05, 0.000141143798828125, 0.0002714395523071289, 0.0004017353057861328, 0.0005320310592651367, 0.0006623268127441406, 0.0007926225662231445, 0.0009229183197021484, 0.0010532140731811523, 0.0011835098266601562, 0.0013138055801391602, 0.001444101333618164, 0.001574397087097168, 0.0017046928405761719, 0.0018349885940551758, 0.0019652843475341797, 0.0020955801010131836, 0.0022258758544921875, 0.0023561716079711914, 0.0024864673614501953, 0.0026167631149291992, 0.002747058868408203, 0.002877354621887207, 0.003007650375366211, 0.003137946128845215, 0.0032682418823242188, 0.0033985376358032227, 0.0035288333892822266, 0.0036591291427612305, 0.0037894248962402344, 0.003919720649719238, 0.004050016403198242, 0.004180312156677246, 0.00431060791015625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 35.0, 245.0, 465.0, 230.0, 35.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000203538074856624, -0.00018842345161829144, -0.00017330881382804364, -0.00015819419058971107, -0.00014307955279946327, -0.0001279649295611307, -0.00011285030632279813, -9.773567580850795e-05, -8.262104529421777e-05, -6.750641477992758e-05, -5.2391787903616205e-05, -3.727716102730483e-05, -2.2162530513014644e-05, -7.047899998724461e-06, 8.066723239608109e-06, 2.3181353753898293e-05, 3.8295984268188477e-05, 5.341061478247866e-05, 6.852524529676884e-05, 8.363986853510141e-05, 9.87544990493916e-05, 0.00011386912956368178, 0.00012898375280201435, 0.00014409839059226215, 0.00015921301383059472, 0.0001743276370689273, 0.00018944227485917509, 0.00020455689809750766, 0.00021967152133584023, 0.00023478615912608802, 0.0002499007969163358, 0.00026501540560275316, 0.0002801300142891705, 0.0002952446520794183, 0.00031035926076583564, 0.00032547389855608344, 0.00034058853634633124, 0.00035570317413657904, 0.0003708177828229964, 0.0003859324206132442, 0.000401047058403492, 0.00041616169619373977, 0.0004312763048801571, 0.0004463909426704049, 0.0004615055804606527, 0.0004766202182509005, 0.0004917348269373178, 0.0005068494356237352, 0.0005219640443101525, 0.0005370786529965699, 0.0005521933198906481, 0.0005673079285770655, 0.0005824225372634828, 0.0005975372041575611, 0.0006126518128439784, 0.0006277664215303957, 0.000642881088424474, 0.0006579956971108913, 0.0006731103640049696, 0.0006882249726913869, 0.0007033395813778043, 0.0007184542482718825, 0.0007335688569582999, 0.0007486834656447172, 0.0007637981325387955]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 6.0, 10.0, 7.0, 10.0, 8.0, 18.0, 16.0, 24.0, 10.0, 30.0, 22.0, 24.0, 28.0, 42.0, 40.0, 43.0, 40.0, 35.0, 36.0, 50.0, 39.0, 38.0, 40.0, 34.0, 36.0, 40.0, 27.0, 24.0, 27.0, 29.0, 23.0, 20.0, 18.0, 20.0, 22.0, 11.0, 13.0, 11.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.626150131225586e-05, -9.333807975053787e-05, -9.041465818881989e-05, -8.74912366271019e-05, -8.456781506538391e-05, -8.164439350366592e-05, -7.872097194194794e-05, -7.579755038022995e-05, -7.287412881851196e-05, -6.995070725679398e-05, -6.702728569507599e-05, -6.4103864133358e-05, -6.118044257164001e-05, -5.825702100992203e-05, -5.533359944820404e-05, -5.2410177886486053e-05, -4.9486756324768066e-05, -4.656333476305008e-05, -4.363991320133209e-05, -4.0716491639614105e-05, -3.779307007789612e-05, -3.486964851617813e-05, -3.1946226954460144e-05, -2.9022805392742157e-05, -2.609938383102417e-05, -2.3175962269306183e-05, -2.0252540707588196e-05, -1.732911914587021e-05, -1.4405697584152222e-05, -1.1482276022434235e-05, -8.558854460716248e-06, -5.6354328989982605e-06, -2.7120113372802734e-06, 2.1141022443771362e-07, 3.1348317861557007e-06, 6.058253347873688e-06, 8.981674909591675e-06, 1.1905096471309662e-05, 1.4828518033027649e-05, 1.7751939594745636e-05, 2.0675361156463623e-05, 2.359878271818161e-05, 2.6522204279899597e-05, 2.9445625841617584e-05, 3.236904740333557e-05, 3.529246896505356e-05, 3.8215890526771545e-05, 4.113931208848953e-05, 4.406273365020752e-05, 4.6986155211925507e-05, 4.9909576773643494e-05, 5.283299833536148e-05, 5.575641989707947e-05, 5.8679841458797455e-05, 6.160326302051544e-05, 6.452668458223343e-05, 6.745010614395142e-05, 7.03735277056694e-05, 7.329694926738739e-05, 7.622037082910538e-05, 7.914379239082336e-05, 8.206721395254135e-05, 8.499063551425934e-05, 8.791405707597733e-05, 9.083747863769531e-05]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 10.0, 9.0, 8.0, 5.0, 14.0, 9.0, 13.0, 20.0, 21.0, 22.0, 21.0, 27.0, 31.0, 40.0, 41.0, 42.0, 38.0, 39.0, 42.0, 34.0, 50.0, 49.0, 43.0, 34.0, 45.0, 31.0, 35.0, 30.0, 28.0, 28.0, 25.0, 20.0, 12.0, 25.0, 14.0, 13.0, 8.0, 5.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.60546875, -4.4609375, -4.31640625, -4.171875, -4.02734375, -3.8828125, -3.73828125, -3.59375, -3.44921875, -3.3046875, -3.16015625, -3.015625, -2.87109375, -2.7265625, -2.58203125, -2.4375, -2.29296875, -2.1484375, -2.00390625, -1.859375, -1.71484375, -1.5703125, -1.42578125, -1.28125, -1.13671875, -0.9921875, -0.84765625, -0.703125, -0.55859375, -0.4140625, -0.26953125, -0.125, 0.01953125, 0.1640625, 0.30859375, 0.453125, 0.59765625, 0.7421875, 0.88671875, 1.03125, 1.17578125, 1.3203125, 1.46484375, 1.609375, 1.75390625, 1.8984375, 2.04296875, 2.1875, 2.33203125, 2.4765625, 2.62109375, 2.765625, 2.91015625, 3.0546875, 3.19921875, 3.34375, 3.48828125, 3.6328125, 3.77734375, 3.921875, 4.06640625, 4.2109375, 4.35546875, 4.5, 4.64453125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 12.0, 12.0, 12.0, 18.0, 22.0, 48.0, 63.0, 136.0, 203.0, 311.0, 516.0, 965.0, 1779.0, 3374.0, 6440.0, 13461.0, 28829.0, 66449.0, 150012.0, 267217.0, 257463.0, 138308.0, 61261.0, 26297.0, 12174.0, 6093.0, 3054.0, 1785.0, 900.0, 479.0, 293.0, 183.0, 123.0, 91.0, 50.0, 36.0, 22.0, 13.0, 14.0, 7.0, 8.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8359375, -2.741241455078125, -2.64654541015625, -2.551849365234375, -2.4571533203125, -2.362457275390625, -2.26776123046875, -2.173065185546875, -2.078369140625, -1.983673095703125, -1.88897705078125, -1.794281005859375, -1.6995849609375, -1.604888916015625, -1.51019287109375, -1.415496826171875, -1.32080078125, -1.226104736328125, -1.13140869140625, -1.036712646484375, -0.9420166015625, -0.847320556640625, -0.75262451171875, -0.657928466796875, -0.563232421875, -0.468536376953125, -0.37384033203125, -0.279144287109375, -0.1844482421875, -0.089752197265625, 0.00494384765625, 0.099639892578125, 0.1943359375, 0.289031982421875, 0.38372802734375, 0.478424072265625, 0.5731201171875, 0.667816162109375, 0.76251220703125, 0.857208251953125, 0.951904296875, 1.046600341796875, 1.14129638671875, 1.235992431640625, 1.3306884765625, 1.425384521484375, 1.52008056640625, 1.614776611328125, 1.70947265625, 1.804168701171875, 1.89886474609375, 1.993560791015625, 2.0882568359375, 2.182952880859375, 2.27764892578125, 2.372344970703125, 2.467041015625, 2.561737060546875, 2.65643310546875, 2.751129150390625, 2.8458251953125, 2.940521240234375, 3.03521728515625, 3.129913330078125, 3.224609375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 2.0, 9.0, 2.0, 8.0, 10.0, 9.0, 13.0, 18.0, 17.0, 12.0, 17.0, 26.0, 27.0, 33.0, 36.0, 29.0, 39.0, 39.0, 44.0, 110.0, 302.0, 1565.0, 198.0, 69.0, 47.0, 50.0, 36.0, 34.0, 27.0, 25.0, 14.0, 20.0, 26.0, 30.0, 29.0, 16.0, 10.0, 9.0, 9.0, 7.0, 9.0, 1.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-17.328125, -16.8375244140625, -16.346923828125, -15.8563232421875, -15.36572265625, -14.8751220703125, -14.384521484375, -13.8939208984375, -13.4033203125, -12.9127197265625, -12.422119140625, -11.9315185546875, -11.44091796875, -10.9503173828125, -10.459716796875, -9.9691162109375, -9.478515625, -8.9879150390625, -8.497314453125, -8.0067138671875, -7.51611328125, -7.0255126953125, -6.534912109375, -6.0443115234375, -5.5537109375, -5.0631103515625, -4.572509765625, -4.0819091796875, -3.59130859375, -3.1007080078125, -2.610107421875, -2.1195068359375, -1.62890625, -1.1383056640625, -0.647705078125, -0.1571044921875, 0.33349609375, 0.8240966796875, 1.314697265625, 1.8052978515625, 2.2958984375, 2.7864990234375, 3.277099609375, 3.7677001953125, 4.25830078125, 4.7489013671875, 5.239501953125, 5.7301025390625, 6.220703125, 6.7113037109375, 7.201904296875, 7.6925048828125, 8.18310546875, 8.6737060546875, 9.164306640625, 9.6549072265625, 10.1455078125, 10.6361083984375, 11.126708984375, 11.6173095703125, 12.10791015625, 12.5985107421875, 13.089111328125, 13.5797119140625, 14.0703125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 10.0, 2.0, 13.0, 9.0, 8.0, 16.0, 14.0, 22.0, 29.0, 30.0, 33.0, 41.0, 39.0, 60.0, 79.0, 131.0, 213.0, 319.0, 675.0, 3518.0, 116719.0, 2978677.0, 41290.0, 2220.0, 568.0, 280.0, 172.0, 116.0, 82.0, 74.0, 52.0, 42.0, 18.0, 11.0, 26.0, 15.0, 10.0, 16.0, 11.0, 9.0, 6.0, 2.0, 7.0, 9.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-21.453125, -20.697509765625, -19.94189453125, -19.186279296875, -18.4306640625, -17.675048828125, -16.91943359375, -16.163818359375, -15.408203125, -14.652587890625, -13.89697265625, -13.141357421875, -12.3857421875, -11.630126953125, -10.87451171875, -10.118896484375, -9.36328125, -8.607666015625, -7.85205078125, -7.096435546875, -6.3408203125, -5.585205078125, -4.82958984375, -4.073974609375, -3.318359375, -2.562744140625, -1.80712890625, -1.051513671875, -0.2958984375, 0.459716796875, 1.21533203125, 1.970947265625, 2.7265625, 3.482177734375, 4.23779296875, 4.993408203125, 5.7490234375, 6.504638671875, 7.26025390625, 8.015869140625, 8.771484375, 9.527099609375, 10.28271484375, 11.038330078125, 11.7939453125, 12.549560546875, 13.30517578125, 14.060791015625, 14.81640625, 15.572021484375, 16.32763671875, 17.083251953125, 17.8388671875, 18.594482421875, 19.35009765625, 20.105712890625, 20.861328125, 21.616943359375, 22.37255859375, 23.128173828125, 23.8837890625, 24.639404296875, 25.39501953125, 26.150634765625, 26.90625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 33.0, 217.0, 444.0, 277.0, 41.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.92256927490234, -100.5626449584961, -98.20271301269531, -95.84278869628906, -93.48286437988281, -91.12293243408203, -88.76300811767578, -86.403076171875, -84.04315185546875, -81.6832275390625, -79.32329559326172, -76.96337127685547, -74.60343933105469, -72.24351501464844, -69.88359069824219, -67.52366638183594, -65.16373443603516, -62.80380630493164, -60.443878173828125, -58.083953857421875, -55.72402572631836, -53.364097595214844, -51.004173278808594, -48.64424514770508, -46.28431701660156, -43.92438888549805, -41.56446075439453, -39.20453643798828, -36.844608306884766, -34.48468017578125, -32.124755859375, -29.764827728271484, -27.4049072265625, -25.044979095458984, -22.6850528717041, -20.32512664794922, -17.965198516845703, -15.605271339416504, -13.245344161987305, -10.885417938232422, -8.525489807128906, -6.165562629699707, -3.805635452270508, -1.4457082748413086, 0.9142189025878906, 3.27414608001709, 5.634073257446289, 7.993999481201172, 10.353927612304688, 12.713854789733887, 15.073781967163086, 17.43370819091797, 19.793636322021484, 22.153564453125, 24.513490676879883, 26.873416900634766, 29.23334503173828, 31.593273162841797, 33.95320129394531, 36.31312561035156, 38.67305374145508, 41.032981872558594, 43.392906188964844, 45.75283432006836, 48.112762451171875]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 7.0, 5.0, 5.0, 8.0, 8.0, 14.0, 20.0, 16.0, 21.0, 23.0, 31.0, 33.0, 27.0, 32.0, 35.0, 37.0, 35.0, 45.0, 49.0, 62.0, 51.0, 47.0, 45.0, 36.0, 36.0, 36.0, 32.0, 31.0, 26.0, 21.0, 27.0, 16.0, 13.0, 14.0, 10.0, 14.0, 9.0, 10.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.56816482543945, -49.88494110107422, -48.20171356201172, -46.518489837646484, -44.835262298583984, -43.15203857421875, -41.46881103515625, -39.785587310791016, -38.10236358642578, -36.41913986206055, -34.73591232299805, -33.05268859863281, -31.369461059570312, -29.686237335205078, -28.00301170349121, -26.319786071777344, -24.636558532714844, -22.953332901000977, -21.27010726928711, -19.586883544921875, -17.903656005859375, -16.22043228149414, -14.537206649780273, -12.853981018066406, -11.170755386352539, -9.487529754638672, -7.804304599761963, -6.121079444885254, -4.437853813171387, -2.7546281814575195, -1.0714035034179688, 0.6118221282958984, 2.2950515747070312, 3.9782769680023193, 5.661502361297607, 7.344727516174316, 9.027953147888184, 10.71117877960205, 12.394403457641602, 14.077629089355469, 15.760854721069336, 17.444080352783203, 19.12730598449707, 20.810531616210938, 22.493755340576172, 24.176982879638672, 25.860206604003906, 27.543432235717773, 29.22665786743164, 30.909883499145508, 32.593109130859375, 34.27633285522461, 35.95956039428711, 37.642784118652344, 39.326011657714844, 41.00923538208008, 42.69245910644531, 44.37568283081055, 46.05891036987305, 47.74213409423828, 49.42536163330078, 51.108585357666016, 52.79180908203125, 54.47503662109375, 56.15826416015625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 9.0, 8.0, 7.0, 6.0, 8.0, 13.0, 16.0, 24.0, 22.0, 19.0, 21.0, 20.0, 33.0, 37.0, 45.0, 44.0, 31.0, 34.0, 45.0, 43.0, 40.0, 49.0, 38.0, 35.0, 33.0, 40.0, 40.0, 29.0, 33.0, 26.0, 27.0, 20.0, 17.0, 19.0, 8.0, 17.0, 8.0, 8.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.37713623046875, -4.2308349609375, -4.08453369140625, -3.938232421875, -3.79193115234375, -3.6456298828125, -3.49932861328125, -3.35302734375, -3.20672607421875, -3.0604248046875, -2.91412353515625, -2.767822265625, -2.62152099609375, -2.4752197265625, -2.32891845703125, -2.1826171875, -2.03631591796875, -1.8900146484375, -1.74371337890625, -1.597412109375, -1.45111083984375, -1.3048095703125, -1.15850830078125, -1.01220703125, -0.86590576171875, -0.7196044921875, -0.57330322265625, -0.427001953125, -0.28070068359375, -0.1343994140625, 0.01190185546875, 0.158203125, 0.30450439453125, 0.4508056640625, 0.59710693359375, 0.743408203125, 0.88970947265625, 1.0360107421875, 1.18231201171875, 1.32861328125, 1.47491455078125, 1.6212158203125, 1.76751708984375, 1.913818359375, 2.06011962890625, 2.2064208984375, 2.35272216796875, 2.4990234375, 2.64532470703125, 2.7916259765625, 2.93792724609375, 3.084228515625, 3.23052978515625, 3.3768310546875, 3.52313232421875, 3.66943359375, 3.81573486328125, 3.9620361328125, 4.10833740234375, 4.254638671875, 4.40093994140625, 4.5472412109375, 4.69354248046875, 4.83984375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 3.0, 7.0, 8.0, 9.0, 10.0, 14.0, 15.0, 14.0, 19.0, 20.0, 31.0, 29.0, 47.0, 61.0, 64.0, 114.0, 230.0, 457.0, 1386.0, 6868.0, 54600.0, 679689.0, 2670003.0, 713895.0, 56938.0, 7179.0, 1406.0, 492.0, 175.0, 118.0, 93.0, 55.0, 41.0, 28.0, 26.0, 17.0, 29.0, 8.0, 16.0, 15.0, 8.0, 9.0, 7.0, 4.0, 0.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-11.96875, -11.6005859375, -11.232421875, -10.8642578125, -10.49609375, -10.1279296875, -9.759765625, -9.3916015625, -9.0234375, -8.6552734375, -8.287109375, -7.9189453125, -7.55078125, -7.1826171875, -6.814453125, -6.4462890625, -6.078125, -5.7099609375, -5.341796875, -4.9736328125, -4.60546875, -4.2373046875, -3.869140625, -3.5009765625, -3.1328125, -2.7646484375, -2.396484375, -2.0283203125, -1.66015625, -1.2919921875, -0.923828125, -0.5556640625, -0.1875, 0.1806640625, 0.548828125, 0.9169921875, 1.28515625, 1.6533203125, 2.021484375, 2.3896484375, 2.7578125, 3.1259765625, 3.494140625, 3.8623046875, 4.23046875, 4.5986328125, 4.966796875, 5.3349609375, 5.703125, 6.0712890625, 6.439453125, 6.8076171875, 7.17578125, 7.5439453125, 7.912109375, 8.2802734375, 8.6484375, 9.0166015625, 9.384765625, 9.7529296875, 10.12109375, 10.4892578125, 10.857421875, 11.2255859375, 11.59375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 10.0, 6.0, 13.0, 11.0, 17.0, 17.0, 35.0, 35.0, 49.0, 58.0, 83.0, 89.0, 125.0, 160.0, 195.0, 248.0, 285.0, 304.0, 380.0, 348.0, 281.0, 303.0, 217.0, 168.0, 151.0, 98.0, 84.0, 72.0, 60.0, 38.0, 34.0, 25.0, 17.0, 15.0, 8.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.1328125, -9.8231201171875, -9.513427734375, -9.2037353515625, -8.89404296875, -8.5843505859375, -8.274658203125, -7.9649658203125, -7.6552734375, -7.3455810546875, -7.035888671875, -6.7261962890625, -6.41650390625, -6.1068115234375, -5.797119140625, -5.4874267578125, -5.177734375, -4.8680419921875, -4.558349609375, -4.2486572265625, -3.93896484375, -3.6292724609375, -3.319580078125, -3.0098876953125, -2.7001953125, -2.3905029296875, -2.080810546875, -1.7711181640625, -1.46142578125, -1.1517333984375, -0.842041015625, -0.5323486328125, -0.22265625, 0.0870361328125, 0.396728515625, 0.7064208984375, 1.01611328125, 1.3258056640625, 1.635498046875, 1.9451904296875, 2.2548828125, 2.5645751953125, 2.874267578125, 3.1839599609375, 3.49365234375, 3.8033447265625, 4.113037109375, 4.4227294921875, 4.732421875, 5.0421142578125, 5.351806640625, 5.6614990234375, 5.97119140625, 6.2808837890625, 6.590576171875, 6.9002685546875, 7.2099609375, 7.5196533203125, 7.829345703125, 8.1390380859375, 8.44873046875, 8.7584228515625, 9.068115234375, 9.3778076171875, 9.6875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 4.0, 10.0, 7.0, 10.0, 24.0, 24.0, 30.0, 44.0, 66.0, 86.0, 92.0, 133.0, 226.0, 382.0, 937.0, 7494.0, 340927.0, 3703003.0, 134710.0, 4354.0, 676.0, 276.0, 204.0, 139.0, 89.0, 68.0, 61.0, 50.0, 44.0, 34.0, 20.0, 16.0, 13.0, 4.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.78125, -32.669921875, -31.55859375, -30.447265625, -29.3359375, -28.224609375, -27.11328125, -26.001953125, -24.890625, -23.779296875, -22.66796875, -21.556640625, -20.4453125, -19.333984375, -18.22265625, -17.111328125, -16.0, -14.888671875, -13.77734375, -12.666015625, -11.5546875, -10.443359375, -9.33203125, -8.220703125, -7.109375, -5.998046875, -4.88671875, -3.775390625, -2.6640625, -1.552734375, -0.44140625, 0.669921875, 1.78125, 2.892578125, 4.00390625, 5.115234375, 6.2265625, 7.337890625, 8.44921875, 9.560546875, 10.671875, 11.783203125, 12.89453125, 14.005859375, 15.1171875, 16.228515625, 17.33984375, 18.451171875, 19.5625, 20.673828125, 21.78515625, 22.896484375, 24.0078125, 25.119140625, 26.23046875, 27.341796875, 28.453125, 29.564453125, 30.67578125, 31.787109375, 32.8984375, 34.009765625, 35.12109375, 36.232421875, 37.34375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 16.0, 38.0, 62.0, 125.0, 170.0, 191.0, 143.0, 129.0, 76.0, 34.0, 14.0, 12.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.45832443237305, -29.862314224243164, -27.26630401611328, -24.6702938079834, -22.074283599853516, -19.478273391723633, -16.88226318359375, -14.286252975463867, -11.690242767333984, -9.094232559204102, -6.498222351074219, -3.902212142944336, -1.3062019348144531, 1.2898082733154297, 3.8858184814453125, 6.481828689575195, 9.077838897705078, 11.673849105834961, 14.269859313964844, 16.865869522094727, 19.46187973022461, 22.057889938354492, 24.653900146484375, 27.249910354614258, 29.84592056274414, 32.441932678222656, 35.037940979003906, 37.633949279785156, 40.22996139526367, 42.82597351074219, 45.42198181152344, 48.01799011230469, 50.61399841308594, 53.21000671386719, 55.8060188293457, 58.40203094482422, 60.99803924560547, 63.59404754638672, 66.1900634765625, 68.78607177734375, 71.382080078125, 73.97808837890625, 76.5740966796875, 79.17011260986328, 81.76612091064453, 84.36212921142578, 86.95814514160156, 89.55415344238281, 92.15016174316406, 94.74617004394531, 97.34217834472656, 99.93819427490234, 102.5342025756836, 105.13021087646484, 107.72622680664062, 110.32223510742188, 112.91824340820312, 115.51425170898438, 118.11026000976562, 120.7062759399414, 123.30228424072266, 125.8982925415039, 128.4943084716797, 131.09031677246094, 133.6863250732422]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 7.0, 5.0, 7.0, 19.0, 12.0, 14.0, 16.0, 20.0, 27.0, 23.0, 15.0, 26.0, 26.0, 30.0, 24.0, 24.0, 37.0, 28.0, 47.0, 40.0, 51.0, 30.0, 40.0, 22.0, 46.0, 32.0, 33.0, 32.0, 26.0, 36.0, 23.0, 19.0, 19.0, 20.0, 18.0, 17.0, 10.0, 12.0, 4.0, 10.0, 6.0, 8.0, 6.0, 1.0, 3.0, 9.0, 5.0, 5.0, 1.0, 4.0, 4.0, 0.0, 2.0], "bins": [-35.34066390991211, -34.23487091064453, -33.12907791137695, -32.023284912109375, -30.91749382019043, -29.81170082092285, -28.705907821655273, -27.600114822387695, -26.49432373046875, -25.388530731201172, -24.282737731933594, -23.176944732666016, -22.07115364074707, -20.965360641479492, -19.859567642211914, -18.753774642944336, -17.647981643676758, -16.54218864440918, -15.436396598815918, -14.33060359954834, -13.224811553955078, -12.1190185546875, -11.013225555419922, -9.907432556152344, -8.801640510559082, -7.695847988128662, -6.590055465698242, -5.484262466430664, -4.378469944000244, -3.272677421569824, -2.166884422302246, -1.0610918998718262, 0.04470062255859375, 1.1504932641983032, 2.2562859058380127, 3.3620786666870117, 4.467871189117432, 5.573663711547852, 6.67945671081543, 7.78524923324585, 8.89104175567627, 9.996834754943848, 11.10262680053711, 12.208419799804688, 13.314212799072266, 14.420004844665527, 15.525797843933105, 16.631589889526367, 17.737382888793945, 18.843175888061523, 19.9489688873291, 21.054759979248047, 22.160552978515625, 23.266345977783203, 24.37213897705078, 25.47793197631836, 26.583724975585938, 27.689517974853516, 28.795310974121094, 29.901103973388672, 31.006895065307617, 32.11268615722656, 33.218482971191406, 34.32427215576172, 35.4300651550293]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 8.0, 11.0, 9.0, 10.0, 15.0, 19.0, 21.0, 17.0, 27.0, 41.0, 35.0, 33.0, 33.0, 28.0, 36.0, 43.0, 44.0, 51.0, 35.0, 45.0, 42.0, 36.0, 39.0, 36.0, 30.0, 26.0, 29.0, 27.0, 31.0, 20.0, 21.0, 18.0, 12.0, 10.0, 10.0, 10.0, 6.0, 10.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.953125, -4.8038330078125, -4.654541015625, -4.5052490234375, -4.35595703125, -4.2066650390625, -4.057373046875, -3.9080810546875, -3.7587890625, -3.6094970703125, -3.460205078125, -3.3109130859375, -3.16162109375, -3.0123291015625, -2.863037109375, -2.7137451171875, -2.564453125, -2.4151611328125, -2.265869140625, -2.1165771484375, -1.96728515625, -1.8179931640625, -1.668701171875, -1.5194091796875, -1.3701171875, -1.2208251953125, -1.071533203125, -0.9222412109375, -0.77294921875, -0.6236572265625, -0.474365234375, -0.3250732421875, -0.17578125, -0.0264892578125, 0.122802734375, 0.2720947265625, 0.42138671875, 0.5706787109375, 0.719970703125, 0.8692626953125, 1.0185546875, 1.1678466796875, 1.317138671875, 1.4664306640625, 1.61572265625, 1.7650146484375, 1.914306640625, 2.0635986328125, 2.212890625, 2.3621826171875, 2.511474609375, 2.6607666015625, 2.81005859375, 2.9593505859375, 3.108642578125, 3.2579345703125, 3.4072265625, 3.5565185546875, 3.705810546875, 3.8551025390625, 4.00439453125, 4.1536865234375, 4.302978515625, 4.4522705078125, 4.6015625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 5.0, 16.0, 11.0, 15.0, 26.0, 36.0, 56.0, 63.0, 111.0, 177.0, 218.0, 315.0, 491.0, 626.0, 924.0, 1449.0, 1953.0, 3003.0, 4234.0, 6386.0, 9337.0, 14247.0, 21350.0, 32555.0, 50620.0, 82282.0, 160251.0, 316283.0, 133531.0, 73427.0, 45529.0, 29662.0, 19520.0, 12816.0, 8582.0, 5792.0, 3971.0, 2623.0, 1960.0, 1234.0, 873.0, 618.0, 377.0, 339.0, 218.0, 129.0, 95.0, 87.0, 30.0, 30.0, 27.0, 19.0, 16.0, 7.0, 5.0, 4.0, 6.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.0901031494140625, -1.054229736328125, -1.0183563232421875, -0.98248291015625, -0.9466094970703125, -0.910736083984375, -0.8748626708984375, -0.8389892578125, -0.8031158447265625, -0.767242431640625, -0.7313690185546875, -0.69549560546875, -0.6596221923828125, -0.623748779296875, -0.5878753662109375, -0.552001953125, -0.5161285400390625, -0.480255126953125, -0.4443817138671875, -0.40850830078125, -0.3726348876953125, -0.336761474609375, -0.3008880615234375, -0.2650146484375, -0.2291412353515625, -0.193267822265625, -0.1573944091796875, -0.12152099609375, -0.0856475830078125, -0.049774169921875, -0.0139007568359375, 0.02197265625, 0.0578460693359375, 0.093719482421875, 0.1295928955078125, 0.16546630859375, 0.2013397216796875, 0.237213134765625, 0.2730865478515625, 0.3089599609375, 0.3448333740234375, 0.380706787109375, 0.4165802001953125, 0.45245361328125, 0.4883270263671875, 0.524200439453125, 0.5600738525390625, 0.595947265625, 0.6318206787109375, 0.667694091796875, 0.7035675048828125, 0.73944091796875, 0.7753143310546875, 0.811187744140625, 0.8470611572265625, 0.8829345703125, 0.9188079833984375, 0.954681396484375, 0.9905548095703125, 1.02642822265625, 1.0623016357421875, 1.098175048828125, 1.1340484619140625, 1.169921875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 7.0, 6.0, 11.0, 16.0, 11.0, 11.0, 20.0, 19.0, 20.0, 25.0, 26.0, 28.0, 33.0, 39.0, 38.0, 55.0, 33.0, 39.0, 1059.0, 39.0, 47.0, 45.0, 48.0, 33.0, 38.0, 36.0, 37.0, 29.0, 30.0, 22.0, 18.0, 26.0, 20.0, 12.0, 4.0, 11.0, 4.0, 5.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.30859375, -3.210418701171875, -3.11224365234375, -3.014068603515625, -2.9158935546875, -2.817718505859375, -2.71954345703125, -2.621368408203125, -2.523193359375, -2.425018310546875, -2.32684326171875, -2.228668212890625, -2.1304931640625, -2.032318115234375, -1.93414306640625, -1.835968017578125, -1.73779296875, -1.639617919921875, -1.54144287109375, -1.443267822265625, -1.3450927734375, -1.246917724609375, -1.14874267578125, -1.050567626953125, -0.952392578125, -0.854217529296875, -0.75604248046875, -0.657867431640625, -0.5596923828125, -0.461517333984375, -0.36334228515625, -0.265167236328125, -0.1669921875, -0.068817138671875, 0.02935791015625, 0.127532958984375, 0.2257080078125, 0.323883056640625, 0.42205810546875, 0.520233154296875, 0.618408203125, 0.716583251953125, 0.81475830078125, 0.912933349609375, 1.0111083984375, 1.109283447265625, 1.20745849609375, 1.305633544921875, 1.40380859375, 1.501983642578125, 1.60015869140625, 1.698333740234375, 1.7965087890625, 1.894683837890625, 1.99285888671875, 2.091033935546875, 2.189208984375, 2.287384033203125, 2.38555908203125, 2.483734130859375, 2.5819091796875, 2.680084228515625, 2.77825927734375, 2.876434326171875, 2.974609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 10.0, 21.0, 18.0, 35.0, 52.0, 82.0, 122.0, 162.0, 247.0, 325.0, 483.0, 715.0, 1118.0, 1617.0, 2436.0, 3535.0, 5385.0, 7885.0, 12058.0, 18497.0, 28877.0, 45698.0, 74449.0, 131042.0, 1352486.0, 168382.0, 89775.0, 54219.0, 34204.0, 21460.0, 13831.0, 9338.0, 6073.0, 3995.0, 2706.0, 1885.0, 1244.0, 832.0, 604.0, 376.0, 260.0, 204.0, 103.0, 91.0, 63.0, 45.0, 25.0, 17.0, 18.0, 9.0, 6.0, 4.0, 4.0, 0.0, 4.0], "bins": [-1.24609375, -1.2090911865234375, -1.172088623046875, -1.1350860595703125, -1.09808349609375, -1.0610809326171875, -1.024078369140625, -0.9870758056640625, -0.9500732421875, -0.9130706787109375, -0.876068115234375, -0.8390655517578125, -0.80206298828125, -0.7650604248046875, -0.728057861328125, -0.6910552978515625, -0.654052734375, -0.6170501708984375, -0.580047607421875, -0.5430450439453125, -0.50604248046875, -0.4690399169921875, -0.432037353515625, -0.3950347900390625, -0.3580322265625, -0.3210296630859375, -0.284027099609375, -0.2470245361328125, -0.21002197265625, -0.1730194091796875, -0.136016845703125, -0.0990142822265625, -0.06201171875, -0.0250091552734375, 0.011993408203125, 0.0489959716796875, 0.08599853515625, 0.1230010986328125, 0.160003662109375, 0.1970062255859375, 0.2340087890625, 0.2710113525390625, 0.308013916015625, 0.3450164794921875, 0.38201904296875, 0.4190216064453125, 0.456024169921875, 0.4930267333984375, 0.530029296875, 0.5670318603515625, 0.604034423828125, 0.6410369873046875, 0.67803955078125, 0.7150421142578125, 0.752044677734375, 0.7890472412109375, 0.8260498046875, 0.8630523681640625, 0.900054931640625, 0.9370574951171875, 0.97406005859375, 1.0110626220703125, 1.048065185546875, 1.0850677490234375, 1.1220703125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 19.0, 9.0, 17.0, 20.0, 19.0, 20.0, 39.0, 44.0, 47.0, 58.0, 83.0, 98.0, 85.0, 87.0, 81.0, 62.0, 45.0, 33.0, 18.0, 22.0, 19.0, 11.0, 15.0, 6.0, 6.0, 6.0, 6.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0002275705337524414, -0.00022162310779094696, -0.00021567568182945251, -0.00020972825586795807, -0.00020378082990646362, -0.00019783340394496918, -0.00019188597798347473, -0.00018593855202198029, -0.00017999112606048584, -0.0001740437000989914, -0.00016809627413749695, -0.0001621488481760025, -0.00015620142221450806, -0.0001502539962530136, -0.00014430657029151917, -0.00013835914433002472, -0.00013241171836853027, -0.00012646429240703583, -0.00012051686644554138, -0.00011456944048404694, -0.00010862201452255249, -0.00010267458856105804, -9.67271625995636e-05, -9.077973663806915e-05, -8.483231067657471e-05, -7.888488471508026e-05, -7.293745875358582e-05, -6.699003279209137e-05, -6.104260683059692e-05, -5.509518086910248e-05, -4.914775490760803e-05, -4.3200328946113586e-05, -3.725290298461914e-05, -3.1305477023124695e-05, -2.535805106163025e-05, -1.9410625100135803e-05, -1.3463199138641357e-05, -7.515773177146912e-06, -1.5683472156524658e-06, 4.37907874584198e-06, 1.0326504707336426e-05, 1.627393066883087e-05, 2.2221356630325317e-05, 2.8168782591819763e-05, 3.411620855331421e-05, 4.0063634514808655e-05, 4.60110604763031e-05, 5.1958486437797546e-05, 5.790591239929199e-05, 6.385333836078644e-05, 6.980076432228088e-05, 7.574819028377533e-05, 8.169561624526978e-05, 8.764304220676422e-05, 9.359046816825867e-05, 9.953789412975311e-05, 0.00010548532009124756, 0.000111432746052742, 0.00011738017201423645, 0.0001233275979757309, 0.00012927502393722534, 0.0001352224498987198, 0.00014116987586021423, 0.00014711730182170868, 0.00015306472778320312]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 9.0, 5.0, 17.0, 17.0, 23.0, 21.0, 47.0, 71.0, 106.0, 164.0, 290.0, 563.0, 5043.0, 1030815.0, 9979.0, 601.0, 292.0, 163.0, 117.0, 69.0, 38.0, 40.0, 22.0, 17.0, 10.0, 4.0, 1.0, 6.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003307342529296875, -0.0031669139862060547, -0.0030264854431152344, -0.002886056900024414, -0.0027456283569335938, -0.0026051998138427734, -0.002464771270751953, -0.002324342727661133, -0.0021839141845703125, -0.002043485641479492, -0.0019030570983886719, -0.0017626285552978516, -0.0016222000122070312, -0.001481771469116211, -0.0013413429260253906, -0.0012009143829345703, -0.00106048583984375, -0.0009200572967529297, -0.0007796287536621094, -0.0006392002105712891, -0.0004987716674804688, -0.00035834312438964844, -0.00021791458129882812, -7.748603820800781e-05, 6.29425048828125e-05, 0.0002033710479736328, 0.0003437995910644531, 0.00048422813415527344, 0.0006246566772460938, 0.0007650852203369141, 0.0009055137634277344, 0.0010459423065185547, 0.001186370849609375, 0.0013267993927001953, 0.0014672279357910156, 0.001607656478881836, 0.0017480850219726562, 0.0018885135650634766, 0.002028942108154297, 0.002169370651245117, 0.0023097991943359375, 0.002450227737426758, 0.002590656280517578, 0.0027310848236083984, 0.0028715133666992188, 0.003011941909790039, 0.0031523704528808594, 0.0032927989959716797, 0.0034332275390625, 0.0035736560821533203, 0.0037140846252441406, 0.003854513168334961, 0.003994941711425781, 0.0041353702545166016, 0.004275798797607422, 0.004416227340698242, 0.0045566558837890625, 0.004697084426879883, 0.004837512969970703, 0.0049779415130615234, 0.005118370056152344, 0.005258798599243164, 0.005399227142333984, 0.005539655685424805, 0.005680084228515625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 13.0, 44.0, 91.0, 189.0, 238.0, 195.0, 156.0, 54.0, 21.0, 9.0, 1.0], "bins": [-0.0004177834198344499, -0.0004105457628611475, -0.0004033081349916756, -0.00039607047801837325, -0.00038883285014890134, -0.000381595193175599, -0.00037435756530612707, -0.0003671199083328247, -0.0003598822804633528, -0.00035264462349005044, -0.00034540699562057853, -0.00033816933864727616, -0.00033093171077780426, -0.0003236940538045019, -0.00031645642593503, -0.0003092187689617276, -0.00030198111198842525, -0.0002947434550151229, -0.000287505827145651, -0.0002802681701723486, -0.0002730305423028767, -0.00026579288532957435, -0.00025855525746010244, -0.0002513176004868001, -0.00024407997261732817, -0.00023684233019594103, -0.0002296046877745539, -0.00022236704535316676, -0.00021512940293177962, -0.00020789174595847726, -0.00020065411808900535, -0.000193416461115703, -0.00018617883324623108, -0.00017894119082484394, -0.0001717035484034568, -0.00016446590598206967, -0.00015722826356068254, -0.00014999060658738017, -0.00014275297871790826, -0.0001355153217446059, -0.00012827767932321876, -0.00012104003690183163, -0.00011380239448044449, -0.00010656475205905735, -9.93271023617126e-05, -9.208945994032547e-05, -8.485181751893833e-05, -7.761416782159358e-05, -7.037652540020645e-05, -6.313888297881931e-05, -5.590123691945337e-05, -4.866359449806623e-05, -4.142594843870029e-05, -3.418830601731315e-05, -2.6950663595926017e-05, -1.9713017536560073e-05, -1.2475378753151745e-05, -5.237734967522556e-06, 1.9999088181066327e-06, 9.23755214898847e-06, 1.647519638936501e-05, 2.371284062974155e-05, 3.0950483051128685e-05, 3.818812911049463e-05, 4.5425771531881765e-05]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 4.0, 6.0, 7.0, 7.0, 12.0, 12.0, 13.0, 20.0, 22.0, 25.0, 26.0, 29.0, 37.0, 36.0, 30.0, 34.0, 29.0, 45.0, 51.0, 41.0, 65.0, 42.0, 43.0, 58.0, 43.0, 36.0, 25.0, 21.0, 26.0, 26.0, 24.0, 25.0, 14.0, 10.0, 12.0, 10.0, 9.0, 5.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.903575897216797e-05, -7.644761353731155e-05, -7.385946810245514e-05, -7.127132266759872e-05, -6.868317723274231e-05, -6.60950317978859e-05, -6.350688636302948e-05, -6.0918740928173065e-05, -5.833059549331665e-05, -5.5742450058460236e-05, -5.315430462360382e-05, -5.0566159188747406e-05, -4.797801375389099e-05, -4.5389868319034576e-05, -4.280172288417816e-05, -4.021357744932175e-05, -3.762543201446533e-05, -3.503728657960892e-05, -3.24491411447525e-05, -2.9860995709896088e-05, -2.7272850275039673e-05, -2.4684704840183258e-05, -2.2096559405326843e-05, -1.950841397047043e-05, -1.6920268535614014e-05, -1.4332123100757599e-05, -1.1743977665901184e-05, -9.15583223104477e-06, -6.5676867961883545e-06, -3.97954136133194e-06, -1.391395926475525e-06, 1.1967495083808899e-06, 3.7848949432373047e-06, 6.3730403780937195e-06, 8.961185812950134e-06, 1.1549331247806549e-05, 1.4137476682662964e-05, 1.672562211751938e-05, 1.9313767552375793e-05, 2.1901912987232208e-05, 2.4490058422088623e-05, 2.7078203856945038e-05, 2.9666349291801453e-05, 3.225449472665787e-05, 3.484264016151428e-05, 3.74307855963707e-05, 4.001893103122711e-05, 4.2607076466083527e-05, 4.519522190093994e-05, 4.7783367335796356e-05, 5.037151277065277e-05, 5.2959658205509186e-05, 5.55478036403656e-05, 5.8135949075222015e-05, 6.072409451007843e-05, 6.331223994493484e-05, 6.590038537979126e-05, 6.848853081464767e-05, 7.107667624950409e-05, 7.36648216843605e-05, 7.625296711921692e-05, 7.884111255407333e-05, 8.142925798892975e-05, 8.401740342378616e-05, 8.660554885864258e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 8.0, 11.0, 9.0, 10.0, 15.0, 19.0, 21.0, 17.0, 27.0, 41.0, 35.0, 33.0, 33.0, 28.0, 36.0, 43.0, 44.0, 51.0, 35.0, 45.0, 42.0, 36.0, 39.0, 36.0, 30.0, 26.0, 29.0, 27.0, 31.0, 20.0, 21.0, 18.0, 12.0, 10.0, 10.0, 10.0, 6.0, 10.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.953125, -4.8038330078125, -4.654541015625, -4.5052490234375, -4.35595703125, -4.2066650390625, -4.057373046875, -3.9080810546875, -3.7587890625, -3.6094970703125, -3.460205078125, -3.3109130859375, -3.16162109375, -3.0123291015625, -2.863037109375, -2.7137451171875, -2.564453125, -2.4151611328125, -2.265869140625, -2.1165771484375, -1.96728515625, -1.8179931640625, -1.668701171875, -1.5194091796875, -1.3701171875, -1.2208251953125, -1.071533203125, -0.9222412109375, -0.77294921875, -0.6236572265625, -0.474365234375, -0.3250732421875, -0.17578125, -0.0264892578125, 0.122802734375, 0.2720947265625, 0.42138671875, 0.5706787109375, 0.719970703125, 0.8692626953125, 1.0185546875, 1.1678466796875, 1.317138671875, 1.4664306640625, 1.61572265625, 1.7650146484375, 1.914306640625, 2.0635986328125, 2.212890625, 2.3621826171875, 2.511474609375, 2.6607666015625, 2.81005859375, 2.9593505859375, 3.108642578125, 3.2579345703125, 3.4072265625, 3.5565185546875, 3.705810546875, 3.8551025390625, 4.00439453125, 4.1536865234375, 4.302978515625, 4.4522705078125, 4.6015625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 5.0, 12.0, 18.0, 18.0, 32.0, 43.0, 46.0, 66.0, 94.0, 175.0, 203.0, 272.0, 352.0, 679.0, 761.0, 1199.0, 1825.0, 2682.0, 3995.0, 6393.0, 10328.0, 19616.0, 42917.0, 113328.0, 317537.0, 319703.0, 114012.0, 43478.0, 19405.0, 10469.0, 6347.0, 3960.0, 2679.0, 1828.0, 1257.0, 830.0, 568.0, 401.0, 279.0, 180.0, 149.0, 120.0, 77.0, 57.0, 39.0, 33.0, 27.0, 18.0, 15.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0], "bins": [-4.70703125, -4.568603515625, -4.43017578125, -4.291748046875, -4.1533203125, -4.014892578125, -3.87646484375, -3.738037109375, -3.599609375, -3.461181640625, -3.32275390625, -3.184326171875, -3.0458984375, -2.907470703125, -2.76904296875, -2.630615234375, -2.4921875, -2.353759765625, -2.21533203125, -2.076904296875, -1.9384765625, -1.800048828125, -1.66162109375, -1.523193359375, -1.384765625, -1.246337890625, -1.10791015625, -0.969482421875, -0.8310546875, -0.692626953125, -0.55419921875, -0.415771484375, -0.27734375, -0.138916015625, -0.00048828125, 0.137939453125, 0.2763671875, 0.414794921875, 0.55322265625, 0.691650390625, 0.830078125, 0.968505859375, 1.10693359375, 1.245361328125, 1.3837890625, 1.522216796875, 1.66064453125, 1.799072265625, 1.9375, 2.075927734375, 2.21435546875, 2.352783203125, 2.4912109375, 2.629638671875, 2.76806640625, 2.906494140625, 3.044921875, 3.183349609375, 3.32177734375, 3.460205078125, 3.5986328125, 3.737060546875, 3.87548828125, 4.013916015625, 4.15234375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 6.0, 8.0, 8.0, 14.0, 9.0, 16.0, 16.0, 19.0, 19.0, 32.0, 26.0, 26.0, 33.0, 37.0, 36.0, 30.0, 43.0, 61.0, 109.0, 213.0, 1501.0, 218.0, 120.0, 59.0, 54.0, 29.0, 33.0, 26.0, 28.0, 30.0, 22.0, 24.0, 21.0, 20.0, 10.0, 15.0, 11.0, 13.0, 6.0, 8.0, 4.0, 4.0, 7.0, 3.0, 4.0, 1.0, 7.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.3203125, -14.86328125, -14.40625, -13.94921875, -13.4921875, -13.03515625, -12.578125, -12.12109375, -11.6640625, -11.20703125, -10.75, -10.29296875, -9.8359375, -9.37890625, -8.921875, -8.46484375, -8.0078125, -7.55078125, -7.09375, -6.63671875, -6.1796875, -5.72265625, -5.265625, -4.80859375, -4.3515625, -3.89453125, -3.4375, -2.98046875, -2.5234375, -2.06640625, -1.609375, -1.15234375, -0.6953125, -0.23828125, 0.21875, 0.67578125, 1.1328125, 1.58984375, 2.046875, 2.50390625, 2.9609375, 3.41796875, 3.875, 4.33203125, 4.7890625, 5.24609375, 5.703125, 6.16015625, 6.6171875, 7.07421875, 7.53125, 7.98828125, 8.4453125, 8.90234375, 9.359375, 9.81640625, 10.2734375, 10.73046875, 11.1875, 11.64453125, 12.1015625, 12.55859375, 13.015625, 13.47265625, 13.9296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 7.0, 11.0, 17.0, 16.0, 13.0, 23.0, 38.0, 45.0, 68.0, 100.0, 200.0, 289.0, 703.0, 5273.0, 2348123.0, 785297.0, 4003.0, 616.0, 320.0, 155.0, 116.0, 68.0, 59.0, 35.0, 33.0, 17.0, 19.0, 14.0, 7.0, 9.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.5, -47.0712890625, -45.642578125, -44.2138671875, -42.78515625, -41.3564453125, -39.927734375, -38.4990234375, -37.0703125, -35.6416015625, -34.212890625, -32.7841796875, -31.35546875, -29.9267578125, -28.498046875, -27.0693359375, -25.640625, -24.2119140625, -22.783203125, -21.3544921875, -19.92578125, -18.4970703125, -17.068359375, -15.6396484375, -14.2109375, -12.7822265625, -11.353515625, -9.9248046875, -8.49609375, -7.0673828125, -5.638671875, -4.2099609375, -2.78125, -1.3525390625, 0.076171875, 1.5048828125, 2.93359375, 4.3623046875, 5.791015625, 7.2197265625, 8.6484375, 10.0771484375, 11.505859375, 12.9345703125, 14.36328125, 15.7919921875, 17.220703125, 18.6494140625, 20.078125, 21.5068359375, 22.935546875, 24.3642578125, 25.79296875, 27.2216796875, 28.650390625, 30.0791015625, 31.5078125, 32.9365234375, 34.365234375, 35.7939453125, 37.22265625, 38.6513671875, 40.080078125, 41.5087890625, 42.9375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 41.0, 551.0, 406.0, 16.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.082496643066406, -14.234087944030762, -9.385679244995117, -4.537270545959473, 0.3111381530761719, 5.1595458984375, 10.007955551147461, 14.856365203857422, 19.70477294921875, 24.553180694580078, 29.40159034729004, 34.25, 39.09840774536133, 43.946815490722656, 48.79522705078125, 53.64363479614258, 58.492042541503906, 63.340450286865234, 68.18885803222656, 73.03726959228516, 77.88568115234375, 82.73408508300781, 87.5824966430664, 92.430908203125, 97.27931213378906, 102.12772369384766, 106.97612762451172, 111.82453918457031, 116.67294311523438, 121.52135467529297, 126.36976623535156, 131.21817016601562, 136.06658935546875, 140.9149932861328, 145.76341247558594, 150.61181640625, 155.46022033691406, 160.30862426757812, 165.15704345703125, 170.0054473876953, 174.85385131835938, 179.70225524902344, 184.55067443847656, 189.39907836914062, 194.2474822998047, 199.09588623046875, 203.94430541992188, 208.79270935058594, 213.64112854003906, 218.48953247070312, 223.33795166015625, 228.1863555908203, 233.03475952148438, 237.8831787109375, 242.73158264160156, 247.57998657226562, 252.42840576171875, 257.2768249511719, 262.1252136230469, 266.9736328125, 271.8220520019531, 276.6704406738281, 281.51885986328125, 286.3672790527344, 291.2156677246094]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 12.0, 9.0, 11.0, 15.0, 9.0, 13.0, 21.0, 20.0, 22.0, 38.0, 32.0, 32.0, 26.0, 39.0, 39.0, 38.0, 38.0, 35.0, 62.0, 50.0, 41.0, 27.0, 40.0, 34.0, 31.0, 35.0, 25.0, 28.0, 26.0, 13.0, 15.0, 17.0, 9.0, 23.0, 11.0, 13.0, 4.0, 13.0, 4.0, 3.0, 10.0, 4.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.79249572753906, -46.234886169433594, -44.677276611328125, -43.119667053222656, -41.56205749511719, -40.00444412231445, -38.446834564208984, -36.889225006103516, -35.33161544799805, -33.77400588989258, -32.21639633178711, -30.658784866333008, -29.10117530822754, -27.54356575012207, -25.98595428466797, -24.4283447265625, -22.87073516845703, -21.313125610351562, -19.755516052246094, -18.197904586791992, -16.640295028686523, -15.082685470581055, -13.52507495880127, -11.967464447021484, -10.409854888916016, -8.852245330810547, -7.294634819030762, -5.737024784088135, -4.179414749145508, -2.621804714202881, -1.064194679260254, 0.49341583251953125, 2.0510292053222656, 3.6086392402648926, 5.1662492752075195, 6.7238593101501465, 8.281469345092773, 9.839078903198242, 11.396689414978027, 12.954299926757812, 14.511909484863281, 16.06951904296875, 17.62712860107422, 19.18474006652832, 20.74234962463379, 22.299959182739258, 23.85757064819336, 25.415180206298828, 26.972789764404297, 28.530399322509766, 30.088008880615234, 31.645620346069336, 33.20323181152344, 34.760841369628906, 36.318450927734375, 37.876060485839844, 39.43367004394531, 40.99127960205078, 42.54888916015625, 44.10649871826172, 45.66410827636719, 47.22172164916992, 48.77933120727539, 50.33694076538086, 51.89455032348633]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 5.0, 13.0, 9.0, 7.0, 14.0, 13.0, 21.0, 16.0, 29.0, 31.0, 35.0, 35.0, 26.0, 33.0, 44.0, 40.0, 51.0, 37.0, 43.0, 47.0, 47.0, 47.0, 39.0, 38.0, 19.0, 27.0, 28.0, 39.0, 28.0, 22.0, 17.0, 15.0, 13.0, 14.0, 16.0, 6.0, 8.0, 5.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.1796875, -5.02056884765625, -4.8614501953125, -4.70233154296875, -4.543212890625, -4.38409423828125, -4.2249755859375, -4.06585693359375, -3.90673828125, -3.74761962890625, -3.5885009765625, -3.42938232421875, -3.270263671875, -3.11114501953125, -2.9520263671875, -2.79290771484375, -2.6337890625, -2.47467041015625, -2.3155517578125, -2.15643310546875, -1.997314453125, -1.83819580078125, -1.6790771484375, -1.51995849609375, -1.36083984375, -1.20172119140625, -1.0426025390625, -0.88348388671875, -0.724365234375, -0.56524658203125, -0.4061279296875, -0.24700927734375, -0.087890625, 0.07122802734375, 0.2303466796875, 0.38946533203125, 0.548583984375, 0.70770263671875, 0.8668212890625, 1.02593994140625, 1.18505859375, 1.34417724609375, 1.5032958984375, 1.66241455078125, 1.821533203125, 1.98065185546875, 2.1397705078125, 2.29888916015625, 2.4580078125, 2.61712646484375, 2.7762451171875, 2.93536376953125, 3.094482421875, 3.25360107421875, 3.4127197265625, 3.57183837890625, 3.73095703125, 3.89007568359375, 4.0491943359375, 4.20831298828125, 4.367431640625, 4.52655029296875, 4.6856689453125, 4.84478759765625, 5.00390625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 8.0, 11.0, 13.0, 15.0, 19.0, 25.0, 32.0, 50.0, 62.0, 112.0, 169.0, 255.0, 543.0, 908.0, 1941.0, 4589.0, 12152.0, 37635.0, 133844.0, 473881.0, 1216369.0, 1399336.0, 643836.0, 189762.0, 52056.0, 16018.0, 5777.0, 2337.0, 1138.0, 522.0, 300.0, 198.0, 113.0, 81.0, 51.0, 34.0, 26.0, 19.0, 10.0, 12.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.90032958984375, -5.7108154296875, -5.52130126953125, -5.331787109375, -5.14227294921875, -4.9527587890625, -4.76324462890625, -4.57373046875, -4.38421630859375, -4.1947021484375, -4.00518798828125, -3.815673828125, -3.62615966796875, -3.4366455078125, -3.24713134765625, -3.0576171875, -2.86810302734375, -2.6785888671875, -2.48907470703125, -2.299560546875, -2.11004638671875, -1.9205322265625, -1.73101806640625, -1.54150390625, -1.35198974609375, -1.1624755859375, -0.97296142578125, -0.783447265625, -0.59393310546875, -0.4044189453125, -0.21490478515625, -0.025390625, 0.16412353515625, 0.3536376953125, 0.54315185546875, 0.732666015625, 0.92218017578125, 1.1116943359375, 1.30120849609375, 1.49072265625, 1.68023681640625, 1.8697509765625, 2.05926513671875, 2.248779296875, 2.43829345703125, 2.6278076171875, 2.81732177734375, 3.0068359375, 3.19635009765625, 3.3858642578125, 3.57537841796875, 3.764892578125, 3.95440673828125, 4.1439208984375, 4.33343505859375, 4.52294921875, 4.71246337890625, 4.9019775390625, 5.09149169921875, 5.281005859375, 5.47052001953125, 5.6600341796875, 5.84954833984375, 6.0390625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 6.0, 14.0, 15.0, 20.0, 22.0, 32.0, 45.0, 64.0, 86.0, 122.0, 160.0, 229.0, 296.0, 368.0, 400.0, 400.0, 406.0, 352.0, 270.0, 202.0, 145.0, 108.0, 96.0, 58.0, 52.0, 37.0, 20.0, 15.0, 12.0, 10.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.171875, -13.781982421875, -13.39208984375, -13.002197265625, -12.6123046875, -12.222412109375, -11.83251953125, -11.442626953125, -11.052734375, -10.662841796875, -10.27294921875, -9.883056640625, -9.4931640625, -9.103271484375, -8.71337890625, -8.323486328125, -7.93359375, -7.543701171875, -7.15380859375, -6.763916015625, -6.3740234375, -5.984130859375, -5.59423828125, -5.204345703125, -4.814453125, -4.424560546875, -4.03466796875, -3.644775390625, -3.2548828125, -2.864990234375, -2.47509765625, -2.085205078125, -1.6953125, -1.305419921875, -0.91552734375, -0.525634765625, -0.1357421875, 0.254150390625, 0.64404296875, 1.033935546875, 1.423828125, 1.813720703125, 2.20361328125, 2.593505859375, 2.9833984375, 3.373291015625, 3.76318359375, 4.153076171875, 4.54296875, 4.932861328125, 5.32275390625, 5.712646484375, 6.1025390625, 6.492431640625, 6.88232421875, 7.272216796875, 7.662109375, 8.052001953125, 8.44189453125, 8.831787109375, 9.2216796875, 9.611572265625, 10.00146484375, 10.391357421875, 10.78125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 3.0, 7.0, 11.0, 9.0, 13.0, 14.0, 32.0, 41.0, 40.0, 58.0, 66.0, 114.0, 171.0, 298.0, 829.0, 5661.0, 259857.0, 3775228.0, 146096.0, 4098.0, 716.0, 263.0, 188.0, 135.0, 82.0, 51.0, 50.0, 30.0, 24.0, 27.0, 21.0, 15.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.375, -24.19140625, -23.0078125, -21.82421875, -20.640625, -19.45703125, -18.2734375, -17.08984375, -15.90625, -14.72265625, -13.5390625, -12.35546875, -11.171875, -9.98828125, -8.8046875, -7.62109375, -6.4375, -5.25390625, -4.0703125, -2.88671875, -1.703125, -0.51953125, 0.6640625, 1.84765625, 3.03125, 4.21484375, 5.3984375, 6.58203125, 7.765625, 8.94921875, 10.1328125, 11.31640625, 12.5, 13.68359375, 14.8671875, 16.05078125, 17.234375, 18.41796875, 19.6015625, 20.78515625, 21.96875, 23.15234375, 24.3359375, 25.51953125, 26.703125, 27.88671875, 29.0703125, 30.25390625, 31.4375, 32.62109375, 33.8046875, 34.98828125, 36.171875, 37.35546875, 38.5390625, 39.72265625, 40.90625, 42.08984375, 43.2734375, 44.45703125, 45.640625, 46.82421875, 48.0078125, 49.19140625, 50.375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 30.0, 69.0, 157.0, 206.0, 252.0, 152.0, 89.0, 38.0, 11.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-181.41685485839844, -177.7894287109375, -174.16201782226562, -170.53460693359375, -166.9071807861328, -163.27975463867188, -159.65234375, -156.02493286132812, -152.3975067138672, -148.77008056640625, -145.14266967773438, -141.5152587890625, -137.88783264160156, -134.26040649414062, -130.63299560546875, -127.00557708740234, -123.37815856933594, -119.75074005126953, -116.12332153320312, -112.49590301513672, -108.86848449707031, -105.2410659790039, -101.6136474609375, -97.9862289428711, -94.35881042480469, -90.73139190673828, -87.10397338867188, -83.47655487060547, -79.84913635253906, -76.22171783447266, -72.59429931640625, -68.96688079833984, -65.33946228027344, -61.71204376220703, -58.084625244140625, -54.45720672607422, -50.82978820800781, -47.202369689941406, -43.574951171875, -39.947532653808594, -36.32011413574219, -32.69269561767578, -29.065277099609375, -25.43785858154297, -21.810440063476562, -18.183021545410156, -14.55560302734375, -10.928184509277344, -7.3007659912109375, -3.6733474731445312, -0.045928955078125, 3.5814895629882812, 7.2089080810546875, 10.836326599121094, 14.4637451171875, 18.091163635253906, 21.718582153320312, 25.34600067138672, 28.973419189453125, 32.60083770751953, 36.22825622558594, 39.855674743652344, 43.48309326171875, 47.110511779785156, 50.73793029785156]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 9.0, 5.0, 6.0, 8.0, 11.0, 14.0, 14.0, 12.0, 15.0, 14.0, 18.0, 23.0, 26.0, 33.0, 33.0, 43.0, 28.0, 33.0, 33.0, 48.0, 38.0, 50.0, 44.0, 40.0, 47.0, 37.0, 28.0, 40.0, 24.0, 25.0, 29.0, 21.0, 28.0, 28.0, 21.0, 17.0, 18.0, 11.0, 7.0, 7.0, 8.0, 6.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.00314712524414, -39.75244140625, -38.501731872558594, -37.25102615356445, -36.00032043457031, -34.74961471557617, -33.49890899658203, -32.248199462890625, -30.997493743896484, -29.746788024902344, -28.49608039855957, -27.245372772216797, -25.994667053222656, -24.743961334228516, -23.493253707885742, -22.24254608154297, -20.991840362548828, -19.741134643554688, -18.490427017211914, -17.23971939086914, -15.989013671875, -14.738306999206543, -13.487600326538086, -12.236893653869629, -10.986186981201172, -9.735480308532715, -8.484773635864258, -7.234066963195801, -5.983360290527344, -4.732653617858887, -3.4819469451904297, -2.2312402725219727, -0.9805335998535156, 0.2701730728149414, 1.5208797454833984, 2.7715864181518555, 4.0222930908203125, 5.2729997634887695, 6.523706436157227, 7.774413108825684, 9.02511978149414, 10.275826454162598, 11.526533126831055, 12.777239799499512, 14.027946472167969, 15.278653144836426, 16.529359817504883, 17.780067443847656, 19.030773162841797, 20.281478881835938, 21.53218650817871, 22.782894134521484, 24.033599853515625, 25.284305572509766, 26.53501319885254, 27.785720825195312, 29.036426544189453, 30.287132263183594, 31.537839889526367, 32.78854751586914, 34.03925323486328, 35.28995895385742, 36.54066467285156, 37.79137420654297, 39.04207992553711]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 10.0, 12.0, 10.0, 16.0, 10.0, 24.0, 19.0, 24.0, 29.0, 24.0, 26.0, 36.0, 38.0, 42.0, 50.0, 38.0, 41.0, 46.0, 44.0, 50.0, 30.0, 34.0, 29.0, 33.0, 39.0, 27.0, 29.0, 21.0, 25.0, 21.0, 20.0, 12.0, 18.0, 9.0, 14.0, 10.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.0, -4.84271240234375, -4.6854248046875, -4.52813720703125, -4.370849609375, -4.21356201171875, -4.0562744140625, -3.89898681640625, -3.74169921875, -3.58441162109375, -3.4271240234375, -3.26983642578125, -3.112548828125, -2.95526123046875, -2.7979736328125, -2.64068603515625, -2.4833984375, -2.32611083984375, -2.1688232421875, -2.01153564453125, -1.854248046875, -1.69696044921875, -1.5396728515625, -1.38238525390625, -1.22509765625, -1.06781005859375, -0.9105224609375, -0.75323486328125, -0.595947265625, -0.43865966796875, -0.2813720703125, -0.12408447265625, 0.033203125, 0.19049072265625, 0.3477783203125, 0.50506591796875, 0.662353515625, 0.81964111328125, 0.9769287109375, 1.13421630859375, 1.29150390625, 1.44879150390625, 1.6060791015625, 1.76336669921875, 1.920654296875, 2.07794189453125, 2.2352294921875, 2.39251708984375, 2.5498046875, 2.70709228515625, 2.8643798828125, 3.02166748046875, 3.178955078125, 3.33624267578125, 3.4935302734375, 3.65081787109375, 3.80810546875, 3.96539306640625, 4.1226806640625, 4.27996826171875, 4.437255859375, 4.59454345703125, 4.7518310546875, 4.90911865234375, 5.06640625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 5.0, 3.0, 5.0, 7.0, 10.0, 13.0, 15.0, 33.0, 38.0, 69.0, 89.0, 142.0, 157.0, 256.0, 401.0, 545.0, 752.0, 1017.0, 1459.0, 2029.0, 2879.0, 4052.0, 5593.0, 8202.0, 11536.0, 16502.0, 23920.0, 35964.0, 54944.0, 89435.0, 175801.0, 293101.0, 115176.0, 67327.0, 42948.0, 28711.0, 19480.0, 13444.0, 9498.0, 6726.0, 4724.0, 3354.0, 2428.0, 1705.0, 1207.0, 858.0, 583.0, 416.0, 295.0, 206.0, 163.0, 92.0, 71.0, 54.0, 32.0, 34.0, 28.0, 12.0, 10.0, 5.0, 3.0, 2.0, 5.0], "bins": [-1.1376953125, -1.102386474609375, -1.06707763671875, -1.031768798828125, -0.9964599609375, -0.961151123046875, -0.92584228515625, -0.890533447265625, -0.855224609375, -0.819915771484375, -0.78460693359375, -0.749298095703125, -0.7139892578125, -0.678680419921875, -0.64337158203125, -0.608062744140625, -0.57275390625, -0.537445068359375, -0.50213623046875, -0.466827392578125, -0.4315185546875, -0.396209716796875, -0.36090087890625, -0.325592041015625, -0.290283203125, -0.254974365234375, -0.21966552734375, -0.184356689453125, -0.1490478515625, -0.113739013671875, -0.07843017578125, -0.043121337890625, -0.0078125, 0.027496337890625, 0.06280517578125, 0.098114013671875, 0.1334228515625, 0.168731689453125, 0.20404052734375, 0.239349365234375, 0.274658203125, 0.309967041015625, 0.34527587890625, 0.380584716796875, 0.4158935546875, 0.451202392578125, 0.48651123046875, 0.521820068359375, 0.55712890625, 0.592437744140625, 0.62774658203125, 0.663055419921875, 0.6983642578125, 0.733673095703125, 0.76898193359375, 0.804290771484375, 0.839599609375, 0.874908447265625, 0.91021728515625, 0.945526123046875, 0.9808349609375, 1.016143798828125, 1.05145263671875, 1.086761474609375, 1.1220703125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 6.0, 5.0, 9.0, 9.0, 7.0, 14.0, 9.0, 17.0, 21.0, 22.0, 25.0, 27.0, 22.0, 33.0, 26.0, 42.0, 38.0, 45.0, 36.0, 42.0, 54.0, 1061.0, 36.0, 45.0, 36.0, 26.0, 40.0, 39.0, 33.0, 29.0, 22.0, 25.0, 26.0, 11.0, 17.0, 17.0, 9.0, 14.0, 8.0, 5.0, 5.0, 5.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.833984375, -2.733123779296875, -2.63226318359375, -2.531402587890625, -2.4305419921875, -2.329681396484375, -2.22882080078125, -2.127960205078125, -2.027099609375, -1.926239013671875, -1.82537841796875, -1.724517822265625, -1.6236572265625, -1.522796630859375, -1.42193603515625, -1.321075439453125, -1.22021484375, -1.119354248046875, -1.01849365234375, -0.917633056640625, -0.8167724609375, -0.715911865234375, -0.61505126953125, -0.514190673828125, -0.413330078125, -0.312469482421875, -0.21160888671875, -0.110748291015625, -0.0098876953125, 0.090972900390625, 0.19183349609375, 0.292694091796875, 0.3935546875, 0.494415283203125, 0.59527587890625, 0.696136474609375, 0.7969970703125, 0.897857666015625, 0.99871826171875, 1.099578857421875, 1.200439453125, 1.301300048828125, 1.40216064453125, 1.503021240234375, 1.6038818359375, 1.704742431640625, 1.80560302734375, 1.906463623046875, 2.00732421875, 2.108184814453125, 2.20904541015625, 2.309906005859375, 2.4107666015625, 2.511627197265625, 2.61248779296875, 2.713348388671875, 2.814208984375, 2.915069580078125, 3.01593017578125, 3.116790771484375, 3.2176513671875, 3.318511962890625, 3.41937255859375, 3.520233154296875, 3.62109375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 11.0, 22.0, 22.0, 47.0, 53.0, 72.0, 134.0, 201.0, 297.0, 483.0, 688.0, 1059.0, 1643.0, 2479.0, 3610.0, 5542.0, 8550.0, 13231.0, 20661.0, 32892.0, 52681.0, 86139.0, 158249.0, 1373625.0, 130964.0, 75709.0, 46642.0, 28957.0, 18241.0, 11732.0, 7799.0, 4956.0, 3271.0, 2213.0, 1444.0, 987.0, 654.0, 405.0, 267.0, 178.0, 109.0, 76.0, 55.0, 18.0, 29.0, 6.0, 10.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1871185302734375, -1.146697998046875, -1.1062774658203125, -1.06585693359375, -1.0254364013671875, -0.985015869140625, -0.9445953369140625, -0.9041748046875, -0.8637542724609375, -0.823333740234375, -0.7829132080078125, -0.74249267578125, -0.7020721435546875, -0.661651611328125, -0.6212310791015625, -0.580810546875, -0.5403900146484375, -0.499969482421875, -0.4595489501953125, -0.41912841796875, -0.3787078857421875, -0.338287353515625, -0.2978668212890625, -0.2574462890625, -0.2170257568359375, -0.176605224609375, -0.1361846923828125, -0.09576416015625, -0.0553436279296875, -0.014923095703125, 0.0254974365234375, 0.06591796875, 0.1063385009765625, 0.146759033203125, 0.1871795654296875, 0.22760009765625, 0.2680206298828125, 0.308441162109375, 0.3488616943359375, 0.3892822265625, 0.4297027587890625, 0.470123291015625, 0.5105438232421875, 0.55096435546875, 0.5913848876953125, 0.631805419921875, 0.6722259521484375, 0.712646484375, 0.7530670166015625, 0.793487548828125, 0.8339080810546875, 0.87432861328125, 0.9147491455078125, 0.955169677734375, 0.9955902099609375, 1.0360107421875, 1.0764312744140625, 1.116851806640625, 1.1572723388671875, 1.19769287109375, 1.2381134033203125, 1.278533935546875, 1.3189544677734375, 1.359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 6.0, 10.0, 10.0, 14.0, 16.0, 14.0, 10.0, 27.0, 30.0, 47.0, 42.0, 47.0, 68.0, 60.0, 82.0, 68.0, 72.0, 76.0, 44.0, 54.0, 32.0, 28.0, 21.0, 23.0, 23.0, 13.0, 8.0, 9.0, 8.0, 9.0, 8.0, 0.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001659393310546875, -0.00016040727496147156, -0.00015487521886825562, -0.00014934316277503967, -0.00014381110668182373, -0.0001382790505886078, -0.00013274699449539185, -0.0001272149384021759, -0.00012168288230895996, -0.00011615082621574402, -0.00011061877012252808, -0.00010508671402931213, -9.955465793609619e-05, -9.402260184288025e-05, -8.84905457496643e-05, -8.295848965644836e-05, -7.742643356323242e-05, -7.189437747001648e-05, -6.636232137680054e-05, -6.0830265283584595e-05, -5.529820919036865e-05, -4.976615309715271e-05, -4.423409700393677e-05, -3.8702040910720825e-05, -3.316998481750488e-05, -2.763792872428894e-05, -2.2105872631072998e-05, -1.6573816537857056e-05, -1.1041760444641113e-05, -5.509704351425171e-06, 2.2351741790771484e-08, 5.554407835006714e-06, 1.1086463928222656e-05, 1.66185200214386e-05, 2.215057611465454e-05, 2.7682632207870483e-05, 3.3214688301086426e-05, 3.874674439430237e-05, 4.427880048751831e-05, 4.981085658073425e-05, 5.5342912673950195e-05, 6.087496876716614e-05, 6.640702486038208e-05, 7.193908095359802e-05, 7.747113704681396e-05, 8.300319314002991e-05, 8.853524923324585e-05, 9.406730532646179e-05, 9.959936141967773e-05, 0.00010513141751289368, 0.00011066347360610962, 0.00011619552969932556, 0.0001217275857925415, 0.00012725964188575745, 0.0001327916979789734, 0.00013832375407218933, 0.00014385581016540527, 0.00014938786625862122, 0.00015491992235183716, 0.0001604519784450531, 0.00016598403453826904, 0.00017151609063148499, 0.00017704814672470093, 0.00018258020281791687, 0.0001881122589111328]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 2.0, 14.0, 10.0, 13.0, 11.0, 14.0, 10.0, 25.0, 36.0, 46.0, 62.0, 108.0, 186.0, 275.0, 503.0, 2242.0, 807225.0, 235229.0, 1306.0, 469.0, 248.0, 173.0, 90.0, 65.0, 54.0, 29.0, 25.0, 11.0, 23.0, 13.0, 12.0, 9.0, 5.0, 3.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003971099853515625, -0.003853917121887207, -0.003736734390258789, -0.003619551658630371, -0.003502368927001953, -0.003385186195373535, -0.003268003463745117, -0.0031508207321166992, -0.0030336380004882812, -0.0029164552688598633, -0.0027992725372314453, -0.0026820898056030273, -0.0025649070739746094, -0.0024477243423461914, -0.0023305416107177734, -0.0022133588790893555, -0.0020961761474609375, -0.0019789934158325195, -0.0018618106842041016, -0.0017446279525756836, -0.0016274452209472656, -0.0015102624893188477, -0.0013930797576904297, -0.0012758970260620117, -0.0011587142944335938, -0.0010415315628051758, -0.0009243488311767578, -0.0008071660995483398, -0.0006899833679199219, -0.0005728006362915039, -0.00045561790466308594, -0.00033843517303466797, -0.00022125244140625, -0.00010406970977783203, 1.3113021850585938e-05, 0.0001302957534790039, 0.0002474784851074219, 0.00036466121673583984, 0.0004818439483642578, 0.0005990266799926758, 0.0007162094116210938, 0.0008333921432495117, 0.0009505748748779297, 0.0010677576065063477, 0.0011849403381347656, 0.0013021230697631836, 0.0014193058013916016, 0.0015364885330200195, 0.0016536712646484375, 0.0017708539962768555, 0.0018880367279052734, 0.0020052194595336914, 0.0021224021911621094, 0.0022395849227905273, 0.0023567676544189453, 0.0024739503860473633, 0.0025911331176757812, 0.0027083158493041992, 0.002825498580932617, 0.002942681312561035, 0.003059864044189453, 0.003177046775817871, 0.003294229507446289, 0.003411412239074707, 0.003528594970703125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 15.0, 24.0, 43.0, 80.0, 91.0, 131.0, 157.0, 137.0, 105.0, 72.0, 57.0, 49.0, 24.0, 11.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017996500537265092, -0.00017478116205893457, -0.000169597304193303, -0.00016441346087958664, -0.00015922961756587029, -0.0001540457597002387, -0.00014886191638652235, -0.000143678073072806, -0.00013849421520717442, -0.00013331037189345807, -0.0001281265140278265, -0.00012294267071411014, -0.00011775882740039378, -0.00011257497681071982, -0.00010739112622104585, -0.0001022072829073295, -9.702343959361315e-05, -9.183958900393918e-05, -8.665574569022283e-05, -8.147189510054886e-05, -7.628805178683251e-05, -7.110420119715855e-05, -6.592035060748458e-05, -6.073650365578942e-05, -5.555265670409426e-05, -5.03688097523991e-05, -4.518496280070394e-05, -4.0001112211029977e-05, -3.481726525933482e-05, -2.963341830763966e-05, -2.4449567717965692e-05, -1.9265720766270533e-05, -1.4081859262660146e-05, -8.898011401470285e-06, -3.714163540280424e-06, 1.4696852304041386e-06, 6.653532182099298e-06, 1.1837379133794457e-05, 1.7021229723468423e-05, 2.2205076675163582e-05, 2.738892362685874e-05, 3.25727705785539e-05, 3.775661753024906e-05, 4.2940468119923025e-05, 4.8124315071618184e-05, 5.3308162023313344e-05, 5.849201261298731e-05, 6.367586320266128e-05, 6.885970651637763e-05, 7.40435571060516e-05, 7.922740041976795e-05, 8.441125100944191e-05, 8.959509432315826e-05, 9.477894491283223e-05, 9.99627955025062e-05, 0.00010514663881622255, 0.00011033048940589651, 0.00011551433999557048, 0.00012069818330928683, 0.0001258820411749184, 0.00013106588448863477, 0.00013624972780235112, 0.0001414335856679827, 0.00014661742898169905, 0.0001518012722954154]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 6.0, 6.0, 4.0, 12.0, 12.0, 13.0, 18.0, 18.0, 15.0, 29.0, 32.0, 30.0, 29.0, 40.0, 29.0, 33.0, 50.0, 38.0, 56.0, 48.0, 30.0, 39.0, 36.0, 40.0, 36.0, 48.0, 39.0, 30.0, 30.0, 25.0, 22.0, 17.0, 20.0, 9.0, 18.0, 12.0, 10.0, 7.0, 5.0, 3.0, 1.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010561943054199219, -0.00010267645120620728, -9.973347187042236e-05, -9.679049253463745e-05, -9.384751319885254e-05, -9.090453386306763e-05, -8.796155452728271e-05, -8.50185751914978e-05, -8.207559585571289e-05, -7.913261651992798e-05, -7.618963718414307e-05, -7.324665784835815e-05, -7.030367851257324e-05, -6.736069917678833e-05, -6.441771984100342e-05, -6.14747405052185e-05, -5.8531761169433594e-05, -5.558878183364868e-05, -5.264580249786377e-05, -4.970282316207886e-05, -4.6759843826293945e-05, -4.381686449050903e-05, -4.087388515472412e-05, -3.793090581893921e-05, -3.49879264831543e-05, -3.2044947147369385e-05, -2.9101967811584473e-05, -2.615898847579956e-05, -2.321600914001465e-05, -2.0273029804229736e-05, -1.7330050468444824e-05, -1.4387071132659912e-05, -1.1444091796875e-05, -8.501112461090088e-06, -5.558133125305176e-06, -2.6151537895202637e-06, 3.2782554626464844e-07, 3.2708048820495605e-06, 6.213784217834473e-06, 9.156763553619385e-06, 1.2099742889404297e-05, 1.5042722225189209e-05, 1.798570156097412e-05, 2.0928680896759033e-05, 2.3871660232543945e-05, 2.6814639568328857e-05, 2.975761890411377e-05, 3.270059823989868e-05, 3.5643577575683594e-05, 3.8586556911468506e-05, 4.152953624725342e-05, 4.447251558303833e-05, 4.741549491882324e-05, 5.0358474254608154e-05, 5.3301453590393066e-05, 5.624443292617798e-05, 5.918741226196289e-05, 6.21303915977478e-05, 6.507337093353271e-05, 6.801635026931763e-05, 7.095932960510254e-05, 7.390230894088745e-05, 7.684528827667236e-05, 7.978826761245728e-05, 8.273124694824219e-05]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 10.0, 12.0, 10.0, 16.0, 10.0, 24.0, 19.0, 24.0, 29.0, 24.0, 26.0, 36.0, 38.0, 42.0, 50.0, 38.0, 41.0, 46.0, 44.0, 50.0, 30.0, 34.0, 29.0, 33.0, 39.0, 27.0, 29.0, 21.0, 25.0, 21.0, 20.0, 12.0, 18.0, 9.0, 14.0, 10.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.0, -4.84271240234375, -4.6854248046875, -4.52813720703125, -4.370849609375, -4.21356201171875, -4.0562744140625, -3.89898681640625, -3.74169921875, -3.58441162109375, -3.4271240234375, -3.26983642578125, -3.112548828125, -2.95526123046875, -2.7979736328125, -2.64068603515625, -2.4833984375, -2.32611083984375, -2.1688232421875, -2.01153564453125, -1.854248046875, -1.69696044921875, -1.5396728515625, -1.38238525390625, -1.22509765625, -1.06781005859375, -0.9105224609375, -0.75323486328125, -0.595947265625, -0.43865966796875, -0.2813720703125, -0.12408447265625, 0.033203125, 0.19049072265625, 0.3477783203125, 0.50506591796875, 0.662353515625, 0.81964111328125, 0.9769287109375, 1.13421630859375, 1.29150390625, 1.44879150390625, 1.6060791015625, 1.76336669921875, 1.920654296875, 2.07794189453125, 2.2352294921875, 2.39251708984375, 2.5498046875, 2.70709228515625, 2.8643798828125, 3.02166748046875, 3.178955078125, 3.33624267578125, 3.4935302734375, 3.65081787109375, 3.80810546875, 3.96539306640625, 4.1226806640625, 4.27996826171875, 4.437255859375, 4.59454345703125, 4.7518310546875, 4.90911865234375, 5.06640625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 3.0, 0.0, 8.0, 7.0, 12.0, 19.0, 18.0, 40.0, 41.0, 58.0, 89.0, 143.0, 240.0, 496.0, 998.0, 1928.0, 4042.0, 8728.0, 20259.0, 52217.0, 163947.0, 397031.0, 262655.0, 82634.0, 29658.0, 12368.0, 5536.0, 2550.0, 1259.0, 678.0, 337.0, 200.0, 109.0, 45.0, 56.0, 35.0, 27.0, 25.0, 15.0, 15.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.1903076171875, -5.009521484375, -4.8287353515625, -4.64794921875, -4.4671630859375, -4.286376953125, -4.1055908203125, -3.9248046875, -3.7440185546875, -3.563232421875, -3.3824462890625, -3.20166015625, -3.0208740234375, -2.840087890625, -2.6593017578125, -2.478515625, -2.2977294921875, -2.116943359375, -1.9361572265625, -1.75537109375, -1.5745849609375, -1.393798828125, -1.2130126953125, -1.0322265625, -0.8514404296875, -0.670654296875, -0.4898681640625, -0.30908203125, -0.1282958984375, 0.052490234375, 0.2332763671875, 0.4140625, 0.5948486328125, 0.775634765625, 0.9564208984375, 1.13720703125, 1.3179931640625, 1.498779296875, 1.6795654296875, 1.8603515625, 2.0411376953125, 2.221923828125, 2.4027099609375, 2.58349609375, 2.7642822265625, 2.945068359375, 3.1258544921875, 3.306640625, 3.4874267578125, 3.668212890625, 3.8489990234375, 4.02978515625, 4.2105712890625, 4.391357421875, 4.5721435546875, 4.7529296875, 4.9337158203125, 5.114501953125, 5.2952880859375, 5.47607421875, 5.6568603515625, 5.837646484375, 6.0184326171875, 6.19921875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 9.0, 5.0, 6.0, 4.0, 7.0, 16.0, 9.0, 13.0, 12.0, 21.0, 14.0, 28.0, 27.0, 43.0, 33.0, 32.0, 59.0, 63.0, 104.0, 193.0, 1455.0, 299.0, 142.0, 77.0, 37.0, 37.0, 36.0, 38.0, 30.0, 19.0, 29.0, 30.0, 19.0, 16.0, 22.0, 12.0, 18.0, 7.0, 3.0, 6.0, 2.0, 6.0, 2.0, 4.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.578125, -18.02734375, -17.4765625, -16.92578125, -16.375, -15.82421875, -15.2734375, -14.72265625, -14.171875, -13.62109375, -13.0703125, -12.51953125, -11.96875, -11.41796875, -10.8671875, -10.31640625, -9.765625, -9.21484375, -8.6640625, -8.11328125, -7.5625, -7.01171875, -6.4609375, -5.91015625, -5.359375, -4.80859375, -4.2578125, -3.70703125, -3.15625, -2.60546875, -2.0546875, -1.50390625, -0.953125, -0.40234375, 0.1484375, 0.69921875, 1.25, 1.80078125, 2.3515625, 2.90234375, 3.453125, 4.00390625, 4.5546875, 5.10546875, 5.65625, 6.20703125, 6.7578125, 7.30859375, 7.859375, 8.41015625, 8.9609375, 9.51171875, 10.0625, 10.61328125, 11.1640625, 11.71484375, 12.265625, 12.81640625, 13.3671875, 13.91796875, 14.46875, 15.01953125, 15.5703125, 16.12109375, 16.671875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 8.0, 13.0, 7.0, 13.0, 19.0, 34.0, 29.0, 52.0, 64.0, 61.0, 112.0, 179.0, 256.0, 436.0, 1150.0, 16831.0, 3043409.0, 79592.0, 1999.0, 533.0, 258.0, 190.0, 118.0, 84.0, 47.0, 50.0, 28.0, 32.0, 16.0, 18.0, 10.0, 16.0, 5.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.59375, -40.19091796875, -38.7880859375, -37.38525390625, -35.982421875, -34.57958984375, -33.1767578125, -31.77392578125, -30.37109375, -28.96826171875, -27.5654296875, -26.16259765625, -24.759765625, -23.35693359375, -21.9541015625, -20.55126953125, -19.1484375, -17.74560546875, -16.3427734375, -14.93994140625, -13.537109375, -12.13427734375, -10.7314453125, -9.32861328125, -7.92578125, -6.52294921875, -5.1201171875, -3.71728515625, -2.314453125, -0.91162109375, 0.4912109375, 1.89404296875, 3.296875, 4.69970703125, 6.1025390625, 7.50537109375, 8.908203125, 10.31103515625, 11.7138671875, 13.11669921875, 14.51953125, 15.92236328125, 17.3251953125, 18.72802734375, 20.130859375, 21.53369140625, 22.9365234375, 24.33935546875, 25.7421875, 27.14501953125, 28.5478515625, 29.95068359375, 31.353515625, 32.75634765625, 34.1591796875, 35.56201171875, 36.96484375, 38.36767578125, 39.7705078125, 41.17333984375, 42.576171875, 43.97900390625, 45.3818359375, 46.78466796875, 48.1875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 66.0, 553.0, 368.0, 23.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.55719757080078, -31.037094116210938, -26.516990661621094, -21.996889114379883, -17.47678565979004, -12.956682205200195, -8.436580657958984, -3.9164772033691406, 0.6036262512207031, 5.123729228973389, 9.643832206726074, 14.163934707641602, 18.684038162231445, 23.20414161682129, 27.7242431640625, 32.244346618652344, 36.76445007324219, 41.28455352783203, 45.804656982421875, 50.32476043701172, 54.84486389160156, 59.364967346191406, 63.885066986083984, 68.40516662597656, 72.92527770996094, 77.44538116455078, 81.96548461914062, 86.48558807373047, 91.00569152832031, 95.52579498291016, 100.0458984375, 104.56599426269531, 109.08609008789062, 113.60619354248047, 118.12629699707031, 122.64640045166016, 127.16650390625, 131.6865997314453, 136.2067108154297, 140.726806640625, 145.24691772460938, 149.7670135498047, 154.28712463378906, 158.80722045898438, 163.32733154296875, 167.84742736816406, 172.36753845214844, 176.88763427734375, 181.40774536132812, 185.92784118652344, 190.4479522705078, 194.96804809570312, 199.4881591796875, 204.0082550048828, 208.5283660888672, 213.0484619140625, 217.5685577392578, 222.08865356445312, 226.6087646484375, 231.1288604736328, 235.6489715576172, 240.1690673828125, 244.68917846679688, 249.2092742919922, 253.72938537597656]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 9.0, 8.0, 6.0, 7.0, 11.0, 9.0, 18.0, 17.0, 22.0, 20.0, 33.0, 22.0, 38.0, 33.0, 29.0, 34.0, 41.0, 42.0, 38.0, 37.0, 44.0, 38.0, 39.0, 41.0, 31.0, 45.0, 36.0, 36.0, 27.0, 33.0, 18.0, 17.0, 21.0, 13.0, 11.0, 10.0, 17.0, 16.0, 8.0, 9.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-49.78704071044922, -48.39008712768555, -46.993133544921875, -45.59617614746094, -44.199222564697266, -42.802268981933594, -41.40531539916992, -40.00836181640625, -38.61140441894531, -37.21445083618164, -35.81749725341797, -34.42053985595703, -33.02358627319336, -31.626632690429688, -30.229679107666016, -28.832725524902344, -27.435771942138672, -26.038818359375, -24.641862869262695, -23.244909286499023, -21.84795379638672, -20.451000213623047, -19.054046630859375, -17.657093048095703, -16.2601375579834, -14.86318302154541, -13.466228485107422, -12.06927490234375, -10.672320365905762, -9.275365829467773, -7.878412246704102, -6.481457710266113, -5.084506988525391, -3.6875526905059814, -2.2905983924865723, -0.8936443328857422, 0.5033102035522461, 1.9002647399902344, 3.2972183227539062, 4.6941728591918945, 6.091127395629883, 7.488081932067871, 8.88503646850586, 10.281990051269531, 11.67894458770752, 13.075899124145508, 14.47285270690918, 15.869807243347168, 17.266761779785156, 18.663715362548828, 20.060670852661133, 21.457624435424805, 22.85457992553711, 24.25153350830078, 25.648487091064453, 27.045440673828125, 28.44239616394043, 29.8393497467041, 31.236305236816406, 32.63325881958008, 34.03021240234375, 35.42716979980469, 36.824119567871094, 38.22107696533203, 39.6180305480957]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 6.0, 5.0, 6.0, 9.0, 15.0, 14.0, 10.0, 17.0, 18.0, 26.0, 26.0, 27.0, 21.0, 29.0, 33.0, 32.0, 36.0, 40.0, 56.0, 39.0, 33.0, 45.0, 43.0, 41.0, 35.0, 27.0, 34.0, 30.0, 32.0, 34.0, 17.0, 21.0, 16.0, 20.0, 18.0, 15.0, 14.0, 13.0, 15.0, 9.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.0703125, -4.91156005859375, -4.7528076171875, -4.59405517578125, -4.435302734375, -4.27655029296875, -4.1177978515625, -3.95904541015625, -3.80029296875, -3.64154052734375, -3.4827880859375, -3.32403564453125, -3.165283203125, -3.00653076171875, -2.8477783203125, -2.68902587890625, -2.5302734375, -2.37152099609375, -2.2127685546875, -2.05401611328125, -1.895263671875, -1.73651123046875, -1.5777587890625, -1.41900634765625, -1.26025390625, -1.10150146484375, -0.9427490234375, -0.78399658203125, -0.625244140625, -0.46649169921875, -0.3077392578125, -0.14898681640625, 0.009765625, 0.16851806640625, 0.3272705078125, 0.48602294921875, 0.644775390625, 0.80352783203125, 0.9622802734375, 1.12103271484375, 1.27978515625, 1.43853759765625, 1.5972900390625, 1.75604248046875, 1.914794921875, 2.07354736328125, 2.2322998046875, 2.39105224609375, 2.5498046875, 2.70855712890625, 2.8673095703125, 3.02606201171875, 3.184814453125, 3.34356689453125, 3.5023193359375, 3.66107177734375, 3.81982421875, 3.97857666015625, 4.1373291015625, 4.29608154296875, 4.454833984375, 4.61358642578125, 4.7723388671875, 4.93109130859375, 5.08984375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 2.0, 8.0, 8.0, 7.0, 7.0, 9.0, 11.0, 18.0, 19.0, 28.0, 21.0, 29.0, 30.0, 46.0, 51.0, 77.0, 98.0, 132.0, 239.0, 721.0, 5454.0, 382206.0, 3653701.0, 147028.0, 3030.0, 511.0, 197.0, 144.0, 93.0, 71.0, 52.0, 39.0, 29.0, 27.0, 17.0, 22.0, 22.0, 19.0, 16.0, 6.0, 8.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.390625, -23.614013671875, -22.83740234375, -22.060791015625, -21.2841796875, -20.507568359375, -19.73095703125, -18.954345703125, -18.177734375, -17.401123046875, -16.62451171875, -15.847900390625, -15.0712890625, -14.294677734375, -13.51806640625, -12.741455078125, -11.96484375, -11.188232421875, -10.41162109375, -9.635009765625, -8.8583984375, -8.081787109375, -7.30517578125, -6.528564453125, -5.751953125, -4.975341796875, -4.19873046875, -3.422119140625, -2.6455078125, -1.868896484375, -1.09228515625, -0.315673828125, 0.4609375, 1.237548828125, 2.01416015625, 2.790771484375, 3.5673828125, 4.343994140625, 5.12060546875, 5.897216796875, 6.673828125, 7.450439453125, 8.22705078125, 9.003662109375, 9.7802734375, 10.556884765625, 11.33349609375, 12.110107421875, 12.88671875, 13.663330078125, 14.43994140625, 15.216552734375, 15.9931640625, 16.769775390625, 17.54638671875, 18.322998046875, 19.099609375, 19.876220703125, 20.65283203125, 21.429443359375, 22.2060546875, 22.982666015625, 23.75927734375, 24.535888671875, 25.3125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 10.0, 12.0, 21.0, 29.0, 45.0, 51.0, 94.0, 131.0, 229.0, 292.0, 374.0, 543.0, 566.0, 527.0, 393.0, 237.0, 185.0, 108.0, 87.0, 54.0, 25.0, 19.0, 11.0, 8.0, 6.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5234375, -13.0098876953125, -12.496337890625, -11.9827880859375, -11.46923828125, -10.9556884765625, -10.442138671875, -9.9285888671875, -9.4150390625, -8.9014892578125, -8.387939453125, -7.8743896484375, -7.36083984375, -6.8472900390625, -6.333740234375, -5.8201904296875, -5.306640625, -4.7930908203125, -4.279541015625, -3.7659912109375, -3.25244140625, -2.7388916015625, -2.225341796875, -1.7117919921875, -1.1982421875, -0.6846923828125, -0.171142578125, 0.3424072265625, 0.85595703125, 1.3695068359375, 1.883056640625, 2.3966064453125, 2.91015625, 3.4237060546875, 3.937255859375, 4.4508056640625, 4.96435546875, 5.4779052734375, 5.991455078125, 6.5050048828125, 7.0185546875, 7.5321044921875, 8.045654296875, 8.5592041015625, 9.07275390625, 9.5863037109375, 10.099853515625, 10.6134033203125, 11.126953125, 11.6405029296875, 12.154052734375, 12.6676025390625, 13.18115234375, 13.6947021484375, 14.208251953125, 14.7218017578125, 15.2353515625, 15.7489013671875, 16.262451171875, 16.7760009765625, 17.28955078125, 17.8031005859375, 18.316650390625, 18.8302001953125, 19.34375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 6.0, 10.0, 9.0, 15.0, 24.0, 27.0, 44.0, 74.0, 99.0, 123.0, 167.0, 288.0, 473.0, 1099.0, 8213.0, 1092516.0, 3066944.0, 21052.0, 1494.0, 603.0, 302.0, 195.0, 132.0, 98.0, 72.0, 46.0, 38.0, 33.0, 24.0, 18.0, 15.0, 4.0, 8.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-53.78125, -52.37060546875, -50.9599609375, -49.54931640625, -48.138671875, -46.72802734375, -45.3173828125, -43.90673828125, -42.49609375, -41.08544921875, -39.6748046875, -38.26416015625, -36.853515625, -35.44287109375, -34.0322265625, -32.62158203125, -31.2109375, -29.80029296875, -28.3896484375, -26.97900390625, -25.568359375, -24.15771484375, -22.7470703125, -21.33642578125, -19.92578125, -18.51513671875, -17.1044921875, -15.69384765625, -14.283203125, -12.87255859375, -11.4619140625, -10.05126953125, -8.640625, -7.22998046875, -5.8193359375, -4.40869140625, -2.998046875, -1.58740234375, -0.1767578125, 1.23388671875, 2.64453125, 4.05517578125, 5.4658203125, 6.87646484375, 8.287109375, 9.69775390625, 11.1083984375, 12.51904296875, 13.9296875, 15.34033203125, 16.7509765625, 18.16162109375, 19.572265625, 20.98291015625, 22.3935546875, 23.80419921875, 25.21484375, 26.62548828125, 28.0361328125, 29.44677734375, 30.857421875, 32.26806640625, 33.6787109375, 35.08935546875, 36.5]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 7.0, 12.0, 61.0, 117.0, 185.0, 212.0, 174.0, 142.0, 61.0, 25.0, 13.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.015506744384766, -30.507736206054688, -26.99996566772461, -23.49219512939453, -19.984424591064453, -16.476654052734375, -12.968883514404297, -9.461112976074219, -5.953342437744141, -2.4455718994140625, 1.0621986389160156, 4.569969177246094, 8.077739715576172, 11.58551025390625, 15.093280792236328, 18.601051330566406, 22.108821868896484, 25.616592407226562, 29.12436294555664, 32.63213348388672, 36.1399040222168, 39.647674560546875, 43.15544509887695, 46.66321563720703, 50.17098617553711, 53.67875671386719, 57.186527252197266, 60.694297790527344, 64.20207214355469, 67.7098388671875, 71.21760559082031, 74.72537994384766, 78.233154296875, 81.74092102050781, 85.24869537353516, 88.7564697265625, 92.26423645019531, 95.77200317382812, 99.27977752685547, 102.78755187988281, 106.29531860351562, 109.80308532714844, 113.31085968017578, 116.81863403320312, 120.32640075683594, 123.83416748046875, 127.3419418334961, 130.84971618652344, 134.35748291015625, 137.86524963378906, 141.37301635742188, 144.88079833984375, 148.38856506347656, 151.89633178710938, 155.40411376953125, 158.91188049316406, 162.41964721679688, 165.9274139404297, 169.4351806640625, 172.94296264648438, 176.4507293701172, 179.95849609375, 183.46627807617188, 186.9740447998047, 190.4818115234375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 12.0, 4.0, 11.0, 17.0, 12.0, 14.0, 18.0, 14.0, 25.0, 21.0, 25.0, 40.0, 41.0, 42.0, 34.0, 36.0, 37.0, 37.0, 51.0, 47.0, 45.0, 40.0, 43.0, 37.0, 34.0, 37.0, 30.0, 33.0, 22.0, 24.0, 18.0, 20.0, 17.0, 14.0, 13.0, 7.0, 4.0, 6.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.61219787597656, -47.231136322021484, -45.85007858276367, -44.469017028808594, -43.08795928955078, -41.7068977355957, -40.325836181640625, -38.94477844238281, -37.563716888427734, -36.182655334472656, -34.801597595214844, -33.420536041259766, -32.03947448730469, -30.658416748046875, -29.277355194091797, -27.89629554748535, -26.515235900878906, -25.13417625427246, -23.753116607666016, -22.372055053710938, -20.990995407104492, -19.609935760498047, -18.22887420654297, -16.847814559936523, -15.466754913330078, -14.085695266723633, -12.704634666442871, -11.32357406616211, -9.942514419555664, -8.561454772949219, -7.180394172668457, -5.799333572387695, -4.418270111083984, -3.037209987640381, -1.6561498641967773, -0.27508974075317383, 1.1059703826904297, 2.487030506134033, 3.8680906295776367, 5.249151229858398, 6.630210876464844, 8.011270523071289, 9.39233112335205, 10.773391723632812, 12.154451370239258, 13.535511016845703, 14.916571617126465, 16.297632217407227, 17.678691864013672, 19.059751510620117, 20.440811157226562, 21.82187271118164, 23.202932357788086, 24.58399200439453, 25.96505355834961, 27.346113204956055, 28.7271728515625, 30.108232498168945, 31.48929214477539, 32.87035369873047, 34.25141143798828, 35.63247299194336, 37.01353454589844, 38.39459228515625, 39.77565383911133]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 4.0, 12.0, 9.0, 14.0, 15.0, 17.0, 16.0, 21.0, 31.0, 22.0, 28.0, 39.0, 37.0, 36.0, 51.0, 52.0, 40.0, 41.0, 40.0, 33.0, 39.0, 40.0, 27.0, 34.0, 42.0, 37.0, 32.0, 37.0, 20.0, 25.0, 19.0, 14.0, 13.0, 9.0, 10.0, 12.0, 9.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4765625, -5.3017578125, -5.126953125, -4.9521484375, -4.77734375, -4.6025390625, -4.427734375, -4.2529296875, -4.078125, -3.9033203125, -3.728515625, -3.5537109375, -3.37890625, -3.2041015625, -3.029296875, -2.8544921875, -2.6796875, -2.5048828125, -2.330078125, -2.1552734375, -1.98046875, -1.8056640625, -1.630859375, -1.4560546875, -1.28125, -1.1064453125, -0.931640625, -0.7568359375, -0.58203125, -0.4072265625, -0.232421875, -0.0576171875, 0.1171875, 0.2919921875, 0.466796875, 0.6416015625, 0.81640625, 0.9912109375, 1.166015625, 1.3408203125, 1.515625, 1.6904296875, 1.865234375, 2.0400390625, 2.21484375, 2.3896484375, 2.564453125, 2.7392578125, 2.9140625, 3.0888671875, 3.263671875, 3.4384765625, 3.61328125, 3.7880859375, 3.962890625, 4.1376953125, 4.3125, 4.4873046875, 4.662109375, 4.8369140625, 5.01171875, 5.1865234375, 5.361328125, 5.5361328125, 5.7109375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 13.0, 12.0, 16.0, 30.0, 41.0, 62.0, 103.0, 150.0, 239.0, 353.0, 520.0, 829.0, 1275.0, 1922.0, 2940.0, 4581.0, 6945.0, 10746.0, 16954.0, 26934.0, 43751.0, 72649.0, 132922.0, 320795.0, 175105.0, 89431.0, 51614.0, 31727.0, 19833.0, 12687.0, 8211.0, 5316.0, 3384.0, 2253.0, 1464.0, 965.0, 620.0, 387.0, 268.0, 162.0, 120.0, 68.0, 50.0, 32.0, 28.0, 20.0, 16.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.484375, -1.4389495849609375, -1.393524169921875, -1.3480987548828125, -1.30267333984375, -1.2572479248046875, -1.211822509765625, -1.1663970947265625, -1.1209716796875, -1.0755462646484375, -1.030120849609375, -0.9846954345703125, -0.93927001953125, -0.8938446044921875, -0.848419189453125, -0.8029937744140625, -0.757568359375, -0.7121429443359375, -0.666717529296875, -0.6212921142578125, -0.57586669921875, -0.5304412841796875, -0.485015869140625, -0.4395904541015625, -0.3941650390625, -0.3487396240234375, -0.303314208984375, -0.2578887939453125, -0.21246337890625, -0.1670379638671875, -0.121612548828125, -0.0761871337890625, -0.03076171875, 0.0146636962890625, 0.060089111328125, 0.1055145263671875, 0.15093994140625, 0.1963653564453125, 0.241790771484375, 0.2872161865234375, 0.3326416015625, 0.3780670166015625, 0.423492431640625, 0.4689178466796875, 0.51434326171875, 0.5597686767578125, 0.605194091796875, 0.6506195068359375, 0.696044921875, 0.7414703369140625, 0.786895751953125, 0.8323211669921875, 0.87774658203125, 0.9231719970703125, 0.968597412109375, 1.0140228271484375, 1.0594482421875, 1.1048736572265625, 1.150299072265625, 1.1957244873046875, 1.24114990234375, 1.2865753173828125, 1.332000732421875, 1.3774261474609375, 1.4228515625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 6.0, 8.0, 5.0, 19.0, 11.0, 10.0, 13.0, 19.0, 18.0, 21.0, 22.0, 18.0, 27.0, 35.0, 35.0, 38.0, 33.0, 42.0, 32.0, 46.0, 1079.0, 39.0, 46.0, 38.0, 36.0, 32.0, 34.0, 26.0, 31.0, 19.0, 25.0, 25.0, 24.0, 26.0, 8.0, 12.0, 12.0, 11.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0], "bins": [-3.708984375, -3.6009521484375, -3.492919921875, -3.3848876953125, -3.27685546875, -3.1688232421875, -3.060791015625, -2.9527587890625, -2.8447265625, -2.7366943359375, -2.628662109375, -2.5206298828125, -2.41259765625, -2.3045654296875, -2.196533203125, -2.0885009765625, -1.98046875, -1.8724365234375, -1.764404296875, -1.6563720703125, -1.54833984375, -1.4403076171875, -1.332275390625, -1.2242431640625, -1.1162109375, -1.0081787109375, -0.900146484375, -0.7921142578125, -0.68408203125, -0.5760498046875, -0.468017578125, -0.3599853515625, -0.251953125, -0.1439208984375, -0.035888671875, 0.0721435546875, 0.18017578125, 0.2882080078125, 0.396240234375, 0.5042724609375, 0.6123046875, 0.7203369140625, 0.828369140625, 0.9364013671875, 1.04443359375, 1.1524658203125, 1.260498046875, 1.3685302734375, 1.4765625, 1.5845947265625, 1.692626953125, 1.8006591796875, 1.90869140625, 2.0167236328125, 2.124755859375, 2.2327880859375, 2.3408203125, 2.4488525390625, 2.556884765625, 2.6649169921875, 2.77294921875, 2.8809814453125, 2.989013671875, 3.0970458984375, 3.205078125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 12.0, 7.0, 25.0, 30.0, 45.0, 74.0, 94.0, 176.0, 226.0, 343.0, 447.0, 702.0, 980.0, 1484.0, 2134.0, 3016.0, 4322.0, 6391.0, 9403.0, 13607.0, 20383.0, 31024.0, 47410.0, 75119.0, 132750.0, 1371633.0, 145151.0, 79959.0, 50342.0, 32917.0, 21236.0, 14410.0, 9793.0, 6672.0, 4629.0, 3134.0, 2124.0, 1501.0, 1047.0, 738.0, 582.0, 365.0, 248.0, 139.0, 120.0, 63.0, 49.0, 34.0, 17.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0], "bins": [-1.39453125, -1.3529815673828125, -1.311431884765625, -1.2698822021484375, -1.22833251953125, -1.1867828369140625, -1.145233154296875, -1.1036834716796875, -1.0621337890625, -1.0205841064453125, -0.979034423828125, -0.9374847412109375, -0.89593505859375, -0.8543853759765625, -0.812835693359375, -0.7712860107421875, -0.729736328125, -0.6881866455078125, -0.646636962890625, -0.6050872802734375, -0.56353759765625, -0.5219879150390625, -0.480438232421875, -0.4388885498046875, -0.3973388671875, -0.3557891845703125, -0.314239501953125, -0.2726898193359375, -0.23114013671875, -0.1895904541015625, -0.148040771484375, -0.1064910888671875, -0.06494140625, -0.0233917236328125, 0.018157958984375, 0.0597076416015625, 0.10125732421875, 0.1428070068359375, 0.184356689453125, 0.2259063720703125, 0.2674560546875, 0.3090057373046875, 0.350555419921875, 0.3921051025390625, 0.43365478515625, 0.4752044677734375, 0.516754150390625, 0.5583038330078125, 0.599853515625, 0.6414031982421875, 0.682952880859375, 0.7245025634765625, 0.76605224609375, 0.8076019287109375, 0.849151611328125, 0.8907012939453125, 0.9322509765625, 0.9738006591796875, 1.015350341796875, 1.0569000244140625, 1.09844970703125, 1.1399993896484375, 1.181549072265625, 1.2230987548828125, 1.2646484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 9.0, 13.0, 11.0, 11.0, 12.0, 15.0, 20.0, 26.0, 34.0, 45.0, 57.0, 71.0, 97.0, 104.0, 80.0, 89.0, 54.0, 47.0, 28.0, 30.0, 36.0, 22.0, 13.0, 14.0, 11.0, 2.0, 6.0, 4.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002951622009277344, -0.00028659403324127197, -0.00027802586555480957, -0.00026945769786834717, -0.00026088953018188477, -0.00025232136249542236, -0.00024375319480895996, -0.00023518502712249756, -0.00022661685943603516, -0.00021804869174957275, -0.00020948052406311035, -0.00020091235637664795, -0.00019234418869018555, -0.00018377602100372314, -0.00017520785331726074, -0.00016663968563079834, -0.00015807151794433594, -0.00014950335025787354, -0.00014093518257141113, -0.00013236701488494873, -0.00012379884719848633, -0.00011523067951202393, -0.00010666251182556152, -9.809434413909912e-05, -8.952617645263672e-05, -8.095800876617432e-05, -7.238984107971191e-05, -6.382167339324951e-05, -5.525350570678711e-05, -4.668533802032471e-05, -3.8117170333862305e-05, -2.9549002647399902e-05, -2.09808349609375e-05, -1.2412667274475098e-05, -3.844499588012695e-06, 4.723668098449707e-06, 1.329183578491211e-05, 2.1860003471374512e-05, 3.0428171157836914e-05, 3.8996338844299316e-05, 4.756450653076172e-05, 5.613267421722412e-05, 6.470084190368652e-05, 7.326900959014893e-05, 8.183717727661133e-05, 9.040534496307373e-05, 9.897351264953613e-05, 0.00010754168033599854, 0.00011610984802246094, 0.00012467801570892334, 0.00013324618339538574, 0.00014181435108184814, 0.00015038251876831055, 0.00015895068645477295, 0.00016751885414123535, 0.00017608702182769775, 0.00018465518951416016, 0.00019322335720062256, 0.00020179152488708496, 0.00021035969257354736, 0.00021892786026000977, 0.00022749602794647217, 0.00023606419563293457, 0.00024463236331939697, 0.0002532005310058594]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 5.0, 8.0, 9.0, 9.0, 9.0, 5.0, 12.0, 19.0, 38.0, 37.0, 51.0, 94.0, 117.0, 174.0, 352.0, 820.0, 29779.0, 1011593.0, 3985.0, 629.0, 293.0, 155.0, 89.0, 69.0, 45.0, 22.0, 23.0, 18.0, 17.0, 15.0, 11.0, 9.0, 6.0, 6.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.004840850830078125, -0.004681289196014404, -0.004521727561950684, -0.004362165927886963, -0.004202604293823242, -0.0040430426597595215, -0.0038834810256958008, -0.00372391939163208, -0.0035643577575683594, -0.0034047961235046387, -0.003245234489440918, -0.0030856728553771973, -0.0029261112213134766, -0.002766549587249756, -0.002606987953186035, -0.0024474263191223145, -0.0022878646850585938, -0.002128303050994873, -0.0019687414169311523, -0.0018091797828674316, -0.001649618148803711, -0.0014900565147399902, -0.0013304948806762695, -0.0011709332466125488, -0.0010113716125488281, -0.0008518099784851074, -0.0006922483444213867, -0.000532686710357666, -0.0003731250762939453, -0.0002135634422302246, -5.4001808166503906e-05, 0.0001055598258972168, 0.0002651214599609375, 0.0004246830940246582, 0.0005842447280883789, 0.0007438063621520996, 0.0009033679962158203, 0.001062929630279541, 0.0012224912643432617, 0.0013820528984069824, 0.0015416145324707031, 0.0017011761665344238, 0.0018607378005981445, 0.0020202994346618652, 0.002179861068725586, 0.0023394227027893066, 0.0024989843368530273, 0.002658545970916748, 0.0028181076049804688, 0.0029776692390441895, 0.00313723087310791, 0.003296792507171631, 0.0034563541412353516, 0.0036159157752990723, 0.003775477409362793, 0.003935039043426514, 0.004094600677490234, 0.004254162311553955, 0.004413723945617676, 0.0045732855796813965, 0.004732847213745117, 0.004892408847808838, 0.005051970481872559, 0.005211532115936279, 0.00537109375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 57.0, 233.0, 415.0, 250.0, 52.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009420436690561473, -0.0009237512713298202, -0.000905458873603493, -0.0008871664758771658, -0.0008688740781508386, -0.0008505816804245114, -0.0008322892826981843, -0.0008139968849718571, -0.000795704429037869, -0.0007774120313115418, -0.0007591196335852146, -0.0007408272358588874, -0.0007225348381325603, -0.0007042424404062331, -0.0006859500426799059, -0.0006676575867459178, -0.0006493652472272515, -0.0006310728495009243, -0.0006127804517745972, -0.00059448805404827, -0.0005761956563219428, -0.0005579032585956156, -0.0005396108608692884, -0.0005213184049353004, -0.0005030260654166341, -0.0004847336676903069, -0.0004664412699639797, -0.00044814887223765254, -0.00042985647451132536, -0.0004115640767849982, -0.00039327164995484054, -0.00037497925222851336, -0.0003566868253983557, -0.00033839442767202854, -0.00032010202994570136, -0.0003018096322193742, -0.000283517234493047, -0.0002652248367667198, -0.0002469324099365622, -0.000228640012210235, -0.00021034762903582305, -0.00019205523130949587, -0.00017376281903125346, -0.00015547042130492628, -0.0001371780235785991, -0.00011888562585227191, -0.00010059322084998712, -8.230081584770232e-05, -6.400841812137514e-05, -4.5716016757069156e-05, -2.7423615392763168e-05, -9.13121402845718e-06, 9.161187335848808e-06, 2.745358506217599e-05, 4.5745990064460784e-05, 6.403839506674558e-05, 8.233079279307276e-05, 0.00010062319051939994, 0.00011891559552168474, 0.00013720800052396953, 0.0001555003982502967, 0.0001737927959766239, 0.00019208519370295107, 0.00021037760598119348, 0.00022867000370752066]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 9.0, 9.0, 10.0, 6.0, 15.0, 11.0, 10.0, 18.0, 17.0, 16.0, 27.0, 36.0, 24.0, 32.0, 36.0, 36.0, 41.0, 38.0, 31.0, 37.0, 49.0, 35.0, 31.0, 49.0, 56.0, 34.0, 41.0, 25.0, 31.0, 29.0, 21.0, 14.0, 22.0, 17.0, 18.0, 13.0, 17.0, 9.0, 8.0, 6.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010722875595092773, -0.00010335631668567657, -9.948387742042542e-05, -9.561143815517426e-05, -9.17389988899231e-05, -8.786655962467194e-05, -8.399412035942078e-05, -8.012168109416962e-05, -7.624924182891846e-05, -7.23768025636673e-05, -6.850436329841614e-05, -6.463192403316498e-05, -6.075948476791382e-05, -5.688704550266266e-05, -5.30146062374115e-05, -4.914216697216034e-05, -4.526972770690918e-05, -4.139728844165802e-05, -3.752484917640686e-05, -3.36524099111557e-05, -2.977997064590454e-05, -2.590753138065338e-05, -2.203509211540222e-05, -1.8162652850151062e-05, -1.4290213584899902e-05, -1.0417774319648743e-05, -6.545335054397583e-06, -2.6728957891464233e-06, 1.1995434761047363e-06, 5.071982741355896e-06, 8.944422006607056e-06, 1.2816861271858215e-05, 1.6689300537109375e-05, 2.0561739802360535e-05, 2.4434179067611694e-05, 2.8306618332862854e-05, 3.2179057598114014e-05, 3.605149686336517e-05, 3.992393612861633e-05, 4.379637539386749e-05, 4.766881465911865e-05, 5.154125392436981e-05, 5.541369318962097e-05, 5.928613245487213e-05, 6.315857172012329e-05, 6.703101098537445e-05, 7.090345025062561e-05, 7.477588951587677e-05, 7.864832878112793e-05, 8.252076804637909e-05, 8.639320731163025e-05, 9.026564657688141e-05, 9.413808584213257e-05, 9.801052510738373e-05, 0.00010188296437263489, 0.00010575540363788605, 0.00010962784290313721, 0.00011350028216838837, 0.00011737272143363953, 0.00012124516069889069, 0.00012511759996414185, 0.000128990039229393, 0.00013286247849464417, 0.00013673491775989532, 0.00014060735702514648]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 4.0, 12.0, 9.0, 14.0, 15.0, 17.0, 16.0, 21.0, 31.0, 22.0, 28.0, 39.0, 37.0, 36.0, 51.0, 52.0, 40.0, 41.0, 40.0, 33.0, 39.0, 40.0, 27.0, 34.0, 42.0, 37.0, 32.0, 37.0, 20.0, 25.0, 19.0, 14.0, 13.0, 9.0, 10.0, 12.0, 9.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4765625, -5.3017578125, -5.126953125, -4.9521484375, -4.77734375, -4.6025390625, -4.427734375, -4.2529296875, -4.078125, -3.9033203125, -3.728515625, -3.5537109375, -3.37890625, -3.2041015625, -3.029296875, -2.8544921875, -2.6796875, -2.5048828125, -2.330078125, -2.1552734375, -1.98046875, -1.8056640625, -1.630859375, -1.4560546875, -1.28125, -1.1064453125, -0.931640625, -0.7568359375, -0.58203125, -0.4072265625, -0.232421875, -0.0576171875, 0.1171875, 0.2919921875, 0.466796875, 0.6416015625, 0.81640625, 0.9912109375, 1.166015625, 1.3408203125, 1.515625, 1.6904296875, 1.865234375, 2.0400390625, 2.21484375, 2.3896484375, 2.564453125, 2.7392578125, 2.9140625, 3.0888671875, 3.263671875, 3.4384765625, 3.61328125, 3.7880859375, 3.962890625, 4.1376953125, 4.3125, 4.4873046875, 4.662109375, 4.8369140625, 5.01171875, 5.1865234375, 5.361328125, 5.5361328125, 5.7109375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 16.0, 17.0, 33.0, 35.0, 45.0, 78.0, 109.0, 185.0, 237.0, 388.0, 682.0, 1131.0, 1887.0, 3505.0, 6125.0, 11414.0, 20446.0, 38430.0, 75960.0, 162088.0, 298702.0, 216327.0, 102541.0, 49700.0, 25899.0, 14446.0, 7767.0, 4420.0, 2416.0, 1406.0, 794.0, 476.0, 291.0, 185.0, 92.0, 76.0, 56.0, 35.0, 32.0, 21.0, 15.0, 9.0, 10.0, 6.0, 4.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.08203125, -3.9532470703125, -3.824462890625, -3.6956787109375, -3.56689453125, -3.4381103515625, -3.309326171875, -3.1805419921875, -3.0517578125, -2.9229736328125, -2.794189453125, -2.6654052734375, -2.53662109375, -2.4078369140625, -2.279052734375, -2.1502685546875, -2.021484375, -1.8927001953125, -1.763916015625, -1.6351318359375, -1.50634765625, -1.3775634765625, -1.248779296875, -1.1199951171875, -0.9912109375, -0.8624267578125, -0.733642578125, -0.6048583984375, -0.47607421875, -0.3472900390625, -0.218505859375, -0.0897216796875, 0.0390625, 0.1678466796875, 0.296630859375, 0.4254150390625, 0.55419921875, 0.6829833984375, 0.811767578125, 0.9405517578125, 1.0693359375, 1.1981201171875, 1.326904296875, 1.4556884765625, 1.58447265625, 1.7132568359375, 1.842041015625, 1.9708251953125, 2.099609375, 2.2283935546875, 2.357177734375, 2.4859619140625, 2.61474609375, 2.7435302734375, 2.872314453125, 3.0010986328125, 3.1298828125, 3.2586669921875, 3.387451171875, 3.5162353515625, 3.64501953125, 3.7738037109375, 3.902587890625, 4.0313720703125, 4.16015625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 2.0, 7.0, 7.0, 10.0, 7.0, 7.0, 7.0, 10.0, 23.0, 23.0, 23.0, 24.0, 19.0, 32.0, 38.0, 37.0, 37.0, 57.0, 49.0, 87.0, 119.0, 356.0, 1409.0, 155.0, 71.0, 52.0, 44.0, 40.0, 40.0, 29.0, 31.0, 32.0, 31.0, 20.0, 20.0, 20.0, 22.0, 7.0, 17.0, 8.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.39306640625, -17.8017578125, -17.21044921875, -16.619140625, -16.02783203125, -15.4365234375, -14.84521484375, -14.25390625, -13.66259765625, -13.0712890625, -12.47998046875, -11.888671875, -11.29736328125, -10.7060546875, -10.11474609375, -9.5234375, -8.93212890625, -8.3408203125, -7.74951171875, -7.158203125, -6.56689453125, -5.9755859375, -5.38427734375, -4.79296875, -4.20166015625, -3.6103515625, -3.01904296875, -2.427734375, -1.83642578125, -1.2451171875, -0.65380859375, -0.0625, 0.52880859375, 1.1201171875, 1.71142578125, 2.302734375, 2.89404296875, 3.4853515625, 4.07666015625, 4.66796875, 5.25927734375, 5.8505859375, 6.44189453125, 7.033203125, 7.62451171875, 8.2158203125, 8.80712890625, 9.3984375, 9.98974609375, 10.5810546875, 11.17236328125, 11.763671875, 12.35498046875, 12.9462890625, 13.53759765625, 14.12890625, 14.72021484375, 15.3115234375, 15.90283203125, 16.494140625, 17.08544921875, 17.6767578125, 18.26806640625, 18.859375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 8.0, 14.0, 24.0, 27.0, 51.0, 97.0, 151.0, 319.0, 922.0, 39116.0, 3101611.0, 2363.0, 448.0, 212.0, 109.0, 73.0, 40.0, 33.0, 20.0, 17.0, 7.0, 11.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-126.5625, -122.9697265625, -119.376953125, -115.7841796875, -112.19140625, -108.5986328125, -105.005859375, -101.4130859375, -97.8203125, -94.2275390625, -90.634765625, -87.0419921875, -83.44921875, -79.8564453125, -76.263671875, -72.6708984375, -69.078125, -65.4853515625, -61.892578125, -58.2998046875, -54.70703125, -51.1142578125, -47.521484375, -43.9287109375, -40.3359375, -36.7431640625, -33.150390625, -29.5576171875, -25.96484375, -22.3720703125, -18.779296875, -15.1865234375, -11.59375, -8.0009765625, -4.408203125, -0.8154296875, 2.77734375, 6.3701171875, 9.962890625, 13.5556640625, 17.1484375, 20.7412109375, 24.333984375, 27.9267578125, 31.51953125, 35.1123046875, 38.705078125, 42.2978515625, 45.890625, 49.4833984375, 53.076171875, 56.6689453125, 60.26171875, 63.8544921875, 67.447265625, 71.0400390625, 74.6328125, 78.2255859375, 81.818359375, 85.4111328125, 89.00390625, 92.5966796875, 96.189453125, 99.7822265625, 103.375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 816.0, 201.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.60578918457031, -52.339107513427734, -34.072425842285156, -15.805744171142578, 2.4609375, 20.727615356445312, 38.994300842285156, 57.260986328125, 75.52766418457031, 93.79434204101562, 112.06102752685547, 130.3277130126953, 148.59439086914062, 166.86106872558594, 185.12774658203125, 203.39443969726562, 221.66111755371094, 239.92779541015625, 258.1944885253906, 276.4611511230469, 294.72784423828125, 312.9945068359375, 331.2611999511719, 349.52789306640625, 367.7945556640625, 386.0612487792969, 404.3279113769531, 422.5946044921875, 440.86126708984375, 459.1279602050781, 477.3946533203125, 495.66131591796875, 513.927978515625, 532.1946411132812, 550.4613647460938, 568.72802734375, 586.9946899414062, 605.2613525390625, 623.528076171875, 641.7947387695312, 660.0614013671875, 678.3280639648438, 696.5947875976562, 714.8614501953125, 733.1281127929688, 751.394775390625, 769.6614990234375, 787.9281616210938, 806.1948852539062, 824.4615478515625, 842.728271484375, 860.9949340820312, 879.2615966796875, 897.5283203125, 915.7949829101562, 934.0616455078125, 952.328369140625, 970.5950317382812, 988.8617553710938, 1007.12841796875, 1025.3951416015625, 1043.6617431640625, 1061.928466796875, 1080.1951904296875, 1098.4617919921875]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 9.0, 6.0, 7.0, 10.0, 10.0, 14.0, 15.0, 16.0, 14.0, 18.0, 18.0, 22.0, 32.0, 27.0, 32.0, 24.0, 37.0, 36.0, 40.0, 40.0, 39.0, 33.0, 34.0, 53.0, 39.0, 35.0, 27.0, 28.0, 37.0, 25.0, 27.0, 25.0, 27.0, 18.0, 23.0, 16.0, 10.0, 12.0, 11.0, 10.0, 8.0, 10.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-45.475093841552734, -43.94450759887695, -42.413917541503906, -40.883331298828125, -39.352745056152344, -37.8221549987793, -36.291568756103516, -34.76097869873047, -33.23039245605469, -31.699804306030273, -30.169218063354492, -28.638629913330078, -27.108041763305664, -25.57745361328125, -24.04686737060547, -22.516279220581055, -20.985692977905273, -19.45510482788086, -17.924518585205078, -16.393930435180664, -14.86334228515625, -13.332755088806152, -11.802167892456055, -10.27157974243164, -8.740992546081543, -7.210404872894287, -5.679817199707031, -4.149230003356934, -2.6186423301696777, -1.0880546569824219, 0.4425325393676758, 1.9731206893920898, 3.5037078857421875, 5.034295558929443, 6.564883232116699, 8.095470428466797, 9.626058578491211, 11.156645774841309, 12.687232971191406, 14.21782112121582, 15.748408317565918, 17.278995513916016, 18.80958366394043, 20.340171813964844, 21.870758056640625, 23.40134620666504, 24.931934356689453, 26.462520599365234, 27.99310874938965, 29.523696899414062, 31.054283142089844, 32.584869384765625, 34.11545944213867, 35.64604568481445, 37.1766357421875, 38.70722198486328, 40.23780822753906, 41.768394470214844, 43.29898452758789, 44.82957077026367, 46.36015701293945, 47.8907470703125, 49.42133331298828, 50.95191955566406, 52.48250961303711]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 8.0, 7.0, 9.0, 18.0, 16.0, 16.0, 19.0, 17.0, 25.0, 29.0, 37.0, 39.0, 33.0, 37.0, 32.0, 44.0, 41.0, 47.0, 36.0, 49.0, 36.0, 38.0, 33.0, 39.0, 34.0, 24.0, 39.0, 29.0, 26.0, 17.0, 22.0, 15.0, 17.0, 8.0, 10.0, 6.0, 11.0, 10.0, 6.0, 0.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.073486328125, -4.88916015625, -4.704833984375, -4.5205078125, -4.336181640625, -4.15185546875, -3.967529296875, -3.783203125, -3.598876953125, -3.41455078125, -3.230224609375, -3.0458984375, -2.861572265625, -2.67724609375, -2.492919921875, -2.30859375, -2.124267578125, -1.93994140625, -1.755615234375, -1.5712890625, -1.386962890625, -1.20263671875, -1.018310546875, -0.833984375, -0.649658203125, -0.46533203125, -0.281005859375, -0.0966796875, 0.087646484375, 0.27197265625, 0.456298828125, 0.640625, 0.824951171875, 1.00927734375, 1.193603515625, 1.3779296875, 1.562255859375, 1.74658203125, 1.930908203125, 2.115234375, 2.299560546875, 2.48388671875, 2.668212890625, 2.8525390625, 3.036865234375, 3.22119140625, 3.405517578125, 3.58984375, 3.774169921875, 3.95849609375, 4.142822265625, 4.3271484375, 4.511474609375, 4.69580078125, 4.880126953125, 5.064453125, 5.248779296875, 5.43310546875, 5.617431640625, 5.8017578125, 5.986083984375, 6.17041015625, 6.354736328125, 6.5390625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 2.0, 7.0, 2.0, 18.0, 14.0, 21.0, 24.0, 34.0, 44.0, 60.0, 91.0, 102.0, 161.0, 231.0, 406.0, 740.0, 1578.0, 3871.0, 12474.0, 48919.0, 209277.0, 747761.0, 1487298.0, 1154390.0, 399116.0, 94006.0, 22450.0, 6370.0, 2340.0, 943.0, 531.0, 298.0, 208.0, 142.0, 95.0, 61.0, 41.0, 38.0, 36.0, 20.0, 15.0, 13.0, 8.0, 4.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.0703125, -6.84027099609375, -6.6102294921875, -6.38018798828125, -6.150146484375, -5.92010498046875, -5.6900634765625, -5.46002197265625, -5.22998046875, -4.99993896484375, -4.7698974609375, -4.53985595703125, -4.309814453125, -4.07977294921875, -3.8497314453125, -3.61968994140625, -3.3896484375, -3.15960693359375, -2.9295654296875, -2.69952392578125, -2.469482421875, -2.23944091796875, -2.0093994140625, -1.77935791015625, -1.54931640625, -1.31927490234375, -1.0892333984375, -0.85919189453125, -0.629150390625, -0.39910888671875, -0.1690673828125, 0.06097412109375, 0.291015625, 0.52105712890625, 0.7510986328125, 0.98114013671875, 1.211181640625, 1.44122314453125, 1.6712646484375, 1.90130615234375, 2.13134765625, 2.36138916015625, 2.5914306640625, 2.82147216796875, 3.051513671875, 3.28155517578125, 3.5115966796875, 3.74163818359375, 3.9716796875, 4.20172119140625, 4.4317626953125, 4.66180419921875, 4.891845703125, 5.12188720703125, 5.3519287109375, 5.58197021484375, 5.81201171875, 6.04205322265625, 6.2720947265625, 6.50213623046875, 6.732177734375, 6.96221923828125, 7.1922607421875, 7.42230224609375, 7.65234375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 9.0, 16.0, 20.0, 27.0, 24.0, 49.0, 62.0, 79.0, 97.0, 123.0, 175.0, 259.0, 311.0, 374.0, 418.0, 404.0, 318.0, 299.0, 262.0, 193.0, 143.0, 95.0, 93.0, 62.0, 41.0, 29.0, 23.0, 11.0, 6.0, 12.0, 7.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.5625, -14.1688232421875, -13.775146484375, -13.3814697265625, -12.98779296875, -12.5941162109375, -12.200439453125, -11.8067626953125, -11.4130859375, -11.0194091796875, -10.625732421875, -10.2320556640625, -9.83837890625, -9.4447021484375, -9.051025390625, -8.6573486328125, -8.263671875, -7.8699951171875, -7.476318359375, -7.0826416015625, -6.68896484375, -6.2952880859375, -5.901611328125, -5.5079345703125, -5.1142578125, -4.7205810546875, -4.326904296875, -3.9332275390625, -3.53955078125, -3.1458740234375, -2.752197265625, -2.3585205078125, -1.96484375, -1.5711669921875, -1.177490234375, -0.7838134765625, -0.39013671875, 0.0035400390625, 0.397216796875, 0.7908935546875, 1.1845703125, 1.5782470703125, 1.971923828125, 2.3656005859375, 2.75927734375, 3.1529541015625, 3.546630859375, 3.9403076171875, 4.333984375, 4.7276611328125, 5.121337890625, 5.5150146484375, 5.90869140625, 6.3023681640625, 6.696044921875, 7.0897216796875, 7.4833984375, 7.8770751953125, 8.270751953125, 8.6644287109375, 9.05810546875, 9.4517822265625, 9.845458984375, 10.2391357421875, 10.6328125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 7.0, 8.0, 7.0, 9.0, 16.0, 14.0, 20.0, 34.0, 44.0, 50.0, 66.0, 93.0, 185.0, 238.0, 513.0, 1341.0, 16776.0, 2051989.0, 2102931.0, 17273.0, 1345.0, 476.0, 247.0, 161.0, 108.0, 89.0, 56.0, 53.0, 39.0, 26.0, 26.0, 8.0, 15.0, 6.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.875, -33.58349609375, -32.2919921875, -31.00048828125, -29.708984375, -28.41748046875, -27.1259765625, -25.83447265625, -24.54296875, -23.25146484375, -21.9599609375, -20.66845703125, -19.376953125, -18.08544921875, -16.7939453125, -15.50244140625, -14.2109375, -12.91943359375, -11.6279296875, -10.33642578125, -9.044921875, -7.75341796875, -6.4619140625, -5.17041015625, -3.87890625, -2.58740234375, -1.2958984375, -0.00439453125, 1.287109375, 2.57861328125, 3.8701171875, 5.16162109375, 6.453125, 7.74462890625, 9.0361328125, 10.32763671875, 11.619140625, 12.91064453125, 14.2021484375, 15.49365234375, 16.78515625, 18.07666015625, 19.3681640625, 20.65966796875, 21.951171875, 23.24267578125, 24.5341796875, 25.82568359375, 27.1171875, 28.40869140625, 29.7001953125, 30.99169921875, 32.283203125, 33.57470703125, 34.8662109375, 36.15771484375, 37.44921875, 38.74072265625, 40.0322265625, 41.32373046875, 42.615234375, 43.90673828125, 45.1982421875, 46.48974609375, 47.78125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 16.0, 32.0, 78.0, 124.0, 160.0, 191.0, 176.0, 117.0, 58.0, 30.0, 19.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-120.8705062866211, -117.87789916992188, -114.88529205322266, -111.89268493652344, -108.90007019042969, -105.90746307373047, -102.91485595703125, -99.92224884033203, -96.92964172363281, -93.9370346069336, -90.94442749023438, -87.95181274414062, -84.9592056274414, -81.96659851074219, -78.97399139404297, -75.98138427734375, -72.98876953125, -69.99616241455078, -67.00355529785156, -64.01094055175781, -61.01833724975586, -58.025726318359375, -55.033119201660156, -52.04051208496094, -49.04790496826172, -46.0552978515625, -43.062686920166016, -40.0700798034668, -37.07747268676758, -34.084861755371094, -31.092254638671875, -28.099647521972656, -25.107040405273438, -22.114431381225586, -19.121824264526367, -16.129215240478516, -13.13660717010498, -10.143999099731445, -7.151390075683594, -4.158782958984375, -1.1661739349365234, 1.8264343738555908, 4.819042682647705, 7.811651229858398, 10.804259300231934, 13.796867370605469, 16.78947639465332, 19.78208351135254, 22.77469253540039, 25.767301559448242, 28.75990867614746, 31.752517700195312, 34.74512481689453, 37.73773193359375, 40.730342864990234, 43.72294998168945, 46.71556091308594, 49.708168029785156, 52.70077896118164, 55.69338607788086, 58.68599319458008, 61.67860412597656, 64.67121124267578, 67.663818359375, 70.65642547607422]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 5.0, 8.0, 7.0, 5.0, 15.0, 15.0, 21.0, 20.0, 24.0, 24.0, 18.0, 23.0, 44.0, 30.0, 47.0, 39.0, 37.0, 34.0, 29.0, 56.0, 58.0, 38.0, 38.0, 43.0, 32.0, 47.0, 38.0, 41.0, 32.0, 20.0, 22.0, 21.0, 13.0, 9.0, 14.0, 9.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.60210418701172, -41.16630935668945, -39.73051452636719, -38.29472351074219, -36.85892868041992, -35.423133850097656, -33.98733901977539, -32.551544189453125, -31.115751266479492, -29.679956436157227, -28.244163513183594, -26.808368682861328, -25.372573852539062, -23.93678092956543, -22.500986099243164, -21.06519317626953, -19.629398345947266, -18.193603515625, -16.757810592651367, -15.322015762329102, -13.886221885681152, -12.450428009033203, -11.014633178710938, -9.578839302062988, -8.143045425415039, -6.70725154876709, -5.271457195281982, -3.835662841796875, -2.399868965148926, -0.9640750885009766, 0.47171974182128906, 1.9075136184692383, 3.343303680419922, 4.779097557067871, 6.2148919105529785, 7.650686264038086, 9.086480140686035, 10.522274017333984, 11.95806884765625, 13.3938627243042, 14.829656600952148, 16.265451431274414, 17.701244354248047, 19.137039184570312, 20.572834014892578, 22.00862693786621, 23.444421768188477, 24.88021469116211, 26.316009521484375, 27.75180435180664, 29.187597274780273, 30.62339210510254, 32.05918502807617, 33.49497985839844, 34.9307746887207, 36.36656951904297, 37.80236053466797, 39.238155364990234, 40.6739501953125, 42.1097412109375, 43.545536041259766, 44.98133087158203, 46.4171257019043, 47.85292053222656, 49.28871536254883]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 7.0, 10.0, 11.0, 10.0, 17.0, 19.0, 16.0, 30.0, 27.0, 29.0, 46.0, 34.0, 42.0, 37.0, 34.0, 46.0, 41.0, 53.0, 36.0, 46.0, 51.0, 40.0, 30.0, 49.0, 24.0, 36.0, 34.0, 15.0, 23.0, 17.0, 18.0, 7.0, 15.0, 8.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.37109375, -5.17547607421875, -4.9798583984375, -4.78424072265625, -4.588623046875, -4.39300537109375, -4.1973876953125, -4.00177001953125, -3.80615234375, -3.61053466796875, -3.4149169921875, -3.21929931640625, -3.023681640625, -2.82806396484375, -2.6324462890625, -2.43682861328125, -2.2412109375, -2.04559326171875, -1.8499755859375, -1.65435791015625, -1.458740234375, -1.26312255859375, -1.0675048828125, -0.87188720703125, -0.67626953125, -0.48065185546875, -0.2850341796875, -0.08941650390625, 0.106201171875, 0.30181884765625, 0.4974365234375, 0.69305419921875, 0.888671875, 1.08428955078125, 1.2799072265625, 1.47552490234375, 1.671142578125, 1.86676025390625, 2.0623779296875, 2.25799560546875, 2.45361328125, 2.64923095703125, 2.8448486328125, 3.04046630859375, 3.236083984375, 3.43170166015625, 3.6273193359375, 3.82293701171875, 4.0185546875, 4.21417236328125, 4.4097900390625, 4.60540771484375, 4.801025390625, 4.99664306640625, 5.1922607421875, 5.38787841796875, 5.58349609375, 5.77911376953125, 5.9747314453125, 6.17034912109375, 6.365966796875, 6.56158447265625, 6.7572021484375, 6.95281982421875, 7.1484375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 12.0, 12.0, 17.0, 20.0, 39.0, 50.0, 70.0, 119.0, 170.0, 260.0, 411.0, 635.0, 959.0, 1427.0, 2183.0, 3419.0, 5263.0, 8234.0, 13315.0, 21069.0, 34910.0, 58895.0, 103959.0, 234928.0, 286010.0, 111433.0, 62737.0, 36866.0, 22507.0, 13909.0, 8753.0, 5690.0, 3655.0, 2287.0, 1524.0, 1008.0, 634.0, 403.0, 284.0, 159.0, 105.0, 73.0, 41.0, 25.0, 17.0, 17.0, 10.0, 12.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.654296875, -1.602691650390625, -1.55108642578125, -1.499481201171875, -1.4478759765625, -1.396270751953125, -1.34466552734375, -1.293060302734375, -1.241455078125, -1.189849853515625, -1.13824462890625, -1.086639404296875, -1.0350341796875, -0.983428955078125, -0.93182373046875, -0.880218505859375, -0.82861328125, -0.777008056640625, -0.72540283203125, -0.673797607421875, -0.6221923828125, -0.570587158203125, -0.51898193359375, -0.467376708984375, -0.415771484375, -0.364166259765625, -0.31256103515625, -0.260955810546875, -0.2093505859375, -0.157745361328125, -0.10614013671875, -0.054534912109375, -0.0029296875, 0.048675537109375, 0.10028076171875, 0.151885986328125, 0.2034912109375, 0.255096435546875, 0.30670166015625, 0.358306884765625, 0.409912109375, 0.461517333984375, 0.51312255859375, 0.564727783203125, 0.6163330078125, 0.667938232421875, 0.71954345703125, 0.771148681640625, 0.82275390625, 0.874359130859375, 0.92596435546875, 0.977569580078125, 1.0291748046875, 1.080780029296875, 1.13238525390625, 1.183990478515625, 1.235595703125, 1.287200927734375, 1.33880615234375, 1.390411376953125, 1.4420166015625, 1.493621826171875, 1.54522705078125, 1.596832275390625, 1.6484375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 8.0, 8.0, 14.0, 13.0, 11.0, 11.0, 28.0, 24.0, 20.0, 32.0, 42.0, 28.0, 30.0, 33.0, 41.0, 49.0, 47.0, 40.0, 1066.0, 52.0, 37.0, 39.0, 35.0, 31.0, 36.0, 27.0, 23.0, 19.0, 27.0, 23.0, 19.0, 23.0, 14.0, 13.0, 12.0, 5.0, 7.0, 4.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-3.96875, -3.8499755859375, -3.731201171875, -3.6124267578125, -3.49365234375, -3.3748779296875, -3.256103515625, -3.1373291015625, -3.0185546875, -2.8997802734375, -2.781005859375, -2.6622314453125, -2.54345703125, -2.4246826171875, -2.305908203125, -2.1871337890625, -2.068359375, -1.9495849609375, -1.830810546875, -1.7120361328125, -1.59326171875, -1.4744873046875, -1.355712890625, -1.2369384765625, -1.1181640625, -0.9993896484375, -0.880615234375, -0.7618408203125, -0.64306640625, -0.5242919921875, -0.405517578125, -0.2867431640625, -0.16796875, -0.0491943359375, 0.069580078125, 0.1883544921875, 0.30712890625, 0.4259033203125, 0.544677734375, 0.6634521484375, 0.7822265625, 0.9010009765625, 1.019775390625, 1.1385498046875, 1.25732421875, 1.3760986328125, 1.494873046875, 1.6136474609375, 1.732421875, 1.8511962890625, 1.969970703125, 2.0887451171875, 2.20751953125, 2.3262939453125, 2.445068359375, 2.5638427734375, 2.6826171875, 2.8013916015625, 2.920166015625, 3.0389404296875, 3.15771484375, 3.2764892578125, 3.395263671875, 3.5140380859375, 3.6328125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 5.0, 12.0, 9.0, 24.0, 34.0, 43.0, 84.0, 104.0, 182.0, 209.0, 315.0, 442.0, 634.0, 915.0, 1304.0, 2031.0, 2926.0, 4183.0, 6146.0, 9200.0, 13791.0, 20987.0, 31964.0, 49790.0, 79090.0, 142313.0, 1368505.0, 139741.0, 77988.0, 49272.0, 31981.0, 20519.0, 13688.0, 9337.0, 6164.0, 4170.0, 2796.0, 1895.0, 1401.0, 923.0, 622.0, 451.0, 310.0, 208.0, 144.0, 84.0, 63.0, 50.0, 28.0, 20.0, 14.0, 11.0, 4.0, 6.0, 2.0, 1.0, 5.0], "bins": [-1.494140625, -1.44952392578125, -1.4049072265625, -1.36029052734375, -1.315673828125, -1.27105712890625, -1.2264404296875, -1.18182373046875, -1.13720703125, -1.09259033203125, -1.0479736328125, -1.00335693359375, -0.958740234375, -0.91412353515625, -0.8695068359375, -0.82489013671875, -0.7802734375, -0.73565673828125, -0.6910400390625, -0.64642333984375, -0.601806640625, -0.55718994140625, -0.5125732421875, -0.46795654296875, -0.42333984375, -0.37872314453125, -0.3341064453125, -0.28948974609375, -0.244873046875, -0.20025634765625, -0.1556396484375, -0.11102294921875, -0.06640625, -0.02178955078125, 0.0228271484375, 0.06744384765625, 0.112060546875, 0.15667724609375, 0.2012939453125, 0.24591064453125, 0.29052734375, 0.33514404296875, 0.3797607421875, 0.42437744140625, 0.468994140625, 0.51361083984375, 0.5582275390625, 0.60284423828125, 0.6474609375, 0.69207763671875, 0.7366943359375, 0.78131103515625, 0.825927734375, 0.87054443359375, 0.9151611328125, 0.95977783203125, 1.00439453125, 1.04901123046875, 1.0936279296875, 1.13824462890625, 1.182861328125, 1.22747802734375, 1.2720947265625, 1.31671142578125, 1.361328125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 9.0, 8.0, 16.0, 11.0, 12.0, 20.0, 21.0, 22.0, 45.0, 41.0, 56.0, 81.0, 100.0, 94.0, 93.0, 74.0, 59.0, 35.0, 30.0, 20.0, 18.0, 15.0, 16.0, 13.0, 19.0, 5.0, 8.0, 9.0, 13.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002944469451904297, -0.0002850145101547241, -0.00027558207511901855, -0.000266149640083313, -0.0002567172050476074, -0.00024728477001190186, -0.0002378523349761963, -0.00022841989994049072, -0.00021898746490478516, -0.0002095550298690796, -0.00020012259483337402, -0.00019069015979766846, -0.0001812577247619629, -0.00017182528972625732, -0.00016239285469055176, -0.0001529604196548462, -0.00014352798461914062, -0.00013409554958343506, -0.0001246631145477295, -0.00011523067951202393, -0.00010579824447631836, -9.636580944061279e-05, -8.693337440490723e-05, -7.750093936920166e-05, -6.80685043334961e-05, -5.863606929779053e-05, -4.920363426208496e-05, -3.9771199226379395e-05, -3.0338764190673828e-05, -2.0906329154968262e-05, -1.1473894119262695e-05, -2.041459083557129e-06, 7.3909759521484375e-06, 1.6823410987854004e-05, 2.625584602355957e-05, 3.568828105926514e-05, 4.51207160949707e-05, 5.455315113067627e-05, 6.398558616638184e-05, 7.34180212020874e-05, 8.285045623779297e-05, 9.228289127349854e-05, 0.0001017153263092041, 0.00011114776134490967, 0.00012058019638061523, 0.0001300126314163208, 0.00013944506645202637, 0.00014887750148773193, 0.0001583099365234375, 0.00016774237155914307, 0.00017717480659484863, 0.0001866072416305542, 0.00019603967666625977, 0.00020547211170196533, 0.0002149045467376709, 0.00022433698177337646, 0.00023376941680908203, 0.0002432018518447876, 0.00025263428688049316, 0.00026206672191619873, 0.0002714991569519043, 0.00028093159198760986, 0.00029036402702331543, 0.000299796462059021, 0.00030922889709472656]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 11.0, 12.0, 15.0, 20.0, 19.0, 21.0, 33.0, 37.0, 45.0, 62.0, 81.0, 163.0, 275.0, 490.0, 1676.0, 634819.0, 408039.0, 1448.0, 490.0, 252.0, 174.0, 105.0, 67.0, 50.0, 34.0, 20.0, 20.0, 18.0, 12.0, 7.0, 7.0, 5.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.006465911865234375, -0.006281018257141113, -0.0060961246490478516, -0.00591123104095459, -0.005726337432861328, -0.005541443824768066, -0.005356550216674805, -0.005171656608581543, -0.004986763000488281, -0.0048018693923950195, -0.004616975784301758, -0.004432082176208496, -0.004247188568115234, -0.004062294960021973, -0.003877401351928711, -0.0036925077438354492, -0.0035076141357421875, -0.0033227205276489258, -0.003137826919555664, -0.0029529333114624023, -0.0027680397033691406, -0.002583146095275879, -0.002398252487182617, -0.0022133588790893555, -0.0020284652709960938, -0.001843571662902832, -0.0016586780548095703, -0.0014737844467163086, -0.0012888908386230469, -0.0011039972305297852, -0.0009191036224365234, -0.0007342100143432617, -0.00054931640625, -0.0003644227981567383, -0.00017952919006347656, 5.364418029785156e-06, 0.00019025802612304688, 0.0003751516342163086, 0.0005600452423095703, 0.000744938850402832, 0.0009298324584960938, 0.0011147260665893555, 0.0012996196746826172, 0.001484513282775879, 0.0016694068908691406, 0.0018543004989624023, 0.002039194107055664, 0.0022240877151489258, 0.0024089813232421875, 0.0025938749313354492, 0.002778768539428711, 0.0029636621475219727, 0.0031485557556152344, 0.003333449363708496, 0.003518342971801758, 0.0037032365798950195, 0.0038881301879882812, 0.004073023796081543, 0.004257917404174805, 0.004442811012268066, 0.004627704620361328, 0.00481259822845459, 0.0049974918365478516, 0.005182385444641113, 0.005367279052734375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 80.0, 379.0, 413.0, 120.0, 14.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020806145039387047, -0.0001851484994404018, -0.0001622355484869331, -0.00013932261208537966, -0.00011640966113191098, -9.34967101784423e-05, -7.058377377688885e-05, -4.767082282342017e-05, -2.4757871869951487e-05, -1.8449245544616133e-06, 2.106802276102826e-05, 4.3980966438539326e-05, 6.6893917392008e-05, 8.980686834547669e-05, 0.00011271980474703014, 0.00013563275570049882, 0.0001585457066539675, 0.00018145865760743618, 0.00020437160856090486, 0.0002272845449624583, 0.00025019748136401176, 0.0002731104614213109, 0.0002960233832709491, 0.0003189363342244178, 0.0003418492851778865, 0.00036476223613135517, 0.00038767518708482385, 0.00041058810893446207, 0.0004335010889917612, 0.00045641401084139943, 0.0004793269617948681, 0.0005022399127483368, 0.0005251528928056359, 0.0005480658146552742, 0.0005709787947125733, 0.0005938917165622115, 0.0006168046966195107, 0.0006397176184691489, 0.0006626305403187871, 0.0006855435203760862, 0.0007084565004333854, 0.0007313694222830236, 0.0007542824023403227, 0.000777195324189961, 0.0008001083042472601, 0.0008230212260968983, 0.0008459341479465365, 0.0008688471280038357, 0.0008917600498534739, 0.0009146729717031121, 0.0009375859517604113, 0.0009604988736100495, 0.0009834117954596877, 0.0010063247755169868, 0.001029237755574286, 0.0010521507356315851, 0.0010750635992735624, 0.0010979765793308616, 0.0011208894429728389, 0.001143802423030138, 0.0011667154030874372, 0.0011896283831447363, 0.0012125412467867136, 0.0012354542268440127, 0.0012583672069013119]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 4.0, 1.0, 1.0, 4.0, 8.0, 11.0, 9.0, 12.0, 11.0, 17.0, 15.0, 26.0, 21.0, 20.0, 28.0, 28.0, 24.0, 36.0, 30.0, 36.0, 48.0, 31.0, 45.0, 39.0, 34.0, 37.0, 38.0, 32.0, 47.0, 32.0, 34.0, 35.0, 21.0, 23.0, 18.0, 18.0, 20.0, 20.0, 16.0, 5.0, 14.0, 12.0, 7.0, 12.0, 3.0, 2.0, 10.0, 2.0, 4.0, 2.0, 3.0, 1.0], "bins": [-0.00014102458953857422, -0.00013707950711250305, -0.00013313442468643188, -0.00012918934226036072, -0.00012524425983428955, -0.00012129917740821838, -0.00011735409498214722, -0.00011340901255607605, -0.00010946393013000488, -0.00010551884770393372, -0.00010157376527786255, -9.762868285179138e-05, -9.368360042572021e-05, -8.973851799964905e-05, -8.579343557357788e-05, -8.184835314750671e-05, -7.790327072143555e-05, -7.395818829536438e-05, -7.001310586929321e-05, -6.606802344322205e-05, -6.212294101715088e-05, -5.817785859107971e-05, -5.4232776165008545e-05, -5.028769373893738e-05, -4.634261131286621e-05, -4.2397528886795044e-05, -3.845244646072388e-05, -3.450736403465271e-05, -3.056228160858154e-05, -2.6617199182510376e-05, -2.267211675643921e-05, -1.8727034330368042e-05, -1.4781951904296875e-05, -1.0836869478225708e-05, -6.891787052154541e-06, -2.946704626083374e-06, 9.98377799987793e-07, 4.94346022605896e-06, 8.888542652130127e-06, 1.2833625078201294e-05, 1.677870750427246e-05, 2.0723789930343628e-05, 2.4668872356414795e-05, 2.8613954782485962e-05, 3.255903720855713e-05, 3.6504119634628296e-05, 4.044920206069946e-05, 4.439428448677063e-05, 4.83393669128418e-05, 5.2284449338912964e-05, 5.622953176498413e-05, 6.01746141910553e-05, 6.411969661712646e-05, 6.806477904319763e-05, 7.20098614692688e-05, 7.595494389533997e-05, 7.990002632141113e-05, 8.38451087474823e-05, 8.779019117355347e-05, 9.173527359962463e-05, 9.56803560256958e-05, 9.962543845176697e-05, 0.00010357052087783813, 0.0001075156033039093, 0.00011146068572998047]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 7.0, 10.0, 11.0, 10.0, 17.0, 19.0, 16.0, 30.0, 27.0, 29.0, 46.0, 34.0, 42.0, 37.0, 34.0, 46.0, 41.0, 53.0, 36.0, 46.0, 51.0, 40.0, 30.0, 49.0, 24.0, 36.0, 34.0, 15.0, 23.0, 17.0, 18.0, 7.0, 15.0, 8.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.37109375, -5.17547607421875, -4.9798583984375, -4.78424072265625, -4.588623046875, -4.39300537109375, -4.1973876953125, -4.00177001953125, -3.80615234375, -3.61053466796875, -3.4149169921875, -3.21929931640625, -3.023681640625, -2.82806396484375, -2.6324462890625, -2.43682861328125, -2.2412109375, -2.04559326171875, -1.8499755859375, -1.65435791015625, -1.458740234375, -1.26312255859375, -1.0675048828125, -0.87188720703125, -0.67626953125, -0.48065185546875, -0.2850341796875, -0.08941650390625, 0.106201171875, 0.30181884765625, 0.4974365234375, 0.69305419921875, 0.888671875, 1.08428955078125, 1.2799072265625, 1.47552490234375, 1.671142578125, 1.86676025390625, 2.0623779296875, 2.25799560546875, 2.45361328125, 2.64923095703125, 2.8448486328125, 3.04046630859375, 3.236083984375, 3.43170166015625, 3.6273193359375, 3.82293701171875, 4.0185546875, 4.21417236328125, 4.4097900390625, 4.60540771484375, 4.801025390625, 4.99664306640625, 5.1922607421875, 5.38787841796875, 5.58349609375, 5.77911376953125, 5.9747314453125, 6.17034912109375, 6.365966796875, 6.56158447265625, 6.7572021484375, 6.95281982421875, 7.1484375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 6.0, 9.0, 18.0, 27.0, 32.0, 57.0, 76.0, 121.0, 171.0, 292.0, 453.0, 812.0, 1564.0, 3022.0, 5948.0, 11963.0, 24270.0, 48092.0, 96422.0, 187214.0, 273885.0, 192431.0, 100109.0, 50721.0, 25394.0, 12533.0, 6141.0, 3019.0, 1566.0, 864.0, 481.0, 307.0, 161.0, 113.0, 99.0, 55.0, 43.0, 23.0, 17.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9296875, -4.77813720703125, -4.6265869140625, -4.47503662109375, -4.323486328125, -4.17193603515625, -4.0203857421875, -3.86883544921875, -3.71728515625, -3.56573486328125, -3.4141845703125, -3.26263427734375, -3.111083984375, -2.95953369140625, -2.8079833984375, -2.65643310546875, -2.5048828125, -2.35333251953125, -2.2017822265625, -2.05023193359375, -1.898681640625, -1.74713134765625, -1.5955810546875, -1.44403076171875, -1.29248046875, -1.14093017578125, -0.9893798828125, -0.83782958984375, -0.686279296875, -0.53472900390625, -0.3831787109375, -0.23162841796875, -0.080078125, 0.07147216796875, 0.2230224609375, 0.37457275390625, 0.526123046875, 0.67767333984375, 0.8292236328125, 0.98077392578125, 1.13232421875, 1.28387451171875, 1.4354248046875, 1.58697509765625, 1.738525390625, 1.89007568359375, 2.0416259765625, 2.19317626953125, 2.3447265625, 2.49627685546875, 2.6478271484375, 2.79937744140625, 2.950927734375, 3.10247802734375, 3.2540283203125, 3.40557861328125, 3.55712890625, 3.70867919921875, 3.8602294921875, 4.01177978515625, 4.163330078125, 4.31488037109375, 4.4664306640625, 4.61798095703125, 4.76953125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 7.0, 14.0, 11.0, 18.0, 13.0, 27.0, 17.0, 28.0, 39.0, 45.0, 45.0, 51.0, 59.0, 76.0, 115.0, 282.0, 1443.0, 241.0, 99.0, 53.0, 56.0, 49.0, 36.0, 41.0, 28.0, 25.0, 10.0, 27.0, 16.0, 14.0, 9.0, 9.0, 8.0, 4.0, 6.0, 8.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-26.96875, -26.22802734375, -25.4873046875, -24.74658203125, -24.005859375, -23.26513671875, -22.5244140625, -21.78369140625, -21.04296875, -20.30224609375, -19.5615234375, -18.82080078125, -18.080078125, -17.33935546875, -16.5986328125, -15.85791015625, -15.1171875, -14.37646484375, -13.6357421875, -12.89501953125, -12.154296875, -11.41357421875, -10.6728515625, -9.93212890625, -9.19140625, -8.45068359375, -7.7099609375, -6.96923828125, -6.228515625, -5.48779296875, -4.7470703125, -4.00634765625, -3.265625, -2.52490234375, -1.7841796875, -1.04345703125, -0.302734375, 0.43798828125, 1.1787109375, 1.91943359375, 2.66015625, 3.40087890625, 4.1416015625, 4.88232421875, 5.623046875, 6.36376953125, 7.1044921875, 7.84521484375, 8.5859375, 9.32666015625, 10.0673828125, 10.80810546875, 11.548828125, 12.28955078125, 13.0302734375, 13.77099609375, 14.51171875, 15.25244140625, 15.9931640625, 16.73388671875, 17.474609375, 18.21533203125, 18.9560546875, 19.69677734375, 20.4375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 11.0, 13.0, 25.0, 24.0, 48.0, 50.0, 87.0, 118.0, 193.0, 348.0, 848.0, 16205.0, 3120571.0, 5613.0, 693.0, 308.0, 183.0, 111.0, 82.0, 60.0, 39.0, 26.0, 13.0, 11.0, 4.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.0, -76.1171875, -73.234375, -70.3515625, -67.46875, -64.5859375, -61.703125, -58.8203125, -55.9375, -53.0546875, -50.171875, -47.2890625, -44.40625, -41.5234375, -38.640625, -35.7578125, -32.875, -29.9921875, -27.109375, -24.2265625, -21.34375, -18.4609375, -15.578125, -12.6953125, -9.8125, -6.9296875, -4.046875, -1.1640625, 1.71875, 4.6015625, 7.484375, 10.3671875, 13.25, 16.1328125, 19.015625, 21.8984375, 24.78125, 27.6640625, 30.546875, 33.4296875, 36.3125, 39.1953125, 42.078125, 44.9609375, 47.84375, 50.7265625, 53.609375, 56.4921875, 59.375, 62.2578125, 65.140625, 68.0234375, 70.90625, 73.7890625, 76.671875, 79.5546875, 82.4375, 85.3203125, 88.203125, 91.0859375, 93.96875, 96.8515625, 99.734375, 102.6171875, 105.5]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 26.0, 181.0, 453.0, 296.0, 52.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-186.2519989013672, -182.5824432373047, -178.91290283203125, -175.24334716796875, -171.5738067626953, -167.9042510986328, -164.23471069335938, -160.56515502929688, -156.89559936523438, -153.22604370117188, -149.55650329589844, -145.88694763183594, -142.2174072265625, -138.5478515625, -134.87831115722656, -131.20875549316406, -127.53921508789062, -123.86966705322266, -120.20011901855469, -116.53057098388672, -112.86102294921875, -109.19146728515625, -105.52191925048828, -101.85237121582031, -98.18282318115234, -94.51327514648438, -90.8437271118164, -87.17417907714844, -83.50462341308594, -79.8350830078125, -76.16552734375, -72.49597930908203, -68.8264389038086, -65.15689086914062, -61.487342834472656, -57.81779098510742, -54.14824295043945, -50.478694915771484, -46.80914306640625, -43.13959503173828, -39.47004699707031, -35.800498962402344, -32.130950927734375, -28.46139907836914, -24.791851043701172, -21.122303009033203, -17.4527530670166, -13.783203125, -10.113655090332031, -6.444106101989746, -2.774557113647461, 0.8949918746948242, 4.564540863037109, 8.234088897705078, 11.90363883972168, 15.573188781738281, 19.24273681640625, 22.91228485107422, 26.58183479309082, 30.251384735107422, 33.92093276977539, 37.59048080444336, 41.260032653808594, 44.92958068847656, 48.59912872314453]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 6.0, 9.0, 8.0, 12.0, 16.0, 16.0, 20.0, 16.0, 20.0, 31.0, 19.0, 30.0, 24.0, 32.0, 27.0, 26.0, 32.0, 47.0, 39.0, 35.0, 30.0, 50.0, 33.0, 33.0, 42.0, 35.0, 36.0, 29.0, 40.0, 24.0, 20.0, 19.0, 19.0, 22.0, 14.0, 17.0, 16.0, 8.0, 5.0, 9.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-41.673072814941406, -40.20881271362305, -38.74455261230469, -37.28029251098633, -35.81603240966797, -34.351776123046875, -32.88751220703125, -31.423255920410156, -29.958995819091797, -28.494735717773438, -27.030475616455078, -25.56621551513672, -24.101957321166992, -22.637697219848633, -21.173437118530273, -19.709178924560547, -18.244916915893555, -16.780656814575195, -15.316397666931152, -13.852137565612793, -12.38787841796875, -10.92361831665039, -9.459358215332031, -7.995099067687988, -6.530838966369629, -5.066579341888428, -3.6023194789886475, -2.138059616088867, -0.673799991607666, 0.7904596328735352, 2.2547197341918945, 3.7189788818359375, 5.183238983154297, 6.647498607635498, 8.1117582321167, 9.576018333435059, 11.040277481079102, 12.504537582397461, 13.96879768371582, 15.433056831359863, 16.897315979003906, 18.361576080322266, 19.825836181640625, 21.290096282958984, 22.75435447692871, 24.21861457824707, 25.68287467956543, 27.147132873535156, 28.61139488220215, 30.075654983520508, 31.539915084838867, 33.004173278808594, 34.46843338012695, 35.93269348144531, 37.39695358276367, 38.86121368408203, 40.32547378540039, 41.78973388671875, 43.25399398803711, 44.71825408935547, 46.18251419067383, 47.64677429199219, 49.11103057861328, 50.57529067993164, 52.03955078125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 12.0, 9.0, 12.0, 12.0, 13.0, 12.0, 21.0, 18.0, 27.0, 27.0, 29.0, 35.0, 41.0, 45.0, 35.0, 41.0, 48.0, 46.0, 36.0, 36.0, 36.0, 47.0, 44.0, 42.0, 29.0, 36.0, 28.0, 22.0, 26.0, 27.0, 14.0, 15.0, 11.0, 9.0, 12.0, 11.0, 10.0, 3.0, 7.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.234375, -5.02911376953125, -4.8238525390625, -4.61859130859375, -4.413330078125, -4.20806884765625, -4.0028076171875, -3.79754638671875, -3.59228515625, -3.38702392578125, -3.1817626953125, -2.97650146484375, -2.771240234375, -2.56597900390625, -2.3607177734375, -2.15545654296875, -1.9501953125, -1.74493408203125, -1.5396728515625, -1.33441162109375, -1.129150390625, -0.92388916015625, -0.7186279296875, -0.51336669921875, -0.30810546875, -0.10284423828125, 0.1024169921875, 0.30767822265625, 0.512939453125, 0.71820068359375, 0.9234619140625, 1.12872314453125, 1.333984375, 1.53924560546875, 1.7445068359375, 1.94976806640625, 2.155029296875, 2.36029052734375, 2.5655517578125, 2.77081298828125, 2.97607421875, 3.18133544921875, 3.3865966796875, 3.59185791015625, 3.797119140625, 4.00238037109375, 4.2076416015625, 4.41290283203125, 4.6181640625, 4.82342529296875, 5.0286865234375, 5.23394775390625, 5.439208984375, 5.64447021484375, 5.8497314453125, 6.05499267578125, 6.26025390625, 6.46551513671875, 6.6707763671875, 6.87603759765625, 7.081298828125, 7.28656005859375, 7.4918212890625, 7.69708251953125, 7.90234375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 3.0, 6.0, 4.0, 9.0, 11.0, 9.0, 11.0, 11.0, 19.0, 16.0, 20.0, 25.0, 29.0, 42.0, 62.0, 74.0, 132.0, 211.0, 457.0, 1852.0, 31113.0, 1593559.0, 2497739.0, 65041.0, 2586.0, 522.0, 214.0, 129.0, 86.0, 64.0, 45.0, 25.0, 30.0, 25.0, 16.0, 17.0, 16.0, 6.0, 11.0, 7.0, 10.0, 4.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.15625, -17.432861328125, -16.70947265625, -15.986083984375, -15.2626953125, -14.539306640625, -13.81591796875, -13.092529296875, -12.369140625, -11.645751953125, -10.92236328125, -10.198974609375, -9.4755859375, -8.752197265625, -8.02880859375, -7.305419921875, -6.58203125, -5.858642578125, -5.13525390625, -4.411865234375, -3.6884765625, -2.965087890625, -2.24169921875, -1.518310546875, -0.794921875, -0.071533203125, 0.65185546875, 1.375244140625, 2.0986328125, 2.822021484375, 3.54541015625, 4.268798828125, 4.9921875, 5.715576171875, 6.43896484375, 7.162353515625, 7.8857421875, 8.609130859375, 9.33251953125, 10.055908203125, 10.779296875, 11.502685546875, 12.22607421875, 12.949462890625, 13.6728515625, 14.396240234375, 15.11962890625, 15.843017578125, 16.56640625, 17.289794921875, 18.01318359375, 18.736572265625, 19.4599609375, 20.183349609375, 20.90673828125, 21.630126953125, 22.353515625, 23.076904296875, 23.80029296875, 24.523681640625, 25.2470703125, 25.970458984375, 26.69384765625, 27.417236328125, 28.140625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 13.0, 8.0, 11.0, 17.0, 29.0, 28.0, 64.0, 74.0, 93.0, 116.0, 177.0, 214.0, 268.0, 349.0, 396.0, 450.0, 379.0, 350.0, 264.0, 201.0, 153.0, 101.0, 70.0, 49.0, 49.0, 30.0, 26.0, 17.0, 19.0, 19.0, 6.0, 3.0, 4.0, 5.0, 4.0, 1.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8828125, -11.47802734375, -11.0732421875, -10.66845703125, -10.263671875, -9.85888671875, -9.4541015625, -9.04931640625, -8.64453125, -8.23974609375, -7.8349609375, -7.43017578125, -7.025390625, -6.62060546875, -6.2158203125, -5.81103515625, -5.40625, -5.00146484375, -4.5966796875, -4.19189453125, -3.787109375, -3.38232421875, -2.9775390625, -2.57275390625, -2.16796875, -1.76318359375, -1.3583984375, -0.95361328125, -0.548828125, -0.14404296875, 0.2607421875, 0.66552734375, 1.0703125, 1.47509765625, 1.8798828125, 2.28466796875, 2.689453125, 3.09423828125, 3.4990234375, 3.90380859375, 4.30859375, 4.71337890625, 5.1181640625, 5.52294921875, 5.927734375, 6.33251953125, 6.7373046875, 7.14208984375, 7.546875, 7.95166015625, 8.3564453125, 8.76123046875, 9.166015625, 9.57080078125, 9.9755859375, 10.38037109375, 10.78515625, 11.18994140625, 11.5947265625, 11.99951171875, 12.404296875, 12.80908203125, 13.2138671875, 13.61865234375, 14.0234375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 10.0, 12.0, 18.0, 22.0, 19.0, 26.0, 43.0, 60.0, 75.0, 105.0, 140.0, 226.0, 409.0, 1203.0, 21308.0, 3695242.0, 470263.0, 3517.0, 627.0, 273.0, 216.0, 143.0, 82.0, 75.0, 46.0, 41.0, 21.0, 17.0, 14.0, 9.0, 11.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.128173828125, -28.52197265625, -26.915771484375, -25.3095703125, -23.703369140625, -22.09716796875, -20.490966796875, -18.884765625, -17.278564453125, -15.67236328125, -14.066162109375, -12.4599609375, -10.853759765625, -9.24755859375, -7.641357421875, -6.03515625, -4.428955078125, -2.82275390625, -1.216552734375, 0.3896484375, 1.995849609375, 3.60205078125, 5.208251953125, 6.814453125, 8.420654296875, 10.02685546875, 11.633056640625, 13.2392578125, 14.845458984375, 16.45166015625, 18.057861328125, 19.6640625, 21.270263671875, 22.87646484375, 24.482666015625, 26.0888671875, 27.695068359375, 29.30126953125, 30.907470703125, 32.513671875, 34.119873046875, 35.72607421875, 37.332275390625, 38.9384765625, 40.544677734375, 42.15087890625, 43.757080078125, 45.36328125, 46.969482421875, 48.57568359375, 50.181884765625, 51.7880859375, 53.394287109375, 55.00048828125, 56.606689453125, 58.212890625, 59.819091796875, 61.42529296875, 63.031494140625, 64.6376953125, 66.243896484375, 67.85009765625, 69.456298828125, 71.0625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 20.0, 48.0, 94.0, 151.0, 205.0, 182.0, 170.0, 79.0, 40.0, 11.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.94778442382812, -84.80497741699219, -81.66217803955078, -78.51937103271484, -75.3765640258789, -72.2337646484375, -69.09095764160156, -65.94815063476562, -62.80534744262695, -59.66254425048828, -56.519737243652344, -53.37693405151367, -50.234130859375, -47.09132385253906, -43.94852066040039, -40.80571746826172, -37.66291046142578, -34.52010726928711, -31.377300262451172, -28.2344970703125, -25.091691970825195, -21.94888687133789, -18.80608367919922, -15.663278579711914, -12.52047348022461, -9.377668380737305, -6.234864234924316, -3.092060089111328, 0.05074501037597656, 3.1935501098632812, 6.336353302001953, 9.479158401489258, 12.621955871582031, 15.764760971069336, 18.90756607055664, 22.050369262695312, 25.193174362182617, 28.335979461669922, 31.478782653808594, 34.62158966064453, 37.7643928527832, 40.907196044921875, 44.05000305175781, 47.192806243896484, 50.335609436035156, 53.478416442871094, 56.621219635009766, 59.76402282714844, 62.906829833984375, 66.04963684082031, 69.19243621826172, 72.33524322509766, 75.4780502319336, 78.620849609375, 81.76365661621094, 84.90646362304688, 88.04927062988281, 91.19207763671875, 94.33487701416016, 97.4776840209961, 100.62049102783203, 103.76329040527344, 106.90609741210938, 110.04890441894531, 113.19170379638672]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 12.0, 8.0, 12.0, 12.0, 19.0, 20.0, 15.0, 29.0, 25.0, 22.0, 30.0, 32.0, 28.0, 41.0, 31.0, 35.0, 59.0, 37.0, 37.0, 44.0, 37.0, 38.0, 47.0, 25.0, 35.0, 31.0, 26.0, 27.0, 24.0, 21.0, 26.0, 20.0, 17.0, 14.0, 11.0, 7.0, 11.0, 5.0, 6.0, 8.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.784873962402344, -39.405967712402344, -38.027061462402344, -36.648155212402344, -35.26924514770508, -33.89033889770508, -32.51143264770508, -31.132526397705078, -29.753618240356445, -28.374711990356445, -26.995803833007812, -25.616897583007812, -24.237991333007812, -22.85908317565918, -21.48017692565918, -20.101268768310547, -18.722362518310547, -17.343456268310547, -15.964548110961914, -14.585641860961914, -13.206734657287598, -11.827827453613281, -10.448921203613281, -9.070013999938965, -7.691106796264648, -6.312199592590332, -4.933292865753174, -3.5543861389160156, -2.175478935241699, -0.7965717315673828, 0.5823345184326172, 1.9612417221069336, 3.34014892578125, 4.719056129455566, 6.097962856292725, 7.476869583129883, 8.8557767868042, 10.234683990478516, 11.613590240478516, 12.992497444152832, 14.371404647827148, 15.750311851501465, 17.12921905517578, 18.50812530517578, 19.88703155517578, 21.265939712524414, 22.644845962524414, 24.023754119873047, 25.402660369873047, 26.781566619873047, 28.16047477722168, 29.53938102722168, 30.918289184570312, 32.29719543457031, 33.67610168457031, 35.05500793457031, 36.43391418457031, 37.81282043457031, 39.19172668457031, 40.57063293457031, 41.94954299926758, 43.32844924926758, 44.70735549926758, 46.08626174926758, 47.465171813964844]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 8.0, 14.0, 16.0, 10.0, 13.0, 21.0, 31.0, 32.0, 28.0, 32.0, 47.0, 44.0, 46.0, 47.0, 37.0, 38.0, 52.0, 39.0, 50.0, 39.0, 41.0, 40.0, 43.0, 31.0, 31.0, 35.0, 28.0, 25.0, 19.0, 16.0, 7.0, 7.0, 6.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.640625, -5.420654296875, -5.20068359375, -4.980712890625, -4.7607421875, -4.540771484375, -4.32080078125, -4.100830078125, -3.880859375, -3.660888671875, -3.44091796875, -3.220947265625, -3.0009765625, -2.781005859375, -2.56103515625, -2.341064453125, -2.12109375, -1.901123046875, -1.68115234375, -1.461181640625, -1.2412109375, -1.021240234375, -0.80126953125, -0.581298828125, -0.361328125, -0.141357421875, 0.07861328125, 0.298583984375, 0.5185546875, 0.738525390625, 0.95849609375, 1.178466796875, 1.3984375, 1.618408203125, 1.83837890625, 2.058349609375, 2.2783203125, 2.498291015625, 2.71826171875, 2.938232421875, 3.158203125, 3.378173828125, 3.59814453125, 3.818115234375, 4.0380859375, 4.258056640625, 4.47802734375, 4.697998046875, 4.91796875, 5.137939453125, 5.35791015625, 5.577880859375, 5.7978515625, 6.017822265625, 6.23779296875, 6.457763671875, 6.677734375, 6.897705078125, 7.11767578125, 7.337646484375, 7.5576171875, 7.777587890625, 7.99755859375, 8.217529296875, 8.4375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 0.0, 4.0, 9.0, 11.0, 16.0, 29.0, 39.0, 70.0, 106.0, 150.0, 255.0, 428.0, 693.0, 1119.0, 1922.0, 3367.0, 5754.0, 9861.0, 17458.0, 31435.0, 58223.0, 115589.0, 324772.0, 253414.0, 103910.0, 52941.0, 28669.0, 16248.0, 9008.0, 5268.0, 3072.0, 1781.0, 1113.0, 682.0, 414.0, 245.0, 167.0, 108.0, 67.0, 49.0, 32.0, 17.0, 18.0, 7.0, 5.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.20703125, -2.137908935546875, -2.06878662109375, -1.999664306640625, -1.9305419921875, -1.861419677734375, -1.79229736328125, -1.723175048828125, -1.654052734375, -1.584930419921875, -1.51580810546875, -1.446685791015625, -1.3775634765625, -1.308441162109375, -1.23931884765625, -1.170196533203125, -1.10107421875, -1.031951904296875, -0.96282958984375, -0.893707275390625, -0.8245849609375, -0.755462646484375, -0.68634033203125, -0.617218017578125, -0.548095703125, -0.478973388671875, -0.40985107421875, -0.340728759765625, -0.2716064453125, -0.202484130859375, -0.13336181640625, -0.064239501953125, 0.0048828125, 0.074005126953125, 0.14312744140625, 0.212249755859375, 0.2813720703125, 0.350494384765625, 0.41961669921875, 0.488739013671875, 0.557861328125, 0.626983642578125, 0.69610595703125, 0.765228271484375, 0.8343505859375, 0.903472900390625, 0.97259521484375, 1.041717529296875, 1.11083984375, 1.179962158203125, 1.24908447265625, 1.318206787109375, 1.3873291015625, 1.456451416015625, 1.52557373046875, 1.594696044921875, 1.663818359375, 1.732940673828125, 1.80206298828125, 1.871185302734375, 1.9403076171875, 2.009429931640625, 2.07855224609375, 2.147674560546875, 2.216796875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 2.0, 10.0, 3.0, 10.0, 10.0, 16.0, 11.0, 10.0, 13.0, 26.0, 21.0, 29.0, 22.0, 31.0, 36.0, 43.0, 45.0, 31.0, 45.0, 52.0, 1061.0, 43.0, 46.0, 42.0, 37.0, 28.0, 34.0, 32.0, 36.0, 29.0, 16.0, 27.0, 25.0, 15.0, 21.0, 5.0, 11.0, 11.0, 6.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.748046875, -3.625885009765625, -3.50372314453125, -3.381561279296875, -3.2593994140625, -3.137237548828125, -3.01507568359375, -2.892913818359375, -2.770751953125, -2.648590087890625, -2.52642822265625, -2.404266357421875, -2.2821044921875, -2.159942626953125, -2.03778076171875, -1.915618896484375, -1.79345703125, -1.671295166015625, -1.54913330078125, -1.426971435546875, -1.3048095703125, -1.182647705078125, -1.06048583984375, -0.938323974609375, -0.816162109375, -0.694000244140625, -0.57183837890625, -0.449676513671875, -0.3275146484375, -0.205352783203125, -0.08319091796875, 0.038970947265625, 0.1611328125, 0.283294677734375, 0.40545654296875, 0.527618408203125, 0.6497802734375, 0.771942138671875, 0.89410400390625, 1.016265869140625, 1.138427734375, 1.260589599609375, 1.38275146484375, 1.504913330078125, 1.6270751953125, 1.749237060546875, 1.87139892578125, 1.993560791015625, 2.11572265625, 2.237884521484375, 2.36004638671875, 2.482208251953125, 2.6043701171875, 2.726531982421875, 2.84869384765625, 2.970855712890625, 3.093017578125, 3.215179443359375, 3.33734130859375, 3.459503173828125, 3.5816650390625, 3.703826904296875, 3.82598876953125, 3.948150634765625, 4.0703125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 7.0, 2.0, 9.0, 23.0, 17.0, 27.0, 52.0, 67.0, 102.0, 136.0, 227.0, 315.0, 434.0, 659.0, 926.0, 1356.0, 1894.0, 2679.0, 3978.0, 5845.0, 8358.0, 12639.0, 19207.0, 28863.0, 45508.0, 72329.0, 125248.0, 1363377.0, 162598.0, 85902.0, 53132.0, 34152.0, 21796.0, 14425.0, 9698.0, 6480.0, 4485.0, 3090.0, 2156.0, 1474.0, 1035.0, 744.0, 546.0, 373.0, 241.0, 175.0, 124.0, 83.0, 51.0, 37.0, 24.0, 15.0, 10.0, 3.0, 8.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.408203125, -1.3622894287109375, -1.316375732421875, -1.2704620361328125, -1.22454833984375, -1.1786346435546875, -1.132720947265625, -1.0868072509765625, -1.0408935546875, -0.9949798583984375, -0.949066162109375, -0.9031524658203125, -0.85723876953125, -0.8113250732421875, -0.765411376953125, -0.7194976806640625, -0.673583984375, -0.6276702880859375, -0.581756591796875, -0.5358428955078125, -0.48992919921875, -0.4440155029296875, -0.398101806640625, -0.3521881103515625, -0.3062744140625, -0.2603607177734375, -0.214447021484375, -0.1685333251953125, -0.12261962890625, -0.0767059326171875, -0.030792236328125, 0.0151214599609375, 0.06103515625, 0.1069488525390625, 0.152862548828125, 0.1987762451171875, 0.24468994140625, 0.2906036376953125, 0.336517333984375, 0.3824310302734375, 0.4283447265625, 0.4742584228515625, 0.520172119140625, 0.5660858154296875, 0.61199951171875, 0.6579132080078125, 0.703826904296875, 0.7497406005859375, 0.795654296875, 0.8415679931640625, 0.887481689453125, 0.9333953857421875, 0.97930908203125, 1.0252227783203125, 1.071136474609375, 1.1170501708984375, 1.1629638671875, 1.2088775634765625, 1.254791259765625, 1.3007049560546875, 1.34661865234375, 1.3925323486328125, 1.438446044921875, 1.4843597412109375, 1.5302734375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 7.0, 9.0, 12.0, 10.0, 9.0, 15.0, 21.0, 24.0, 21.0, 43.0, 50.0, 77.0, 78.0, 106.0, 90.0, 94.0, 55.0, 48.0, 34.0, 35.0, 27.0, 22.0, 15.0, 10.0, 13.0, 8.0, 12.0, 11.0, 6.0, 6.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00024127960205078125, -0.00023292377591133118, -0.0002245679497718811, -0.00021621212363243103, -0.00020785629749298096, -0.00019950047135353088, -0.0001911446452140808, -0.00018278881907463074, -0.00017443299293518066, -0.0001660771667957306, -0.00015772134065628052, -0.00014936551451683044, -0.00014100968837738037, -0.0001326538622379303, -0.00012429803609848022, -0.00011594220995903015, -0.00010758638381958008, -9.923055768013e-05, -9.087473154067993e-05, -8.251890540122986e-05, -7.416307926177979e-05, -6.580725312232971e-05, -5.745142698287964e-05, -4.9095600843429565e-05, -4.073977470397949e-05, -3.238394856452942e-05, -2.4028122425079346e-05, -1.5672296285629272e-05, -7.316470146179199e-06, 1.039355993270874e-06, 9.395182132720947e-06, 1.775100827217102e-05, 2.6106834411621094e-05, 3.446266055107117e-05, 4.281848669052124e-05, 5.1174312829971313e-05, 5.953013896942139e-05, 6.788596510887146e-05, 7.624179124832153e-05, 8.45976173877716e-05, 9.295344352722168e-05, 0.00010130926966667175, 0.00010966509580612183, 0.0001180209219455719, 0.00012637674808502197, 0.00013473257422447205, 0.00014308840036392212, 0.0001514442265033722, 0.00015980005264282227, 0.00016815587878227234, 0.0001765117049217224, 0.00018486753106117249, 0.00019322335720062256, 0.00020157918334007263, 0.0002099350094795227, 0.00021829083561897278, 0.00022664666175842285, 0.00023500248789787292, 0.000243358314037323, 0.00025171414017677307, 0.00026006996631622314, 0.0002684257924556732, 0.0002767816185951233, 0.00028513744473457336, 0.00029349327087402344]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 10.0, 12.0, 21.0, 16.0, 21.0, 28.0, 38.0, 71.0, 96.0, 174.0, 367.0, 1013.0, 171868.0, 872390.0, 1399.0, 469.0, 223.0, 93.0, 65.0, 40.0, 25.0, 21.0, 21.0, 17.0, 15.0, 6.0, 4.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.007110595703125, -0.006908059120178223, -0.006705522537231445, -0.006502985954284668, -0.006300449371337891, -0.006097912788391113, -0.005895376205444336, -0.005692839622497559, -0.005490303039550781, -0.005287766456604004, -0.0050852298736572266, -0.004882693290710449, -0.004680156707763672, -0.0044776201248168945, -0.004275083541870117, -0.00407254695892334, -0.0038700103759765625, -0.003667473793029785, -0.003464937210083008, -0.0032624006271362305, -0.003059864044189453, -0.0028573274612426758, -0.0026547908782958984, -0.002452254295349121, -0.0022497177124023438, -0.0020471811294555664, -0.001844644546508789, -0.0016421079635620117, -0.0014395713806152344, -0.001237034797668457, -0.0010344982147216797, -0.0008319616317749023, -0.000629425048828125, -0.00042688846588134766, -0.0002243518829345703, -2.181529998779297e-05, 0.00018072128295898438, 0.0003832578659057617, 0.0005857944488525391, 0.0007883310317993164, 0.0009908676147460938, 0.001193404197692871, 0.0013959407806396484, 0.0015984773635864258, 0.0018010139465332031, 0.0020035505294799805, 0.002206087112426758, 0.002408623695373535, 0.0026111602783203125, 0.00281369686126709, 0.003016233444213867, 0.0032187700271606445, 0.003421306610107422, 0.0036238431930541992, 0.0038263797760009766, 0.004028916358947754, 0.004231452941894531, 0.004433989524841309, 0.004636526107788086, 0.004839062690734863, 0.005041599273681641, 0.005244135856628418, 0.005446672439575195, 0.005649209022521973, 0.00585174560546875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 155.0, 514.0, 307.0, 32.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001896093599498272, -0.00016496184980496764, -0.0001403143396601081, -0.00011566683679120615, -9.10193266463466e-05, -6.637182377744466e-05, -4.172431363258511e-05, -1.7076803487725556e-05, 7.5707066571339965e-06, 3.221821680199355e-05, 5.6865723308874294e-05, 8.151322981575504e-05, 0.00010616073996061459, 0.00013080824282951653, 0.00015545575297437608, 0.00018010326311923563, 0.0002047507732640952, 0.00022939828340895474, 0.0002540457935538143, 0.00027869330369867384, 0.0003033408138435334, 0.0003279882948845625, 0.00035263580502942204, 0.0003772833151742816, 0.00040193082531914115, 0.0004265783354640007, 0.00045122584560886025, 0.0004758733557537198, 0.0005005208658985794, 0.0005251683760434389, 0.0005498158861882985, 0.000574463396333158, 0.0005991109064780176, 0.0006237584166228771, 0.0006484059267677367, 0.0006730534369125962, 0.0006977009470574558, 0.0007223484572023153, 0.0007469959673471749, 0.0007716434774920344, 0.000796290987636894, 0.0008209384977817535, 0.0008455860079266131, 0.0008702335180714726, 0.0008948810282163322, 0.0009195285383611917, 0.0009441760485060513, 0.0009688235586509109, 0.0009934710105881095, 0.0010181184625253081, 0.0010427660308778286, 0.0010674134828150272, 0.0010920610511675477, 0.0011167085031047463, 0.0011413560714572668, 0.0011660035233944654, 0.001190651091746986, 0.0012152985436841846, 0.001239946112036705, 0.0012645935639739037, 0.0012892411323264241, 0.0013138885842636228, 0.0013385361526161432, 0.0013631836045533419, 0.0013878311729058623]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 14.0, 23.0, 14.0, 24.0, 21.0, 24.0, 25.0, 27.0, 27.0, 35.0, 31.0, 25.0, 37.0, 43.0, 45.0, 49.0, 34.0, 37.0, 34.0, 37.0, 27.0, 34.0, 34.0, 32.0, 36.0, 20.0, 20.0, 16.0, 24.0, 23.0, 24.0, 16.0, 10.0, 12.0, 12.0, 5.0, 4.0, 6.0, 2.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.00013256072998046875, -0.00012884102761745453, -0.0001251213252544403, -0.00012140162289142609, -0.00011768192052841187, -0.00011396221816539764, -0.00011024251580238342, -0.0001065228134393692, -0.00010280311107635498, -9.908340871334076e-05, -9.536370635032654e-05, -9.164400398731232e-05, -8.79243016242981e-05, -8.420459926128387e-05, -8.048489689826965e-05, -7.676519453525543e-05, -7.304549217224121e-05, -6.932578980922699e-05, -6.560608744621277e-05, -6.188638508319855e-05, -5.8166682720184326e-05, -5.4446980357170105e-05, -5.0727277994155884e-05, -4.700757563114166e-05, -4.328787326812744e-05, -3.956817090511322e-05, -3.5848468542099e-05, -3.212876617908478e-05, -2.8409063816070557e-05, -2.4689361453056335e-05, -2.0969659090042114e-05, -1.7249956727027893e-05, -1.3530254364013672e-05, -9.81055200099945e-06, -6.0908496379852295e-06, -2.3711472749710083e-06, 1.3485550880432129e-06, 5.068257451057434e-06, 8.787959814071655e-06, 1.2507662177085876e-05, 1.6227364540100098e-05, 1.994706690311432e-05, 2.366676926612854e-05, 2.738647162914276e-05, 3.110617399215698e-05, 3.4825876355171204e-05, 3.8545578718185425e-05, 4.2265281081199646e-05, 4.598498344421387e-05, 4.970468580722809e-05, 5.342438817024231e-05, 5.714409053325653e-05, 6.086379289627075e-05, 6.458349525928497e-05, 6.83031976222992e-05, 7.202289998531342e-05, 7.574260234832764e-05, 7.946230471134186e-05, 8.318200707435608e-05, 8.69017094373703e-05, 9.062141180038452e-05, 9.434111416339874e-05, 9.806081652641296e-05, 0.00010178051888942719, 0.0001055002212524414]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 8.0, 14.0, 16.0, 10.0, 13.0, 21.0, 31.0, 32.0, 28.0, 32.0, 47.0, 44.0, 46.0, 47.0, 37.0, 38.0, 52.0, 39.0, 50.0, 39.0, 41.0, 40.0, 43.0, 31.0, 31.0, 35.0, 28.0, 25.0, 19.0, 16.0, 7.0, 7.0, 6.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.640625, -5.420654296875, -5.20068359375, -4.980712890625, -4.7607421875, -4.540771484375, -4.32080078125, -4.100830078125, -3.880859375, -3.660888671875, -3.44091796875, -3.220947265625, -3.0009765625, -2.781005859375, -2.56103515625, -2.341064453125, -2.12109375, -1.901123046875, -1.68115234375, -1.461181640625, -1.2412109375, -1.021240234375, -0.80126953125, -0.581298828125, -0.361328125, -0.141357421875, 0.07861328125, 0.298583984375, 0.5185546875, 0.738525390625, 0.95849609375, 1.178466796875, 1.3984375, 1.618408203125, 1.83837890625, 2.058349609375, 2.2783203125, 2.498291015625, 2.71826171875, 2.938232421875, 3.158203125, 3.378173828125, 3.59814453125, 3.818115234375, 4.0380859375, 4.258056640625, 4.47802734375, 4.697998046875, 4.91796875, 5.137939453125, 5.35791015625, 5.577880859375, 5.7978515625, 6.017822265625, 6.23779296875, 6.457763671875, 6.677734375, 6.897705078125, 7.11767578125, 7.337646484375, 7.5576171875, 7.777587890625, 7.99755859375, 8.217529296875, 8.4375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 8.0, 9.0, 18.0, 21.0, 32.0, 38.0, 49.0, 69.0, 76.0, 144.0, 192.0, 271.0, 441.0, 715.0, 1306.0, 3101.0, 7696.0, 21755.0, 60946.0, 168880.0, 433247.0, 224653.0, 78659.0, 28431.0, 10100.0, 3720.0, 1577.0, 866.0, 511.0, 308.0, 196.0, 156.0, 95.0, 79.0, 58.0, 36.0, 27.0, 19.0, 15.0, 15.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.671875, -7.42138671875, -7.1708984375, -6.92041015625, -6.669921875, -6.41943359375, -6.1689453125, -5.91845703125, -5.66796875, -5.41748046875, -5.1669921875, -4.91650390625, -4.666015625, -4.41552734375, -4.1650390625, -3.91455078125, -3.6640625, -3.41357421875, -3.1630859375, -2.91259765625, -2.662109375, -2.41162109375, -2.1611328125, -1.91064453125, -1.66015625, -1.40966796875, -1.1591796875, -0.90869140625, -0.658203125, -0.40771484375, -0.1572265625, 0.09326171875, 0.34375, 0.59423828125, 0.8447265625, 1.09521484375, 1.345703125, 1.59619140625, 1.8466796875, 2.09716796875, 2.34765625, 2.59814453125, 2.8486328125, 3.09912109375, 3.349609375, 3.60009765625, 3.8505859375, 4.10107421875, 4.3515625, 4.60205078125, 4.8525390625, 5.10302734375, 5.353515625, 5.60400390625, 5.8544921875, 6.10498046875, 6.35546875, 6.60595703125, 6.8564453125, 7.10693359375, 7.357421875, 7.60791015625, 7.8583984375, 8.10888671875, 8.359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 8.0, 12.0, 16.0, 6.0, 17.0, 21.0, 35.0, 29.0, 42.0, 32.0, 58.0, 46.0, 66.0, 100.0, 218.0, 1511.0, 262.0, 111.0, 79.0, 44.0, 39.0, 42.0, 47.0, 32.0, 31.0, 22.0, 29.0, 24.0, 11.0, 13.0, 10.0, 8.0, 3.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.5771484375, -18.810546875, -18.0439453125, -17.27734375, -16.5107421875, -15.744140625, -14.9775390625, -14.2109375, -13.4443359375, -12.677734375, -11.9111328125, -11.14453125, -10.3779296875, -9.611328125, -8.8447265625, -8.078125, -7.3115234375, -6.544921875, -5.7783203125, -5.01171875, -4.2451171875, -3.478515625, -2.7119140625, -1.9453125, -1.1787109375, -0.412109375, 0.3544921875, 1.12109375, 1.8876953125, 2.654296875, 3.4208984375, 4.1875, 4.9541015625, 5.720703125, 6.4873046875, 7.25390625, 8.0205078125, 8.787109375, 9.5537109375, 10.3203125, 11.0869140625, 11.853515625, 12.6201171875, 13.38671875, 14.1533203125, 14.919921875, 15.6865234375, 16.453125, 17.2197265625, 17.986328125, 18.7529296875, 19.51953125, 20.2861328125, 21.052734375, 21.8193359375, 22.5859375, 23.3525390625, 24.119140625, 24.8857421875, 25.65234375, 26.4189453125, 27.185546875, 27.9521484375, 28.71875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 7.0, 10.0, 8.0, 5.0, 7.0, 10.0, 6.0, 16.0, 18.0, 26.0, 24.0, 27.0, 56.0, 57.0, 57.0, 90.0, 115.0, 149.0, 217.0, 431.0, 871.0, 5157.0, 2892196.0, 242426.0, 2078.0, 592.0, 280.0, 213.0, 119.0, 97.0, 69.0, 55.0, 47.0, 34.0, 22.0, 24.0, 18.0, 17.0, 18.0, 8.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-66.6875, -64.7158203125, -62.744140625, -60.7724609375, -58.80078125, -56.8291015625, -54.857421875, -52.8857421875, -50.9140625, -48.9423828125, -46.970703125, -44.9990234375, -43.02734375, -41.0556640625, -39.083984375, -37.1123046875, -35.140625, -33.1689453125, -31.197265625, -29.2255859375, -27.25390625, -25.2822265625, -23.310546875, -21.3388671875, -19.3671875, -17.3955078125, -15.423828125, -13.4521484375, -11.48046875, -9.5087890625, -7.537109375, -5.5654296875, -3.59375, -1.6220703125, 0.349609375, 2.3212890625, 4.29296875, 6.2646484375, 8.236328125, 10.2080078125, 12.1796875, 14.1513671875, 16.123046875, 18.0947265625, 20.06640625, 22.0380859375, 24.009765625, 25.9814453125, 27.953125, 29.9248046875, 31.896484375, 33.8681640625, 35.83984375, 37.8115234375, 39.783203125, 41.7548828125, 43.7265625, 45.6982421875, 47.669921875, 49.6416015625, 51.61328125, 53.5849609375, 55.556640625, 57.5283203125, 59.5]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [2.0, 2.0, 9.0, 247.0, 676.0, 78.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.267841339111328, -23.244535446166992, -16.221229553222656, -9.197925567626953, -2.174619674682617, 4.848686218261719, 11.871990203857422, 18.89529800415039, 25.918601989746094, 32.9419059753418, 39.965213775634766, 46.98851776123047, 54.01182556152344, 61.03512954711914, 68.05843353271484, 75.08174133300781, 82.10504150390625, 89.12834930419922, 96.15164947509766, 103.17495727539062, 110.1982650756836, 117.22157287597656, 124.244873046875, 131.2681884765625, 138.29148864746094, 145.31478881835938, 152.33810424804688, 159.3614044189453, 166.38470458984375, 173.40802001953125, 180.4313201904297, 187.45462036132812, 194.47792053222656, 201.501220703125, 208.5245361328125, 215.54783630371094, 222.57113647460938, 229.59445190429688, 236.6177520751953, 243.64105224609375, 250.66436767578125, 257.68768310546875, 264.7109680175781, 271.7342834472656, 278.7575988769531, 285.7808837890625, 292.80419921875, 299.8275146484375, 306.8507995605469, 313.8741149902344, 320.89739990234375, 327.92071533203125, 334.94403076171875, 341.9673156738281, 348.9906311035156, 356.0139465332031, 363.0372619628906, 370.0605773925781, 377.0838623046875, 384.107177734375, 391.1304931640625, 398.1537780761719, 405.1770935058594, 412.2004089355469, 419.22369384765625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 4.0, 8.0, 8.0, 6.0, 10.0, 14.0, 17.0, 17.0, 27.0, 20.0, 19.0, 30.0, 28.0, 37.0, 37.0, 35.0, 47.0, 42.0, 50.0, 51.0, 51.0, 39.0, 37.0, 39.0, 44.0, 33.0, 39.0, 28.0, 22.0, 26.0, 22.0, 18.0, 12.0, 10.0, 11.0, 10.0, 11.0, 3.0, 6.0, 3.0, 9.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-65.57060241699219, -63.566627502441406, -61.56265640258789, -59.55868148803711, -57.554710388183594, -55.55073547363281, -53.54676055908203, -51.54278564453125, -49.538814544677734, -47.53483963012695, -45.53086853027344, -43.526893615722656, -41.522918701171875, -39.51894760131836, -37.51497268676758, -35.51100158691406, -33.50702667236328, -31.503053665161133, -29.499080657958984, -27.495105743408203, -25.491132736206055, -23.487159729003906, -21.483184814453125, -19.479211807250977, -17.475238800048828, -15.47126579284668, -13.467291831970215, -11.46331787109375, -9.459344863891602, -7.455371856689453, -5.451397895812988, -3.4474239349365234, -1.4434432983398438, 0.5605301856994629, 2.5645036697387695, 4.568477153778076, 6.572450637817383, 8.576423645019531, 10.580397605895996, 12.584371566772461, 14.58834457397461, 16.592317581176758, 18.596290588378906, 20.600265502929688, 22.604238510131836, 24.608211517333984, 26.612186431884766, 28.616159439086914, 30.620132446289062, 32.624107360839844, 34.62807846069336, 36.63205337524414, 38.636024475097656, 40.63999938964844, 42.64397430419922, 44.64794921875, 46.651920318603516, 48.6558952331543, 50.65986633300781, 52.663841247558594, 54.667816162109375, 56.67178726196289, 58.67576217651367, 60.67973327636719, 62.68370819091797]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 11.0, 16.0, 13.0, 16.0, 16.0, 20.0, 24.0, 27.0, 28.0, 32.0, 42.0, 38.0, 34.0, 27.0, 59.0, 36.0, 37.0, 41.0, 42.0, 53.0, 51.0, 36.0, 42.0, 36.0, 37.0, 33.0, 31.0, 26.0, 16.0, 15.0, 13.0, 12.0, 7.0, 9.0, 7.0, 3.0, 2.0, 8.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3984375, -6.15380859375, -5.9091796875, -5.66455078125, -5.419921875, -5.17529296875, -4.9306640625, -4.68603515625, -4.44140625, -4.19677734375, -3.9521484375, -3.70751953125, -3.462890625, -3.21826171875, -2.9736328125, -2.72900390625, -2.484375, -2.23974609375, -1.9951171875, -1.75048828125, -1.505859375, -1.26123046875, -1.0166015625, -0.77197265625, -0.52734375, -0.28271484375, -0.0380859375, 0.20654296875, 0.451171875, 0.69580078125, 0.9404296875, 1.18505859375, 1.4296875, 1.67431640625, 1.9189453125, 2.16357421875, 2.408203125, 2.65283203125, 2.8974609375, 3.14208984375, 3.38671875, 3.63134765625, 3.8759765625, 4.12060546875, 4.365234375, 4.60986328125, 4.8544921875, 5.09912109375, 5.34375, 5.58837890625, 5.8330078125, 6.07763671875, 6.322265625, 6.56689453125, 6.8115234375, 7.05615234375, 7.30078125, 7.54541015625, 7.7900390625, 8.03466796875, 8.279296875, 8.52392578125, 8.7685546875, 9.01318359375, 9.2578125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 10.0, 15.0, 15.0, 13.0, 29.0, 27.0, 25.0, 23.0, 32.0, 51.0, 56.0, 104.0, 305.0, 1072.0, 9780.0, 867925.0, 3212908.0, 98056.0, 2767.0, 549.0, 172.0, 74.0, 46.0, 34.0, 35.0, 32.0, 20.0, 19.0, 10.0, 23.0, 7.0, 10.0, 4.0, 5.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.598388671875, -20.74365234375, -19.888916015625, -19.0341796875, -18.179443359375, -17.32470703125, -16.469970703125, -15.615234375, -14.760498046875, -13.90576171875, -13.051025390625, -12.1962890625, -11.341552734375, -10.48681640625, -9.632080078125, -8.77734375, -7.922607421875, -7.06787109375, -6.213134765625, -5.3583984375, -4.503662109375, -3.64892578125, -2.794189453125, -1.939453125, -1.084716796875, -0.22998046875, 0.624755859375, 1.4794921875, 2.334228515625, 3.18896484375, 4.043701171875, 4.8984375, 5.753173828125, 6.60791015625, 7.462646484375, 8.3173828125, 9.172119140625, 10.02685546875, 10.881591796875, 11.736328125, 12.591064453125, 13.44580078125, 14.300537109375, 15.1552734375, 16.010009765625, 16.86474609375, 17.719482421875, 18.57421875, 19.428955078125, 20.28369140625, 21.138427734375, 21.9931640625, 22.847900390625, 23.70263671875, 24.557373046875, 25.412109375, 26.266845703125, 27.12158203125, 27.976318359375, 28.8310546875, 29.685791015625, 30.54052734375, 31.395263671875, 32.25]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 8.0, 15.0, 17.0, 33.0, 46.0, 41.0, 83.0, 129.0, 175.0, 246.0, 349.0, 400.0, 477.0, 477.0, 437.0, 301.0, 250.0, 175.0, 127.0, 75.0, 60.0, 52.0, 30.0, 18.0, 9.0, 16.0, 9.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7578125, -14.2474365234375, -13.737060546875, -13.2266845703125, -12.71630859375, -12.2059326171875, -11.695556640625, -11.1851806640625, -10.6748046875, -10.1644287109375, -9.654052734375, -9.1436767578125, -8.63330078125, -8.1229248046875, -7.612548828125, -7.1021728515625, -6.591796875, -6.0814208984375, -5.571044921875, -5.0606689453125, -4.55029296875, -4.0399169921875, -3.529541015625, -3.0191650390625, -2.5087890625, -1.9984130859375, -1.488037109375, -0.9776611328125, -0.46728515625, 0.0430908203125, 0.553466796875, 1.0638427734375, 1.57421875, 2.0845947265625, 2.594970703125, 3.1053466796875, 3.61572265625, 4.1260986328125, 4.636474609375, 5.1468505859375, 5.6572265625, 6.1676025390625, 6.677978515625, 7.1883544921875, 7.69873046875, 8.2091064453125, 8.719482421875, 9.2298583984375, 9.740234375, 10.2506103515625, 10.760986328125, 11.2713623046875, 11.78173828125, 12.2921142578125, 12.802490234375, 13.3128662109375, 13.8232421875, 14.3336181640625, 14.843994140625, 15.3543701171875, 15.86474609375, 16.3751220703125, 16.885498046875, 17.3958740234375, 17.90625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 10.0, 5.0, 14.0, 10.0, 16.0, 22.0, 44.0, 40.0, 60.0, 73.0, 110.0, 158.0, 197.0, 273.0, 411.0, 841.0, 9139.0, 2937801.0, 1238325.0, 4706.0, 711.0, 381.0, 244.0, 194.0, 134.0, 90.0, 99.0, 67.0, 38.0, 21.0, 18.0, 17.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.625, -57.9169921875, -56.208984375, -54.5009765625, -52.79296875, -51.0849609375, -49.376953125, -47.6689453125, -45.9609375, -44.2529296875, -42.544921875, -40.8369140625, -39.12890625, -37.4208984375, -35.712890625, -34.0048828125, -32.296875, -30.5888671875, -28.880859375, -27.1728515625, -25.46484375, -23.7568359375, -22.048828125, -20.3408203125, -18.6328125, -16.9248046875, -15.216796875, -13.5087890625, -11.80078125, -10.0927734375, -8.384765625, -6.6767578125, -4.96875, -3.2607421875, -1.552734375, 0.1552734375, 1.86328125, 3.5712890625, 5.279296875, 6.9873046875, 8.6953125, 10.4033203125, 12.111328125, 13.8193359375, 15.52734375, 17.2353515625, 18.943359375, 20.6513671875, 22.359375, 24.0673828125, 25.775390625, 27.4833984375, 29.19140625, 30.8994140625, 32.607421875, 34.3154296875, 36.0234375, 37.7314453125, 39.439453125, 41.1474609375, 42.85546875, 44.5634765625, 46.271484375, 47.9794921875, 49.6875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 16.0, 82.0, 212.0, 327.0, 251.0, 88.0, 28.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.50189208984375, -133.45700073242188, -128.412109375, -123.3672103881836, -118.32231140136719, -113.27742004394531, -108.23252868652344, -103.18763732910156, -98.14273834228516, -93.09784698486328, -88.05294799804688, -83.008056640625, -77.96316528320312, -72.91826629638672, -67.87337493896484, -62.8284797668457, -57.78358459472656, -52.73868942260742, -47.69379425048828, -42.648902893066406, -37.604007720947266, -32.559112548828125, -27.514219284057617, -22.46932601928711, -17.42443084716797, -12.379536628723145, -7.33464241027832, -2.289748191833496, 2.755146026611328, 7.800041198730469, 12.844934463500977, 17.889827728271484, 22.934738159179688, 27.979633331298828, 33.02452850341797, 38.069419860839844, 43.114315032958984, 48.159210205078125, 53.2041015625, 58.24899673461914, 63.29389190673828, 68.33878326416016, 73.38368225097656, 78.42857360839844, 83.47346496582031, 88.51836395263672, 93.5632553100586, 98.608154296875, 103.65304565429688, 108.69793701171875, 113.74283599853516, 118.78772735595703, 123.83262634277344, 128.8775177001953, 133.9224090576172, 138.96730041503906, 144.01220703125, 149.05709838867188, 154.10198974609375, 159.1468963623047, 164.19178771972656, 169.23667907714844, 174.2815704345703, 179.3264617919922, 184.37135314941406]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 4.0, 10.0, 9.0, 13.0, 13.0, 11.0, 18.0, 20.0, 23.0, 31.0, 31.0, 31.0, 41.0, 39.0, 43.0, 36.0, 32.0, 34.0, 34.0, 51.0, 44.0, 46.0, 34.0, 31.0, 41.0, 36.0, 34.0, 30.0, 24.0, 32.0, 19.0, 18.0, 8.0, 10.0, 14.0, 8.0, 9.0, 11.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.45903396606445, -40.982994079589844, -39.506954193115234, -38.030914306640625, -36.554874420166016, -35.078834533691406, -33.6027946472168, -32.12675476074219, -30.650714874267578, -29.17467498779297, -27.69863510131836, -26.22259521484375, -24.74655532836914, -23.27051544189453, -21.794475555419922, -20.318435668945312, -18.842395782470703, -17.366355895996094, -15.890316009521484, -14.414276123046875, -12.938236236572266, -11.462196350097656, -9.986156463623047, -8.510116577148438, -7.034076690673828, -5.558036804199219, -4.081996917724609, -2.60595703125, -1.1299171447753906, 0.34612274169921875, 1.8221626281738281, 3.2982025146484375, 4.774238586425781, 6.250278472900391, 7.726318359375, 9.20235824584961, 10.678398132324219, 12.154438018798828, 13.630477905273438, 15.106517791748047, 16.582557678222656, 18.058597564697266, 19.534637451171875, 21.010677337646484, 22.486717224121094, 23.962757110595703, 25.438796997070312, 26.914836883544922, 28.39087677001953, 29.86691665649414, 31.34295654296875, 32.81899642944336, 34.29503631591797, 35.77107620239258, 37.24711608886719, 38.7231559753418, 40.199195861816406, 41.675235748291016, 43.151275634765625, 44.627315521240234, 46.103355407714844, 47.57939529418945, 49.05543518066406, 50.53147506713867, 52.00751495361328]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 8.0, 9.0, 15.0, 18.0, 18.0, 22.0, 24.0, 28.0, 34.0, 37.0, 32.0, 48.0, 49.0, 47.0, 44.0, 38.0, 49.0, 47.0, 50.0, 46.0, 48.0, 46.0, 44.0, 36.0, 46.0, 19.0, 23.0, 11.0, 15.0, 9.0, 5.0, 10.0, 8.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.63348388671875, -6.3802490234375, -6.12701416015625, -5.873779296875, -5.62054443359375, -5.3673095703125, -5.11407470703125, -4.86083984375, -4.60760498046875, -4.3543701171875, -4.10113525390625, -3.847900390625, -3.59466552734375, -3.3414306640625, -3.08819580078125, -2.8349609375, -2.58172607421875, -2.3284912109375, -2.07525634765625, -1.822021484375, -1.56878662109375, -1.3155517578125, -1.06231689453125, -0.80908203125, -0.55584716796875, -0.3026123046875, -0.04937744140625, 0.203857421875, 0.45709228515625, 0.7103271484375, 0.96356201171875, 1.216796875, 1.47003173828125, 1.7232666015625, 1.97650146484375, 2.229736328125, 2.48297119140625, 2.7362060546875, 2.98944091796875, 3.24267578125, 3.49591064453125, 3.7491455078125, 4.00238037109375, 4.255615234375, 4.50885009765625, 4.7620849609375, 5.01531982421875, 5.2685546875, 5.52178955078125, 5.7750244140625, 6.02825927734375, 6.281494140625, 6.53472900390625, 6.7879638671875, 7.04119873046875, 7.29443359375, 7.54766845703125, 7.8009033203125, 8.05413818359375, 8.307373046875, 8.56060791015625, 8.8138427734375, 9.06707763671875, 9.3203125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 10.0, 20.0, 21.0, 34.0, 36.0, 59.0, 109.0, 151.0, 268.0, 462.0, 719.0, 1268.0, 2042.0, 3432.0, 5627.0, 9790.0, 17474.0, 31014.0, 56774.0, 110017.0, 269530.0, 293614.0, 113678.0, 58391.0, 31644.0, 17602.0, 10249.0, 5819.0, 3477.0, 2033.0, 1183.0, 775.0, 439.0, 301.0, 177.0, 109.0, 67.0, 42.0, 33.0, 18.0, 12.0, 11.0, 3.0, 7.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.43359375, -2.359893798828125, -2.28619384765625, -2.212493896484375, -2.1387939453125, -2.065093994140625, -1.99139404296875, -1.917694091796875, -1.843994140625, -1.770294189453125, -1.69659423828125, -1.622894287109375, -1.5491943359375, -1.475494384765625, -1.40179443359375, -1.328094482421875, -1.25439453125, -1.180694580078125, -1.10699462890625, -1.033294677734375, -0.9595947265625, -0.885894775390625, -0.81219482421875, -0.738494873046875, -0.664794921875, -0.591094970703125, -0.51739501953125, -0.443695068359375, -0.3699951171875, -0.296295166015625, -0.22259521484375, -0.148895263671875, -0.0751953125, -0.001495361328125, 0.07220458984375, 0.145904541015625, 0.2196044921875, 0.293304443359375, 0.36700439453125, 0.440704345703125, 0.514404296875, 0.588104248046875, 0.66180419921875, 0.735504150390625, 0.8092041015625, 0.882904052734375, 0.95660400390625, 1.030303955078125, 1.10400390625, 1.177703857421875, 1.25140380859375, 1.325103759765625, 1.3988037109375, 1.472503662109375, 1.54620361328125, 1.619903564453125, 1.693603515625, 1.767303466796875, 1.84100341796875, 1.914703369140625, 1.9884033203125, 2.062103271484375, 2.13580322265625, 2.209503173828125, 2.283203125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 4.0, 7.0, 6.0, 9.0, 6.0, 11.0, 11.0, 12.0, 12.0, 19.0, 30.0, 21.0, 27.0, 29.0, 39.0, 28.0, 41.0, 34.0, 38.0, 48.0, 41.0, 1069.0, 38.0, 51.0, 58.0, 34.0, 36.0, 25.0, 36.0, 38.0, 26.0, 34.0, 29.0, 17.0, 14.0, 10.0, 11.0, 7.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.3984375, -5.252838134765625, -5.10723876953125, -4.961639404296875, -4.8160400390625, -4.670440673828125, -4.52484130859375, -4.379241943359375, -4.233642578125, -4.088043212890625, -3.94244384765625, -3.796844482421875, -3.6512451171875, -3.505645751953125, -3.36004638671875, -3.214447021484375, -3.06884765625, -2.923248291015625, -2.77764892578125, -2.632049560546875, -2.4864501953125, -2.340850830078125, -2.19525146484375, -2.049652099609375, -1.904052734375, -1.758453369140625, -1.61285400390625, -1.467254638671875, -1.3216552734375, -1.176055908203125, -1.03045654296875, -0.884857177734375, -0.7392578125, -0.593658447265625, -0.44805908203125, -0.302459716796875, -0.1568603515625, -0.011260986328125, 0.13433837890625, 0.279937744140625, 0.425537109375, 0.571136474609375, 0.71673583984375, 0.862335205078125, 1.0079345703125, 1.153533935546875, 1.29913330078125, 1.444732666015625, 1.59033203125, 1.735931396484375, 1.88153076171875, 2.027130126953125, 2.1727294921875, 2.318328857421875, 2.46392822265625, 2.609527587890625, 2.755126953125, 2.900726318359375, 3.04632568359375, 3.191925048828125, 3.3375244140625, 3.483123779296875, 3.62872314453125, 3.774322509765625, 3.919921875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 8.0, 6.0, 11.0, 21.0, 30.0, 55.0, 70.0, 108.0, 169.0, 300.0, 487.0, 678.0, 1091.0, 1710.0, 2648.0, 4064.0, 6510.0, 10539.0, 17391.0, 27787.0, 46845.0, 79047.0, 147418.0, 1393688.0, 151940.0, 81515.0, 48024.0, 28516.0, 17450.0, 10832.0, 6533.0, 4100.0, 2623.0, 1718.0, 1140.0, 746.0, 447.0, 298.0, 210.0, 136.0, 86.0, 38.0, 33.0, 29.0, 12.0, 17.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.0234375, -1.96307373046875, -1.9027099609375, -1.84234619140625, -1.781982421875, -1.72161865234375, -1.6612548828125, -1.60089111328125, -1.54052734375, -1.48016357421875, -1.4197998046875, -1.35943603515625, -1.299072265625, -1.23870849609375, -1.1783447265625, -1.11798095703125, -1.0576171875, -0.99725341796875, -0.9368896484375, -0.87652587890625, -0.816162109375, -0.75579833984375, -0.6954345703125, -0.63507080078125, -0.57470703125, -0.51434326171875, -0.4539794921875, -0.39361572265625, -0.333251953125, -0.27288818359375, -0.2125244140625, -0.15216064453125, -0.091796875, -0.03143310546875, 0.0289306640625, 0.08929443359375, 0.149658203125, 0.21002197265625, 0.2703857421875, 0.33074951171875, 0.39111328125, 0.45147705078125, 0.5118408203125, 0.57220458984375, 0.632568359375, 0.69293212890625, 0.7532958984375, 0.81365966796875, 0.8740234375, 0.93438720703125, 0.9947509765625, 1.05511474609375, 1.115478515625, 1.17584228515625, 1.2362060546875, 1.29656982421875, 1.35693359375, 1.41729736328125, 1.4776611328125, 1.53802490234375, 1.598388671875, 1.65875244140625, 1.7191162109375, 1.77947998046875, 1.83984375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 6.0, 7.0, 6.0, 5.0, 6.0, 13.0, 7.0, 9.0, 11.0, 11.0, 10.0, 23.0, 21.0, 30.0, 37.0, 32.0, 43.0, 59.0, 63.0, 71.0, 66.0, 63.0, 45.0, 54.0, 36.0, 54.0, 26.0, 28.0, 29.0, 18.0, 19.0, 17.0, 14.0, 16.0, 7.0, 4.0, 7.0, 3.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0002315044403076172, -0.0002239122986793518, -0.00021632015705108643, -0.00020872801542282104, -0.00020113587379455566, -0.00019354373216629028, -0.0001859515905380249, -0.00017835944890975952, -0.00017076730728149414, -0.00016317516565322876, -0.00015558302402496338, -0.000147990882396698, -0.00014039874076843262, -0.00013280659914016724, -0.00012521445751190186, -0.00011762231588363647, -0.0001100301742553711, -0.00010243803262710571, -9.484589099884033e-05, -8.725374937057495e-05, -7.966160774230957e-05, -7.206946611404419e-05, -6.447732448577881e-05, -5.688518285751343e-05, -4.929304122924805e-05, -4.1700899600982666e-05, -3.4108757972717285e-05, -2.6516616344451904e-05, -1.8924474716186523e-05, -1.1332333087921143e-05, -3.7401914596557617e-06, 3.851950168609619e-06, 1.1444091796875e-05, 1.903623342514038e-05, 2.6628375053405762e-05, 3.422051668167114e-05, 4.1812658309936523e-05, 4.9404799938201904e-05, 5.6996941566467285e-05, 6.458908319473267e-05, 7.218122482299805e-05, 7.977336645126343e-05, 8.736550807952881e-05, 9.495764970779419e-05, 0.00010254979133605957, 0.00011014193296432495, 0.00011773407459259033, 0.0001253262162208557, 0.0001329183578491211, 0.00014051049947738647, 0.00014810264110565186, 0.00015569478273391724, 0.00016328692436218262, 0.000170879065990448, 0.00017847120761871338, 0.00018606334924697876, 0.00019365549087524414, 0.00020124763250350952, 0.0002088397741317749, 0.00021643191576004028, 0.00022402405738830566, 0.00023161619901657104, 0.00023920834064483643, 0.0002468004822731018, 0.0002543926239013672]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 4.0, 7.0, 10.0, 9.0, 16.0, 17.0, 20.0, 30.0, 41.0, 57.0, 63.0, 117.0, 138.0, 291.0, 600.0, 2561.0, 917550.0, 124617.0, 1196.0, 504.0, 229.0, 131.0, 68.0, 51.0, 48.0, 25.0, 24.0, 19.0, 13.0, 17.0, 15.0, 8.0, 13.0, 2.0, 3.0, 10.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.005825042724609375, -0.0056528449058532715, -0.005480647087097168, -0.0053084492683410645, -0.005136251449584961, -0.004964053630828857, -0.004791855812072754, -0.00461965799331665, -0.004447460174560547, -0.004275262355804443, -0.00410306453704834, -0.003930866718292236, -0.003758668899536133, -0.0035864710807800293, -0.0034142732620239258, -0.0032420754432678223, -0.0030698776245117188, -0.0028976798057556152, -0.0027254819869995117, -0.002553284168243408, -0.0023810863494873047, -0.002208888530731201, -0.0020366907119750977, -0.0018644928932189941, -0.0016922950744628906, -0.0015200972557067871, -0.0013478994369506836, -0.00117570161819458, -0.0010035037994384766, -0.000831305980682373, -0.0006591081619262695, -0.000486910343170166, -0.0003147125244140625, -0.00014251470565795898, 2.968311309814453e-05, 0.00020188093185424805, 0.00037407875061035156, 0.0005462765693664551, 0.0007184743881225586, 0.0008906722068786621, 0.0010628700256347656, 0.0012350678443908691, 0.0014072656631469727, 0.0015794634819030762, 0.0017516613006591797, 0.0019238591194152832, 0.0020960569381713867, 0.0022682547569274902, 0.0024404525756835938, 0.0026126503944396973, 0.0027848482131958008, 0.0029570460319519043, 0.003129243850708008, 0.0033014416694641113, 0.003473639488220215, 0.0036458373069763184, 0.003818035125732422, 0.003990232944488525, 0.004162430763244629, 0.004334628582000732, 0.004506826400756836, 0.0046790242195129395, 0.004851222038269043, 0.0050234198570251465, 0.00519561767578125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 8.0, 72.0, 301.0, 412.0, 175.0, 43.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002528906334191561, -0.00023235274420585483, -0.0002118148549925536, -0.00019127698033116758, -0.0001707390765659511, -0.0001502012019045651, -0.00012966331269126385, -0.00010912542347796261, -8.858753426466137e-05, -6.804964505136013e-05, -4.7511759476037696e-05, -2.6973873900715262e-05, -6.43598468741402e-06, 1.4101904525887221e-05, 3.463978646323085e-05, 5.517767567653209e-05, 7.571556488983333e-05, 9.625345410313457e-05, 0.00011679134331643581, 0.00013732921797782183, 0.0001578671217430383, 0.0001784049964044243, 0.00019894288561772555, 0.0002194807748310268, 0.00024001866404432803, 0.0002605565532576293, 0.0002810944279190153, 0.00030163233168423176, 0.00032217020634561777, 0.00034270811011083424, 0.00036324598477222025, 0.0003837838885374367, 0.00040432176319882274, 0.00042485963786020875, 0.0004453975416254252, 0.00046593541628681123, 0.0004864733200520277, 0.0005070111947134137, 0.0005275490693747997, 0.0005480869440361857, 0.0005686248769052327, 0.0005891627515666187, 0.0006097006262280047, 0.0006302385590970516, 0.0006507764337584376, 0.0006713143084198236, 0.0006918521830812097, 0.0007123900577425957, 0.0007329279324039817, 0.0007534658070653677, 0.0007740036817267537, 0.0007945416145958006, 0.0008150794892571867, 0.0008356173639185727, 0.0008561552385799587, 0.0008766931714490056, 0.0008972310461103916, 0.0009177689207717776, 0.0009383067954331636, 0.0009588447283022106, 0.0009793825447559357, 0.0009999205358326435, 0.0010204584104940295, 0.0010409962851554155, 0.0010615341598168015]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 6.0, 7.0, 9.0, 11.0, 13.0, 17.0, 22.0, 27.0, 35.0, 34.0, 35.0, 38.0, 31.0, 35.0, 43.0, 50.0, 51.0, 42.0, 32.0, 43.0, 53.0, 41.0, 35.0, 42.0, 34.0, 30.0, 36.0, 19.0, 13.0, 23.0, 22.0, 9.0, 6.0, 13.0, 8.0, 5.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.00015360116958618164, -0.00014895573258399963, -0.00014431029558181763, -0.00013966485857963562, -0.0001350194215774536, -0.0001303739845752716, -0.0001257285475730896, -0.00012108311057090759, -0.00011643767356872559, -0.00011179223656654358, -0.00010714679956436157, -0.00010250136256217957, -9.785592555999756e-05, -9.321048855781555e-05, -8.856505155563354e-05, -8.391961455345154e-05, -7.927417755126953e-05, -7.462874054908752e-05, -6.998330354690552e-05, -6.533786654472351e-05, -6.0692429542541504e-05, -5.60469925403595e-05, -5.140155553817749e-05, -4.6756118535995483e-05, -4.2110681533813477e-05, -3.746524453163147e-05, -3.281980752944946e-05, -2.8174370527267456e-05, -2.352893352508545e-05, -1.8883496522903442e-05, -1.4238059520721436e-05, -9.592622518539429e-06, -4.947185516357422e-06, -3.0174851417541504e-07, 4.343688488006592e-06, 8.989125490188599e-06, 1.3634562492370605e-05, 1.8279999494552612e-05, 2.292543649673462e-05, 2.7570873498916626e-05, 3.221631050109863e-05, 3.686174750328064e-05, 4.1507184505462646e-05, 4.615262150764465e-05, 5.079805850982666e-05, 5.544349551200867e-05, 6.0088932514190674e-05, 6.473436951637268e-05, 6.937980651855469e-05, 7.40252435207367e-05, 7.86706805229187e-05, 8.331611752510071e-05, 8.796155452728271e-05, 9.260699152946472e-05, 9.725242853164673e-05, 0.00010189786553382874, 0.00010654330253601074, 0.00011118873953819275, 0.00011583417654037476, 0.00012047961354255676, 0.00012512505054473877, 0.00012977048754692078, 0.00013441592454910278, 0.0001390613615512848, 0.0001437067985534668]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 8.0, 9.0, 15.0, 18.0, 18.0, 22.0, 24.0, 28.0, 34.0, 37.0, 32.0, 48.0, 49.0, 47.0, 44.0, 38.0, 49.0, 47.0, 50.0, 46.0, 48.0, 46.0, 44.0, 36.0, 46.0, 19.0, 23.0, 11.0, 15.0, 9.0, 5.0, 10.0, 8.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.63348388671875, -6.3802490234375, -6.12701416015625, -5.873779296875, -5.62054443359375, -5.3673095703125, -5.11407470703125, -4.86083984375, -4.60760498046875, -4.3543701171875, -4.10113525390625, -3.847900390625, -3.59466552734375, -3.3414306640625, -3.08819580078125, -2.8349609375, -2.58172607421875, -2.3284912109375, -2.07525634765625, -1.822021484375, -1.56878662109375, -1.3155517578125, -1.06231689453125, -0.80908203125, -0.55584716796875, -0.3026123046875, -0.04937744140625, 0.203857421875, 0.45709228515625, 0.7103271484375, 0.96356201171875, 1.216796875, 1.47003173828125, 1.7232666015625, 1.97650146484375, 2.229736328125, 2.48297119140625, 2.7362060546875, 2.98944091796875, 3.24267578125, 3.49591064453125, 3.7491455078125, 4.00238037109375, 4.255615234375, 4.50885009765625, 4.7620849609375, 5.01531982421875, 5.2685546875, 5.52178955078125, 5.7750244140625, 6.02825927734375, 6.281494140625, 6.53472900390625, 6.7879638671875, 7.04119873046875, 7.29443359375, 7.54766845703125, 7.8009033203125, 8.05413818359375, 8.307373046875, 8.56060791015625, 8.8138427734375, 9.06707763671875, 9.3203125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 22.0, 30.0, 39.0, 67.0, 101.0, 124.0, 219.0, 260.0, 471.0, 722.0, 1266.0, 2471.0, 4941.0, 10602.0, 24928.0, 62987.0, 158112.0, 336914.0, 261209.0, 107492.0, 42472.0, 17372.0, 7566.0, 3566.0, 1842.0, 1018.0, 597.0, 362.0, 257.0, 150.0, 99.0, 73.0, 49.0, 34.0, 23.0, 15.0, 17.0, 12.0, 5.0, 5.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.90234375, -5.69732666015625, -5.4923095703125, -5.28729248046875, -5.082275390625, -4.87725830078125, -4.6722412109375, -4.46722412109375, -4.26220703125, -4.05718994140625, -3.8521728515625, -3.64715576171875, -3.442138671875, -3.23712158203125, -3.0321044921875, -2.82708740234375, -2.6220703125, -2.41705322265625, -2.2120361328125, -2.00701904296875, -1.802001953125, -1.59698486328125, -1.3919677734375, -1.18695068359375, -0.98193359375, -0.77691650390625, -0.5718994140625, -0.36688232421875, -0.161865234375, 0.04315185546875, 0.2481689453125, 0.45318603515625, 0.658203125, 0.86322021484375, 1.0682373046875, 1.27325439453125, 1.478271484375, 1.68328857421875, 1.8883056640625, 2.09332275390625, 2.29833984375, 2.50335693359375, 2.7083740234375, 2.91339111328125, 3.118408203125, 3.32342529296875, 3.5284423828125, 3.73345947265625, 3.9384765625, 4.14349365234375, 4.3485107421875, 4.55352783203125, 4.758544921875, 4.96356201171875, 5.1685791015625, 5.37359619140625, 5.57861328125, 5.78363037109375, 5.9886474609375, 6.19366455078125, 6.398681640625, 6.60369873046875, 6.8087158203125, 7.01373291015625, 7.21875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 10.0, 4.0, 16.0, 8.0, 14.0, 31.0, 18.0, 24.0, 28.0, 22.0, 30.0, 31.0, 46.0, 40.0, 66.0, 88.0, 191.0, 1486.0, 327.0, 115.0, 69.0, 66.0, 36.0, 37.0, 39.0, 36.0, 25.0, 27.0, 16.0, 21.0, 11.0, 13.0, 13.0, 12.0, 12.0, 4.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.609375, -24.8505859375, -24.091796875, -23.3330078125, -22.57421875, -21.8154296875, -21.056640625, -20.2978515625, -19.5390625, -18.7802734375, -18.021484375, -17.2626953125, -16.50390625, -15.7451171875, -14.986328125, -14.2275390625, -13.46875, -12.7099609375, -11.951171875, -11.1923828125, -10.43359375, -9.6748046875, -8.916015625, -8.1572265625, -7.3984375, -6.6396484375, -5.880859375, -5.1220703125, -4.36328125, -3.6044921875, -2.845703125, -2.0869140625, -1.328125, -0.5693359375, 0.189453125, 0.9482421875, 1.70703125, 2.4658203125, 3.224609375, 3.9833984375, 4.7421875, 5.5009765625, 6.259765625, 7.0185546875, 7.77734375, 8.5361328125, 9.294921875, 10.0537109375, 10.8125, 11.5712890625, 12.330078125, 13.0888671875, 13.84765625, 14.6064453125, 15.365234375, 16.1240234375, 16.8828125, 17.6416015625, 18.400390625, 19.1591796875, 19.91796875, 20.6767578125, 21.435546875, 22.1943359375, 22.953125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 11.0, 10.0, 13.0, 12.0, 12.0, 20.0, 39.0, 64.0, 70.0, 148.0, 206.0, 396.0, 1031.0, 225852.0, 2915266.0, 1393.0, 470.0, 218.0, 161.0, 95.0, 60.0, 35.0, 34.0, 15.0, 11.0, 11.0, 12.0, 7.0, 6.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.875, -117.22265625, -113.5703125, -109.91796875, -106.265625, -102.61328125, -98.9609375, -95.30859375, -91.65625, -88.00390625, -84.3515625, -80.69921875, -77.046875, -73.39453125, -69.7421875, -66.08984375, -62.4375, -58.78515625, -55.1328125, -51.48046875, -47.828125, -44.17578125, -40.5234375, -36.87109375, -33.21875, -29.56640625, -25.9140625, -22.26171875, -18.609375, -14.95703125, -11.3046875, -7.65234375, -4.0, -0.34765625, 3.3046875, 6.95703125, 10.609375, 14.26171875, 17.9140625, 21.56640625, 25.21875, 28.87109375, 32.5234375, 36.17578125, 39.828125, 43.48046875, 47.1328125, 50.78515625, 54.4375, 58.08984375, 61.7421875, 65.39453125, 69.046875, 72.69921875, 76.3515625, 80.00390625, 83.65625, 87.30859375, 90.9609375, 94.61328125, 98.265625, 101.91796875, 105.5703125, 109.22265625, 112.875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 13.0, 18.0, 25.0, 64.0, 112.0, 167.0, 144.0, 165.0, 128.0, 83.0, 51.0, 19.0, 10.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-45.60902404785156, -44.368011474609375, -43.12699508666992, -41.885982513427734, -40.64496612548828, -39.403953552246094, -38.16293716430664, -36.92192459106445, -35.680908203125, -34.43989562988281, -33.19887924194336, -31.95786476135254, -30.71685028076172, -29.47583770751953, -28.23482322692871, -26.99380874633789, -25.752796173095703, -24.511781692504883, -23.270767211914062, -22.029752731323242, -20.788738250732422, -19.547725677490234, -18.306711196899414, -17.065696716308594, -15.824682235717773, -14.583667755126953, -13.342653274536133, -12.101639747619629, -10.860625267028809, -9.619610786437988, -8.378597259521484, -7.137582778930664, -5.896568298339844, -4.655553817749023, -3.4145398139953613, -2.17352557182312, -0.9325113296508789, 0.3085031509399414, 1.5495171546936035, 2.7905311584472656, 4.031545639038086, 5.272560119628906, 6.513574123382568, 7.7545881271362305, 8.99560260772705, 10.236617088317871, 11.477630615234375, 12.718645095825195, 13.959659576416016, 15.200674057006836, 16.441688537597656, 17.682703018188477, 18.923717498779297, 20.164730072021484, 21.405744552612305, 22.646759033203125, 23.887773513793945, 25.128787994384766, 26.369802474975586, 27.610816955566406, 28.851829528808594, 30.092845916748047, 31.333858489990234, 32.57487487792969, 33.815887451171875]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 7.0, 11.0, 10.0, 10.0, 16.0, 21.0, 19.0, 17.0, 32.0, 30.0, 39.0, 27.0, 35.0, 34.0, 31.0, 40.0, 42.0, 44.0, 44.0, 51.0, 44.0, 38.0, 40.0, 34.0, 25.0, 37.0, 29.0, 31.0, 24.0, 15.0, 14.0, 20.0, 12.0, 9.0, 12.0, 10.0, 6.0, 8.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-61.82469177246094, -60.10287094116211, -58.38105010986328, -56.65922927856445, -54.937408447265625, -53.2155876159668, -51.49376678466797, -49.77194595336914, -48.05012512207031, -46.328304290771484, -44.606483459472656, -42.88466262817383, -41.162841796875, -39.44102096557617, -37.719200134277344, -35.997379302978516, -34.27555847167969, -32.55373764038086, -30.83191680908203, -29.110095977783203, -27.388275146484375, -25.666454315185547, -23.94463348388672, -22.22281265258789, -20.500991821289062, -18.779170989990234, -17.057350158691406, -15.335529327392578, -13.61370849609375, -11.891887664794922, -10.170066833496094, -8.448246002197266, -6.7264251708984375, -5.004604339599609, -3.2827835083007812, -1.5609626770019531, 0.160858154296875, 1.8826789855957031, 3.6044998168945312, 5.326320648193359, 7.0481414794921875, 8.769962310791016, 10.491783142089844, 12.213603973388672, 13.9354248046875, 15.657245635986328, 17.379066467285156, 19.100887298583984, 20.822708129882812, 22.54452896118164, 24.26634979248047, 25.988170623779297, 27.709991455078125, 29.431812286376953, 31.15363311767578, 32.87545394897461, 34.59727478027344, 36.319095611572266, 38.040916442871094, 39.76273727416992, 41.48455810546875, 43.20637893676758, 44.928199768066406, 46.650020599365234, 48.37184143066406]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 6.0, 8.0, 7.0, 14.0, 19.0, 14.0, 21.0, 25.0, 33.0, 28.0, 31.0, 36.0, 35.0, 37.0, 48.0, 59.0, 50.0, 43.0, 51.0, 48.0, 53.0, 31.0, 49.0, 55.0, 27.0, 29.0, 33.0, 18.0, 27.0, 17.0, 9.0, 10.0, 6.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.96875, -6.6956787109375, -6.422607421875, -6.1495361328125, -5.87646484375, -5.6033935546875, -5.330322265625, -5.0572509765625, -4.7841796875, -4.5111083984375, -4.238037109375, -3.9649658203125, -3.69189453125, -3.4188232421875, -3.145751953125, -2.8726806640625, -2.599609375, -2.3265380859375, -2.053466796875, -1.7803955078125, -1.50732421875, -1.2342529296875, -0.961181640625, -0.6881103515625, -0.4150390625, -0.1419677734375, 0.131103515625, 0.4041748046875, 0.67724609375, 0.9503173828125, 1.223388671875, 1.4964599609375, 1.76953125, 2.0426025390625, 2.315673828125, 2.5887451171875, 2.86181640625, 3.1348876953125, 3.407958984375, 3.6810302734375, 3.9541015625, 4.2271728515625, 4.500244140625, 4.7733154296875, 5.04638671875, 5.3194580078125, 5.592529296875, 5.8656005859375, 6.138671875, 6.4117431640625, 6.684814453125, 6.9578857421875, 7.23095703125, 7.5040283203125, 7.777099609375, 8.0501708984375, 8.3232421875, 8.5963134765625, 8.869384765625, 9.1424560546875, 9.41552734375, 9.6885986328125, 9.961669921875, 10.2347412109375, 10.5078125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 8.0, 9.0, 9.0, 15.0, 25.0, 22.0, 31.0, 30.0, 49.0, 66.0, 111.0, 181.0, 345.0, 1046.0, 6755.0, 202262.0, 2745769.0, 1198917.0, 35121.0, 2272.0, 530.0, 264.0, 126.0, 80.0, 47.0, 40.0, 36.0, 31.0, 16.0, 17.0, 12.0, 5.0, 7.0, 6.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.828125, -17.162109375, -16.49609375, -15.830078125, -15.1640625, -14.498046875, -13.83203125, -13.166015625, -12.5, -11.833984375, -11.16796875, -10.501953125, -9.8359375, -9.169921875, -8.50390625, -7.837890625, -7.171875, -6.505859375, -5.83984375, -5.173828125, -4.5078125, -3.841796875, -3.17578125, -2.509765625, -1.84375, -1.177734375, -0.51171875, 0.154296875, 0.8203125, 1.486328125, 2.15234375, 2.818359375, 3.484375, 4.150390625, 4.81640625, 5.482421875, 6.1484375, 6.814453125, 7.48046875, 8.146484375, 8.8125, 9.478515625, 10.14453125, 10.810546875, 11.4765625, 12.142578125, 12.80859375, 13.474609375, 14.140625, 14.806640625, 15.47265625, 16.138671875, 16.8046875, 17.470703125, 18.13671875, 18.802734375, 19.46875, 20.134765625, 20.80078125, 21.466796875, 22.1328125, 22.798828125, 23.46484375, 24.130859375, 24.796875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 2.0, 6.0, 8.0, 8.0, 18.0, 22.0, 32.0, 29.0, 48.0, 85.0, 110.0, 160.0, 179.0, 235.0, 303.0, 386.0, 425.0, 426.0, 370.0, 309.0, 235.0, 195.0, 133.0, 94.0, 70.0, 46.0, 31.0, 26.0, 26.0, 16.0, 11.0, 5.0, 3.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.8828125, -15.4410400390625, -14.999267578125, -14.5574951171875, -14.11572265625, -13.6739501953125, -13.232177734375, -12.7904052734375, -12.3486328125, -11.9068603515625, -11.465087890625, -11.0233154296875, -10.58154296875, -10.1397705078125, -9.697998046875, -9.2562255859375, -8.814453125, -8.3726806640625, -7.930908203125, -7.4891357421875, -7.04736328125, -6.6055908203125, -6.163818359375, -5.7220458984375, -5.2802734375, -4.8385009765625, -4.396728515625, -3.9549560546875, -3.51318359375, -3.0714111328125, -2.629638671875, -2.1878662109375, -1.74609375, -1.3043212890625, -0.862548828125, -0.4207763671875, 0.02099609375, 0.4627685546875, 0.904541015625, 1.3463134765625, 1.7880859375, 2.2298583984375, 2.671630859375, 3.1134033203125, 3.55517578125, 3.9969482421875, 4.438720703125, 4.8804931640625, 5.322265625, 5.7640380859375, 6.205810546875, 6.6475830078125, 7.08935546875, 7.5311279296875, 7.972900390625, 8.4146728515625, 8.8564453125, 9.2982177734375, 9.739990234375, 10.1817626953125, 10.62353515625, 11.0653076171875, 11.507080078125, 11.9488525390625, 12.390625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 5.0, 10.0, 7.0, 5.0, 11.0, 15.0, 27.0, 34.0, 38.0, 45.0, 58.0, 87.0, 118.0, 136.0, 187.0, 270.0, 403.0, 616.0, 2841.0, 330581.0, 3812032.0, 43660.0, 1251.0, 521.0, 307.0, 257.0, 194.0, 129.0, 109.0, 87.0, 43.0, 52.0, 30.0, 27.0, 26.0, 17.0, 12.0, 10.0, 3.0, 6.0, 11.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.625, -41.1201171875, -39.615234375, -38.1103515625, -36.60546875, -35.1005859375, -33.595703125, -32.0908203125, -30.5859375, -29.0810546875, -27.576171875, -26.0712890625, -24.56640625, -23.0615234375, -21.556640625, -20.0517578125, -18.546875, -17.0419921875, -15.537109375, -14.0322265625, -12.52734375, -11.0224609375, -9.517578125, -8.0126953125, -6.5078125, -5.0029296875, -3.498046875, -1.9931640625, -0.48828125, 1.0166015625, 2.521484375, 4.0263671875, 5.53125, 7.0361328125, 8.541015625, 10.0458984375, 11.55078125, 13.0556640625, 14.560546875, 16.0654296875, 17.5703125, 19.0751953125, 20.580078125, 22.0849609375, 23.58984375, 25.0947265625, 26.599609375, 28.1044921875, 29.609375, 31.1142578125, 32.619140625, 34.1240234375, 35.62890625, 37.1337890625, 38.638671875, 40.1435546875, 41.6484375, 43.1533203125, 44.658203125, 46.1630859375, 47.66796875, 49.1728515625, 50.677734375, 52.1826171875, 53.6875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 10.0, 10.0, 34.0, 42.0, 50.0, 69.0, 128.0, 113.0, 114.0, 131.0, 113.0, 76.0, 50.0, 24.0, 25.0, 13.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.03345489501953, -64.05902099609375, -62.0845947265625, -60.110164642333984, -58.13573455810547, -56.16130065917969, -54.18687438964844, -52.212440490722656, -50.23801040649414, -48.263580322265625, -46.28915023803711, -44.314720153808594, -42.34029006958008, -40.36585998535156, -38.39142608642578, -36.416996002197266, -34.44256591796875, -32.468135833740234, -30.49370574951172, -28.519275665283203, -26.544843673706055, -24.57041358947754, -22.595983505249023, -20.621551513671875, -18.647125244140625, -16.67269515991211, -14.698264122009277, -12.723834037780762, -10.74940299987793, -8.774972915649414, -6.800542831420898, -4.826111793518066, -2.8516807556152344, -0.8772503137588501, 1.0971801280975342, 3.071610450744629, 5.046041011810303, 7.020471572875977, 8.994901657104492, 10.969332695007324, 12.94376277923584, 14.918192863464355, 16.892623901367188, 18.867053985595703, 20.84148406982422, 22.815914154052734, 24.79034423828125, 26.7647762298584, 28.739206314086914, 30.71363639831543, 32.68806838989258, 34.662498474121094, 36.63692855834961, 38.611358642578125, 40.58578872680664, 42.560218811035156, 44.53464889526367, 46.50907897949219, 48.4835090637207, 50.45793914794922, 52.432369232177734, 54.40679931640625, 56.38123321533203, 58.35566329956055, 60.33009338378906]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 8.0, 5.0, 9.0, 9.0, 8.0, 10.0, 9.0, 8.0, 7.0, 13.0, 12.0, 20.0, 18.0, 20.0, 21.0, 31.0, 36.0, 33.0, 28.0, 25.0, 38.0, 31.0, 34.0, 46.0, 39.0, 42.0, 38.0, 29.0, 25.0, 16.0, 25.0, 27.0, 35.0, 41.0, 30.0, 19.0, 22.0, 19.0, 22.0, 22.0, 9.0, 14.0, 10.0, 9.0, 7.0, 6.0, 7.0, 7.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-39.33945846557617, -38.082916259765625, -36.826377868652344, -35.56983947753906, -34.313297271728516, -33.05675506591797, -31.800216674804688, -30.543676376342773, -29.28713607788086, -28.030595779418945, -26.77405548095703, -25.517515182495117, -24.260974884033203, -23.00443458557129, -21.747894287109375, -20.49135398864746, -19.234813690185547, -17.978273391723633, -16.72173309326172, -15.465192794799805, -14.20865249633789, -12.952112197875977, -11.695571899414062, -10.439031600952148, -9.182491302490234, -7.92595100402832, -6.669410705566406, -5.412870407104492, -4.156330108642578, -2.899789810180664, -1.64324951171875, -0.38670921325683594, 0.8698272705078125, 2.1263675689697266, 3.3829078674316406, 4.639448165893555, 5.895988464355469, 7.152528762817383, 8.409069061279297, 9.665609359741211, 10.922149658203125, 12.178689956665039, 13.435230255126953, 14.691770553588867, 15.948310852050781, 17.204851150512695, 18.46139144897461, 19.717931747436523, 20.974472045898438, 22.23101234436035, 23.487552642822266, 24.74409294128418, 26.000633239746094, 27.257173538208008, 28.513713836669922, 29.770254135131836, 31.02679443359375, 32.28333282470703, 33.53987503051758, 34.796417236328125, 36.052955627441406, 37.30949401855469, 38.566036224365234, 39.82257843017578, 41.07911682128906]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 11.0, 6.0, 5.0, 11.0, 15.0, 21.0, 21.0, 20.0, 26.0, 27.0, 39.0, 41.0, 41.0, 43.0, 54.0, 44.0, 59.0, 47.0, 50.0, 39.0, 44.0, 47.0, 45.0, 44.0, 33.0, 31.0, 20.0, 24.0, 20.0, 19.0, 10.0, 9.0, 7.0, 8.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6328125, -6.37109375, -6.109375, -5.84765625, -5.5859375, -5.32421875, -5.0625, -4.80078125, -4.5390625, -4.27734375, -4.015625, -3.75390625, -3.4921875, -3.23046875, -2.96875, -2.70703125, -2.4453125, -2.18359375, -1.921875, -1.66015625, -1.3984375, -1.13671875, -0.875, -0.61328125, -0.3515625, -0.08984375, 0.171875, 0.43359375, 0.6953125, 0.95703125, 1.21875, 1.48046875, 1.7421875, 2.00390625, 2.265625, 2.52734375, 2.7890625, 3.05078125, 3.3125, 3.57421875, 3.8359375, 4.09765625, 4.359375, 4.62109375, 4.8828125, 5.14453125, 5.40625, 5.66796875, 5.9296875, 6.19140625, 6.453125, 6.71484375, 6.9765625, 7.23828125, 7.5, 7.76171875, 8.0234375, 8.28515625, 8.546875, 8.80859375, 9.0703125, 9.33203125, 9.59375, 9.85546875, 10.1171875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 18.0, 36.0, 41.0, 92.0, 95.0, 161.0, 267.0, 443.0, 813.0, 1446.0, 2558.0, 4630.0, 8583.0, 16124.0, 31410.0, 65409.0, 148380.0, 426796.0, 185173.0, 78306.0, 37014.0, 18702.0, 9948.0, 5301.0, 2928.0, 1647.0, 871.0, 503.0, 325.0, 172.0, 130.0, 78.0, 49.0, 34.0, 23.0, 14.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.697265625, -2.609161376953125, -2.52105712890625, -2.432952880859375, -2.3448486328125, -2.256744384765625, -2.16864013671875, -2.080535888671875, -1.992431640625, -1.904327392578125, -1.81622314453125, -1.728118896484375, -1.6400146484375, -1.551910400390625, -1.46380615234375, -1.375701904296875, -1.28759765625, -1.199493408203125, -1.11138916015625, -1.023284912109375, -0.9351806640625, -0.847076416015625, -0.75897216796875, -0.670867919921875, -0.582763671875, -0.494659423828125, -0.40655517578125, -0.318450927734375, -0.2303466796875, -0.142242431640625, -0.05413818359375, 0.033966064453125, 0.1220703125, 0.210174560546875, 0.29827880859375, 0.386383056640625, 0.4744873046875, 0.562591552734375, 0.65069580078125, 0.738800048828125, 0.826904296875, 0.915008544921875, 1.00311279296875, 1.091217041015625, 1.1793212890625, 1.267425537109375, 1.35552978515625, 1.443634033203125, 1.53173828125, 1.619842529296875, 1.70794677734375, 1.796051025390625, 1.8841552734375, 1.972259521484375, 2.06036376953125, 2.148468017578125, 2.236572265625, 2.324676513671875, 2.41278076171875, 2.500885009765625, 2.5889892578125, 2.677093505859375, 2.76519775390625, 2.853302001953125, 2.94140625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 7.0, 11.0, 13.0, 15.0, 12.0, 20.0, 24.0, 22.0, 27.0, 24.0, 25.0, 26.0, 37.0, 40.0, 39.0, 38.0, 41.0, 34.0, 1079.0, 42.0, 46.0, 34.0, 42.0, 46.0, 31.0, 32.0, 26.0, 33.0, 19.0, 26.0, 18.0, 16.0, 9.0, 8.0, 12.0, 8.0, 15.0, 9.0, 2.0, 1.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.966796875, -3.826629638671875, -3.68646240234375, -3.546295166015625, -3.4061279296875, -3.265960693359375, -3.12579345703125, -2.985626220703125, -2.845458984375, -2.705291748046875, -2.56512451171875, -2.424957275390625, -2.2847900390625, -2.144622802734375, -2.00445556640625, -1.864288330078125, -1.72412109375, -1.583953857421875, -1.44378662109375, -1.303619384765625, -1.1634521484375, -1.023284912109375, -0.88311767578125, -0.742950439453125, -0.602783203125, -0.462615966796875, -0.32244873046875, -0.182281494140625, -0.0421142578125, 0.098052978515625, 0.23822021484375, 0.378387451171875, 0.5185546875, 0.658721923828125, 0.79888916015625, 0.939056396484375, 1.0792236328125, 1.219390869140625, 1.35955810546875, 1.499725341796875, 1.639892578125, 1.780059814453125, 1.92022705078125, 2.060394287109375, 2.2005615234375, 2.340728759765625, 2.48089599609375, 2.621063232421875, 2.76123046875, 2.901397705078125, 3.04156494140625, 3.181732177734375, 3.3218994140625, 3.462066650390625, 3.60223388671875, 3.742401123046875, 3.882568359375, 4.022735595703125, 4.16290283203125, 4.303070068359375, 4.4432373046875, 4.583404541015625, 4.72357177734375, 4.863739013671875, 5.00390625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 9.0, 7.0, 16.0, 25.0, 27.0, 59.0, 80.0, 157.0, 222.0, 416.0, 600.0, 905.0, 1527.0, 2180.0, 3336.0, 5120.0, 7737.0, 11976.0, 18751.0, 29540.0, 47611.0, 77303.0, 138774.0, 1379584.0, 151318.0, 82488.0, 50188.0, 31015.0, 19831.0, 12803.0, 8215.0, 5198.0, 3495.0, 2446.0, 1484.0, 1051.0, 609.0, 384.0, 262.0, 128.0, 89.0, 77.0, 37.0, 12.0, 18.0, 12.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.708984375, -1.6530609130859375, -1.597137451171875, -1.5412139892578125, -1.48529052734375, -1.4293670654296875, -1.373443603515625, -1.3175201416015625, -1.2615966796875, -1.2056732177734375, -1.149749755859375, -1.0938262939453125, -1.03790283203125, -0.9819793701171875, -0.926055908203125, -0.8701324462890625, -0.814208984375, -0.7582855224609375, -0.702362060546875, -0.6464385986328125, -0.59051513671875, -0.5345916748046875, -0.478668212890625, -0.4227447509765625, -0.3668212890625, -0.3108978271484375, -0.254974365234375, -0.1990509033203125, -0.14312744140625, -0.0872039794921875, -0.031280517578125, 0.0246429443359375, 0.08056640625, 0.1364898681640625, 0.192413330078125, 0.2483367919921875, 0.30426025390625, 0.3601837158203125, 0.416107177734375, 0.4720306396484375, 0.5279541015625, 0.5838775634765625, 0.639801025390625, 0.6957244873046875, 0.75164794921875, 0.8075714111328125, 0.863494873046875, 0.9194183349609375, 0.975341796875, 1.0312652587890625, 1.087188720703125, 1.1431121826171875, 1.19903564453125, 1.2549591064453125, 1.310882568359375, 1.3668060302734375, 1.4227294921875, 1.4786529541015625, 1.534576416015625, 1.5904998779296875, 1.64642333984375, 1.7023468017578125, 1.758270263671875, 1.8141937255859375, 1.8701171875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 15.0, 14.0, 18.0, 19.0, 31.0, 43.0, 48.0, 67.0, 81.0, 68.0, 82.0, 88.0, 72.0, 64.0, 45.0, 54.0, 38.0, 22.0, 24.0, 13.0, 16.0, 18.0, 11.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029158592224121094, -0.0002821795642375946, -0.00027277320623397827, -0.00026336684823036194, -0.0002539604902267456, -0.00024455413222312927, -0.00023514777421951294, -0.0002257414162158966, -0.00021633505821228027, -0.00020692870020866394, -0.0001975223422050476, -0.00018811598420143127, -0.00017870962619781494, -0.0001693032681941986, -0.00015989691019058228, -0.00015049055218696594, -0.0001410841941833496, -0.00013167783617973328, -0.00012227147817611694, -0.00011286512017250061, -0.00010345876216888428, -9.405240416526794e-05, -8.464604616165161e-05, -7.523968815803528e-05, -6.583333015441895e-05, -5.642697215080261e-05, -4.702061414718628e-05, -3.7614256143569946e-05, -2.8207898139953613e-05, -1.880154013633728e-05, -9.395182132720947e-06, 1.1175870895385742e-08, 9.417533874511719e-06, 1.8823891878128052e-05, 2.8230249881744385e-05, 3.763660788536072e-05, 4.704296588897705e-05, 5.6449323892593384e-05, 6.585568189620972e-05, 7.526203989982605e-05, 8.466839790344238e-05, 9.407475590705872e-05, 0.00010348111391067505, 0.00011288747191429138, 0.00012229382991790771, 0.00013170018792152405, 0.00014110654592514038, 0.00015051290392875671, 0.00015991926193237305, 0.00016932561993598938, 0.0001787319779396057, 0.00018813833594322205, 0.00019754469394683838, 0.0002069510519504547, 0.00021635740995407104, 0.00022576376795768738, 0.0002351701259613037, 0.00024457648396492004, 0.0002539828419685364, 0.0002633891999721527, 0.00027279555797576904, 0.0002822019159793854, 0.0002916082739830017, 0.00030101463198661804, 0.0003104209899902344]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 6.0, 4.0, 8.0, 11.0, 14.0, 13.0, 23.0, 35.0, 30.0, 31.0, 70.0, 124.0, 163.0, 340.0, 1171.0, 827658.0, 217117.0, 867.0, 324.0, 165.0, 111.0, 74.0, 43.0, 46.0, 21.0, 17.0, 13.0, 13.0, 9.0, 9.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.006740570068359375, -0.006535768508911133, -0.006330966949462891, -0.0061261653900146484, -0.005921363830566406, -0.005716562271118164, -0.005511760711669922, -0.00530695915222168, -0.0051021575927734375, -0.004897356033325195, -0.004692554473876953, -0.004487752914428711, -0.004282951354980469, -0.0040781497955322266, -0.0038733482360839844, -0.003668546676635742, -0.0034637451171875, -0.003258943557739258, -0.0030541419982910156, -0.0028493404388427734, -0.0026445388793945312, -0.002439737319946289, -0.002234935760498047, -0.0020301342010498047, -0.0018253326416015625, -0.0016205310821533203, -0.0014157295227050781, -0.001210927963256836, -0.0010061264038085938, -0.0008013248443603516, -0.0005965232849121094, -0.0003917217254638672, -0.000186920166015625, 1.7881393432617188e-05, 0.00022268295288085938, 0.00042748451232910156, 0.0006322860717773438, 0.0008370876312255859, 0.0010418891906738281, 0.0012466907501220703, 0.0014514923095703125, 0.0016562938690185547, 0.0018610954284667969, 0.002065896987915039, 0.0022706985473632812, 0.0024755001068115234, 0.0026803016662597656, 0.002885103225708008, 0.00308990478515625, 0.003294706344604492, 0.0034995079040527344, 0.0037043094635009766, 0.003909111022949219, 0.004113912582397461, 0.004318714141845703, 0.004523515701293945, 0.0047283172607421875, 0.00493311882019043, 0.005137920379638672, 0.005342721939086914, 0.005547523498535156, 0.0057523250579833984, 0.005957126617431641, 0.006161928176879883, 0.006366729736328125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 6.0, 17.0, 23.0, 45.0, 86.0, 100.0, 129.0, 145.0, 139.0, 114.0, 94.0, 35.0, 33.0, 17.0, 10.0, 3.0, 5.0, 3.0, 1.0], "bins": [-0.000325835746480152, -0.00031961838249117136, -0.0003134010185021907, -0.00030718365451321006, -0.0003009662905242294, -0.00029474892653524876, -0.0002885315625462681, -0.00028231419855728745, -0.00027609680546447635, -0.0002698794414754957, -0.00026366207748651505, -0.0002574447134975344, -0.00025122734950855374, -0.0002450099855195731, -0.0002387926069786772, -0.00023257524298969656, -0.00022635789355263114, -0.0002201405295636505, -0.00021392316557466984, -0.0002077058015856892, -0.00020148843759670854, -0.00019527107360772789, -0.000189053695066832, -0.00018283633107785136, -0.0001766189670888707, -0.00017040160309989005, -0.0001641842391109094, -0.00015796687512192875, -0.00015174949658103287, -0.00014553213259205222, -0.00013931476860307157, -0.00013309740461409092, -0.00012688004062511027, -0.00012066267663612962, -0.00011444531264714897, -0.0001082279413822107, -0.00010201057739323005, -9.57932134042494e-05, -8.957584213931113e-05, -8.335847815033048e-05, -7.714110688539222e-05, -7.092374289641157e-05, -6.47063716314733e-05, -5.848900764249265e-05, -5.2271643653512e-05, -4.605427966453135e-05, -3.983691203757189e-05, -3.3619544410612434e-05, -2.7402180421631783e-05, -2.118481461366173e-05, -1.4967448805691674e-05, -8.75008299772162e-06, -2.5327171897515655e-06, 3.6846467992290854e-06, 9.902014426188543e-06, 1.6119382053148e-05, 2.2336746042128652e-05, 2.8554111850098707e-05, 3.477147765806876e-05, 4.098884528502822e-05, 4.720620927400887e-05, 5.342357326298952e-05, 5.964094088994898e-05, 6.585830851690844e-05, 7.207567250588909e-05]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 6.0, 7.0, 3.0, 12.0, 18.0, 17.0, 30.0, 29.0, 30.0, 36.0, 38.0, 44.0, 54.0, 49.0, 52.0, 52.0, 46.0, 36.0, 44.0, 46.0, 50.0, 42.0, 35.0, 36.0, 36.0, 25.0, 36.0, 24.0, 17.0, 10.0, 9.0, 11.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001621246337890625, -0.00015720073133707047, -0.00015227682888507843, -0.0001473529264330864, -0.00014242902398109436, -0.00013750512152910233, -0.0001325812190771103, -0.00012765731662511826, -0.00012273341417312622, -0.00011780951172113419, -0.00011288560926914215, -0.00010796170681715012, -0.00010303780436515808, -9.811390191316605e-05, -9.318999946117401e-05, -8.826609700918198e-05, -8.334219455718994e-05, -7.84182921051979e-05, -7.349438965320587e-05, -6.857048720121384e-05, -6.36465847492218e-05, -5.872268229722977e-05, -5.379877984523773e-05, -4.88748773932457e-05, -4.395097494125366e-05, -3.902707248926163e-05, -3.410317003726959e-05, -2.9179267585277557e-05, -2.4255365133285522e-05, -1.9331462681293488e-05, -1.4407560229301453e-05, -9.483657777309418e-06, -4.559755325317383e-06, 3.641471266746521e-07, 5.288049578666687e-06, 1.0211952030658722e-05, 1.5135854482650757e-05, 2.0059756934642792e-05, 2.4983659386634827e-05, 2.990756183862686e-05, 3.4831464290618896e-05, 3.975536674261093e-05, 4.4679269194602966e-05, 4.9603171646595e-05, 5.4527074098587036e-05, 5.945097655057907e-05, 6.43748790025711e-05, 6.929878145456314e-05, 7.422268390655518e-05, 7.914658635854721e-05, 8.407048881053925e-05, 8.899439126253128e-05, 9.391829371452332e-05, 9.884219616651535e-05, 0.00010376609861850739, 0.00010869000107049942, 0.00011361390352249146, 0.00011853780597448349, 0.00012346170842647552, 0.00012838561087846756, 0.0001333095133304596, 0.00013823341578245163, 0.00014315731823444366, 0.0001480812206864357, 0.00015300512313842773]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 11.0, 6.0, 5.0, 11.0, 15.0, 21.0, 21.0, 20.0, 26.0, 27.0, 39.0, 41.0, 41.0, 43.0, 54.0, 44.0, 59.0, 47.0, 50.0, 39.0, 44.0, 47.0, 45.0, 44.0, 33.0, 31.0, 20.0, 24.0, 20.0, 19.0, 10.0, 9.0, 7.0, 8.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6328125, -6.37109375, -6.109375, -5.84765625, -5.5859375, -5.32421875, -5.0625, -4.80078125, -4.5390625, -4.27734375, -4.015625, -3.75390625, -3.4921875, -3.23046875, -2.96875, -2.70703125, -2.4453125, -2.18359375, -1.921875, -1.66015625, -1.3984375, -1.13671875, -0.875, -0.61328125, -0.3515625, -0.08984375, 0.171875, 0.43359375, 0.6953125, 0.95703125, 1.21875, 1.48046875, 1.7421875, 2.00390625, 2.265625, 2.52734375, 2.7890625, 3.05078125, 3.3125, 3.57421875, 3.8359375, 4.09765625, 4.359375, 4.62109375, 4.8828125, 5.14453125, 5.40625, 5.66796875, 5.9296875, 6.19140625, 6.453125, 6.71484375, 6.9765625, 7.23828125, 7.5, 7.76171875, 8.0234375, 8.28515625, 8.546875, 8.80859375, 9.0703125, 9.33203125, 9.59375, 9.85546875, 10.1171875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 9.0, 14.0, 17.0, 22.0, 31.0, 42.0, 71.0, 86.0, 137.0, 261.0, 464.0, 1087.0, 2792.0, 8487.0, 28329.0, 102235.0, 371733.0, 383004.0, 106724.0, 29038.0, 8677.0, 2903.0, 1118.0, 512.0, 285.0, 152.0, 116.0, 84.0, 41.0, 23.0, 18.0, 18.0, 12.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.9215087890625, -8.624267578125, -8.3270263671875, -8.02978515625, -7.7325439453125, -7.435302734375, -7.1380615234375, -6.8408203125, -6.5435791015625, -6.246337890625, -5.9490966796875, -5.65185546875, -5.3546142578125, -5.057373046875, -4.7601318359375, -4.462890625, -4.1656494140625, -3.868408203125, -3.5711669921875, -3.27392578125, -2.9766845703125, -2.679443359375, -2.3822021484375, -2.0849609375, -1.7877197265625, -1.490478515625, -1.1932373046875, -0.89599609375, -0.5987548828125, -0.301513671875, -0.0042724609375, 0.29296875, 0.5902099609375, 0.887451171875, 1.1846923828125, 1.48193359375, 1.7791748046875, 2.076416015625, 2.3736572265625, 2.6708984375, 2.9681396484375, 3.265380859375, 3.5626220703125, 3.85986328125, 4.1571044921875, 4.454345703125, 4.7515869140625, 5.048828125, 5.3460693359375, 5.643310546875, 5.9405517578125, 6.23779296875, 6.5350341796875, 6.832275390625, 7.1295166015625, 7.4267578125, 7.7239990234375, 8.021240234375, 8.3184814453125, 8.61572265625, 8.9129638671875, 9.210205078125, 9.5074462890625, 9.8046875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 7.0, 5.0, 7.0, 8.0, 14.0, 18.0, 12.0, 19.0, 23.0, 19.0, 26.0, 36.0, 36.0, 40.0, 41.0, 52.0, 47.0, 70.0, 167.0, 1398.0, 376.0, 128.0, 67.0, 53.0, 42.0, 45.0, 37.0, 42.0, 23.0, 33.0, 20.0, 14.0, 27.0, 20.0, 18.0, 17.0, 11.0, 5.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.0, -20.274658203125, -19.54931640625, -18.823974609375, -18.0986328125, -17.373291015625, -16.64794921875, -15.922607421875, -15.197265625, -14.471923828125, -13.74658203125, -13.021240234375, -12.2958984375, -11.570556640625, -10.84521484375, -10.119873046875, -9.39453125, -8.669189453125, -7.94384765625, -7.218505859375, -6.4931640625, -5.767822265625, -5.04248046875, -4.317138671875, -3.591796875, -2.866455078125, -2.14111328125, -1.415771484375, -0.6904296875, 0.034912109375, 0.76025390625, 1.485595703125, 2.2109375, 2.936279296875, 3.66162109375, 4.386962890625, 5.1123046875, 5.837646484375, 6.56298828125, 7.288330078125, 8.013671875, 8.739013671875, 9.46435546875, 10.189697265625, 10.9150390625, 11.640380859375, 12.36572265625, 13.091064453125, 13.81640625, 14.541748046875, 15.26708984375, 15.992431640625, 16.7177734375, 17.443115234375, 18.16845703125, 18.893798828125, 19.619140625, 20.344482421875, 21.06982421875, 21.795166015625, 22.5205078125, 23.245849609375, 23.97119140625, 24.696533203125, 25.421875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 8.0, 11.0, 9.0, 16.0, 30.0, 26.0, 54.0, 75.0, 128.0, 172.0, 361.0, 1083.0, 48175.0, 3092435.0, 2039.0, 471.0, 219.0, 131.0, 85.0, 57.0, 40.0, 26.0, 19.0, 10.0, 7.0, 6.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.5, -143.18359375, -138.8671875, -134.55078125, -130.234375, -125.91796875, -121.6015625, -117.28515625, -112.96875, -108.65234375, -104.3359375, -100.01953125, -95.703125, -91.38671875, -87.0703125, -82.75390625, -78.4375, -74.12109375, -69.8046875, -65.48828125, -61.171875, -56.85546875, -52.5390625, -48.22265625, -43.90625, -39.58984375, -35.2734375, -30.95703125, -26.640625, -22.32421875, -18.0078125, -13.69140625, -9.375, -5.05859375, -0.7421875, 3.57421875, 7.890625, 12.20703125, 16.5234375, 20.83984375, 25.15625, 29.47265625, 33.7890625, 38.10546875, 42.421875, 46.73828125, 51.0546875, 55.37109375, 59.6875, 64.00390625, 68.3203125, 72.63671875, 76.953125, 81.26953125, 85.5859375, 89.90234375, 94.21875, 98.53515625, 102.8515625, 107.16796875, 111.484375, 115.80078125, 120.1171875, 124.43359375, 128.75]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 26.0, 99.0, 246.0, 376.0, 201.0, 56.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-121.8890609741211, -119.25873565673828, -116.62841033935547, -113.99809265136719, -111.36776733398438, -108.73744201660156, -106.10711669921875, -103.47679138183594, -100.84647369384766, -98.21614837646484, -95.58582305908203, -92.95550537109375, -90.32518005371094, -87.69485473632812, -85.06452941894531, -82.4342041015625, -79.80387878417969, -77.17355346679688, -74.54322814941406, -71.91291046142578, -69.28258514404297, -66.65225982666016, -64.02193450927734, -61.3916130065918, -58.76129150390625, -56.13096618652344, -53.50064468383789, -50.87031936645508, -48.23999786376953, -45.60967254638672, -42.979347229003906, -40.34902572631836, -37.71870803833008, -35.088382720947266, -32.45806121826172, -29.827735900878906, -27.19741439819336, -24.567089080810547, -21.936765670776367, -19.306442260742188, -16.676118850708008, -14.045795440673828, -11.415472030639648, -8.785147666931152, -6.154824256896973, -3.524500846862793, -0.8941764831542969, 1.7361469268798828, 4.3664703369140625, 6.996793746948242, 9.627117156982422, 12.257441520690918, 14.887764930725098, 17.518089294433594, 20.148412704467773, 22.778736114501953, 25.409059524536133, 28.039382934570312, 30.669706344604492, 33.30002975463867, 35.930355072021484, 38.56067657470703, 41.191001892089844, 43.821327209472656, 46.4516487121582]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 10.0, 7.0, 12.0, 16.0, 24.0, 24.0, 15.0, 34.0, 31.0, 31.0, 30.0, 43.0, 39.0, 46.0, 38.0, 44.0, 41.0, 41.0, 54.0, 43.0, 44.0, 42.0, 39.0, 29.0, 25.0, 29.0, 25.0, 24.0, 20.0, 12.0, 17.0, 19.0, 10.0, 6.0, 11.0, 7.0, 4.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.51719284057617, -48.575565338134766, -46.63393783569336, -44.69231033325195, -42.75068283081055, -40.80905532836914, -38.867431640625, -36.925804138183594, -34.98417663574219, -33.04254913330078, -31.100921630859375, -29.15929412841797, -27.217666625976562, -25.276039123535156, -23.334413528442383, -21.392786026000977, -19.451156616210938, -17.50952911376953, -15.567901611328125, -13.626275062561035, -11.684647560119629, -9.743020057678223, -7.801393508911133, -5.859766006469727, -3.9181385040283203, -1.9765112400054932, -0.034883975982666016, 1.906743049621582, 3.8483705520629883, 5.7899980545043945, 7.731624603271484, 9.67325210571289, 11.614875793457031, 13.556503295898438, 15.498130798339844, 17.43975830078125, 19.381385803222656, 21.323013305664062, 23.264638900756836, 25.206266403198242, 27.14789390563965, 29.089521408081055, 31.03114891052246, 32.972774505615234, 34.91440200805664, 36.85602951049805, 38.79765701293945, 40.73928451538086, 42.680912017822266, 44.62253952026367, 46.56416702270508, 48.505794525146484, 50.44742202758789, 52.3890495300293, 54.33067321777344, 56.272300720214844, 58.21392822265625, 60.155555725097656, 62.09718322753906, 64.03881072998047, 65.98043823242188, 67.92206573486328, 69.86369323730469, 71.8053207397461, 73.7469482421875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 11.0, 13.0, 14.0, 13.0, 19.0, 17.0, 30.0, 38.0, 32.0, 37.0, 29.0, 42.0, 54.0, 52.0, 47.0, 46.0, 55.0, 50.0, 50.0, 44.0, 41.0, 42.0, 39.0, 26.0, 36.0, 24.0, 17.0, 17.0, 12.0, 11.0, 11.0, 6.0, 3.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4609375, -7.1712646484375, -6.881591796875, -6.5919189453125, -6.30224609375, -6.0125732421875, -5.722900390625, -5.4332275390625, -5.1435546875, -4.8538818359375, -4.564208984375, -4.2745361328125, -3.98486328125, -3.6951904296875, -3.405517578125, -3.1158447265625, -2.826171875, -2.5364990234375, -2.246826171875, -1.9571533203125, -1.66748046875, -1.3778076171875, -1.088134765625, -0.7984619140625, -0.5087890625, -0.2191162109375, 0.070556640625, 0.3602294921875, 0.64990234375, 0.9395751953125, 1.229248046875, 1.5189208984375, 1.80859375, 2.0982666015625, 2.387939453125, 2.6776123046875, 2.96728515625, 3.2569580078125, 3.546630859375, 3.8363037109375, 4.1259765625, 4.4156494140625, 4.705322265625, 4.9949951171875, 5.28466796875, 5.5743408203125, 5.864013671875, 6.1536865234375, 6.443359375, 6.7330322265625, 7.022705078125, 7.3123779296875, 7.60205078125, 7.8917236328125, 8.181396484375, 8.4710693359375, 8.7607421875, 9.0504150390625, 9.340087890625, 9.6297607421875, 9.91943359375, 10.2091064453125, 10.498779296875, 10.7884521484375, 11.078125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 11.0, 8.0, 8.0, 23.0, 20.0, 14.0, 21.0, 41.0, 54.0, 54.0, 60.0, 71.0, 109.0, 149.0, 248.0, 562.0, 2204.0, 27710.0, 835945.0, 2926504.0, 385733.0, 12053.0, 1418.0, 455.0, 200.0, 143.0, 91.0, 87.0, 47.0, 59.0, 39.0, 31.0, 19.0, 22.0, 13.0, 17.0, 17.0, 5.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.4375, -16.7763671875, -16.115234375, -15.4541015625, -14.79296875, -14.1318359375, -13.470703125, -12.8095703125, -12.1484375, -11.4873046875, -10.826171875, -10.1650390625, -9.50390625, -8.8427734375, -8.181640625, -7.5205078125, -6.859375, -6.1982421875, -5.537109375, -4.8759765625, -4.21484375, -3.5537109375, -2.892578125, -2.2314453125, -1.5703125, -0.9091796875, -0.248046875, 0.4130859375, 1.07421875, 1.7353515625, 2.396484375, 3.0576171875, 3.71875, 4.3798828125, 5.041015625, 5.7021484375, 6.36328125, 7.0244140625, 7.685546875, 8.3466796875, 9.0078125, 9.6689453125, 10.330078125, 10.9912109375, 11.65234375, 12.3134765625, 12.974609375, 13.6357421875, 14.296875, 14.9580078125, 15.619140625, 16.2802734375, 16.94140625, 17.6025390625, 18.263671875, 18.9248046875, 19.5859375, 20.2470703125, 20.908203125, 21.5693359375, 22.23046875, 22.8916015625, 23.552734375, 24.2138671875, 24.875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 7.0, 10.0, 12.0, 19.0, 24.0, 22.0, 39.0, 67.0, 79.0, 128.0, 174.0, 232.0, 295.0, 396.0, 425.0, 463.0, 448.0, 314.0, 268.0, 177.0, 138.0, 89.0, 52.0, 56.0, 41.0, 25.0, 18.0, 16.0, 12.0, 7.0, 4.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9765625, -12.5001220703125, -12.023681640625, -11.5472412109375, -11.07080078125, -10.5943603515625, -10.117919921875, -9.6414794921875, -9.1650390625, -8.6885986328125, -8.212158203125, -7.7357177734375, -7.25927734375, -6.7828369140625, -6.306396484375, -5.8299560546875, -5.353515625, -4.8770751953125, -4.400634765625, -3.9241943359375, -3.44775390625, -2.9713134765625, -2.494873046875, -2.0184326171875, -1.5419921875, -1.0655517578125, -0.589111328125, -0.1126708984375, 0.36376953125, 0.8402099609375, 1.316650390625, 1.7930908203125, 2.26953125, 2.7459716796875, 3.222412109375, 3.6988525390625, 4.17529296875, 4.6517333984375, 5.128173828125, 5.6046142578125, 6.0810546875, 6.5574951171875, 7.033935546875, 7.5103759765625, 7.98681640625, 8.4632568359375, 8.939697265625, 9.4161376953125, 9.892578125, 10.3690185546875, 10.845458984375, 11.3218994140625, 11.79833984375, 12.2747802734375, 12.751220703125, 13.2276611328125, 13.7041015625, 14.1805419921875, 14.656982421875, 15.1334228515625, 15.60986328125, 16.0863037109375, 16.562744140625, 17.0391845703125, 17.515625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 4.0, 5.0, 3.0, 10.0, 13.0, 12.0, 28.0, 28.0, 62.0, 67.0, 65.0, 118.0, 190.0, 228.0, 339.0, 498.0, 2396.0, 2007353.0, 2178535.0, 2552.0, 522.0, 348.0, 249.0, 200.0, 145.0, 104.0, 67.0, 38.0, 29.0, 21.0, 17.0, 15.0, 13.0, 1.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-82.0, -79.7841796875, -77.568359375, -75.3525390625, -73.13671875, -70.9208984375, -68.705078125, -66.4892578125, -64.2734375, -62.0576171875, -59.841796875, -57.6259765625, -55.41015625, -53.1943359375, -50.978515625, -48.7626953125, -46.546875, -44.3310546875, -42.115234375, -39.8994140625, -37.68359375, -35.4677734375, -33.251953125, -31.0361328125, -28.8203125, -26.6044921875, -24.388671875, -22.1728515625, -19.95703125, -17.7412109375, -15.525390625, -13.3095703125, -11.09375, -8.8779296875, -6.662109375, -4.4462890625, -2.23046875, -0.0146484375, 2.201171875, 4.4169921875, 6.6328125, 8.8486328125, 11.064453125, 13.2802734375, 15.49609375, 17.7119140625, 19.927734375, 22.1435546875, 24.359375, 26.5751953125, 28.791015625, 31.0068359375, 33.22265625, 35.4384765625, 37.654296875, 39.8701171875, 42.0859375, 44.3017578125, 46.517578125, 48.7333984375, 50.94921875, 53.1650390625, 55.380859375, 57.5966796875, 59.8125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 34.0, 326.0, 496.0, 142.0, 17.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.7945556640625, -62.24710464477539, -53.69965362548828, -45.15220260620117, -36.60475158691406, -28.057300567626953, -19.509849548339844, -10.962398529052734, -2.414947509765625, 6.132503509521484, 14.679954528808594, 23.227405548095703, 31.774856567382812, 40.32230758666992, 48.86975860595703, 57.41720962524414, 65.96466064453125, 74.51211547851562, 83.05956268310547, 91.60700988769531, 100.15446472167969, 108.70191955566406, 117.2493667602539, 125.79681396484375, 134.34426879882812, 142.8917236328125, 151.43917846679688, 159.9866180419922, 168.53407287597656, 177.08152770996094, 185.62896728515625, 194.17642211914062, 202.723876953125, 211.27133178710938, 219.81878662109375, 228.36622619628906, 236.91368103027344, 245.4611358642578, 254.00857543945312, 262.5560302734375, 271.1034851074219, 279.65093994140625, 288.1983947753906, 296.745849609375, 305.29327392578125, 313.8407287597656, 322.38818359375, 330.9356384277344, 339.48309326171875, 348.0305480957031, 356.5780029296875, 365.1254577636719, 373.67291259765625, 382.2203369140625, 390.7677917480469, 399.31524658203125, 407.8627014160156, 416.41015625, 424.9576110839844, 433.50506591796875, 442.052490234375, 450.5999450683594, 459.14739990234375, 467.6948547363281, 476.2423095703125]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 2.0, 9.0, 1.0, 9.0, 6.0, 13.0, 11.0, 11.0, 12.0, 12.0, 26.0, 22.0, 20.0, 40.0, 33.0, 31.0, 30.0, 32.0, 35.0, 42.0, 45.0, 35.0, 34.0, 37.0, 32.0, 51.0, 33.0, 39.0, 33.0, 32.0, 36.0, 24.0, 20.0, 18.0, 20.0, 15.0, 18.0, 18.0, 14.0, 9.0, 11.0, 6.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.30508041381836, -36.9688720703125, -35.63266372680664, -34.29645538330078, -32.96025085449219, -31.624040603637695, -30.28783416748047, -28.95162582397461, -27.61541748046875, -26.27920913696289, -24.94300079345703, -23.606794357299805, -22.270586013793945, -20.934377670288086, -19.59817123413086, -18.261962890625, -16.92575454711914, -15.589546203613281, -14.253338813781738, -12.917131423950195, -11.580923080444336, -10.244714736938477, -8.908507347106934, -7.572299957275391, -6.236091613769531, -4.89988374710083, -3.563675880432129, -2.2274680137634277, -0.8912601470947266, 0.4449477195739746, 1.7811555862426758, 3.1173629760742188, 4.4535675048828125, 5.789775371551514, 7.125983238220215, 8.462190628051758, 9.798398971557617, 11.134607315063477, 12.47081470489502, 13.807022094726562, 15.143230438232422, 16.47943878173828, 17.81564712524414, 19.151853561401367, 20.488061904907227, 21.824270248413086, 23.160476684570312, 24.496685028076172, 25.83289337158203, 27.16910171508789, 28.50531005859375, 29.841516494750977, 31.177724838256836, 32.51393127441406, 33.85013961791992, 35.18634796142578, 36.52255630493164, 37.8587646484375, 39.19497299194336, 40.53118133544922, 41.86738586425781, 43.20359420776367, 44.53980255126953, 45.87601089477539, 47.21221923828125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 9.0, 12.0, 20.0, 17.0, 16.0, 33.0, 31.0, 35.0, 30.0, 41.0, 51.0, 51.0, 28.0, 42.0, 47.0, 54.0, 41.0, 43.0, 45.0, 35.0, 40.0, 42.0, 27.0, 32.0, 26.0, 26.0, 20.0, 15.0, 17.0, 11.0, 12.0, 16.0, 4.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0703125, -6.8115234375, -6.552734375, -6.2939453125, -6.03515625, -5.7763671875, -5.517578125, -5.2587890625, -5.0, -4.7412109375, -4.482421875, -4.2236328125, -3.96484375, -3.7060546875, -3.447265625, -3.1884765625, -2.9296875, -2.6708984375, -2.412109375, -2.1533203125, -1.89453125, -1.6357421875, -1.376953125, -1.1181640625, -0.859375, -0.6005859375, -0.341796875, -0.0830078125, 0.17578125, 0.4345703125, 0.693359375, 0.9521484375, 1.2109375, 1.4697265625, 1.728515625, 1.9873046875, 2.24609375, 2.5048828125, 2.763671875, 3.0224609375, 3.28125, 3.5400390625, 3.798828125, 4.0576171875, 4.31640625, 4.5751953125, 4.833984375, 5.0927734375, 5.3515625, 5.6103515625, 5.869140625, 6.1279296875, 6.38671875, 6.6455078125, 6.904296875, 7.1630859375, 7.421875, 7.6806640625, 7.939453125, 8.1982421875, 8.45703125, 8.7158203125, 8.974609375, 9.2333984375, 9.4921875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 9.0, 12.0, 20.0, 33.0, 46.0, 83.0, 124.0, 174.0, 291.0, 476.0, 711.0, 1146.0, 1832.0, 2817.0, 4608.0, 7293.0, 11638.0, 19549.0, 32879.0, 58761.0, 108008.0, 244662.0, 290472.0, 113757.0, 61402.0, 34623.0, 20430.0, 12227.0, 7529.0, 4830.0, 2977.0, 1879.0, 1203.0, 743.0, 476.0, 285.0, 194.0, 117.0, 87.0, 52.0, 36.0, 18.0, 18.0, 12.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.2265625, -2.157073974609375, -2.08758544921875, -2.018096923828125, -1.9486083984375, -1.879119873046875, -1.80963134765625, -1.740142822265625, -1.670654296875, -1.601165771484375, -1.53167724609375, -1.462188720703125, -1.3927001953125, -1.323211669921875, -1.25372314453125, -1.184234619140625, -1.11474609375, -1.045257568359375, -0.97576904296875, -0.906280517578125, -0.8367919921875, -0.767303466796875, -0.69781494140625, -0.628326416015625, -0.558837890625, -0.489349365234375, -0.41986083984375, -0.350372314453125, -0.2808837890625, -0.211395263671875, -0.14190673828125, -0.072418212890625, -0.0029296875, 0.066558837890625, 0.13604736328125, 0.205535888671875, 0.2750244140625, 0.344512939453125, 0.41400146484375, 0.483489990234375, 0.552978515625, 0.622467041015625, 0.69195556640625, 0.761444091796875, 0.8309326171875, 0.900421142578125, 0.96990966796875, 1.039398193359375, 1.10888671875, 1.178375244140625, 1.24786376953125, 1.317352294921875, 1.3868408203125, 1.456329345703125, 1.52581787109375, 1.595306396484375, 1.664794921875, 1.734283447265625, 1.80377197265625, 1.873260498046875, 1.9427490234375, 2.012237548828125, 2.08172607421875, 2.151214599609375, 2.220703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 2.0, 9.0, 11.0, 13.0, 5.0, 12.0, 21.0, 18.0, 22.0, 15.0, 30.0, 35.0, 34.0, 36.0, 38.0, 41.0, 45.0, 33.0, 37.0, 1061.0, 47.0, 57.0, 36.0, 34.0, 35.0, 37.0, 26.0, 27.0, 20.0, 28.0, 21.0, 21.0, 22.0, 17.0, 12.0, 13.0, 13.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.9609375, -4.8148193359375, -4.668701171875, -4.5225830078125, -4.37646484375, -4.2303466796875, -4.084228515625, -3.9381103515625, -3.7919921875, -3.6458740234375, -3.499755859375, -3.3536376953125, -3.20751953125, -3.0614013671875, -2.915283203125, -2.7691650390625, -2.623046875, -2.4769287109375, -2.330810546875, -2.1846923828125, -2.03857421875, -1.8924560546875, -1.746337890625, -1.6002197265625, -1.4541015625, -1.3079833984375, -1.161865234375, -1.0157470703125, -0.86962890625, -0.7235107421875, -0.577392578125, -0.4312744140625, -0.28515625, -0.1390380859375, 0.007080078125, 0.1531982421875, 0.29931640625, 0.4454345703125, 0.591552734375, 0.7376708984375, 0.8837890625, 1.0299072265625, 1.176025390625, 1.3221435546875, 1.46826171875, 1.6143798828125, 1.760498046875, 1.9066162109375, 2.052734375, 2.1988525390625, 2.344970703125, 2.4910888671875, 2.63720703125, 2.7833251953125, 2.929443359375, 3.0755615234375, 3.2216796875, 3.3677978515625, 3.513916015625, 3.6600341796875, 3.80615234375, 3.9522705078125, 4.098388671875, 4.2445068359375, 4.390625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 9.0, 22.0, 19.0, 36.0, 57.0, 77.0, 138.0, 180.0, 288.0, 399.0, 613.0, 877.0, 1297.0, 1948.0, 2870.0, 4179.0, 6090.0, 9145.0, 13547.0, 20694.0, 32115.0, 49912.0, 79936.0, 141515.0, 1363189.0, 142566.0, 79845.0, 50286.0, 32228.0, 21033.0, 13778.0, 9074.0, 6162.0, 4256.0, 2791.0, 1905.0, 1307.0, 914.0, 591.0, 444.0, 267.0, 184.0, 103.0, 93.0, 50.0, 39.0, 20.0, 14.0, 16.0, 5.0, 5.0, 6.0, 0.0, 0.0, 3.0], "bins": [-1.8583984375, -1.8029327392578125, -1.747467041015625, -1.6920013427734375, -1.63653564453125, -1.5810699462890625, -1.525604248046875, -1.4701385498046875, -1.4146728515625, -1.3592071533203125, -1.303741455078125, -1.2482757568359375, -1.19281005859375, -1.1373443603515625, -1.081878662109375, -1.0264129638671875, -0.970947265625, -0.9154815673828125, -0.860015869140625, -0.8045501708984375, -0.74908447265625, -0.6936187744140625, -0.638153076171875, -0.5826873779296875, -0.5272216796875, -0.4717559814453125, -0.416290283203125, -0.3608245849609375, -0.30535888671875, -0.2498931884765625, -0.194427490234375, -0.1389617919921875, -0.08349609375, -0.0280303955078125, 0.027435302734375, 0.0829010009765625, 0.13836669921875, 0.1938323974609375, 0.249298095703125, 0.3047637939453125, 0.3602294921875, 0.4156951904296875, 0.471160888671875, 0.5266265869140625, 0.58209228515625, 0.6375579833984375, 0.693023681640625, 0.7484893798828125, 0.803955078125, 0.8594207763671875, 0.914886474609375, 0.9703521728515625, 1.02581787109375, 1.0812835693359375, 1.136749267578125, 1.1922149658203125, 1.2476806640625, 1.3031463623046875, 1.358612060546875, 1.4140777587890625, 1.46954345703125, 1.5250091552734375, 1.580474853515625, 1.6359405517578125, 1.69140625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 7.0, 4.0, 5.0, 6.0, 4.0, 5.0, 11.0, 21.0, 14.0, 26.0, 24.0, 30.0, 44.0, 52.0, 59.0, 82.0, 102.0, 127.0, 79.0, 64.0, 46.0, 27.0, 29.0, 26.0, 21.0, 20.0, 11.0, 10.0, 9.0, 7.0, 8.0, 8.0, 4.0, 4.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002951622009277344, -0.00028489530086517334, -0.0002746284008026123, -0.00026436150074005127, -0.00025409460067749023, -0.0002438277006149292, -0.00023356080055236816, -0.00022329390048980713, -0.0002130270004272461, -0.00020276010036468506, -0.00019249320030212402, -0.000182226300239563, -0.00017195940017700195, -0.00016169250011444092, -0.00015142560005187988, -0.00014115869998931885, -0.0001308917999267578, -0.00012062489986419678, -0.00011035799980163574, -0.00010009109973907471, -8.982419967651367e-05, -7.955729961395264e-05, -6.92903995513916e-05, -5.9023499488830566e-05, -4.875659942626953e-05, -3.8489699363708496e-05, -2.822279930114746e-05, -1.7955899238586426e-05, -7.68899917602539e-06, 2.5779008865356445e-06, 1.284480094909668e-05, 2.3111701011657715e-05, 3.337860107421875e-05, 4.3645501136779785e-05, 5.391240119934082e-05, 6.417930126190186e-05, 7.444620132446289e-05, 8.471310138702393e-05, 9.498000144958496e-05, 0.000105246901512146, 0.00011551380157470703, 0.00012578070163726807, 0.0001360476016998291, 0.00014631450176239014, 0.00015658140182495117, 0.0001668483018875122, 0.00017711520195007324, 0.00018738210201263428, 0.0001976490020751953, 0.00020791590213775635, 0.00021818280220031738, 0.00022844970226287842, 0.00023871660232543945, 0.0002489835023880005, 0.0002592504024505615, 0.00026951730251312256, 0.0002797842025756836, 0.00029005110263824463, 0.00030031800270080566, 0.0003105849027633667, 0.00032085180282592773, 0.00033111870288848877, 0.0003413856029510498, 0.00035165250301361084, 0.0003619194030761719]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 7.0, 7.0, 10.0, 8.0, 21.0, 20.0, 28.0, 33.0, 43.0, 59.0, 69.0, 161.0, 350.0, 955.0, 578551.0, 466556.0, 892.0, 312.0, 148.0, 81.0, 55.0, 41.0, 34.0, 17.0, 25.0, 13.0, 11.0, 8.0, 8.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00826263427734375, -0.008026480674743652, -0.007790327072143555, -0.007554173469543457, -0.007318019866943359, -0.007081866264343262, -0.006845712661743164, -0.006609559059143066, -0.006373405456542969, -0.006137251853942871, -0.0059010982513427734, -0.005664944648742676, -0.005428791046142578, -0.0051926374435424805, -0.004956483840942383, -0.004720330238342285, -0.0044841766357421875, -0.00424802303314209, -0.004011869430541992, -0.0037757158279418945, -0.003539562225341797, -0.0033034086227416992, -0.0030672550201416016, -0.002831101417541504, -0.0025949478149414062, -0.0023587942123413086, -0.002122640609741211, -0.0018864870071411133, -0.0016503334045410156, -0.001414179801940918, -0.0011780261993408203, -0.0009418725967407227, -0.000705718994140625, -0.00046956539154052734, -0.0002334117889404297, 2.7418136596679688e-06, 0.00023889541625976562, 0.0004750490188598633, 0.0007112026214599609, 0.0009473562240600586, 0.0011835098266601562, 0.001419663429260254, 0.0016558170318603516, 0.0018919706344604492, 0.002128124237060547, 0.0023642778396606445, 0.002600431442260742, 0.00283658504486084, 0.0030727386474609375, 0.003308892250061035, 0.003545045852661133, 0.0037811994552612305, 0.004017353057861328, 0.004253506660461426, 0.0044896602630615234, 0.004725813865661621, 0.004961967468261719, 0.005198121070861816, 0.005434274673461914, 0.005670428276062012, 0.005906581878662109, 0.006142735481262207, 0.006378889083862305, 0.006615042686462402, 0.0068511962890625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 28.0, 147.0, 270.0, 285.0, 193.0, 58.0, 18.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.0007903288933448493, -0.0007762444438412786, -0.0007621600525453687, -0.0007480756030417979, -0.0007339911535382271, -0.0007199067622423172, -0.0007058223127387464, -0.0006917378632351756, -0.0006776534719392657, -0.0006635690224356949, -0.000649484631139785, -0.0006354001816362143, -0.0006213157321326435, -0.0006072313408367336, -0.0005931468913331628, -0.000579062441829592, -0.0005649779923260212, -0.0005508935428224504, -0.0005368091515265405, -0.0005227247020229697, -0.0005086402525193989, -0.000494555861223489, -0.00048047141171991825, -0.00046638696221634746, -0.0004523025709204376, -0.00043821815052069724, -0.00042413370101712644, -0.0004100492806173861, -0.00039596486021764576, -0.00038188041071407497, -0.00036779599031433463, -0.00035371154081076384, -0.0003396271204110235, -0.00032554270001128316, -0.00031145825050771236, -0.000297373830107972, -0.0002832894097082317, -0.0002692049602046609, -0.00025512053980492055, -0.000241036104853265, -0.00022695166990160942, -0.00021286723494995385, -0.00019878281455021352, -0.00018469837959855795, -0.00017061394464690238, -0.00015652950969524682, -0.00014244508929550648, -0.0001283606543438509, -0.00011427622666815296, -0.000100191798992455, -8.610736404079944e-05, -7.202293636510149e-05, -5.793850505142473e-05, -4.385407373774797e-05, -2.9769646062050015e-05, -1.5685211110394448e-05, -1.6007834346964955e-06, 1.2483646969485562e-05, 2.656807737366762e-05, 4.0652506868354976e-05, 5.4736938182031736e-05, 6.88213694957085e-05, 8.290579717140645e-05, 9.699023212306201e-05, 0.00011107465979875997]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 4.0, 8.0, 6.0, 14.0, 10.0, 7.0, 13.0, 14.0, 13.0, 23.0, 26.0, 33.0, 38.0, 26.0, 26.0, 27.0, 35.0, 50.0, 36.0, 49.0, 45.0, 40.0, 37.0, 39.0, 45.0, 46.0, 34.0, 40.0, 34.0, 19.0, 32.0, 22.0, 14.0, 9.0, 20.0, 19.0, 8.0, 9.0, 8.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00013846158981323242, -0.0001339958980679512, -0.00012953020632266998, -0.00012506451457738876, -0.00012059882283210754, -0.00011613313108682632, -0.0001116674393415451, -0.00010720174759626389, -0.00010273605585098267, -9.827036410570145e-05, -9.380467236042023e-05, -8.933898061513901e-05, -8.487328886985779e-05, -8.040759712457657e-05, -7.594190537929535e-05, -7.147621363401413e-05, -6.701052188873291e-05, -6.254483014345169e-05, -5.807913839817047e-05, -5.361344665288925e-05, -4.914775490760803e-05, -4.468206316232681e-05, -4.021637141704559e-05, -3.5750679671764374e-05, -3.1284987926483154e-05, -2.6819296181201935e-05, -2.2353604435920715e-05, -1.7887912690639496e-05, -1.3422220945358276e-05, -8.956529200077057e-06, -4.490837454795837e-06, -2.514570951461792e-08, 4.4405460357666016e-06, 8.906237781047821e-06, 1.337192952632904e-05, 1.783762127161026e-05, 2.230331301689148e-05, 2.67690047621727e-05, 3.123469650745392e-05, 3.570038825273514e-05, 4.016607999801636e-05, 4.463177174329758e-05, 4.9097463488578796e-05, 5.3563155233860016e-05, 5.8028846979141235e-05, 6.249453872442245e-05, 6.696023046970367e-05, 7.14259222149849e-05, 7.589161396026611e-05, 8.035730570554733e-05, 8.482299745082855e-05, 8.928868919610977e-05, 9.375438094139099e-05, 9.822007268667221e-05, 0.00010268576443195343, 0.00010715145617723465, 0.00011161714792251587, 0.00011608283966779709, 0.00012054853141307831, 0.00012501422315835953, 0.00012947991490364075, 0.00013394560664892197, 0.00013841129839420319, 0.0001428769901394844, 0.00014734268188476562]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 9.0, 12.0, 20.0, 17.0, 16.0, 33.0, 31.0, 35.0, 30.0, 41.0, 51.0, 51.0, 28.0, 42.0, 47.0, 54.0, 41.0, 43.0, 45.0, 35.0, 40.0, 42.0, 27.0, 32.0, 26.0, 26.0, 20.0, 15.0, 17.0, 11.0, 12.0, 16.0, 4.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0703125, -6.8115234375, -6.552734375, -6.2939453125, -6.03515625, -5.7763671875, -5.517578125, -5.2587890625, -5.0, -4.7412109375, -4.482421875, -4.2236328125, -3.96484375, -3.7060546875, -3.447265625, -3.1884765625, -2.9296875, -2.6708984375, -2.412109375, -2.1533203125, -1.89453125, -1.6357421875, -1.376953125, -1.1181640625, -0.859375, -0.6005859375, -0.341796875, -0.0830078125, 0.17578125, 0.4345703125, 0.693359375, 0.9521484375, 1.2109375, 1.4697265625, 1.728515625, 1.9873046875, 2.24609375, 2.5048828125, 2.763671875, 3.0224609375, 3.28125, 3.5400390625, 3.798828125, 4.0576171875, 4.31640625, 4.5751953125, 4.833984375, 5.0927734375, 5.3515625, 5.6103515625, 5.869140625, 6.1279296875, 6.38671875, 6.6455078125, 6.904296875, 7.1630859375, 7.421875, 7.6806640625, 7.939453125, 8.1982421875, 8.45703125, 8.7158203125, 8.974609375, 9.2333984375, 9.4921875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 10.0, 10.0, 11.0, 16.0, 12.0, 31.0, 53.0, 75.0, 120.0, 163.0, 314.0, 613.0, 1456.0, 3007.0, 6642.0, 14506.0, 33811.0, 85046.0, 224446.0, 362643.0, 190775.0, 72246.0, 28897.0, 12684.0, 5690.0, 2683.0, 1286.0, 567.0, 307.0, 130.0, 108.0, 57.0, 29.0, 29.0, 23.0, 15.0, 10.0, 12.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.6602783203125, -6.433837890625, -6.2073974609375, -5.98095703125, -5.7545166015625, -5.528076171875, -5.3016357421875, -5.0751953125, -4.8487548828125, -4.622314453125, -4.3958740234375, -4.16943359375, -3.9429931640625, -3.716552734375, -3.4901123046875, -3.263671875, -3.0372314453125, -2.810791015625, -2.5843505859375, -2.35791015625, -2.1314697265625, -1.905029296875, -1.6785888671875, -1.4521484375, -1.2257080078125, -0.999267578125, -0.7728271484375, -0.54638671875, -0.3199462890625, -0.093505859375, 0.1329345703125, 0.359375, 0.5858154296875, 0.812255859375, 1.0386962890625, 1.26513671875, 1.4915771484375, 1.718017578125, 1.9444580078125, 2.1708984375, 2.3973388671875, 2.623779296875, 2.8502197265625, 3.07666015625, 3.3031005859375, 3.529541015625, 3.7559814453125, 3.982421875, 4.2088623046875, 4.435302734375, 4.6617431640625, 4.88818359375, 5.1146240234375, 5.341064453125, 5.5675048828125, 5.7939453125, 6.0203857421875, 6.246826171875, 6.4732666015625, 6.69970703125, 6.9261474609375, 7.152587890625, 7.3790283203125, 7.60546875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 9.0, 6.0, 6.0, 11.0, 12.0, 8.0, 12.0, 11.0, 10.0, 28.0, 23.0, 16.0, 32.0, 32.0, 42.0, 48.0, 57.0, 63.0, 133.0, 336.0, 1436.0, 222.0, 102.0, 57.0, 35.0, 49.0, 37.0, 34.0, 27.0, 20.0, 12.0, 21.0, 15.0, 19.0, 17.0, 12.0, 9.0, 5.0, 7.0, 7.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.8125, -28.942626953125, -28.07275390625, -27.202880859375, -26.3330078125, -25.463134765625, -24.59326171875, -23.723388671875, -22.853515625, -21.983642578125, -21.11376953125, -20.243896484375, -19.3740234375, -18.504150390625, -17.63427734375, -16.764404296875, -15.89453125, -15.024658203125, -14.15478515625, -13.284912109375, -12.4150390625, -11.545166015625, -10.67529296875, -9.805419921875, -8.935546875, -8.065673828125, -7.19580078125, -6.325927734375, -5.4560546875, -4.586181640625, -3.71630859375, -2.846435546875, -1.9765625, -1.106689453125, -0.23681640625, 0.633056640625, 1.5029296875, 2.372802734375, 3.24267578125, 4.112548828125, 4.982421875, 5.852294921875, 6.72216796875, 7.592041015625, 8.4619140625, 9.331787109375, 10.20166015625, 11.071533203125, 11.94140625, 12.811279296875, 13.68115234375, 14.551025390625, 15.4208984375, 16.290771484375, 17.16064453125, 18.030517578125, 18.900390625, 19.770263671875, 20.64013671875, 21.510009765625, 22.3798828125, 23.249755859375, 24.11962890625, 24.989501953125, 25.859375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 4.0, 4.0, 4.0, 6.0, 10.0, 21.0, 23.0, 22.0, 31.0, 51.0, 52.0, 72.0, 109.0, 180.0, 303.0, 489.0, 1850.0, 2866165.0, 273962.0, 1106.0, 455.0, 269.0, 157.0, 97.0, 71.0, 47.0, 28.0, 28.0, 36.0, 20.0, 13.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-99.125, -96.0166015625, -92.908203125, -89.7998046875, -86.69140625, -83.5830078125, -80.474609375, -77.3662109375, -74.2578125, -71.1494140625, -68.041015625, -64.9326171875, -61.82421875, -58.7158203125, -55.607421875, -52.4990234375, -49.390625, -46.2822265625, -43.173828125, -40.0654296875, -36.95703125, -33.8486328125, -30.740234375, -27.6318359375, -24.5234375, -21.4150390625, -18.306640625, -15.1982421875, -12.08984375, -8.9814453125, -5.873046875, -2.7646484375, 0.34375, 3.4521484375, 6.560546875, 9.6689453125, 12.77734375, 15.8857421875, 18.994140625, 22.1025390625, 25.2109375, 28.3193359375, 31.427734375, 34.5361328125, 37.64453125, 40.7529296875, 43.861328125, 46.9697265625, 50.078125, 53.1865234375, 56.294921875, 59.4033203125, 62.51171875, 65.6201171875, 68.728515625, 71.8369140625, 74.9453125, 78.0537109375, 81.162109375, 84.2705078125, 87.37890625, 90.4873046875, 93.595703125, 96.7041015625, 99.8125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [2.0, 33.0, 378.0, 542.0, 56.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.687761306762695, -11.46932601928711, -6.250889778137207, -1.0324535369873047, 4.185981750488281, 9.404417037963867, 14.622854232788086, 19.84128761291504, 25.059724807739258, 30.278160095214844, 35.49659729003906, 40.71503448486328, 45.933467864990234, 51.15190124511719, 56.370338439941406, 61.588775634765625, 66.80721282958984, 72.02565002441406, 77.24408721923828, 82.4625244140625, 87.68095397949219, 92.8993911743164, 98.11782836914062, 103.33625793457031, 108.55469512939453, 113.77313232421875, 118.99156951904297, 124.21000671386719, 129.42843627929688, 134.64688110351562, 139.8653106689453, 145.083740234375, 150.3021697998047, 155.52059936523438, 160.73904418945312, 165.9574737548828, 171.17591857910156, 176.39434814453125, 181.61279296875, 186.8312225341797, 192.04965209960938, 197.26808166503906, 202.4865264892578, 207.7049560546875, 212.92340087890625, 218.14183044433594, 223.36026000976562, 228.57870483398438, 233.79714965820312, 239.0155792236328, 244.23402404785156, 249.45245361328125, 254.6708984375, 259.88934326171875, 265.1077575683594, 270.3262023925781, 275.54461669921875, 280.7630615234375, 285.9814758300781, 291.1999206542969, 296.4183654785156, 301.63677978515625, 306.855224609375, 312.07366943359375, 317.2921142578125]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 5.0, 6.0, 13.0, 21.0, 12.0, 14.0, 16.0, 16.0, 20.0, 20.0, 15.0, 25.0, 20.0, 40.0, 22.0, 34.0, 34.0, 37.0, 39.0, 33.0, 34.0, 34.0, 33.0, 24.0, 35.0, 32.0, 35.0, 38.0, 35.0, 21.0, 28.0, 33.0, 22.0, 24.0, 21.0, 14.0, 12.0, 21.0, 2.0, 8.0, 13.0, 5.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-58.020729064941406, -56.284339904785156, -54.547950744628906, -52.81156539916992, -51.07517623901367, -49.33878707885742, -47.60239791870117, -45.86601257324219, -44.12962341308594, -42.39323425292969, -40.65684509277344, -38.92045974731445, -37.1840705871582, -35.44768142700195, -33.7112922668457, -31.974905014038086, -30.238515853881836, -28.502126693725586, -26.76573944091797, -25.02935028076172, -23.2929630279541, -21.55657386779785, -19.820186614990234, -18.083797454833984, -16.347408294677734, -14.6110200881958, -12.874631881713867, -11.138242721557617, -9.40185546875, -7.66546630859375, -5.929078102111816, -4.192689895629883, -2.4563026428222656, -0.7199143171310425, 1.0164740085601807, 2.7528624534606934, 4.489250659942627, 6.225639343261719, 7.962027549743652, 9.698415756225586, 11.43480396270752, 13.171192169189453, 14.907580375671387, 16.64396858215332, 18.38035774230957, 20.116744995117188, 21.853134155273438, 23.589523315429688, 25.325910568237305, 27.062299728393555, 28.798686981201172, 30.535076141357422, 32.27146530151367, 34.007850646972656, 35.744239807128906, 37.480628967285156, 39.217018127441406, 40.953407287597656, 42.689796447753906, 44.42618179321289, 46.16257095336914, 47.89896011352539, 49.63534927368164, 51.371734619140625, 53.108123779296875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 10.0, 7.0, 10.0, 14.0, 14.0, 26.0, 17.0, 27.0, 32.0, 30.0, 39.0, 35.0, 35.0, 37.0, 47.0, 51.0, 49.0, 46.0, 44.0, 42.0, 48.0, 34.0, 35.0, 35.0, 32.0, 20.0, 25.0, 28.0, 13.0, 23.0, 17.0, 13.0, 12.0, 12.0, 8.0, 7.0, 7.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.24609375, -6.97015380859375, -6.6942138671875, -6.41827392578125, -6.142333984375, -5.86639404296875, -5.5904541015625, -5.31451416015625, -5.03857421875, -4.76263427734375, -4.4866943359375, -4.21075439453125, -3.934814453125, -3.65887451171875, -3.3829345703125, -3.10699462890625, -2.8310546875, -2.55511474609375, -2.2791748046875, -2.00323486328125, -1.727294921875, -1.45135498046875, -1.1754150390625, -0.89947509765625, -0.62353515625, -0.34759521484375, -0.0716552734375, 0.20428466796875, 0.480224609375, 0.75616455078125, 1.0321044921875, 1.30804443359375, 1.583984375, 1.85992431640625, 2.1358642578125, 2.41180419921875, 2.687744140625, 2.96368408203125, 3.2396240234375, 3.51556396484375, 3.79150390625, 4.06744384765625, 4.3433837890625, 4.61932373046875, 4.895263671875, 5.17120361328125, 5.4471435546875, 5.72308349609375, 5.9990234375, 6.27496337890625, 6.5509033203125, 6.82684326171875, 7.102783203125, 7.37872314453125, 7.6546630859375, 7.93060302734375, 8.20654296875, 8.48248291015625, 8.7584228515625, 9.03436279296875, 9.310302734375, 9.58624267578125, 9.8621826171875, 10.13812255859375, 10.4140625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 8.0, 9.0, 8.0, 13.0, 17.0, 16.0, 26.0, 28.0, 50.0, 47.0, 57.0, 97.0, 148.0, 222.0, 524.0, 1281.0, 10427.0, 672672.0, 3296405.0, 205650.0, 4635.0, 888.0, 378.0, 187.0, 120.0, 83.0, 59.0, 44.0, 29.0, 31.0, 28.0, 25.0, 15.0, 12.0, 11.0, 6.0, 7.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.8125, -22.942138671875, -22.07177734375, -21.201416015625, -20.3310546875, -19.460693359375, -18.59033203125, -17.719970703125, -16.849609375, -15.979248046875, -15.10888671875, -14.238525390625, -13.3681640625, -12.497802734375, -11.62744140625, -10.757080078125, -9.88671875, -9.016357421875, -8.14599609375, -7.275634765625, -6.4052734375, -5.534912109375, -4.66455078125, -3.794189453125, -2.923828125, -2.053466796875, -1.18310546875, -0.312744140625, 0.5576171875, 1.427978515625, 2.29833984375, 3.168701171875, 4.0390625, 4.909423828125, 5.77978515625, 6.650146484375, 7.5205078125, 8.390869140625, 9.26123046875, 10.131591796875, 11.001953125, 11.872314453125, 12.74267578125, 13.613037109375, 14.4833984375, 15.353759765625, 16.22412109375, 17.094482421875, 17.96484375, 18.835205078125, 19.70556640625, 20.575927734375, 21.4462890625, 22.316650390625, 23.18701171875, 24.057373046875, 24.927734375, 25.798095703125, 26.66845703125, 27.538818359375, 28.4091796875, 29.279541015625, 30.14990234375, 31.020263671875, 31.890625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 6.0, 9.0, 9.0, 19.0, 26.0, 29.0, 52.0, 54.0, 92.0, 106.0, 124.0, 198.0, 253.0, 302.0, 373.0, 436.0, 413.0, 345.0, 314.0, 225.0, 184.0, 117.0, 105.0, 62.0, 60.0, 41.0, 27.0, 29.0, 19.0, 6.0, 8.0, 3.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.453125, -15.9805908203125, -15.508056640625, -15.0355224609375, -14.56298828125, -14.0904541015625, -13.617919921875, -13.1453857421875, -12.6728515625, -12.2003173828125, -11.727783203125, -11.2552490234375, -10.78271484375, -10.3101806640625, -9.837646484375, -9.3651123046875, -8.892578125, -8.4200439453125, -7.947509765625, -7.4749755859375, -7.00244140625, -6.5299072265625, -6.057373046875, -5.5848388671875, -5.1123046875, -4.6397705078125, -4.167236328125, -3.6947021484375, -3.22216796875, -2.7496337890625, -2.277099609375, -1.8045654296875, -1.33203125, -0.8594970703125, -0.386962890625, 0.0855712890625, 0.55810546875, 1.0306396484375, 1.503173828125, 1.9757080078125, 2.4482421875, 2.9207763671875, 3.393310546875, 3.8658447265625, 4.33837890625, 4.8109130859375, 5.283447265625, 5.7559814453125, 6.228515625, 6.7010498046875, 7.173583984375, 7.6461181640625, 8.11865234375, 8.5911865234375, 9.063720703125, 9.5362548828125, 10.0087890625, 10.4813232421875, 10.953857421875, 11.4263916015625, 11.89892578125, 12.3714599609375, 12.843994140625, 13.3165283203125, 13.7890625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 5.0, 11.0, 14.0, 24.0, 34.0, 46.0, 50.0, 75.0, 102.0, 133.0, 176.0, 240.0, 306.0, 497.0, 1339.0, 182954.0, 3988883.0, 17106.0, 736.0, 388.0, 294.0, 201.0, 189.0, 122.0, 92.0, 74.0, 41.0, 35.0, 36.0, 23.0, 10.0, 11.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.3125, -60.1875, -58.0625, -55.9375, -53.8125, -51.6875, -49.5625, -47.4375, -45.3125, -43.1875, -41.0625, -38.9375, -36.8125, -34.6875, -32.5625, -30.4375, -28.3125, -26.1875, -24.0625, -21.9375, -19.8125, -17.6875, -15.5625, -13.4375, -11.3125, -9.1875, -7.0625, -4.9375, -2.8125, -0.6875, 1.4375, 3.5625, 5.6875, 7.8125, 9.9375, 12.0625, 14.1875, 16.3125, 18.4375, 20.5625, 22.6875, 24.8125, 26.9375, 29.0625, 31.1875, 33.3125, 35.4375, 37.5625, 39.6875, 41.8125, 43.9375, 46.0625, 48.1875, 50.3125, 52.4375, 54.5625, 56.6875, 58.8125, 60.9375, 63.0625, 65.1875, 67.3125, 69.4375, 71.5625, 73.6875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 6.0, 30.0, 219.0, 409.0, 278.0, 65.0, 10.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.27892303466797, -43.66758728027344, -37.05625534057617, -30.444921493530273, -23.833587646484375, -17.222251892089844, -10.610919952392578, -3.9995880126953125, 2.6117477416992188, 9.223081588745117, 15.834415435791016, 22.445749282836914, 29.057083129882812, 35.668418884277344, 42.27975082397461, 48.891082763671875, 55.502418518066406, 62.11375427246094, 68.72508239746094, 75.33641815185547, 81.94775390625, 88.55908966064453, 95.17042541503906, 101.78175354003906, 108.3930892944336, 115.00442504882812, 121.61575317382812, 128.2270965576172, 134.8384246826172, 141.44976806640625, 148.06109619140625, 154.67242431640625, 161.28375244140625, 167.89508056640625, 174.5064239501953, 181.1177520751953, 187.72909545898438, 194.34042358398438, 200.95175170898438, 207.56307983398438, 214.17442321777344, 220.78575134277344, 227.3970947265625, 234.0084228515625, 240.6197509765625, 247.23109436035156, 253.84242248535156, 260.4537658691406, 267.0650939941406, 273.6764221191406, 280.2877502441406, 286.89910888671875, 293.51043701171875, 300.12176513671875, 306.73309326171875, 313.34442138671875, 319.95574951171875, 326.56707763671875, 333.17840576171875, 339.7897644042969, 346.4010925292969, 353.0124206542969, 359.6237487792969, 366.2350769042969, 372.846435546875]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 5.0, 13.0, 13.0, 17.0, 10.0, 22.0, 17.0, 22.0, 22.0, 34.0, 31.0, 45.0, 30.0, 36.0, 44.0, 37.0, 44.0, 28.0, 44.0, 44.0, 42.0, 42.0, 44.0, 35.0, 37.0, 24.0, 28.0, 27.0, 20.0, 25.0, 14.0, 18.0, 14.0, 13.0, 9.0, 9.0, 7.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-58.853214263916016, -57.18791580200195, -55.522613525390625, -53.85731506347656, -52.1920166015625, -50.52671813964844, -48.861419677734375, -47.19611740112305, -45.530818939208984, -43.86552047729492, -42.200218200683594, -40.53491973876953, -38.86962127685547, -37.204322814941406, -35.539024353027344, -33.873722076416016, -32.20842361450195, -30.54312515258789, -28.877824783325195, -27.2125244140625, -25.547225952148438, -23.881927490234375, -22.21662712097168, -20.551326751708984, -18.886028289794922, -17.22072982788086, -15.555429458618164, -13.890130043029785, -12.224830627441406, -10.559531211853027, -8.894231796264648, -7.2289323806762695, -5.563632965087891, -3.8983335494995117, -2.233034133911133, -0.5677347183227539, 1.097564697265625, 2.762864112854004, 4.428163528442383, 6.093462944030762, 7.758762359619141, 9.42406177520752, 11.089361190795898, 12.754660606384277, 14.419960021972656, 16.08525848388672, 17.750558853149414, 19.41585922241211, 21.081157684326172, 22.746456146240234, 24.41175651550293, 26.077056884765625, 27.742355346679688, 29.40765380859375, 31.072954177856445, 32.73825454711914, 34.4035530090332, 36.068851470947266, 37.734153747558594, 39.399452209472656, 41.06475067138672, 42.73004913330078, 44.395347595214844, 46.06064987182617, 47.725948333740234]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 3.0, 9.0, 6.0, 18.0, 12.0, 12.0, 20.0, 13.0, 17.0, 27.0, 23.0, 24.0, 28.0, 26.0, 36.0, 39.0, 54.0, 42.0, 49.0, 46.0, 50.0, 47.0, 31.0, 41.0, 43.0, 38.0, 32.0, 22.0, 31.0, 25.0, 24.0, 18.0, 21.0, 14.0, 13.0, 14.0, 12.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6328125, -8.376953125, -8.12109375, -7.865234375, -7.609375, -7.353515625, -7.09765625, -6.841796875, -6.5859375, -6.330078125, -6.07421875, -5.818359375, -5.5625, -5.306640625, -5.05078125, -4.794921875, -4.5390625, -4.283203125, -4.02734375, -3.771484375, -3.515625, -3.259765625, -3.00390625, -2.748046875, -2.4921875, -2.236328125, -1.98046875, -1.724609375, -1.46875, -1.212890625, -0.95703125, -0.701171875, -0.4453125, -0.189453125, 0.06640625, 0.322265625, 0.578125, 0.833984375, 1.08984375, 1.345703125, 1.6015625, 1.857421875, 2.11328125, 2.369140625, 2.625, 2.880859375, 3.13671875, 3.392578125, 3.6484375, 3.904296875, 4.16015625, 4.416015625, 4.671875, 4.927734375, 5.18359375, 5.439453125, 5.6953125, 5.951171875, 6.20703125, 6.462890625, 6.71875, 6.974609375, 7.23046875, 7.486328125, 7.7421875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 10.0, 22.0, 13.0, 23.0, 46.0, 65.0, 95.0, 103.0, 175.0, 304.0, 434.0, 610.0, 975.0, 1468.0, 2169.0, 3108.0, 4674.0, 7130.0, 10945.0, 16800.0, 25779.0, 41423.0, 70339.0, 130814.0, 328492.0, 176284.0, 87428.0, 50014.0, 31119.0, 19760.0, 12953.0, 8374.0, 5520.0, 3654.0, 2527.0, 1641.0, 1079.0, 737.0, 470.0, 298.0, 213.0, 174.0, 98.0, 42.0, 49.0, 37.0, 24.0, 16.0, 9.0, 4.0, 10.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-2.12890625, -2.06378173828125, -1.9986572265625, -1.93353271484375, -1.868408203125, -1.80328369140625, -1.7381591796875, -1.67303466796875, -1.60791015625, -1.54278564453125, -1.4776611328125, -1.41253662109375, -1.347412109375, -1.28228759765625, -1.2171630859375, -1.15203857421875, -1.0869140625, -1.02178955078125, -0.9566650390625, -0.89154052734375, -0.826416015625, -0.76129150390625, -0.6961669921875, -0.63104248046875, -0.56591796875, -0.50079345703125, -0.4356689453125, -0.37054443359375, -0.305419921875, -0.24029541015625, -0.1751708984375, -0.11004638671875, -0.044921875, 0.02020263671875, 0.0853271484375, 0.15045166015625, 0.215576171875, 0.28070068359375, 0.3458251953125, 0.41094970703125, 0.47607421875, 0.54119873046875, 0.6063232421875, 0.67144775390625, 0.736572265625, 0.80169677734375, 0.8668212890625, 0.93194580078125, 0.9970703125, 1.06219482421875, 1.1273193359375, 1.19244384765625, 1.257568359375, 1.32269287109375, 1.3878173828125, 1.45294189453125, 1.51806640625, 1.58319091796875, 1.6483154296875, 1.71343994140625, 1.778564453125, 1.84368896484375, 1.9088134765625, 1.97393798828125, 2.0390625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 6.0, 6.0, 6.0, 12.0, 9.0, 12.0, 12.0, 15.0, 24.0, 20.0, 14.0, 24.0, 30.0, 29.0, 38.0, 34.0, 37.0, 36.0, 37.0, 42.0, 34.0, 1067.0, 40.0, 47.0, 29.0, 38.0, 32.0, 32.0, 40.0, 31.0, 21.0, 20.0, 19.0, 20.0, 11.0, 17.0, 15.0, 15.0, 8.0, 5.0, 10.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5078125, -4.35845947265625, -4.2091064453125, -4.05975341796875, -3.910400390625, -3.76104736328125, -3.6116943359375, -3.46234130859375, -3.31298828125, -3.16363525390625, -3.0142822265625, -2.86492919921875, -2.715576171875, -2.56622314453125, -2.4168701171875, -2.26751708984375, -2.1181640625, -1.96881103515625, -1.8194580078125, -1.67010498046875, -1.520751953125, -1.37139892578125, -1.2220458984375, -1.07269287109375, -0.92333984375, -0.77398681640625, -0.6246337890625, -0.47528076171875, -0.325927734375, -0.17657470703125, -0.0272216796875, 0.12213134765625, 0.271484375, 0.42083740234375, 0.5701904296875, 0.71954345703125, 0.868896484375, 1.01824951171875, 1.1676025390625, 1.31695556640625, 1.46630859375, 1.61566162109375, 1.7650146484375, 1.91436767578125, 2.063720703125, 2.21307373046875, 2.3624267578125, 2.51177978515625, 2.6611328125, 2.81048583984375, 2.9598388671875, 3.10919189453125, 3.258544921875, 3.40789794921875, 3.5572509765625, 3.70660400390625, 3.85595703125, 4.00531005859375, 4.1546630859375, 4.30401611328125, 4.453369140625, 4.60272216796875, 4.7520751953125, 4.90142822265625, 5.05078125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 5.0, 14.0, 17.0, 26.0, 34.0, 42.0, 95.0, 100.0, 176.0, 268.0, 389.0, 541.0, 882.0, 1242.0, 1803.0, 2411.0, 3605.0, 4877.0, 7259.0, 10698.0, 15387.0, 23323.0, 35366.0, 53950.0, 85671.0, 156645.0, 1346551.0, 126897.0, 74703.0, 47164.0, 31590.0, 20670.0, 13824.0, 9307.0, 6550.0, 4594.0, 3195.0, 2284.0, 1533.0, 1097.0, 743.0, 534.0, 359.0, 235.0, 164.0, 131.0, 63.0, 43.0, 32.0, 18.0, 13.0, 5.0, 3.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.712890625, -1.656463623046875, -1.60003662109375, -1.543609619140625, -1.4871826171875, -1.430755615234375, -1.37432861328125, -1.317901611328125, -1.261474609375, -1.205047607421875, -1.14862060546875, -1.092193603515625, -1.0357666015625, -0.979339599609375, -0.92291259765625, -0.866485595703125, -0.81005859375, -0.753631591796875, -0.69720458984375, -0.640777587890625, -0.5843505859375, -0.527923583984375, -0.47149658203125, -0.415069580078125, -0.358642578125, -0.302215576171875, -0.24578857421875, -0.189361572265625, -0.1329345703125, -0.076507568359375, -0.02008056640625, 0.036346435546875, 0.0927734375, 0.149200439453125, 0.20562744140625, 0.262054443359375, 0.3184814453125, 0.374908447265625, 0.43133544921875, 0.487762451171875, 0.544189453125, 0.600616455078125, 0.65704345703125, 0.713470458984375, 0.7698974609375, 0.826324462890625, 0.88275146484375, 0.939178466796875, 0.99560546875, 1.052032470703125, 1.10845947265625, 1.164886474609375, 1.2213134765625, 1.277740478515625, 1.33416748046875, 1.390594482421875, 1.447021484375, 1.503448486328125, 1.55987548828125, 1.616302490234375, 1.6727294921875, 1.729156494140625, 1.78558349609375, 1.842010498046875, 1.8984375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 9.0, 10.0, 8.0, 7.0, 12.0, 13.0, 10.0, 21.0, 16.0, 18.0, 26.0, 33.0, 32.0, 41.0, 33.0, 67.0, 57.0, 70.0, 67.0, 56.0, 62.0, 59.0, 48.0, 33.0, 34.0, 23.0, 17.0, 20.0, 19.0, 10.0, 11.0, 11.0, 5.0, 4.0, 3.0, 6.0, 1.0, 7.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0002617835998535156, -0.0002538226544857025, -0.0002458617091178894, -0.0002379007637500763, -0.00022993981838226318, -0.00022197887301445007, -0.00021401792764663696, -0.00020605698227882385, -0.00019809603691101074, -0.00019013509154319763, -0.00018217414617538452, -0.0001742132008075714, -0.0001662522554397583, -0.0001582913100719452, -0.00015033036470413208, -0.00014236941933631897, -0.00013440847396850586, -0.00012644752860069275, -0.00011848658323287964, -0.00011052563786506653, -0.00010256469249725342, -9.460374712944031e-05, -8.66428017616272e-05, -7.868185639381409e-05, -7.072091102600098e-05, -6.275996565818787e-05, -5.4799020290374756e-05, -4.6838074922561646e-05, -3.8877129554748535e-05, -3.0916184186935425e-05, -2.2955238819122314e-05, -1.4994293451309204e-05, -7.033348083496094e-06, 9.275972843170166e-07, 8.888542652130127e-06, 1.6849488019943237e-05, 2.4810433387756348e-05, 3.277137875556946e-05, 4.073232412338257e-05, 4.869326949119568e-05, 5.665421485900879e-05, 6.46151602268219e-05, 7.257610559463501e-05, 8.053705096244812e-05, 8.849799633026123e-05, 9.645894169807434e-05, 0.00010441988706588745, 0.00011238083243370056, 0.00012034177780151367, 0.00012830272316932678, 0.0001362636685371399, 0.000144224613904953, 0.0001521855592727661, 0.00016014650464057922, 0.00016810745000839233, 0.00017606839537620544, 0.00018402934074401855, 0.00019199028611183167, 0.00019995123147964478, 0.00020791217684745789, 0.000215873122215271, 0.0002238340675830841, 0.00023179501295089722, 0.00023975595831871033, 0.00024771690368652344]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 9.0, 2.0, 5.0, 7.0, 6.0, 11.0, 13.0, 21.0, 18.0, 20.0, 26.0, 24.0, 49.0, 45.0, 79.0, 140.0, 203.0, 325.0, 1040.0, 155805.0, 887717.0, 1816.0, 447.0, 218.0, 120.0, 92.0, 53.0, 36.0, 34.0, 38.0, 20.0, 31.0, 14.0, 14.0, 18.0, 11.0, 7.0, 5.0, 2.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.005886077880859375, -0.0057029128074646, -0.005519747734069824, -0.005336582660675049, -0.0051534175872802734, -0.004970252513885498, -0.004787087440490723, -0.004603922367095947, -0.004420757293701172, -0.0042375922203063965, -0.004054427146911621, -0.0038712620735168457, -0.0036880970001220703, -0.003504931926727295, -0.0033217668533325195, -0.003138601779937744, -0.0029554367065429688, -0.0027722716331481934, -0.002589106559753418, -0.0024059414863586426, -0.002222776412963867, -0.002039611339569092, -0.0018564462661743164, -0.001673281192779541, -0.0014901161193847656, -0.0013069510459899902, -0.0011237859725952148, -0.0009406208992004395, -0.0007574558258056641, -0.0005742907524108887, -0.0003911256790161133, -0.0002079606056213379, -2.47955322265625e-05, 0.0001583695411682129, 0.0003415346145629883, 0.0005246996879577637, 0.0007078647613525391, 0.0008910298347473145, 0.0010741949081420898, 0.0012573599815368652, 0.0014405250549316406, 0.001623690128326416, 0.0018068552017211914, 0.001990020275115967, 0.002173185348510742, 0.0023563504219055176, 0.002539515495300293, 0.0027226805686950684, 0.0029058456420898438, 0.003089010715484619, 0.0032721757888793945, 0.00345534086227417, 0.0036385059356689453, 0.0038216710090637207, 0.004004836082458496, 0.0041880011558532715, 0.004371166229248047, 0.004554331302642822, 0.004737496376037598, 0.004920661449432373, 0.0051038265228271484, 0.005286991596221924, 0.005470156669616699, 0.005653321743011475, 0.00583648681640625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 11.0, 20.0, 38.0, 103.0, 158.0, 212.0, 213.0, 142.0, 62.0, 25.0, 18.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000443780270870775, -0.0004340611631050706, -0.00042434208444319665, -0.00041462297667749226, -0.00040490386891178787, -0.00039518479024991393, -0.00038546568248420954, -0.00037574657471850514, -0.00036602746695280075, -0.00035630835918709636, -0.0003465892805252224, -0.00033687017275951803, -0.00032715106499381363, -0.0003174319863319397, -0.0003077128785662353, -0.0002979937708005309, -0.000288274692138657, -0.0002785555843729526, -0.00026883650571107864, -0.00025911739794537425, -0.00024939829017966986, -0.0002396791969658807, -0.00022996010375209153, -0.00022024099598638713, -0.00021052190277259797, -0.0002008028095588088, -0.0001910837017931044, -0.00018136460857931525, -0.00017164551536552608, -0.0001619264075998217, -0.00015220731438603252, -0.00014248822117224336, -0.0001327690843027085, -0.00012304999108891934, -0.00011333088332321495, -0.00010361179010942578, -9.3892689619679e-05, -8.417358912993222e-05, -7.445449591614306e-05, -6.473539542639628e-05, -5.50162949366495e-05, -4.529719444690272e-05, -3.557809759513475e-05, -2.5858998924377374e-05, -1.613990025362e-05, -6.4207997638732195e-06, 3.2982970878947526e-06, 1.3017393939662725e-05, 2.2736494429409504e-05, 3.245559491915628e-05, 4.2174691770924255e-05, 5.189378862269223e-05, 6.1612889112439e-05, 7.133198960218579e-05, 8.105108281597495e-05, 9.077018330572173e-05, 0.00010048928379546851, 0.00011020838428521529, 0.00011992748477496207, 0.00012964657798875123, 0.0001393656712025404, 0.0001490847789682448, 0.00015880387218203396, 0.00016852296539582312, 0.00017824207316152751]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 11.0, 11.0, 9.0, 17.0, 13.0, 14.0, 18.0, 22.0, 26.0, 29.0, 30.0, 24.0, 36.0, 36.0, 46.0, 41.0, 42.0, 45.0, 48.0, 41.0, 46.0, 35.0, 40.0, 35.0, 32.0, 24.0, 38.0, 24.0, 23.0, 25.0, 14.0, 15.0, 18.0, 9.0, 9.0, 8.0, 11.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012576580047607422, -0.00012152735143899918, -0.00011728890240192413, -0.00011305045336484909, -0.00010881200432777405, -0.000104573555290699, -0.00010033510625362396, -9.609665721654892e-05, -9.185820817947388e-05, -8.761975914239883e-05, -8.338131010532379e-05, -7.914286106824875e-05, -7.49044120311737e-05, -7.066596299409866e-05, -6.642751395702362e-05, -6.218906491994858e-05, -5.7950615882873535e-05, -5.371216684579849e-05, -4.947371780872345e-05, -4.523526877164841e-05, -4.0996819734573364e-05, -3.675837069749832e-05, -3.251992166042328e-05, -2.8281472623348236e-05, -2.4043023586273193e-05, -1.980457454919815e-05, -1.5566125512123108e-05, -1.1327676475048065e-05, -7.0892274379730225e-06, -2.8507784008979797e-06, 1.387670636177063e-06, 5.626119673252106e-06, 9.864568710327148e-06, 1.4103017747402191e-05, 1.8341466784477234e-05, 2.2579915821552277e-05, 2.681836485862732e-05, 3.105681389570236e-05, 3.5295262932777405e-05, 3.953371196985245e-05, 4.377216100692749e-05, 4.801061004400253e-05, 5.2249059081077576e-05, 5.648750811815262e-05, 6.072595715522766e-05, 6.49644061923027e-05, 6.920285522937775e-05, 7.344130426645279e-05, 7.767975330352783e-05, 8.191820234060287e-05, 8.615665137767792e-05, 9.039510041475296e-05, 9.4633549451828e-05, 9.887199848890305e-05, 0.00010311044752597809, 0.00010734889656305313, 0.00011158734560012817, 0.00011582579463720322, 0.00012006424367427826, 0.0001243026927113533, 0.00012854114174842834, 0.0001327795907855034, 0.00013701803982257843, 0.00014125648885965347, 0.00014549493789672852]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 3.0, 9.0, 6.0, 18.0, 12.0, 12.0, 20.0, 13.0, 17.0, 27.0, 23.0, 24.0, 28.0, 26.0, 36.0, 39.0, 54.0, 42.0, 49.0, 46.0, 50.0, 47.0, 31.0, 41.0, 43.0, 38.0, 32.0, 22.0, 31.0, 25.0, 24.0, 18.0, 21.0, 14.0, 13.0, 14.0, 12.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6328125, -8.376953125, -8.12109375, -7.865234375, -7.609375, -7.353515625, -7.09765625, -6.841796875, -6.5859375, -6.330078125, -6.07421875, -5.818359375, -5.5625, -5.306640625, -5.05078125, -4.794921875, -4.5390625, -4.283203125, -4.02734375, -3.771484375, -3.515625, -3.259765625, -3.00390625, -2.748046875, -2.4921875, -2.236328125, -1.98046875, -1.724609375, -1.46875, -1.212890625, -0.95703125, -0.701171875, -0.4453125, -0.189453125, 0.06640625, 0.322265625, 0.578125, 0.833984375, 1.08984375, 1.345703125, 1.6015625, 1.857421875, 2.11328125, 2.369140625, 2.625, 2.880859375, 3.13671875, 3.392578125, 3.6484375, 3.904296875, 4.16015625, 4.416015625, 4.671875, 4.927734375, 5.18359375, 5.439453125, 5.6953125, 5.951171875, 6.20703125, 6.462890625, 6.71875, 6.974609375, 7.23046875, 7.486328125, 7.7421875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 7.0, 13.0, 11.0, 21.0, 19.0, 38.0, 38.0, 57.0, 67.0, 106.0, 172.0, 197.0, 404.0, 813.0, 2233.0, 5866.0, 17103.0, 47507.0, 130648.0, 333272.0, 315866.0, 123152.0, 45475.0, 15837.0, 5647.0, 2008.0, 810.0, 386.0, 203.0, 137.0, 113.0, 90.0, 55.0, 46.0, 33.0, 22.0, 27.0, 12.0, 11.0, 9.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6640625, -8.39306640625, -8.1220703125, -7.85107421875, -7.580078125, -7.30908203125, -7.0380859375, -6.76708984375, -6.49609375, -6.22509765625, -5.9541015625, -5.68310546875, -5.412109375, -5.14111328125, -4.8701171875, -4.59912109375, -4.328125, -4.05712890625, -3.7861328125, -3.51513671875, -3.244140625, -2.97314453125, -2.7021484375, -2.43115234375, -2.16015625, -1.88916015625, -1.6181640625, -1.34716796875, -1.076171875, -0.80517578125, -0.5341796875, -0.26318359375, 0.0078125, 0.27880859375, 0.5498046875, 0.82080078125, 1.091796875, 1.36279296875, 1.6337890625, 1.90478515625, 2.17578125, 2.44677734375, 2.7177734375, 2.98876953125, 3.259765625, 3.53076171875, 3.8017578125, 4.07275390625, 4.34375, 4.61474609375, 4.8857421875, 5.15673828125, 5.427734375, 5.69873046875, 5.9697265625, 6.24072265625, 6.51171875, 6.78271484375, 7.0537109375, 7.32470703125, 7.595703125, 7.86669921875, 8.1376953125, 8.40869140625, 8.6796875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 3.0, 8.0, 5.0, 8.0, 16.0, 17.0, 13.0, 17.0, 21.0, 22.0, 19.0, 39.0, 23.0, 33.0, 38.0, 28.0, 50.0, 64.0, 142.0, 1455.0, 466.0, 122.0, 74.0, 40.0, 34.0, 39.0, 39.0, 32.0, 25.0, 29.0, 18.0, 24.0, 17.0, 15.0, 12.0, 11.0, 10.0, 6.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-32.21875, -31.347412109375, -30.47607421875, -29.604736328125, -28.7333984375, -27.862060546875, -26.99072265625, -26.119384765625, -25.248046875, -24.376708984375, -23.50537109375, -22.634033203125, -21.7626953125, -20.891357421875, -20.02001953125, -19.148681640625, -18.27734375, -17.406005859375, -16.53466796875, -15.663330078125, -14.7919921875, -13.920654296875, -13.04931640625, -12.177978515625, -11.306640625, -10.435302734375, -9.56396484375, -8.692626953125, -7.8212890625, -6.949951171875, -6.07861328125, -5.207275390625, -4.3359375, -3.464599609375, -2.59326171875, -1.721923828125, -0.8505859375, 0.020751953125, 0.89208984375, 1.763427734375, 2.634765625, 3.506103515625, 4.37744140625, 5.248779296875, 6.1201171875, 6.991455078125, 7.86279296875, 8.734130859375, 9.60546875, 10.476806640625, 11.34814453125, 12.219482421875, 13.0908203125, 13.962158203125, 14.83349609375, 15.704833984375, 16.576171875, 17.447509765625, 18.31884765625, 19.190185546875, 20.0615234375, 20.932861328125, 21.80419921875, 22.675537109375, 23.546875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 10.0, 9.0, 14.0, 16.0, 6.0, 22.0, 31.0, 65.0, 66.0, 91.0, 162.0, 234.0, 583.0, 2169.0, 2998024.0, 141671.0, 1363.0, 468.0, 240.0, 114.0, 91.0, 59.0, 48.0, 36.0, 27.0, 15.0, 10.0, 11.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-145.125, -141.1884765625, -137.251953125, -133.3154296875, -129.37890625, -125.4423828125, -121.505859375, -117.5693359375, -113.6328125, -109.6962890625, -105.759765625, -101.8232421875, -97.88671875, -93.9501953125, -90.013671875, -86.0771484375, -82.140625, -78.2041015625, -74.267578125, -70.3310546875, -66.39453125, -62.4580078125, -58.521484375, -54.5849609375, -50.6484375, -46.7119140625, -42.775390625, -38.8388671875, -34.90234375, -30.9658203125, -27.029296875, -23.0927734375, -19.15625, -15.2197265625, -11.283203125, -7.3466796875, -3.41015625, 0.5263671875, 4.462890625, 8.3994140625, 12.3359375, 16.2724609375, 20.208984375, 24.1455078125, 28.08203125, 32.0185546875, 35.955078125, 39.8916015625, 43.828125, 47.7646484375, 51.701171875, 55.6376953125, 59.57421875, 63.5107421875, 67.447265625, 71.3837890625, 75.3203125, 79.2568359375, 83.193359375, 87.1298828125, 91.06640625, 95.0029296875, 98.939453125, 102.8759765625, 106.8125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 9.0, 47.0, 308.0, 509.0, 130.0, 13.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-235.23777770996094, -230.8983917236328, -226.55899047851562, -222.2196044921875, -217.88021850585938, -213.54083251953125, -209.20143127441406, -204.86204528808594, -200.52264404296875, -196.18325805664062, -191.84385681152344, -187.5044708251953, -183.1650848388672, -178.82568359375, -174.48629760742188, -170.14691162109375, -165.80752563476562, -161.4681396484375, -157.1287384033203, -152.7893524169922, -148.44996643066406, -144.11056518554688, -139.77117919921875, -135.43179321289062, -131.0924072265625, -126.75301361083984, -122.41362762451172, -118.07423400878906, -113.73484802246094, -109.39545440673828, -105.05606079101562, -100.7166748046875, -96.37728881835938, -92.03789520263672, -87.6985092163086, -83.35911560058594, -79.01972961425781, -74.68033599853516, -70.3409423828125, -66.00155639648438, -61.66216278076172, -57.32277297973633, -52.98338317871094, -48.64398956298828, -44.30459976196289, -39.9652099609375, -35.625816345214844, -31.286426544189453, -26.947036743164062, -22.607646942138672, -18.26825523376465, -13.928864479064941, -9.589473724365234, -5.250083923339844, -0.9106922149658203, 3.428699493408203, 7.768089294433594, 12.1074800491333, 16.446870803833008, 20.78626251220703, 25.125652313232422, 29.465042114257812, 33.80443572998047, 38.14382553100586, 42.48321533203125]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 7.0, 12.0, 10.0, 16.0, 14.0, 15.0, 20.0, 27.0, 26.0, 25.0, 28.0, 27.0, 37.0, 33.0, 23.0, 45.0, 42.0, 34.0, 40.0, 50.0, 48.0, 42.0, 35.0, 41.0, 39.0, 28.0, 36.0, 20.0, 20.0, 23.0, 16.0, 16.0, 19.0, 17.0, 10.0, 17.0, 8.0, 15.0, 4.0, 2.0, 7.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.32453536987305, -59.222618103027344, -57.120697021484375, -55.01877975463867, -52.91686248779297, -50.81494140625, -48.7130241394043, -46.611106872558594, -44.509185791015625, -42.40726852416992, -40.30534744262695, -38.20343017578125, -36.10150909423828, -33.99959182739258, -31.897674560546875, -29.79575538635254, -27.693836212158203, -25.591917037963867, -23.48999786376953, -21.388080596923828, -19.286161422729492, -17.184242248535156, -15.082324028015137, -12.980405807495117, -10.878486633300781, -8.776567459106445, -6.674649238586426, -4.572730541229248, -2.4708118438720703, -0.3688926696777344, 1.7330255508422852, 3.8349437713623047, 5.936859130859375, 8.038778305053711, 10.14069652557373, 12.24261474609375, 14.344533920288086, 16.446453094482422, 18.548370361328125, 20.65028953552246, 22.752208709716797, 24.854127883911133, 26.95604705810547, 29.057964324951172, 31.159883499145508, 33.261802673339844, 35.36371994018555, 37.46563720703125, 39.56755828857422, 41.66947555541992, 43.77139663696289, 45.873313903808594, 47.97523498535156, 50.077152252197266, 52.17906951904297, 54.28099060058594, 56.38290786743164, 58.484825134277344, 60.58674621582031, 62.688663482666016, 64.79058074951172, 66.89250183105469, 68.99442291259766, 71.0963363647461, 73.19825744628906]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 3.0, 6.0, 9.0, 16.0, 10.0, 16.0, 15.0, 11.0, 21.0, 18.0, 27.0, 28.0, 22.0, 36.0, 40.0, 35.0, 45.0, 46.0, 41.0, 47.0, 48.0, 36.0, 40.0, 41.0, 46.0, 34.0, 41.0, 33.0, 21.0, 28.0, 19.0, 26.0, 15.0, 12.0, 20.0, 15.0, 11.0, 11.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.3486328125, -9.056640625, -8.7646484375, -8.47265625, -8.1806640625, -7.888671875, -7.5966796875, -7.3046875, -7.0126953125, -6.720703125, -6.4287109375, -6.13671875, -5.8447265625, -5.552734375, -5.2607421875, -4.96875, -4.6767578125, -4.384765625, -4.0927734375, -3.80078125, -3.5087890625, -3.216796875, -2.9248046875, -2.6328125, -2.3408203125, -2.048828125, -1.7568359375, -1.46484375, -1.1728515625, -0.880859375, -0.5888671875, -0.296875, -0.0048828125, 0.287109375, 0.5791015625, 0.87109375, 1.1630859375, 1.455078125, 1.7470703125, 2.0390625, 2.3310546875, 2.623046875, 2.9150390625, 3.20703125, 3.4990234375, 3.791015625, 4.0830078125, 4.375, 4.6669921875, 4.958984375, 5.2509765625, 5.54296875, 5.8349609375, 6.126953125, 6.4189453125, 6.7109375, 7.0029296875, 7.294921875, 7.5869140625, 7.87890625, 8.1708984375, 8.462890625, 8.7548828125, 9.046875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 0.0, 3.0, 5.0, 11.0, 9.0, 11.0, 16.0, 26.0, 25.0, 21.0, 33.0, 44.0, 60.0, 75.0, 97.0, 114.0, 148.0, 252.0, 647.0, 4448.0, 255851.0, 3531028.0, 394034.0, 5617.0, 716.0, 279.0, 150.0, 115.0, 96.0, 67.0, 62.0, 48.0, 40.0, 21.0, 20.0, 25.0, 25.0, 12.0, 6.0, 8.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.53125, -32.560546875, -31.58984375, -30.619140625, -29.6484375, -28.677734375, -27.70703125, -26.736328125, -25.765625, -24.794921875, -23.82421875, -22.853515625, -21.8828125, -20.912109375, -19.94140625, -18.970703125, -18.0, -17.029296875, -16.05859375, -15.087890625, -14.1171875, -13.146484375, -12.17578125, -11.205078125, -10.234375, -9.263671875, -8.29296875, -7.322265625, -6.3515625, -5.380859375, -4.41015625, -3.439453125, -2.46875, -1.498046875, -0.52734375, 0.443359375, 1.4140625, 2.384765625, 3.35546875, 4.326171875, 5.296875, 6.267578125, 7.23828125, 8.208984375, 9.1796875, 10.150390625, 11.12109375, 12.091796875, 13.0625, 14.033203125, 15.00390625, 15.974609375, 16.9453125, 17.916015625, 18.88671875, 19.857421875, 20.828125, 21.798828125, 22.76953125, 23.740234375, 24.7109375, 25.681640625, 26.65234375, 27.623046875, 28.59375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 8.0, 8.0, 9.0, 13.0, 16.0, 28.0, 25.0, 45.0, 57.0, 85.0, 119.0, 173.0, 244.0, 299.0, 410.0, 487.0, 458.0, 412.0, 318.0, 234.0, 182.0, 108.0, 67.0, 68.0, 50.0, 44.0, 34.0, 28.0, 13.0, 8.0, 5.0, 7.0, 7.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.046875, -13.526611328125, -13.00634765625, -12.486083984375, -11.9658203125, -11.445556640625, -10.92529296875, -10.405029296875, -9.884765625, -9.364501953125, -8.84423828125, -8.323974609375, -7.8037109375, -7.283447265625, -6.76318359375, -6.242919921875, -5.72265625, -5.202392578125, -4.68212890625, -4.161865234375, -3.6416015625, -3.121337890625, -2.60107421875, -2.080810546875, -1.560546875, -1.040283203125, -0.52001953125, 0.000244140625, 0.5205078125, 1.040771484375, 1.56103515625, 2.081298828125, 2.6015625, 3.121826171875, 3.64208984375, 4.162353515625, 4.6826171875, 5.202880859375, 5.72314453125, 6.243408203125, 6.763671875, 7.283935546875, 7.80419921875, 8.324462890625, 8.8447265625, 9.364990234375, 9.88525390625, 10.405517578125, 10.92578125, 11.446044921875, 11.96630859375, 12.486572265625, 13.0068359375, 13.527099609375, 14.04736328125, 14.567626953125, 15.087890625, 15.608154296875, 16.12841796875, 16.648681640625, 17.1689453125, 17.689208984375, 18.20947265625, 18.729736328125, 19.25]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 7.0, 6.0, 2.0, 11.0, 22.0, 26.0, 33.0, 47.0, 61.0, 82.0, 98.0, 148.0, 230.0, 344.0, 465.0, 1778.0, 542513.0, 3642333.0, 4304.0, 590.0, 362.0, 259.0, 179.0, 105.0, 89.0, 55.0, 34.0, 32.0, 22.0, 11.0, 11.0, 11.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.0625, -100.2880859375, -97.513671875, -94.7392578125, -91.96484375, -89.1904296875, -86.416015625, -83.6416015625, -80.8671875, -78.0927734375, -75.318359375, -72.5439453125, -69.76953125, -66.9951171875, -64.220703125, -61.4462890625, -58.671875, -55.8974609375, -53.123046875, -50.3486328125, -47.57421875, -44.7998046875, -42.025390625, -39.2509765625, -36.4765625, -33.7021484375, -30.927734375, -28.1533203125, -25.37890625, -22.6044921875, -19.830078125, -17.0556640625, -14.28125, -11.5068359375, -8.732421875, -5.9580078125, -3.18359375, -0.4091796875, 2.365234375, 5.1396484375, 7.9140625, 10.6884765625, 13.462890625, 16.2373046875, 19.01171875, 21.7861328125, 24.560546875, 27.3349609375, 30.109375, 32.8837890625, 35.658203125, 38.4326171875, 41.20703125, 43.9814453125, 46.755859375, 49.5302734375, 52.3046875, 55.0791015625, 57.853515625, 60.6279296875, 63.40234375, 66.1767578125, 68.951171875, 71.7255859375, 74.5]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 45.0, 154.0, 278.0, 307.0, 165.0, 46.0, 14.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.33499908447266, -89.36363983154297, -84.39227294921875, -79.42091369628906, -74.44955444335938, -69.47818756103516, -64.50682830810547, -59.535465240478516, -54.56410217285156, -49.59273910522461, -44.621376037597656, -39.65001678466797, -34.678653717041016, -29.707290649414062, -24.735929489135742, -19.764568328857422, -14.793205261230469, -9.821843147277832, -4.850481033325195, 0.1208810806274414, 5.092243194580078, 10.063606262207031, 15.034967422485352, 20.006328582763672, 24.977691650390625, 29.949054718017578, 34.92041778564453, 39.89177703857422, 44.86314010620117, 49.834503173828125, 54.80586242675781, 59.777225494384766, 64.74858093261719, 69.71994018554688, 74.6913070678711, 79.66266632080078, 84.634033203125, 89.60539245605469, 94.57675170898438, 99.54811096191406, 104.51947784423828, 109.49083709716797, 114.46220397949219, 119.43356323242188, 124.40492248535156, 129.37628173828125, 134.34765625, 139.3190155029297, 144.29037475585938, 149.26173400878906, 154.23309326171875, 159.2044677734375, 164.1758270263672, 169.14718627929688, 174.11854553222656, 179.08990478515625, 184.061279296875, 189.0326385498047, 194.00399780273438, 198.97537231445312, 203.9467315673828, 208.9180908203125, 213.8894500732422, 218.86080932617188, 223.83216857910156]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 9.0, 7.0, 5.0, 7.0, 6.0, 20.0, 11.0, 10.0, 17.0, 14.0, 18.0, 24.0, 17.0, 22.0, 18.0, 32.0, 25.0, 25.0, 29.0, 34.0, 40.0, 48.0, 41.0, 45.0, 34.0, 29.0, 35.0, 34.0, 34.0, 30.0, 32.0, 28.0, 29.0, 17.0, 21.0, 14.0, 23.0, 13.0, 18.0, 14.0, 16.0, 12.0, 6.0, 6.0, 6.0, 3.0, 4.0, 5.0, 4.0, 1.0, 4.0, 3.0, 3.0, 2.0], "bins": [-45.16847610473633, -43.82695007324219, -42.48542785644531, -41.14390182495117, -39.8023796081543, -38.460853576660156, -37.11933135986328, -35.77780532836914, -34.436279296875, -33.09475326538086, -31.753231048583984, -30.411705017089844, -29.070180892944336, -27.728656768798828, -26.38713264465332, -25.045608520507812, -23.704084396362305, -22.362560272216797, -21.02103614807129, -19.67951202392578, -18.33798599243164, -16.996461868286133, -15.654937744140625, -14.3134126663208, -12.971888542175293, -11.630364418029785, -10.288839340209961, -8.947315216064453, -7.605790615081787, -6.264266014099121, -4.922741889953613, -3.581216812133789, -2.2396926879882812, -0.8981682062149048, 0.4433562755584717, 1.7848806381225586, 3.1264052391052246, 4.467929840087891, 5.809453964233398, 7.150979042053223, 8.49250316619873, 9.834027290344238, 11.175552368164062, 12.51707649230957, 13.858600616455078, 15.200125694274902, 16.541648864746094, 17.883174896240234, 19.224699020385742, 20.56622314453125, 21.907747268676758, 23.249271392822266, 24.590797424316406, 25.932321548461914, 27.273845672607422, 28.615371704101562, 29.956893920898438, 31.298418045043945, 32.63994216918945, 33.981468200683594, 35.32299041748047, 36.66451644897461, 38.00604248046875, 39.347564697265625, 40.689090728759766]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 13.0, 6.0, 12.0, 17.0, 20.0, 17.0, 21.0, 27.0, 28.0, 19.0, 42.0, 33.0, 31.0, 35.0, 42.0, 45.0, 41.0, 52.0, 38.0, 47.0, 51.0, 32.0, 36.0, 42.0, 29.0, 33.0, 33.0, 18.0, 26.0, 17.0, 11.0, 9.0, 15.0, 12.0, 7.0, 7.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.203125, -8.9273681640625, -8.651611328125, -8.3758544921875, -8.10009765625, -7.8243408203125, -7.548583984375, -7.2728271484375, -6.9970703125, -6.7213134765625, -6.445556640625, -6.1697998046875, -5.89404296875, -5.6182861328125, -5.342529296875, -5.0667724609375, -4.791015625, -4.5152587890625, -4.239501953125, -3.9637451171875, -3.68798828125, -3.4122314453125, -3.136474609375, -2.8607177734375, -2.5849609375, -2.3092041015625, -2.033447265625, -1.7576904296875, -1.48193359375, -1.2061767578125, -0.930419921875, -0.6546630859375, -0.37890625, -0.1031494140625, 0.172607421875, 0.4483642578125, 0.72412109375, 0.9998779296875, 1.275634765625, 1.5513916015625, 1.8271484375, 2.1029052734375, 2.378662109375, 2.6544189453125, 2.93017578125, 3.2059326171875, 3.481689453125, 3.7574462890625, 4.033203125, 4.3089599609375, 4.584716796875, 4.8604736328125, 5.13623046875, 5.4119873046875, 5.687744140625, 5.9635009765625, 6.2392578125, 6.5150146484375, 6.790771484375, 7.0665283203125, 7.34228515625, 7.6180419921875, 7.893798828125, 8.1695556640625, 8.4453125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 15.0, 16.0, 22.0, 37.0, 49.0, 70.0, 128.0, 145.0, 245.0, 330.0, 510.0, 723.0, 1091.0, 1557.0, 2382.0, 3438.0, 5187.0, 7657.0, 11778.0, 17894.0, 27499.0, 43489.0, 72509.0, 135539.0, 325022.0, 165931.0, 85064.0, 49517.0, 31126.0, 20120.0, 12962.0, 8688.0, 5902.0, 3754.0, 2645.0, 1752.0, 1142.0, 862.0, 537.0, 388.0, 256.0, 180.0, 120.0, 82.0, 70.0, 37.0, 30.0, 17.0, 15.0, 10.0, 9.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.041015625, -1.974395751953125, -1.90777587890625, -1.841156005859375, -1.7745361328125, -1.707916259765625, -1.64129638671875, -1.574676513671875, -1.508056640625, -1.441436767578125, -1.37481689453125, -1.308197021484375, -1.2415771484375, -1.174957275390625, -1.10833740234375, -1.041717529296875, -0.97509765625, -0.908477783203125, -0.84185791015625, -0.775238037109375, -0.7086181640625, -0.641998291015625, -0.57537841796875, -0.508758544921875, -0.442138671875, -0.375518798828125, -0.30889892578125, -0.242279052734375, -0.1756591796875, -0.109039306640625, -0.04241943359375, 0.024200439453125, 0.0908203125, 0.157440185546875, 0.22406005859375, 0.290679931640625, 0.3572998046875, 0.423919677734375, 0.49053955078125, 0.557159423828125, 0.623779296875, 0.690399169921875, 0.75701904296875, 0.823638916015625, 0.8902587890625, 0.956878662109375, 1.02349853515625, 1.090118408203125, 1.15673828125, 1.223358154296875, 1.28997802734375, 1.356597900390625, 1.4232177734375, 1.489837646484375, 1.55645751953125, 1.623077392578125, 1.689697265625, 1.756317138671875, 1.82293701171875, 1.889556884765625, 1.9561767578125, 2.022796630859375, 2.08941650390625, 2.156036376953125, 2.22265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 6.0, 5.0, 9.0, 7.0, 9.0, 6.0, 8.0, 9.0, 16.0, 12.0, 21.0, 30.0, 31.0, 32.0, 31.0, 38.0, 31.0, 35.0, 41.0, 39.0, 39.0, 39.0, 1068.0, 33.0, 47.0, 37.0, 33.0, 34.0, 36.0, 28.0, 21.0, 30.0, 28.0, 25.0, 17.0, 16.0, 18.0, 11.0, 6.0, 10.0, 6.0, 6.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.90234375, -4.7349853515625, -4.567626953125, -4.4002685546875, -4.23291015625, -4.0655517578125, -3.898193359375, -3.7308349609375, -3.5634765625, -3.3961181640625, -3.228759765625, -3.0614013671875, -2.89404296875, -2.7266845703125, -2.559326171875, -2.3919677734375, -2.224609375, -2.0572509765625, -1.889892578125, -1.7225341796875, -1.55517578125, -1.3878173828125, -1.220458984375, -1.0531005859375, -0.8857421875, -0.7183837890625, -0.551025390625, -0.3836669921875, -0.21630859375, -0.0489501953125, 0.118408203125, 0.2857666015625, 0.453125, 0.6204833984375, 0.787841796875, 0.9552001953125, 1.12255859375, 1.2899169921875, 1.457275390625, 1.6246337890625, 1.7919921875, 1.9593505859375, 2.126708984375, 2.2940673828125, 2.46142578125, 2.6287841796875, 2.796142578125, 2.9635009765625, 3.130859375, 3.2982177734375, 3.465576171875, 3.6329345703125, 3.80029296875, 3.9676513671875, 4.135009765625, 4.3023681640625, 4.4697265625, 4.6370849609375, 4.804443359375, 4.9718017578125, 5.13916015625, 5.3065185546875, 5.473876953125, 5.6412353515625, 5.80859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 1.0, 5.0, 6.0, 15.0, 15.0, 36.0, 37.0, 59.0, 88.0, 135.0, 189.0, 337.0, 470.0, 700.0, 1061.0, 1492.0, 2084.0, 2997.0, 4307.0, 6451.0, 9896.0, 15150.0, 22629.0, 35182.0, 55573.0, 89561.0, 164710.0, 1352521.0, 124257.0, 73260.0, 46521.0, 29375.0, 19224.0, 12845.0, 8353.0, 5539.0, 3643.0, 2613.0, 1862.0, 1232.0, 882.0, 630.0, 421.0, 253.0, 175.0, 130.0, 85.0, 41.0, 42.0, 18.0, 11.0, 6.0, 7.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.966796875, -1.901885986328125, -1.83697509765625, -1.772064208984375, -1.7071533203125, -1.642242431640625, -1.57733154296875, -1.512420654296875, -1.447509765625, -1.382598876953125, -1.31768798828125, -1.252777099609375, -1.1878662109375, -1.122955322265625, -1.05804443359375, -0.993133544921875, -0.92822265625, -0.863311767578125, -0.79840087890625, -0.733489990234375, -0.6685791015625, -0.603668212890625, -0.53875732421875, -0.473846435546875, -0.408935546875, -0.344024658203125, -0.27911376953125, -0.214202880859375, -0.1492919921875, -0.084381103515625, -0.01947021484375, 0.045440673828125, 0.1103515625, 0.175262451171875, 0.24017333984375, 0.305084228515625, 0.3699951171875, 0.434906005859375, 0.49981689453125, 0.564727783203125, 0.629638671875, 0.694549560546875, 0.75946044921875, 0.824371337890625, 0.8892822265625, 0.954193115234375, 1.01910400390625, 1.084014892578125, 1.14892578125, 1.213836669921875, 1.27874755859375, 1.343658447265625, 1.4085693359375, 1.473480224609375, 1.53839111328125, 1.603302001953125, 1.668212890625, 1.733123779296875, 1.79803466796875, 1.862945556640625, 1.9278564453125, 1.992767333984375, 2.05767822265625, 2.122589111328125, 2.1875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 9.0, 4.0, 8.0, 13.0, 9.0, 16.0, 25.0, 30.0, 43.0, 46.0, 69.0, 78.0, 106.0, 123.0, 88.0, 72.0, 52.0, 44.0, 39.0, 33.0, 16.0, 9.0, 15.0, 10.0, 7.0, 5.0, 3.0, 11.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00041675567626953125, -0.00040387362241744995, -0.00039099156856536865, -0.00037810951471328735, -0.00036522746086120605, -0.00035234540700912476, -0.00033946335315704346, -0.00032658129930496216, -0.00031369924545288086, -0.00030081719160079956, -0.00028793513774871826, -0.00027505308389663696, -0.00026217103004455566, -0.00024928897619247437, -0.00023640692234039307, -0.00022352486848831177, -0.00021064281463623047, -0.00019776076078414917, -0.00018487870693206787, -0.00017199665307998657, -0.00015911459922790527, -0.00014623254537582397, -0.00013335049152374268, -0.00012046843767166138, -0.00010758638381958008, -9.470432996749878e-05, -8.182227611541748e-05, -6.894022226333618e-05, -5.605816841125488e-05, -4.3176114559173584e-05, -3.0294060707092285e-05, -1.7412006855010986e-05, -4.5299530029296875e-06, 8.352100849151611e-06, 2.123415470123291e-05, 3.411620855331421e-05, 4.699826240539551e-05, 5.988031625747681e-05, 7.27623701095581e-05, 8.56444239616394e-05, 9.85264778137207e-05, 0.000111408531665802, 0.0001242905855178833, 0.0001371726393699646, 0.0001500546932220459, 0.0001629367470741272, 0.0001758188009262085, 0.0001887008547782898, 0.0002015829086303711, 0.0002144649624824524, 0.0002273470163345337, 0.000240229070186615, 0.0002531111240386963, 0.0002659931778907776, 0.0002788752317428589, 0.0002917572855949402, 0.0003046393394470215, 0.0003175213932991028, 0.0003304034471511841, 0.0003432855010032654, 0.0003561675548553467, 0.000369049608707428, 0.0003819316625595093, 0.0003948137164115906, 0.0004076957702636719]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 0.0, 2.0, 7.0, 9.0, 6.0, 15.0, 12.0, 22.0, 16.0, 33.0, 45.0, 72.0, 126.0, 210.0, 456.0, 2383.0, 1038302.0, 5658.0, 553.0, 215.0, 141.0, 78.0, 44.0, 37.0, 26.0, 25.0, 17.0, 8.0, 10.0, 13.0, 2.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0091705322265625, -0.008880138397216797, -0.008589744567871094, -0.00829935073852539, -0.008008956909179688, -0.007718563079833984, -0.007428169250488281, -0.007137775421142578, -0.006847381591796875, -0.006556987762451172, -0.006266593933105469, -0.005976200103759766, -0.0056858062744140625, -0.005395412445068359, -0.005105018615722656, -0.004814624786376953, -0.00452423095703125, -0.004233837127685547, -0.003943443298339844, -0.0036530494689941406, -0.0033626556396484375, -0.0030722618103027344, -0.0027818679809570312, -0.002491474151611328, -0.002201080322265625, -0.0019106864929199219, -0.0016202926635742188, -0.0013298988342285156, -0.0010395050048828125, -0.0007491111755371094, -0.00045871734619140625, -0.00016832351684570312, 0.0001220703125, 0.0004124641418457031, 0.0007028579711914062, 0.0009932518005371094, 0.0012836456298828125, 0.0015740394592285156, 0.0018644332885742188, 0.002154827117919922, 0.002445220947265625, 0.002735614776611328, 0.0030260086059570312, 0.0033164024353027344, 0.0036067962646484375, 0.0038971900939941406, 0.004187583923339844, 0.004477977752685547, 0.00476837158203125, 0.005058765411376953, 0.005349159240722656, 0.005639553070068359, 0.0059299468994140625, 0.006220340728759766, 0.006510734558105469, 0.006801128387451172, 0.007091522216796875, 0.007381916046142578, 0.007672309875488281, 0.007962703704833984, 0.008253097534179688, 0.00854349136352539, 0.008833885192871094, 0.009124279022216797, 0.0094146728515625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 26.0, 125.0, 320.0, 349.0, 147.0, 37.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000897666672244668, -0.0008789906860329211, -0.0008603146998211741, -0.0008416387718170881, -0.0008229627856053412, -0.0008042867993935943, -0.0007856108713895082, -0.0007669348851777613, -0.0007482588989660144, -0.0007295829127542675, -0.0007109069265425205, -0.0006922309985384345, -0.0006735550123266876, -0.0006548790261149406, -0.0006362030981108546, -0.0006175271118991077, -0.0005988511256873608, -0.0005801751394756138, -0.0005614991532638669, -0.0005428232252597809, -0.000524147239048034, -0.000505471252836287, -0.00048679529572837055, -0.0004681193386204541, -0.00044944335240870714, -0.0004307673661969602, -0.00041209140908904374, -0.00039341545198112726, -0.00037473946576938033, -0.0003560634795576334, -0.0003373875224497169, -0.00031871156534180045, -0.0003000355209223926, -0.0002813595347106457, -0.0002626835776027292, -0.0002440076059428975, -0.0002253316342830658, -0.0002066556626232341, -0.0001879796909634024, -0.0001693037193035707, -0.00015062774764373899, -0.00013195177598390728, -0.00011327580432407558, -9.459983266424388e-05, -7.592386100441217e-05, -5.724788934458047e-05, -3.857191768474877e-05, -1.9895946024917066e-05, -1.2199743650853634e-06, 1.745599729474634e-05, 3.613196895457804e-05, 5.4807940614409745e-05, 7.348391227424145e-05, 9.215988393407315e-05, 0.00011083585559390485, 0.00012951182725373656, 0.00014818779891356826, 0.00016686377057339996, 0.00018553974223323166, 0.00020421571389306337, 0.00022289168555289507, 0.00024156765721272677, 0.0002602436288725585, 0.00027891958598047495, 0.0002975955721922219]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 5.0, 2.0, 3.0, 5.0, 9.0, 8.0, 10.0, 13.0, 15.0, 13.0, 14.0, 21.0, 19.0, 15.0, 21.0, 23.0, 28.0, 27.0, 24.0, 30.0, 44.0, 31.0, 32.0, 32.0, 30.0, 34.0, 38.0, 46.0, 38.0, 23.0, 39.0, 28.0, 34.0, 43.0, 28.0, 16.0, 17.0, 17.0, 20.0, 25.0, 18.0, 7.0, 10.0, 6.0, 10.0, 11.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00015294551849365234, -0.00014839600771665573, -0.00014384649693965912, -0.0001392969861626625, -0.0001347474753856659, -0.00013019796460866928, -0.00012564845383167267, -0.00012109894305467606, -0.00011654943227767944, -0.00011199992150068283, -0.00010745041072368622, -0.0001029008999466896, -9.835138916969299e-05, -9.380187839269638e-05, -8.925236761569977e-05, -8.470285683870316e-05, -8.015334606170654e-05, -7.560383528470993e-05, -7.105432450771332e-05, -6.65048137307167e-05, -6.195530295372009e-05, -5.740579217672348e-05, -5.285628139972687e-05, -4.8306770622730255e-05, -4.375725984573364e-05, -3.920774906873703e-05, -3.465823829174042e-05, -3.0108727514743805e-05, -2.5559216737747192e-05, -2.100970596075058e-05, -1.6460195183753967e-05, -1.1910684406757355e-05, -7.361173629760742e-06, -2.8116628527641296e-06, 1.737847924232483e-06, 6.2873587012290955e-06, 1.0836869478225708e-05, 1.538638025522232e-05, 1.9935891032218933e-05, 2.4485401809215546e-05, 2.9034912586212158e-05, 3.358442336320877e-05, 3.813393414020538e-05, 4.2683444917201996e-05, 4.723295569419861e-05, 5.178246647119522e-05, 5.6331977248191833e-05, 6.0881488025188446e-05, 6.543099880218506e-05, 6.998050957918167e-05, 7.453002035617828e-05, 7.90795311331749e-05, 8.362904191017151e-05, 8.817855268716812e-05, 9.272806346416473e-05, 9.727757424116135e-05, 0.00010182708501815796, 0.00010637659579515457, 0.00011092610657215118, 0.0001154756173491478, 0.00012002512812614441, 0.00012457463890314102, 0.00012912414968013763, 0.00013367366045713425, 0.00013822317123413086]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 13.0, 6.0, 12.0, 17.0, 20.0, 17.0, 21.0, 27.0, 28.0, 19.0, 42.0, 33.0, 31.0, 35.0, 42.0, 45.0, 41.0, 52.0, 38.0, 47.0, 51.0, 32.0, 36.0, 42.0, 29.0, 33.0, 33.0, 18.0, 26.0, 17.0, 11.0, 9.0, 15.0, 12.0, 7.0, 7.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.203125, -8.9273681640625, -8.651611328125, -8.3758544921875, -8.10009765625, -7.8243408203125, -7.548583984375, -7.2728271484375, -6.9970703125, -6.7213134765625, -6.445556640625, -6.1697998046875, -5.89404296875, -5.6182861328125, -5.342529296875, -5.0667724609375, -4.791015625, -4.5152587890625, -4.239501953125, -3.9637451171875, -3.68798828125, -3.4122314453125, -3.136474609375, -2.8607177734375, -2.5849609375, -2.3092041015625, -2.033447265625, -1.7576904296875, -1.48193359375, -1.2061767578125, -0.930419921875, -0.6546630859375, -0.37890625, -0.1031494140625, 0.172607421875, 0.4483642578125, 0.72412109375, 0.9998779296875, 1.275634765625, 1.5513916015625, 1.8271484375, 2.1029052734375, 2.378662109375, 2.6544189453125, 2.93017578125, 3.2059326171875, 3.481689453125, 3.7574462890625, 4.033203125, 4.3089599609375, 4.584716796875, 4.8604736328125, 5.13623046875, 5.4119873046875, 5.687744140625, 5.9635009765625, 6.2392578125, 6.5150146484375, 6.790771484375, 7.0665283203125, 7.34228515625, 7.6180419921875, 7.893798828125, 8.1695556640625, 8.4453125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 10.0, 9.0, 13.0, 16.0, 23.0, 23.0, 33.0, 45.0, 60.0, 74.0, 99.0, 141.0, 232.0, 339.0, 621.0, 1629.0, 7866.0, 56367.0, 427468.0, 477968.0, 63042.0, 8787.0, 1747.0, 703.0, 392.0, 226.0, 146.0, 99.0, 70.0, 68.0, 59.0, 28.0, 35.0, 21.0, 17.0, 11.0, 9.0, 14.0, 8.0, 3.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.125, -16.59033203125, -16.0556640625, -15.52099609375, -14.986328125, -14.45166015625, -13.9169921875, -13.38232421875, -12.84765625, -12.31298828125, -11.7783203125, -11.24365234375, -10.708984375, -10.17431640625, -9.6396484375, -9.10498046875, -8.5703125, -8.03564453125, -7.5009765625, -6.96630859375, -6.431640625, -5.89697265625, -5.3623046875, -4.82763671875, -4.29296875, -3.75830078125, -3.2236328125, -2.68896484375, -2.154296875, -1.61962890625, -1.0849609375, -0.55029296875, -0.015625, 0.51904296875, 1.0537109375, 1.58837890625, 2.123046875, 2.65771484375, 3.1923828125, 3.72705078125, 4.26171875, 4.79638671875, 5.3310546875, 5.86572265625, 6.400390625, 6.93505859375, 7.4697265625, 8.00439453125, 8.5390625, 9.07373046875, 9.6083984375, 10.14306640625, 10.677734375, 11.21240234375, 11.7470703125, 12.28173828125, 12.81640625, 13.35107421875, 13.8857421875, 14.42041015625, 14.955078125, 15.48974609375, 16.0244140625, 16.55908203125, 17.09375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 2.0, 10.0, 7.0, 8.0, 15.0, 22.0, 19.0, 14.0, 25.0, 33.0, 43.0, 40.0, 43.0, 46.0, 73.0, 141.0, 303.0, 1500.0, 163.0, 100.0, 68.0, 51.0, 47.0, 50.0, 43.0, 35.0, 24.0, 22.0, 23.0, 15.0, 17.0, 10.0, 10.0, 8.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.828125, -30.778076171875, -29.72802734375, -28.677978515625, -27.6279296875, -26.577880859375, -25.52783203125, -24.477783203125, -23.427734375, -22.377685546875, -21.32763671875, -20.277587890625, -19.2275390625, -18.177490234375, -17.12744140625, -16.077392578125, -15.02734375, -13.977294921875, -12.92724609375, -11.877197265625, -10.8271484375, -9.777099609375, -8.72705078125, -7.677001953125, -6.626953125, -5.576904296875, -4.52685546875, -3.476806640625, -2.4267578125, -1.376708984375, -0.32666015625, 0.723388671875, 1.7734375, 2.823486328125, 3.87353515625, 4.923583984375, 5.9736328125, 7.023681640625, 8.07373046875, 9.123779296875, 10.173828125, 11.223876953125, 12.27392578125, 13.323974609375, 14.3740234375, 15.424072265625, 16.47412109375, 17.524169921875, 18.57421875, 19.624267578125, 20.67431640625, 21.724365234375, 22.7744140625, 23.824462890625, 24.87451171875, 25.924560546875, 26.974609375, 28.024658203125, 29.07470703125, 30.124755859375, 31.1748046875, 32.224853515625, 33.27490234375, 34.324951171875, 35.375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 5.0, 10.0, 17.0, 14.0, 20.0, 27.0, 37.0, 39.0, 57.0, 54.0, 87.0, 122.0, 148.0, 263.0, 533.0, 1556.0, 69779.0, 3066245.0, 4782.0, 809.0, 359.0, 171.0, 144.0, 109.0, 70.0, 47.0, 36.0, 36.0, 37.0, 17.0, 17.0, 15.0, 9.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.5625, -96.271484375, -92.98046875, -89.689453125, -86.3984375, -83.107421875, -79.81640625, -76.525390625, -73.234375, -69.943359375, -66.65234375, -63.361328125, -60.0703125, -56.779296875, -53.48828125, -50.197265625, -46.90625, -43.615234375, -40.32421875, -37.033203125, -33.7421875, -30.451171875, -27.16015625, -23.869140625, -20.578125, -17.287109375, -13.99609375, -10.705078125, -7.4140625, -4.123046875, -0.83203125, 2.458984375, 5.75, 9.041015625, 12.33203125, 15.623046875, 18.9140625, 22.205078125, 25.49609375, 28.787109375, 32.078125, 35.369140625, 38.66015625, 41.951171875, 45.2421875, 48.533203125, 51.82421875, 55.115234375, 58.40625, 61.697265625, 64.98828125, 68.279296875, 71.5703125, 74.861328125, 78.15234375, 81.443359375, 84.734375, 88.025390625, 91.31640625, 94.607421875, 97.8984375, 101.189453125, 104.48046875, 107.771484375, 111.0625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 35.0, 231.0, 449.0, 254.0, 37.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-207.31723022460938, -203.58607482910156, -199.8549346923828, -196.123779296875, -192.39263916015625, -188.66148376464844, -184.93032836914062, -181.19918823242188, -177.46803283691406, -173.73687744140625, -170.0057373046875, -166.2745819091797, -162.54344177246094, -158.81228637695312, -155.08114624023438, -151.34999084472656, -147.61883544921875, -143.88768005371094, -140.1565399169922, -136.42538452148438, -132.69424438476562, -128.9630889892578, -125.23194122314453, -121.50079345703125, -117.7696533203125, -114.03850555419922, -110.30735778808594, -106.57620239257812, -102.84505462646484, -99.11390686035156, -95.38275909423828, -91.651611328125, -87.92046356201172, -84.18931579589844, -80.45816802978516, -76.72702026367188, -72.99586486816406, -69.26471710205078, -65.5335693359375, -61.80242156982422, -58.07126998901367, -54.34012222290039, -50.608970642089844, -46.87782287597656, -43.14667510986328, -39.415523529052734, -35.68437576293945, -31.95322608947754, -28.222076416015625, -24.49092674255371, -20.759777069091797, -17.028629302978516, -13.297479629516602, -9.566329956054688, -5.835182189941406, -2.104032516479492, 1.6271171569824219, 5.358266353607178, 9.089415550231934, 12.820564270019531, 16.551713943481445, 20.28286361694336, 24.01401138305664, 27.745161056518555, 31.47631072998047]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 10.0, 9.0, 7.0, 9.0, 9.0, 14.0, 15.0, 22.0, 13.0, 15.0, 26.0, 28.0, 29.0, 30.0, 50.0, 38.0, 38.0, 30.0, 45.0, 39.0, 43.0, 44.0, 35.0, 47.0, 41.0, 34.0, 33.0, 21.0, 22.0, 20.0, 27.0, 23.0, 13.0, 16.0, 16.0, 18.0, 13.0, 8.0, 11.0, 3.0, 10.0, 5.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-70.11868286132812, -67.88211059570312, -65.64554595947266, -63.408973693847656, -61.172401428222656, -58.93583297729492, -56.69926452636719, -54.46269226074219, -52.22612380981445, -49.98955535888672, -47.75298309326172, -45.516414642333984, -43.27984619140625, -41.04327392578125, -38.806705474853516, -36.57013702392578, -34.33356475830078, -32.09699630737305, -29.860424041748047, -27.623855590820312, -25.387285232543945, -23.150714874267578, -20.914146423339844, -18.677576065063477, -16.44100570678711, -14.204435348510742, -11.967865943908691, -9.73129653930664, -7.494726181030273, -5.258155822753906, -3.0215864181518555, -0.7850170135498047, 1.4515533447265625, 3.6881232261657715, 5.9246931076049805, 8.161262512207031, 10.397832870483398, 12.634403228759766, 14.870972633361816, 17.107542037963867, 19.344112396240234, 21.5806827545166, 23.81725311279297, 26.053821563720703, 28.29039192199707, 30.526962280273438, 32.76353073120117, 35.000099182128906, 37.236671447753906, 39.47323989868164, 41.70981216430664, 43.946380615234375, 46.182952880859375, 48.41952133178711, 50.656089782714844, 52.892662048339844, 55.12923049926758, 57.36579895019531, 59.60237121582031, 61.83893966674805, 64.07550811767578, 66.31208038330078, 68.54865264892578, 70.78521728515625, 73.02178955078125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 9.0, 2.0, 12.0, 5.0, 14.0, 16.0, 15.0, 20.0, 28.0, 29.0, 34.0, 31.0, 34.0, 24.0, 44.0, 38.0, 46.0, 43.0, 45.0, 49.0, 43.0, 45.0, 36.0, 45.0, 37.0, 26.0, 44.0, 31.0, 17.0, 22.0, 27.0, 16.0, 15.0, 11.0, 10.0, 8.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.3828125, -11.056884765625, -10.73095703125, -10.405029296875, -10.0791015625, -9.753173828125, -9.42724609375, -9.101318359375, -8.775390625, -8.449462890625, -8.12353515625, -7.797607421875, -7.4716796875, -7.145751953125, -6.81982421875, -6.493896484375, -6.16796875, -5.842041015625, -5.51611328125, -5.190185546875, -4.8642578125, -4.538330078125, -4.21240234375, -3.886474609375, -3.560546875, -3.234619140625, -2.90869140625, -2.582763671875, -2.2568359375, -1.930908203125, -1.60498046875, -1.279052734375, -0.953125, -0.627197265625, -0.30126953125, 0.024658203125, 0.3505859375, 0.676513671875, 1.00244140625, 1.328369140625, 1.654296875, 1.980224609375, 2.30615234375, 2.632080078125, 2.9580078125, 3.283935546875, 3.60986328125, 3.935791015625, 4.26171875, 4.587646484375, 4.91357421875, 5.239501953125, 5.5654296875, 5.891357421875, 6.21728515625, 6.543212890625, 6.869140625, 7.195068359375, 7.52099609375, 7.846923828125, 8.1728515625, 8.498779296875, 8.82470703125, 9.150634765625, 9.4765625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 6.0, 0.0, 3.0, 5.0, 5.0, 5.0, 8.0, 12.0, 18.0, 16.0, 39.0, 41.0, 34.0, 49.0, 81.0, 136.0, 194.0, 322.0, 671.0, 1701.0, 5869.0, 31521.0, 216888.0, 1028034.0, 1820825.0, 878763.0, 174801.0, 26345.0, 4984.0, 1477.0, 565.0, 278.0, 180.0, 109.0, 70.0, 42.0, 45.0, 30.0, 26.0, 21.0, 12.0, 14.0, 9.0, 6.0, 9.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.5234375, -14.089111328125, -13.65478515625, -13.220458984375, -12.7861328125, -12.351806640625, -11.91748046875, -11.483154296875, -11.048828125, -10.614501953125, -10.18017578125, -9.745849609375, -9.3115234375, -8.877197265625, -8.44287109375, -8.008544921875, -7.57421875, -7.139892578125, -6.70556640625, -6.271240234375, -5.8369140625, -5.402587890625, -4.96826171875, -4.533935546875, -4.099609375, -3.665283203125, -3.23095703125, -2.796630859375, -2.3623046875, -1.927978515625, -1.49365234375, -1.059326171875, -0.625, -0.190673828125, 0.24365234375, 0.677978515625, 1.1123046875, 1.546630859375, 1.98095703125, 2.415283203125, 2.849609375, 3.283935546875, 3.71826171875, 4.152587890625, 4.5869140625, 5.021240234375, 5.45556640625, 5.889892578125, 6.32421875, 6.758544921875, 7.19287109375, 7.627197265625, 8.0615234375, 8.495849609375, 8.93017578125, 9.364501953125, 9.798828125, 10.233154296875, 10.66748046875, 11.101806640625, 11.5361328125, 11.970458984375, 12.40478515625, 12.839111328125, 13.2734375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 4.0, 5.0, 10.0, 13.0, 20.0, 15.0, 40.0, 50.0, 54.0, 74.0, 83.0, 111.0, 150.0, 192.0, 237.0, 294.0, 332.0, 357.0, 371.0, 320.0, 270.0, 230.0, 175.0, 132.0, 104.0, 93.0, 69.0, 49.0, 59.0, 32.0, 25.0, 29.0, 16.0, 11.0, 13.0, 3.0, 7.0, 6.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.5577392578125, -15.099853515625, -14.6419677734375, -14.18408203125, -13.7261962890625, -13.268310546875, -12.8104248046875, -12.3525390625, -11.8946533203125, -11.436767578125, -10.9788818359375, -10.52099609375, -10.0631103515625, -9.605224609375, -9.1473388671875, -8.689453125, -8.2315673828125, -7.773681640625, -7.3157958984375, -6.85791015625, -6.4000244140625, -5.942138671875, -5.4842529296875, -5.0263671875, -4.5684814453125, -4.110595703125, -3.6527099609375, -3.19482421875, -2.7369384765625, -2.279052734375, -1.8211669921875, -1.36328125, -0.9053955078125, -0.447509765625, 0.0103759765625, 0.46826171875, 0.9261474609375, 1.384033203125, 1.8419189453125, 2.2998046875, 2.7576904296875, 3.215576171875, 3.6734619140625, 4.13134765625, 4.5892333984375, 5.047119140625, 5.5050048828125, 5.962890625, 6.4207763671875, 6.878662109375, 7.3365478515625, 7.79443359375, 8.2523193359375, 8.710205078125, 9.1680908203125, 9.6259765625, 10.0838623046875, 10.541748046875, 10.9996337890625, 11.45751953125, 11.9154052734375, 12.373291015625, 12.8311767578125, 13.2890625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 4.0, 5.0, 13.0, 9.0, 21.0, 17.0, 40.0, 44.0, 56.0, 82.0, 128.0, 160.0, 187.0, 248.0, 341.0, 578.0, 1151.0, 3107.0, 50424.0, 3649117.0, 477430.0, 7242.0, 1500.0, 746.0, 478.0, 298.0, 219.0, 179.0, 130.0, 89.0, 77.0, 36.0, 28.0, 29.0, 14.0, 17.0, 7.0, 8.0, 8.0, 4.0, 5.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.78125, -46.11767578125, -44.4541015625, -42.79052734375, -41.126953125, -39.46337890625, -37.7998046875, -36.13623046875, -34.47265625, -32.80908203125, -31.1455078125, -29.48193359375, -27.818359375, -26.15478515625, -24.4912109375, -22.82763671875, -21.1640625, -19.50048828125, -17.8369140625, -16.17333984375, -14.509765625, -12.84619140625, -11.1826171875, -9.51904296875, -7.85546875, -6.19189453125, -4.5283203125, -2.86474609375, -1.201171875, 0.46240234375, 2.1259765625, 3.78955078125, 5.453125, 7.11669921875, 8.7802734375, 10.44384765625, 12.107421875, 13.77099609375, 15.4345703125, 17.09814453125, 18.76171875, 20.42529296875, 22.0888671875, 23.75244140625, 25.416015625, 27.07958984375, 28.7431640625, 30.40673828125, 32.0703125, 33.73388671875, 35.3974609375, 37.06103515625, 38.724609375, 40.38818359375, 42.0517578125, 43.71533203125, 45.37890625, 47.04248046875, 48.7060546875, 50.36962890625, 52.033203125, 53.69677734375, 55.3603515625, 57.02392578125, 58.6875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 10.0, 100.0, 357.0, 383.0, 142.0, 17.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-419.21783447265625, -411.4634094238281, -403.708984375, -395.9545593261719, -388.20013427734375, -380.4457092285156, -372.6912841796875, -364.9368591308594, -357.18243408203125, -349.4280090332031, -341.673583984375, -333.9191589355469, -326.16473388671875, -318.4103088378906, -310.6558837890625, -302.9014587402344, -295.14703369140625, -287.3926086425781, -279.63818359375, -271.8837585449219, -264.12933349609375, -256.3749084472656, -248.6204833984375, -240.86605834960938, -233.1116180419922, -225.35719299316406, -217.60276794433594, -209.8483428955078, -202.0939178466797, -194.33949279785156, -186.58506774902344, -178.8306427001953, -171.07623291015625, -163.32180786132812, -155.5673828125, -147.81295776367188, -140.05853271484375, -132.30410766601562, -124.5496826171875, -116.79525756835938, -109.04081726074219, -101.28639221191406, -93.53196716308594, -85.77754211425781, -78.02311706542969, -70.26869201660156, -62.51426315307617, -54.75983810424805, -47.00541687011719, -39.25099182128906, -31.496566772460938, -23.74213981628418, -15.987714767456055, -8.233287811279297, -0.4788627624511719, 7.275562286376953, 15.029987335205078, 22.784412384033203, 30.538837432861328, 38.29326629638672, 46.047691345214844, 53.80211639404297, 61.556541442871094, 69.31096649169922, 77.06539154052734]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 12.0, 6.0, 17.0, 14.0, 14.0, 14.0, 15.0, 16.0, 26.0, 33.0, 24.0, 32.0, 27.0, 43.0, 43.0, 33.0, 49.0, 34.0, 54.0, 40.0, 43.0, 40.0, 54.0, 38.0, 35.0, 41.0, 33.0, 25.0, 24.0, 29.0, 21.0, 10.0, 15.0, 13.0, 10.0, 5.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.907901763916016, -60.98272705078125, -59.05754852294922, -57.13237380981445, -55.20719909667969, -53.282020568847656, -51.35684585571289, -49.431671142578125, -47.506492614746094, -45.58131790161133, -43.6561393737793, -41.73096466064453, -39.805789947509766, -37.880615234375, -35.95543670654297, -34.0302619934082, -32.10508728027344, -30.17991065979004, -28.254735946655273, -26.329559326171875, -24.40438461303711, -22.47920799255371, -20.554031372070312, -18.628856658935547, -16.70368003845215, -14.778504371643066, -12.853328704833984, -10.928152084350586, -9.002976417541504, -7.077800750732422, -5.152624130249023, -3.2274484634399414, -1.302276611328125, 0.6228992938995361, 2.5480751991271973, 4.4732513427734375, 6.3984270095825195, 8.323602676391602, 10.248779296875, 12.173954963684082, 14.099130630493164, 16.024307250976562, 17.949481964111328, 19.874658584594727, 21.799835205078125, 23.72500991821289, 25.65018653869629, 27.575363159179688, 29.500537872314453, 31.42571449279785, 33.35089111328125, 35.276065826416016, 37.20124053955078, 39.12641906738281, 41.05159378051758, 42.976768493652344, 44.901947021484375, 46.82712173461914, 48.75230026245117, 50.67747497558594, 52.6026496887207, 54.52782440185547, 56.4530029296875, 58.378177642822266, 60.30335235595703]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 2.0, 7.0, 6.0, 3.0, 6.0, 8.0, 10.0, 14.0, 13.0, 20.0, 19.0, 16.0, 21.0, 30.0, 39.0, 25.0, 26.0, 36.0, 34.0, 52.0, 36.0, 36.0, 41.0, 48.0, 41.0, 48.0, 38.0, 40.0, 32.0, 34.0, 28.0, 24.0, 16.0, 31.0, 21.0, 10.0, 19.0, 10.0, 10.0, 9.0, 8.0, 11.0, 5.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.2578125, -8.9742431640625, -8.690673828125, -8.4071044921875, -8.12353515625, -7.8399658203125, -7.556396484375, -7.2728271484375, -6.9892578125, -6.7056884765625, -6.422119140625, -6.1385498046875, -5.85498046875, -5.5714111328125, -5.287841796875, -5.0042724609375, -4.720703125, -4.4371337890625, -4.153564453125, -3.8699951171875, -3.58642578125, -3.3028564453125, -3.019287109375, -2.7357177734375, -2.4521484375, -2.1685791015625, -1.885009765625, -1.6014404296875, -1.31787109375, -1.0343017578125, -0.750732421875, -0.4671630859375, -0.18359375, 0.0999755859375, 0.383544921875, 0.6671142578125, 0.95068359375, 1.2342529296875, 1.517822265625, 1.8013916015625, 2.0849609375, 2.3685302734375, 2.652099609375, 2.9356689453125, 3.21923828125, 3.5028076171875, 3.786376953125, 4.0699462890625, 4.353515625, 4.6370849609375, 4.920654296875, 5.2042236328125, 5.48779296875, 5.7713623046875, 6.054931640625, 6.3385009765625, 6.6220703125, 6.9056396484375, 7.189208984375, 7.4727783203125, 7.75634765625, 8.0399169921875, 8.323486328125, 8.6070556640625, 8.890625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 13.0, 19.0, 34.0, 54.0, 77.0, 110.0, 148.0, 236.0, 371.0, 533.0, 790.0, 1111.0, 1735.0, 2508.0, 3662.0, 5402.0, 8181.0, 12209.0, 18688.0, 28710.0, 45889.0, 79457.0, 160741.0, 350838.0, 136995.0, 70458.0, 41575.0, 26564.0, 17070.0, 11171.0, 7553.0, 5098.0, 3394.0, 2283.0, 1547.0, 1093.0, 747.0, 465.0, 360.0, 215.0, 153.0, 109.0, 54.0, 42.0, 32.0, 23.0, 11.0, 9.0, 6.0, 7.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.40625, -2.329620361328125, -2.25299072265625, -2.176361083984375, -2.0997314453125, -2.023101806640625, -1.94647216796875, -1.869842529296875, -1.793212890625, -1.716583251953125, -1.63995361328125, -1.563323974609375, -1.4866943359375, -1.410064697265625, -1.33343505859375, -1.256805419921875, -1.18017578125, -1.103546142578125, -1.02691650390625, -0.950286865234375, -0.8736572265625, -0.797027587890625, -0.72039794921875, -0.643768310546875, -0.567138671875, -0.490509033203125, -0.41387939453125, -0.337249755859375, -0.2606201171875, -0.183990478515625, -0.10736083984375, -0.030731201171875, 0.0458984375, 0.122528076171875, 0.19915771484375, 0.275787353515625, 0.3524169921875, 0.429046630859375, 0.50567626953125, 0.582305908203125, 0.658935546875, 0.735565185546875, 0.81219482421875, 0.888824462890625, 0.9654541015625, 1.042083740234375, 1.11871337890625, 1.195343017578125, 1.27197265625, 1.348602294921875, 1.42523193359375, 1.501861572265625, 1.5784912109375, 1.655120849609375, 1.73175048828125, 1.808380126953125, 1.885009765625, 1.961639404296875, 2.03826904296875, 2.114898681640625, 2.1915283203125, 2.268157958984375, 2.34478759765625, 2.421417236328125, 2.498046875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 8.0, 6.0, 12.0, 9.0, 8.0, 12.0, 12.0, 17.0, 22.0, 23.0, 33.0, 28.0, 37.0, 42.0, 38.0, 29.0, 48.0, 36.0, 38.0, 1063.0, 45.0, 37.0, 51.0, 39.0, 36.0, 37.0, 41.0, 27.0, 30.0, 26.0, 28.0, 20.0, 18.0, 17.0, 14.0, 7.0, 7.0, 13.0, 3.0, 8.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-7.5859375, -7.38568115234375, -7.1854248046875, -6.98516845703125, -6.784912109375, -6.58465576171875, -6.3843994140625, -6.18414306640625, -5.98388671875, -5.78363037109375, -5.5833740234375, -5.38311767578125, -5.182861328125, -4.98260498046875, -4.7823486328125, -4.58209228515625, -4.3818359375, -4.18157958984375, -3.9813232421875, -3.78106689453125, -3.580810546875, -3.38055419921875, -3.1802978515625, -2.98004150390625, -2.77978515625, -2.57952880859375, -2.3792724609375, -2.17901611328125, -1.978759765625, -1.77850341796875, -1.5782470703125, -1.37799072265625, -1.177734375, -0.97747802734375, -0.7772216796875, -0.57696533203125, -0.376708984375, -0.17645263671875, 0.0238037109375, 0.22406005859375, 0.42431640625, 0.62457275390625, 0.8248291015625, 1.02508544921875, 1.225341796875, 1.42559814453125, 1.6258544921875, 1.82611083984375, 2.0263671875, 2.22662353515625, 2.4268798828125, 2.62713623046875, 2.827392578125, 3.02764892578125, 3.2279052734375, 3.42816162109375, 3.62841796875, 3.82867431640625, 4.0289306640625, 4.22918701171875, 4.429443359375, 4.62969970703125, 4.8299560546875, 5.03021240234375, 5.23046875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 8.0, 18.0, 25.0, 38.0, 36.0, 87.0, 117.0, 209.0, 386.0, 495.0, 983.0, 1523.0, 2383.0, 3779.0, 5832.0, 9562.0, 16053.0, 26136.0, 44414.0, 75719.0, 135693.0, 1380862.0, 170961.0, 89910.0, 52639.0, 30931.0, 18614.0, 11266.0, 6899.0, 4169.0, 2770.0, 1767.0, 1056.0, 715.0, 418.0, 235.0, 150.0, 107.0, 51.0, 40.0, 16.0, 22.0, 6.0, 16.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.85546875, -2.7706298828125, -2.685791015625, -2.6009521484375, -2.51611328125, -2.4312744140625, -2.346435546875, -2.2615966796875, -2.1767578125, -2.0919189453125, -2.007080078125, -1.9222412109375, -1.83740234375, -1.7525634765625, -1.667724609375, -1.5828857421875, -1.498046875, -1.4132080078125, -1.328369140625, -1.2435302734375, -1.15869140625, -1.0738525390625, -0.989013671875, -0.9041748046875, -0.8193359375, -0.7344970703125, -0.649658203125, -0.5648193359375, -0.47998046875, -0.3951416015625, -0.310302734375, -0.2254638671875, -0.140625, -0.0557861328125, 0.029052734375, 0.1138916015625, 0.19873046875, 0.2835693359375, 0.368408203125, 0.4532470703125, 0.5380859375, 0.6229248046875, 0.707763671875, 0.7926025390625, 0.87744140625, 0.9622802734375, 1.047119140625, 1.1319580078125, 1.216796875, 1.3016357421875, 1.386474609375, 1.4713134765625, 1.55615234375, 1.6409912109375, 1.725830078125, 1.8106689453125, 1.8955078125, 1.9803466796875, 2.065185546875, 2.1500244140625, 2.23486328125, 2.3197021484375, 2.404541015625, 2.4893798828125, 2.57421875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 0.0, 3.0, 5.0, 3.0, 5.0, 3.0, 5.0, 10.0, 13.0, 11.0, 13.0, 19.0, 23.0, 34.0, 30.0, 42.0, 51.0, 78.0, 92.0, 104.0, 109.0, 68.0, 56.0, 52.0, 31.0, 42.0, 17.0, 26.0, 12.0, 8.0, 13.0, 4.0, 5.0, 2.0, 1.0, 5.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005817413330078125, -0.0005673989653587341, -0.0005530565977096558, -0.0005387142300605774, -0.000524371862411499, -0.0005100294947624207, -0.0004956871271133423, -0.0004813447594642639, -0.00046700239181518555, -0.0004526600241661072, -0.0004383176565170288, -0.00042397528886795044, -0.00040963292121887207, -0.0003952905535697937, -0.00038094818592071533, -0.00036660581827163696, -0.0003522634506225586, -0.0003379210829734802, -0.00032357871532440186, -0.0003092363476753235, -0.0002948939800262451, -0.00028055161237716675, -0.0002662092447280884, -0.00025186687707901, -0.00023752450942993164, -0.00022318214178085327, -0.0002088397741317749, -0.00019449740648269653, -0.00018015503883361816, -0.0001658126711845398, -0.00015147030353546143, -0.00013712793588638306, -0.0001227855682373047, -0.00010844320058822632, -9.410083293914795e-05, -7.975846529006958e-05, -6.541609764099121e-05, -5.107372999191284e-05, -3.673136234283447e-05, -2.2388994693756104e-05, -8.046627044677734e-06, 6.295740604400635e-06, 2.0638108253479004e-05, 3.498047590255737e-05, 4.932284355163574e-05, 6.366521120071411e-05, 7.800757884979248e-05, 9.234994649887085e-05, 0.00010669231414794922, 0.00012103468179702759, 0.00013537704944610596, 0.00014971941709518433, 0.0001640617847442627, 0.00017840415239334106, 0.00019274652004241943, 0.0002070888876914978, 0.00022143125534057617, 0.00023577362298965454, 0.0002501159906387329, 0.0002644583582878113, 0.00027880072593688965, 0.000293143093585968, 0.0003074854612350464, 0.00032182782888412476, 0.0003361701965332031]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 6.0, 2.0, 7.0, 10.0, 15.0, 13.0, 9.0, 24.0, 39.0, 50.0, 69.0, 81.0, 139.0, 232.0, 555.0, 3203.0, 1037788.0, 4923.0, 636.0, 242.0, 137.0, 95.0, 59.0, 52.0, 40.0, 19.0, 19.0, 10.0, 19.0, 11.0, 9.0, 12.0, 6.0, 4.0, 10.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0069580078125, -0.006662487983703613, -0.0063669681549072266, -0.00607144832611084, -0.005775928497314453, -0.005480408668518066, -0.00518488883972168, -0.004889369010925293, -0.004593849182128906, -0.0042983293533325195, -0.004002809524536133, -0.003707289695739746, -0.0034117698669433594, -0.0031162500381469727, -0.002820730209350586, -0.0025252103805541992, -0.0022296905517578125, -0.0019341707229614258, -0.001638650894165039, -0.0013431310653686523, -0.0010476112365722656, -0.0007520914077758789, -0.0004565715789794922, -0.00016105175018310547, 0.00013446807861328125, 0.00042998790740966797, 0.0007255077362060547, 0.0010210275650024414, 0.0013165473937988281, 0.0016120672225952148, 0.0019075870513916016, 0.0022031068801879883, 0.002498626708984375, 0.0027941465377807617, 0.0030896663665771484, 0.003385186195373535, 0.003680706024169922, 0.003976225852966309, 0.004271745681762695, 0.004567265510559082, 0.004862785339355469, 0.0051583051681518555, 0.005453824996948242, 0.005749344825744629, 0.006044864654541016, 0.006340384483337402, 0.006635904312133789, 0.006931424140930176, 0.0072269439697265625, 0.007522463798522949, 0.007817983627319336, 0.008113503456115723, 0.00840902328491211, 0.008704543113708496, 0.009000062942504883, 0.00929558277130127, 0.009591102600097656, 0.009886622428894043, 0.01018214225769043, 0.010477662086486816, 0.010773181915283203, 0.01106870174407959, 0.011364221572875977, 0.011659741401672363, 0.01195526123046875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 20.0, 131.0, 415.0, 345.0, 83.0, 16.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0013385488418862224, -0.001314577297307551, -0.0012906056363135576, -0.0012666340917348862, -0.0012426624307408929, -0.0012186908861622214, -0.0011947192251682281, -0.0011707476805895567, -0.0011467761360108852, -0.0011228045914322138, -0.0010988329304382205, -0.001074861385859549, -0.0010508897248655558, -0.0010269181802868843, -0.0010029466357082129, -0.0009789749747142196, -0.0009550033137202263, -0.0009310317109338939, -0.0009070601081475616, -0.0008830885635688901, -0.0008591169607825577, -0.0008351453579962254, -0.000811173755209893, -0.0007872021524235606, -0.0007632306078448892, -0.0007392590050585568, -0.0007152874022722244, -0.000691315857693553, -0.0006673442549072206, -0.0006433726521208882, -0.0006194010493345559, -0.0005954294465482235, -0.0005714578437618911, -0.0005474862409755588, -0.0005235146381892264, -0.000499543035402894, -0.0004755714617203921, -0.0004515998880378902, -0.0004276282852515578, -0.00040365668246522546, -0.00037968510878272355, -0.0003557135059963912, -0.00033174193231388927, -0.0003077703295275569, -0.00028379872674122453, -0.00025982712395489216, -0.00023585555027239025, -0.00021188394748605788, -0.00018791235925164074, -0.0001639407710172236, -0.00013996916823089123, -0.00011599757999647409, -9.202598448609933e-05, -6.805438897572458e-05, -4.408280074130744e-05, -2.011119795497507e-05, 3.860390279442072e-06, 2.7831983970827423e-05, 5.1803577662212774e-05, 7.577516953460872e-05, 9.974676504498348e-05, 0.00012371836055535823, 0.00014768994878977537, 0.00017166155157610774, 0.00019563313981052488]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 14.0, 3.0, 11.0, 9.0, 7.0, 10.0, 19.0, 12.0, 14.0, 23.0, 23.0, 34.0, 36.0, 42.0, 31.0, 32.0, 45.0, 43.0, 47.0, 43.0, 42.0, 40.0, 44.0, 38.0, 39.0, 25.0, 38.0, 25.0, 28.0, 32.0, 24.0, 22.0, 17.0, 21.0, 14.0, 14.0, 10.0, 6.0, 3.0, 7.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017088651657104492, -0.000164874829351902, -0.0001588631421327591, -0.00015285145491361618, -0.00014683976769447327, -0.00014082808047533035, -0.00013481639325618744, -0.00012880470603704453, -0.0001227930188179016, -0.0001167813315987587, -0.00011076964437961578, -0.00010475795716047287, -9.874626994132996e-05, -9.273458272218704e-05, -8.672289550304413e-05, -8.071120828390121e-05, -7.46995210647583e-05, -6.868783384561539e-05, -6.267614662647247e-05, -5.666445940732956e-05, -5.0652772188186646e-05, -4.464108496904373e-05, -3.862939774990082e-05, -3.2617710530757904e-05, -2.660602331161499e-05, -2.0594336092472076e-05, -1.4582648873329163e-05, -8.570961654186249e-06, -2.559274435043335e-06, 3.452412784099579e-06, 9.464100003242493e-06, 1.5475787222385406e-05, 2.148747444152832e-05, 2.7499161660671234e-05, 3.351084887981415e-05, 3.952253609895706e-05, 4.5534223318099976e-05, 5.154591053724289e-05, 5.75575977563858e-05, 6.356928497552872e-05, 6.958097219467163e-05, 7.559265941381454e-05, 8.160434663295746e-05, 8.761603385210037e-05, 9.362772107124329e-05, 9.96394082903862e-05, 0.00010565109550952911, 0.00011166278272867203, 0.00011767446994781494, 0.00012368615716695786, 0.00012969784438610077, 0.00013570953160524368, 0.0001417212188243866, 0.0001477329060435295, 0.00015374459326267242, 0.00015975628048181534, 0.00016576796770095825, 0.00017177965492010117, 0.00017779134213924408, 0.000183803029358387, 0.0001898147165775299, 0.00019582640379667282, 0.00020183809101581573, 0.00020784977823495865, 0.00021386146545410156]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 2.0, 7.0, 6.0, 3.0, 6.0, 8.0, 10.0, 14.0, 13.0, 20.0, 19.0, 16.0, 21.0, 30.0, 39.0, 25.0, 26.0, 36.0, 34.0, 51.0, 37.0, 36.0, 41.0, 48.0, 41.0, 48.0, 38.0, 40.0, 32.0, 34.0, 28.0, 24.0, 16.0, 31.0, 21.0, 10.0, 19.0, 10.0, 10.0, 9.0, 8.0, 11.0, 5.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.2578125, -8.9742431640625, -8.690673828125, -8.4071044921875, -8.12353515625, -7.8399658203125, -7.556396484375, -7.2728271484375, -6.9892578125, -6.7056884765625, -6.422119140625, -6.1385498046875, -5.85498046875, -5.5714111328125, -5.287841796875, -5.0042724609375, -4.720703125, -4.4371337890625, -4.153564453125, -3.8699951171875, -3.58642578125, -3.3028564453125, -3.019287109375, -2.7357177734375, -2.4521484375, -2.1685791015625, -1.885009765625, -1.6014404296875, -1.31787109375, -1.0343017578125, -0.750732421875, -0.4671630859375, -0.18359375, 0.0999755859375, 0.383544921875, 0.6671142578125, 0.95068359375, 1.2342529296875, 1.517822265625, 1.8013916015625, 2.0849609375, 2.3685302734375, 2.652099609375, 2.9356689453125, 3.21923828125, 3.5028076171875, 3.786376953125, 4.0699462890625, 4.353515625, 4.6370849609375, 4.920654296875, 5.2042236328125, 5.48779296875, 5.7713623046875, 6.054931640625, 6.3385009765625, 6.6220703125, 6.9056396484375, 7.189208984375, 7.4727783203125, 7.75634765625, 8.0399169921875, 8.323486328125, 8.6070556640625, 8.890625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 6.0, 6.0, 5.0, 11.0, 8.0, 14.0, 21.0, 22.0, 29.0, 38.0, 71.0, 110.0, 173.0, 305.0, 606.0, 1342.0, 3000.0, 6792.0, 16251.0, 39755.0, 108605.0, 278324.0, 338920.0, 158355.0, 56665.0, 22259.0, 9273.0, 3959.0, 1782.0, 806.0, 413.0, 208.0, 128.0, 73.0, 55.0, 34.0, 31.0, 21.0, 14.0, 7.0, 11.0, 9.0, 10.0, 6.0, 6.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6640625, -9.36376953125, -9.0634765625, -8.76318359375, -8.462890625, -8.16259765625, -7.8623046875, -7.56201171875, -7.26171875, -6.96142578125, -6.6611328125, -6.36083984375, -6.060546875, -5.76025390625, -5.4599609375, -5.15966796875, -4.859375, -4.55908203125, -4.2587890625, -3.95849609375, -3.658203125, -3.35791015625, -3.0576171875, -2.75732421875, -2.45703125, -2.15673828125, -1.8564453125, -1.55615234375, -1.255859375, -0.95556640625, -0.6552734375, -0.35498046875, -0.0546875, 0.24560546875, 0.5458984375, 0.84619140625, 1.146484375, 1.44677734375, 1.7470703125, 2.04736328125, 2.34765625, 2.64794921875, 2.9482421875, 3.24853515625, 3.548828125, 3.84912109375, 4.1494140625, 4.44970703125, 4.75, 5.05029296875, 5.3505859375, 5.65087890625, 5.951171875, 6.25146484375, 6.5517578125, 6.85205078125, 7.15234375, 7.45263671875, 7.7529296875, 8.05322265625, 8.353515625, 8.65380859375, 8.9541015625, 9.25439453125, 9.5546875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 6.0, 8.0, 13.0, 13.0, 11.0, 14.0, 20.0, 33.0, 22.0, 32.0, 34.0, 41.0, 51.0, 42.0, 56.0, 79.0, 195.0, 1464.0, 344.0, 126.0, 64.0, 47.0, 44.0, 42.0, 34.0, 36.0, 27.0, 22.0, 18.0, 17.0, 15.0, 14.0, 8.0, 17.0, 9.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.625, -25.59423828125, -24.5634765625, -23.53271484375, -22.501953125, -21.47119140625, -20.4404296875, -19.40966796875, -18.37890625, -17.34814453125, -16.3173828125, -15.28662109375, -14.255859375, -13.22509765625, -12.1943359375, -11.16357421875, -10.1328125, -9.10205078125, -8.0712890625, -7.04052734375, -6.009765625, -4.97900390625, -3.9482421875, -2.91748046875, -1.88671875, -0.85595703125, 0.1748046875, 1.20556640625, 2.236328125, 3.26708984375, 4.2978515625, 5.32861328125, 6.359375, 7.39013671875, 8.4208984375, 9.45166015625, 10.482421875, 11.51318359375, 12.5439453125, 13.57470703125, 14.60546875, 15.63623046875, 16.6669921875, 17.69775390625, 18.728515625, 19.75927734375, 20.7900390625, 21.82080078125, 22.8515625, 23.88232421875, 24.9130859375, 25.94384765625, 26.974609375, 28.00537109375, 29.0361328125, 30.06689453125, 31.09765625, 32.12841796875, 33.1591796875, 34.18994140625, 35.220703125, 36.25146484375, 37.2822265625, 38.31298828125, 39.34375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 4.0, 1.0, 11.0, 13.0, 13.0, 20.0, 37.0, 47.0, 61.0, 77.0, 100.0, 189.0, 306.0, 570.0, 1493.0, 46130.0, 3076402.0, 17629.0, 1170.0, 529.0, 273.0, 198.0, 130.0, 66.0, 49.0, 44.0, 28.0, 22.0, 21.0, 10.0, 9.0, 11.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.125, -69.6728515625, -67.220703125, -64.7685546875, -62.31640625, -59.8642578125, -57.412109375, -54.9599609375, -52.5078125, -50.0556640625, -47.603515625, -45.1513671875, -42.69921875, -40.2470703125, -37.794921875, -35.3427734375, -32.890625, -30.4384765625, -27.986328125, -25.5341796875, -23.08203125, -20.6298828125, -18.177734375, -15.7255859375, -13.2734375, -10.8212890625, -8.369140625, -5.9169921875, -3.46484375, -1.0126953125, 1.439453125, 3.8916015625, 6.34375, 8.7958984375, 11.248046875, 13.7001953125, 16.15234375, 18.6044921875, 21.056640625, 23.5087890625, 25.9609375, 28.4130859375, 30.865234375, 33.3173828125, 35.76953125, 38.2216796875, 40.673828125, 43.1259765625, 45.578125, 48.0302734375, 50.482421875, 52.9345703125, 55.38671875, 57.8388671875, 60.291015625, 62.7431640625, 65.1953125, 67.6474609375, 70.099609375, 72.5517578125, 75.00390625, 77.4560546875, 79.908203125, 82.3603515625, 84.8125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 167.0, 541.0, 272.0, 31.0, 1.0, 0.0, 1.0], "bins": [-321.1007385253906, -315.61968994140625, -310.1386413574219, -304.6575927734375, -299.1765441894531, -293.69549560546875, -288.21441650390625, -282.7333679199219, -277.2523193359375, -271.7712707519531, -266.29022216796875, -260.8091735839844, -255.32810974121094, -249.84706115722656, -244.3660125732422, -238.8849639892578, -233.40391540527344, -227.92286682128906, -222.4418182373047, -216.96075439453125, -211.47970581054688, -205.9986572265625, -200.51760864257812, -195.03656005859375, -189.55551147460938, -184.074462890625, -178.59341430664062, -173.11236572265625, -167.6313018798828, -162.15025329589844, -156.66920471191406, -151.1881561279297, -145.7071075439453, -140.22605895996094, -134.74501037597656, -129.26394653320312, -123.78289794921875, -118.30184936523438, -112.82080078125, -107.33975219726562, -101.85868835449219, -96.37763977050781, -90.8965835571289, -85.41553497314453, -79.93447875976562, -74.45343017578125, -68.97238159179688, -63.491329193115234, -58.010276794433594, -52.52922439575195, -47.04817199707031, -41.56712341308594, -36.0860710144043, -30.605018615722656, -25.12397003173828, -19.64291763305664, -14.161867141723633, -8.680815696716309, -3.1997642517089844, 2.2812862396240234, 7.762338638305664, 13.243391036987305, 18.72443962097168, 24.20549201965332, 29.68654441833496]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 4.0, 8.0, 10.0, 13.0, 10.0, 17.0, 20.0, 20.0, 17.0, 22.0, 29.0, 26.0, 32.0, 34.0, 46.0, 40.0, 36.0, 49.0, 50.0, 42.0, 46.0, 38.0, 40.0, 46.0, 31.0, 33.0, 37.0, 32.0, 29.0, 31.0, 16.0, 21.0, 12.0, 13.0, 7.0, 15.0, 7.0, 6.0, 7.0, 1.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.52777099609375, -76.05451965332031, -73.5812759399414, -71.10802459716797, -68.63477325439453, -66.16152954101562, -63.68827819824219, -61.21502685546875, -58.74177932739258, -56.268531799316406, -53.79528045654297, -51.3220329284668, -48.848785400390625, -46.37553405761719, -43.902286529541016, -41.429039001464844, -38.955787658691406, -36.482540130615234, -34.0092887878418, -31.536041259765625, -29.06279182434082, -26.589542388916016, -24.116294860839844, -21.64304542541504, -19.169795989990234, -16.69654655456543, -14.223298072814941, -11.750049591064453, -9.276800155639648, -6.803550720214844, -4.3303022384643555, -1.8570537567138672, 0.6162033081054688, 3.0894522666931152, 5.562701225280762, 8.03594970703125, 10.509199142456055, 12.98244857788086, 15.455697059631348, 17.928945541381836, 20.40219497680664, 22.875444412231445, 25.34869384765625, 27.821941375732422, 30.295190811157227, 32.76844024658203, 35.2416877746582, 37.714935302734375, 40.18818664550781, 42.661434173583984, 45.13468551635742, 47.607933044433594, 50.08118438720703, 52.5544319152832, 55.027679443359375, 57.50093078613281, 59.974178314208984, 62.447425842285156, 64.9206771850586, 67.39392852783203, 69.86717224121094, 72.34042358398438, 74.81367492675781, 77.28691864013672, 79.76016998291016]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 6.0, 1.0, 10.0, 5.0, 8.0, 8.0, 9.0, 9.0, 22.0, 29.0, 25.0, 27.0, 37.0, 28.0, 30.0, 41.0, 33.0, 35.0, 38.0, 53.0, 47.0, 50.0, 55.0, 49.0, 29.0, 51.0, 26.0, 34.0, 39.0, 26.0, 20.0, 16.0, 22.0, 21.0, 11.0, 12.0, 9.0, 4.0, 10.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.7734375, -11.4420166015625, -11.110595703125, -10.7791748046875, -10.44775390625, -10.1163330078125, -9.784912109375, -9.4534912109375, -9.1220703125, -8.7906494140625, -8.459228515625, -8.1278076171875, -7.79638671875, -7.4649658203125, -7.133544921875, -6.8021240234375, -6.470703125, -6.1392822265625, -5.807861328125, -5.4764404296875, -5.14501953125, -4.8135986328125, -4.482177734375, -4.1507568359375, -3.8193359375, -3.4879150390625, -3.156494140625, -2.8250732421875, -2.49365234375, -2.1622314453125, -1.830810546875, -1.4993896484375, -1.16796875, -0.8365478515625, -0.505126953125, -0.1737060546875, 0.15771484375, 0.4891357421875, 0.820556640625, 1.1519775390625, 1.4833984375, 1.8148193359375, 2.146240234375, 2.4776611328125, 2.80908203125, 3.1405029296875, 3.471923828125, 3.8033447265625, 4.134765625, 4.4661865234375, 4.797607421875, 5.1290283203125, 5.46044921875, 5.7918701171875, 6.123291015625, 6.4547119140625, 6.7861328125, 7.1175537109375, 7.448974609375, 7.7803955078125, 8.11181640625, 8.4432373046875, 8.774658203125, 9.1060791015625, 9.4375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 4.0, 11.0, 9.0, 11.0, 17.0, 23.0, 19.0, 32.0, 43.0, 48.0, 53.0, 77.0, 107.0, 184.0, 491.0, 2618.0, 112151.0, 3353088.0, 715365.0, 8364.0, 775.0, 246.0, 126.0, 86.0, 75.0, 47.0, 38.0, 22.0, 32.0, 14.0, 17.0, 20.0, 17.0, 12.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.90625, -38.788330078125, -37.67041015625, -36.552490234375, -35.4345703125, -34.316650390625, -33.19873046875, -32.080810546875, -30.962890625, -29.844970703125, -28.72705078125, -27.609130859375, -26.4912109375, -25.373291015625, -24.25537109375, -23.137451171875, -22.01953125, -20.901611328125, -19.78369140625, -18.665771484375, -17.5478515625, -16.429931640625, -15.31201171875, -14.194091796875, -13.076171875, -11.958251953125, -10.84033203125, -9.722412109375, -8.6044921875, -7.486572265625, -6.36865234375, -5.250732421875, -4.1328125, -3.014892578125, -1.89697265625, -0.779052734375, 0.3388671875, 1.456787109375, 2.57470703125, 3.692626953125, 4.810546875, 5.928466796875, 7.04638671875, 8.164306640625, 9.2822265625, 10.400146484375, 11.51806640625, 12.635986328125, 13.75390625, 14.871826171875, 15.98974609375, 17.107666015625, 18.2255859375, 19.343505859375, 20.46142578125, 21.579345703125, 22.697265625, 23.815185546875, 24.93310546875, 26.051025390625, 27.1689453125, 28.286865234375, 29.40478515625, 30.522705078125, 31.640625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 10.0, 14.0, 19.0, 34.0, 33.0, 39.0, 56.0, 60.0, 103.0, 150.0, 185.0, 251.0, 336.0, 398.0, 445.0, 426.0, 374.0, 306.0, 226.0, 168.0, 96.0, 83.0, 67.0, 42.0, 33.0, 30.0, 21.0, 19.0, 14.0, 5.0, 5.0, 4.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.328125, -13.81298828125, -13.2978515625, -12.78271484375, -12.267578125, -11.75244140625, -11.2373046875, -10.72216796875, -10.20703125, -9.69189453125, -9.1767578125, -8.66162109375, -8.146484375, -7.63134765625, -7.1162109375, -6.60107421875, -6.0859375, -5.57080078125, -5.0556640625, -4.54052734375, -4.025390625, -3.51025390625, -2.9951171875, -2.47998046875, -1.96484375, -1.44970703125, -0.9345703125, -0.41943359375, 0.095703125, 0.61083984375, 1.1259765625, 1.64111328125, 2.15625, 2.67138671875, 3.1865234375, 3.70166015625, 4.216796875, 4.73193359375, 5.2470703125, 5.76220703125, 6.27734375, 6.79248046875, 7.3076171875, 7.82275390625, 8.337890625, 8.85302734375, 9.3681640625, 9.88330078125, 10.3984375, 10.91357421875, 11.4287109375, 11.94384765625, 12.458984375, 12.97412109375, 13.4892578125, 14.00439453125, 14.51953125, 15.03466796875, 15.5498046875, 16.06494140625, 16.580078125, 17.09521484375, 17.6103515625, 18.12548828125, 18.640625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 10.0, 11.0, 18.0, 29.0, 30.0, 45.0, 59.0, 81.0, 100.0, 130.0, 168.0, 245.0, 380.0, 791.0, 3288.0, 92024.0, 3821248.0, 267360.0, 5696.0, 1016.0, 452.0, 306.0, 200.0, 144.0, 115.0, 73.0, 75.0, 49.0, 43.0, 27.0, 21.0, 11.0, 14.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-65.625, -63.83251953125, -62.0400390625, -60.24755859375, -58.455078125, -56.66259765625, -54.8701171875, -53.07763671875, -51.28515625, -49.49267578125, -47.7001953125, -45.90771484375, -44.115234375, -42.32275390625, -40.5302734375, -38.73779296875, -36.9453125, -35.15283203125, -33.3603515625, -31.56787109375, -29.775390625, -27.98291015625, -26.1904296875, -24.39794921875, -22.60546875, -20.81298828125, -19.0205078125, -17.22802734375, -15.435546875, -13.64306640625, -11.8505859375, -10.05810546875, -8.265625, -6.47314453125, -4.6806640625, -2.88818359375, -1.095703125, 0.69677734375, 2.4892578125, 4.28173828125, 6.07421875, 7.86669921875, 9.6591796875, 11.45166015625, 13.244140625, 15.03662109375, 16.8291015625, 18.62158203125, 20.4140625, 22.20654296875, 23.9990234375, 25.79150390625, 27.583984375, 29.37646484375, 31.1689453125, 32.96142578125, 34.75390625, 36.54638671875, 38.3388671875, 40.13134765625, 41.923828125, 43.71630859375, 45.5087890625, 47.30126953125, 49.09375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 15.0, 398.0, 559.0, 43.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.58255004882812, -184.50808715820312, -170.43362426757812, -156.35914611816406, -142.28468322753906, -128.21022033691406, -114.13574981689453, -100.061279296875, -85.98681640625, -71.912353515625, -57.83788299560547, -43.7634162902832, -29.688949584960938, -15.614486694335938, -1.5400161743164062, 12.534454345703125, 26.608917236328125, 40.68338394165039, 54.757850646972656, 68.83232116699219, 82.90678405761719, 96.98124694824219, 111.05571746826172, 125.13018798828125, 139.20465087890625, 153.27911376953125, 167.35357666015625, 181.4280548095703, 195.5025177001953, 209.5769805908203, 223.65145874023438, 237.72592163085938, 251.8004150390625, 265.8748779296875, 279.9493408203125, 294.0238037109375, 308.0982666015625, 322.1727294921875, 336.2472229003906, 350.3216857910156, 364.3961486816406, 378.4706115722656, 392.5450744628906, 406.6195373535156, 420.69403076171875, 434.76849365234375, 448.84295654296875, 462.91741943359375, 476.99188232421875, 491.06634521484375, 505.14080810546875, 519.2152709960938, 533.2897338867188, 547.3641967773438, 561.4386596679688, 575.51318359375, 589.587646484375, 603.662109375, 617.736572265625, 631.81103515625, 645.885498046875, 659.9599609375, 674.034423828125, 688.10888671875, 702.183349609375]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 13.0, 8.0, 8.0, 12.0, 17.0, 4.0, 31.0, 20.0, 29.0, 32.0, 26.0, 34.0, 23.0, 49.0, 40.0, 40.0, 38.0, 37.0, 42.0, 31.0, 38.0, 40.0, 42.0, 36.0, 38.0, 29.0, 28.0, 23.0, 29.0, 14.0, 20.0, 19.0, 22.0, 14.0, 10.0, 12.0, 8.0, 7.0, 4.0, 3.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-61.49842834472656, -59.76128005981445, -58.024131774902344, -56.28697967529297, -54.54983139038086, -52.81268310546875, -51.075531005859375, -49.338382720947266, -47.601234436035156, -45.86408615112305, -44.12693786621094, -42.38978576660156, -40.65263748168945, -38.915489196777344, -37.17833709716797, -35.44118881225586, -33.70404052734375, -31.96689224243164, -30.2297420501709, -28.492591857910156, -26.755443572998047, -25.018295288085938, -23.281145095825195, -21.543994903564453, -19.806846618652344, -18.069698333740234, -16.332548141479492, -14.595398902893066, -12.85824966430664, -11.121100425720215, -9.383951187133789, -7.646801948547363, -5.9096527099609375, -4.172503471374512, -2.435354232788086, -0.6982049942016602, 1.0389442443847656, 2.7760934829711914, 4.513242721557617, 6.250391960144043, 7.987541198730469, 9.724690437316895, 11.46183967590332, 13.198988914489746, 14.936138153076172, 16.67328643798828, 18.410436630249023, 20.147586822509766, 21.884735107421875, 23.621883392333984, 25.359033584594727, 27.09618377685547, 28.833332061767578, 30.570480346679688, 32.30763244628906, 34.04478073120117, 35.78192901611328, 37.51907730102539, 39.2562255859375, 40.993377685546875, 42.730525970458984, 44.467674255371094, 46.20482635498047, 47.94197463989258, 49.67912292480469]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 8.0, 4.0, 13.0, 9.0, 7.0, 10.0, 13.0, 14.0, 8.0, 23.0, 22.0, 22.0, 21.0, 34.0, 27.0, 27.0, 47.0, 38.0, 43.0, 47.0, 44.0, 48.0, 38.0, 47.0, 37.0, 30.0, 35.0, 41.0, 19.0, 16.0, 19.0, 17.0, 27.0, 21.0, 20.0, 21.0, 13.0, 17.0, 11.0, 10.0, 7.0, 2.0, 5.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.7421875, -9.4517822265625, -9.161376953125, -8.8709716796875, -8.58056640625, -8.2901611328125, -7.999755859375, -7.7093505859375, -7.4189453125, -7.1285400390625, -6.838134765625, -6.5477294921875, -6.25732421875, -5.9669189453125, -5.676513671875, -5.3861083984375, -5.095703125, -4.8052978515625, -4.514892578125, -4.2244873046875, -3.93408203125, -3.6436767578125, -3.353271484375, -3.0628662109375, -2.7724609375, -2.4820556640625, -2.191650390625, -1.9012451171875, -1.61083984375, -1.3204345703125, -1.030029296875, -0.7396240234375, -0.44921875, -0.1588134765625, 0.131591796875, 0.4219970703125, 0.71240234375, 1.0028076171875, 1.293212890625, 1.5836181640625, 1.8740234375, 2.1644287109375, 2.454833984375, 2.7452392578125, 3.03564453125, 3.3260498046875, 3.616455078125, 3.9068603515625, 4.197265625, 4.4876708984375, 4.778076171875, 5.0684814453125, 5.35888671875, 5.6492919921875, 5.939697265625, 6.2301025390625, 6.5205078125, 6.8109130859375, 7.101318359375, 7.3917236328125, 7.68212890625, 7.9725341796875, 8.262939453125, 8.5533447265625, 8.84375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 12.0, 20.0, 24.0, 41.0, 53.0, 81.0, 122.0, 159.0, 261.0, 385.0, 546.0, 801.0, 1178.0, 1772.0, 2585.0, 3792.0, 5564.0, 8008.0, 11931.0, 18008.0, 28078.0, 44066.0, 75438.0, 148394.0, 341698.0, 150534.0, 76026.0, 45186.0, 27730.0, 18419.0, 12296.0, 8197.0, 5484.0, 3672.0, 2539.0, 1719.0, 1179.0, 844.0, 525.0, 367.0, 265.0, 175.0, 118.0, 93.0, 52.0, 42.0, 24.0, 19.0, 14.0, 5.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.478515625, -2.39727783203125, -2.3160400390625, -2.23480224609375, -2.153564453125, -2.07232666015625, -1.9910888671875, -1.90985107421875, -1.82861328125, -1.74737548828125, -1.6661376953125, -1.58489990234375, -1.503662109375, -1.42242431640625, -1.3411865234375, -1.25994873046875, -1.1787109375, -1.09747314453125, -1.0162353515625, -0.93499755859375, -0.853759765625, -0.77252197265625, -0.6912841796875, -0.61004638671875, -0.52880859375, -0.44757080078125, -0.3663330078125, -0.28509521484375, -0.203857421875, -0.12261962890625, -0.0413818359375, 0.03985595703125, 0.12109375, 0.20233154296875, 0.2835693359375, 0.36480712890625, 0.446044921875, 0.52728271484375, 0.6085205078125, 0.68975830078125, 0.77099609375, 0.85223388671875, 0.9334716796875, 1.01470947265625, 1.095947265625, 1.17718505859375, 1.2584228515625, 1.33966064453125, 1.4208984375, 1.50213623046875, 1.5833740234375, 1.66461181640625, 1.745849609375, 1.82708740234375, 1.9083251953125, 1.98956298828125, 2.07080078125, 2.15203857421875, 2.2332763671875, 2.31451416015625, 2.395751953125, 2.47698974609375, 2.5582275390625, 2.63946533203125, 2.720703125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 6.0, 9.0, 13.0, 15.0, 19.0, 20.0, 19.0, 17.0, 21.0, 23.0, 34.0, 32.0, 33.0, 44.0, 40.0, 42.0, 37.0, 1065.0, 42.0, 35.0, 38.0, 36.0, 39.0, 35.0, 33.0, 29.0, 36.0, 19.0, 29.0, 15.0, 19.0, 21.0, 12.0, 25.0, 9.0, 12.0, 4.0, 6.0, 5.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.35546875, -6.1617431640625, -5.968017578125, -5.7742919921875, -5.58056640625, -5.3868408203125, -5.193115234375, -4.9993896484375, -4.8056640625, -4.6119384765625, -4.418212890625, -4.2244873046875, -4.03076171875, -3.8370361328125, -3.643310546875, -3.4495849609375, -3.255859375, -3.0621337890625, -2.868408203125, -2.6746826171875, -2.48095703125, -2.2872314453125, -2.093505859375, -1.8997802734375, -1.7060546875, -1.5123291015625, -1.318603515625, -1.1248779296875, -0.93115234375, -0.7374267578125, -0.543701171875, -0.3499755859375, -0.15625, 0.0374755859375, 0.231201171875, 0.4249267578125, 0.61865234375, 0.8123779296875, 1.006103515625, 1.1998291015625, 1.3935546875, 1.5872802734375, 1.781005859375, 1.9747314453125, 2.16845703125, 2.3621826171875, 2.555908203125, 2.7496337890625, 2.943359375, 3.1370849609375, 3.330810546875, 3.5245361328125, 3.71826171875, 3.9119873046875, 4.105712890625, 4.2994384765625, 4.4931640625, 4.6868896484375, 4.880615234375, 5.0743408203125, 5.26806640625, 5.4617919921875, 5.655517578125, 5.8492431640625, 6.04296875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 23.0, 20.0, 35.0, 51.0, 80.0, 134.0, 159.0, 254.0, 396.0, 484.0, 717.0, 1024.0, 1357.0, 2008.0, 3065.0, 4274.0, 6316.0, 9050.0, 12939.0, 19476.0, 29911.0, 45072.0, 71422.0, 120017.0, 1340146.0, 168201.0, 91295.0, 56948.0, 36805.0, 24396.0, 15891.0, 10674.0, 7471.0, 5394.0, 3577.0, 2390.0, 1715.0, 1129.0, 834.0, 588.0, 419.0, 317.0, 210.0, 128.0, 105.0, 73.0, 56.0, 23.0, 19.0, 14.0, 8.0, 10.0, 1.0, 2.0, 3.0, 1.0], "bins": [-2.384765625, -2.31195068359375, -2.2391357421875, -2.16632080078125, -2.093505859375, -2.02069091796875, -1.9478759765625, -1.87506103515625, -1.80224609375, -1.72943115234375, -1.6566162109375, -1.58380126953125, -1.510986328125, -1.43817138671875, -1.3653564453125, -1.29254150390625, -1.2197265625, -1.14691162109375, -1.0740966796875, -1.00128173828125, -0.928466796875, -0.85565185546875, -0.7828369140625, -0.71002197265625, -0.63720703125, -0.56439208984375, -0.4915771484375, -0.41876220703125, -0.345947265625, -0.27313232421875, -0.2003173828125, -0.12750244140625, -0.0546875, 0.01812744140625, 0.0909423828125, 0.16375732421875, 0.236572265625, 0.30938720703125, 0.3822021484375, 0.45501708984375, 0.52783203125, 0.60064697265625, 0.6734619140625, 0.74627685546875, 0.819091796875, 0.89190673828125, 0.9647216796875, 1.03753662109375, 1.1103515625, 1.18316650390625, 1.2559814453125, 1.32879638671875, 1.401611328125, 1.47442626953125, 1.5472412109375, 1.62005615234375, 1.69287109375, 1.76568603515625, 1.8385009765625, 1.91131591796875, 1.984130859375, 2.05694580078125, 2.1297607421875, 2.20257568359375, 2.275390625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 10.0, 6.0, 24.0, 16.0, 41.0, 49.0, 66.0, 104.0, 112.0, 109.0, 110.0, 100.0, 64.0, 59.0, 34.0, 38.0, 16.0, 12.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0010042190551757812, -0.000978916883468628, -0.0009536147117614746, -0.0009283125400543213, -0.000903010368347168, -0.0008777081966400146, -0.0008524060249328613, -0.000827103853225708, -0.0008018016815185547, -0.0007764995098114014, -0.000751197338104248, -0.0007258951663970947, -0.0007005929946899414, -0.0006752908229827881, -0.0006499886512756348, -0.0006246864795684814, -0.0005993843078613281, -0.0005740821361541748, -0.0005487799644470215, -0.0005234777927398682, -0.0004981756210327148, -0.0004728734493255615, -0.0004475712776184082, -0.0004222691059112549, -0.00039696693420410156, -0.00037166476249694824, -0.0003463625907897949, -0.0003210604190826416, -0.0002957582473754883, -0.00027045607566833496, -0.00024515390396118164, -0.00021985173225402832, -0.000194549560546875, -0.00016924738883972168, -0.00014394521713256836, -0.00011864304542541504, -9.334087371826172e-05, -6.80387020111084e-05, -4.273653030395508e-05, -1.7434358596801758e-05, 7.867813110351562e-06, 3.316998481750488e-05, 5.84721565246582e-05, 8.377432823181152e-05, 0.00010907649993896484, 0.00013437867164611816, 0.00015968084335327148, 0.0001849830150604248, 0.00021028518676757812, 0.00023558735847473145, 0.00026088953018188477, 0.0002861917018890381, 0.0003114938735961914, 0.0003367960453033447, 0.00036209821701049805, 0.00038740038871765137, 0.0004127025604248047, 0.000438004732131958, 0.00046330690383911133, 0.0004886090755462646, 0.000513911247253418, 0.0005392134189605713, 0.0005645155906677246, 0.0005898177623748779, 0.0006151199340820312]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 9.0, 15.0, 19.0, 32.0, 40.0, 56.0, 85.0, 130.0, 242.0, 584.0, 9026.0, 1036101.0, 1316.0, 369.0, 179.0, 109.0, 74.0, 48.0, 35.0, 21.0, 15.0, 9.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01166534423828125, -0.01118457317352295, -0.010703802108764648, -0.010223031044006348, -0.009742259979248047, -0.009261488914489746, -0.008780717849731445, -0.008299946784973145, -0.007819175720214844, -0.007338404655456543, -0.006857633590698242, -0.006376862525939941, -0.005896091461181641, -0.00541532039642334, -0.004934549331665039, -0.004453778266906738, -0.0039730072021484375, -0.0034922361373901367, -0.003011465072631836, -0.002530694007873535, -0.0020499229431152344, -0.0015691518783569336, -0.0010883808135986328, -0.000607609748840332, -0.00012683868408203125, 0.00035393238067626953, 0.0008347034454345703, 0.001315474510192871, 0.0017962455749511719, 0.0022770166397094727, 0.0027577877044677734, 0.0032385587692260742, 0.003719329833984375, 0.004200100898742676, 0.0046808719635009766, 0.005161643028259277, 0.005642414093017578, 0.006123185157775879, 0.00660395622253418, 0.0070847272872924805, 0.007565498352050781, 0.008046269416809082, 0.008527040481567383, 0.009007811546325684, 0.009488582611083984, 0.009969353675842285, 0.010450124740600586, 0.010930895805358887, 0.011411666870117188, 0.011892437934875488, 0.012373208999633789, 0.01285398006439209, 0.01333475112915039, 0.013815522193908691, 0.014296293258666992, 0.014777064323425293, 0.015257835388183594, 0.015738606452941895, 0.016219377517700195, 0.016700148582458496, 0.017180919647216797, 0.017661690711975098, 0.0181424617767334, 0.0186232328414917, 0.01910400390625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 33.0, 163.0, 449.0, 296.0, 67.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044992691255174577, -0.00042295450111851096, -0.0003959821187891066, -0.0003690097073558718, -0.000342037295922637, -0.0003150648844894022, -0.00028809247305616736, -0.000261120090726763, -0.0002341476792935282, -0.0002071752678602934, -0.0001802028709789738, -0.00015323047409765422, -0.0001262580626644194, -9.92856512311846e-05, -7.231325434986502e-05, -4.534085746854544e-05, -1.8368446035310626e-05, 8.60395812196657e-06, 3.557636227924377e-05, 6.254876643652096e-05, 8.952117059379816e-05, 0.00011649358202703297, 0.00014346597890835255, 0.00017043837578967214, 0.00019741078722290695, 0.00022438319865614176, 0.0002513555809855461, 0.0002783279924187809, 0.00030530040385201573, 0.00033227281528525054, 0.00035924522671848536, 0.0003862176090478897, 0.00041318999137729406, 0.0004401624028105289, 0.0004671348142437637, 0.000494107196573168, 0.0005210796371102333, 0.0005480520194396377, 0.000575024401769042, 0.0006019967840984464, 0.0006289692246355116, 0.000655941606964916, 0.0006829140475019813, 0.0007098864298313856, 0.00073685881216079, 0.0007638312526978552, 0.0007908036350272596, 0.0008177760755643249, 0.0008447484578937292, 0.0008717208402231336, 0.0008986932807601988, 0.0009256656630896032, 0.0009526381036266685, 0.0009796104859560728, 0.0010065828682854772, 0.0010335552506148815, 0.0010605277493596077, 0.001087500131689012, 0.0011144725140184164, 0.0011414450127631426, 0.001168417395092547, 0.0011953897774219513, 0.0012223621597513556, 0.00124933454208076, 0.0012763069244101644]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 11.0, 5.0, 6.0, 11.0, 23.0, 16.0, 14.0, 12.0, 28.0, 19.0, 21.0, 33.0, 32.0, 34.0, 39.0, 36.0, 33.0, 40.0, 47.0, 53.0, 35.0, 29.0, 28.0, 38.0, 33.0, 39.0, 36.0, 39.0, 32.0, 20.0, 18.0, 22.0, 17.0, 20.0, 11.0, 9.0, 7.0, 8.0, 9.0, 9.0, 7.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00025707483291625977, -0.00024903565645217896, -0.00024099647998809814, -0.00023295730352401733, -0.00022491812705993652, -0.0002168789505958557, -0.0002088397741317749, -0.0002008005976676941, -0.00019276142120361328, -0.00018472224473953247, -0.00017668306827545166, -0.00016864389181137085, -0.00016060471534729004, -0.00015256553888320923, -0.00014452636241912842, -0.0001364871859550476, -0.0001284480094909668, -0.00012040883302688599, -0.00011236965656280518, -0.00010433048009872437, -9.629130363464355e-05, -8.825212717056274e-05, -8.021295070648193e-05, -7.217377424240112e-05, -6.413459777832031e-05, -5.60954213142395e-05, -4.805624485015869e-05, -4.001706838607788e-05, -3.197789192199707e-05, -2.393871545791626e-05, -1.589953899383545e-05, -7.860362529754639e-06, 1.7881393432617188e-07, 8.217990398406982e-06, 1.6257166862487793e-05, 2.4296343326568604e-05, 3.2335519790649414e-05, 4.0374696254730225e-05, 4.8413872718811035e-05, 5.6453049182891846e-05, 6.449222564697266e-05, 7.253140211105347e-05, 8.057057857513428e-05, 8.860975503921509e-05, 9.66489315032959e-05, 0.00010468810796737671, 0.00011272728443145752, 0.00012076646089553833, 0.00012880563735961914, 0.00013684481382369995, 0.00014488399028778076, 0.00015292316675186157, 0.00016096234321594238, 0.0001690015196800232, 0.000177040696144104, 0.00018507987260818481, 0.00019311904907226562, 0.00020115822553634644, 0.00020919740200042725, 0.00021723657846450806, 0.00022527575492858887, 0.00023331493139266968, 0.0002413541078567505, 0.0002493932843208313, 0.0002574324607849121]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 8.0, 4.0, 13.0, 9.0, 7.0, 10.0, 13.0, 14.0, 8.0, 23.0, 22.0, 22.0, 21.0, 34.0, 27.0, 27.0, 47.0, 38.0, 43.0, 47.0, 44.0, 48.0, 38.0, 47.0, 37.0, 30.0, 35.0, 41.0, 19.0, 16.0, 19.0, 17.0, 27.0, 21.0, 20.0, 21.0, 13.0, 17.0, 11.0, 10.0, 7.0, 2.0, 5.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.7421875, -9.4517822265625, -9.161376953125, -8.8709716796875, -8.58056640625, -8.2901611328125, -7.999755859375, -7.7093505859375, -7.4189453125, -7.1285400390625, -6.838134765625, -6.5477294921875, -6.25732421875, -5.9669189453125, -5.676513671875, -5.3861083984375, -5.095703125, -4.8052978515625, -4.514892578125, -4.2244873046875, -3.93408203125, -3.6436767578125, -3.353271484375, -3.0628662109375, -2.7724609375, -2.4820556640625, -2.191650390625, -1.9012451171875, -1.61083984375, -1.3204345703125, -1.030029296875, -0.7396240234375, -0.44921875, -0.1588134765625, 0.131591796875, 0.4219970703125, 0.71240234375, 1.0028076171875, 1.293212890625, 1.5836181640625, 1.8740234375, 2.1644287109375, 2.454833984375, 2.7452392578125, 3.03564453125, 3.3260498046875, 3.616455078125, 3.9068603515625, 4.197265625, 4.4876708984375, 4.778076171875, 5.0684814453125, 5.35888671875, 5.6492919921875, 5.939697265625, 6.2301025390625, 6.5205078125, 6.8109130859375, 7.101318359375, 7.3917236328125, 7.68212890625, 7.9725341796875, 8.262939453125, 8.5533447265625, 8.84375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 6.0, 6.0, 13.0, 14.0, 15.0, 12.0, 23.0, 32.0, 42.0, 39.0, 68.0, 90.0, 99.0, 135.0, 204.0, 303.0, 485.0, 1050.0, 2598.0, 7571.0, 23710.0, 89822.0, 376541.0, 406898.0, 99376.0, 25910.0, 7937.0, 2688.0, 1116.0, 540.0, 335.0, 230.0, 138.0, 96.0, 91.0, 65.0, 55.0, 40.0, 21.0, 29.0, 23.0, 13.0, 18.0, 7.0, 10.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0], "bins": [-15.21875, -14.758056640625, -14.29736328125, -13.836669921875, -13.3759765625, -12.915283203125, -12.45458984375, -11.993896484375, -11.533203125, -11.072509765625, -10.61181640625, -10.151123046875, -9.6904296875, -9.229736328125, -8.76904296875, -8.308349609375, -7.84765625, -7.386962890625, -6.92626953125, -6.465576171875, -6.0048828125, -5.544189453125, -5.08349609375, -4.622802734375, -4.162109375, -3.701416015625, -3.24072265625, -2.780029296875, -2.3193359375, -1.858642578125, -1.39794921875, -0.937255859375, -0.4765625, -0.015869140625, 0.44482421875, 0.905517578125, 1.3662109375, 1.826904296875, 2.28759765625, 2.748291015625, 3.208984375, 3.669677734375, 4.13037109375, 4.591064453125, 5.0517578125, 5.512451171875, 5.97314453125, 6.433837890625, 6.89453125, 7.355224609375, 7.81591796875, 8.276611328125, 8.7373046875, 9.197998046875, 9.65869140625, 10.119384765625, 10.580078125, 11.040771484375, 11.50146484375, 11.962158203125, 12.4228515625, 12.883544921875, 13.34423828125, 13.804931640625, 14.265625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 4.0, 8.0, 10.0, 13.0, 13.0, 15.0, 17.0, 33.0, 21.0, 17.0, 25.0, 28.0, 33.0, 41.0, 36.0, 44.0, 66.0, 77.0, 175.0, 1348.0, 331.0, 137.0, 85.0, 49.0, 46.0, 42.0, 31.0, 34.0, 34.0, 29.0, 26.0, 23.0, 26.0, 19.0, 14.0, 13.0, 14.0, 7.0, 6.0, 9.0, 4.0, 7.0, 7.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-28.40625, -27.51806640625, -26.6298828125, -25.74169921875, -24.853515625, -23.96533203125, -23.0771484375, -22.18896484375, -21.30078125, -20.41259765625, -19.5244140625, -18.63623046875, -17.748046875, -16.85986328125, -15.9716796875, -15.08349609375, -14.1953125, -13.30712890625, -12.4189453125, -11.53076171875, -10.642578125, -9.75439453125, -8.8662109375, -7.97802734375, -7.08984375, -6.20166015625, -5.3134765625, -4.42529296875, -3.537109375, -2.64892578125, -1.7607421875, -0.87255859375, 0.015625, 0.90380859375, 1.7919921875, 2.68017578125, 3.568359375, 4.45654296875, 5.3447265625, 6.23291015625, 7.12109375, 8.00927734375, 8.8974609375, 9.78564453125, 10.673828125, 11.56201171875, 12.4501953125, 13.33837890625, 14.2265625, 15.11474609375, 16.0029296875, 16.89111328125, 17.779296875, 18.66748046875, 19.5556640625, 20.44384765625, 21.33203125, 22.22021484375, 23.1083984375, 23.99658203125, 24.884765625, 25.77294921875, 26.6611328125, 27.54931640625, 28.4375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 7.0, 6.0, 14.0, 14.0, 14.0, 26.0, 36.0, 46.0, 55.0, 79.0, 109.0, 151.0, 260.0, 462.0, 1296.0, 14504.0, 3081339.0, 44107.0, 1700.0, 586.0, 270.0, 187.0, 101.0, 83.0, 60.0, 46.0, 39.0, 19.0, 18.0, 12.0, 15.0, 9.0, 8.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.3125, -74.29296875, -71.2734375, -68.25390625, -65.234375, -62.21484375, -59.1953125, -56.17578125, -53.15625, -50.13671875, -47.1171875, -44.09765625, -41.078125, -38.05859375, -35.0390625, -32.01953125, -29.0, -25.98046875, -22.9609375, -19.94140625, -16.921875, -13.90234375, -10.8828125, -7.86328125, -4.84375, -1.82421875, 1.1953125, 4.21484375, 7.234375, 10.25390625, 13.2734375, 16.29296875, 19.3125, 22.33203125, 25.3515625, 28.37109375, 31.390625, 34.41015625, 37.4296875, 40.44921875, 43.46875, 46.48828125, 49.5078125, 52.52734375, 55.546875, 58.56640625, 61.5859375, 64.60546875, 67.625, 70.64453125, 73.6640625, 76.68359375, 79.703125, 82.72265625, 85.7421875, 88.76171875, 91.78125, 94.80078125, 97.8203125, 100.83984375, 103.859375, 106.87890625, 109.8984375, 112.91796875, 115.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 217.0, 754.0, 43.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-515.4291381835938, -504.5255432128906, -493.6219787597656, -482.7183837890625, -471.8148193359375, -460.9112243652344, -450.00762939453125, -439.10406494140625, -428.20050048828125, -417.2969055175781, -406.3933410644531, -395.48974609375, -384.586181640625, -373.6825866699219, -362.77899169921875, -351.87542724609375, -340.9718322753906, -330.0682373046875, -319.1646728515625, -308.2610778808594, -297.3575134277344, -286.45391845703125, -275.55035400390625, -264.6467590332031, -253.74317932128906, -242.839599609375, -231.93601989746094, -221.03244018554688, -210.12884521484375, -199.22528076171875, -188.32168579101562, -177.41810607910156, -166.51454162597656, -155.6109619140625, -144.70738220214844, -133.80380249023438, -122.90021514892578, -111.99663543701172, -101.09304809570312, -90.18946838378906, -79.285888671875, -68.38230895996094, -57.47872543334961, -46.57514190673828, -35.67156219482422, -24.767982482910156, -13.864395141601562, -2.9608154296875, 7.9427642822265625, 18.846345901489258, 29.749927520751953, 40.65351104736328, 51.557090759277344, 62.460670471191406, 73.3642578125, 84.26783752441406, 95.17141723632812, 106.07499694824219, 116.97857666015625, 127.88216400146484, 138.78573608398438, 149.6893310546875, 160.59291076660156, 171.49649047851562, 182.4000701904297]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 6.0, 6.0, 10.0, 11.0, 16.0, 18.0, 21.0, 22.0, 18.0, 17.0, 20.0, 33.0, 30.0, 28.0, 34.0, 38.0, 44.0, 29.0, 51.0, 48.0, 36.0, 36.0, 48.0, 35.0, 33.0, 44.0, 32.0, 21.0, 32.0, 21.0, 15.0, 26.0, 25.0, 18.0, 12.0, 8.0, 12.0, 9.0, 5.0, 1.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.20426177978516, -73.78888702392578, -71.3735122680664, -68.95813751220703, -66.54277038574219, -64.12739562988281, -61.71202087402344, -59.29664611816406, -56.88127136230469, -54.46589660644531, -52.05052185058594, -49.63515090942383, -47.21977615356445, -44.80440139770508, -42.38903045654297, -39.973655700683594, -37.55828094482422, -35.142906188964844, -32.72753143310547, -30.31216049194336, -27.896785736083984, -25.48141098022461, -23.066038131713867, -20.650665283203125, -18.23529052734375, -15.819916725158691, -13.404542922973633, -10.989169120788574, -8.573795318603516, -6.158421516418457, -3.7430477142333984, -1.3276748657226562, 1.0876998901367188, 3.5030736923217773, 5.918447494506836, 8.333821296691895, 10.749195098876953, 13.164568901062012, 15.57994270324707, 17.995315551757812, 20.410690307617188, 22.826065063476562, 25.241437911987305, 27.656810760498047, 30.072185516357422, 32.4875602722168, 34.902931213378906, 37.31830596923828, 39.733680725097656, 42.14905548095703, 44.564430236816406, 46.979801177978516, 49.39517593383789, 51.810550689697266, 54.225921630859375, 56.64129638671875, 59.056671142578125, 61.4720458984375, 63.887420654296875, 66.30279541015625, 68.71817016601562, 71.13353729248047, 73.54891204833984, 75.96428680419922, 78.3796615600586]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 6.0, 3.0, 6.0, 5.0, 7.0, 8.0, 11.0, 5.0, 11.0, 13.0, 15.0, 19.0, 15.0, 12.0, 25.0, 35.0, 31.0, 31.0, 37.0, 23.0, 38.0, 36.0, 30.0, 31.0, 39.0, 39.0, 46.0, 42.0, 34.0, 36.0, 36.0, 38.0, 22.0, 29.0, 29.0, 15.0, 19.0, 26.0, 17.0, 11.0, 16.0, 12.0, 14.0, 9.0, 9.0, 3.0, 2.0, 2.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.659912109375, -8.35107421875, -8.042236328125, -7.7333984375, -7.424560546875, -7.11572265625, -6.806884765625, -6.498046875, -6.189208984375, -5.88037109375, -5.571533203125, -5.2626953125, -4.953857421875, -4.64501953125, -4.336181640625, -4.02734375, -3.718505859375, -3.40966796875, -3.100830078125, -2.7919921875, -2.483154296875, -2.17431640625, -1.865478515625, -1.556640625, -1.247802734375, -0.93896484375, -0.630126953125, -0.3212890625, -0.012451171875, 0.29638671875, 0.605224609375, 0.9140625, 1.222900390625, 1.53173828125, 1.840576171875, 2.1494140625, 2.458251953125, 2.76708984375, 3.075927734375, 3.384765625, 3.693603515625, 4.00244140625, 4.311279296875, 4.6201171875, 4.928955078125, 5.23779296875, 5.546630859375, 5.85546875, 6.164306640625, 6.47314453125, 6.781982421875, 7.0908203125, 7.399658203125, 7.70849609375, 8.017333984375, 8.326171875, 8.635009765625, 8.94384765625, 9.252685546875, 9.5615234375, 9.870361328125, 10.17919921875, 10.488037109375, 10.796875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 8.0, 7.0, 10.0, 10.0, 11.0, 15.0, 27.0, 21.0, 25.0, 23.0, 35.0, 63.0, 78.0, 96.0, 137.0, 290.0, 692.0, 2555.0, 21105.0, 399661.0, 2688757.0, 1017703.0, 56080.0, 4806.0, 1005.0, 375.0, 196.0, 109.0, 72.0, 44.0, 39.0, 35.0, 29.0, 21.0, 21.0, 17.0, 12.0, 20.0, 10.0, 10.0, 7.0, 10.0, 5.0, 0.0, 10.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.234375, -22.451416015625, -21.66845703125, -20.885498046875, -20.1025390625, -19.319580078125, -18.53662109375, -17.753662109375, -16.970703125, -16.187744140625, -15.40478515625, -14.621826171875, -13.8388671875, -13.055908203125, -12.27294921875, -11.489990234375, -10.70703125, -9.924072265625, -9.14111328125, -8.358154296875, -7.5751953125, -6.792236328125, -6.00927734375, -5.226318359375, -4.443359375, -3.660400390625, -2.87744140625, -2.094482421875, -1.3115234375, -0.528564453125, 0.25439453125, 1.037353515625, 1.8203125, 2.603271484375, 3.38623046875, 4.169189453125, 4.9521484375, 5.735107421875, 6.51806640625, 7.301025390625, 8.083984375, 8.866943359375, 9.64990234375, 10.432861328125, 11.2158203125, 11.998779296875, 12.78173828125, 13.564697265625, 14.34765625, 15.130615234375, 15.91357421875, 16.696533203125, 17.4794921875, 18.262451171875, 19.04541015625, 19.828369140625, 20.611328125, 21.394287109375, 22.17724609375, 22.960205078125, 23.7431640625, 24.526123046875, 25.30908203125, 26.092041015625, 26.875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 8.0, 10.0, 8.0, 13.0, 18.0, 23.0, 29.0, 44.0, 47.0, 68.0, 110.0, 156.0, 210.0, 274.0, 403.0, 448.0, 477.0, 441.0, 362.0, 274.0, 180.0, 141.0, 114.0, 67.0, 33.0, 38.0, 19.0, 18.0, 12.0, 9.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.578125, -19.008056640625, -18.43798828125, -17.867919921875, -17.2978515625, -16.727783203125, -16.15771484375, -15.587646484375, -15.017578125, -14.447509765625, -13.87744140625, -13.307373046875, -12.7373046875, -12.167236328125, -11.59716796875, -11.027099609375, -10.45703125, -9.886962890625, -9.31689453125, -8.746826171875, -8.1767578125, -7.606689453125, -7.03662109375, -6.466552734375, -5.896484375, -5.326416015625, -4.75634765625, -4.186279296875, -3.6162109375, -3.046142578125, -2.47607421875, -1.906005859375, -1.3359375, -0.765869140625, -0.19580078125, 0.374267578125, 0.9443359375, 1.514404296875, 2.08447265625, 2.654541015625, 3.224609375, 3.794677734375, 4.36474609375, 4.934814453125, 5.5048828125, 6.074951171875, 6.64501953125, 7.215087890625, 7.78515625, 8.355224609375, 8.92529296875, 9.495361328125, 10.0654296875, 10.635498046875, 11.20556640625, 11.775634765625, 12.345703125, 12.915771484375, 13.48583984375, 14.055908203125, 14.6259765625, 15.196044921875, 15.76611328125, 16.336181640625, 16.90625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 13.0, 8.0, 22.0, 35.0, 35.0, 60.0, 71.0, 86.0, 108.0, 161.0, 222.0, 368.0, 651.0, 1588.0, 6711.0, 77282.0, 2559530.0, 1495373.0, 44327.0, 4651.0, 1229.0, 560.0, 335.0, 211.0, 168.0, 103.0, 96.0, 63.0, 48.0, 43.0, 37.0, 26.0, 9.0, 7.0, 12.0, 11.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.6875, -36.3837890625, -35.080078125, -33.7763671875, -32.47265625, -31.1689453125, -29.865234375, -28.5615234375, -27.2578125, -25.9541015625, -24.650390625, -23.3466796875, -22.04296875, -20.7392578125, -19.435546875, -18.1318359375, -16.828125, -15.5244140625, -14.220703125, -12.9169921875, -11.61328125, -10.3095703125, -9.005859375, -7.7021484375, -6.3984375, -5.0947265625, -3.791015625, -2.4873046875, -1.18359375, 0.1201171875, 1.423828125, 2.7275390625, 4.03125, 5.3349609375, 6.638671875, 7.9423828125, 9.24609375, 10.5498046875, 11.853515625, 13.1572265625, 14.4609375, 15.7646484375, 17.068359375, 18.3720703125, 19.67578125, 20.9794921875, 22.283203125, 23.5869140625, 24.890625, 26.1943359375, 27.498046875, 28.8017578125, 30.10546875, 31.4091796875, 32.712890625, 34.0166015625, 35.3203125, 36.6240234375, 37.927734375, 39.2314453125, 40.53515625, 41.8388671875, 43.142578125, 44.4462890625, 45.75]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 11.0, 161.0, 591.0, 237.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.8463134765625, -177.69480895996094, -165.54330444335938, -153.39181518554688, -141.24029541015625, -129.08880615234375, -116.93730163574219, -104.78579711914062, -92.63429260253906, -80.4827880859375, -68.33128356933594, -56.179786682128906, -44.028282165527344, -31.87677764892578, -19.72528076171875, -7.5737762451171875, 4.577728271484375, 16.729230880737305, 28.880733489990234, 41.03223419189453, 53.183738708496094, 65.33524322509766, 77.48674011230469, 89.63824462890625, 101.78974914550781, 113.94125366210938, 126.09275817871094, 138.2442626953125, 150.395751953125, 162.54727172851562, 174.69876098632812, 186.8502655029297, 199.00177001953125, 211.1532745361328, 223.30477905273438, 235.45626831054688, 247.6077880859375, 259.75927734375, 271.9107666015625, 284.0622863769531, 296.21380615234375, 308.36529541015625, 320.5168151855469, 332.6683044433594, 344.81982421875, 356.9713134765625, 369.122802734375, 381.2743225097656, 393.4258117675781, 405.5773010253906, 417.72882080078125, 429.88031005859375, 442.0318298339844, 454.1833190917969, 466.3348388671875, 478.486328125, 490.6378173828125, 502.789306640625, 514.9407958984375, 527.0923461914062, 539.2438354492188, 551.3953247070312, 563.5468139648438, 575.6983642578125, 587.849853515625]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 8.0, 9.0, 18.0, 8.0, 18.0, 10.0, 25.0, 28.0, 22.0, 17.0, 33.0, 39.0, 26.0, 35.0, 45.0, 35.0, 43.0, 41.0, 52.0, 45.0, 35.0, 45.0, 33.0, 31.0, 33.0, 23.0, 27.0, 28.0, 24.0, 25.0, 19.0, 24.0, 19.0, 6.0, 10.0, 9.0, 7.0, 9.0, 2.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-66.0582275390625, -64.1529541015625, -62.24768829345703, -60.3424186706543, -58.43714904785156, -56.53187942504883, -54.626609802246094, -52.721336364746094, -50.816070556640625, -48.91080093383789, -47.005531311035156, -45.10026168823242, -43.19499206542969, -41.28972244262695, -39.38445281982422, -37.47917938232422, -35.573909759521484, -33.66864013671875, -31.763370513916016, -29.85810089111328, -27.952831268310547, -26.047561645507812, -24.142290115356445, -22.23702049255371, -20.331750869750977, -18.426481246948242, -16.521211624145508, -14.615941047668457, -12.710671424865723, -10.805401802062988, -8.900131225585938, -6.994861602783203, -5.089595794677734, -3.184325933456421, -1.2790560722351074, 0.6262140274047852, 2.5314836502075195, 4.436753273010254, 6.342023849487305, 8.247293472290039, 10.152563095092773, 12.057832717895508, 13.963102340698242, 15.868372917175293, 17.773643493652344, 19.678913116455078, 21.584182739257812, 23.489452362060547, 25.39472198486328, 27.299991607666016, 29.20526123046875, 31.110530853271484, 33.01580047607422, 34.92107009887695, 36.82633972167969, 38.73161315917969, 40.636878967285156, 42.54214859008789, 44.447418212890625, 46.35268783569336, 48.257957458496094, 50.16322708129883, 52.06849670410156, 53.97377014160156, 55.8790397644043]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 7.0, 1.0, 5.0, 11.0, 6.0, 7.0, 11.0, 11.0, 16.0, 20.0, 17.0, 17.0, 19.0, 24.0, 25.0, 22.0, 33.0, 30.0, 31.0, 35.0, 41.0, 39.0, 34.0, 32.0, 38.0, 37.0, 29.0, 53.0, 25.0, 25.0, 31.0, 39.0, 28.0, 18.0, 21.0, 20.0, 20.0, 18.0, 13.0, 13.0, 13.0, 9.0, 11.0, 6.0, 4.0, 4.0, 10.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-8.8125, -8.5201416015625, -8.227783203125, -7.9354248046875, -7.64306640625, -7.3507080078125, -7.058349609375, -6.7659912109375, -6.4736328125, -6.1812744140625, -5.888916015625, -5.5965576171875, -5.30419921875, -5.0118408203125, -4.719482421875, -4.4271240234375, -4.134765625, -3.8424072265625, -3.550048828125, -3.2576904296875, -2.96533203125, -2.6729736328125, -2.380615234375, -2.0882568359375, -1.7958984375, -1.5035400390625, -1.211181640625, -0.9188232421875, -0.62646484375, -0.3341064453125, -0.041748046875, 0.2506103515625, 0.54296875, 0.8353271484375, 1.127685546875, 1.4200439453125, 1.71240234375, 2.0047607421875, 2.297119140625, 2.5894775390625, 2.8818359375, 3.1741943359375, 3.466552734375, 3.7589111328125, 4.05126953125, 4.3436279296875, 4.635986328125, 4.9283447265625, 5.220703125, 5.5130615234375, 5.805419921875, 6.0977783203125, 6.39013671875, 6.6824951171875, 6.974853515625, 7.2672119140625, 7.5595703125, 7.8519287109375, 8.144287109375, 8.4366455078125, 8.72900390625, 9.0213623046875, 9.313720703125, 9.6060791015625, 9.8984375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 0.0, 12.0, 10.0, 20.0, 47.0, 51.0, 61.0, 96.0, 113.0, 197.0, 283.0, 362.0, 527.0, 696.0, 919.0, 1392.0, 1771.0, 2357.0, 3209.0, 4532.0, 6028.0, 8022.0, 11299.0, 15827.0, 22373.0, 32714.0, 49536.0, 79752.0, 145300.0, 291712.0, 136195.0, 75889.0, 47683.0, 31735.0, 21818.0, 15291.0, 10764.0, 8038.0, 5821.0, 4109.0, 3219.0, 2353.0, 1735.0, 1261.0, 972.0, 697.0, 504.0, 342.0, 261.0, 216.0, 132.0, 113.0, 69.0, 39.0, 25.0, 17.0, 22.0, 13.0, 6.0, 8.0], "bins": [-2.3359375, -2.26611328125, -2.1962890625, -2.12646484375, -2.056640625, -1.98681640625, -1.9169921875, -1.84716796875, -1.77734375, -1.70751953125, -1.6376953125, -1.56787109375, -1.498046875, -1.42822265625, -1.3583984375, -1.28857421875, -1.21875, -1.14892578125, -1.0791015625, -1.00927734375, -0.939453125, -0.86962890625, -0.7998046875, -0.72998046875, -0.66015625, -0.59033203125, -0.5205078125, -0.45068359375, -0.380859375, -0.31103515625, -0.2412109375, -0.17138671875, -0.1015625, -0.03173828125, 0.0380859375, 0.10791015625, 0.177734375, 0.24755859375, 0.3173828125, 0.38720703125, 0.45703125, 0.52685546875, 0.5966796875, 0.66650390625, 0.736328125, 0.80615234375, 0.8759765625, 0.94580078125, 1.015625, 1.08544921875, 1.1552734375, 1.22509765625, 1.294921875, 1.36474609375, 1.4345703125, 1.50439453125, 1.57421875, 1.64404296875, 1.7138671875, 1.78369140625, 1.853515625, 1.92333984375, 1.9931640625, 2.06298828125, 2.1328125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 5.0, 12.0, 12.0, 8.0, 12.0, 9.0, 20.0, 10.0, 21.0, 22.0, 24.0, 25.0, 31.0, 26.0, 46.0, 40.0, 45.0, 39.0, 54.0, 1053.0, 31.0, 36.0, 48.0, 39.0, 31.0, 42.0, 34.0, 32.0, 26.0, 25.0, 20.0, 22.0, 18.0, 13.0, 19.0, 11.0, 9.0, 11.0, 7.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-7.12890625, -6.91802978515625, -6.7071533203125, -6.49627685546875, -6.285400390625, -6.07452392578125, -5.8636474609375, -5.65277099609375, -5.44189453125, -5.23101806640625, -5.0201416015625, -4.80926513671875, -4.598388671875, -4.38751220703125, -4.1766357421875, -3.96575927734375, -3.7548828125, -3.54400634765625, -3.3331298828125, -3.12225341796875, -2.911376953125, -2.70050048828125, -2.4896240234375, -2.27874755859375, -2.06787109375, -1.85699462890625, -1.6461181640625, -1.43524169921875, -1.224365234375, -1.01348876953125, -0.8026123046875, -0.59173583984375, -0.380859375, -0.16998291015625, 0.0408935546875, 0.25177001953125, 0.462646484375, 0.67352294921875, 0.8843994140625, 1.09527587890625, 1.30615234375, 1.51702880859375, 1.7279052734375, 1.93878173828125, 2.149658203125, 2.36053466796875, 2.5714111328125, 2.78228759765625, 2.9931640625, 3.20404052734375, 3.4149169921875, 3.62579345703125, 3.836669921875, 4.04754638671875, 4.2584228515625, 4.46929931640625, 4.68017578125, 4.89105224609375, 5.1019287109375, 5.31280517578125, 5.523681640625, 5.73455810546875, 5.9454345703125, 6.15631103515625, 6.3671875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 12.0, 6.0, 9.0, 13.0, 30.0, 32.0, 54.0, 77.0, 114.0, 212.0, 208.0, 348.0, 503.0, 714.0, 1029.0, 1507.0, 2157.0, 3129.0, 4466.0, 6195.0, 9138.0, 13569.0, 20225.0, 30660.0, 47669.0, 76137.0, 134545.0, 1348040.0, 156008.0, 85106.0, 52370.0, 33727.0, 22047.0, 14712.0, 9972.0, 6812.0, 4647.0, 3339.0, 2304.0, 1669.0, 1127.0, 760.0, 507.0, 399.0, 258.0, 186.0, 118.0, 93.0, 52.0, 49.0, 28.0, 23.0, 12.0, 5.0, 9.0, 3.0, 1.0, 6.0], "bins": [-2.677734375, -2.598052978515625, -2.51837158203125, -2.438690185546875, -2.3590087890625, -2.279327392578125, -2.19964599609375, -2.119964599609375, -2.040283203125, -1.960601806640625, -1.88092041015625, -1.801239013671875, -1.7215576171875, -1.641876220703125, -1.56219482421875, -1.482513427734375, -1.40283203125, -1.323150634765625, -1.24346923828125, -1.163787841796875, -1.0841064453125, -1.004425048828125, -0.92474365234375, -0.845062255859375, -0.765380859375, -0.685699462890625, -0.60601806640625, -0.526336669921875, -0.4466552734375, -0.366973876953125, -0.28729248046875, -0.207611083984375, -0.1279296875, -0.048248291015625, 0.03143310546875, 0.111114501953125, 0.1907958984375, 0.270477294921875, 0.35015869140625, 0.429840087890625, 0.509521484375, 0.589202880859375, 0.66888427734375, 0.748565673828125, 0.8282470703125, 0.907928466796875, 0.98760986328125, 1.067291259765625, 1.14697265625, 1.226654052734375, 1.30633544921875, 1.386016845703125, 1.4656982421875, 1.545379638671875, 1.62506103515625, 1.704742431640625, 1.784423828125, 1.864105224609375, 1.94378662109375, 2.023468017578125, 2.1031494140625, 2.182830810546875, 2.26251220703125, 2.342193603515625, 2.421875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 7.0, 13.0, 15.0, 27.0, 26.0, 23.0, 38.0, 45.0, 57.0, 71.0, 85.0, 78.0, 103.0, 69.0, 63.0, 49.0, 47.0, 37.0, 31.0, 35.0, 19.0, 10.0, 18.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005221366882324219, -0.0005052313208580017, -0.0004883259534835815, -0.0004714205861091614, -0.0004545152187347412, -0.00043760985136032104, -0.0004207044839859009, -0.0004037991166114807, -0.00038689374923706055, -0.0003699883818626404, -0.0003530830144882202, -0.00033617764711380005, -0.0003192722797393799, -0.0003023669123649597, -0.00028546154499053955, -0.0002685561776161194, -0.0002516508102416992, -0.00023474544286727905, -0.0002178400754928589, -0.00020093470811843872, -0.00018402934074401855, -0.0001671239733695984, -0.00015021860599517822, -0.00013331323862075806, -0.00011640787124633789, -9.950250387191772e-05, -8.259713649749756e-05, -6.569176912307739e-05, -4.8786401748657227e-05, -3.188103437423706e-05, -1.4975666999816895e-05, 1.9297003746032715e-06, 1.8835067749023438e-05, 3.5740435123443604e-05, 5.264580249786377e-05, 6.955116987228394e-05, 8.64565372467041e-05, 0.00010336190462112427, 0.00012026727199554443, 0.0001371726393699646, 0.00015407800674438477, 0.00017098337411880493, 0.0001878887414932251, 0.00020479410886764526, 0.00022169947624206543, 0.0002386048436164856, 0.00025551021099090576, 0.00027241557836532593, 0.0002893209457397461, 0.00030622631311416626, 0.0003231316804885864, 0.0003400370478630066, 0.00035694241523742676, 0.0003738477826118469, 0.0003907531499862671, 0.00040765851736068726, 0.0004245638847351074, 0.0004414692521095276, 0.00045837461948394775, 0.0004752799868583679, 0.0004921853542327881, 0.0005090907216072083, 0.0005259960889816284, 0.0005429014563560486, 0.0005598068237304688]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 9.0, 6.0, 6.0, 10.0, 19.0, 27.0, 36.0, 54.0, 65.0, 102.0, 140.0, 208.0, 429.0, 1018.0, 309499.0, 734604.0, 1123.0, 499.0, 219.0, 140.0, 90.0, 68.0, 45.0, 36.0, 35.0, 17.0, 12.0, 10.0, 12.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01123046875, -0.010890603065490723, -0.010550737380981445, -0.010210871696472168, -0.00987100601196289, -0.009531140327453613, -0.009191274642944336, -0.008851408958435059, -0.008511543273925781, -0.008171677589416504, -0.007831811904907227, -0.007491946220397949, -0.007152080535888672, -0.0068122148513793945, -0.006472349166870117, -0.00613248348236084, -0.0057926177978515625, -0.005452752113342285, -0.005112886428833008, -0.0047730207443237305, -0.004433155059814453, -0.004093289375305176, -0.0037534236907958984, -0.003413558006286621, -0.0030736923217773438, -0.0027338266372680664, -0.002393960952758789, -0.0020540952682495117, -0.0017142295837402344, -0.001374363899230957, -0.0010344982147216797, -0.0006946325302124023, -0.000354766845703125, -1.4901161193847656e-05, 0.0003249645233154297, 0.000664830207824707, 0.0010046958923339844, 0.0013445615768432617, 0.001684427261352539, 0.0020242929458618164, 0.0023641586303710938, 0.002704024314880371, 0.0030438899993896484, 0.0033837556838989258, 0.003723621368408203, 0.0040634870529174805, 0.004403352737426758, 0.004743218421936035, 0.0050830841064453125, 0.00542294979095459, 0.005762815475463867, 0.0061026811599731445, 0.006442546844482422, 0.006782412528991699, 0.0071222782135009766, 0.007462143898010254, 0.007802009582519531, 0.008141875267028809, 0.008481740951538086, 0.008821606636047363, 0.00916147232055664, 0.009501338005065918, 0.009841203689575195, 0.010181069374084473, 0.01052093505859375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 57.0, 625.0, 318.0, 13.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002935346565209329, -0.00024281709920614958, -0.00019209952733945101, -0.00014138195547275245, -9.066439815796912e-05, -3.994684084318578e-05, 1.0770745575428009e-05, 6.148830289021134e-05, 0.00011220586020499468, 0.000162923417519778, 0.00021364098938647658, 0.00026435856125317514, 0.0003150761185679585, 0.0003657936758827418, 0.0004165112623013556, 0.00046722881961613894, 0.0005179463769309223, 0.0005686639342457056, 0.0006193814915604889, 0.0006700990488752723, 0.0007208166643977165, 0.0007715341635048389, 0.0008222517790272832, 0.0008729693363420665, 0.0009236868936568499, 0.0009744044509716332, 0.0010251220082864165, 0.0010758396238088608, 0.0011265571229159832, 0.0011772747384384274, 0.0012279923539608717, 0.0012787098530679941, 0.0013294273521751165, 0.0013801449676975608, 0.0014308624668046832, 0.0014815800823271275, 0.0015322975814342499, 0.0015830151969566941, 0.0016337328124791384, 0.0016844503115862608, 0.0017351678106933832, 0.0017858854262158275, 0.0018366029253229499, 0.0018873205408453941, 0.0019380380399525166, 0.001988755539059639, 0.002039473270997405, 0.0020901907701045275, 0.0021409085020422935, 0.002191626001149416, 0.002242343733087182, 0.0022930612321943045, 0.002343778731301427, 0.0023944962304085493, 0.0024452139623463154, 0.002495931461453438, 0.0025466489605605602, 0.0025973664596676826, 0.0026480841916054487, 0.002698801690712571, 0.0027495191898196936, 0.002800236688926816, 0.002850954420864582, 0.0029016719199717045, 0.002952389419078827]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 7.0, 5.0, 5.0, 15.0, 17.0, 12.0, 17.0, 12.0, 19.0, 17.0, 24.0, 27.0, 34.0, 35.0, 27.0, 35.0, 48.0, 55.0, 45.0, 40.0, 44.0, 52.0, 33.0, 39.0, 35.0, 31.0, 41.0, 33.0, 29.0, 37.0, 19.0, 22.0, 11.0, 13.0, 10.0, 11.0, 10.0, 4.0, 10.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019627809524536133, -0.00018920749425888062, -0.0001821368932723999, -0.0001750662922859192, -0.00016799569129943848, -0.00016092509031295776, -0.00015385448932647705, -0.00014678388833999634, -0.00013971328735351562, -0.0001326426863670349, -0.0001255720853805542, -0.00011850148439407349, -0.00011143088340759277, -0.00010436028242111206, -9.728968143463135e-05, -9.021908044815063e-05, -8.314847946166992e-05, -7.607787847518921e-05, -6.90072774887085e-05, -6.193667650222778e-05, -5.486607551574707e-05, -4.779547452926636e-05, -4.0724873542785645e-05, -3.365427255630493e-05, -2.658367156982422e-05, -1.9513070583343506e-05, -1.2442469596862793e-05, -5.37186861038208e-06, 1.6987323760986328e-06, 8.769333362579346e-06, 1.583993434906006e-05, 2.291053533554077e-05, 2.9981136322021484e-05, 3.70517373085022e-05, 4.412233829498291e-05, 5.119293928146362e-05, 5.8263540267944336e-05, 6.533414125442505e-05, 7.240474224090576e-05, 7.947534322738647e-05, 8.654594421386719e-05, 9.36165452003479e-05, 0.00010068714618682861, 0.00010775774717330933, 0.00011482834815979004, 0.00012189894914627075, 0.00012896955013275146, 0.00013604015111923218, 0.0001431107521057129, 0.0001501813530921936, 0.00015725195407867432, 0.00016432255506515503, 0.00017139315605163574, 0.00017846375703811646, 0.00018553435802459717, 0.00019260495901107788, 0.0001996755599975586, 0.0002067461609840393, 0.00021381676197052002, 0.00022088736295700073, 0.00022795796394348145, 0.00023502856492996216, 0.00024209916591644287, 0.0002491697669029236, 0.0002562403678894043]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 7.0, 1.0, 5.0, 11.0, 6.0, 7.0, 11.0, 11.0, 16.0, 20.0, 17.0, 17.0, 19.0, 24.0, 25.0, 22.0, 33.0, 30.0, 31.0, 35.0, 41.0, 40.0, 33.0, 32.0, 38.0, 37.0, 29.0, 53.0, 25.0, 25.0, 31.0, 39.0, 28.0, 18.0, 21.0, 20.0, 20.0, 18.0, 13.0, 13.0, 13.0, 9.0, 11.0, 6.0, 4.0, 4.0, 10.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-8.8125, -8.5201416015625, -8.227783203125, -7.9354248046875, -7.64306640625, -7.3507080078125, -7.058349609375, -6.7659912109375, -6.4736328125, -6.1812744140625, -5.888916015625, -5.5965576171875, -5.30419921875, -5.0118408203125, -4.719482421875, -4.4271240234375, -4.134765625, -3.8424072265625, -3.550048828125, -3.2576904296875, -2.96533203125, -2.6729736328125, -2.380615234375, -2.0882568359375, -1.7958984375, -1.5035400390625, -1.211181640625, -0.9188232421875, -0.62646484375, -0.3341064453125, -0.041748046875, 0.2506103515625, 0.54296875, 0.8353271484375, 1.127685546875, 1.4200439453125, 1.71240234375, 2.0047607421875, 2.297119140625, 2.5894775390625, 2.8818359375, 3.1741943359375, 3.466552734375, 3.7589111328125, 4.05126953125, 4.3436279296875, 4.635986328125, 4.9283447265625, 5.220703125, 5.5130615234375, 5.805419921875, 6.0977783203125, 6.39013671875, 6.6824951171875, 6.974853515625, 7.2672119140625, 7.5595703125, 7.8519287109375, 8.144287109375, 8.4366455078125, 8.72900390625, 9.0213623046875, 9.313720703125, 9.6060791015625, 9.8984375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 9.0, 17.0, 14.0, 26.0, 37.0, 33.0, 54.0, 65.0, 86.0, 98.0, 154.0, 175.0, 225.0, 274.0, 374.0, 534.0, 849.0, 1952.0, 6248.0, 27755.0, 177321.0, 711946.0, 94118.0, 17602.0, 4425.0, 1441.0, 700.0, 462.0, 376.0, 249.0, 187.0, 156.0, 139.0, 100.0, 79.0, 58.0, 43.0, 28.0, 21.0, 23.0, 16.0, 13.0, 15.0, 12.0, 13.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-22.65625, -21.909912109375, -21.16357421875, -20.417236328125, -19.6708984375, -18.924560546875, -18.17822265625, -17.431884765625, -16.685546875, -15.939208984375, -15.19287109375, -14.446533203125, -13.7001953125, -12.953857421875, -12.20751953125, -11.461181640625, -10.71484375, -9.968505859375, -9.22216796875, -8.475830078125, -7.7294921875, -6.983154296875, -6.23681640625, -5.490478515625, -4.744140625, -3.997802734375, -3.25146484375, -2.505126953125, -1.7587890625, -1.012451171875, -0.26611328125, 0.480224609375, 1.2265625, 1.972900390625, 2.71923828125, 3.465576171875, 4.2119140625, 4.958251953125, 5.70458984375, 6.450927734375, 7.197265625, 7.943603515625, 8.68994140625, 9.436279296875, 10.1826171875, 10.928955078125, 11.67529296875, 12.421630859375, 13.16796875, 13.914306640625, 14.66064453125, 15.406982421875, 16.1533203125, 16.899658203125, 17.64599609375, 18.392333984375, 19.138671875, 19.885009765625, 20.63134765625, 21.377685546875, 22.1240234375, 22.870361328125, 23.61669921875, 24.363037109375, 25.109375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 13.0, 19.0, 15.0, 26.0, 20.0, 23.0, 31.0, 29.0, 44.0, 38.0, 44.0, 59.0, 94.0, 211.0, 1536.0, 299.0, 115.0, 65.0, 51.0, 44.0, 41.0, 37.0, 30.0, 25.0, 29.0, 25.0, 9.0, 15.0, 10.0, 6.0, 8.0, 6.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.90625, -38.68359375, -37.4609375, -36.23828125, -35.015625, -33.79296875, -32.5703125, -31.34765625, -30.125, -28.90234375, -27.6796875, -26.45703125, -25.234375, -24.01171875, -22.7890625, -21.56640625, -20.34375, -19.12109375, -17.8984375, -16.67578125, -15.453125, -14.23046875, -13.0078125, -11.78515625, -10.5625, -9.33984375, -8.1171875, -6.89453125, -5.671875, -4.44921875, -3.2265625, -2.00390625, -0.78125, 0.44140625, 1.6640625, 2.88671875, 4.109375, 5.33203125, 6.5546875, 7.77734375, 9.0, 10.22265625, 11.4453125, 12.66796875, 13.890625, 15.11328125, 16.3359375, 17.55859375, 18.78125, 20.00390625, 21.2265625, 22.44921875, 23.671875, 24.89453125, 26.1171875, 27.33984375, 28.5625, 29.78515625, 31.0078125, 32.23046875, 33.453125, 34.67578125, 35.8984375, 37.12109375, 38.34375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 8.0, 8.0, 12.0, 13.0, 16.0, 16.0, 34.0, 29.0, 50.0, 42.0, 73.0, 109.0, 143.0, 244.0, 642.0, 1797.0, 23692.0, 3080446.0, 34757.0, 2010.0, 642.0, 282.0, 172.0, 107.0, 68.0, 50.0, 45.0, 39.0, 39.0, 28.0, 16.0, 17.0, 7.0, 11.0, 6.0, 5.0, 4.0, 2.0, 9.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.6875, -97.390625, -94.09375, -90.796875, -87.5, -84.203125, -80.90625, -77.609375, -74.3125, -71.015625, -67.71875, -64.421875, -61.125, -57.828125, -54.53125, -51.234375, -47.9375, -44.640625, -41.34375, -38.046875, -34.75, -31.453125, -28.15625, -24.859375, -21.5625, -18.265625, -14.96875, -11.671875, -8.375, -5.078125, -1.78125, 1.515625, 4.8125, 8.109375, 11.40625, 14.703125, 18.0, 21.296875, 24.59375, 27.890625, 31.1875, 34.484375, 37.78125, 41.078125, 44.375, 47.671875, 50.96875, 54.265625, 57.5625, 60.859375, 64.15625, 67.453125, 70.75, 74.046875, 77.34375, 80.640625, 83.9375, 87.234375, 90.53125, 93.828125, 97.125, 100.421875, 103.71875, 107.015625, 110.3125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [3.0, 11.0, 96.0, 549.0, 319.0, 38.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.00372886657715, -19.84703826904297, -12.690346717834473, -5.533655166625977, 1.6230354309082031, 8.779726028442383, 15.936418533325195, 23.093107223510742, 30.249799728393555, 37.406490325927734, 44.56318283081055, 51.719871520996094, 58.876564025878906, 66.03325653076172, 73.18994903564453, 80.34663391113281, 87.50332641601562, 94.66001892089844, 101.81671142578125, 108.97340393066406, 116.13008880615234, 123.28678131103516, 130.4434814453125, 137.60015869140625, 144.75685119628906, 151.91354370117188, 159.0702362060547, 166.2269287109375, 173.3836212158203, 180.54031372070312, 187.69699096679688, 194.8536834716797, 202.01039123535156, 209.16708374023438, 216.3237762451172, 223.48046875, 230.6371612548828, 237.79385375976562, 244.95053100585938, 252.1072235107422, 259.263916015625, 266.42059326171875, 273.5773010253906, 280.7339782714844, 287.89068603515625, 295.04736328125, 302.2040710449219, 309.3607482910156, 316.5174560546875, 323.67413330078125, 330.8308410644531, 337.9875183105469, 345.14422607421875, 352.3009033203125, 359.4576110839844, 366.6142883300781, 373.7709655761719, 380.9276428222656, 388.0843505859375, 395.24102783203125, 402.3977355957031, 409.5544128417969, 416.71112060546875, 423.8677978515625, 431.0245056152344]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 9.0, 4.0, 6.0, 9.0, 13.0, 10.0, 15.0, 17.0, 14.0, 15.0, 22.0, 20.0, 15.0, 35.0, 29.0, 34.0, 41.0, 35.0, 38.0, 31.0, 31.0, 34.0, 34.0, 37.0, 36.0, 35.0, 42.0, 45.0, 28.0, 37.0, 33.0, 24.0, 24.0, 26.0, 20.0, 26.0, 17.0, 7.0, 14.0, 7.0, 5.0, 7.0, 9.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-84.48446655273438, -81.71961975097656, -78.95477294921875, -76.18992614746094, -73.42507934570312, -70.66023254394531, -67.8953857421875, -65.13054656982422, -62.365699768066406, -59.600852966308594, -56.83600616455078, -54.07115936279297, -51.30631637573242, -48.54146957397461, -45.7766227722168, -43.01177978515625, -40.24692916870117, -37.48208236694336, -34.71723556518555, -31.952390670776367, -29.187545776367188, -26.422698974609375, -23.657852172851562, -20.893007278442383, -18.12816047668457, -15.363314628601074, -12.598468780517578, -9.833621978759766, -7.0687761306762695, -4.303930282592773, -1.539083480834961, 1.2257614135742188, 3.9906082153320312, 6.755454063415527, 9.520299911499023, 12.285146713256836, 15.049992561340332, 17.814838409423828, 20.57968521118164, 23.34453010559082, 26.109376907348633, 28.874223709106445, 31.639068603515625, 34.40391540527344, 37.16876220703125, 39.93360900878906, 42.698455810546875, 45.46329879760742, 48.228145599365234, 50.99299240112305, 53.75783920288086, 56.522682189941406, 59.28752899169922, 62.05237579345703, 64.81722259521484, 67.58206939697266, 70.34691619873047, 73.11176300048828, 75.8766098022461, 78.6414566040039, 81.40630340576172, 84.171142578125, 86.93598937988281, 89.70083618164062, 92.46568298339844]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 4.0, 4.0, 6.0, 6.0, 11.0, 15.0, 9.0, 14.0, 12.0, 23.0, 22.0, 18.0, 30.0, 21.0, 36.0, 31.0, 33.0, 41.0, 41.0, 39.0, 31.0, 35.0, 43.0, 33.0, 44.0, 39.0, 33.0, 43.0, 26.0, 32.0, 32.0, 24.0, 23.0, 20.0, 15.0, 14.0, 15.0, 10.0, 9.0, 8.0, 12.0, 9.0, 4.0, 5.0, 2.0, 5.0, 1.0, 2.0, 8.0, 1.0, 2.0, 3.0, 2.0], "bins": [-11.2578125, -10.9180908203125, -10.578369140625, -10.2386474609375, -9.89892578125, -9.5592041015625, -9.219482421875, -8.8797607421875, -8.5400390625, -8.2003173828125, -7.860595703125, -7.5208740234375, -7.18115234375, -6.8414306640625, -6.501708984375, -6.1619873046875, -5.822265625, -5.4825439453125, -5.142822265625, -4.8031005859375, -4.46337890625, -4.1236572265625, -3.783935546875, -3.4442138671875, -3.1044921875, -2.7647705078125, -2.425048828125, -2.0853271484375, -1.74560546875, -1.4058837890625, -1.066162109375, -0.7264404296875, -0.38671875, -0.0469970703125, 0.292724609375, 0.6324462890625, 0.97216796875, 1.3118896484375, 1.651611328125, 1.9913330078125, 2.3310546875, 2.6707763671875, 3.010498046875, 3.3502197265625, 3.68994140625, 4.0296630859375, 4.369384765625, 4.7091064453125, 5.048828125, 5.3885498046875, 5.728271484375, 6.0679931640625, 6.40771484375, 6.7474365234375, 7.087158203125, 7.4268798828125, 7.7666015625, 8.1063232421875, 8.446044921875, 8.7857666015625, 9.12548828125, 9.4652099609375, 9.804931640625, 10.1446533203125, 10.484375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 11.0, 8.0, 28.0, 22.0, 24.0, 29.0, 28.0, 41.0, 48.0, 77.0, 94.0, 132.0, 176.0, 240.0, 350.0, 655.0, 1593.0, 6382.0, 50228.0, 568827.0, 2378133.0, 1067285.0, 104566.0, 10579.0, 2300.0, 867.0, 419.0, 293.0, 196.0, 133.0, 109.0, 92.0, 57.0, 40.0, 51.0, 26.0, 27.0, 24.0, 17.0, 13.0, 12.0, 8.0, 7.0, 10.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-22.109375, -21.410888671875, -20.71240234375, -20.013916015625, -19.3154296875, -18.616943359375, -17.91845703125, -17.219970703125, -16.521484375, -15.822998046875, -15.12451171875, -14.426025390625, -13.7275390625, -13.029052734375, -12.33056640625, -11.632080078125, -10.93359375, -10.235107421875, -9.53662109375, -8.838134765625, -8.1396484375, -7.441162109375, -6.74267578125, -6.044189453125, -5.345703125, -4.647216796875, -3.94873046875, -3.250244140625, -2.5517578125, -1.853271484375, -1.15478515625, -0.456298828125, 0.2421875, 0.940673828125, 1.63916015625, 2.337646484375, 3.0361328125, 3.734619140625, 4.43310546875, 5.131591796875, 5.830078125, 6.528564453125, 7.22705078125, 7.925537109375, 8.6240234375, 9.322509765625, 10.02099609375, 10.719482421875, 11.41796875, 12.116455078125, 12.81494140625, 13.513427734375, 14.2119140625, 14.910400390625, 15.60888671875, 16.307373046875, 17.005859375, 17.704345703125, 18.40283203125, 19.101318359375, 19.7998046875, 20.498291015625, 21.19677734375, 21.895263671875, 22.59375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 4.0, 18.0, 21.0, 30.0, 47.0, 94.0, 124.0, 207.0, 314.0, 457.0, 607.0, 629.0, 489.0, 356.0, 222.0, 145.0, 87.0, 81.0, 36.0, 33.0, 16.0, 11.0, 9.0, 11.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.890625, -29.0859375, -28.28125, -27.4765625, -26.671875, -25.8671875, -25.0625, -24.2578125, -23.453125, -22.6484375, -21.84375, -21.0390625, -20.234375, -19.4296875, -18.625, -17.8203125, -17.015625, -16.2109375, -15.40625, -14.6015625, -13.796875, -12.9921875, -12.1875, -11.3828125, -10.578125, -9.7734375, -8.96875, -8.1640625, -7.359375, -6.5546875, -5.75, -4.9453125, -4.140625, -3.3359375, -2.53125, -1.7265625, -0.921875, -0.1171875, 0.6875, 1.4921875, 2.296875, 3.1015625, 3.90625, 4.7109375, 5.515625, 6.3203125, 7.125, 7.9296875, 8.734375, 9.5390625, 10.34375, 11.1484375, 11.953125, 12.7578125, 13.5625, 14.3671875, 15.171875, 15.9765625, 16.78125, 17.5859375, 18.390625, 19.1953125, 20.0, 20.8046875, 21.609375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 4.0, 13.0, 11.0, 30.0, 62.0, 78.0, 140.0, 265.0, 494.0, 998.0, 3170.0, 34075.0, 3406075.0, 733502.0, 11772.0, 1981.0, 738.0, 380.0, 207.0, 118.0, 58.0, 39.0, 29.0, 10.0, 8.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.5625, -62.3974609375, -60.232421875, -58.0673828125, -55.90234375, -53.7373046875, -51.572265625, -49.4072265625, -47.2421875, -45.0771484375, -42.912109375, -40.7470703125, -38.58203125, -36.4169921875, -34.251953125, -32.0869140625, -29.921875, -27.7568359375, -25.591796875, -23.4267578125, -21.26171875, -19.0966796875, -16.931640625, -14.7666015625, -12.6015625, -10.4365234375, -8.271484375, -6.1064453125, -3.94140625, -1.7763671875, 0.388671875, 2.5537109375, 4.71875, 6.8837890625, 9.048828125, 11.2138671875, 13.37890625, 15.5439453125, 17.708984375, 19.8740234375, 22.0390625, 24.2041015625, 26.369140625, 28.5341796875, 30.69921875, 32.8642578125, 35.029296875, 37.1943359375, 39.359375, 41.5244140625, 43.689453125, 45.8544921875, 48.01953125, 50.1845703125, 52.349609375, 54.5146484375, 56.6796875, 58.8447265625, 61.009765625, 63.1748046875, 65.33984375, 67.5048828125, 69.669921875, 71.8349609375, 74.0]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 7.0, 405.0, 594.0, 10.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.93930053710938, -111.90988159179688, -89.88045501708984, -67.85102844238281, -45.82160949707031, -23.792190551757812, -1.76275634765625, 20.26666259765625, 42.29608154296875, 64.32550048828125, 86.35492706298828, 108.38435363769531, 130.4137725830078, 152.4431915283203, 174.47262573242188, 196.50204467773438, 218.53146362304688, 240.56088256835938, 262.5903015136719, 284.6197509765625, 306.649169921875, 328.6785888671875, 350.7080078125, 372.7374267578125, 394.766845703125, 416.7962646484375, 438.82568359375, 460.8551025390625, 482.884521484375, 504.9139404296875, 526.943359375, 548.9727783203125, 571.002197265625, 593.0316162109375, 615.06103515625, 637.0904541015625, 659.119873046875, 681.1492919921875, 703.1787109375, 725.2081298828125, 747.237548828125, 769.2669677734375, 791.29638671875, 813.3258056640625, 835.355224609375, 857.3846435546875, 879.4140625, 901.4434814453125, 923.4729614257812, 945.5023803710938, 967.5317993164062, 989.5612182617188, 1011.5906372070312, 1033.6201171875, 1055.6495361328125, 1077.678955078125, 1099.7083740234375, 1121.73779296875, 1143.7672119140625, 1165.796630859375, 1187.8260498046875, 1209.85546875, 1231.8848876953125, 1253.914306640625, 1275.9437255859375]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 10.0, 5.0, 8.0, 18.0, 13.0, 9.0, 14.0, 26.0, 11.0, 18.0, 19.0, 37.0, 29.0, 31.0, 37.0, 34.0, 45.0, 33.0, 42.0, 45.0, 44.0, 49.0, 42.0, 41.0, 33.0, 36.0, 30.0, 28.0, 27.0, 17.0, 24.0, 16.0, 16.0, 17.0, 18.0, 18.0, 4.0, 13.0, 9.0, 5.0, 12.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-62.558265686035156, -60.59885025024414, -58.63943862915039, -56.680023193359375, -54.720611572265625, -52.76119613647461, -50.801780700683594, -48.842369079589844, -46.88295364379883, -44.92353820800781, -42.96412658691406, -41.00471115112305, -39.0452995300293, -37.08588409423828, -35.12647247314453, -33.167057037353516, -31.207643508911133, -29.24822998046875, -27.288816452026367, -25.329402923583984, -23.36998748779297, -21.410573959350586, -19.451160430908203, -17.491744995117188, -15.532332420349121, -13.572918891906738, -11.613504409790039, -9.654090881347656, -7.694676876068115, -5.735262870788574, -3.7758493423461914, -1.8164348602294922, 0.14297866821289062, 2.1023926734924316, 4.061806678771973, 6.0212202072143555, 7.9806342124938965, 9.940048217773438, 11.89946174621582, 13.85887622833252, 15.818289756774902, 17.7777042388916, 19.737117767333984, 21.696531295776367, 23.65594482421875, 25.615360260009766, 27.574771881103516, 29.53418731689453, 31.493600845336914, 33.4530143737793, 35.41242980957031, 37.37184143066406, 39.33125686645508, 41.290672302246094, 43.250083923339844, 45.20949935913086, 47.16891098022461, 49.128326416015625, 51.087738037109375, 53.04715347290039, 55.00656509399414, 56.965980529785156, 58.925392150878906, 60.88480758666992, 62.84422302246094]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 11.0, 7.0, 12.0, 13.0, 17.0, 16.0, 22.0, 23.0, 20.0, 29.0, 33.0, 28.0, 36.0, 39.0, 46.0, 48.0, 51.0, 52.0, 47.0, 47.0, 40.0, 41.0, 44.0, 45.0, 32.0, 33.0, 21.0, 28.0, 17.0, 16.0, 19.0, 10.0, 8.0, 11.0, 13.0, 8.0, 6.0, 1.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.78125, -12.3668212890625, -11.952392578125, -11.5379638671875, -11.12353515625, -10.7091064453125, -10.294677734375, -9.8802490234375, -9.4658203125, -9.0513916015625, -8.636962890625, -8.2225341796875, -7.80810546875, -7.3936767578125, -6.979248046875, -6.5648193359375, -6.150390625, -5.7359619140625, -5.321533203125, -4.9071044921875, -4.49267578125, -4.0782470703125, -3.663818359375, -3.2493896484375, -2.8349609375, -2.4205322265625, -2.006103515625, -1.5916748046875, -1.17724609375, -0.7628173828125, -0.348388671875, 0.0660400390625, 0.48046875, 0.8948974609375, 1.309326171875, 1.7237548828125, 2.13818359375, 2.5526123046875, 2.967041015625, 3.3814697265625, 3.7958984375, 4.2103271484375, 4.624755859375, 5.0391845703125, 5.45361328125, 5.8680419921875, 6.282470703125, 6.6968994140625, 7.111328125, 7.5257568359375, 7.940185546875, 8.3546142578125, 8.76904296875, 9.1834716796875, 9.597900390625, 10.0123291015625, 10.4267578125, 10.8411865234375, 11.255615234375, 11.6700439453125, 12.08447265625, 12.4989013671875, 12.913330078125, 13.3277587890625, 13.7421875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 3.0, 17.0, 17.0, 16.0, 26.0, 41.0, 62.0, 93.0, 126.0, 203.0, 286.0, 434.0, 550.0, 840.0, 1350.0, 2028.0, 3126.0, 4773.0, 7308.0, 11410.0, 17389.0, 27456.0, 45015.0, 77806.0, 150911.0, 361029.0, 142529.0, 74629.0, 43757.0, 26756.0, 16886.0, 10973.0, 7024.0, 4633.0, 3077.0, 1998.0, 1308.0, 823.0, 588.0, 360.0, 271.0, 194.0, 146.0, 87.0, 53.0, 47.0, 29.0, 22.0, 13.0, 7.0, 6.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.333984375, -3.22802734375, -3.1220703125, -3.01611328125, -2.91015625, -2.80419921875, -2.6982421875, -2.59228515625, -2.486328125, -2.38037109375, -2.2744140625, -2.16845703125, -2.0625, -1.95654296875, -1.8505859375, -1.74462890625, -1.638671875, -1.53271484375, -1.4267578125, -1.32080078125, -1.21484375, -1.10888671875, -1.0029296875, -0.89697265625, -0.791015625, -0.68505859375, -0.5791015625, -0.47314453125, -0.3671875, -0.26123046875, -0.1552734375, -0.04931640625, 0.056640625, 0.16259765625, 0.2685546875, 0.37451171875, 0.48046875, 0.58642578125, 0.6923828125, 0.79833984375, 0.904296875, 1.01025390625, 1.1162109375, 1.22216796875, 1.328125, 1.43408203125, 1.5400390625, 1.64599609375, 1.751953125, 1.85791015625, 1.9638671875, 2.06982421875, 2.17578125, 2.28173828125, 2.3876953125, 2.49365234375, 2.599609375, 2.70556640625, 2.8115234375, 2.91748046875, 3.0234375, 3.12939453125, 3.2353515625, 3.34130859375, 3.447265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 5.0, 11.0, 7.0, 19.0, 20.0, 13.0, 18.0, 22.0, 33.0, 23.0, 27.0, 37.0, 28.0, 32.0, 34.0, 37.0, 44.0, 45.0, 1064.0, 49.0, 36.0, 44.0, 41.0, 39.0, 33.0, 33.0, 33.0, 25.0, 22.0, 24.0, 16.0, 13.0, 22.0, 8.0, 12.0, 7.0, 7.0, 4.0, 5.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.27734375, -7.03668212890625, -6.7960205078125, -6.55535888671875, -6.314697265625, -6.07403564453125, -5.8333740234375, -5.59271240234375, -5.35205078125, -5.11138916015625, -4.8707275390625, -4.63006591796875, -4.389404296875, -4.14874267578125, -3.9080810546875, -3.66741943359375, -3.4267578125, -3.18609619140625, -2.9454345703125, -2.70477294921875, -2.464111328125, -2.22344970703125, -1.9827880859375, -1.74212646484375, -1.50146484375, -1.26080322265625, -1.0201416015625, -0.77947998046875, -0.538818359375, -0.29815673828125, -0.0574951171875, 0.18316650390625, 0.423828125, 0.66448974609375, 0.9051513671875, 1.14581298828125, 1.386474609375, 1.62713623046875, 1.8677978515625, 2.10845947265625, 2.34912109375, 2.58978271484375, 2.8304443359375, 3.07110595703125, 3.311767578125, 3.55242919921875, 3.7930908203125, 4.03375244140625, 4.2744140625, 4.51507568359375, 4.7557373046875, 4.99639892578125, 5.237060546875, 5.47772216796875, 5.7183837890625, 5.95904541015625, 6.19970703125, 6.44036865234375, 6.6810302734375, 6.92169189453125, 7.162353515625, 7.40301513671875, 7.6436767578125, 7.88433837890625, 8.125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 12.0, 14.0, 21.0, 38.0, 62.0, 83.0, 110.0, 193.0, 285.0, 454.0, 663.0, 1006.0, 1366.0, 2046.0, 2948.0, 4324.0, 6662.0, 9589.0, 14474.0, 21984.0, 34060.0, 52673.0, 84523.0, 153866.0, 1363543.0, 129226.0, 75077.0, 47468.0, 30415.0, 19638.0, 13083.0, 8774.0, 5817.0, 4110.0, 2619.0, 1865.0, 1338.0, 883.0, 567.0, 416.0, 290.0, 164.0, 145.0, 87.0, 52.0, 32.0, 23.0, 23.0, 9.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.76171875, -2.670806884765625, -2.57989501953125, -2.488983154296875, -2.3980712890625, -2.307159423828125, -2.21624755859375, -2.125335693359375, -2.034423828125, -1.943511962890625, -1.85260009765625, -1.761688232421875, -1.6707763671875, -1.579864501953125, -1.48895263671875, -1.398040771484375, -1.30712890625, -1.216217041015625, -1.12530517578125, -1.034393310546875, -0.9434814453125, -0.852569580078125, -0.76165771484375, -0.670745849609375, -0.579833984375, -0.488922119140625, -0.39801025390625, -0.307098388671875, -0.2161865234375, -0.125274658203125, -0.03436279296875, 0.056549072265625, 0.1474609375, 0.238372802734375, 0.32928466796875, 0.420196533203125, 0.5111083984375, 0.602020263671875, 0.69293212890625, 0.783843994140625, 0.874755859375, 0.965667724609375, 1.05657958984375, 1.147491455078125, 1.2384033203125, 1.329315185546875, 1.42022705078125, 1.511138916015625, 1.60205078125, 1.692962646484375, 1.78387451171875, 1.874786376953125, 1.9656982421875, 2.056610107421875, 2.14752197265625, 2.238433837890625, 2.329345703125, 2.420257568359375, 2.51116943359375, 2.602081298828125, 2.6929931640625, 2.783905029296875, 2.87481689453125, 2.965728759765625, 3.056640625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 6.0, 6.0, 5.0, 4.0, 11.0, 11.0, 20.0, 15.0, 18.0, 28.0, 28.0, 21.0, 28.0, 31.0, 40.0, 53.0, 52.0, 36.0, 57.0, 56.0, 53.0, 61.0, 53.0, 34.0, 35.0, 38.0, 28.0, 26.0, 17.0, 20.0, 10.0, 24.0, 14.0, 9.0, 10.0, 7.0, 4.0, 5.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00044727325439453125, -0.0004339739680290222, -0.0004206746816635132, -0.00040737539529800415, -0.0003940761089324951, -0.0003807768225669861, -0.00036747753620147705, -0.000354178249835968, -0.000340878963470459, -0.00032757967710494995, -0.0003142803907394409, -0.0003009811043739319, -0.00028768181800842285, -0.0002743825316429138, -0.0002610832452774048, -0.00024778395891189575, -0.00023448467254638672, -0.00022118538618087769, -0.00020788609981536865, -0.00019458681344985962, -0.00018128752708435059, -0.00016798824071884155, -0.00015468895435333252, -0.00014138966798782349, -0.00012809038162231445, -0.00011479109525680542, -0.00010149180889129639, -8.819252252578735e-05, -7.489323616027832e-05, -6.159394979476929e-05, -4.8294663429260254e-05, -3.499537706375122e-05, -2.1696090698242188e-05, -8.396804332733154e-06, 4.902482032775879e-06, 1.8201768398284912e-05, 3.1501054763793945e-05, 4.480034112930298e-05, 5.809962749481201e-05, 7.139891386032104e-05, 8.469820022583008e-05, 9.799748659133911e-05, 0.00011129677295684814, 0.00012459605932235718, 0.0001378953456878662, 0.00015119463205337524, 0.00016449391841888428, 0.0001777932047843933, 0.00019109249114990234, 0.00020439177751541138, 0.0002176910638809204, 0.00023099035024642944, 0.0002442896366119385, 0.0002575889229774475, 0.00027088820934295654, 0.0002841874957084656, 0.0002974867820739746, 0.00031078606843948364, 0.0003240853548049927, 0.0003373846411705017, 0.00035068392753601074, 0.0003639832139015198, 0.0003772825002670288, 0.00039058178663253784, 0.0004038810729980469]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 12.0, 11.0, 11.0, 11.0, 15.0, 16.0, 26.0, 35.0, 33.0, 37.0, 52.0, 56.0, 101.0, 113.0, 161.0, 253.0, 364.0, 669.0, 3091.0, 876117.0, 164126.0, 1386.0, 556.0, 320.0, 233.0, 159.0, 120.0, 89.0, 64.0, 47.0, 44.0, 45.0, 27.0, 25.0, 23.0, 13.0, 11.0, 15.0, 13.0, 12.0, 9.0, 8.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.007381439208984375, -0.007142126560211182, -0.006902813911437988, -0.006663501262664795, -0.0064241886138916016, -0.006184875965118408, -0.005945563316345215, -0.0057062506675720215, -0.005466938018798828, -0.005227625370025635, -0.004988312721252441, -0.004749000072479248, -0.004509687423706055, -0.004270374774932861, -0.004031062126159668, -0.0037917494773864746, -0.0035524368286132812, -0.003313124179840088, -0.0030738115310668945, -0.002834498882293701, -0.002595186233520508, -0.0023558735847473145, -0.002116560935974121, -0.0018772482872009277, -0.0016379356384277344, -0.001398622989654541, -0.0011593103408813477, -0.0009199976921081543, -0.0006806850433349609, -0.0004413723945617676, -0.00020205974578857422, 3.725290298461914e-05, 0.0002765655517578125, 0.0005158782005310059, 0.0007551908493041992, 0.0009945034980773926, 0.001233816146850586, 0.0014731287956237793, 0.0017124414443969727, 0.001951754093170166, 0.0021910667419433594, 0.0024303793907165527, 0.002669692039489746, 0.0029090046882629395, 0.003148317337036133, 0.003387629985809326, 0.0036269426345825195, 0.003866255283355713, 0.004105567932128906, 0.0043448805809021, 0.004584193229675293, 0.004823505878448486, 0.00506281852722168, 0.005302131175994873, 0.005541443824768066, 0.00578075647354126, 0.006020069122314453, 0.0062593817710876465, 0.00649869441986084, 0.006738007068634033, 0.0069773197174072266, 0.00721663236618042, 0.007455945014953613, 0.007695257663726807, 0.0079345703125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 130.0, 524.0, 309.0, 43.0, 2.0, 0.0, 1.0], "bins": [-0.0024589516688138247, -0.00241710152477026, -0.002375251380726695, -0.0023334012366831303, -0.002291551325470209, -0.0022497011814266443, -0.0022078510373830795, -0.0021660008933395147, -0.00212415074929595, -0.002082300605252385, -0.0020404504612088203, -0.0019986003171652555, -0.0019567501731216908, -0.0019149001454934478, -0.0018730501178652048, -0.00183119997382164, -0.0017893498297780752, -0.0017474996857345104, -0.0017056495416909456, -0.0016637995140627027, -0.0016219493700191379, -0.001580099225975573, -0.00153824919834733, -0.0014963990543037653, -0.0014545489102602005, -0.0014126987662166357, -0.001370848622173071, -0.001328998594544828, -0.0012871484505012631, -0.0012452983064576983, -0.0012034482788294554, -0.0011615981347858906, -0.0011197479907423258, -0.001077897846698761, -0.0010360477026551962, -0.0009941976750269532, -0.0009523475309833884, -0.0009104973869398236, -0.0008686473011039197, -0.0008267972152680159, -0.0007849470712244511, -0.0007430969271808863, -0.0007012468413449824, -0.0006593967555090785, -0.0006175466114655137, -0.0005756964674219489, -0.000533846381586045, -0.0004919962957501411, -0.00045014615170657635, -0.000408296036766842, -0.00036644592182710767, -0.00032459580688737333, -0.000282745691947639, -0.00024089557700790465, -0.0001990454620681703, -0.00015719534712843597, -0.0001153452176367864, -7.349510269705206e-05, -3.164498775731772e-05, 1.0205127182416618e-05, 5.205524212215096e-05, 9.39053570618853e-05, 0.00013575547200161964, 0.00017760558694135398, 0.00021945570188108832]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 3.0, 10.0, 9.0, 8.0, 10.0, 18.0, 9.0, 24.0, 27.0, 31.0, 37.0, 35.0, 31.0, 35.0, 41.0, 58.0, 60.0, 46.0, 66.0, 36.0, 49.0, 40.0, 32.0, 28.0, 45.0, 33.0, 35.0, 27.0, 18.0, 19.0, 17.0, 15.0, 10.0, 7.0, 10.0, 1.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002516508102416992, -0.00024271663278341293, -0.00023378245532512665, -0.00022484827786684036, -0.00021591410040855408, -0.0002069799229502678, -0.0001980457454919815, -0.00018911156803369522, -0.00018017739057540894, -0.00017124321311712265, -0.00016230903565883636, -0.00015337485820055008, -0.0001444406807422638, -0.0001355065032839775, -0.00012657232582569122, -0.00011763814836740494, -0.00010870397090911865, -9.976979345083237e-05, -9.083561599254608e-05, -8.19014385342598e-05, -7.296726107597351e-05, -6.403308361768723e-05, -5.509890615940094e-05, -4.6164728701114655e-05, -3.723055124282837e-05, -2.8296373784542084e-05, -1.93621963262558e-05, -1.0428018867969513e-05, -1.4938414096832275e-06, 7.440336048603058e-06, 1.6374513506889343e-05, 2.530869096517563e-05, 3.4242868423461914e-05, 4.31770458817482e-05, 5.2111223340034485e-05, 6.104540079832077e-05, 6.997957825660706e-05, 7.891375571489334e-05, 8.784793317317963e-05, 9.678211063146591e-05, 0.0001057162880897522, 0.00011465046554803848, 0.00012358464300632477, 0.00013251882046461105, 0.00014145299792289734, 0.00015038717538118362, 0.0001593213528394699, 0.0001682555302977562, 0.00017718970775604248, 0.00018612388521432877, 0.00019505806267261505, 0.00020399224013090134, 0.00021292641758918762, 0.0002218605950474739, 0.0002307947725057602, 0.00023972894996404648, 0.00024866312742233276, 0.00025759730488061905, 0.00026653148233890533, 0.0002754656597971916, 0.0002843998372554779, 0.0002933340147137642, 0.0003022681921720505, 0.00031120236963033676, 0.00032013654708862305]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 11.0, 7.0, 12.0, 13.0, 17.0, 16.0, 22.0, 23.0, 20.0, 29.0, 33.0, 28.0, 37.0, 38.0, 48.0, 47.0, 50.0, 52.0, 48.0, 46.0, 40.0, 42.0, 43.0, 45.0, 32.0, 33.0, 21.0, 28.0, 18.0, 15.0, 19.0, 10.0, 8.0, 11.0, 13.0, 8.0, 6.0, 1.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.7734375, -12.359130859375, -11.94482421875, -11.530517578125, -11.1162109375, -10.701904296875, -10.28759765625, -9.873291015625, -9.458984375, -9.044677734375, -8.63037109375, -8.216064453125, -7.8017578125, -7.387451171875, -6.97314453125, -6.558837890625, -6.14453125, -5.730224609375, -5.31591796875, -4.901611328125, -4.4873046875, -4.072998046875, -3.65869140625, -3.244384765625, -2.830078125, -2.415771484375, -2.00146484375, -1.587158203125, -1.1728515625, -0.758544921875, -0.34423828125, 0.070068359375, 0.484375, 0.898681640625, 1.31298828125, 1.727294921875, 2.1416015625, 2.555908203125, 2.97021484375, 3.384521484375, 3.798828125, 4.213134765625, 4.62744140625, 5.041748046875, 5.4560546875, 5.870361328125, 6.28466796875, 6.698974609375, 7.11328125, 7.527587890625, 7.94189453125, 8.356201171875, 8.7705078125, 9.184814453125, 9.59912109375, 10.013427734375, 10.427734375, 10.842041015625, 11.25634765625, 11.670654296875, 12.0849609375, 12.499267578125, 12.91357421875, 13.327880859375, 13.7421875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 6.0, 9.0, 12.0, 19.0, 24.0, 44.0, 38.0, 56.0, 75.0, 109.0, 161.0, 237.0, 316.0, 609.0, 1043.0, 1973.0, 4321.0, 10256.0, 27286.0, 77914.0, 232954.0, 413396.0, 179522.0, 60687.0, 21553.0, 8237.0, 3540.0, 1684.0, 957.0, 496.0, 310.0, 192.0, 143.0, 81.0, 67.0, 64.0, 46.0, 29.0, 24.0, 15.0, 15.0, 12.0, 7.0, 1.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.4765625, -14.9671630859375, -14.457763671875, -13.9483642578125, -13.43896484375, -12.9295654296875, -12.420166015625, -11.9107666015625, -11.4013671875, -10.8919677734375, -10.382568359375, -9.8731689453125, -9.36376953125, -8.8543701171875, -8.344970703125, -7.8355712890625, -7.326171875, -6.8167724609375, -6.307373046875, -5.7979736328125, -5.28857421875, -4.7791748046875, -4.269775390625, -3.7603759765625, -3.2509765625, -2.7415771484375, -2.232177734375, -1.7227783203125, -1.21337890625, -0.7039794921875, -0.194580078125, 0.3148193359375, 0.82421875, 1.3336181640625, 1.843017578125, 2.3524169921875, 2.86181640625, 3.3712158203125, 3.880615234375, 4.3900146484375, 4.8994140625, 5.4088134765625, 5.918212890625, 6.4276123046875, 6.93701171875, 7.4464111328125, 7.955810546875, 8.4652099609375, 8.974609375, 9.4840087890625, 9.993408203125, 10.5028076171875, 11.01220703125, 11.5216064453125, 12.031005859375, 12.5404052734375, 13.0498046875, 13.5592041015625, 14.068603515625, 14.5780029296875, 15.08740234375, 15.5968017578125, 16.106201171875, 16.6156005859375, 17.125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 5.0, 8.0, 6.0, 6.0, 6.0, 3.0, 9.0, 9.0, 21.0, 10.0, 14.0, 19.0, 20.0, 33.0, 29.0, 31.0, 30.0, 47.0, 58.0, 69.0, 126.0, 207.0, 1502.0, 226.0, 121.0, 60.0, 52.0, 36.0, 38.0, 35.0, 32.0, 18.0, 21.0, 22.0, 17.0, 13.0, 20.0, 14.0, 11.0, 11.0, 9.0, 6.0, 3.0, 2.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-35.3125, -34.19287109375, -33.0732421875, -31.95361328125, -30.833984375, -29.71435546875, -28.5947265625, -27.47509765625, -26.35546875, -25.23583984375, -24.1162109375, -22.99658203125, -21.876953125, -20.75732421875, -19.6376953125, -18.51806640625, -17.3984375, -16.27880859375, -15.1591796875, -14.03955078125, -12.919921875, -11.80029296875, -10.6806640625, -9.56103515625, -8.44140625, -7.32177734375, -6.2021484375, -5.08251953125, -3.962890625, -2.84326171875, -1.7236328125, -0.60400390625, 0.515625, 1.63525390625, 2.7548828125, 3.87451171875, 4.994140625, 6.11376953125, 7.2333984375, 8.35302734375, 9.47265625, 10.59228515625, 11.7119140625, 12.83154296875, 13.951171875, 15.07080078125, 16.1904296875, 17.31005859375, 18.4296875, 19.54931640625, 20.6689453125, 21.78857421875, 22.908203125, 24.02783203125, 25.1474609375, 26.26708984375, 27.38671875, 28.50634765625, 29.6259765625, 30.74560546875, 31.865234375, 32.98486328125, 34.1044921875, 35.22412109375, 36.34375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 11.0, 8.0, 5.0, 8.0, 14.0, 19.0, 27.0, 37.0, 47.0, 83.0, 142.0, 226.0, 413.0, 706.0, 2330.0, 115273.0, 2988693.0, 34695.0, 1438.0, 565.0, 341.0, 216.0, 120.0, 91.0, 54.0, 24.0, 31.0, 17.0, 15.0, 10.0, 6.0, 6.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-82.4375, -79.5322265625, -76.626953125, -73.7216796875, -70.81640625, -67.9111328125, -65.005859375, -62.1005859375, -59.1953125, -56.2900390625, -53.384765625, -50.4794921875, -47.57421875, -44.6689453125, -41.763671875, -38.8583984375, -35.953125, -33.0478515625, -30.142578125, -27.2373046875, -24.33203125, -21.4267578125, -18.521484375, -15.6162109375, -12.7109375, -9.8056640625, -6.900390625, -3.9951171875, -1.08984375, 1.8154296875, 4.720703125, 7.6259765625, 10.53125, 13.4365234375, 16.341796875, 19.2470703125, 22.15234375, 25.0576171875, 27.962890625, 30.8681640625, 33.7734375, 36.6787109375, 39.583984375, 42.4892578125, 45.39453125, 48.2998046875, 51.205078125, 54.1103515625, 57.015625, 59.9208984375, 62.826171875, 65.7314453125, 68.63671875, 71.5419921875, 74.447265625, 77.3525390625, 80.2578125, 83.1630859375, 86.068359375, 88.9736328125, 91.87890625, 94.7841796875, 97.689453125, 100.5947265625, 103.5]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.0, 436.0, 430.0, 66.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-364.7219543457031, -356.0268859863281, -347.331787109375, -338.63671875, -329.9416198730469, -321.2465515136719, -312.55145263671875, -303.85638427734375, -295.1612854003906, -286.4662170410156, -277.7711181640625, -269.0760498046875, -260.3809509277344, -251.6858673095703, -242.99078369140625, -234.29571533203125, -225.6006317138672, -216.90554809570312, -208.21046447753906, -199.515380859375, -190.82029724121094, -182.12521362304688, -173.43014526367188, -164.73504638671875, -156.03997802734375, -147.3448944091797, -138.64981079101562, -129.95472717285156, -121.2596435546875, -112.56455993652344, -103.8694839477539, -95.17440032958984, -86.47929382324219, -77.78421020507812, -69.08912658691406, -60.394046783447266, -51.6989631652832, -43.00387954711914, -34.308799743652344, -25.61371612548828, -16.91863250732422, -8.223549842834473, 0.47153282165527344, 9.166614532470703, 17.861698150634766, 26.556781768798828, 35.251861572265625, 43.94694519042969, 52.64202880859375, 61.33711242675781, 70.03219604492188, 78.72727966308594, 87.42236328125, 96.11744689941406, 104.8125228881836, 113.50760650634766, 122.20269012451172, 130.89776611328125, 139.5928497314453, 148.28793334960938, 156.98301696777344, 165.6781005859375, 174.37318420410156, 183.06826782226562, 191.7633514404297]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 5.0, 7.0, 9.0, 6.0, 7.0, 11.0, 7.0, 8.0, 23.0, 12.0, 19.0, 22.0, 16.0, 29.0, 23.0, 34.0, 43.0, 40.0, 31.0, 39.0, 33.0, 33.0, 44.0, 40.0, 46.0, 38.0, 37.0, 29.0, 28.0, 30.0, 26.0, 33.0, 27.0, 21.0, 22.0, 20.0, 13.0, 12.0, 17.0, 12.0, 17.0, 4.0, 3.0, 9.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-72.80058288574219, -70.37996673583984, -67.95935821533203, -65.53874206542969, -63.11812973022461, -60.69751739501953, -58.27690124511719, -55.85628890991211, -53.43567657470703, -51.01506423950195, -48.594451904296875, -46.17383575439453, -43.75322341918945, -41.332611083984375, -38.91199493408203, -36.49138259887695, -34.070770263671875, -31.650157928466797, -29.229543685913086, -26.808929443359375, -24.388317108154297, -21.96770477294922, -19.547090530395508, -17.126476287841797, -14.705863952636719, -12.285250663757324, -9.86463737487793, -7.444024085998535, -5.023410797119141, -2.602797508239746, -0.18218421936035156, 2.2384300231933594, 4.659049987792969, 7.079663276672363, 9.500276565551758, 11.920889854431152, 14.341503143310547, 16.762115478515625, 19.182729721069336, 21.603343963623047, 24.023956298828125, 26.444568634033203, 28.865182876586914, 31.285797119140625, 33.7064094543457, 36.12702178955078, 38.547637939453125, 40.9682502746582, 43.38886260986328, 45.80947494506836, 48.23008728027344, 50.65070343017578, 53.07131576538086, 55.49192810058594, 57.91254425048828, 60.33315658569336, 62.75376892089844, 65.17438507080078, 67.5949935913086, 70.01560974121094, 72.43621826171875, 74.8568344116211, 77.27745056152344, 79.69805908203125, 82.1186752319336]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 8.0, 6.0, 7.0, 8.0, 12.0, 21.0, 12.0, 18.0, 16.0, 15.0, 25.0, 26.0, 32.0, 29.0, 52.0, 40.0, 45.0, 51.0, 38.0, 42.0, 44.0, 54.0, 43.0, 48.0, 53.0, 36.0, 32.0, 30.0, 36.0, 30.0, 14.0, 13.0, 16.0, 14.0, 10.0, 4.0, 8.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0234375, -13.5802001953125, -13.136962890625, -12.6937255859375, -12.25048828125, -11.8072509765625, -11.364013671875, -10.9207763671875, -10.4775390625, -10.0343017578125, -9.591064453125, -9.1478271484375, -8.70458984375, -8.2613525390625, -7.818115234375, -7.3748779296875, -6.931640625, -6.4884033203125, -6.045166015625, -5.6019287109375, -5.15869140625, -4.7154541015625, -4.272216796875, -3.8289794921875, -3.3857421875, -2.9425048828125, -2.499267578125, -2.0560302734375, -1.61279296875, -1.1695556640625, -0.726318359375, -0.2830810546875, 0.16015625, 0.6033935546875, 1.046630859375, 1.4898681640625, 1.93310546875, 2.3763427734375, 2.819580078125, 3.2628173828125, 3.7060546875, 4.1492919921875, 4.592529296875, 5.0357666015625, 5.47900390625, 5.9222412109375, 6.365478515625, 6.8087158203125, 7.251953125, 7.6951904296875, 8.138427734375, 8.5816650390625, 9.02490234375, 9.4681396484375, 9.911376953125, 10.3546142578125, 10.7978515625, 11.2410888671875, 11.684326171875, 12.1275634765625, 12.57080078125, 13.0140380859375, 13.457275390625, 13.9005126953125, 14.34375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 6.0, 10.0, 9.0, 19.0, 21.0, 21.0, 29.0, 37.0, 45.0, 77.0, 102.0, 161.0, 264.0, 445.0, 806.0, 1894.0, 5555.0, 23622.0, 134130.0, 712461.0, 1826554.0, 1156836.0, 271376.0, 45235.0, 9115.0, 2740.0, 1127.0, 595.0, 314.0, 201.0, 111.0, 96.0, 57.0, 35.0, 44.0, 25.0, 20.0, 12.0, 14.0, 8.0, 15.0, 3.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-17.328125, -16.798095703125, -16.26806640625, -15.738037109375, -15.2080078125, -14.677978515625, -14.14794921875, -13.617919921875, -13.087890625, -12.557861328125, -12.02783203125, -11.497802734375, -10.9677734375, -10.437744140625, -9.90771484375, -9.377685546875, -8.84765625, -8.317626953125, -7.78759765625, -7.257568359375, -6.7275390625, -6.197509765625, -5.66748046875, -5.137451171875, -4.607421875, -4.077392578125, -3.54736328125, -3.017333984375, -2.4873046875, -1.957275390625, -1.42724609375, -0.897216796875, -0.3671875, 0.162841796875, 0.69287109375, 1.222900390625, 1.7529296875, 2.282958984375, 2.81298828125, 3.343017578125, 3.873046875, 4.403076171875, 4.93310546875, 5.463134765625, 5.9931640625, 6.523193359375, 7.05322265625, 7.583251953125, 8.11328125, 8.643310546875, 9.17333984375, 9.703369140625, 10.2333984375, 10.763427734375, 11.29345703125, 11.823486328125, 12.353515625, 12.883544921875, 13.41357421875, 13.943603515625, 14.4736328125, 15.003662109375, 15.53369140625, 16.063720703125, 16.59375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 1.0, 2.0, 10.0, 5.0, 9.0, 9.0, 19.0, 27.0, 29.0, 35.0, 56.0, 79.0, 107.0, 165.0, 205.0, 282.0, 415.0, 452.0, 478.0, 439.0, 351.0, 260.0, 199.0, 117.0, 74.0, 62.0, 49.0, 32.0, 37.0, 25.0, 7.0, 12.0, 11.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.765625, -17.1787109375, -16.591796875, -16.0048828125, -15.41796875, -14.8310546875, -14.244140625, -13.6572265625, -13.0703125, -12.4833984375, -11.896484375, -11.3095703125, -10.72265625, -10.1357421875, -9.548828125, -8.9619140625, -8.375, -7.7880859375, -7.201171875, -6.6142578125, -6.02734375, -5.4404296875, -4.853515625, -4.2666015625, -3.6796875, -3.0927734375, -2.505859375, -1.9189453125, -1.33203125, -0.7451171875, -0.158203125, 0.4287109375, 1.015625, 1.6025390625, 2.189453125, 2.7763671875, 3.36328125, 3.9501953125, 4.537109375, 5.1240234375, 5.7109375, 6.2978515625, 6.884765625, 7.4716796875, 8.05859375, 8.6455078125, 9.232421875, 9.8193359375, 10.40625, 10.9931640625, 11.580078125, 12.1669921875, 12.75390625, 13.3408203125, 13.927734375, 14.5146484375, 15.1015625, 15.6884765625, 16.275390625, 16.8623046875, 17.44921875, 18.0361328125, 18.623046875, 19.2099609375, 19.796875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 11.0, 9.0, 14.0, 14.0, 22.0, 33.0, 46.0, 72.0, 93.0, 172.0, 284.0, 496.0, 1062.0, 2749.0, 8864.0, 37198.0, 240681.0, 2298373.0, 1429062.0, 140039.0, 24588.0, 6297.0, 2115.0, 874.0, 429.0, 230.0, 163.0, 91.0, 61.0, 39.0, 23.0, 19.0, 12.0, 19.0, 7.0, 0.0, 10.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-30.984375, -30.12060546875, -29.2568359375, -28.39306640625, -27.529296875, -26.66552734375, -25.8017578125, -24.93798828125, -24.07421875, -23.21044921875, -22.3466796875, -21.48291015625, -20.619140625, -19.75537109375, -18.8916015625, -18.02783203125, -17.1640625, -16.30029296875, -15.4365234375, -14.57275390625, -13.708984375, -12.84521484375, -11.9814453125, -11.11767578125, -10.25390625, -9.39013671875, -8.5263671875, -7.66259765625, -6.798828125, -5.93505859375, -5.0712890625, -4.20751953125, -3.34375, -2.47998046875, -1.6162109375, -0.75244140625, 0.111328125, 0.97509765625, 1.8388671875, 2.70263671875, 3.56640625, 4.43017578125, 5.2939453125, 6.15771484375, 7.021484375, 7.88525390625, 8.7490234375, 9.61279296875, 10.4765625, 11.34033203125, 12.2041015625, 13.06787109375, 13.931640625, 14.79541015625, 15.6591796875, 16.52294921875, 17.38671875, 18.25048828125, 19.1142578125, 19.97802734375, 20.841796875, 21.70556640625, 22.5693359375, 23.43310546875, 24.296875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 11.0, 178.0, 538.0, 259.0, 26.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.17774200439453, -114.42102813720703, -103.66431427001953, -92.90760040283203, -82.15088653564453, -71.39417266845703, -60.63745880126953, -49.88074493408203, -39.12403106689453, -28.36731719970703, -17.61060333251953, -6.853889465332031, 3.9028244018554688, 14.659538269042969, 25.41625213623047, 36.17296600341797, 46.92967987060547, 57.68639373779297, 68.44310760498047, 79.19982147216797, 89.95653533935547, 100.71324920654297, 111.46996307373047, 122.22667694091797, 132.9833984375, 143.7401123046875, 154.496826171875, 165.2535400390625, 176.01025390625, 186.7669677734375, 197.523681640625, 208.2803955078125, 219.037109375, 229.7938232421875, 240.550537109375, 251.3072509765625, 262.06396484375, 272.8206787109375, 283.577392578125, 294.3341064453125, 305.0908203125, 315.8475341796875, 326.604248046875, 337.3609619140625, 348.11767578125, 358.8743896484375, 369.631103515625, 380.3878173828125, 391.14453125, 401.9012451171875, 412.657958984375, 423.4146728515625, 434.17138671875, 444.9281005859375, 455.684814453125, 466.4415283203125, 477.1982421875, 487.9549560546875, 498.711669921875, 509.4683837890625, 520.22509765625, 530.9818115234375, 541.738525390625, 552.4952392578125, 563.251953125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 9.0, 8.0, 14.0, 7.0, 12.0, 18.0, 24.0, 22.0, 29.0, 24.0, 21.0, 25.0, 40.0, 55.0, 43.0, 42.0, 31.0, 42.0, 43.0, 47.0, 36.0, 33.0, 44.0, 34.0, 42.0, 35.0, 31.0, 27.0, 20.0, 20.0, 27.0, 18.0, 14.0, 14.0, 10.0, 5.0, 7.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.1490364074707, -54.22444152832031, -52.299842834472656, -50.375247955322266, -48.45064926147461, -46.52605438232422, -44.60145568847656, -42.67686080932617, -40.75226593017578, -38.82767105102539, -36.903072357177734, -34.978477478027344, -33.05387878417969, -31.129283905029297, -29.204687118530273, -27.28009033203125, -25.355491638183594, -23.43089485168457, -21.506298065185547, -19.581703186035156, -17.6571044921875, -15.732508659362793, -13.807912826538086, -11.883316040039062, -9.958719253540039, -8.034122467041016, -6.10952615737915, -4.184929847717285, -2.2603330612182617, -0.3357362747192383, 1.5888595581054688, 3.513456344604492, 5.43804931640625, 7.362646102905273, 9.287242889404297, 11.211838722229004, 13.136435508728027, 15.06103229522705, 16.985628128051758, 18.91022491455078, 20.834821701049805, 22.759418487548828, 24.68401527404785, 26.608612060546875, 28.533206939697266, 30.457805633544922, 32.38240051269531, 34.30699920654297, 36.23159408569336, 38.15618896484375, 40.080787658691406, 42.0053825378418, 43.92998123168945, 45.854576110839844, 47.7791748046875, 49.70376968383789, 51.62836456298828, 53.55295944213867, 55.47755813598633, 57.40215301513672, 59.326751708984375, 61.251346588134766, 63.175941467285156, 65.10054016113281, 67.02513885498047]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 7.0, 7.0, 9.0, 12.0, 12.0, 10.0, 19.0, 9.0, 15.0, 17.0, 25.0, 17.0, 21.0, 30.0, 27.0, 28.0, 39.0, 37.0, 44.0, 47.0, 42.0, 35.0, 40.0, 36.0, 51.0, 28.0, 33.0, 29.0, 42.0, 28.0, 27.0, 24.0, 19.0, 20.0, 27.0, 12.0, 16.0, 9.0, 14.0, 8.0, 6.0, 5.0, 6.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-12.0546875, -11.6754150390625, -11.296142578125, -10.9168701171875, -10.53759765625, -10.1583251953125, -9.779052734375, -9.3997802734375, -9.0205078125, -8.6412353515625, -8.261962890625, -7.8826904296875, -7.50341796875, -7.1241455078125, -6.744873046875, -6.3656005859375, -5.986328125, -5.6070556640625, -5.227783203125, -4.8485107421875, -4.46923828125, -4.0899658203125, -3.710693359375, -3.3314208984375, -2.9521484375, -2.5728759765625, -2.193603515625, -1.8143310546875, -1.43505859375, -1.0557861328125, -0.676513671875, -0.2972412109375, 0.08203125, 0.4613037109375, 0.840576171875, 1.2198486328125, 1.59912109375, 1.9783935546875, 2.357666015625, 2.7369384765625, 3.1162109375, 3.4954833984375, 3.874755859375, 4.2540283203125, 4.63330078125, 5.0125732421875, 5.391845703125, 5.7711181640625, 6.150390625, 6.5296630859375, 6.908935546875, 7.2882080078125, 7.66748046875, 8.0467529296875, 8.426025390625, 8.8052978515625, 9.1845703125, 9.5638427734375, 9.943115234375, 10.3223876953125, 10.70166015625, 11.0809326171875, 11.460205078125, 11.8394775390625, 12.21875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 14.0, 8.0, 7.0, 22.0, 28.0, 53.0, 68.0, 84.0, 161.0, 195.0, 303.0, 424.0, 603.0, 932.0, 1279.0, 1892.0, 2617.0, 3949.0, 5604.0, 8073.0, 11732.0, 17144.0, 26184.0, 40700.0, 66046.0, 121540.0, 302263.0, 190521.0, 91385.0, 53194.0, 33039.0, 21622.0, 14361.0, 9994.0, 6831.0, 4878.0, 3337.0, 2342.0, 1641.0, 1108.0, 741.0, 536.0, 335.0, 257.0, 149.0, 117.0, 82.0, 59.0, 32.0, 28.0, 19.0, 11.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-3.1015625, -3.00396728515625, -2.9063720703125, -2.80877685546875, -2.711181640625, -2.61358642578125, -2.5159912109375, -2.41839599609375, -2.32080078125, -2.22320556640625, -2.1256103515625, -2.02801513671875, -1.930419921875, -1.83282470703125, -1.7352294921875, -1.63763427734375, -1.5400390625, -1.44244384765625, -1.3448486328125, -1.24725341796875, -1.149658203125, -1.05206298828125, -0.9544677734375, -0.85687255859375, -0.75927734375, -0.66168212890625, -0.5640869140625, -0.46649169921875, -0.368896484375, -0.27130126953125, -0.1737060546875, -0.07611083984375, 0.021484375, 0.11907958984375, 0.2166748046875, 0.31427001953125, 0.411865234375, 0.50946044921875, 0.6070556640625, 0.70465087890625, 0.80224609375, 0.89984130859375, 0.9974365234375, 1.09503173828125, 1.192626953125, 1.29022216796875, 1.3878173828125, 1.48541259765625, 1.5830078125, 1.68060302734375, 1.7781982421875, 1.87579345703125, 1.973388671875, 2.07098388671875, 2.1685791015625, 2.26617431640625, 2.36376953125, 2.46136474609375, 2.5589599609375, 2.65655517578125, 2.754150390625, 2.85174560546875, 2.9493408203125, 3.04693603515625, 3.14453125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 5.0, 6.0, 4.0, 3.0, 10.0, 6.0, 8.0, 8.0, 12.0, 11.0, 19.0, 25.0, 16.0, 23.0, 18.0, 23.0, 32.0, 25.0, 41.0, 45.0, 46.0, 37.0, 36.0, 38.0, 36.0, 1054.0, 37.0, 35.0, 30.0, 29.0, 24.0, 31.0, 41.0, 40.0, 20.0, 24.0, 21.0, 12.0, 8.0, 19.0, 9.0, 6.0, 9.0, 12.0, 11.0, 6.0, 6.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.5703125, -7.334228515625, -7.09814453125, -6.862060546875, -6.6259765625, -6.389892578125, -6.15380859375, -5.917724609375, -5.681640625, -5.445556640625, -5.20947265625, -4.973388671875, -4.7373046875, -4.501220703125, -4.26513671875, -4.029052734375, -3.79296875, -3.556884765625, -3.32080078125, -3.084716796875, -2.8486328125, -2.612548828125, -2.37646484375, -2.140380859375, -1.904296875, -1.668212890625, -1.43212890625, -1.196044921875, -0.9599609375, -0.723876953125, -0.48779296875, -0.251708984375, -0.015625, 0.220458984375, 0.45654296875, 0.692626953125, 0.9287109375, 1.164794921875, 1.40087890625, 1.636962890625, 1.873046875, 2.109130859375, 2.34521484375, 2.581298828125, 2.8173828125, 3.053466796875, 3.28955078125, 3.525634765625, 3.76171875, 3.997802734375, 4.23388671875, 4.469970703125, 4.7060546875, 4.942138671875, 5.17822265625, 5.414306640625, 5.650390625, 5.886474609375, 6.12255859375, 6.358642578125, 6.5947265625, 6.830810546875, 7.06689453125, 7.302978515625, 7.5390625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 25.0, 26.0, 34.0, 56.0, 98.0, 138.0, 190.0, 283.0, 430.0, 590.0, 802.0, 1160.0, 1581.0, 2190.0, 2981.0, 4206.0, 6033.0, 8782.0, 12422.0, 18132.0, 27330.0, 40683.0, 62950.0, 100419.0, 191653.0, 1299109.0, 108980.0, 68348.0, 43975.0, 29235.0, 19490.0, 13370.0, 8925.0, 6501.0, 4590.0, 3304.0, 2318.0, 1661.0, 1190.0, 888.0, 622.0, 441.0, 314.0, 221.0, 153.0, 96.0, 87.0, 34.0, 20.0, 27.0, 10.0, 10.0, 6.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.8515625, -2.7626953125, -2.673828125, -2.5849609375, -2.49609375, -2.4072265625, -2.318359375, -2.2294921875, -2.140625, -2.0517578125, -1.962890625, -1.8740234375, -1.78515625, -1.6962890625, -1.607421875, -1.5185546875, -1.4296875, -1.3408203125, -1.251953125, -1.1630859375, -1.07421875, -0.9853515625, -0.896484375, -0.8076171875, -0.71875, -0.6298828125, -0.541015625, -0.4521484375, -0.36328125, -0.2744140625, -0.185546875, -0.0966796875, -0.0078125, 0.0810546875, 0.169921875, 0.2587890625, 0.34765625, 0.4365234375, 0.525390625, 0.6142578125, 0.703125, 0.7919921875, 0.880859375, 0.9697265625, 1.05859375, 1.1474609375, 1.236328125, 1.3251953125, 1.4140625, 1.5029296875, 1.591796875, 1.6806640625, 1.76953125, 1.8583984375, 1.947265625, 2.0361328125, 2.125, 2.2138671875, 2.302734375, 2.3916015625, 2.48046875, 2.5693359375, 2.658203125, 2.7470703125, 2.8359375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 10.0, 13.0, 13.0, 19.0, 20.0, 30.0, 58.0, 68.0, 117.0, 152.0, 119.0, 111.0, 65.0, 54.0, 45.0, 20.0, 23.0, 8.0, 11.0, 6.0, 10.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009703636169433594, -0.0009442195296287537, -0.000918075442314148, -0.0008919313549995422, -0.0008657872676849365, -0.0008396431803703308, -0.0008134990930557251, -0.0007873550057411194, -0.0007612109184265137, -0.000735066831111908, -0.0007089227437973022, -0.0006827786564826965, -0.0006566345691680908, -0.0006304904818534851, -0.0006043463945388794, -0.0005782023072242737, -0.000552058219909668, -0.0005259141325950623, -0.0004997700452804565, -0.00047362595796585083, -0.0004474818706512451, -0.0004213377833366394, -0.0003951936960220337, -0.000369049608707428, -0.00034290552139282227, -0.00031676143407821655, -0.00029061734676361084, -0.0002644732594490051, -0.00023832917213439941, -0.0002121850848197937, -0.000186040997505188, -0.00015989691019058228, -0.00013375282287597656, -0.00010760873556137085, -8.146464824676514e-05, -5.5320560932159424e-05, -2.917647361755371e-05, -3.032386302947998e-06, 2.3111701011657715e-05, 4.925578832626343e-05, 7.539987564086914e-05, 0.00010154396295547485, 0.00012768805027008057, 0.00015383213758468628, 0.000179976224899292, 0.0002061203122138977, 0.00023226439952850342, 0.00025840848684310913, 0.00028455257415771484, 0.00031069666147232056, 0.00033684074878692627, 0.000362984836101532, 0.0003891289234161377, 0.0004152730107307434, 0.0004414170980453491, 0.00046756118535995483, 0.0004937052726745605, 0.0005198493599891663, 0.000545993447303772, 0.0005721375346183777, 0.0005982816219329834, 0.0006244257092475891, 0.0006505697965621948, 0.0006767138838768005, 0.0007028579711914062]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 7.0, 3.0, 6.0, 4.0, 18.0, 15.0, 21.0, 20.0, 30.0, 34.0, 81.0, 144.0, 214.0, 418.0, 1402.0, 1031262.0, 13427.0, 681.0, 328.0, 171.0, 81.0, 51.0, 42.0, 30.0, 21.0, 16.0, 15.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01374053955078125, -0.01322638988494873, -0.012712240219116211, -0.012198090553283691, -0.011683940887451172, -0.011169791221618652, -0.010655641555786133, -0.010141491889953613, -0.009627342224121094, -0.009113192558288574, -0.008599042892456055, -0.008084893226623535, -0.007570743560791016, -0.007056593894958496, -0.0065424442291259766, -0.006028294563293457, -0.0055141448974609375, -0.004999995231628418, -0.0044858455657958984, -0.003971695899963379, -0.0034575462341308594, -0.00294339656829834, -0.0024292469024658203, -0.0019150972366333008, -0.0014009475708007812, -0.0008867979049682617, -0.0003726482391357422, 0.00014150142669677734, 0.0006556510925292969, 0.0011698007583618164, 0.001683950424194336, 0.0021981000900268555, 0.002712249755859375, 0.0032263994216918945, 0.003740549087524414, 0.004254698753356934, 0.004768848419189453, 0.005282998085021973, 0.005797147750854492, 0.006311297416687012, 0.006825447082519531, 0.007339596748352051, 0.00785374641418457, 0.00836789608001709, 0.00888204574584961, 0.009396195411682129, 0.009910345077514648, 0.010424494743347168, 0.010938644409179688, 0.011452794075012207, 0.011966943740844727, 0.012481093406677246, 0.012995243072509766, 0.013509392738342285, 0.014023542404174805, 0.014537692070007324, 0.015051841735839844, 0.015565991401672363, 0.016080141067504883, 0.016594290733337402, 0.017108440399169922, 0.01762259006500244, 0.01813673973083496, 0.01865088939666748, 0.0191650390625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 16.0, 50.0, 140.0, 303.0, 298.0, 161.0, 36.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008547219913452864, -0.0008295704610645771, -0.0008044189889915287, -0.0007792674587108195, -0.0007541159866377711, -0.0007289644563570619, -0.0007038129260763526, -0.0006786614540033042, -0.0006535099819302559, -0.0006283584516495466, -0.0006032069795764983, -0.000578055449295789, -0.0005529039772227407, -0.0005277524469420314, -0.0005026009166613221, -0.00047744944458827376, -0.0004522979143075645, -0.0004271464131306857, -0.0004019949119538069, -0.0003768433816730976, -0.00035169190960004926, -0.00032654037931934, -0.0003013888781424612, -0.00027623737696558237, -0.00025108587578870356, -0.00022593437461182475, -0.00020078287343494594, -0.0001756313577061519, -0.0001504798565292731, -0.00012532835535239428, -0.00010017683962360024, -7.502533844672143e-05, -4.9873837269842625e-05, -2.4722332454985008e-05, 4.291723598726094e-07, 2.5580680812709033e-05, 5.0732181989587843e-05, 7.588368316646665e-05, 0.00010103519889526069, 0.0001261867000721395, 0.0001513382012490183, 0.00017648970242589712, 0.00020164120360277593, 0.00022679271933156997, 0.000251944235060364, 0.00027709570713341236, 0.00030224723741412163, 0.00032739873859100044, 0.00035255023976787925, 0.00037770174094475806, 0.00040285324212163687, 0.00042800477240234613, 0.0004531562444753945, 0.00047830777475610375, 0.0005034592468291521, 0.0005286107771098614, 0.0005537623073905706, 0.0005789138376712799, 0.0006040653097443283, 0.0006292168400250375, 0.0006543683120980859, 0.0006795198423787951, 0.0007046713726595044, 0.0007298228447325528, 0.0007549743168056011]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 5.0, 4.0, 12.0, 14.0, 19.0, 15.0, 16.0, 27.0, 24.0, 31.0, 32.0, 35.0, 45.0, 40.0, 29.0, 47.0, 29.0, 29.0, 52.0, 57.0, 37.0, 46.0, 33.0, 41.0, 40.0, 26.0, 36.0, 26.0, 32.0, 17.0, 25.0, 11.0, 12.0, 13.0, 12.0, 8.0, 5.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003191232681274414, -0.00030984170734882355, -0.0003005601465702057, -0.00029127858579158783, -0.00028199702501296997, -0.0002727154642343521, -0.00026343390345573425, -0.0002541523426771164, -0.00024487078189849854, -0.00023558922111988068, -0.00022630766034126282, -0.00021702609956264496, -0.0002077445387840271, -0.00019846297800540924, -0.00018918141722679138, -0.00017989985644817352, -0.00017061829566955566, -0.0001613367348909378, -0.00015205517411231995, -0.0001427736133337021, -0.00013349205255508423, -0.00012421049177646637, -0.00011492893099784851, -0.00010564737021923065, -9.636580944061279e-05, -8.708424866199493e-05, -7.780268788337708e-05, -6.852112710475922e-05, -5.923956632614136e-05, -4.99580055475235e-05, -4.067644476890564e-05, -3.139488399028778e-05, -2.2113323211669922e-05, -1.2831762433052063e-05, -3.550201654434204e-06, 5.731359124183655e-06, 1.5012919902801514e-05, 2.4294480681419373e-05, 3.357604146003723e-05, 4.285760223865509e-05, 5.213916301727295e-05, 6.142072379589081e-05, 7.070228457450867e-05, 7.998384535312653e-05, 8.926540613174438e-05, 9.854696691036224e-05, 0.0001078285276889801, 0.00011711008846759796, 0.00012639164924621582, 0.00013567321002483368, 0.00014495477080345154, 0.0001542363315820694, 0.00016351789236068726, 0.00017279945313930511, 0.00018208101391792297, 0.00019136257469654083, 0.0002006441354751587, 0.00020992569625377655, 0.0002192072570323944, 0.00022848881781101227, 0.00023777037858963013, 0.000247051939368248, 0.00025633350014686584, 0.0002656150609254837, 0.00027489662170410156]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 7.0, 7.0, 9.0, 12.0, 12.0, 10.0, 19.0, 9.0, 15.0, 17.0, 25.0, 17.0, 21.0, 30.0, 27.0, 28.0, 39.0, 37.0, 44.0, 47.0, 42.0, 35.0, 40.0, 36.0, 51.0, 28.0, 33.0, 29.0, 42.0, 28.0, 27.0, 24.0, 19.0, 20.0, 27.0, 12.0, 16.0, 9.0, 14.0, 8.0, 6.0, 5.0, 6.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-12.0546875, -11.6754150390625, -11.296142578125, -10.9168701171875, -10.53759765625, -10.1583251953125, -9.779052734375, -9.3997802734375, -9.0205078125, -8.6412353515625, -8.261962890625, -7.8826904296875, -7.50341796875, -7.1241455078125, -6.744873046875, -6.3656005859375, -5.986328125, -5.6070556640625, -5.227783203125, -4.8485107421875, -4.46923828125, -4.0899658203125, -3.710693359375, -3.3314208984375, -2.9521484375, -2.5728759765625, -2.193603515625, -1.8143310546875, -1.43505859375, -1.0557861328125, -0.676513671875, -0.2972412109375, 0.08203125, 0.4613037109375, 0.840576171875, 1.2198486328125, 1.59912109375, 1.9783935546875, 2.357666015625, 2.7369384765625, 3.1162109375, 3.4954833984375, 3.874755859375, 4.2540283203125, 4.63330078125, 5.0125732421875, 5.391845703125, 5.7711181640625, 6.150390625, 6.5296630859375, 6.908935546875, 7.2882080078125, 7.66748046875, 8.0467529296875, 8.426025390625, 8.8052978515625, 9.1845703125, 9.5638427734375, 9.943115234375, 10.3223876953125, 10.70166015625, 11.0809326171875, 11.460205078125, 11.8394775390625, 12.21875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 12.0, 22.0, 16.0, 21.0, 34.0, 40.0, 64.0, 72.0, 105.0, 148.0, 192.0, 237.0, 358.0, 525.0, 800.0, 1353.0, 2511.0, 5719.0, 15060.0, 44479.0, 127636.0, 303592.0, 322192.0, 143678.0, 49390.0, 16851.0, 6259.0, 2911.0, 1534.0, 865.0, 518.0, 335.0, 274.0, 184.0, 118.0, 109.0, 89.0, 54.0, 51.0, 34.0, 31.0, 18.0, 12.0, 13.0, 10.0, 3.0, 9.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.640625, -16.13720703125, -15.6337890625, -15.13037109375, -14.626953125, -14.12353515625, -13.6201171875, -13.11669921875, -12.61328125, -12.10986328125, -11.6064453125, -11.10302734375, -10.599609375, -10.09619140625, -9.5927734375, -9.08935546875, -8.5859375, -8.08251953125, -7.5791015625, -7.07568359375, -6.572265625, -6.06884765625, -5.5654296875, -5.06201171875, -4.55859375, -4.05517578125, -3.5517578125, -3.04833984375, -2.544921875, -2.04150390625, -1.5380859375, -1.03466796875, -0.53125, -0.02783203125, 0.4755859375, 0.97900390625, 1.482421875, 1.98583984375, 2.4892578125, 2.99267578125, 3.49609375, 3.99951171875, 4.5029296875, 5.00634765625, 5.509765625, 6.01318359375, 6.5166015625, 7.02001953125, 7.5234375, 8.02685546875, 8.5302734375, 9.03369140625, 9.537109375, 10.04052734375, 10.5439453125, 11.04736328125, 11.55078125, 12.05419921875, 12.5576171875, 13.06103515625, 13.564453125, 14.06787109375, 14.5712890625, 15.07470703125, 15.578125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 15.0, 18.0, 20.0, 26.0, 25.0, 31.0, 33.0, 32.0, 61.0, 68.0, 78.0, 128.0, 307.0, 1432.0, 249.0, 131.0, 61.0, 35.0, 51.0, 40.0, 31.0, 35.0, 22.0, 20.0, 19.0, 11.0, 12.0, 9.0, 7.0, 12.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.875, -37.6357421875, -36.396484375, -35.1572265625, -33.91796875, -32.6787109375, -31.439453125, -30.2001953125, -28.9609375, -27.7216796875, -26.482421875, -25.2431640625, -24.00390625, -22.7646484375, -21.525390625, -20.2861328125, -19.046875, -17.8076171875, -16.568359375, -15.3291015625, -14.08984375, -12.8505859375, -11.611328125, -10.3720703125, -9.1328125, -7.8935546875, -6.654296875, -5.4150390625, -4.17578125, -2.9365234375, -1.697265625, -0.4580078125, 0.78125, 2.0205078125, 3.259765625, 4.4990234375, 5.73828125, 6.9775390625, 8.216796875, 9.4560546875, 10.6953125, 11.9345703125, 13.173828125, 14.4130859375, 15.65234375, 16.8916015625, 18.130859375, 19.3701171875, 20.609375, 21.8486328125, 23.087890625, 24.3271484375, 25.56640625, 26.8056640625, 28.044921875, 29.2841796875, 30.5234375, 31.7626953125, 33.001953125, 34.2412109375, 35.48046875, 36.7197265625, 37.958984375, 39.1982421875, 40.4375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 5.0, 7.0, 7.0, 9.0, 14.0, 16.0, 26.0, 24.0, 44.0, 71.0, 84.0, 124.0, 191.0, 330.0, 587.0, 1186.0, 12733.0, 2792290.0, 332074.0, 3729.0, 859.0, 451.0, 274.0, 179.0, 109.0, 77.0, 51.0, 43.0, 28.0, 13.0, 18.0, 9.0, 15.0, 3.0, 4.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-92.9375, -90.10546875, -87.2734375, -84.44140625, -81.609375, -78.77734375, -75.9453125, -73.11328125, -70.28125, -67.44921875, -64.6171875, -61.78515625, -58.953125, -56.12109375, -53.2890625, -50.45703125, -47.625, -44.79296875, -41.9609375, -39.12890625, -36.296875, -33.46484375, -30.6328125, -27.80078125, -24.96875, -22.13671875, -19.3046875, -16.47265625, -13.640625, -10.80859375, -7.9765625, -5.14453125, -2.3125, 0.51953125, 3.3515625, 6.18359375, 9.015625, 11.84765625, 14.6796875, 17.51171875, 20.34375, 23.17578125, 26.0078125, 28.83984375, 31.671875, 34.50390625, 37.3359375, 40.16796875, 43.0, 45.83203125, 48.6640625, 51.49609375, 54.328125, 57.16015625, 59.9921875, 62.82421875, 65.65625, 68.48828125, 71.3203125, 74.15234375, 76.984375, 79.81640625, 82.6484375, 85.48046875, 88.3125]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 12.0, 57.0, 163.0, 326.0, 281.0, 108.0, 45.0, 15.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.46192169189453, -36.72151184082031, -31.98110008239746, -27.24068832397461, -22.50027847290039, -17.759868621826172, -13.01945686340332, -8.279045104980469, -3.53863525390625, 1.2017755508422852, 5.94218635559082, 10.682597160339355, 15.42300796508789, 20.16341781616211, 24.90382957458496, 29.644241333007812, 34.38465118408203, 39.12506103515625, 43.86547088623047, 48.60588455200195, 53.34629440307617, 58.08670425415039, 62.827117919921875, 67.5675277709961, 72.30793762207031, 77.04834747314453, 81.78875732421875, 86.52916717529297, 91.26957702636719, 96.00999450683594, 100.75040435791016, 105.49081420898438, 110.23123168945312, 114.97164154052734, 119.71205139160156, 124.45246124267578, 129.19287109375, 133.93328857421875, 138.67369079589844, 143.4141082763672, 148.15451049804688, 152.89492797851562, 157.6353302001953, 162.37574768066406, 167.11614990234375, 171.8565673828125, 176.5969696044922, 181.33738708496094, 186.0778045654297, 190.81822204589844, 195.55862426757812, 200.29904174804688, 205.03944396972656, 209.7798614501953, 214.520263671875, 219.26068115234375, 224.0010986328125, 228.74151611328125, 233.48191833496094, 238.2223358154297, 242.96273803710938, 247.70315551757812, 252.4435577392578, 257.1839599609375, 261.92437744140625]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 6.0, 8.0, 4.0, 8.0, 10.0, 6.0, 17.0, 14.0, 18.0, 20.0, 21.0, 30.0, 34.0, 33.0, 34.0, 45.0, 36.0, 41.0, 45.0, 50.0, 37.0, 39.0, 35.0, 42.0, 51.0, 30.0, 36.0, 27.0, 30.0, 29.0, 28.0, 13.0, 25.0, 19.0, 12.0, 14.0, 13.0, 10.0, 8.0, 4.0, 2.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-76.55532836914062, -74.0134506225586, -71.47157287597656, -68.92969512939453, -66.3878173828125, -63.84593963623047, -61.30406188964844, -58.762184143066406, -56.220306396484375, -53.678428649902344, -51.13655090332031, -48.59467315673828, -46.05279541015625, -43.51091766357422, -40.96903991699219, -38.427162170410156, -35.885284423828125, -33.343406677246094, -30.801528930664062, -28.25965118408203, -25.7177734375, -23.17589569091797, -20.634017944335938, -18.092140197753906, -15.550262451171875, -13.008384704589844, -10.466506958007812, -7.924629211425781, -5.38275146484375, -2.8408737182617188, -0.2989959716796875, 2.2428817749023438, 4.784751892089844, 7.326629638671875, 9.868507385253906, 12.410385131835938, 14.952262878417969, 17.494140625, 20.03601837158203, 22.577896118164062, 25.119773864746094, 27.661651611328125, 30.203529357910156, 32.74540710449219, 35.28728485107422, 37.82916259765625, 40.37104034423828, 42.91291809082031, 45.454795837402344, 47.996673583984375, 50.538551330566406, 53.08042907714844, 55.62230682373047, 58.1641845703125, 60.70606231689453, 63.24794006347656, 65.7898178100586, 68.33169555664062, 70.87357330322266, 73.41545104980469, 75.95732879638672, 78.49920654296875, 81.04108428955078, 83.58296203613281, 86.12483978271484]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 11.0, 5.0, 11.0, 7.0, 12.0, 7.0, 16.0, 16.0, 28.0, 22.0, 23.0, 37.0, 24.0, 25.0, 32.0, 36.0, 47.0, 33.0, 44.0, 39.0, 45.0, 43.0, 26.0, 47.0, 28.0, 44.0, 33.0, 34.0, 38.0, 25.0, 24.0, 19.0, 20.0, 15.0, 22.0, 9.0, 8.0, 8.0, 7.0, 7.0, 5.0, 10.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-13.8359375, -13.4339599609375, -13.031982421875, -12.6300048828125, -12.22802734375, -11.8260498046875, -11.424072265625, -11.0220947265625, -10.6201171875, -10.2181396484375, -9.816162109375, -9.4141845703125, -9.01220703125, -8.6102294921875, -8.208251953125, -7.8062744140625, -7.404296875, -7.0023193359375, -6.600341796875, -6.1983642578125, -5.79638671875, -5.3944091796875, -4.992431640625, -4.5904541015625, -4.1884765625, -3.7864990234375, -3.384521484375, -2.9825439453125, -2.58056640625, -2.1785888671875, -1.776611328125, -1.3746337890625, -0.97265625, -0.5706787109375, -0.168701171875, 0.2332763671875, 0.63525390625, 1.0372314453125, 1.439208984375, 1.8411865234375, 2.2431640625, 2.6451416015625, 3.047119140625, 3.4490966796875, 3.85107421875, 4.2530517578125, 4.655029296875, 5.0570068359375, 5.458984375, 5.8609619140625, 6.262939453125, 6.6649169921875, 7.06689453125, 7.4688720703125, 7.870849609375, 8.2728271484375, 8.6748046875, 9.0767822265625, 9.478759765625, 9.8807373046875, 10.28271484375, 10.6846923828125, 11.086669921875, 11.4886474609375, 11.890625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 8.0, 0.0, 6.0, 8.0, 13.0, 10.0, 21.0, 12.0, 22.0, 22.0, 26.0, 45.0, 52.0, 56.0, 74.0, 118.0, 157.0, 196.0, 247.0, 319.0, 439.0, 1371.0, 2875796.0, 1312474.0, 1083.0, 350.0, 272.0, 252.0, 178.0, 139.0, 106.0, 81.0, 64.0, 44.0, 40.0, 34.0, 26.0, 25.0, 22.0, 13.0, 9.0, 10.0, 12.0, 6.0, 5.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-147.25, -142.78125, -138.3125, -133.84375, -129.375, -124.90625, -120.4375, -115.96875, -111.5, -107.03125, -102.5625, -98.09375, -93.625, -89.15625, -84.6875, -80.21875, -75.75, -71.28125, -66.8125, -62.34375, -57.875, -53.40625, -48.9375, -44.46875, -40.0, -35.53125, -31.0625, -26.59375, -22.125, -17.65625, -13.1875, -8.71875, -4.25, 0.21875, 4.6875, 9.15625, 13.625, 18.09375, 22.5625, 27.03125, 31.5, 35.96875, 40.4375, 44.90625, 49.375, 53.84375, 58.3125, 62.78125, 67.25, 71.71875, 76.1875, 80.65625, 85.125, 89.59375, 94.0625, 98.53125, 103.0, 107.46875, 111.9375, 116.40625, 120.875, 125.34375, 129.8125, 134.28125, 138.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 9.0, 9.0, 8.0, 15.0, 25.0, 27.0, 51.0, 47.0, 63.0, 80.0, 98.0, 151.0, 220.0, 272.0, 361.0, 479.0, 490.0, 409.0, 316.0, 265.0, 171.0, 120.0, 90.0, 78.0, 44.0, 32.0, 29.0, 24.0, 16.0, 10.0, 11.0, 6.0, 11.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.359375, -18.776123046875, -18.19287109375, -17.609619140625, -17.0263671875, -16.443115234375, -15.85986328125, -15.276611328125, -14.693359375, -14.110107421875, -13.52685546875, -12.943603515625, -12.3603515625, -11.777099609375, -11.19384765625, -10.610595703125, -10.02734375, -9.444091796875, -8.86083984375, -8.277587890625, -7.6943359375, -7.111083984375, -6.52783203125, -5.944580078125, -5.361328125, -4.778076171875, -4.19482421875, -3.611572265625, -3.0283203125, -2.445068359375, -1.86181640625, -1.278564453125, -0.6953125, -0.112060546875, 0.47119140625, 1.054443359375, 1.6376953125, 2.220947265625, 2.80419921875, 3.387451171875, 3.970703125, 4.553955078125, 5.13720703125, 5.720458984375, 6.3037109375, 6.886962890625, 7.47021484375, 8.053466796875, 8.63671875, 9.219970703125, 9.80322265625, 10.386474609375, 10.9697265625, 11.552978515625, 12.13623046875, 12.719482421875, 13.302734375, 13.885986328125, 14.46923828125, 15.052490234375, 15.6357421875, 16.218994140625, 16.80224609375, 17.385498046875, 17.96875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 6.0, 12.0, 17.0, 13.0, 20.0, 31.0, 24.0, 33.0, 35.0, 70.0, 103.0, 221.0, 676.0, 10775.0, 3691016.0, 487374.0, 2930.0, 433.0, 155.0, 85.0, 55.0, 39.0, 30.0, 22.0, 28.0, 12.0, 19.0, 10.0, 11.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.6875, -78.525390625, -75.36328125, -72.201171875, -69.0390625, -65.876953125, -62.71484375, -59.552734375, -56.390625, -53.228515625, -50.06640625, -46.904296875, -43.7421875, -40.580078125, -37.41796875, -34.255859375, -31.09375, -27.931640625, -24.76953125, -21.607421875, -18.4453125, -15.283203125, -12.12109375, -8.958984375, -5.796875, -2.634765625, 0.52734375, 3.689453125, 6.8515625, 10.013671875, 13.17578125, 16.337890625, 19.5, 22.662109375, 25.82421875, 28.986328125, 32.1484375, 35.310546875, 38.47265625, 41.634765625, 44.796875, 47.958984375, 51.12109375, 54.283203125, 57.4453125, 60.607421875, 63.76953125, 66.931640625, 70.09375, 73.255859375, 76.41796875, 79.580078125, 82.7421875, 85.904296875, 89.06640625, 92.228515625, 95.390625, 98.552734375, 101.71484375, 104.876953125, 108.0390625, 111.201171875, 114.36328125, 117.525390625, 120.6875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 77.0, 556.0, 353.0, 26.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-484.9032897949219, -472.0851745605469, -459.26708984375, -446.448974609375, -433.6308898925781, -420.8127746582031, -407.99468994140625, -395.17657470703125, -382.35845947265625, -369.54034423828125, -356.7222595214844, -343.9041442871094, -331.0860595703125, -318.2679443359375, -305.4498291015625, -292.6317443847656, -279.81365966796875, -266.99554443359375, -254.17745971679688, -241.35934448242188, -228.541259765625, -215.72314453125, -202.90504455566406, -190.08694458007812, -177.2688446044922, -164.45074462890625, -151.6326446533203, -138.81454467773438, -125.9964370727539, -113.17833709716797, -100.3602294921875, -87.54212951660156, -74.72406005859375, -61.90596008300781, -49.08785629272461, -36.269752502441406, -23.45165252685547, -10.633552551269531, 2.1845550537109375, 15.002655029296875, 27.820755004882812, 40.63885498046875, 53.45695877075195, 66.27506256103516, 79.0931625366211, 91.91126251220703, 104.7293701171875, 117.54747009277344, 130.36557006835938, 143.1836700439453, 156.00177001953125, 168.81988525390625, 181.63796997070312, 194.45608520507812, 207.27418518066406, 220.09228515625, 232.91038513183594, 245.72848510742188, 258.5466003417969, 271.36468505859375, 284.18280029296875, 297.0008850097656, 309.8190002441406, 322.6370849609375, 335.4552001953125]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 7.0, 2.0, 3.0, 13.0, 8.0, 20.0, 8.0, 21.0, 18.0, 21.0, 22.0, 22.0, 22.0, 30.0, 27.0, 26.0, 31.0, 42.0, 30.0, 29.0, 48.0, 47.0, 44.0, 40.0, 42.0, 31.0, 39.0, 22.0, 23.0, 32.0, 36.0, 32.0, 31.0, 21.0, 20.0, 20.0, 10.0, 10.0, 16.0, 10.0, 4.0, 9.0, 3.0, 4.0, 7.0, 2.0, 2.0, 2.0], "bins": [-78.47827911376953, -76.45101928710938, -74.42375183105469, -72.39649200439453, -70.36923217773438, -68.34196472167969, -66.31470489501953, -64.28744506835938, -62.26017761230469, -60.232913970947266, -58.20565414428711, -56.17839050292969, -54.151126861572266, -52.123863220214844, -50.09660339355469, -48.069339752197266, -46.04207992553711, -44.01481628417969, -41.98755645751953, -39.96029281616211, -37.93302917480469, -35.90576934814453, -33.87850570678711, -31.851242065429688, -29.8239803314209, -27.79671859741211, -25.769454956054688, -23.7421932220459, -21.71493148803711, -19.687667846679688, -17.6604061126709, -15.633143424987793, -13.605884552001953, -11.578621864318848, -9.551359176635742, -7.524097442626953, -5.496834754943848, -3.469572067260742, -1.4423103332519531, 0.5849523544311523, 2.612215042114258, 4.639477729797363, 6.6667399406433105, 8.694002151489258, 10.721264839172363, 12.748527526855469, 14.775789260864258, 16.803050994873047, 18.83031463623047, 20.857576370239258, 22.88484001159668, 24.91210174560547, 26.93936538696289, 28.96662712097168, 30.99388885498047, 33.02115249633789, 35.04841613769531, 37.075679779052734, 39.10293960571289, 41.13020324707031, 43.157466888427734, 45.184730529785156, 47.21199035644531, 49.239253997802734, 51.26651382446289]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 6.0, 11.0, 11.0, 8.0, 6.0, 13.0, 14.0, 15.0, 22.0, 21.0, 28.0, 30.0, 23.0, 29.0, 32.0, 28.0, 30.0, 29.0, 36.0, 38.0, 35.0, 39.0, 33.0, 30.0, 38.0, 40.0, 34.0, 32.0, 32.0, 28.0, 31.0, 19.0, 29.0, 20.0, 19.0, 11.0, 20.0, 13.0, 11.0, 8.0, 6.0, 8.0, 9.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.328125, -10.9697265625, -10.611328125, -10.2529296875, -9.89453125, -9.5361328125, -9.177734375, -8.8193359375, -8.4609375, -8.1025390625, -7.744140625, -7.3857421875, -7.02734375, -6.6689453125, -6.310546875, -5.9521484375, -5.59375, -5.2353515625, -4.876953125, -4.5185546875, -4.16015625, -3.8017578125, -3.443359375, -3.0849609375, -2.7265625, -2.3681640625, -2.009765625, -1.6513671875, -1.29296875, -0.9345703125, -0.576171875, -0.2177734375, 0.140625, 0.4990234375, 0.857421875, 1.2158203125, 1.57421875, 1.9326171875, 2.291015625, 2.6494140625, 3.0078125, 3.3662109375, 3.724609375, 4.0830078125, 4.44140625, 4.7998046875, 5.158203125, 5.5166015625, 5.875, 6.2333984375, 6.591796875, 6.9501953125, 7.30859375, 7.6669921875, 8.025390625, 8.3837890625, 8.7421875, 9.1005859375, 9.458984375, 9.8173828125, 10.17578125, 10.5341796875, 10.892578125, 11.2509765625, 11.609375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 14.0, 16.0, 24.0, 31.0, 39.0, 70.0, 117.0, 162.0, 263.0, 339.0, 554.0, 874.0, 1307.0, 1902.0, 2951.0, 4615.0, 6991.0, 11045.0, 17585.0, 28657.0, 47469.0, 83801.0, 169735.0, 344956.0, 140732.0, 72727.0, 41933.0, 25550.0, 15763.0, 9914.0, 6339.0, 4193.0, 2652.0, 1768.0, 1184.0, 770.0, 485.0, 336.0, 231.0, 151.0, 106.0, 56.0, 51.0, 31.0, 21.0, 11.0, 10.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.716796875, -3.602020263671875, -3.48724365234375, -3.372467041015625, -3.2576904296875, -3.142913818359375, -3.02813720703125, -2.913360595703125, -2.798583984375, -2.683807373046875, -2.56903076171875, -2.454254150390625, -2.3394775390625, -2.224700927734375, -2.10992431640625, -1.995147705078125, -1.88037109375, -1.765594482421875, -1.65081787109375, -1.536041259765625, -1.4212646484375, -1.306488037109375, -1.19171142578125, -1.076934814453125, -0.962158203125, -0.847381591796875, -0.73260498046875, -0.617828369140625, -0.5030517578125, -0.388275146484375, -0.27349853515625, -0.158721923828125, -0.0439453125, 0.070831298828125, 0.18560791015625, 0.300384521484375, 0.4151611328125, 0.529937744140625, 0.64471435546875, 0.759490966796875, 0.874267578125, 0.989044189453125, 1.10382080078125, 1.218597412109375, 1.3333740234375, 1.448150634765625, 1.56292724609375, 1.677703857421875, 1.79248046875, 1.907257080078125, 2.02203369140625, 2.136810302734375, 2.2515869140625, 2.366363525390625, 2.48114013671875, 2.595916748046875, 2.710693359375, 2.825469970703125, 2.94024658203125, 3.055023193359375, 3.1697998046875, 3.284576416015625, 3.39935302734375, 3.514129638671875, 3.62890625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 2.0, 6.0, 10.0, 12.0, 13.0, 10.0, 13.0, 21.0, 13.0, 22.0, 28.0, 29.0, 37.0, 33.0, 37.0, 43.0, 42.0, 37.0, 53.0, 1080.0, 35.0, 46.0, 40.0, 42.0, 29.0, 40.0, 26.0, 29.0, 33.0, 22.0, 12.0, 17.0, 21.0, 18.0, 21.0, 12.0, 9.0, 10.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.98046875, -7.71441650390625, -7.4483642578125, -7.18231201171875, -6.916259765625, -6.65020751953125, -6.3841552734375, -6.11810302734375, -5.85205078125, -5.58599853515625, -5.3199462890625, -5.05389404296875, -4.787841796875, -4.52178955078125, -4.2557373046875, -3.98968505859375, -3.7236328125, -3.45758056640625, -3.1915283203125, -2.92547607421875, -2.659423828125, -2.39337158203125, -2.1273193359375, -1.86126708984375, -1.59521484375, -1.32916259765625, -1.0631103515625, -0.79705810546875, -0.531005859375, -0.26495361328125, 0.0010986328125, 0.26715087890625, 0.533203125, 0.79925537109375, 1.0653076171875, 1.33135986328125, 1.597412109375, 1.86346435546875, 2.1295166015625, 2.39556884765625, 2.66162109375, 2.92767333984375, 3.1937255859375, 3.45977783203125, 3.725830078125, 3.99188232421875, 4.2579345703125, 4.52398681640625, 4.7900390625, 5.05609130859375, 5.3221435546875, 5.58819580078125, 5.854248046875, 6.12030029296875, 6.3863525390625, 6.65240478515625, 6.91845703125, 7.18450927734375, 7.4505615234375, 7.71661376953125, 7.982666015625, 8.24871826171875, 8.5147705078125, 8.78082275390625, 9.046875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 13.0, 22.0, 27.0, 28.0, 53.0, 67.0, 97.0, 162.0, 264.0, 342.0, 499.0, 829.0, 1226.0, 1789.0, 2683.0, 4076.0, 5908.0, 8746.0, 13354.0, 20787.0, 32095.0, 51054.0, 83677.0, 156857.0, 1377491.0, 130653.0, 74260.0, 45649.0, 29304.0, 18727.0, 11957.0, 7897.0, 5548.0, 3594.0, 2512.0, 1599.0, 1041.0, 712.0, 537.0, 333.0, 182.0, 149.0, 121.0, 81.0, 42.0, 34.0, 16.0, 13.0, 8.0, 8.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.080078125, -2.97869873046875, -2.8773193359375, -2.77593994140625, -2.674560546875, -2.57318115234375, -2.4718017578125, -2.37042236328125, -2.26904296875, -2.16766357421875, -2.0662841796875, -1.96490478515625, -1.863525390625, -1.76214599609375, -1.6607666015625, -1.55938720703125, -1.4580078125, -1.35662841796875, -1.2552490234375, -1.15386962890625, -1.052490234375, -0.95111083984375, -0.8497314453125, -0.74835205078125, -0.64697265625, -0.54559326171875, -0.4442138671875, -0.34283447265625, -0.241455078125, -0.14007568359375, -0.0386962890625, 0.06268310546875, 0.1640625, 0.26544189453125, 0.3668212890625, 0.46820068359375, 0.569580078125, 0.67095947265625, 0.7723388671875, 0.87371826171875, 0.97509765625, 1.07647705078125, 1.1778564453125, 1.27923583984375, 1.380615234375, 1.48199462890625, 1.5833740234375, 1.68475341796875, 1.7861328125, 1.88751220703125, 1.9888916015625, 2.09027099609375, 2.191650390625, 2.29302978515625, 2.3944091796875, 2.49578857421875, 2.59716796875, 2.69854736328125, 2.7999267578125, 2.90130615234375, 3.002685546875, 3.10406494140625, 3.2054443359375, 3.30682373046875, 3.408203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 11.0, 6.0, 9.0, 10.0, 7.0, 16.0, 12.0, 13.0, 17.0, 25.0, 35.0, 32.0, 32.0, 50.0, 47.0, 78.0, 73.0, 73.0, 63.0, 67.0, 67.0, 36.0, 53.0, 32.0, 21.0, 15.0, 21.0, 14.0, 8.0, 13.0, 13.0, 3.0, 7.0, 5.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0005106925964355469, -0.0004961714148521423, -0.0004816502332687378, -0.00046712905168533325, -0.0004526078701019287, -0.00043808668851852417, -0.00042356550693511963, -0.0004090443253517151, -0.00039452314376831055, -0.000380001962184906, -0.00036548078060150146, -0.0003509595990180969, -0.0003364384174346924, -0.00032191723585128784, -0.0003073960542678833, -0.00029287487268447876, -0.0002783536911010742, -0.0002638325095176697, -0.00024931132793426514, -0.0002347901463508606, -0.00022026896476745605, -0.00020574778318405151, -0.00019122660160064697, -0.00017670542001724243, -0.0001621842384338379, -0.00014766305685043335, -0.0001331418752670288, -0.00011862069368362427, -0.00010409951210021973, -8.957833051681519e-05, -7.505714893341064e-05, -6.0535967350006104e-05, -4.601478576660156e-05, -3.149360418319702e-05, -1.697242259979248e-05, -2.4512410163879395e-06, 1.2069940567016602e-05, 2.6591122150421143e-05, 4.1112303733825684e-05, 5.5633485317230225e-05, 7.015466690063477e-05, 8.46758484840393e-05, 9.919703006744385e-05, 0.00011371821165084839, 0.00012823939323425293, 0.00014276057481765747, 0.000157281756401062, 0.00017180293798446655, 0.0001863241195678711, 0.00020084530115127563, 0.00021536648273468018, 0.00022988766431808472, 0.00024440884590148926, 0.0002589300274848938, 0.00027345120906829834, 0.0002879723906517029, 0.0003024935722351074, 0.00031701475381851196, 0.0003315359354019165, 0.00034605711698532104, 0.0003605782985687256, 0.0003750994801521301, 0.00038962066173553467, 0.0004041418433189392, 0.00041866302490234375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 9.0, 10.0, 17.0, 17.0, 17.0, 33.0, 32.0, 49.0, 77.0, 110.0, 145.0, 219.0, 343.0, 601.0, 1453.0, 214910.0, 826468.0, 2148.0, 654.0, 374.0, 243.0, 153.0, 117.0, 67.0, 46.0, 51.0, 28.0, 27.0, 21.0, 21.0, 17.0, 13.0, 12.0, 14.0, 7.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00809478759765625, -0.007816672325134277, -0.007538557052612305, -0.007260441780090332, -0.006982326507568359, -0.006704211235046387, -0.006426095962524414, -0.006147980690002441, -0.005869865417480469, -0.005591750144958496, -0.0053136348724365234, -0.005035519599914551, -0.004757404327392578, -0.0044792890548706055, -0.004201173782348633, -0.00392305850982666, -0.0036449432373046875, -0.003366827964782715, -0.003088712692260742, -0.0028105974197387695, -0.002532482147216797, -0.0022543668746948242, -0.0019762516021728516, -0.001698136329650879, -0.0014200210571289062, -0.0011419057846069336, -0.0008637905120849609, -0.0005856752395629883, -0.0003075599670410156, -2.944469451904297e-05, 0.0002486705780029297, 0.0005267858505249023, 0.000804901123046875, 0.0010830163955688477, 0.0013611316680908203, 0.001639246940612793, 0.0019173622131347656, 0.0021954774856567383, 0.002473592758178711, 0.0027517080307006836, 0.0030298233032226562, 0.003307938575744629, 0.0035860538482666016, 0.0038641691207885742, 0.004142284393310547, 0.0044203996658325195, 0.004698514938354492, 0.004976630210876465, 0.0052547454833984375, 0.00553286075592041, 0.005810976028442383, 0.0060890913009643555, 0.006367206573486328, 0.006645321846008301, 0.0069234371185302734, 0.007201552391052246, 0.007479667663574219, 0.007757782936096191, 0.008035898208618164, 0.008314013481140137, 0.00859212875366211, 0.008870244026184082, 0.009148359298706055, 0.009426474571228027, 0.00970458984375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 22.0, 391.0, 540.0, 56.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022824176121503115, -0.002228217665106058, -0.0021740177180618048, -0.0021198177710175514, -0.0020656175911426544, -0.002011417644098401, -0.0019572176970541477, -0.0019030177500098944, -0.001848817802965641, -0.0017946178559213877, -0.0017404177924618125, -0.0016862178454175591, -0.0016320178983733058, -0.0015778178349137306, -0.0015236178878694773, -0.001469417940825224, -0.0014152178773656487, -0.0013610179303213954, -0.0013068178668618202, -0.0012526179198175669, -0.0011984179727733135, -0.0011442180257290602, -0.001090017962269485, -0.0010358180152252316, -0.0009816179517656565, -0.0009274179465137422, -0.0008732179994694889, -0.0008190179942175746, -0.0007648180471733212, -0.000710618041921407, -0.0006564180366694927, -0.0006022180896252394, -0.0005480180261656642, -0.0004938180209137499, -0.0004396180738694966, -0.0003854180686175823, -0.0003312180924694985, -0.0002770181163214147, -0.00022281811106950045, -0.00016861813492141664, -0.00011441815877333283, -6.0218175349291414e-05, -6.018191925249994e-06, 4.818179877474904e-05, 0.00010238177492283285, 0.00015658175107091665, 0.00021078175632283092, 0.0002649817324709147, 0.00031918170861899853, 0.00037338168476708233, 0.00042758166091516614, 0.0004817816661670804, 0.0005359816132113338, 0.000590181618463248, 0.0006443816237151623, 0.0006985815707594156, 0.0007527815760113299, 0.0008069815812632442, 0.0008611815283074975, 0.0009153815335594118, 0.000969581538811326, 0.0010237814858555794, 0.0010779814328998327, 0.001132181496359408, 0.0011863814434036613]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 4.0, 2.0, 3.0, 6.0, 9.0, 2.0, 9.0, 8.0, 11.0, 11.0, 12.0, 20.0, 19.0, 13.0, 25.0, 30.0, 26.0, 30.0, 35.0, 25.0, 29.0, 33.0, 39.0, 41.0, 38.0, 44.0, 44.0, 39.0, 36.0, 28.0, 38.0, 27.0, 41.0, 26.0, 27.0, 19.0, 24.0, 21.0, 13.0, 21.0, 11.0, 10.0, 3.0, 9.0, 11.0, 10.0, 7.0, 12.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019061565399169922, -0.00018392875790596008, -0.00017724186182022095, -0.0001705549657344818, -0.00016386806964874268, -0.00015718117356300354, -0.0001504942774772644, -0.00014380738139152527, -0.00013712048530578613, -0.000130433589220047, -0.00012374669313430786, -0.00011705979704856873, -0.00011037290096282959, -0.00010368600487709045, -9.699910879135132e-05, -9.031221270561218e-05, -8.362531661987305e-05, -7.693842053413391e-05, -7.025152444839478e-05, -6.356462836265564e-05, -5.6877732276916504e-05, -5.019083619117737e-05, -4.350394010543823e-05, -3.68170440196991e-05, -3.013014793395996e-05, -2.3443251848220825e-05, -1.675635576248169e-05, -1.0069459676742554e-05, -3.382563591003418e-06, 3.3043324947357178e-06, 9.991228580474854e-06, 1.667812466621399e-05, 2.3365020751953125e-05, 3.005191683769226e-05, 3.6738812923431396e-05, 4.342570900917053e-05, 5.011260509490967e-05, 5.6799501180648804e-05, 6.348639726638794e-05, 7.017329335212708e-05, 7.686018943786621e-05, 8.354708552360535e-05, 9.023398160934448e-05, 9.692087769508362e-05, 0.00010360777378082275, 0.00011029466986656189, 0.00011698156595230103, 0.00012366846203804016, 0.0001303553581237793, 0.00013704225420951843, 0.00014372915029525757, 0.0001504160463809967, 0.00015710294246673584, 0.00016378983855247498, 0.0001704767346382141, 0.00017716363072395325, 0.00018385052680969238, 0.00019053742289543152, 0.00019722431898117065, 0.0002039112150669098, 0.00021059811115264893, 0.00021728500723838806, 0.0002239719033241272, 0.00023065879940986633, 0.00023734569549560547]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 6.0, 11.0, 11.0, 8.0, 6.0, 13.0, 14.0, 15.0, 22.0, 21.0, 28.0, 30.0, 23.0, 29.0, 32.0, 28.0, 30.0, 29.0, 36.0, 38.0, 36.0, 38.0, 33.0, 30.0, 38.0, 40.0, 34.0, 32.0, 32.0, 28.0, 31.0, 19.0, 29.0, 20.0, 19.0, 11.0, 20.0, 13.0, 11.0, 8.0, 6.0, 8.0, 9.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.328125, -10.9697265625, -10.611328125, -10.2529296875, -9.89453125, -9.5361328125, -9.177734375, -8.8193359375, -8.4609375, -8.1025390625, -7.744140625, -7.3857421875, -7.02734375, -6.6689453125, -6.310546875, -5.9521484375, -5.59375, -5.2353515625, -4.876953125, -4.5185546875, -4.16015625, -3.8017578125, -3.443359375, -3.0849609375, -2.7265625, -2.3681640625, -2.009765625, -1.6513671875, -1.29296875, -0.9345703125, -0.576171875, -0.2177734375, 0.140625, 0.4990234375, 0.857421875, 1.2158203125, 1.57421875, 1.9326171875, 2.291015625, 2.6494140625, 3.0078125, 3.3662109375, 3.724609375, 4.0830078125, 4.44140625, 4.7998046875, 5.158203125, 5.5166015625, 5.875, 6.2333984375, 6.591796875, 6.9501953125, 7.30859375, 7.6669921875, 8.025390625, 8.3837890625, 8.7421875, 9.1005859375, 9.458984375, 9.8173828125, 10.17578125, 10.5341796875, 10.892578125, 11.2509765625, 11.609375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 8.0, 5.0, 6.0, 6.0, 6.0, 16.0, 24.0, 30.0, 40.0, 57.0, 52.0, 65.0, 83.0, 120.0, 167.0, 197.0, 259.0, 312.0, 405.0, 546.0, 688.0, 949.0, 1379.0, 2331.0, 5334.0, 20094.0, 96969.0, 394622.0, 393268.0, 97130.0, 20237.0, 5393.0, 2310.0, 1332.0, 992.0, 718.0, 507.0, 420.0, 336.0, 248.0, 217.0, 172.0, 106.0, 82.0, 64.0, 57.0, 51.0, 37.0, 38.0, 24.0, 9.0, 10.0, 7.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0], "bins": [-21.953125, -21.26708984375, -20.5810546875, -19.89501953125, -19.208984375, -18.52294921875, -17.8369140625, -17.15087890625, -16.46484375, -15.77880859375, -15.0927734375, -14.40673828125, -13.720703125, -13.03466796875, -12.3486328125, -11.66259765625, -10.9765625, -10.29052734375, -9.6044921875, -8.91845703125, -8.232421875, -7.54638671875, -6.8603515625, -6.17431640625, -5.48828125, -4.80224609375, -4.1162109375, -3.43017578125, -2.744140625, -2.05810546875, -1.3720703125, -0.68603515625, 0.0, 0.68603515625, 1.3720703125, 2.05810546875, 2.744140625, 3.43017578125, 4.1162109375, 4.80224609375, 5.48828125, 6.17431640625, 6.8603515625, 7.54638671875, 8.232421875, 8.91845703125, 9.6044921875, 10.29052734375, 10.9765625, 11.66259765625, 12.3486328125, 13.03466796875, 13.720703125, 14.40673828125, 15.0927734375, 15.77880859375, 16.46484375, 17.15087890625, 17.8369140625, 18.52294921875, 19.208984375, 19.89501953125, 20.5810546875, 21.26708984375, 21.953125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 8.0, 6.0, 4.0, 7.0, 18.0, 11.0, 16.0, 16.0, 19.0, 26.0, 28.0, 38.0, 52.0, 32.0, 48.0, 63.0, 88.0, 182.0, 1421.0, 364.0, 143.0, 82.0, 58.0, 55.0, 60.0, 26.0, 35.0, 26.0, 22.0, 24.0, 25.0, 9.0, 9.0, 8.0, 3.0, 7.0, 3.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.5, -39.370361328125, -38.24072265625, -37.111083984375, -35.9814453125, -34.851806640625, -33.72216796875, -32.592529296875, -31.462890625, -30.333251953125, -29.20361328125, -28.073974609375, -26.9443359375, -25.814697265625, -24.68505859375, -23.555419921875, -22.42578125, -21.296142578125, -20.16650390625, -19.036865234375, -17.9072265625, -16.777587890625, -15.64794921875, -14.518310546875, -13.388671875, -12.259033203125, -11.12939453125, -9.999755859375, -8.8701171875, -7.740478515625, -6.61083984375, -5.481201171875, -4.3515625, -3.221923828125, -2.09228515625, -0.962646484375, 0.1669921875, 1.296630859375, 2.42626953125, 3.555908203125, 4.685546875, 5.815185546875, 6.94482421875, 8.074462890625, 9.2041015625, 10.333740234375, 11.46337890625, 12.593017578125, 13.72265625, 14.852294921875, 15.98193359375, 17.111572265625, 18.2412109375, 19.370849609375, 20.50048828125, 21.630126953125, 22.759765625, 23.889404296875, 25.01904296875, 26.148681640625, 27.2783203125, 28.407958984375, 29.53759765625, 30.667236328125, 31.796875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 10.0, 10.0, 8.0, 16.0, 13.0, 15.0, 19.0, 28.0, 36.0, 38.0, 61.0, 92.0, 131.0, 201.0, 309.0, 498.0, 1009.0, 3408.0, 3119106.0, 17467.0, 1477.0, 630.0, 341.0, 204.0, 160.0, 101.0, 77.0, 49.0, 49.0, 22.0, 25.0, 16.0, 13.0, 9.0, 11.0, 10.0, 10.0, 6.0, 6.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-161.25, -156.314453125, -151.37890625, -146.443359375, -141.5078125, -136.572265625, -131.63671875, -126.701171875, -121.765625, -116.830078125, -111.89453125, -106.958984375, -102.0234375, -97.087890625, -92.15234375, -87.216796875, -82.28125, -77.345703125, -72.41015625, -67.474609375, -62.5390625, -57.603515625, -52.66796875, -47.732421875, -42.796875, -37.861328125, -32.92578125, -27.990234375, -23.0546875, -18.119140625, -13.18359375, -8.248046875, -3.3125, 1.623046875, 6.55859375, 11.494140625, 16.4296875, 21.365234375, 26.30078125, 31.236328125, 36.171875, 41.107421875, 46.04296875, 50.978515625, 55.9140625, 60.849609375, 65.78515625, 70.720703125, 75.65625, 80.591796875, 85.52734375, 90.462890625, 95.3984375, 100.333984375, 105.26953125, 110.205078125, 115.140625, 120.076171875, 125.01171875, 129.947265625, 134.8828125, 139.818359375, 144.75390625, 149.689453125, 154.625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 13.0, 45.0, 126.0, 244.0, 291.0, 196.0, 53.0, 32.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.0416259765625, -178.5869598388672, -174.1322784423828, -169.6776123046875, -165.2229461669922, -160.7682647705078, -156.3135986328125, -151.8589324951172, -147.4042510986328, -142.9495849609375, -138.49490356445312, -134.0402374267578, -129.5855712890625, -125.13088989257812, -120.67622375488281, -116.22154998779297, -111.76688385009766, -107.31221008300781, -102.8575439453125, -98.40287017822266, -93.94819641113281, -89.4935302734375, -85.03885650634766, -80.58418273925781, -76.1295166015625, -71.67484283447266, -67.22017669677734, -62.7655029296875, -58.310829162597656, -53.85615921020508, -49.4014892578125, -44.946815490722656, -40.492149353027344, -36.037479400634766, -31.582805633544922, -27.128135681152344, -22.673463821411133, -18.218791961669922, -13.764122009277344, -9.309450149536133, -4.854778289794922, -0.40010690689086914, 4.054564476013184, 8.509235382080078, 12.963907241821289, 17.4185791015625, 21.873249053955078, 26.32792091369629, 30.7825927734375, 35.23726272583008, 39.69193649291992, 44.1466064453125, 48.601280212402344, 53.05595016479492, 57.5106201171875, 61.965293884277344, 66.41996765136719, 70.87464141845703, 75.32930755615234, 79.78398132324219, 84.23865509033203, 88.69332885742188, 93.14799499511719, 97.60266876220703, 102.05733489990234]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 6.0, 10.0, 15.0, 11.0, 22.0, 11.0, 15.0, 23.0, 33.0, 28.0, 34.0, 29.0, 38.0, 48.0, 30.0, 39.0, 48.0, 43.0, 39.0, 48.0, 40.0, 39.0, 40.0, 30.0, 31.0, 39.0, 28.0, 22.0, 19.0, 21.0, 11.0, 14.0, 9.0, 15.0, 7.0, 11.0, 10.0, 5.0, 9.0, 4.0, 4.0, 3.0, 0.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-83.04354858398438, -80.30003356933594, -77.5565185546875, -74.8130111694336, -72.06949615478516, -69.32598114013672, -66.58247375488281, -63.838958740234375, -61.09544372558594, -58.3519287109375, -55.60841751098633, -52.864906311035156, -50.12139129638672, -47.37787628173828, -44.63436508178711, -41.89085388183594, -39.1473388671875, -36.40382385253906, -33.66031265258789, -30.916799545288086, -28.17328643798828, -25.429773330688477, -22.686260223388672, -19.942747116088867, -17.199234008789062, -14.455720901489258, -11.712207794189453, -8.968694686889648, -6.225181579589844, -3.481668472290039, -0.7381553649902344, 2.0053577423095703, 4.748870849609375, 7.49238395690918, 10.235897064208984, 12.979410171508789, 15.722923278808594, 18.4664363861084, 21.209949493408203, 23.953462600708008, 26.696975708007812, 29.440488815307617, 32.18400192260742, 34.927513122558594, 37.67102813720703, 40.41454315185547, 43.15805435180664, 45.90156555175781, 48.64508056640625, 51.38859558105469, 54.13210678100586, 56.87561798095703, 59.61913299560547, 62.362648010253906, 65.10615539550781, 67.84967041015625, 70.59318542480469, 73.33670043945312, 76.08021545410156, 78.82372283935547, 81.5672378540039, 84.31075286865234, 87.05426025390625, 89.79777526855469, 92.54129028320312]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 10.0, 8.0, 8.0, 11.0, 15.0, 20.0, 20.0, 20.0, 19.0, 32.0, 25.0, 32.0, 22.0, 23.0, 24.0, 39.0, 35.0, 34.0, 37.0, 38.0, 35.0, 44.0, 32.0, 33.0, 34.0, 28.0, 30.0, 25.0, 30.0, 19.0, 24.0, 29.0, 21.0, 19.0, 13.0, 12.0, 13.0, 7.0, 8.0, 9.0, 3.0, 9.0, 8.0, 13.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.7890625, -10.452392578125, -10.11572265625, -9.779052734375, -9.4423828125, -9.105712890625, -8.76904296875, -8.432373046875, -8.095703125, -7.759033203125, -7.42236328125, -7.085693359375, -6.7490234375, -6.412353515625, -6.07568359375, -5.739013671875, -5.40234375, -5.065673828125, -4.72900390625, -4.392333984375, -4.0556640625, -3.718994140625, -3.38232421875, -3.045654296875, -2.708984375, -2.372314453125, -2.03564453125, -1.698974609375, -1.3623046875, -1.025634765625, -0.68896484375, -0.352294921875, -0.015625, 0.321044921875, 0.65771484375, 0.994384765625, 1.3310546875, 1.667724609375, 2.00439453125, 2.341064453125, 2.677734375, 3.014404296875, 3.35107421875, 3.687744140625, 4.0244140625, 4.361083984375, 4.69775390625, 5.034423828125, 5.37109375, 5.707763671875, 6.04443359375, 6.381103515625, 6.7177734375, 7.054443359375, 7.39111328125, 7.727783203125, 8.064453125, 8.401123046875, 8.73779296875, 9.074462890625, 9.4111328125, 9.747802734375, 10.08447265625, 10.421142578125, 10.7578125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 10.0, 11.0, 22.0, 23.0, 39.0, 62.0, 102.0, 167.0, 299.0, 563.0, 1242.0, 3545.0, 15234.0, 180481.0, 2101764.0, 1741333.0, 131735.0, 12494.0, 2868.0, 1117.0, 518.0, 263.0, 146.0, 88.0, 58.0, 35.0, 20.0, 20.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.71875, -30.725830078125, -29.73291015625, -28.739990234375, -27.7470703125, -26.754150390625, -25.76123046875, -24.768310546875, -23.775390625, -22.782470703125, -21.78955078125, -20.796630859375, -19.8037109375, -18.810791015625, -17.81787109375, -16.824951171875, -15.83203125, -14.839111328125, -13.84619140625, -12.853271484375, -11.8603515625, -10.867431640625, -9.87451171875, -8.881591796875, -7.888671875, -6.895751953125, -5.90283203125, -4.909912109375, -3.9169921875, -2.924072265625, -1.93115234375, -0.938232421875, 0.0546875, 1.047607421875, 2.04052734375, 3.033447265625, 4.0263671875, 5.019287109375, 6.01220703125, 7.005126953125, 7.998046875, 8.990966796875, 9.98388671875, 10.976806640625, 11.9697265625, 12.962646484375, 13.95556640625, 14.948486328125, 15.94140625, 16.934326171875, 17.92724609375, 18.920166015625, 19.9130859375, 20.906005859375, 21.89892578125, 22.891845703125, 23.884765625, 24.877685546875, 25.87060546875, 26.863525390625, 27.8564453125, 28.849365234375, 29.84228515625, 30.835205078125, 31.828125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 10.0, 6.0, 10.0, 13.0, 17.0, 22.0, 27.0, 43.0, 41.0, 72.0, 83.0, 110.0, 118.0, 183.0, 195.0, 260.0, 323.0, 380.0, 446.0, 368.0, 284.0, 237.0, 163.0, 127.0, 125.0, 85.0, 65.0, 48.0, 39.0, 44.0, 27.0, 22.0, 18.0, 11.0, 13.0, 14.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.495361328125, -15.91259765625, -15.329833984375, -14.7470703125, -14.164306640625, -13.58154296875, -12.998779296875, -12.416015625, -11.833251953125, -11.25048828125, -10.667724609375, -10.0849609375, -9.502197265625, -8.91943359375, -8.336669921875, -7.75390625, -7.171142578125, -6.58837890625, -6.005615234375, -5.4228515625, -4.840087890625, -4.25732421875, -3.674560546875, -3.091796875, -2.509033203125, -1.92626953125, -1.343505859375, -0.7607421875, -0.177978515625, 0.40478515625, 0.987548828125, 1.5703125, 2.153076171875, 2.73583984375, 3.318603515625, 3.9013671875, 4.484130859375, 5.06689453125, 5.649658203125, 6.232421875, 6.815185546875, 7.39794921875, 7.980712890625, 8.5634765625, 9.146240234375, 9.72900390625, 10.311767578125, 10.89453125, 11.477294921875, 12.06005859375, 12.642822265625, 13.2255859375, 13.808349609375, 14.39111328125, 14.973876953125, 15.556640625, 16.139404296875, 16.72216796875, 17.304931640625, 17.8876953125, 18.470458984375, 19.05322265625, 19.635986328125, 20.21875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 10.0, 9.0, 15.0, 38.0, 66.0, 75.0, 166.0, 309.0, 586.0, 1221.0, 2891.0, 14435.0, 460884.0, 3577866.0, 124204.0, 7354.0, 2184.0, 979.0, 453.0, 228.0, 124.0, 86.0, 41.0, 20.0, 14.0, 14.0, 5.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.375, -58.71337890625, -57.0517578125, -55.39013671875, -53.728515625, -52.06689453125, -50.4052734375, -48.74365234375, -47.08203125, -45.42041015625, -43.7587890625, -42.09716796875, -40.435546875, -38.77392578125, -37.1123046875, -35.45068359375, -33.7890625, -32.12744140625, -30.4658203125, -28.80419921875, -27.142578125, -25.48095703125, -23.8193359375, -22.15771484375, -20.49609375, -18.83447265625, -17.1728515625, -15.51123046875, -13.849609375, -12.18798828125, -10.5263671875, -8.86474609375, -7.203125, -5.54150390625, -3.8798828125, -2.21826171875, -0.556640625, 1.10498046875, 2.7666015625, 4.42822265625, 6.08984375, 7.75146484375, 9.4130859375, 11.07470703125, 12.736328125, 14.39794921875, 16.0595703125, 17.72119140625, 19.3828125, 21.04443359375, 22.7060546875, 24.36767578125, 26.029296875, 27.69091796875, 29.3525390625, 31.01416015625, 32.67578125, 34.33740234375, 35.9990234375, 37.66064453125, 39.322265625, 40.98388671875, 42.6455078125, 44.30712890625, 45.96875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 13.0, 105.0, 508.0, 322.0, 58.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.77920532226562, -183.43270874023438, -171.08621215820312, -158.73971557617188, -146.39321899414062, -134.04672241210938, -121.70024108886719, -109.35374450683594, -97.00724792480469, -84.66075134277344, -72.31425476074219, -59.96776580810547, -47.62126922607422, -35.27477264404297, -22.92828369140625, -10.581787109375, 1.76470947265625, 14.111204147338867, 26.457698822021484, 38.80419158935547, 51.15068817138672, 63.49718475341797, 75.84367370605469, 88.19017028808594, 100.53666687011719, 112.88316345214844, 125.22966003417969, 137.57614135742188, 149.92263793945312, 162.26913452148438, 174.61563110351562, 186.96212768554688, 199.30865478515625, 211.6551513671875, 224.00164794921875, 236.34814453125, 248.69464111328125, 261.0411376953125, 273.38763427734375, 285.734130859375, 298.08062744140625, 310.4271240234375, 322.77362060546875, 335.1201171875, 347.46661376953125, 359.8131103515625, 372.15960693359375, 384.506103515625, 396.8525695800781, 409.1990661621094, 421.5455627441406, 433.8920593261719, 446.2385559082031, 458.5850524902344, 470.9315185546875, 483.27801513671875, 495.62451171875, 507.97100830078125, 520.3175048828125, 532.6640014648438, 545.010498046875, 557.3569946289062, 569.7034912109375, 582.0499877929688, 594.396484375]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 4.0, 7.0, 6.0, 6.0, 7.0, 5.0, 11.0, 11.0, 10.0, 16.0, 16.0, 17.0, 17.0, 23.0, 28.0, 33.0, 28.0, 27.0, 54.0, 35.0, 36.0, 28.0, 45.0, 39.0, 40.0, 28.0, 26.0, 33.0, 48.0, 36.0, 28.0, 18.0, 28.0, 22.0, 28.0, 18.0, 20.0, 19.0, 16.0, 19.0, 10.0, 12.0, 9.0, 6.0, 9.0, 7.0, 6.0, 6.0, 0.0, 3.0, 2.0, 4.0, 3.0], "bins": [-84.19775390625, -81.83589172363281, -79.47402954101562, -77.11216735839844, -74.75030517578125, -72.38844299316406, -70.02658081054688, -67.66472625732422, -65.30286407470703, -62.941001892089844, -60.579139709472656, -58.21727752685547, -55.85541915893555, -53.49355697631836, -51.13169479370117, -48.76983642578125, -46.4079704284668, -44.04610824584961, -41.68424606323242, -39.3223876953125, -36.96052551269531, -34.598663330078125, -32.23680114746094, -29.874940872192383, -27.513078689575195, -25.151216506958008, -22.789356231689453, -20.427494049072266, -18.065631866455078, -15.703771591186523, -13.341909408569336, -10.980049133300781, -8.618186950683594, -6.256325721740723, -3.8944640159606934, -1.532602310180664, 0.829258918762207, 3.191120147705078, 5.552982330322266, 7.91484260559082, 10.276704788208008, 12.638566017150879, 15.00042724609375, 17.362289428710938, 19.724151611328125, 22.08601188659668, 24.447874069213867, 26.809734344482422, 29.17159652709961, 31.533458709716797, 33.895320892333984, 36.257179260253906, 38.619041442871094, 40.98090362548828, 43.34276580810547, 45.704627990722656, 48.066490173339844, 50.42835235595703, 52.79021453857422, 55.152076721191406, 57.51393508911133, 59.875797271728516, 62.2376594543457, 64.59951782226562, 66.96138000488281]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 6.0, 4.0, 9.0, 10.0, 15.0, 19.0, 18.0, 17.0, 24.0, 27.0, 31.0, 22.0, 40.0, 43.0, 44.0, 47.0, 55.0, 43.0, 55.0, 53.0, 40.0, 40.0, 53.0, 39.0, 33.0, 39.0, 33.0, 30.0, 21.0, 22.0, 18.0, 10.0, 11.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6875, -9.3426513671875, -8.997802734375, -8.6529541015625, -8.30810546875, -7.9632568359375, -7.618408203125, -7.2735595703125, -6.9287109375, -6.5838623046875, -6.239013671875, -5.8941650390625, -5.54931640625, -5.2044677734375, -4.859619140625, -4.5147705078125, -4.169921875, -3.8250732421875, -3.480224609375, -3.1353759765625, -2.79052734375, -2.4456787109375, -2.100830078125, -1.7559814453125, -1.4111328125, -1.0662841796875, -0.721435546875, -0.3765869140625, -0.03173828125, 0.3131103515625, 0.657958984375, 1.0028076171875, 1.34765625, 1.6925048828125, 2.037353515625, 2.3822021484375, 2.72705078125, 3.0718994140625, 3.416748046875, 3.7615966796875, 4.1064453125, 4.4512939453125, 4.796142578125, 5.1409912109375, 5.48583984375, 5.8306884765625, 6.175537109375, 6.5203857421875, 6.865234375, 7.2100830078125, 7.554931640625, 7.8997802734375, 8.24462890625, 8.5894775390625, 8.934326171875, 9.2791748046875, 9.6240234375, 9.9688720703125, 10.313720703125, 10.6585693359375, 11.00341796875, 11.3482666015625, 11.693115234375, 12.0379638671875, 12.3828125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 11.0, 7.0, 13.0, 40.0, 36.0, 58.0, 98.0, 143.0, 200.0, 329.0, 492.0, 843.0, 1432.0, 2307.0, 3965.0, 6899.0, 11931.0, 21226.0, 37914.0, 71019.0, 148408.0, 392547.0, 172599.0, 79198.0, 41886.0, 23386.0, 13126.0, 7491.0, 4418.0, 2532.0, 1548.0, 918.0, 564.0, 323.0, 200.0, 168.0, 84.0, 78.0, 36.0, 27.0, 13.0, 13.0, 7.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.939453125, -2.83660888671875, -2.7337646484375, -2.63092041015625, -2.528076171875, -2.42523193359375, -2.3223876953125, -2.21954345703125, -2.11669921875, -2.01385498046875, -1.9110107421875, -1.80816650390625, -1.705322265625, -1.60247802734375, -1.4996337890625, -1.39678955078125, -1.2939453125, -1.19110107421875, -1.0882568359375, -0.98541259765625, -0.882568359375, -0.77972412109375, -0.6768798828125, -0.57403564453125, -0.47119140625, -0.36834716796875, -0.2655029296875, -0.16265869140625, -0.059814453125, 0.04302978515625, 0.1458740234375, 0.24871826171875, 0.3515625, 0.45440673828125, 0.5572509765625, 0.66009521484375, 0.762939453125, 0.86578369140625, 0.9686279296875, 1.07147216796875, 1.17431640625, 1.27716064453125, 1.3800048828125, 1.48284912109375, 1.585693359375, 1.68853759765625, 1.7913818359375, 1.89422607421875, 1.9970703125, 2.09991455078125, 2.2027587890625, 2.30560302734375, 2.408447265625, 2.51129150390625, 2.6141357421875, 2.71697998046875, 2.81982421875, 2.92266845703125, 3.0255126953125, 3.12835693359375, 3.231201171875, 3.33404541015625, 3.4368896484375, 3.53973388671875, 3.642578125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 1.0, 3.0, 10.0, 12.0, 13.0, 15.0, 17.0, 17.0, 26.0, 19.0, 29.0, 27.0, 25.0, 46.0, 43.0, 32.0, 40.0, 33.0, 40.0, 1055.0, 44.0, 38.0, 31.0, 39.0, 51.0, 36.0, 35.0, 26.0, 34.0, 23.0, 26.0, 29.0, 23.0, 16.0, 13.0, 11.0, 8.0, 5.0, 9.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.484375, -6.29254150390625, -6.1007080078125, -5.90887451171875, -5.717041015625, -5.52520751953125, -5.3333740234375, -5.14154052734375, -4.94970703125, -4.75787353515625, -4.5660400390625, -4.37420654296875, -4.182373046875, -3.99053955078125, -3.7987060546875, -3.60687255859375, -3.4150390625, -3.22320556640625, -3.0313720703125, -2.83953857421875, -2.647705078125, -2.45587158203125, -2.2640380859375, -2.07220458984375, -1.88037109375, -1.68853759765625, -1.4967041015625, -1.30487060546875, -1.113037109375, -0.92120361328125, -0.7293701171875, -0.53753662109375, -0.345703125, -0.15386962890625, 0.0379638671875, 0.22979736328125, 0.421630859375, 0.61346435546875, 0.8052978515625, 0.99713134765625, 1.18896484375, 1.38079833984375, 1.5726318359375, 1.76446533203125, 1.956298828125, 2.14813232421875, 2.3399658203125, 2.53179931640625, 2.7236328125, 2.91546630859375, 3.1072998046875, 3.29913330078125, 3.490966796875, 3.68280029296875, 3.8746337890625, 4.06646728515625, 4.25830078125, 4.45013427734375, 4.6419677734375, 4.83380126953125, 5.025634765625, 5.21746826171875, 5.4093017578125, 5.60113525390625, 5.79296875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 10.0, 15.0, 23.0, 29.0, 49.0, 71.0, 115.0, 163.0, 236.0, 342.0, 531.0, 801.0, 1169.0, 1681.0, 2477.0, 3773.0, 5829.0, 8648.0, 12786.0, 19801.0, 30794.0, 49210.0, 77923.0, 129132.0, 1344212.0, 158202.0, 90254.0, 56674.0, 35842.0, 22323.0, 14748.0, 9822.0, 6441.0, 4235.0, 2842.0, 1990.0, 1259.0, 878.0, 607.0, 390.0, 282.0, 189.0, 98.0, 91.0, 48.0, 28.0, 32.0, 15.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0], "bins": [-2.4453125, -2.372650146484375, -2.29998779296875, -2.227325439453125, -2.1546630859375, -2.082000732421875, -2.00933837890625, -1.936676025390625, -1.864013671875, -1.791351318359375, -1.71868896484375, -1.646026611328125, -1.5733642578125, -1.500701904296875, -1.42803955078125, -1.355377197265625, -1.28271484375, -1.210052490234375, -1.13739013671875, -1.064727783203125, -0.9920654296875, -0.919403076171875, -0.84674072265625, -0.774078369140625, -0.701416015625, -0.628753662109375, -0.55609130859375, -0.483428955078125, -0.4107666015625, -0.338104248046875, -0.26544189453125, -0.192779541015625, -0.1201171875, -0.047454833984375, 0.02520751953125, 0.097869873046875, 0.1705322265625, 0.243194580078125, 0.31585693359375, 0.388519287109375, 0.461181640625, 0.533843994140625, 0.60650634765625, 0.679168701171875, 0.7518310546875, 0.824493408203125, 0.89715576171875, 0.969818115234375, 1.04248046875, 1.115142822265625, 1.18780517578125, 1.260467529296875, 1.3331298828125, 1.405792236328125, 1.47845458984375, 1.551116943359375, 1.623779296875, 1.696441650390625, 1.76910400390625, 1.841766357421875, 1.9144287109375, 1.987091064453125, 2.05975341796875, 2.132415771484375, 2.205078125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 5.0, 5.0, 12.0, 14.0, 12.0, 24.0, 37.0, 40.0, 49.0, 62.0, 93.0, 83.0, 79.0, 82.0, 71.0, 55.0, 58.0, 40.0, 31.0, 19.0, 18.0, 14.0, 14.0, 12.0, 9.0, 10.0, 4.0, 6.0, 4.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003509521484375, -0.0003390386700630188, -0.0003271251916885376, -0.0003152117133140564, -0.0003032982349395752, -0.000291384756565094, -0.0002794712781906128, -0.0002675577998161316, -0.0002556443214416504, -0.0002437308430671692, -0.000231817364692688, -0.0002199038863182068, -0.00020799040794372559, -0.00019607692956924438, -0.00018416345119476318, -0.00017224997282028198, -0.00016033649444580078, -0.00014842301607131958, -0.00013650953769683838, -0.00012459605932235718, -0.00011268258094787598, -0.00010076910257339478, -8.885562419891357e-05, -7.694214582443237e-05, -6.502866744995117e-05, -5.311518907546997e-05, -4.120171070098877e-05, -2.928823232650757e-05, -1.7374753952026367e-05, -5.461275577545166e-06, 6.452202796936035e-06, 1.8365681171417236e-05, 3.0279159545898438e-05, 4.219263792037964e-05, 5.410611629486084e-05, 6.601959466934204e-05, 7.793307304382324e-05, 8.984655141830444e-05, 0.00010176002979278564, 0.00011367350816726685, 0.00012558698654174805, 0.00013750046491622925, 0.00014941394329071045, 0.00016132742166519165, 0.00017324090003967285, 0.00018515437841415405, 0.00019706785678863525, 0.00020898133516311646, 0.00022089481353759766, 0.00023280829191207886, 0.00024472177028656006, 0.00025663524866104126, 0.00026854872703552246, 0.00028046220541000366, 0.00029237568378448486, 0.00030428916215896606, 0.00031620264053344727, 0.00032811611890792847, 0.00034002959728240967, 0.00035194307565689087, 0.00036385655403137207, 0.00037577003240585327, 0.00038768351078033447, 0.0003995969891548157, 0.0004115104675292969]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 12.0, 7.0, 6.0, 12.0, 19.0, 12.0, 24.0, 35.0, 34.0, 44.0, 47.0, 67.0, 110.0, 179.0, 300.0, 435.0, 952.0, 16965.0, 1016227.0, 10887.0, 909.0, 419.0, 236.0, 182.0, 124.0, 87.0, 51.0, 35.0, 24.0, 15.0, 16.0, 19.0, 11.0, 8.0, 2.0, 3.0, 4.0, 7.0, 6.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00719451904296875, -0.006979525089263916, -0.006764531135559082, -0.006549537181854248, -0.006334543228149414, -0.00611954927444458, -0.005904555320739746, -0.005689561367034912, -0.005474567413330078, -0.005259573459625244, -0.00504457950592041, -0.004829585552215576, -0.004614591598510742, -0.004399597644805908, -0.004184603691101074, -0.00396960973739624, -0.0037546157836914062, -0.0035396218299865723, -0.0033246278762817383, -0.0031096339225769043, -0.0028946399688720703, -0.0026796460151672363, -0.0024646520614624023, -0.0022496581077575684, -0.0020346641540527344, -0.0018196702003479004, -0.0016046762466430664, -0.0013896822929382324, -0.0011746883392333984, -0.0009596943855285645, -0.0007447004318237305, -0.0005297064781188965, -0.0003147125244140625, -9.971857070922852e-05, 0.00011527538299560547, 0.00033026933670043945, 0.0005452632904052734, 0.0007602572441101074, 0.0009752511978149414, 0.0011902451515197754, 0.0014052391052246094, 0.0016202330589294434, 0.0018352270126342773, 0.0020502209663391113, 0.0022652149200439453, 0.0024802088737487793, 0.0026952028274536133, 0.0029101967811584473, 0.0031251907348632812, 0.0033401846885681152, 0.0035551786422729492, 0.003770172595977783, 0.003985166549682617, 0.004200160503387451, 0.004415154457092285, 0.004630148410797119, 0.004845142364501953, 0.005060136318206787, 0.005275130271911621, 0.005490124225616455, 0.005705118179321289, 0.005920112133026123, 0.006135106086730957, 0.006350100040435791, 0.006565093994140625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 68.0, 617.0, 311.0, 17.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023424976971000433, -0.002295452170073986, -0.002248406410217285, -0.002201360883191228, -0.002154315123334527, -0.0021072695963084698, -0.002060223836451769, -0.0020131783094257116, -0.0019661325495690107, -0.0019190869061276317, -0.0018720412626862526, -0.0018249956192448735, -0.0017779499758034945, -0.0017309044487774372, -0.0016838586889207363, -0.001636813161894679, -0.0015897676348686218, -0.0015427219914272428, -0.0014956763479858637, -0.0014486307045444846, -0.0014015850611031055, -0.0013545395340770483, -0.0013074937742203474, -0.0012604482471942902, -0.0012134024873375893, -0.0011663568438962102, -0.0011193112004548311, -0.001072265557013452, -0.001025219913572073, -0.0009781743865460157, -0.0009311286848969758, -0.0008840830996632576, -0.0008370374562218785, -0.0007899918127804995, -0.0007429461693391204, -0.0006959005258977413, -0.0006488549406640232, -0.0006018092972226441, -0.000554763653781265, -0.0005077180685475469, -0.00046067239600233734, -0.00041362675256095827, -0.00036658113822340965, -0.0003195354947820306, -0.0002724898513406515, -0.0002254442370031029, -0.00017839859356172383, -0.00013135297922417521, -8.430733578279614e-05, -3.7261703255353495e-05, 9.783929272089154e-06, 5.682956543751061e-05, 0.00010387519432697445, 0.0001509208232164383, 0.00019796646665781736, 0.000245012080995366, 0.00029205772443674505, 0.0003391033678781241, 0.00038614898221567273, 0.0004331946256570518, 0.00048024026909843087, 0.000527285854332149, 0.0005743314977735281, 0.0006213771412149072, 0.0006684227846562862]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 4.0, 7.0, 9.0, 15.0, 14.0, 18.0, 24.0, 18.0, 21.0, 27.0, 23.0, 24.0, 32.0, 33.0, 41.0, 35.0, 54.0, 44.0, 46.0, 55.0, 45.0, 36.0, 34.0, 31.0, 30.0, 35.0, 39.0, 21.0, 22.0, 23.0, 24.0, 15.0, 18.0, 13.0, 10.0, 14.0, 9.0, 8.0, 4.0, 0.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0001773834228515625, -0.00017187371850013733, -0.00016636401414871216, -0.000160854309797287, -0.00015534460544586182, -0.00014983490109443665, -0.00014432519674301147, -0.0001388154923915863, -0.00013330578804016113, -0.00012779608368873596, -0.0001222863793373108, -0.00011677667498588562, -0.00011126697063446045, -0.00010575726628303528, -0.00010024756193161011, -9.473785758018494e-05, -8.922815322875977e-05, -8.37184488773346e-05, -7.820874452590942e-05, -7.269904017448425e-05, -6.718933582305908e-05, -6.167963147163391e-05, -5.616992712020874e-05, -5.066022276878357e-05, -4.51505184173584e-05, -3.964081406593323e-05, -3.413110971450806e-05, -2.8621405363082886e-05, -2.3111701011657715e-05, -1.7601996660232544e-05, -1.2092292308807373e-05, -6.582587957382202e-06, -1.0728836059570312e-06, 4.43682074546814e-06, 9.94652509689331e-06, 1.545622944831848e-05, 2.0965933799743652e-05, 2.6475638151168823e-05, 3.1985342502593994e-05, 3.7495046854019165e-05, 4.3004751205444336e-05, 4.851445555686951e-05, 5.402415990829468e-05, 5.953386425971985e-05, 6.504356861114502e-05, 7.055327296257019e-05, 7.606297731399536e-05, 8.157268166542053e-05, 8.70823860168457e-05, 9.259209036827087e-05, 9.810179471969604e-05, 0.00010361149907112122, 0.00010912120342254639, 0.00011463090777397156, 0.00012014061212539673, 0.0001256503164768219, 0.00013116002082824707, 0.00013666972517967224, 0.0001421794295310974, 0.00014768913388252258, 0.00015319883823394775, 0.00015870854258537292, 0.0001642182469367981, 0.00016972795128822327, 0.00017523765563964844]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 6.0, 4.0, 9.0, 10.0, 15.0, 19.0, 18.0, 17.0, 24.0, 27.0, 31.0, 22.0, 40.0, 43.0, 44.0, 47.0, 55.0, 43.0, 55.0, 53.0, 40.0, 40.0, 53.0, 39.0, 33.0, 39.0, 33.0, 30.0, 21.0, 22.0, 18.0, 10.0, 11.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6875, -9.3426513671875, -8.997802734375, -8.6529541015625, -8.30810546875, -7.9632568359375, -7.618408203125, -7.2735595703125, -6.9287109375, -6.5838623046875, -6.239013671875, -5.8941650390625, -5.54931640625, -5.2044677734375, -4.859619140625, -4.5147705078125, -4.169921875, -3.8250732421875, -3.480224609375, -3.1353759765625, -2.79052734375, -2.4456787109375, -2.100830078125, -1.7559814453125, -1.4111328125, -1.0662841796875, -0.721435546875, -0.3765869140625, -0.03173828125, 0.3131103515625, 0.657958984375, 1.0028076171875, 1.34765625, 1.6925048828125, 2.037353515625, 2.3822021484375, 2.72705078125, 3.0718994140625, 3.416748046875, 3.7615966796875, 4.1064453125, 4.4512939453125, 4.796142578125, 5.1409912109375, 5.48583984375, 5.8306884765625, 6.175537109375, 6.5203857421875, 6.865234375, 7.2100830078125, 7.554931640625, 7.8997802734375, 8.24462890625, 8.5894775390625, 8.934326171875, 9.2791748046875, 9.6240234375, 9.9688720703125, 10.313720703125, 10.6585693359375, 11.00341796875, 11.3482666015625, 11.693115234375, 12.0379638671875, 12.3828125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 10.0, 9.0, 10.0, 28.0, 47.0, 61.0, 68.0, 105.0, 145.0, 196.0, 270.0, 372.0, 537.0, 717.0, 1018.0, 1484.0, 2250.0, 3770.0, 9547.0, 66880.0, 622291.0, 294413.0, 28865.0, 6110.0, 2940.0, 1972.0, 1271.0, 914.0, 619.0, 470.0, 329.0, 243.0, 155.0, 121.0, 97.0, 62.0, 54.0, 33.0, 27.0, 18.0, 10.0, 10.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.84375, -26.968505859375, -26.09326171875, -25.218017578125, -24.3427734375, -23.467529296875, -22.59228515625, -21.717041015625, -20.841796875, -19.966552734375, -19.09130859375, -18.216064453125, -17.3408203125, -16.465576171875, -15.59033203125, -14.715087890625, -13.83984375, -12.964599609375, -12.08935546875, -11.214111328125, -10.3388671875, -9.463623046875, -8.58837890625, -7.713134765625, -6.837890625, -5.962646484375, -5.08740234375, -4.212158203125, -3.3369140625, -2.461669921875, -1.58642578125, -0.711181640625, 0.1640625, 1.039306640625, 1.91455078125, 2.789794921875, 3.6650390625, 4.540283203125, 5.41552734375, 6.290771484375, 7.166015625, 8.041259765625, 8.91650390625, 9.791748046875, 10.6669921875, 11.542236328125, 12.41748046875, 13.292724609375, 14.16796875, 15.043212890625, 15.91845703125, 16.793701171875, 17.6689453125, 18.544189453125, 19.41943359375, 20.294677734375, 21.169921875, 22.045166015625, 22.92041015625, 23.795654296875, 24.6708984375, 25.546142578125, 26.42138671875, 27.296630859375, 28.171875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 7.0, 7.0, 18.0, 12.0, 11.0, 13.0, 14.0, 13.0, 32.0, 24.0, 32.0, 40.0, 36.0, 41.0, 64.0, 78.0, 127.0, 202.0, 1398.0, 238.0, 139.0, 109.0, 67.0, 51.0, 36.0, 31.0, 27.0, 31.0, 20.0, 14.0, 14.0, 15.0, 9.0, 8.0, 9.0, 9.0, 12.0, 11.0, 5.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.96875, -21.25, -20.53125, -19.8125, -19.09375, -18.375, -17.65625, -16.9375, -16.21875, -15.5, -14.78125, -14.0625, -13.34375, -12.625, -11.90625, -11.1875, -10.46875, -9.75, -9.03125, -8.3125, -7.59375, -6.875, -6.15625, -5.4375, -4.71875, -4.0, -3.28125, -2.5625, -1.84375, -1.125, -0.40625, 0.3125, 1.03125, 1.75, 2.46875, 3.1875, 3.90625, 4.625, 5.34375, 6.0625, 6.78125, 7.5, 8.21875, 8.9375, 9.65625, 10.375, 11.09375, 11.8125, 12.53125, 13.25, 13.96875, 14.6875, 15.40625, 16.125, 16.84375, 17.5625, 18.28125, 19.0, 19.71875, 20.4375, 21.15625, 21.875, 22.59375, 23.3125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 8.0, 7.0, 10.0, 18.0, 20.0, 18.0, 26.0, 27.0, 48.0, 51.0, 82.0, 92.0, 126.0, 201.0, 314.0, 598.0, 1172.0, 2594.0, 40897.0, 3087255.0, 7966.0, 1870.0, 875.0, 460.0, 260.0, 186.0, 139.0, 83.0, 70.0, 38.0, 28.0, 38.0, 21.0, 11.0, 7.0, 11.0, 13.0, 12.0, 11.0, 7.0, 5.0, 6.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0], "bins": [-102.0625, -99.1728515625, -96.283203125, -93.3935546875, -90.50390625, -87.6142578125, -84.724609375, -81.8349609375, -78.9453125, -76.0556640625, -73.166015625, -70.2763671875, -67.38671875, -64.4970703125, -61.607421875, -58.7177734375, -55.828125, -52.9384765625, -50.048828125, -47.1591796875, -44.26953125, -41.3798828125, -38.490234375, -35.6005859375, -32.7109375, -29.8212890625, -26.931640625, -24.0419921875, -21.15234375, -18.2626953125, -15.373046875, -12.4833984375, -9.59375, -6.7041015625, -3.814453125, -0.9248046875, 1.96484375, 4.8544921875, 7.744140625, 10.6337890625, 13.5234375, 16.4130859375, 19.302734375, 22.1923828125, 25.08203125, 27.9716796875, 30.861328125, 33.7509765625, 36.640625, 39.5302734375, 42.419921875, 45.3095703125, 48.19921875, 51.0888671875, 53.978515625, 56.8681640625, 59.7578125, 62.6474609375, 65.537109375, 68.4267578125, 71.31640625, 74.2060546875, 77.095703125, 79.9853515625, 82.875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 30.0, 116.0, 209.0, 334.0, 201.0, 88.0, 18.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-296.62420654296875, -290.95709228515625, -285.2899475097656, -279.6228332519531, -273.9557189941406, -268.28857421875, -262.6214599609375, -256.954345703125, -251.28721618652344, -245.62008666992188, -239.95297241210938, -234.2858428955078, -228.61871337890625, -222.95159912109375, -217.2844696044922, -211.61734008789062, -205.95022583007812, -200.28309631347656, -194.61598205566406, -188.9488525390625, -183.28173828125, -177.61460876464844, -171.94747924804688, -166.28036499023438, -160.6132354736328, -154.94610595703125, -149.27899169921875, -143.6118621826172, -137.94473266601562, -132.27761840820312, -126.61048889160156, -120.94336700439453, -115.27623748779297, -109.60911560058594, -103.94198608398438, -98.27486419677734, -92.60774230957031, -86.94062042236328, -81.27349853515625, -75.60636901855469, -69.93924713134766, -64.27212524414062, -58.60499954223633, -52.93787384033203, -47.270751953125, -41.60363006591797, -35.93650436401367, -30.269378662109375, -24.602256774902344, -18.93513298034668, -13.268009185791016, -7.600885391235352, -1.9337615966796875, 3.7333621978759766, 9.40048599243164, 15.067611694335938, 20.73473358154297, 26.401857376098633, 32.0689811706543, 37.736106872558594, 43.403228759765625, 49.070350646972656, 54.73747634887695, 60.40460205078125, 66.07172393798828]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 9.0, 5.0, 9.0, 7.0, 7.0, 16.0, 12.0, 18.0, 19.0, 26.0, 17.0, 21.0, 32.0, 22.0, 32.0, 34.0, 40.0, 49.0, 32.0, 34.0, 29.0, 41.0, 45.0, 38.0, 44.0, 33.0, 49.0, 39.0, 35.0, 23.0, 31.0, 23.0, 17.0, 16.0, 19.0, 10.0, 9.0, 9.0, 13.0, 5.0, 4.0, 4.0, 5.0, 11.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-67.85401153564453, -65.82284545898438, -63.791683197021484, -61.76051712036133, -59.72935104370117, -57.69818878173828, -55.667022705078125, -53.63585662841797, -51.60469055175781, -49.573524475097656, -47.542362213134766, -45.51119613647461, -43.48003005981445, -41.44886779785156, -39.417701721191406, -37.38653564453125, -35.35537338256836, -33.3242073059082, -31.29304313659668, -29.261878967285156, -27.230712890625, -25.199548721313477, -23.168384552001953, -21.137218475341797, -19.106054306030273, -17.07489013671875, -15.043724060058594, -13.01255989074707, -10.98139476776123, -8.95022964477539, -6.919065475463867, -4.887900352478027, -2.856739044189453, -0.8255741596221924, 1.2055907249450684, 3.23675537109375, 5.26792049407959, 7.29908561706543, 9.330249786376953, 11.361414909362793, 13.392580032348633, 15.423745155334473, 17.454910278320312, 19.486074447631836, 21.51723861694336, 23.548404693603516, 25.57956886291504, 27.610733032226562, 29.64189910888672, 31.673063278198242, 33.704227447509766, 35.73539352416992, 37.76655960083008, 39.79772186279297, 41.828887939453125, 43.86005401611328, 45.89122009277344, 47.922386169433594, 49.953548431396484, 51.98471450805664, 54.0158805847168, 56.04704284667969, 58.078208923339844, 60.109375, 62.14053726196289]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 16.0, 10.0, 11.0, 14.0, 23.0, 16.0, 19.0, 26.0, 37.0, 37.0, 42.0, 42.0, 36.0, 62.0, 51.0, 55.0, 61.0, 54.0, 46.0, 46.0, 40.0, 29.0, 29.0, 35.0, 44.0, 14.0, 15.0, 11.0, 16.0, 11.0, 8.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9296875, -10.568115234375, -10.20654296875, -9.844970703125, -9.4833984375, -9.121826171875, -8.76025390625, -8.398681640625, -8.037109375, -7.675537109375, -7.31396484375, -6.952392578125, -6.5908203125, -6.229248046875, -5.86767578125, -5.506103515625, -5.14453125, -4.782958984375, -4.42138671875, -4.059814453125, -3.6982421875, -3.336669921875, -2.97509765625, -2.613525390625, -2.251953125, -1.890380859375, -1.52880859375, -1.167236328125, -0.8056640625, -0.444091796875, -0.08251953125, 0.279052734375, 0.640625, 1.002197265625, 1.36376953125, 1.725341796875, 2.0869140625, 2.448486328125, 2.81005859375, 3.171630859375, 3.533203125, 3.894775390625, 4.25634765625, 4.617919921875, 4.9794921875, 5.341064453125, 5.70263671875, 6.064208984375, 6.42578125, 6.787353515625, 7.14892578125, 7.510498046875, 7.8720703125, 8.233642578125, 8.59521484375, 8.956787109375, 9.318359375, 9.679931640625, 10.04150390625, 10.403076171875, 10.7646484375, 11.126220703125, 11.48779296875, 11.849365234375, 12.2109375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 3.0, 3.0, 8.0, 6.0, 6.0, 10.0, 14.0, 25.0, 16.0, 32.0, 34.0, 43.0, 48.0, 67.0, 91.0, 110.0, 194.0, 318.0, 528.0, 1145.0, 2575.0, 7029.0, 26271.0, 207154.0, 1806448.0, 1873369.0, 228518.0, 27607.0, 7395.0, 2518.0, 1115.0, 524.0, 339.0, 197.0, 120.0, 79.0, 71.0, 41.0, 37.0, 35.0, 27.0, 15.0, 20.0, 17.0, 15.0, 13.0, 6.0, 7.0, 4.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0], "bins": [-23.390625, -22.68212890625, -21.9736328125, -21.26513671875, -20.556640625, -19.84814453125, -19.1396484375, -18.43115234375, -17.72265625, -17.01416015625, -16.3056640625, -15.59716796875, -14.888671875, -14.18017578125, -13.4716796875, -12.76318359375, -12.0546875, -11.34619140625, -10.6376953125, -9.92919921875, -9.220703125, -8.51220703125, -7.8037109375, -7.09521484375, -6.38671875, -5.67822265625, -4.9697265625, -4.26123046875, -3.552734375, -2.84423828125, -2.1357421875, -1.42724609375, -0.71875, -0.01025390625, 0.6982421875, 1.40673828125, 2.115234375, 2.82373046875, 3.5322265625, 4.24072265625, 4.94921875, 5.65771484375, 6.3662109375, 7.07470703125, 7.783203125, 8.49169921875, 9.2001953125, 9.90869140625, 10.6171875, 11.32568359375, 12.0341796875, 12.74267578125, 13.451171875, 14.15966796875, 14.8681640625, 15.57666015625, 16.28515625, 16.99365234375, 17.7021484375, 18.41064453125, 19.119140625, 19.82763671875, 20.5361328125, 21.24462890625, 21.953125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 3.0, 7.0, 15.0, 14.0, 22.0, 16.0, 48.0, 48.0, 88.0, 91.0, 160.0, 211.0, 236.0, 357.0, 458.0, 509.0, 443.0, 372.0, 279.0, 202.0, 128.0, 105.0, 81.0, 43.0, 34.0, 24.0, 17.0, 14.0, 6.0, 9.0, 2.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0390625, -14.4530029296875, -13.866943359375, -13.2808837890625, -12.69482421875, -12.1087646484375, -11.522705078125, -10.9366455078125, -10.3505859375, -9.7645263671875, -9.178466796875, -8.5924072265625, -8.00634765625, -7.4202880859375, -6.834228515625, -6.2481689453125, -5.662109375, -5.0760498046875, -4.489990234375, -3.9039306640625, -3.31787109375, -2.7318115234375, -2.145751953125, -1.5596923828125, -0.9736328125, -0.3875732421875, 0.198486328125, 0.7845458984375, 1.37060546875, 1.9566650390625, 2.542724609375, 3.1287841796875, 3.71484375, 4.3009033203125, 4.886962890625, 5.4730224609375, 6.05908203125, 6.6451416015625, 7.231201171875, 7.8172607421875, 8.4033203125, 8.9893798828125, 9.575439453125, 10.1614990234375, 10.74755859375, 11.3336181640625, 11.919677734375, 12.5057373046875, 13.091796875, 13.6778564453125, 14.263916015625, 14.8499755859375, 15.43603515625, 16.0220947265625, 16.608154296875, 17.1942138671875, 17.7802734375, 18.3663330078125, 18.952392578125, 19.5384521484375, 20.12451171875, 20.7105712890625, 21.296630859375, 21.8826904296875, 22.46875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 4.0, 10.0, 8.0, 20.0, 18.0, 27.0, 55.0, 93.0, 169.0, 304.0, 639.0, 1573.0, 5300.0, 63567.0, 3869898.0, 240345.0, 8159.0, 2190.0, 845.0, 450.0, 234.0, 146.0, 72.0, 42.0, 33.0, 27.0, 15.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.03125, -52.37548828125, -50.7197265625, -49.06396484375, -47.408203125, -45.75244140625, -44.0966796875, -42.44091796875, -40.78515625, -39.12939453125, -37.4736328125, -35.81787109375, -34.162109375, -32.50634765625, -30.8505859375, -29.19482421875, -27.5390625, -25.88330078125, -24.2275390625, -22.57177734375, -20.916015625, -19.26025390625, -17.6044921875, -15.94873046875, -14.29296875, -12.63720703125, -10.9814453125, -9.32568359375, -7.669921875, -6.01416015625, -4.3583984375, -2.70263671875, -1.046875, 0.60888671875, 2.2646484375, 3.92041015625, 5.576171875, 7.23193359375, 8.8876953125, 10.54345703125, 12.19921875, 13.85498046875, 15.5107421875, 17.16650390625, 18.822265625, 20.47802734375, 22.1337890625, 23.78955078125, 25.4453125, 27.10107421875, 28.7568359375, 30.41259765625, 32.068359375, 33.72412109375, 35.3798828125, 37.03564453125, 38.69140625, 40.34716796875, 42.0029296875, 43.65869140625, 45.314453125, 46.97021484375, 48.6259765625, 50.28173828125, 51.9375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 76.0, 660.0, 261.0, 14.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-433.57232666015625, -417.31134033203125, -401.05035400390625, -384.78936767578125, -368.52838134765625, -352.26739501953125, -336.00640869140625, -319.74542236328125, -303.48443603515625, -287.22344970703125, -270.96246337890625, -254.70147705078125, -238.44049072265625, -222.17950439453125, -205.9185333251953, -189.6575469970703, -173.39657592773438, -157.13558959960938, -140.87460327148438, -124.6136245727539, -108.3526382446289, -92.0916519165039, -75.83067321777344, -59.56968688964844, -43.30870056152344, -27.04771614074707, -10.786731719970703, 5.474250793457031, 21.73523712158203, 37.99622344970703, 54.2572021484375, 70.5181884765625, 86.7791748046875, 103.0401611328125, 119.3011474609375, 135.5621337890625, 151.8231201171875, 168.0841064453125, 184.34507751464844, 200.60606384277344, 216.86705017089844, 233.12803649902344, 249.38902282714844, 265.6499938964844, 281.9109802246094, 298.1719665527344, 314.4329528808594, 330.6939392089844, 346.9549255371094, 363.2159118652344, 379.4768981933594, 395.7378845214844, 411.9988708496094, 428.2598571777344, 444.52081298828125, 460.78179931640625, 477.04278564453125, 493.30377197265625, 509.56475830078125, 525.8257446289062, 542.0867309570312, 558.3477172851562, 574.6087036132812, 590.8696899414062, 607.1306762695312]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 7.0, 8.0, 4.0, 8.0, 9.0, 8.0, 21.0, 10.0, 21.0, 18.0, 26.0, 20.0, 30.0, 25.0, 24.0, 32.0, 40.0, 39.0, 38.0, 36.0, 44.0, 40.0, 34.0, 48.0, 23.0, 46.0, 38.0, 37.0, 38.0, 25.0, 27.0, 25.0, 21.0, 18.0, 9.0, 25.0, 9.0, 18.0, 11.0, 6.0, 6.0, 9.0, 4.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.023075103759766, -57.93684005737305, -55.85060119628906, -53.764366149902344, -51.678131103515625, -49.59189224243164, -47.50565719604492, -45.41941833496094, -43.33318328857422, -41.2469482421875, -39.160709381103516, -37.0744743347168, -34.98823547363281, -32.902000427246094, -30.815765380859375, -28.729528427124023, -26.643291473388672, -24.55705451965332, -22.47081756591797, -20.38458251953125, -18.2983455657959, -16.212108612060547, -14.125872611999512, -12.039636611938477, -9.953399658203125, -7.867163181304932, -5.780926704406738, -3.694690227508545, -1.6084537506103516, 0.477783203125, 2.564019203186035, 4.65025520324707, 6.7364959716796875, 8.822732925415039, 10.908968925476074, 12.99520492553711, 15.081441879272461, 17.167678833007812, 19.25391387939453, 21.340150833129883, 23.426387786865234, 25.512624740600586, 27.598861694335938, 29.685096740722656, 31.771333694458008, 33.85757064819336, 35.94380569458008, 38.03004455566406, 40.11627960205078, 42.2025146484375, 44.288753509521484, 46.3749885559082, 48.46122741699219, 50.547462463378906, 52.633697509765625, 54.719932556152344, 56.80617141723633, 58.89240646362305, 60.97864532470703, 63.06488037109375, 65.15111541748047, 67.23735046386719, 69.32359313964844, 71.40982818603516, 73.49606323242188]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 10.0, 14.0, 16.0, 14.0, 15.0, 20.0, 16.0, 15.0, 33.0, 25.0, 25.0, 33.0, 41.0, 45.0, 39.0, 51.0, 46.0, 57.0, 51.0, 38.0, 37.0, 37.0, 37.0, 36.0, 32.0, 30.0, 31.0, 22.0, 20.0, 19.0, 19.0, 16.0, 11.0, 11.0, 15.0, 1.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.6796875, -8.421630859375, -8.16357421875, -7.905517578125, -7.6474609375, -7.389404296875, -7.13134765625, -6.873291015625, -6.615234375, -6.357177734375, -6.09912109375, -5.841064453125, -5.5830078125, -5.324951171875, -5.06689453125, -4.808837890625, -4.55078125, -4.292724609375, -4.03466796875, -3.776611328125, -3.5185546875, -3.260498046875, -3.00244140625, -2.744384765625, -2.486328125, -2.228271484375, -1.97021484375, -1.712158203125, -1.4541015625, -1.196044921875, -0.93798828125, -0.679931640625, -0.421875, -0.163818359375, 0.09423828125, 0.352294921875, 0.6103515625, 0.868408203125, 1.12646484375, 1.384521484375, 1.642578125, 1.900634765625, 2.15869140625, 2.416748046875, 2.6748046875, 2.932861328125, 3.19091796875, 3.448974609375, 3.70703125, 3.965087890625, 4.22314453125, 4.481201171875, 4.7392578125, 4.997314453125, 5.25537109375, 5.513427734375, 5.771484375, 6.029541015625, 6.28759765625, 6.545654296875, 6.8037109375, 7.061767578125, 7.31982421875, 7.577880859375, 7.8359375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 5.0, 7.0, 7.0, 17.0, 24.0, 30.0, 33.0, 57.0, 69.0, 84.0, 136.0, 202.0, 223.0, 425.0, 558.0, 833.0, 1220.0, 1667.0, 2525.0, 3450.0, 5262.0, 7654.0, 11475.0, 16573.0, 25169.0, 38025.0, 59343.0, 98651.0, 213844.0, 269535.0, 106269.0, 62966.0, 40117.0, 26681.0, 17718.0, 11975.0, 7988.0, 5543.0, 3686.0, 2605.0, 1841.0, 1277.0, 827.0, 606.0, 387.0, 269.0, 206.0, 114.0, 112.0, 77.0, 55.0, 56.0, 22.0, 30.0, 10.0, 16.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.8779296875, -1.819366455078125, -1.76080322265625, -1.702239990234375, -1.6436767578125, -1.585113525390625, -1.52655029296875, -1.467987060546875, -1.409423828125, -1.350860595703125, -1.29229736328125, -1.233734130859375, -1.1751708984375, -1.116607666015625, -1.05804443359375, -0.999481201171875, -0.94091796875, -0.882354736328125, -0.82379150390625, -0.765228271484375, -0.7066650390625, -0.648101806640625, -0.58953857421875, -0.530975341796875, -0.472412109375, -0.413848876953125, -0.35528564453125, -0.296722412109375, -0.2381591796875, -0.179595947265625, -0.12103271484375, -0.062469482421875, -0.00390625, 0.054656982421875, 0.11322021484375, 0.171783447265625, 0.2303466796875, 0.288909912109375, 0.34747314453125, 0.406036376953125, 0.464599609375, 0.523162841796875, 0.58172607421875, 0.640289306640625, 0.6988525390625, 0.757415771484375, 0.81597900390625, 0.874542236328125, 0.93310546875, 0.991668701171875, 1.05023193359375, 1.108795166015625, 1.1673583984375, 1.225921630859375, 1.28448486328125, 1.343048095703125, 1.401611328125, 1.460174560546875, 1.51873779296875, 1.577301025390625, 1.6358642578125, 1.694427490234375, 1.75299072265625, 1.811553955078125, 1.8701171875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 6.0, 6.0, 7.0, 11.0, 17.0, 13.0, 10.0, 22.0, 13.0, 31.0, 23.0, 19.0, 33.0, 30.0, 44.0, 37.0, 48.0, 45.0, 47.0, 1067.0, 46.0, 34.0, 38.0, 40.0, 42.0, 39.0, 26.0, 26.0, 26.0, 30.0, 25.0, 29.0, 24.0, 14.0, 14.0, 7.0, 10.0, 5.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.52850341796875, -5.3656005859375, -5.20269775390625, -5.039794921875, -4.87689208984375, -4.7139892578125, -4.55108642578125, -4.38818359375, -4.22528076171875, -4.0623779296875, -3.89947509765625, -3.736572265625, -3.57366943359375, -3.4107666015625, -3.24786376953125, -3.0849609375, -2.92205810546875, -2.7591552734375, -2.59625244140625, -2.433349609375, -2.27044677734375, -2.1075439453125, -1.94464111328125, -1.78173828125, -1.61883544921875, -1.4559326171875, -1.29302978515625, -1.130126953125, -0.96722412109375, -0.8043212890625, -0.64141845703125, -0.478515625, -0.31561279296875, -0.1527099609375, 0.01019287109375, 0.173095703125, 0.33599853515625, 0.4989013671875, 0.66180419921875, 0.82470703125, 0.98760986328125, 1.1505126953125, 1.31341552734375, 1.476318359375, 1.63922119140625, 1.8021240234375, 1.96502685546875, 2.1279296875, 2.29083251953125, 2.4537353515625, 2.61663818359375, 2.779541015625, 2.94244384765625, 3.1053466796875, 3.26824951171875, 3.43115234375, 3.59405517578125, 3.7569580078125, 3.91986083984375, 4.082763671875, 4.24566650390625, 4.4085693359375, 4.57147216796875, 4.734375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 0.0, 10.0, 11.0, 22.0, 23.0, 45.0, 80.0, 103.0, 151.0, 267.0, 407.0, 594.0, 958.0, 1395.0, 2142.0, 3200.0, 5093.0, 7639.0, 11688.0, 18367.0, 28456.0, 45866.0, 74656.0, 133784.0, 1371828.0, 161529.0, 85791.0, 52472.0, 32530.0, 20128.0, 13156.0, 8612.0, 5500.0, 3632.0, 2320.0, 1627.0, 1026.0, 728.0, 461.0, 287.0, 204.0, 119.0, 84.0, 47.0, 37.0, 16.0, 22.0, 11.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.142578125, -2.0788726806640625, -2.015167236328125, -1.9514617919921875, -1.88775634765625, -1.8240509033203125, -1.760345458984375, -1.6966400146484375, -1.6329345703125, -1.5692291259765625, -1.505523681640625, -1.4418182373046875, -1.37811279296875, -1.3144073486328125, -1.250701904296875, -1.1869964599609375, -1.123291015625, -1.0595855712890625, -0.995880126953125, -0.9321746826171875, -0.86846923828125, -0.8047637939453125, -0.741058349609375, -0.6773529052734375, -0.6136474609375, -0.5499420166015625, -0.486236572265625, -0.4225311279296875, -0.35882568359375, -0.2951202392578125, -0.231414794921875, -0.1677093505859375, -0.10400390625, -0.0402984619140625, 0.023406982421875, 0.0871124267578125, 0.15081787109375, 0.2145233154296875, 0.278228759765625, 0.3419342041015625, 0.4056396484375, 0.4693450927734375, 0.533050537109375, 0.5967559814453125, 0.66046142578125, 0.7241668701171875, 0.787872314453125, 0.8515777587890625, 0.915283203125, 0.9789886474609375, 1.042694091796875, 1.1063995361328125, 1.17010498046875, 1.2338104248046875, 1.297515869140625, 1.3612213134765625, 1.4249267578125, 1.4886322021484375, 1.552337646484375, 1.6160430908203125, 1.67974853515625, 1.7434539794921875, 1.807159423828125, 1.8708648681640625, 1.9345703125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 11.0, 10.0, 9.0, 10.0, 10.0, 19.0, 16.0, 19.0, 35.0, 19.0, 31.0, 48.0, 47.0, 66.0, 51.0, 71.0, 64.0, 71.0, 50.0, 42.0, 51.0, 39.0, 30.0, 22.0, 22.0, 27.0, 20.0, 16.0, 8.0, 10.0, 6.0, 9.0, 9.0, 4.0, 2.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003330707550048828, -0.0003230385482311249, -0.00031300634145736694, -0.000302974134683609, -0.0002929419279098511, -0.00028290972113609314, -0.0002728775143623352, -0.00026284530758857727, -0.00025281310081481934, -0.0002427808940410614, -0.00023274868726730347, -0.00022271648049354553, -0.0002126842737197876, -0.00020265206694602966, -0.00019261986017227173, -0.0001825876533985138, -0.00017255544662475586, -0.00016252323985099792, -0.00015249103307724, -0.00014245882630348206, -0.00013242661952972412, -0.0001223944127559662, -0.00011236220598220825, -0.00010232999920845032, -9.229779243469238e-05, -8.226558566093445e-05, -7.223337888717651e-05, -6.220117211341858e-05, -5.2168965339660645e-05, -4.213675856590271e-05, -3.2104551792144775e-05, -2.207234501838684e-05, -1.2040138244628906e-05, -2.0079314708709717e-06, 8.024275302886963e-06, 1.8056482076644897e-05, 2.8088688850402832e-05, 3.8120895624160767e-05, 4.81531023979187e-05, 5.8185309171676636e-05, 6.821751594543457e-05, 7.82497227191925e-05, 8.828192949295044e-05, 9.831413626670837e-05, 0.00010834634304046631, 0.00011837854981422424, 0.00012841075658798218, 0.0001384429633617401, 0.00014847517013549805, 0.00015850737690925598, 0.00016853958368301392, 0.00017857179045677185, 0.00018860399723052979, 0.00019863620400428772, 0.00020866841077804565, 0.0002187006175518036, 0.00022873282432556152, 0.00023876503109931946, 0.0002487972378730774, 0.00025882944464683533, 0.00026886165142059326, 0.0002788938581943512, 0.00028892606496810913, 0.00029895827174186707, 0.000308990478515625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 12.0, 14.0, 14.0, 26.0, 19.0, 21.0, 38.0, 36.0, 63.0, 64.0, 90.0, 125.0, 176.0, 288.0, 388.0, 625.0, 1409.0, 116673.0, 923404.0, 2642.0, 830.0, 466.0, 328.0, 177.0, 134.0, 115.0, 78.0, 57.0, 53.0, 32.0, 32.0, 21.0, 20.0, 13.0, 4.0, 8.0, 12.0, 4.0, 9.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004985809326171875, -0.00480884313583374, -0.0046318769454956055, -0.004454910755157471, -0.004277944564819336, -0.004100978374481201, -0.003924012184143066, -0.0037470459938049316, -0.003570079803466797, -0.003393113613128662, -0.0032161474227905273, -0.0030391812324523926, -0.002862215042114258, -0.002685248851776123, -0.0025082826614379883, -0.0023313164710998535, -0.0021543502807617188, -0.001977384090423584, -0.0018004179000854492, -0.0016234517097473145, -0.0014464855194091797, -0.001269519329071045, -0.0010925531387329102, -0.0009155869483947754, -0.0007386207580566406, -0.0005616545677185059, -0.0003846883773803711, -0.00020772218704223633, -3.075599670410156e-05, 0.0001462101936340332, 0.00032317638397216797, 0.0005001425743103027, 0.0006771087646484375, 0.0008540749549865723, 0.001031041145324707, 0.0012080073356628418, 0.0013849735260009766, 0.0015619397163391113, 0.001738905906677246, 0.0019158720970153809, 0.0020928382873535156, 0.0022698044776916504, 0.002446770668029785, 0.00262373685836792, 0.0028007030487060547, 0.0029776692390441895, 0.0031546354293823242, 0.003331601619720459, 0.0035085678100585938, 0.0036855340003967285, 0.0038625001907348633, 0.004039466381072998, 0.004216432571411133, 0.004393398761749268, 0.004570364952087402, 0.004747331142425537, 0.004924297332763672, 0.005101263523101807, 0.005278229713439941, 0.005455195903778076, 0.005632162094116211, 0.005809128284454346, 0.0059860944747924805, 0.006163060665130615, 0.00634002685546875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 14.0, 11.0, 126.0, 277.0, 289.0, 208.0, 64.0, 17.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004347774083726108, -0.0004204344004392624, -0.00040609139250591397, -0.00039174838457256556, -0.0003774054057430476, -0.0003630623978096992, -0.00034871938987635076, -0.00033437638194300234, -0.0003200334031134844, -0.00030569039518013597, -0.00029134738724678755, -0.00027700437931343913, -0.00026266140048392117, -0.00024831839255057275, -0.00023397538461722434, -0.00021963237668387592, -0.0002052893687505275, -0.00019094636081717908, -0.0001766033674357459, -0.00016226035950239748, -0.0001479173661209643, -0.00013357435818761587, -0.00011923135025426745, -0.00010488834959687665, -9.054534893948585e-05, -7.620234828209504e-05, -6.185934762470424e-05, -4.7516339691355824e-05, -3.317333903396502e-05, -1.8830338376574218e-05, -4.487330443225801e-06, 9.855670214165002e-06, 2.4198670871555805e-05, 3.854167152894661e-05, 5.288467582431622e-05, 6.722768011968583e-05, 8.157068077707663e-05, 9.591368143446743e-05, 0.00011025668936781585, 0.00012459969730116427, 0.00013894269068259746, 0.00015328569861594588, 0.00016762869199737906, 0.00018197169993072748, 0.0001963147078640759, 0.0002106577012455091, 0.0002250007091788575, 0.0002393437025602907, 0.0002536867104936391, 0.00026802971842698753, 0.00028237272636033595, 0.0002967157051898539, 0.0003110587131232023, 0.00032540172105655074, 0.00033974472898989916, 0.0003540877369232476, 0.000368430744856596, 0.0003827737527899444, 0.00039711676072329283, 0.00041145976865664124, 0.0004258027474861592, 0.0004401457554195076, 0.00045448876335285604, 0.00046883177128620446, 0.0004831747501157224]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 6.0, 7.0, 13.0, 9.0, 11.0, 16.0, 21.0, 22.0, 15.0, 30.0, 22.0, 27.0, 33.0, 44.0, 44.0, 34.0, 40.0, 39.0, 37.0, 42.0, 39.0, 45.0, 48.0, 33.0, 31.0, 29.0, 49.0, 25.0, 21.0, 23.0, 25.0, 18.0, 16.0, 16.0, 12.0, 12.0, 11.0, 5.0, 7.0, 5.0, 4.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001729130744934082, -0.00016749370843172073, -0.00016207434237003326, -0.0001566549763083458, -0.00015123561024665833, -0.00014581624418497086, -0.00014039687812328339, -0.00013497751206159592, -0.00012955814599990845, -0.00012413877993822098, -0.00011871941387653351, -0.00011330004781484604, -0.00010788068175315857, -0.0001024613156914711, -9.704194962978363e-05, -9.162258356809616e-05, -8.620321750640869e-05, -8.078385144472122e-05, -7.536448538303375e-05, -6.994511932134628e-05, -6.452575325965881e-05, -5.9106387197971344e-05, -5.3687021136283875e-05, -4.8267655074596405e-05, -4.2848289012908936e-05, -3.7428922951221466e-05, -3.2009556889533997e-05, -2.6590190827846527e-05, -2.1170824766159058e-05, -1.5751458704471588e-05, -1.0332092642784119e-05, -4.912726581096649e-06, 5.066394805908203e-07, 5.92600554227829e-06, 1.134537160396576e-05, 1.676473766565323e-05, 2.2184103727340698e-05, 2.7603469789028168e-05, 3.302283585071564e-05, 3.844220191240311e-05, 4.3861567974090576e-05, 4.9280934035778046e-05, 5.4700300097465515e-05, 6.0119666159152985e-05, 6.553903222084045e-05, 7.095839828252792e-05, 7.637776434421539e-05, 8.179713040590286e-05, 8.721649646759033e-05, 9.26358625292778e-05, 9.805522859096527e-05, 0.00010347459465265274, 0.00010889396071434021, 0.00011431332677602768, 0.00011973269283771515, 0.00012515205889940262, 0.0001305714249610901, 0.00013599079102277756, 0.00014141015708446503, 0.0001468295231461525, 0.00015224888920783997, 0.00015766825526952744, 0.0001630876213312149, 0.00016850698739290237, 0.00017392635345458984]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 10.0, 14.0, 16.0, 14.0, 15.0, 20.0, 16.0, 15.0, 33.0, 25.0, 25.0, 33.0, 41.0, 45.0, 39.0, 51.0, 46.0, 57.0, 51.0, 38.0, 37.0, 37.0, 37.0, 36.0, 32.0, 30.0, 31.0, 22.0, 20.0, 19.0, 19.0, 16.0, 11.0, 11.0, 15.0, 1.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.6796875, -8.421630859375, -8.16357421875, -7.905517578125, -7.6474609375, -7.389404296875, -7.13134765625, -6.873291015625, -6.615234375, -6.357177734375, -6.09912109375, -5.841064453125, -5.5830078125, -5.324951171875, -5.06689453125, -4.808837890625, -4.55078125, -4.292724609375, -4.03466796875, -3.776611328125, -3.5185546875, -3.260498046875, -3.00244140625, -2.744384765625, -2.486328125, -2.228271484375, -1.97021484375, -1.712158203125, -1.4541015625, -1.196044921875, -0.93798828125, -0.679931640625, -0.421875, -0.163818359375, 0.09423828125, 0.352294921875, 0.6103515625, 0.868408203125, 1.12646484375, 1.384521484375, 1.642578125, 1.900634765625, 2.15869140625, 2.416748046875, 2.6748046875, 2.932861328125, 3.19091796875, 3.448974609375, 3.70703125, 3.965087890625, 4.22314453125, 4.481201171875, 4.7392578125, 4.997314453125, 5.25537109375, 5.513427734375, 5.771484375, 6.029541015625, 6.28759765625, 6.545654296875, 6.8037109375, 7.061767578125, 7.31982421875, 7.577880859375, 7.8359375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 9.0, 3.0, 18.0, 23.0, 49.0, 39.0, 55.0, 79.0, 124.0, 135.0, 201.0, 314.0, 454.0, 682.0, 1129.0, 2037.0, 4318.0, 12114.0, 50005.0, 338058.0, 528544.0, 81070.0, 17195.0, 5640.0, 2490.0, 1284.0, 783.0, 513.0, 299.0, 235.0, 185.0, 109.0, 91.0, 70.0, 50.0, 32.0, 32.0, 19.0, 12.0, 11.0, 9.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.140625, -15.653564453125, -15.16650390625, -14.679443359375, -14.1923828125, -13.705322265625, -13.21826171875, -12.731201171875, -12.244140625, -11.757080078125, -11.27001953125, -10.782958984375, -10.2958984375, -9.808837890625, -9.32177734375, -8.834716796875, -8.34765625, -7.860595703125, -7.37353515625, -6.886474609375, -6.3994140625, -5.912353515625, -5.42529296875, -4.938232421875, -4.451171875, -3.964111328125, -3.47705078125, -2.989990234375, -2.5029296875, -2.015869140625, -1.52880859375, -1.041748046875, -0.5546875, -0.067626953125, 0.41943359375, 0.906494140625, 1.3935546875, 1.880615234375, 2.36767578125, 2.854736328125, 3.341796875, 3.828857421875, 4.31591796875, 4.802978515625, 5.2900390625, 5.777099609375, 6.26416015625, 6.751220703125, 7.23828125, 7.725341796875, 8.21240234375, 8.699462890625, 9.1865234375, 9.673583984375, 10.16064453125, 10.647705078125, 11.134765625, 11.621826171875, 12.10888671875, 12.595947265625, 13.0830078125, 13.570068359375, 14.05712890625, 14.544189453125, 15.03125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 6.0, 12.0, 10.0, 16.0, 15.0, 21.0, 17.0, 34.0, 29.0, 41.0, 49.0, 56.0, 82.0, 173.0, 1488.0, 404.0, 172.0, 87.0, 69.0, 35.0, 45.0, 38.0, 26.0, 21.0, 19.0, 11.0, 8.0, 15.0, 8.0, 7.0, 4.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.328125, -23.515380859375, -22.70263671875, -21.889892578125, -21.0771484375, -20.264404296875, -19.45166015625, -18.638916015625, -17.826171875, -17.013427734375, -16.20068359375, -15.387939453125, -14.5751953125, -13.762451171875, -12.94970703125, -12.136962890625, -11.32421875, -10.511474609375, -9.69873046875, -8.885986328125, -8.0732421875, -7.260498046875, -6.44775390625, -5.635009765625, -4.822265625, -4.009521484375, -3.19677734375, -2.384033203125, -1.5712890625, -0.758544921875, 0.05419921875, 0.866943359375, 1.6796875, 2.492431640625, 3.30517578125, 4.117919921875, 4.9306640625, 5.743408203125, 6.55615234375, 7.368896484375, 8.181640625, 8.994384765625, 9.80712890625, 10.619873046875, 11.4326171875, 12.245361328125, 13.05810546875, 13.870849609375, 14.68359375, 15.496337890625, 16.30908203125, 17.121826171875, 17.9345703125, 18.747314453125, 19.56005859375, 20.372802734375, 21.185546875, 21.998291015625, 22.81103515625, 23.623779296875, 24.4365234375, 25.249267578125, 26.06201171875, 26.874755859375, 27.6875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 10.0, 17.0, 16.0, 20.0, 28.0, 47.0, 50.0, 94.0, 107.0, 193.0, 259.0, 557.0, 1458.0, 8677.0, 3101117.0, 29461.0, 1951.0, 667.0, 326.0, 204.0, 134.0, 75.0, 55.0, 46.0, 22.0, 24.0, 26.0, 20.0, 7.0, 9.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-54.09375, -52.32763671875, -50.5615234375, -48.79541015625, -47.029296875, -45.26318359375, -43.4970703125, -41.73095703125, -39.96484375, -38.19873046875, -36.4326171875, -34.66650390625, -32.900390625, -31.13427734375, -29.3681640625, -27.60205078125, -25.8359375, -24.06982421875, -22.3037109375, -20.53759765625, -18.771484375, -17.00537109375, -15.2392578125, -13.47314453125, -11.70703125, -9.94091796875, -8.1748046875, -6.40869140625, -4.642578125, -2.87646484375, -1.1103515625, 0.65576171875, 2.421875, 4.18798828125, 5.9541015625, 7.72021484375, 9.486328125, 11.25244140625, 13.0185546875, 14.78466796875, 16.55078125, 18.31689453125, 20.0830078125, 21.84912109375, 23.615234375, 25.38134765625, 27.1474609375, 28.91357421875, 30.6796875, 32.44580078125, 34.2119140625, 35.97802734375, 37.744140625, 39.51025390625, 41.2763671875, 43.04248046875, 44.80859375, 46.57470703125, 48.3408203125, 50.10693359375, 51.873046875, 53.63916015625, 55.4052734375, 57.17138671875, 58.9375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [19.0, 51.0, 248.0, 450.0, 182.0, 49.0, 11.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.610172271728516, -8.819649696350098, -5.02912712097168, -1.2386045455932617, 2.5519180297851562, 6.342441558837891, 10.132963180541992, 13.923484802246094, 17.714008331298828, 21.504531860351562, 25.295053482055664, 29.085575103759766, 32.8760986328125, 36.666622161865234, 40.45714569091797, 44.24766540527344, 48.03818893432617, 51.828712463378906, 55.619232177734375, 59.40975570678711, 63.200279235839844, 66.99079895019531, 70.78132629394531, 74.57184600830078, 78.36236572265625, 82.15288543701172, 85.94341278076172, 89.73393249511719, 93.52445983886719, 97.31497955322266, 101.10549926757812, 104.89602661132812, 108.68655395507812, 112.4770736694336, 116.2676010131836, 120.05812072753906, 123.84864807128906, 127.63916778564453, 131.4296875, 135.22021484375, 139.0107421875, 142.80126953125, 146.59178161621094, 150.38230895996094, 154.17283630371094, 157.96334838867188, 161.75387573242188, 165.54440307617188, 169.3349151611328, 173.1254425048828, 176.91595458984375, 180.70648193359375, 184.49700927734375, 188.28753662109375, 192.0780487060547, 195.8685760498047, 199.65908813476562, 203.44961547851562, 207.24012756347656, 211.03065490722656, 214.82118225097656, 218.6116943359375, 222.4022216796875, 226.1927490234375, 229.9832763671875]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 8.0, 4.0, 5.0, 7.0, 7.0, 11.0, 11.0, 16.0, 19.0, 35.0, 26.0, 42.0, 36.0, 38.0, 40.0, 48.0, 40.0, 37.0, 57.0, 52.0, 35.0, 42.0, 26.0, 30.0, 43.0, 34.0, 30.0, 31.0, 30.0, 25.0, 21.0, 27.0, 11.0, 11.0, 13.0, 15.0, 6.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-53.00392532348633, -51.40496826171875, -49.80601119995117, -48.207054138183594, -46.608097076416016, -45.00914001464844, -43.41018295288086, -41.81122589111328, -40.2122688293457, -38.613311767578125, -37.01435470581055, -35.41539764404297, -33.81644058227539, -32.21748352050781, -30.618526458740234, -29.019569396972656, -27.420610427856445, -25.821653366088867, -24.22269630432129, -22.62373924255371, -21.024782180786133, -19.425825119018555, -17.826866149902344, -16.227909088134766, -14.628952980041504, -13.029995918273926, -11.431038856506348, -9.832080841064453, -8.233123779296875, -6.634167194366455, -5.035209655761719, -3.4362525939941406, -1.8372955322265625, -0.23833835124969482, 1.3606188297271729, 2.95957612991333, 4.558533191680908, 6.157490253448486, 7.756447792053223, 9.3554048538208, 10.954361915588379, 12.553318977355957, 14.152276039123535, 15.75123405456543, 17.350191116333008, 18.949148178100586, 20.548105239868164, 22.147062301635742, 23.74601936340332, 25.3449764251709, 26.943933486938477, 28.542890548706055, 30.141847610473633, 31.74080467224121, 33.33976364135742, 34.938720703125, 36.53767776489258, 38.136634826660156, 39.735591888427734, 41.33454895019531, 42.93350601196289, 44.53246307373047, 46.13142013549805, 47.730377197265625, 49.3293342590332]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 8.0, 8.0, 13.0, 15.0, 15.0, 22.0, 23.0, 24.0, 25.0, 43.0, 39.0, 37.0, 40.0, 45.0, 45.0, 49.0, 45.0, 43.0, 46.0, 47.0, 55.0, 26.0, 35.0, 30.0, 32.0, 26.0, 31.0, 13.0, 24.0, 14.0, 12.0, 15.0, 7.0, 5.0, 6.0, 6.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-11.1484375, -10.8441162109375, -10.539794921875, -10.2354736328125, -9.93115234375, -9.6268310546875, -9.322509765625, -9.0181884765625, -8.7138671875, -8.4095458984375, -8.105224609375, -7.8009033203125, -7.49658203125, -7.1922607421875, -6.887939453125, -6.5836181640625, -6.279296875, -5.9749755859375, -5.670654296875, -5.3663330078125, -5.06201171875, -4.7576904296875, -4.453369140625, -4.1490478515625, -3.8447265625, -3.5404052734375, -3.236083984375, -2.9317626953125, -2.62744140625, -2.3231201171875, -2.018798828125, -1.7144775390625, -1.41015625, -1.1058349609375, -0.801513671875, -0.4971923828125, -0.19287109375, 0.1114501953125, 0.415771484375, 0.7200927734375, 1.0244140625, 1.3287353515625, 1.633056640625, 1.9373779296875, 2.24169921875, 2.5460205078125, 2.850341796875, 3.1546630859375, 3.458984375, 3.7633056640625, 4.067626953125, 4.3719482421875, 4.67626953125, 4.9805908203125, 5.284912109375, 5.5892333984375, 5.8935546875, 6.1978759765625, 6.502197265625, 6.8065185546875, 7.11083984375, 7.4151611328125, 7.719482421875, 8.0238037109375, 8.328125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 10.0, 9.0, 9.0, 11.0, 12.0, 23.0, 21.0, 40.0, 45.0, 60.0, 99.0, 110.0, 160.0, 209.0, 310.0, 549.0, 781.0, 1335.0, 3538.0, 38922.0, 2809211.0, 1315662.0, 17073.0, 2695.0, 1203.0, 645.0, 392.0, 306.0, 214.0, 174.0, 119.0, 83.0, 72.0, 52.0, 25.0, 28.0, 14.0, 13.0, 9.0, 12.0, 7.0, 9.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0], "bins": [-56.0, -54.4814453125, -52.962890625, -51.4443359375, -49.92578125, -48.4072265625, -46.888671875, -45.3701171875, -43.8515625, -42.3330078125, -40.814453125, -39.2958984375, -37.77734375, -36.2587890625, -34.740234375, -33.2216796875, -31.703125, -30.1845703125, -28.666015625, -27.1474609375, -25.62890625, -24.1103515625, -22.591796875, -21.0732421875, -19.5546875, -18.0361328125, -16.517578125, -14.9990234375, -13.48046875, -11.9619140625, -10.443359375, -8.9248046875, -7.40625, -5.8876953125, -4.369140625, -2.8505859375, -1.33203125, 0.1865234375, 1.705078125, 3.2236328125, 4.7421875, 6.2607421875, 7.779296875, 9.2978515625, 10.81640625, 12.3349609375, 13.853515625, 15.3720703125, 16.890625, 18.4091796875, 19.927734375, 21.4462890625, 22.96484375, 24.4833984375, 26.001953125, 27.5205078125, 29.0390625, 30.5576171875, 32.076171875, 33.5947265625, 35.11328125, 36.6318359375, 38.150390625, 39.6689453125, 41.1875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 10.0, 11.0, 9.0, 30.0, 48.0, 52.0, 109.0, 200.0, 291.0, 470.0, 622.0, 689.0, 545.0, 384.0, 229.0, 135.0, 80.0, 54.0, 30.0, 15.0, 13.0, 14.0, 5.0, 3.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.390625, -20.70751953125, -20.0244140625, -19.34130859375, -18.658203125, -17.97509765625, -17.2919921875, -16.60888671875, -15.92578125, -15.24267578125, -14.5595703125, -13.87646484375, -13.193359375, -12.51025390625, -11.8271484375, -11.14404296875, -10.4609375, -9.77783203125, -9.0947265625, -8.41162109375, -7.728515625, -7.04541015625, -6.3623046875, -5.67919921875, -4.99609375, -4.31298828125, -3.6298828125, -2.94677734375, -2.263671875, -1.58056640625, -0.8974609375, -0.21435546875, 0.46875, 1.15185546875, 1.8349609375, 2.51806640625, 3.201171875, 3.88427734375, 4.5673828125, 5.25048828125, 5.93359375, 6.61669921875, 7.2998046875, 7.98291015625, 8.666015625, 9.34912109375, 10.0322265625, 10.71533203125, 11.3984375, 12.08154296875, 12.7646484375, 13.44775390625, 14.130859375, 14.81396484375, 15.4970703125, 16.18017578125, 16.86328125, 17.54638671875, 18.2294921875, 18.91259765625, 19.595703125, 20.27880859375, 20.9619140625, 21.64501953125, 22.328125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 8.0, 21.0, 30.0, 50.0, 95.0, 177.0, 343.0, 584.0, 1207.0, 2747.0, 7677.0, 36324.0, 373870.0, 3025278.0, 673280.0, 56186.0, 10137.0, 3282.0, 1388.0, 711.0, 360.0, 217.0, 127.0, 52.0, 46.0, 20.0, 7.0, 8.0, 6.0, 6.0, 7.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.328125, -20.6533203125, -19.978515625, -19.3037109375, -18.62890625, -17.9541015625, -17.279296875, -16.6044921875, -15.9296875, -15.2548828125, -14.580078125, -13.9052734375, -13.23046875, -12.5556640625, -11.880859375, -11.2060546875, -10.53125, -9.8564453125, -9.181640625, -8.5068359375, -7.83203125, -7.1572265625, -6.482421875, -5.8076171875, -5.1328125, -4.4580078125, -3.783203125, -3.1083984375, -2.43359375, -1.7587890625, -1.083984375, -0.4091796875, 0.265625, 0.9404296875, 1.615234375, 2.2900390625, 2.96484375, 3.6396484375, 4.314453125, 4.9892578125, 5.6640625, 6.3388671875, 7.013671875, 7.6884765625, 8.36328125, 9.0380859375, 9.712890625, 10.3876953125, 11.0625, 11.7373046875, 12.412109375, 13.0869140625, 13.76171875, 14.4365234375, 15.111328125, 15.7861328125, 16.4609375, 17.1357421875, 17.810546875, 18.4853515625, 19.16015625, 19.8349609375, 20.509765625, 21.1845703125, 21.859375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 7.0, 14.0, 20.0, 27.0, 34.0, 54.0, 52.0, 82.0, 83.0, 107.0, 106.0, 90.0, 84.0, 61.0, 50.0, 45.0, 25.0, 20.0, 18.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.49153900146484, -72.17437744140625, -68.85720825195312, -65.54004669189453, -62.22288513183594, -58.905723571777344, -55.588558197021484, -52.271392822265625, -48.95423126220703, -45.63706970214844, -42.31990432739258, -39.00273895263672, -35.685577392578125, -32.36841583251953, -29.051250457763672, -25.734086990356445, -22.41692352294922, -19.099760055541992, -15.782596588134766, -12.465433120727539, -9.148269653320312, -5.831106185913086, -2.5139427185058594, 0.8032207489013672, 4.120384216308594, 7.43754768371582, 10.754711151123047, 14.071874618530273, 17.3890380859375, 20.706201553344727, 24.023365020751953, 27.34052848815918, 30.657684326171875, 33.97484588623047, 37.29201126098633, 40.60917663574219, 43.92633819580078, 47.243499755859375, 50.560665130615234, 53.877830505371094, 57.19499206542969, 60.51215362548828, 63.82931900024414, 67.146484375, 70.4636459350586, 73.78080749511719, 77.09797668457031, 80.4151382446289, 83.7322998046875, 87.0494613647461, 90.36662292480469, 93.68379211425781, 97.0009536743164, 100.318115234375, 103.63528442382812, 106.95244598388672, 110.26960754394531, 113.5867691040039, 116.9039306640625, 120.22109985351562, 123.53826141357422, 126.85542297363281, 130.17259216308594, 133.48974609375, 136.80691528320312]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 10.0, 6.0, 12.0, 14.0, 9.0, 15.0, 12.0, 28.0, 31.0, 27.0, 39.0, 32.0, 43.0, 35.0, 47.0, 37.0, 46.0, 37.0, 37.0, 40.0, 51.0, 31.0, 34.0, 32.0, 45.0, 29.0, 28.0, 23.0, 23.0, 15.0, 21.0, 18.0, 13.0, 15.0, 8.0, 7.0, 6.0, 5.0, 4.0, 5.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.383052825927734, -48.646949768066406, -46.91084671020508, -45.17474365234375, -43.43864059448242, -41.702537536621094, -39.966434478759766, -38.23033142089844, -36.49422836303711, -34.75812530517578, -33.02202224731445, -31.285919189453125, -29.549816131591797, -27.81371307373047, -26.07761001586914, -24.341506958007812, -22.605403900146484, -20.869300842285156, -19.133197784423828, -17.3970947265625, -15.660991668701172, -13.924888610839844, -12.188785552978516, -10.452682495117188, -8.71657943725586, -6.980476379394531, -5.244373321533203, -3.508270263671875, -1.7721672058105469, -0.03606414794921875, 1.7000389099121094, 3.4361419677734375, 5.172245025634766, 6.908348083496094, 8.644451141357422, 10.38055419921875, 12.116657257080078, 13.852760314941406, 15.588863372802734, 17.324966430664062, 19.06106948852539, 20.79717254638672, 22.533275604248047, 24.269378662109375, 26.005481719970703, 27.74158477783203, 29.47768783569336, 31.213790893554688, 32.949893951416016, 34.685997009277344, 36.42210006713867, 38.158203125, 39.89430618286133, 41.630409240722656, 43.366512298583984, 45.10261535644531, 46.83871841430664, 48.57482147216797, 50.3109245300293, 52.047027587890625, 53.78313064575195, 55.51923370361328, 57.25533676147461, 58.99143981933594, 60.727542877197266]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 12.0, 8.0, 13.0, 8.0, 11.0, 15.0, 16.0, 20.0, 23.0, 25.0, 33.0, 27.0, 48.0, 42.0, 39.0, 39.0, 51.0, 36.0, 52.0, 44.0, 44.0, 34.0, 40.0, 40.0, 34.0, 33.0, 27.0, 33.0, 16.0, 23.0, 15.0, 12.0, 16.0, 16.0, 12.0, 5.0, 7.0, 4.0, 6.0, 2.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.25, -82.2626953125, -79.275390625, -76.2880859375, -73.30078125, -70.3134765625, -67.326171875, -64.3388671875, -61.3515625, -58.3642578125, -55.376953125, -52.3896484375, -49.40234375, -46.4150390625, -43.427734375, -40.4404296875, -37.453125, -34.4658203125, -31.478515625, -28.4912109375, -25.50390625, -22.5166015625, -19.529296875, -16.5419921875, -13.5546875, -10.5673828125, -7.580078125, -4.5927734375, -1.60546875, 1.3818359375, 4.369140625, 7.3564453125, 10.34375, 13.3310546875, 16.318359375, 19.3056640625, 22.29296875, 25.2802734375, 28.267578125, 31.2548828125, 34.2421875, 37.2294921875, 40.216796875, 43.2041015625, 46.19140625, 49.1787109375, 52.166015625, 55.1533203125, 58.140625, 61.1279296875, 64.115234375, 67.1025390625, 70.08984375, 73.0771484375, 76.064453125, 79.0517578125, 82.0390625, 85.0263671875, 88.013671875, 91.0009765625, 93.98828125, 96.9755859375, 99.962890625, 102.9501953125, 105.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 5.0, 13.0, 20.0, 24.0, 48.0, 61.0, 91.0, 143.0, 208.0, 320.0, 468.0, 729.0, 1085.0, 1642.0, 2387.0, 3579.0, 5340.0, 8105.0, 11998.0, 18757.0, 30027.0, 50637.0, 91290.0, 202936.0, 333031.0, 120670.0, 62986.0, 36718.0, 22436.0, 14465.0, 9400.0, 6236.0, 4198.0, 2844.0, 1884.0, 1215.0, 887.0, 565.0, 381.0, 225.0, 171.0, 130.0, 70.0, 44.0, 30.0, 20.0, 17.0, 10.0, 2.0, 4.0, 0.0, 3.0, 2.0], "bins": [-27.265625, -26.490966796875, -25.71630859375, -24.941650390625, -24.1669921875, -23.392333984375, -22.61767578125, -21.843017578125, -21.068359375, -20.293701171875, -19.51904296875, -18.744384765625, -17.9697265625, -17.195068359375, -16.42041015625, -15.645751953125, -14.87109375, -14.096435546875, -13.32177734375, -12.547119140625, -11.7724609375, -10.997802734375, -10.22314453125, -9.448486328125, -8.673828125, -7.899169921875, -7.12451171875, -6.349853515625, -5.5751953125, -4.800537109375, -4.02587890625, -3.251220703125, -2.4765625, -1.701904296875, -0.92724609375, -0.152587890625, 0.6220703125, 1.396728515625, 2.17138671875, 2.946044921875, 3.720703125, 4.495361328125, 5.27001953125, 6.044677734375, 6.8193359375, 7.593994140625, 8.36865234375, 9.143310546875, 9.91796875, 10.692626953125, 11.46728515625, 12.241943359375, 13.0166015625, 13.791259765625, 14.56591796875, 15.340576171875, 16.115234375, 16.889892578125, 17.66455078125, 18.439208984375, 19.2138671875, 19.988525390625, 20.76318359375, 21.537841796875, 22.3125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 7.0, 10.0, 11.0, 6.0, 16.0, 21.0, 15.0, 31.0, 21.0, 26.0, 39.0, 30.0, 33.0, 40.0, 37.0, 30.0, 41.0, 43.0, 1058.0, 39.0, 45.0, 34.0, 34.0, 29.0, 32.0, 29.0, 28.0, 30.0, 33.0, 28.0, 16.0, 18.0, 17.0, 17.0, 13.0, 11.0, 9.0, 5.0, 8.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-55.96875, -54.208984375, -52.44921875, -50.689453125, -48.9296875, -47.169921875, -45.41015625, -43.650390625, -41.890625, -40.130859375, -38.37109375, -36.611328125, -34.8515625, -33.091796875, -31.33203125, -29.572265625, -27.8125, -26.052734375, -24.29296875, -22.533203125, -20.7734375, -19.013671875, -17.25390625, -15.494140625, -13.734375, -11.974609375, -10.21484375, -8.455078125, -6.6953125, -4.935546875, -3.17578125, -1.416015625, 0.34375, 2.103515625, 3.86328125, 5.623046875, 7.3828125, 9.142578125, 10.90234375, 12.662109375, 14.421875, 16.181640625, 17.94140625, 19.701171875, 21.4609375, 23.220703125, 24.98046875, 26.740234375, 28.5, 30.259765625, 32.01953125, 33.779296875, 35.5390625, 37.298828125, 39.05859375, 40.818359375, 42.578125, 44.337890625, 46.09765625, 47.857421875, 49.6171875, 51.376953125, 53.13671875, 54.896484375, 56.65625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 10.0, 16.0, 29.0, 35.0, 52.0, 79.0, 131.0, 185.0, 265.0, 368.0, 526.0, 754.0, 1059.0, 1383.0, 2019.0, 2919.0, 4389.0, 6152.0, 9088.0, 13508.0, 20205.0, 30740.0, 46916.0, 72180.0, 116561.0, 1333126.0, 170839.0, 89928.0, 58345.0, 37971.0, 25294.0, 16498.0, 11098.0, 7474.0, 5258.0, 3465.0, 2492.0, 1711.0, 1201.0, 819.0, 606.0, 458.0, 317.0, 212.0, 156.0, 89.0, 76.0, 51.0, 29.0, 20.0, 7.0, 13.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-21.0, -20.338623046875, -19.67724609375, -19.015869140625, -18.3544921875, -17.693115234375, -17.03173828125, -16.370361328125, -15.708984375, -15.047607421875, -14.38623046875, -13.724853515625, -13.0634765625, -12.402099609375, -11.74072265625, -11.079345703125, -10.41796875, -9.756591796875, -9.09521484375, -8.433837890625, -7.7724609375, -7.111083984375, -6.44970703125, -5.788330078125, -5.126953125, -4.465576171875, -3.80419921875, -3.142822265625, -2.4814453125, -1.820068359375, -1.15869140625, -0.497314453125, 0.1640625, 0.825439453125, 1.48681640625, 2.148193359375, 2.8095703125, 3.470947265625, 4.13232421875, 4.793701171875, 5.455078125, 6.116455078125, 6.77783203125, 7.439208984375, 8.1005859375, 8.761962890625, 9.42333984375, 10.084716796875, 10.74609375, 11.407470703125, 12.06884765625, 12.730224609375, 13.3916015625, 14.052978515625, 14.71435546875, 15.375732421875, 16.037109375, 16.698486328125, 17.35986328125, 18.021240234375, 18.6826171875, 19.343994140625, 20.00537109375, 20.666748046875, 21.328125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 9.0, 9.0, 5.0, 15.0, 22.0, 28.0, 32.0, 32.0, 44.0, 52.0, 50.0, 52.0, 68.0, 96.0, 65.0, 64.0, 71.0, 46.0, 41.0, 30.0, 24.0, 23.0, 16.0, 12.0, 17.0, 5.0, 8.0, 6.0, 6.0, 6.0, 6.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0042724609375, -0.004152268171310425, -0.00403207540512085, -0.003911882638931274, -0.0037916898727416992, -0.003671497106552124, -0.003551304340362549, -0.0034311115741729736, -0.0033109188079833984, -0.0031907260417938232, -0.003070533275604248, -0.002950340509414673, -0.0028301477432250977, -0.0027099549770355225, -0.0025897622108459473, -0.002469569444656372, -0.002349376678466797, -0.0022291839122772217, -0.0021089911460876465, -0.0019887983798980713, -0.001868605613708496, -0.001748412847518921, -0.0016282200813293457, -0.0015080273151397705, -0.0013878345489501953, -0.0012676417827606201, -0.001147449016571045, -0.0010272562503814697, -0.0009070634841918945, -0.0007868707180023193, -0.0006666779518127441, -0.0005464851856231689, -0.00042629241943359375, -0.00030609965324401855, -0.00018590688705444336, -6.571412086486816e-05, 5.447864532470703e-05, 0.00017467141151428223, 0.0002948641777038574, 0.0004150569438934326, 0.0005352497100830078, 0.000655442476272583, 0.0007756352424621582, 0.0008958280086517334, 0.0010160207748413086, 0.0011362135410308838, 0.001256406307220459, 0.0013765990734100342, 0.0014967918395996094, 0.0016169846057891846, 0.0017371773719787598, 0.001857370138168335, 0.00197756290435791, 0.0020977556705474854, 0.0022179484367370605, 0.0023381412029266357, 0.002458333969116211, 0.002578526735305786, 0.0026987195014953613, 0.0028189122676849365, 0.0029391050338745117, 0.003059297800064087, 0.003179490566253662, 0.0032996833324432373, 0.0034198760986328125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 3.0, 7.0, 15.0, 18.0, 26.0, 30.0, 42.0, 63.0, 81.0, 119.0, 197.0, 324.0, 482.0, 952.0, 1904.0, 4202.0, 10197.0, 28772.0, 88503.0, 307866.0, 414357.0, 126333.0, 39433.0, 13861.0, 5553.0, 2417.0, 1159.0, 637.0, 361.0, 180.0, 146.0, 93.0, 74.0, 44.0, 26.0, 26.0, 14.0, 9.0, 4.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0205078125, -0.01980423927307129, -0.019100666046142578, -0.018397092819213867, -0.017693519592285156, -0.016989946365356445, -0.016286373138427734, -0.015582799911499023, -0.014879226684570312, -0.014175653457641602, -0.01347208023071289, -0.01276850700378418, -0.012064933776855469, -0.011361360549926758, -0.010657787322998047, -0.009954214096069336, -0.009250640869140625, -0.008547067642211914, -0.007843494415283203, -0.007139921188354492, -0.006436347961425781, -0.00573277473449707, -0.005029201507568359, -0.0043256282806396484, -0.0036220550537109375, -0.0029184818267822266, -0.0022149085998535156, -0.0015113353729248047, -0.0008077621459960938, -0.00010418891906738281, 0.0005993843078613281, 0.001302957534790039, 0.00200653076171875, 0.002710103988647461, 0.003413677215576172, 0.004117250442504883, 0.004820823669433594, 0.005524396896362305, 0.006227970123291016, 0.0069315433502197266, 0.0076351165771484375, 0.008338689804077148, 0.00904226303100586, 0.00974583625793457, 0.010449409484863281, 0.011152982711791992, 0.011856555938720703, 0.012560129165649414, 0.013263702392578125, 0.013967275619506836, 0.014670848846435547, 0.015374422073364258, 0.01607799530029297, 0.01678156852722168, 0.01748514175415039, 0.0181887149810791, 0.018892288208007812, 0.019595861434936523, 0.020299434661865234, 0.021003007888793945, 0.021706581115722656, 0.022410154342651367, 0.023113727569580078, 0.02381730079650879, 0.0245208740234375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 11.0, 12.0, 22.0, 34.0, 42.0, 90.0, 119.0, 143.0, 137.0, 125.0, 86.0, 78.0, 44.0, 34.0, 10.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.008746042847633362, -0.008561247028410435, -0.008376451209187508, -0.00819165538996458, -0.008006859570741653, -0.007822063751518726, -0.007637267932295799, -0.007452472113072872, -0.007267676293849945, -0.007082880474627018, -0.006898084655404091, -0.006713288836181164, -0.006528493016958237, -0.00634369719773531, -0.0061589013785123825, -0.005974105559289455, -0.005789309740066528, -0.005604513920843601, -0.005419718101620674, -0.005234922282397747, -0.00505012646317482, -0.004865330643951893, -0.004680534824728966, -0.004495739005506039, -0.004310943186283112, -0.0041261473670601845, -0.003941351547837257, -0.0037565557286143303, -0.003571759909391403, -0.003386964090168476, -0.003202168270945549, -0.003017372451722622, -0.0028325768653303385, -0.0026477810461074114, -0.0024629852268844843, -0.002278189407661557, -0.00209339358843863, -0.001908597769215703, -0.001723801949992776, -0.0015390061307698488, -0.0013542103115469217, -0.0011694144923239946, -0.0009846186731010675, -0.0007998228538781404, -0.0006150270346552134, -0.00043023121543228626, -0.00024543539620935917, -6.0639576986432076e-05, 0.00012415624223649502, 0.0003089520614594221, 0.0004937478806823492, 0.0006785436999052763, 0.0008633395191282034, 0.0010481353383511305, 0.0012329311575740576, 0.0014177269767969847, 0.0016025227960199118, 0.0017873186152428389, 0.001972114434465766, 0.002156910253688693, 0.00234170607291162, 0.0025265018921345472, 0.0027112977113574743, 0.0028960935305804014, 0.0030808893498033285]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 12.0, 9.0, 9.0, 6.0, 18.0, 16.0, 14.0, 17.0, 23.0, 26.0, 32.0, 37.0, 31.0, 33.0, 33.0, 36.0, 44.0, 31.0, 34.0, 36.0, 38.0, 37.0, 40.0, 38.0, 32.0, 34.0, 36.0, 26.0, 18.0, 24.0, 23.0, 25.0, 18.0, 14.0, 12.0, 17.0, 11.0, 11.0, 4.0, 11.0, 10.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0015822052955627441, -0.0015275003388524055, -0.001472795382142067, -0.0014180904254317284, -0.0013633854687213898, -0.0013086805120110512, -0.0012539755553007126, -0.001199270598590374, -0.0011445656418800354, -0.0010898606851696968, -0.0010351557284593582, -0.0009804507717490196, -0.000925745815038681, -0.0008710408583283424, -0.0008163359016180038, -0.0007616309449076653, -0.0007069259881973267, -0.0006522210314869881, -0.0005975160747766495, -0.0005428111180663109, -0.0004881061613559723, -0.0004334012046456337, -0.0003786962479352951, -0.0003239912912249565, -0.0002692863345146179, -0.00021458137780427933, -0.00015987642109394073, -0.00010517146438360214, -5.046650767326355e-05, 4.238449037075043e-06, 5.8943405747413635e-05, 0.00011364836245775223, 0.00016835331916809082, 0.0002230582758784294, 0.000277763232588768, 0.0003324681892991066, 0.0003871731460094452, 0.0004418781027197838, 0.0004965830594301224, 0.000551288016140461, 0.0006059929728507996, 0.0006606979295611382, 0.0007154028862714767, 0.0007701078429818153, 0.0008248127996921539, 0.0008795177564024925, 0.0009342227131128311, 0.0009889276698231697, 0.0010436326265335083, 0.001098337583243847, 0.0011530425399541855, 0.001207747496664524, 0.0012624524533748627, 0.0013171574100852013, 0.0013718623667955399, 0.0014265673235058784, 0.001481272280216217, 0.0015359772369265556, 0.0015906821936368942, 0.0016453871503472328, 0.0017000921070575714, 0.00175479706376791, 0.0018095020204782486, 0.0018642069771885872, 0.0019189119338989258]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 12.0, 8.0, 13.0, 8.0, 11.0, 15.0, 17.0, 20.0, 22.0, 25.0, 33.0, 27.0, 49.0, 41.0, 39.0, 39.0, 51.0, 36.0, 52.0, 44.0, 44.0, 34.0, 40.0, 40.0, 34.0, 33.0, 27.0, 32.0, 16.0, 24.0, 15.0, 12.0, 16.0, 16.0, 12.0, 5.0, 7.0, 4.0, 6.0, 2.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.1875, -82.2021484375, -79.216796875, -76.2314453125, -73.24609375, -70.2607421875, -67.275390625, -64.2900390625, -61.3046875, -58.3193359375, -55.333984375, -52.3486328125, -49.36328125, -46.3779296875, -43.392578125, -40.4072265625, -37.421875, -34.4365234375, -31.451171875, -28.4658203125, -25.48046875, -22.4951171875, -19.509765625, -16.5244140625, -13.5390625, -10.5537109375, -7.568359375, -4.5830078125, -1.59765625, 1.3876953125, 4.373046875, 7.3583984375, 10.34375, 13.3291015625, 16.314453125, 19.2998046875, 22.28515625, 25.2705078125, 28.255859375, 31.2412109375, 34.2265625, 37.2119140625, 40.197265625, 43.1826171875, 46.16796875, 49.1533203125, 52.138671875, 55.1240234375, 58.109375, 61.0947265625, 64.080078125, 67.0654296875, 70.05078125, 73.0361328125, 76.021484375, 79.0068359375, 81.9921875, 84.9775390625, 87.962890625, 90.9482421875, 93.93359375, 96.9189453125, 99.904296875, 102.8896484375, 105.875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 11.0, 11.0, 13.0, 26.0, 32.0, 39.0, 63.0, 77.0, 131.0, 161.0, 320.0, 487.0, 887.0, 1627.0, 3473.0, 8766.0, 29500.0, 127620.0, 479288.0, 301839.0, 66037.0, 16768.0, 5755.0, 2561.0, 1233.0, 684.0, 408.0, 228.0, 140.0, 108.0, 87.0, 39.0, 37.0, 27.0, 21.0, 10.0, 7.0, 6.0, 9.0, 6.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.796875, -18.186279296875, -17.57568359375, -16.965087890625, -16.3544921875, -15.743896484375, -15.13330078125, -14.522705078125, -13.912109375, -13.301513671875, -12.69091796875, -12.080322265625, -11.4697265625, -10.859130859375, -10.24853515625, -9.637939453125, -9.02734375, -8.416748046875, -7.80615234375, -7.195556640625, -6.5849609375, -5.974365234375, -5.36376953125, -4.753173828125, -4.142578125, -3.531982421875, -2.92138671875, -2.310791015625, -1.7001953125, -1.089599609375, -0.47900390625, 0.131591796875, 0.7421875, 1.352783203125, 1.96337890625, 2.573974609375, 3.1845703125, 3.795166015625, 4.40576171875, 5.016357421875, 5.626953125, 6.237548828125, 6.84814453125, 7.458740234375, 8.0693359375, 8.679931640625, 9.29052734375, 9.901123046875, 10.51171875, 11.122314453125, 11.73291015625, 12.343505859375, 12.9541015625, 13.564697265625, 14.17529296875, 14.785888671875, 15.396484375, 16.007080078125, 16.61767578125, 17.228271484375, 17.8388671875, 18.449462890625, 19.06005859375, 19.670654296875, 20.28125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 3.0, 8.0, 8.0, 12.0, 8.0, 16.0, 19.0, 22.0, 30.0, 30.0, 37.0, 45.0, 48.0, 47.0, 62.0, 50.0, 69.0, 2082.0, 45.0, 39.0, 44.0, 47.0, 38.0, 30.0, 35.0, 31.0, 24.0, 27.0, 19.0, 10.0, 16.0, 12.0, 4.0, 7.0, 11.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-156.625, -151.9375, -147.25, -142.5625, -137.875, -133.1875, -128.5, -123.8125, -119.125, -114.4375, -109.75, -105.0625, -100.375, -95.6875, -91.0, -86.3125, -81.625, -76.9375, -72.25, -67.5625, -62.875, -58.1875, -53.5, -48.8125, -44.125, -39.4375, -34.75, -30.0625, -25.375, -20.6875, -16.0, -11.3125, -6.625, -1.9375, 2.75, 7.4375, 12.125, 16.8125, 21.5, 26.1875, 30.875, 35.5625, 40.25, 44.9375, 49.625, 54.3125, 59.0, 63.6875, 68.375, 73.0625, 77.75, 82.4375, 87.125, 91.8125, 96.5, 101.1875, 105.875, 110.5625, 115.25, 119.9375, 124.625, 129.3125, 134.0, 138.6875, 143.375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 9.0, 5.0, 7.0, 9.0, 6.0, 9.0, 11.0, 17.0, 27.0, 37.0, 36.0, 56.0, 81.0, 131.0, 166.0, 262.0, 363.0, 579.0, 910.0, 1821.0, 5193.0, 24970.0, 228391.0, 2743818.0, 116558.0, 14604.0, 3704.0, 1468.0, 831.0, 483.0, 355.0, 241.0, 146.0, 109.0, 76.0, 48.0, 42.0, 21.0, 24.0, 18.0, 17.0, 7.0, 6.0, 8.0, 8.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-28.484375, -27.63037109375, -26.7763671875, -25.92236328125, -25.068359375, -24.21435546875, -23.3603515625, -22.50634765625, -21.65234375, -20.79833984375, -19.9443359375, -19.09033203125, -18.236328125, -17.38232421875, -16.5283203125, -15.67431640625, -14.8203125, -13.96630859375, -13.1123046875, -12.25830078125, -11.404296875, -10.55029296875, -9.6962890625, -8.84228515625, -7.98828125, -7.13427734375, -6.2802734375, -5.42626953125, -4.572265625, -3.71826171875, -2.8642578125, -2.01025390625, -1.15625, -0.30224609375, 0.5517578125, 1.40576171875, 2.259765625, 3.11376953125, 3.9677734375, 4.82177734375, 5.67578125, 6.52978515625, 7.3837890625, 8.23779296875, 9.091796875, 9.94580078125, 10.7998046875, 11.65380859375, 12.5078125, 13.36181640625, 14.2158203125, 15.06982421875, 15.923828125, 16.77783203125, 17.6318359375, 18.48583984375, 19.33984375, 20.19384765625, 21.0478515625, 21.90185546875, 22.755859375, 23.60986328125, 24.4638671875, 25.31787109375, 26.171875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 29.0, 83.0, 180.0, 259.0, 217.0, 121.0, 37.0, 26.0, 14.0, 7.0, 1.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-159.02296447753906, -145.42848205566406, -131.83401489257812, -118.23953247070312, -104.64506530761719, -91.05058288574219, -77.45610809326172, -63.86163330078125, -50.26715850830078, -36.67268371582031, -23.07820701599121, -9.48373031616211, 4.110744476318359, 17.705223083496094, 31.299697875976562, 44.89417266845703, 58.4886474609375, 72.08312225341797, 85.67759704589844, 99.27207946777344, 112.86654663085938, 126.46102905273438, 140.05551147460938, 153.6499786376953, 167.24444580078125, 180.83892822265625, 194.4333953857422, 208.0278778076172, 221.62234497070312, 235.21682739257812, 248.81130981445312, 262.40576171875, 276.0002746582031, 289.5947570800781, 303.1892395019531, 316.78369140625, 330.378173828125, 343.97265625, 357.567138671875, 371.16162109375, 384.7560729980469, 398.3505554199219, 411.9450378417969, 425.53948974609375, 439.13397216796875, 452.72845458984375, 466.32293701171875, 479.91741943359375, 493.51190185546875, 507.10638427734375, 520.7008666992188, 534.2953491210938, 547.8898315429688, 561.4842529296875, 575.0787353515625, 588.6732177734375, 602.2677001953125, 615.8621826171875, 629.4566650390625, 643.0511474609375, 656.6456298828125, 670.2401123046875, 683.8345336914062, 697.4290161132812, 711.0234985351562]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 6.0, 5.0, 13.0, 9.0, 20.0, 19.0, 25.0, 22.0, 30.0, 36.0, 32.0, 28.0, 34.0, 50.0, 51.0, 55.0, 48.0, 60.0, 51.0, 38.0, 40.0, 47.0, 39.0, 35.0, 32.0, 29.0, 25.0, 23.0, 26.0, 20.0, 8.0, 13.0, 13.0, 6.0, 5.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-203.40155029296875, -197.100830078125, -190.80010986328125, -184.4993896484375, -178.1986541748047, -171.89793395996094, -165.5972137451172, -159.29649353027344, -152.99575805664062, -146.69503784179688, -140.39431762695312, -134.09359741210938, -127.79286193847656, -121.49214172363281, -115.19142150878906, -108.89070129394531, -102.58998107910156, -96.28926086425781, -89.98853302001953, -83.68781280517578, -77.3870849609375, -71.08636474609375, -64.78564453125, -58.484920501708984, -52.18419647216797, -45.88347244262695, -39.58274841308594, -33.28202819824219, -26.981304168701172, -20.680580139160156, -14.379859924316406, -8.07913589477539, -1.7784271240234375, 4.522295951843262, 10.823019027709961, 17.123741149902344, 23.42446517944336, 29.725189208984375, 36.025909423828125, 42.32663345336914, 48.627357482910156, 54.92808151245117, 61.22880554199219, 67.52952575683594, 73.83024597167969, 80.13097381591797, 86.43169403076172, 92.732421875, 99.03314208984375, 105.3338623046875, 111.63459014892578, 117.93531036376953, 124.23603820800781, 130.53675842285156, 136.8374786376953, 143.13819885253906, 149.43893432617188, 155.73965454101562, 162.04037475585938, 168.34109497070312, 174.64183044433594, 180.9425506591797, 187.24327087402344, 193.5439910888672, 199.84471130371094]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 9.0, 18.0, 17.0, 36.0, 46.0, 75.0, 116.0, 148.0, 236.0, 379.0, 525.0, 764.0, 1112.0, 1549.0, 2414.0, 3534.0, 5849.0, 1017226.0, 4817.0, 3088.0, 2148.0, 1416.0, 1010.0, 609.0, 438.0, 294.0, 220.0, 146.0, 92.0, 58.0, 63.0, 36.0, 21.0, 16.0, 7.0, 8.0, 5.0, 2.0, 0.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.07732009887695, -33.693241119384766, -32.30916213989258, -30.925085067749023, -29.54100799560547, -28.15692901611328, -26.772850036621094, -25.388771057128906, -24.00469398498535, -22.620615005493164, -21.23653793334961, -19.852458953857422, -18.468379974365234, -17.08430290222168, -15.700223922729492, -14.316145896911621, -12.93206787109375, -11.547989845275879, -10.163911819458008, -8.77983283996582, -7.395754814147949, -6.011676788330078, -4.627597808837891, -3.2435197830200195, -1.8594417572021484, -0.47536349296569824, 0.908714771270752, 2.2927932739257812, 3.6768712997436523, 5.060949325561523, 6.445028305053711, 7.829106330871582, 9.213188171386719, 10.59726619720459, 11.981344223022461, 13.365423202514648, 14.74950122833252, 16.13357925415039, 17.517658233642578, 18.901737213134766, 20.28581428527832, 21.669893264770508, 23.053970336914062, 24.43804931640625, 25.822128295898438, 27.206205368041992, 28.59028434753418, 29.974361419677734, 31.358440399169922, 32.74251937866211, 34.1265983581543, 35.51067352294922, 36.894752502441406, 38.278831481933594, 39.66291046142578, 41.04698944091797, 42.431068420410156, 43.815147399902344, 45.19922637939453, 46.58330535888672, 47.96738052368164, 49.35145950317383, 50.735538482666016, 52.1196174621582, 53.503692626953125]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 13.0, 32.0, 70.0, 94.0, 168.0, 34792.0, 51429804.0, 197.0, 55.0, 33.0, 29.0, 38.0, 27.0, 26.0, 19.0, 8.0, 9.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8377.4619140625, -8042.63916015625, -7707.81640625, -7372.99365234375, -7038.1708984375, -6703.34765625, -6368.52490234375, -6033.7021484375, -5698.87939453125, -5364.056640625, -5029.23388671875, -4694.4111328125, -4359.587890625, -4024.765380859375, -3689.9423828125, -3355.11962890625, -3020.296875, -2685.47412109375, -2350.6513671875, -2015.828369140625, -1681.005615234375, -1346.182861328125, -1011.3599853515625, -676.537109375, -341.71435546875, -6.89154052734375, 327.9312744140625, 662.7540893554688, 997.576904296875, 1332.399658203125, 1667.2225341796875, 2002.04541015625, 2336.8671875, 2671.68994140625, 3006.5126953125, 3341.335693359375, 3676.158447265625, 4010.981201171875, 4345.80419921875, 4680.626953125, 5015.44970703125, 5350.2724609375, 5685.09521484375, 6019.91796875, 6354.7412109375, 6689.5634765625, 7024.38671875, 7359.20947265625, 7694.0322265625, 8028.85498046875, 8363.677734375, 8698.5009765625, 9033.3232421875, 9368.146484375, 9702.96875, 10037.7919921875, 10372.615234375, 10707.4384765625, 11042.2607421875, 11377.083984375, 11711.90625, 12046.7294921875, 12381.5517578125, 12716.375, 13051.197265625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 5.0, 4.0, 11.0, 13.0, 25.0, 37.0, 63.0, 93.0, 124.0, 199.0, 235.0, 366.0, 603.0, 819.0, 1173.0, 1640.0, 2453.0, 3507.0, 5422.0, 7626.0, 11444.0, 16883.0, 25605.0, 37473.0, 58535.0, 88931.0, 142680.0, 243272.0, 587873.0, 3854257.0, 560189.0, 236408.0, 141051.0, 89528.0, 58309.0, 37847.0, 24960.0, 16963.0, 11161.0, 7599.0, 4988.0, 3421.0, 2355.0, 1586.0, 1229.0, 723.0, 545.0, 369.0, 275.0, 192.0, 121.0, 80.0, 64.0, 35.0, 28.0, 24.0, 5.0, 12.0, 5.0, 6.0], "bins": [-10.4921875, -10.1788330078125, -9.865478515625, -9.5521240234375, -9.23876953125, -8.9254150390625, -8.612060546875, -8.2987060546875, -7.9853515625, -7.6719970703125, -7.358642578125, -7.0452880859375, -6.73193359375, -6.4185791015625, -6.105224609375, -5.7918701171875, -5.478515625, -5.1651611328125, -4.851806640625, -4.5384521484375, -4.22509765625, -3.9117431640625, -3.598388671875, -3.2850341796875, -2.9716796875, -2.6583251953125, -2.344970703125, -2.0316162109375, -1.71826171875, -1.4049072265625, -1.091552734375, -0.7781982421875, -0.46484375, -0.1514892578125, 0.161865234375, 0.4752197265625, 0.78857421875, 1.1019287109375, 1.415283203125, 1.7286376953125, 2.0419921875, 2.3553466796875, 2.668701171875, 2.9820556640625, 3.29541015625, 3.6087646484375, 3.922119140625, 4.2354736328125, 4.548828125, 4.8621826171875, 5.175537109375, 5.4888916015625, 5.80224609375, 6.1156005859375, 6.428955078125, 6.7423095703125, 7.0556640625, 7.3690185546875, 7.682373046875, 7.9957275390625, 8.30908203125, 8.6224365234375, 8.935791015625, 9.2491455078125, 9.5625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 12.0, 13.0, 9.0, 10.0, 18.0, 12.0, 10.0, 24.0, 27.0, 18.0, 21.0, 25.0, 25.0, 27.0, 35.0, 46.0, 52.0, 101.0, 209.0, 598.0, 173.0, 110.0, 56.0, 32.0, 29.0, 38.0, 28.0, 35.0, 41.0, 27.0, 28.0, 20.0, 17.0, 20.0, 8.0, 7.0, 14.0, 8.0, 10.0, 2.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.265625, -17.6669921875, -17.068359375, -16.4697265625, -15.87109375, -15.2724609375, -14.673828125, -14.0751953125, -13.4765625, -12.8779296875, -12.279296875, -11.6806640625, -11.08203125, -10.4833984375, -9.884765625, -9.2861328125, -8.6875, -8.0888671875, -7.490234375, -6.8916015625, -6.29296875, -5.6943359375, -5.095703125, -4.4970703125, -3.8984375, -3.2998046875, -2.701171875, -2.1025390625, -1.50390625, -0.9052734375, -0.306640625, 0.2919921875, 0.890625, 1.4892578125, 2.087890625, 2.6865234375, 3.28515625, 3.8837890625, 4.482421875, 5.0810546875, 5.6796875, 6.2783203125, 6.876953125, 7.4755859375, 8.07421875, 8.6728515625, 9.271484375, 9.8701171875, 10.46875, 11.0673828125, 11.666015625, 12.2646484375, 12.86328125, 13.4619140625, 14.060546875, 14.6591796875, 15.2578125, 15.8564453125, 16.455078125, 17.0537109375, 17.65234375, 18.2509765625, 18.849609375, 19.4482421875, 20.046875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 6.0, 3.0, 15.0, 12.0, 15.0, 21.0, 47.0, 53.0, 93.0, 149.0, 197.0, 286.0, 445.0, 615.0, 974.0, 1484.0, 2355.0, 3606.0, 5354.0, 8402.0, 12873.0, 19991.0, 31225.0, 50276.0, 83745.0, 144959.0, 282325.0, 869526.0, 3814000.0, 463680.0, 203623.0, 112426.0, 65549.0, 40191.0, 25679.0, 16676.0, 10613.0, 6868.0, 4533.0, 2945.0, 1902.0, 1256.0, 793.0, 576.0, 325.0, 236.0, 167.0, 152.0, 57.0, 38.0, 37.0, 22.0, 15.0, 17.0, 7.0, 1.0, 8.0, 0.0, 0.0, 6.0], "bins": [-11.3984375, -11.0452880859375, -10.692138671875, -10.3389892578125, -9.98583984375, -9.6326904296875, -9.279541015625, -8.9263916015625, -8.5732421875, -8.2200927734375, -7.866943359375, -7.5137939453125, -7.16064453125, -6.8074951171875, -6.454345703125, -6.1011962890625, -5.748046875, -5.3948974609375, -5.041748046875, -4.6885986328125, -4.33544921875, -3.9822998046875, -3.629150390625, -3.2760009765625, -2.9228515625, -2.5697021484375, -2.216552734375, -1.8634033203125, -1.51025390625, -1.1571044921875, -0.803955078125, -0.4508056640625, -0.09765625, 0.2554931640625, 0.608642578125, 0.9617919921875, 1.31494140625, 1.6680908203125, 2.021240234375, 2.3743896484375, 2.7275390625, 3.0806884765625, 3.433837890625, 3.7869873046875, 4.14013671875, 4.4932861328125, 4.846435546875, 5.1995849609375, 5.552734375, 5.9058837890625, 6.259033203125, 6.6121826171875, 6.96533203125, 7.3184814453125, 7.671630859375, 8.0247802734375, 8.3779296875, 8.7310791015625, 9.084228515625, 9.4373779296875, 9.79052734375, 10.1436767578125, 10.496826171875, 10.8499755859375, 11.203125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 10.0, 9.0, 7.0, 8.0, 12.0, 6.0, 22.0, 11.0, 18.0, 14.0, 23.0, 18.0, 25.0, 30.0, 41.0, 31.0, 41.0, 71.0, 88.0, 162.0, 418.0, 356.0, 130.0, 67.0, 49.0, 54.0, 39.0, 37.0, 27.0, 18.0, 34.0, 24.0, 23.0, 23.0, 10.0, 11.0, 16.0, 10.0, 8.0, 8.0, 6.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.6875, -15.2254638671875, -14.763427734375, -14.3013916015625, -13.83935546875, -13.3773193359375, -12.915283203125, -12.4532470703125, -11.9912109375, -11.5291748046875, -11.067138671875, -10.6051025390625, -10.14306640625, -9.6810302734375, -9.218994140625, -8.7569580078125, -8.294921875, -7.8328857421875, -7.370849609375, -6.9088134765625, -6.44677734375, -5.9847412109375, -5.522705078125, -5.0606689453125, -4.5986328125, -4.1365966796875, -3.674560546875, -3.2125244140625, -2.75048828125, -2.2884521484375, -1.826416015625, -1.3643798828125, -0.90234375, -0.4403076171875, 0.021728515625, 0.4837646484375, 0.94580078125, 1.4078369140625, 1.869873046875, 2.3319091796875, 2.7939453125, 3.2559814453125, 3.718017578125, 4.1800537109375, 4.64208984375, 5.1041259765625, 5.566162109375, 6.0281982421875, 6.490234375, 6.9522705078125, 7.414306640625, 7.8763427734375, 8.33837890625, 8.8004150390625, 9.262451171875, 9.7244873046875, 10.1865234375, 10.6485595703125, 11.110595703125, 11.5726318359375, 12.03466796875, 12.4967041015625, 12.958740234375, 13.4207763671875, 13.8828125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 8.0, 6.0, 3.0, 24.0, 12.0, 8.0, 25.0, 13.0, 34.0, 55.0, 62.0, 85.0, 81.0, 90.0, 206.0, 266.0, 317.0, 410.0, 441.0, 669.0, 1008.0, 1212.0, 1849.0, 3122.0, 5180.0, 10196.0, 20968.0, 56548.0, 487228.0, 5591005.0, 61677.0, 22469.0, 10323.0, 5459.0, 3325.0, 2020.0, 1369.0, 894.0, 718.0, 484.0, 382.0, 246.0, 158.0, 177.0, 152.0, 110.0, 70.0, 44.0, 23.0, 62.0, 48.0, 41.0, 26.0, 14.0, 15.0, 0.0, 6.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-29.9375, -28.97265625, -28.0078125, -27.04296875, -26.078125, -25.11328125, -24.1484375, -23.18359375, -22.21875, -21.25390625, -20.2890625, -19.32421875, -18.359375, -17.39453125, -16.4296875, -15.46484375, -14.5, -13.53515625, -12.5703125, -11.60546875, -10.640625, -9.67578125, -8.7109375, -7.74609375, -6.78125, -5.81640625, -4.8515625, -3.88671875, -2.921875, -1.95703125, -0.9921875, -0.02734375, 0.9375, 1.90234375, 2.8671875, 3.83203125, 4.796875, 5.76171875, 6.7265625, 7.69140625, 8.65625, 9.62109375, 10.5859375, 11.55078125, 12.515625, 13.48046875, 14.4453125, 15.41015625, 16.375, 17.33984375, 18.3046875, 19.26953125, 20.234375, 21.19921875, 22.1640625, 23.12890625, 24.09375, 25.05859375, 26.0234375, 26.98828125, 27.953125, 28.91796875, 29.8828125, 30.84765625, 31.8125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 1.0, 5.0, 5.0, 6.0, 11.0, 9.0, 4.0, 7.0, 17.0, 15.0, 22.0, 21.0, 23.0, 29.0, 24.0, 37.0, 42.0, 52.0, 62.0, 106.0, 161.0, 300.0, 396.0, 151.0, 64.0, 60.0, 59.0, 35.0, 33.0, 31.0, 30.0, 37.0, 26.0, 16.0, 16.0, 23.0, 18.0, 13.0, 16.0, 6.0, 4.0, 5.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3359375, -10.0030517578125, -9.670166015625, -9.3372802734375, -9.00439453125, -8.6715087890625, -8.338623046875, -8.0057373046875, -7.6728515625, -7.3399658203125, -7.007080078125, -6.6741943359375, -6.34130859375, -6.0084228515625, -5.675537109375, -5.3426513671875, -5.009765625, -4.6768798828125, -4.343994140625, -4.0111083984375, -3.67822265625, -3.3453369140625, -3.012451171875, -2.6795654296875, -2.3466796875, -2.0137939453125, -1.680908203125, -1.3480224609375, -1.01513671875, -0.6822509765625, -0.349365234375, -0.0164794921875, 0.31640625, 0.6492919921875, 0.982177734375, 1.3150634765625, 1.64794921875, 1.9808349609375, 2.313720703125, 2.6466064453125, 2.9794921875, 3.3123779296875, 3.645263671875, 3.9781494140625, 4.31103515625, 4.6439208984375, 4.976806640625, 5.3096923828125, 5.642578125, 5.9754638671875, 6.308349609375, 6.6412353515625, 6.97412109375, 7.3070068359375, 7.639892578125, 7.9727783203125, 8.3056640625, 8.6385498046875, 8.971435546875, 9.3043212890625, 9.63720703125, 9.9700927734375, 10.302978515625, 10.6358642578125, 10.96875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 0.0, 3.0, 17.0, 22.0, 87.0, 226.0, 459.0, 111.0, 44.0, 17.0, 11.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-113.41607666015625, -111.28523254394531, -109.15438842773438, -107.02354431152344, -104.8927001953125, -102.76184844970703, -100.6310043334961, -98.50016021728516, -96.36931610107422, -94.23847198486328, -92.10762786865234, -89.9767837524414, -87.84593200683594, -85.715087890625, -83.58424377441406, -81.45339965820312, -79.32255554199219, -77.19171142578125, -75.06086730957031, -72.93002319335938, -70.79917907714844, -68.66832733154297, -66.53748321533203, -64.4066390991211, -62.275794982910156, -60.14495086669922, -58.01410675048828, -55.88325881958008, -53.75241470336914, -51.6215705871582, -49.49072265625, -47.35987854003906, -45.229042053222656, -43.09819793701172, -40.96735382080078, -38.83650588989258, -36.70566177368164, -34.5748176574707, -32.4439697265625, -30.313125610351562, -28.182281494140625, -26.051437377929688, -23.920591354370117, -21.789745330810547, -19.65890121459961, -17.528057098388672, -15.397211074829102, -13.266366004943848, -11.135520935058594, -9.00467586517334, -6.873830795288086, -4.742985725402832, -2.612140655517578, -0.4812955856323242, 1.6495494842529297, 3.7803945541381836, 5.9112396240234375, 8.042084693908691, 10.172929763793945, 12.3037748336792, 14.434619903564453, 16.56546401977539, 18.69631004333496, 20.82715606689453, 22.95800018310547]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 4.0, 7.0, 8.0, 13.0, 10.0, 9.0, 7.0, 18.0, 15.0, 19.0, 20.0, 24.0, 27.0, 40.0, 39.0, 38.0, 41.0, 35.0, 45.0, 48.0, 49.0, 46.0, 42.0, 29.0, 46.0, 48.0, 34.0, 36.0, 37.0, 27.0, 23.0, 19.0, 21.0, 16.0, 15.0, 7.0, 7.0, 14.0, 4.0, 6.0, 1.0, 6.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.135906219482422, -17.60097312927246, -17.0660400390625, -16.53110694885254, -15.996174812316895, -15.461241722106934, -14.926309585571289, -14.391376495361328, -13.856443405151367, -13.321510314941406, -12.786577224731445, -12.2516450881958, -11.71671199798584, -11.181778907775879, -10.646846771240234, -10.111913681030273, -9.576980590820312, -9.042047500610352, -8.50711441040039, -7.972182273864746, -7.437249183654785, -6.902316093444824, -6.3673834800720215, -5.832450866699219, -5.297517776489258, -4.762584686279297, -4.227652072906494, -3.6927192211151123, -3.1577863693237305, -2.6228535175323486, -2.087920665740967, -1.552987813949585, -1.0180530548095703, -0.4831202030181885, 0.05181264877319336, 0.5867455005645752, 1.121678352355957, 1.6566112041473389, 2.1915440559387207, 2.7264769077301025, 3.2614097595214844, 3.796342611312866, 4.331275463104248, 4.866208076477051, 5.401141166687012, 5.936074256896973, 6.471006870269775, 7.005939483642578, 7.540872573852539, 8.0758056640625, 8.610738754272461, 9.145670890808105, 9.680603981018066, 10.215537071228027, 10.750469207763672, 11.285402297973633, 11.820335388183594, 12.355268478393555, 12.890201568603516, 13.42513370513916, 13.960066795349121, 14.494999885559082, 15.029932022094727, 15.564865112304688, 16.09979820251465]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 1.0, 4.0, 3.0, 7.0, 12.0, 14.0, 15.0, 25.0, 36.0, 53.0, 68.0, 124.0, 172.0, 280.0, 440.0, 712.0, 1191.0, 2115.0, 3895.0, 8197.0, 20380.0, 4058996.0, 74234.0, 12005.0, 5033.0, 2470.0, 1368.0, 791.0, 499.0, 359.0, 226.0, 143.0, 104.0, 85.0, 48.0, 39.0, 43.0, 24.0, 16.0, 10.0, 10.0, 12.0, 7.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0311431884765625, -0.02988886833190918, -0.02863454818725586, -0.02738022804260254, -0.02612590789794922, -0.0248715877532959, -0.023617267608642578, -0.022362947463989258, -0.021108627319335938, -0.019854307174682617, -0.018599987030029297, -0.017345666885375977, -0.016091346740722656, -0.014837026596069336, -0.013582706451416016, -0.012328386306762695, -0.011074066162109375, -0.009819746017456055, -0.008565425872802734, -0.007311105728149414, -0.006056785583496094, -0.0048024654388427734, -0.003548145294189453, -0.002293825149536133, -0.0010395050048828125, 0.0002148151397705078, 0.0014691352844238281, 0.0027234554290771484, 0.003977775573730469, 0.005232095718383789, 0.006486415863037109, 0.00774073600769043, 0.00899505615234375, 0.01024937629699707, 0.01150369644165039, 0.012758016586303711, 0.014012336730957031, 0.015266656875610352, 0.016520977020263672, 0.017775297164916992, 0.019029617309570312, 0.020283937454223633, 0.021538257598876953, 0.022792577743530273, 0.024046897888183594, 0.025301218032836914, 0.026555538177490234, 0.027809858322143555, 0.029064178466796875, 0.030318498611450195, 0.031572818756103516, 0.032827138900756836, 0.034081459045410156, 0.03533577919006348, 0.0365900993347168, 0.03784441947937012, 0.03909873962402344, 0.04035305976867676, 0.04160737991333008, 0.0428617000579834, 0.04411602020263672, 0.04537034034729004, 0.04662466049194336, 0.04787898063659668, 0.04913330078125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 1.0, 3.0, 7.0, 7.0, 2.0, 13.0, 7.0, 10.0, 9.0, 19.0, 14.0, 112.0, 662.0, 44.0, 11.0, 14.0, 8.0, 10.0, 5.0, 6.0, 7.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019044876098632812, -0.0018287450075149536, -0.001753002405166626, -0.0016772598028182983, -0.0016015172004699707, -0.001525774598121643, -0.0014500319957733154, -0.0013742893934249878, -0.0012985467910766602, -0.0012228041887283325, -0.0011470615863800049, -0.0010713189840316772, -0.0009955763816833496, -0.000919833779335022, -0.0008440911769866943, -0.0007683485746383667, -0.0006926059722900391, -0.0006168633699417114, -0.0005411207675933838, -0.00046537816524505615, -0.0003896355628967285, -0.0003138929605484009, -0.00023815035820007324, -0.0001624077558517456, -8.666515350341797e-05, -1.0922551155090332e-05, 6.48200511932373e-05, 0.00014056265354156494, 0.00021630525588989258, 0.0002920478582382202, 0.00036779046058654785, 0.0004435330629348755, 0.0005192756652832031, 0.0005950182676315308, 0.0006707608699798584, 0.000746503472328186, 0.0008222460746765137, 0.0008979886770248413, 0.0009737312793731689, 0.0010494738817214966, 0.0011252164840698242, 0.0012009590864181519, 0.0012767016887664795, 0.0013524442911148071, 0.0014281868934631348, 0.0015039294958114624, 0.00157967209815979, 0.0016554147005081177, 0.0017311573028564453, 0.001806899905204773, 0.0018826425075531006, 0.0019583851099014282, 0.002034127712249756, 0.0021098703145980835, 0.002185612916946411, 0.0022613555192947388, 0.0023370981216430664, 0.002412840723991394, 0.0024885833263397217, 0.0025643259286880493, 0.002640068531036377, 0.0027158111333847046, 0.0027915537357330322, 0.00286729633808136, 0.0029430389404296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 5.0, 6.0, 12.0, 18.0, 12.0, 42.0, 51.0, 41.0, 74.0, 113.0, 155.0, 248.0, 365.0, 586.0, 1108.0, 2006.0, 4913.0, 17302.0, 202003.0, 3916176.0, 35511.0, 7264.0, 2856.0, 1328.0, 784.0, 394.0, 266.0, 184.0, 134.0, 83.0, 60.0, 49.0, 30.0, 32.0, 24.0, 9.0, 10.0, 8.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050994873046875, -0.04930591583251953, -0.04761695861816406, -0.045928001403808594, -0.044239044189453125, -0.042550086975097656, -0.04086112976074219, -0.03917217254638672, -0.03748321533203125, -0.03579425811767578, -0.03410530090332031, -0.032416343688964844, -0.030727386474609375, -0.029038429260253906, -0.027349472045898438, -0.02566051483154297, -0.0239715576171875, -0.02228260040283203, -0.020593643188476562, -0.018904685974121094, -0.017215728759765625, -0.015526771545410156, -0.013837814331054688, -0.012148857116699219, -0.01045989990234375, -0.008770942687988281, -0.0070819854736328125, -0.005393028259277344, -0.003704071044921875, -0.0020151138305664062, -0.0003261566162109375, 0.0013628005981445312, 0.0030517578125, 0.004740715026855469, 0.0064296722412109375, 0.008118629455566406, 0.009807586669921875, 0.011496543884277344, 0.013185501098632812, 0.014874458312988281, 0.01656341552734375, 0.01825237274169922, 0.019941329956054688, 0.021630287170410156, 0.023319244384765625, 0.025008201599121094, 0.026697158813476562, 0.02838611602783203, 0.0300750732421875, 0.03176403045654297, 0.03345298767089844, 0.035141944885253906, 0.036830902099609375, 0.038519859313964844, 0.04020881652832031, 0.04189777374267578, 0.04358673095703125, 0.04527568817138672, 0.04696464538574219, 0.048653602600097656, 0.050342559814453125, 0.052031517028808594, 0.05372047424316406, 0.05540943145751953, 0.057098388671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 3.0, 6.0, 6.0, 12.0, 13.0, 13.0, 6.0, 17.0, 10.0, 22.0, 35.0, 31.0, 36.0, 44.0, 54.0, 75.0, 123.0, 365.0, 2483.0, 280.0, 84.0, 64.0, 38.0, 44.0, 31.0, 30.0, 30.0, 24.0, 18.0, 13.0, 13.0, 8.0, 10.0, 11.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004741668701171875, -0.004574477672576904, -0.004407286643981934, -0.004240095615386963, -0.004072904586791992, -0.0039057135581970215, -0.0037385225296020508, -0.00357133150100708, -0.0034041404724121094, -0.0032369494438171387, -0.003069758415222168, -0.0029025673866271973, -0.0027353763580322266, -0.002568185329437256, -0.002400994300842285, -0.0022338032722473145, -0.0020666122436523438, -0.001899421215057373, -0.0017322301864624023, -0.0015650391578674316, -0.001397848129272461, -0.0012306571006774902, -0.0010634660720825195, -0.0008962750434875488, -0.0007290840148925781, -0.0005618929862976074, -0.0003947019577026367, -0.00022751092910766602, -6.031990051269531e-05, 0.00010687112808227539, 0.0002740621566772461, 0.0004412531852722168, 0.0006084442138671875, 0.0007756352424621582, 0.0009428262710571289, 0.0011100172996520996, 0.0012772083282470703, 0.001444399356842041, 0.0016115903854370117, 0.0017787814140319824, 0.0019459724426269531, 0.002113163471221924, 0.0022803544998168945, 0.0024475455284118652, 0.002614736557006836, 0.0027819275856018066, 0.0029491186141967773, 0.003116309642791748, 0.0032835006713867188, 0.0034506916999816895, 0.00361788272857666, 0.003785073757171631, 0.0039522647857666016, 0.004119455814361572, 0.004286646842956543, 0.004453837871551514, 0.004621028900146484, 0.004788219928741455, 0.004955410957336426, 0.0051226019859313965, 0.005289793014526367, 0.005456984043121338, 0.005624175071716309, 0.005791366100311279, 0.00595855712890625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 10.0, 15.0, 12.0, 47.0, 175.0, 570.0, 100.0, 42.0, 15.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.11550533771514893, -0.112838976085186, -0.11017262190580368, -0.10750626027584076, -0.10483989864587784, -0.10217353701591492, -0.09950718283653259, -0.09684082120656967, -0.09417445957660675, -0.09150809794664383, -0.0888417437672615, -0.08617538213729858, -0.08350902050733566, -0.08084265887737274, -0.07817630469799042, -0.0755099430680275, -0.07284358888864517, -0.07017722725868225, -0.06751087307929993, -0.064844511449337, -0.062178149819374084, -0.05951179191470146, -0.05684543401002884, -0.05417907238006592, -0.051512714475393295, -0.04884635657072067, -0.04617999494075775, -0.04351363703608513, -0.040847279131412506, -0.038180917501449585, -0.03551455959677696, -0.03284820169210434, -0.030181847512722015, -0.027515487745404243, -0.02484912797808647, -0.02218277007341385, -0.019516410306096077, -0.016850050538778305, -0.014183692634105682, -0.01151733286678791, -0.008850973099470139, -0.006184613797813654, -0.0035182544961571693, -0.000851895660161972, 0.0018144641071557999, 0.004480823874473572, 0.0071471817791461945, 0.009813541546463966, 0.012479901313781738, 0.01514626108109951, 0.017812620848417282, 0.020478978753089905, 0.023145338520407677, 0.02581169828772545, 0.02847805619239807, 0.031144415959715843, 0.033810775727033615, 0.03647713363170624, 0.03914349526166916, 0.04180985316634178, 0.044476211071014404, 0.047142572700977325, 0.04980893060564995, 0.05247528851032257, 0.05514165014028549]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 11.0, 11.0, 11.0, 14.0, 11.0, 25.0, 28.0, 30.0, 45.0, 50.0, 52.0, 57.0, 50.0, 73.0, 67.0, 61.0, 60.0, 52.0, 52.0, 45.0, 28.0, 41.0, 30.0, 17.0, 14.0, 8.0, 13.0, 7.0, 5.0, 3.0, 6.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.022283852100372314, -0.021612493321299553, -0.02094113454222679, -0.02026977576315403, -0.01959841698408127, -0.018927058205008507, -0.018255699425935745, -0.017584340646862984, -0.016912981867790222, -0.01624162308871746, -0.015570264309644699, -0.014898905530571938, -0.014227546751499176, -0.013556187972426414, -0.012884829193353653, -0.012213470414280891, -0.01154211163520813, -0.010870752856135368, -0.010199394077062607, -0.009528035297989845, -0.008856676518917084, -0.008185317739844322, -0.007513958960771561, -0.006842600181698799, -0.006171241402626038, -0.005499882623553276, -0.0048285238444805145, -0.004157165065407753, -0.0034858062863349915, -0.00281444750726223, -0.0021430887281894684, -0.0014717299491167068, -0.0008003711700439453, -0.00012901239097118378, 0.0005423463881015778, 0.0012137051671743393, 0.0018850639462471008, 0.0025564227253198624, 0.003227781504392624, 0.0038991402834653854, 0.004570499062538147, 0.0052418578416109085, 0.00591321662068367, 0.006584575399756432, 0.007255934178829193, 0.007927292957901955, 0.008598651736974716, 0.009270010516047478, 0.00994136929512024, 0.010612728074193, 0.011284086853265762, 0.011955445632338524, 0.012626804411411285, 0.013298163190484047, 0.013969521969556808, 0.01464088074862957, 0.015312239527702332, 0.015983598306775093, 0.016654957085847855, 0.017326315864920616, 0.017997674643993378, 0.01866903342306614, 0.0193403922021389, 0.020011750981211662, 0.020683109760284424]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 10.0, 22.0, 10.0, 37.0, 33.0, 53.0, 89.0, 101.0, 160.0, 217.0, 362.0, 554.0, 847.0, 1392.0, 2352.0, 4054.0, 7583.0, 16275.0, 59601.0, 904031.0, 26712.0, 10831.0, 5423.0, 2910.0, 1756.0, 1051.0, 691.0, 408.0, 304.0, 183.0, 166.0, 103.0, 58.0, 53.0, 31.0, 18.0, 25.0, 14.0, 6.0, 6.0, 9.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.03564453125, -0.034539222717285156, -0.03343391418457031, -0.03232860565185547, -0.031223297119140625, -0.03011798858642578, -0.029012680053710938, -0.027907371520996094, -0.02680206298828125, -0.025696754455566406, -0.024591445922851562, -0.02348613739013672, -0.022380828857421875, -0.02127552032470703, -0.020170211791992188, -0.019064903259277344, -0.0179595947265625, -0.016854286193847656, -0.015748977661132812, -0.014643669128417969, -0.013538360595703125, -0.012433052062988281, -0.011327743530273438, -0.010222434997558594, -0.00911712646484375, -0.008011817932128906, -0.0069065093994140625, -0.005801200866699219, -0.004695892333984375, -0.0035905838012695312, -0.0024852752685546875, -0.0013799667358398438, -0.000274658203125, 0.0008306503295898438, 0.0019359588623046875, 0.0030412673950195312, 0.004146575927734375, 0.005251884460449219, 0.0063571929931640625, 0.007462501525878906, 0.00856781005859375, 0.009673118591308594, 0.010778427124023438, 0.011883735656738281, 0.012989044189453125, 0.014094352722167969, 0.015199661254882812, 0.016304969787597656, 0.0174102783203125, 0.018515586853027344, 0.019620895385742188, 0.02072620391845703, 0.021831512451171875, 0.02293682098388672, 0.024042129516601562, 0.025147438049316406, 0.02625274658203125, 0.027358055114746094, 0.028463363647460938, 0.02956867218017578, 0.030673980712890625, 0.03177928924560547, 0.03288459777832031, 0.033989906311035156, 0.03509521484375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 4.0, 3.0, 6.0, 0.0, 6.0, 6.0, 6.0, 5.0, 10.0, 9.0, 7.0, 15.0, 18.0, 13.0, 528.0, 267.0, 23.0, 12.0, 9.0, 11.0, 7.0, 7.0, 5.0, 7.0, 5.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018768310546875, -0.0018014013767242432, -0.0017259716987609863, -0.0016505420207977295, -0.0015751123428344727, -0.0014996826648712158, -0.001424252986907959, -0.0013488233089447021, -0.0012733936309814453, -0.0011979639530181885, -0.0011225342750549316, -0.0010471045970916748, -0.000971674919128418, -0.0008962452411651611, -0.0008208155632019043, -0.0007453858852386475, -0.0006699562072753906, -0.0005945265293121338, -0.000519096851348877, -0.0004436671733856201, -0.0003682374954223633, -0.00029280781745910645, -0.0002173781394958496, -0.00014194846153259277, -6.651878356933594e-05, 8.910894393920898e-06, 8.434057235717773e-05, 0.00015977025032043457, 0.0002351999282836914, 0.00031062960624694824, 0.0003860592842102051, 0.0004614889621734619, 0.0005369186401367188, 0.0006123483180999756, 0.0006877779960632324, 0.0007632076740264893, 0.0008386373519897461, 0.0009140670299530029, 0.0009894967079162598, 0.0010649263858795166, 0.0011403560638427734, 0.0012157857418060303, 0.0012912154197692871, 0.001366645097732544, 0.0014420747756958008, 0.0015175044536590576, 0.0015929341316223145, 0.0016683638095855713, 0.0017437934875488281, 0.001819223165512085, 0.0018946528434753418, 0.0019700825214385986, 0.0020455121994018555, 0.0021209418773651123, 0.002196371555328369, 0.002271801233291626, 0.002347230911254883, 0.0024226605892181396, 0.0024980902671813965, 0.0025735199451446533, 0.00264894962310791, 0.002724379301071167, 0.002799808979034424, 0.0028752386569976807, 0.0029506683349609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 10.0, 11.0, 11.0, 22.0, 22.0, 31.0, 54.0, 52.0, 81.0, 106.0, 124.0, 176.0, 253.0, 337.0, 554.0, 819.0, 1219.0, 2172.0, 3998.0, 8719.0, 28503.0, 586766.0, 370958.0, 25511.0, 8122.0, 3856.0, 2170.0, 1294.0, 758.0, 515.0, 388.0, 265.0, 166.0, 123.0, 94.0, 79.0, 58.0, 36.0, 26.0, 18.0, 24.0, 13.0, 9.0, 6.0, 8.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.03948974609375, -0.03829193115234375, -0.0370941162109375, -0.03589630126953125, -0.034698486328125, -0.03350067138671875, -0.0323028564453125, -0.03110504150390625, -0.0299072265625, -0.02870941162109375, -0.0275115966796875, -0.02631378173828125, -0.025115966796875, -0.02391815185546875, -0.0227203369140625, -0.02152252197265625, -0.02032470703125, -0.01912689208984375, -0.0179290771484375, -0.01673126220703125, -0.015533447265625, -0.01433563232421875, -0.0131378173828125, -0.01194000244140625, -0.0107421875, -0.00954437255859375, -0.0083465576171875, -0.00714874267578125, -0.005950927734375, -0.00475311279296875, -0.0035552978515625, -0.00235748291015625, -0.00115966796875, 3.814697265625e-05, 0.0012359619140625, 0.00243377685546875, 0.003631591796875, 0.00482940673828125, 0.0060272216796875, 0.00722503662109375, 0.0084228515625, 0.00962066650390625, 0.0108184814453125, 0.01201629638671875, 0.013214111328125, 0.01441192626953125, 0.0156097412109375, 0.01680755615234375, 0.01800537109375, 0.01920318603515625, 0.0204010009765625, 0.02159881591796875, 0.022796630859375, 0.02399444580078125, 0.0251922607421875, 0.02639007568359375, 0.027587890625, 0.02878570556640625, 0.0299835205078125, 0.03118133544921875, 0.032379150390625, 0.03357696533203125, 0.0347747802734375, 0.03597259521484375, 0.03717041015625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 9.0, 7.0, 7.0, 6.0, 8.0, 4.0, 14.0, 15.0, 13.0, 20.0, 22.0, 15.0, 24.0, 23.0, 37.0, 42.0, 32.0, 34.0, 35.0, 35.0, 41.0, 46.0, 31.0, 36.0, 37.0, 27.0, 35.0, 29.0, 34.0, 29.0, 29.0, 30.0, 23.0, 20.0, 26.0, 15.0, 15.0, 16.0, 12.0, 12.0, 9.0, 12.0, 6.0, 5.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.00794219970703125, -0.00770038366317749, -0.0074585676193237305, -0.007216751575469971, -0.006974935531616211, -0.006733119487762451, -0.006491303443908691, -0.006249487400054932, -0.006007671356201172, -0.005765855312347412, -0.005524039268493652, -0.005282223224639893, -0.005040407180786133, -0.004798591136932373, -0.004556775093078613, -0.0043149590492248535, -0.004073143005371094, -0.003831326961517334, -0.0035895109176635742, -0.0033476948738098145, -0.0031058788299560547, -0.002864062786102295, -0.002622246742248535, -0.0023804306983947754, -0.0021386146545410156, -0.0018967986106872559, -0.001654982566833496, -0.0014131665229797363, -0.0011713504791259766, -0.0009295344352722168, -0.000687718391418457, -0.00044590234756469727, -0.0002040863037109375, 3.7729740142822266e-05, 0.00027954578399658203, 0.0005213618278503418, 0.0007631778717041016, 0.0010049939155578613, 0.001246809959411621, 0.0014886260032653809, 0.0017304420471191406, 0.0019722580909729004, 0.00221407413482666, 0.00245589017868042, 0.0026977062225341797, 0.0029395222663879395, 0.0031813383102416992, 0.003423154354095459, 0.0036649703979492188, 0.0039067864418029785, 0.004148602485656738, 0.004390418529510498, 0.004632234573364258, 0.004874050617218018, 0.005115866661071777, 0.005357682704925537, 0.005599498748779297, 0.005841314792633057, 0.006083130836486816, 0.006324946880340576, 0.006566762924194336, 0.006808578968048096, 0.0070503950119018555, 0.007292211055755615, 0.007534027099609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 9.0, 7.0, 6.0, 12.0, 16.0, 19.0, 34.0, 80.0, 348.0, 3697.0, 1034520.0, 8982.0, 589.0, 108.0, 31.0, 17.0, 18.0, 16.0, 10.0, 6.0, 6.0, 2.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04913330078125, -0.04775428771972656, -0.046375274658203125, -0.04499626159667969, -0.04361724853515625, -0.04223823547363281, -0.040859222412109375, -0.03948020935058594, -0.0381011962890625, -0.03672218322753906, -0.035343170166015625, -0.03396415710449219, -0.03258514404296875, -0.031206130981445312, -0.029827117919921875, -0.028448104858398438, -0.027069091796875, -0.025690078735351562, -0.024311065673828125, -0.022932052612304688, -0.02155303955078125, -0.020174026489257812, -0.018795013427734375, -0.017416000366210938, -0.0160369873046875, -0.014657974243164062, -0.013278961181640625, -0.011899948120117188, -0.01052093505859375, -0.009141921997070312, -0.007762908935546875, -0.0063838958740234375, -0.0050048828125, -0.0036258697509765625, -0.002246856689453125, -0.0008678436279296875, 0.00051116943359375, 0.0018901824951171875, 0.003269195556640625, 0.0046482086181640625, 0.0060272216796875, 0.0074062347412109375, 0.008785247802734375, 0.010164260864257812, 0.01154327392578125, 0.012922286987304688, 0.014301300048828125, 0.015680313110351562, 0.017059326171875, 0.018438339233398438, 0.019817352294921875, 0.021196365356445312, 0.02257537841796875, 0.023954391479492188, 0.025333404541015625, 0.026712417602539062, 0.0280914306640625, 0.029470443725585938, 0.030849456787109375, 0.03222846984863281, 0.03360748291015625, 0.03498649597167969, 0.036365509033203125, 0.03774452209472656, 0.03912353515625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 7.0, 6.0, 2.0, 11.0, 4.0, 14.0, 18.0, 17.0, 44.0, 103.0, 266.0, 285.0, 83.0, 43.0, 21.0, 12.0, 7.0, 7.0, 4.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0022640228271484375, -0.002201065421104431, -0.002138108015060425, -0.0020751506090164185, -0.002012193202972412, -0.0019492357969284058, -0.0018862783908843994, -0.001823320984840393, -0.0017603635787963867, -0.0016974061727523804, -0.001634448766708374, -0.0015714913606643677, -0.0015085339546203613, -0.001445576548576355, -0.0013826191425323486, -0.0013196617364883423, -0.001256704330444336, -0.0011937469244003296, -0.0011307895183563232, -0.001067832112312317, -0.0010048747062683105, -0.0009419173002243042, -0.0008789598941802979, -0.0008160024881362915, -0.0007530450820922852, -0.0006900876760482788, -0.0006271302700042725, -0.0005641728639602661, -0.0005012154579162598, -0.0004382580518722534, -0.00037530064582824707, -0.0003123432397842407, -0.0002493858337402344, -0.00018642842769622803, -0.00012347102165222168, -6.051361560821533e-05, 2.4437904357910156e-06, 6.540119647979736e-05, 0.0001283586025238037, 0.00019131600856781006, 0.0002542734146118164, 0.00031723082065582275, 0.0003801882266998291, 0.00044314563274383545, 0.0005061030387878418, 0.0005690604448318481, 0.0006320178508758545, 0.0006949752569198608, 0.0007579326629638672, 0.0008208900690078735, 0.0008838474750518799, 0.0009468048810958862, 0.0010097622871398926, 0.001072719693183899, 0.0011356770992279053, 0.0011986345052719116, 0.001261591911315918, 0.0013245493173599243, 0.0013875067234039307, 0.001450464129447937, 0.0015134215354919434, 0.0015763789415359497, 0.001639336347579956, 0.0017022937536239624, 0.0017652511596679688]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 7.0, 12.0, 14.0, 13.0, 21.0, 27.0, 38.0, 57.0, 86.0, 147.0, 262.0, 457.0, 1018.0, 2536.0, 12593.0, 987770.0, 36384.0, 4218.0, 1367.0, 607.0, 361.0, 187.0, 125.0, 74.0, 56.0, 42.0, 23.0, 11.0, 6.0, 10.0, 5.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.023193359375, -0.022504806518554688, -0.021816253662109375, -0.021127700805664062, -0.02043914794921875, -0.019750595092773438, -0.019062042236328125, -0.018373489379882812, -0.0176849365234375, -0.016996383666992188, -0.016307830810546875, -0.015619277954101562, -0.01493072509765625, -0.014242172241210938, -0.013553619384765625, -0.012865066528320312, -0.012176513671875, -0.011487960815429688, -0.010799407958984375, -0.010110855102539062, -0.00942230224609375, -0.008733749389648438, -0.008045196533203125, -0.0073566436767578125, -0.0066680908203125, -0.0059795379638671875, -0.005290985107421875, -0.0046024322509765625, -0.00391387939453125, -0.0032253265380859375, -0.002536773681640625, -0.0018482208251953125, -0.00115966796875, -0.0004711151123046875, 0.000217437744140625, 0.0009059906005859375, 0.00159454345703125, 0.0022830963134765625, 0.002971649169921875, 0.0036602020263671875, 0.0043487548828125, 0.0050373077392578125, 0.005725860595703125, 0.0064144134521484375, 0.00710296630859375, 0.0077915191650390625, 0.008480072021484375, 0.009168624877929688, 0.009857177734375, 0.010545730590820312, 0.011234283447265625, 0.011922836303710938, 0.01261138916015625, 0.013299942016601562, 0.013988494873046875, 0.014677047729492188, 0.0153656005859375, 0.016054153442382812, 0.016742706298828125, 0.017431259155273438, 0.01811981201171875, 0.018808364868164062, 0.019496917724609375, 0.020185470581054688, 0.0208740234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 12.0, 7.0, 9.0, 14.0, 12.0, 25.0, 36.0, 64.0, 178.0, 370.0, 99.0, 37.0, 20.0, 20.0, 17.0, 9.0, 17.0, 8.0, 7.0, 6.0, 6.0, 2.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005023956298828125, -0.00487285852432251, -0.0047217607498168945, -0.004570662975311279, -0.004419565200805664, -0.004268467426300049, -0.004117369651794434, -0.003966271877288818, -0.003815174102783203, -0.003664076328277588, -0.0035129785537719727, -0.0033618807792663574, -0.003210783004760742, -0.003059685230255127, -0.0029085874557495117, -0.0027574896812438965, -0.0026063919067382812, -0.002455294132232666, -0.0023041963577270508, -0.0021530985832214355, -0.0020020008087158203, -0.001850903034210205, -0.0016998052597045898, -0.0015487074851989746, -0.0013976097106933594, -0.0012465119361877441, -0.001095414161682129, -0.0009443163871765137, -0.0007932186126708984, -0.0006421208381652832, -0.000491023063659668, -0.00033992528915405273, -0.0001888275146484375, -3.7729740142822266e-05, 0.00011336803436279297, 0.0002644658088684082, 0.00041556358337402344, 0.0005666613578796387, 0.0007177591323852539, 0.0008688569068908691, 0.0010199546813964844, 0.0011710524559020996, 0.0013221502304077148, 0.00147324800491333, 0.0016243457794189453, 0.0017754435539245605, 0.0019265413284301758, 0.002077639102935791, 0.0022287368774414062, 0.0023798346519470215, 0.0025309324264526367, 0.002682030200958252, 0.002833127975463867, 0.0029842257499694824, 0.0031353235244750977, 0.003286421298980713, 0.003437519073486328, 0.0035886168479919434, 0.0037397146224975586, 0.003890812397003174, 0.004041910171508789, 0.004193007946014404, 0.0043441057205200195, 0.004495203495025635, 0.00464630126953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 9.0, 10.0, 15.0, 30.0, 130.0, 636.0, 95.0, 18.0, 9.0, 13.0, 8.0, 2.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26637715101242065, -0.254488468170166, -0.242599755525589, -0.23071107268333435, -0.21882237493991852, -0.20693367719650269, -0.19504499435424805, -0.18315629661083221, -0.17126759886741638, -0.15937890112400055, -0.14749020338058472, -0.13560152053833008, -0.12371282279491425, -0.11182412505149841, -0.09993543475866318, -0.08804674446582794, -0.07615804672241211, -0.06426934897899628, -0.05238065868616104, -0.04049196466803551, -0.028603270649909973, -0.01671457663178444, -0.004825882613658905, 0.007062807679176331, 0.018951505422592163, 0.030840199440717697, 0.04272889345884323, 0.054617587476968765, 0.0665062814950943, 0.07839497923851013, 0.09028366953134537, 0.1021723598241806, 0.11406102776527405, 0.12594972550868988, 0.1378384232521057, 0.14972710609436035, 0.16161580383777618, 0.17350450158119202, 0.18539318442344666, 0.1972818821668625, 0.20917057991027832, 0.22105927765369415, 0.23294797539710999, 0.24483665823936462, 0.25672537088394165, 0.2686140537261963, 0.2805027365684509, 0.29239141941070557, 0.3042801320552826, 0.31616881489753723, 0.32805752754211426, 0.3399462103843689, 0.35183489322662354, 0.36372360587120056, 0.3756122887134552, 0.3875010013580322, 0.39938968420028687, 0.4112783670425415, 0.42316707968711853, 0.43505576252937317, 0.4469444751739502, 0.45883315801620483, 0.4707218408584595, 0.4826105237007141, 0.49449923634529114]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 10.0, 13.0, 9.0, 10.0, 18.0, 29.0, 42.0, 86.0, 136.0, 197.0, 141.0, 111.0, 62.0, 39.0, 16.0, 12.0, 13.0, 9.0, 10.0, 4.0, 5.0, 8.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21385985612869263, -0.2080519199371338, -0.20224396884441376, -0.19643603265285492, -0.19062809646129608, -0.18482014536857605, -0.1790122091770172, -0.17320427298545837, -0.16739633679389954, -0.1615884006023407, -0.15578044950962067, -0.14997251331806183, -0.144164577126503, -0.13835662603378296, -0.13254868984222412, -0.12674075365066528, -0.12093280255794525, -0.11512485891580582, -0.10931692272424698, -0.10350897908210754, -0.0977010428905487, -0.09189309924840927, -0.08608515560626984, -0.080277219414711, -0.07446927577257156, -0.06866133213043213, -0.06285339593887329, -0.057045452296733856, -0.05123751237988472, -0.045429572463035583, -0.03962162882089615, -0.03381368890404701, -0.028005748987197876, -0.02219780907034874, -0.016389867290854454, -0.010581925511360168, -0.004773985594511032, 0.0010339543223381042, 0.006841897964477539, 0.012649837881326675, 0.018457777798175812, 0.024265717715024948, 0.030073659494519234, 0.03588160127401352, 0.041689541190862656, 0.04749748110771179, 0.05330542474985123, 0.05911336466670036, 0.0649213045835495, 0.07072924822568893, 0.07653718441724777, 0.08234512805938721, 0.08815306425094604, 0.09396100789308548, 0.09976895153522491, 0.10557688772678375, 0.11138483136892319, 0.11719277501106262, 0.12300071120262146, 0.1288086473941803, 0.13461659848690033, 0.14042453467845917, 0.1462324857711792, 0.15204042196273804, 0.15784835815429688]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 6.0, 13.0, 14.0, 13.0, 20.0, 30.0, 29.0, 58.0, 140.0, 2663.0, 4164606.0, 25798.0, 618.0, 111.0, 38.0, 30.0, 17.0, 14.0, 16.0, 8.0, 6.0, 5.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5, -3.3526611328125, -3.205322265625, -3.0579833984375, -2.91064453125, -2.7633056640625, -2.615966796875, -2.4686279296875, -2.3212890625, -2.1739501953125, -2.026611328125, -1.8792724609375, -1.73193359375, -1.5845947265625, -1.437255859375, -1.2899169921875, -1.142578125, -0.9952392578125, -0.847900390625, -0.7005615234375, -0.55322265625, -0.4058837890625, -0.258544921875, -0.1112060546875, 0.0361328125, 0.1834716796875, 0.330810546875, 0.4781494140625, 0.62548828125, 0.7728271484375, 0.920166015625, 1.0675048828125, 1.21484375, 1.3621826171875, 1.509521484375, 1.6568603515625, 1.80419921875, 1.9515380859375, 2.098876953125, 2.2462158203125, 2.3935546875, 2.5408935546875, 2.688232421875, 2.8355712890625, 2.98291015625, 3.1302490234375, 3.277587890625, 3.4249267578125, 3.572265625, 3.7196044921875, 3.866943359375, 4.0142822265625, 4.16162109375, 4.3089599609375, 4.456298828125, 4.6036376953125, 4.7509765625, 4.8983154296875, 5.045654296875, 5.1929931640625, 5.34033203125, 5.4876708984375, 5.635009765625, 5.7823486328125, 5.9296875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 1.0, 4.0, 6.0, 7.0, 4.0, 14.0, 7.0, 6.0, 10.0, 19.0, 17.0, 351.0, 430.0, 35.0, 11.0, 11.0, 8.0, 8.0, 9.0, 5.0, 7.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018367767333984375, -0.0017633140087127686, -0.0016898512840270996, -0.0016163885593414307, -0.0015429258346557617, -0.0014694631099700928, -0.0013960003852844238, -0.0013225376605987549, -0.001249074935913086, -0.001175612211227417, -0.001102149486541748, -0.001028686761856079, -0.0009552240371704102, -0.0008817613124847412, -0.0008082985877990723, -0.0007348358631134033, -0.0006613731384277344, -0.0005879104137420654, -0.0005144476890563965, -0.00044098496437072754, -0.0003675222396850586, -0.00029405951499938965, -0.0002205967903137207, -0.00014713406562805176, -7.367134094238281e-05, -2.086162567138672e-07, 7.325410842895508e-05, 0.00014671683311462402, 0.00022017955780029297, 0.0002936422824859619, 0.00036710500717163086, 0.0004405677318572998, 0.0005140304565429688, 0.0005874931812286377, 0.0006609559059143066, 0.0007344186305999756, 0.0008078813552856445, 0.0008813440799713135, 0.0009548068046569824, 0.0010282695293426514, 0.0011017322540283203, 0.0011751949787139893, 0.0012486577033996582, 0.0013221204280853271, 0.001395583152770996, 0.001469045877456665, 0.001542508602142334, 0.001615971326828003, 0.0016894340515136719, 0.0017628967761993408, 0.0018363595008850098, 0.0019098222255706787, 0.0019832849502563477, 0.0020567476749420166, 0.0021302103996276855, 0.0022036731243133545, 0.0022771358489990234, 0.0023505985736846924, 0.0024240612983703613, 0.0024975240230560303, 0.0025709867477416992, 0.002644449472427368, 0.002717912197113037, 0.002791374921798706, 0.002864837646484375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 8.0, 10.0, 17.0, 17.0, 19.0, 29.0, 39.0, 33.0, 44.0, 41.0, 63.0, 73.0, 84.0, 133.0, 140.0, 399.0, 12130.0, 4174005.0, 5859.0, 332.0, 148.0, 120.0, 103.0, 77.0, 66.0, 55.0, 59.0, 36.0, 24.0, 27.0, 22.0, 19.0, 5.0, 11.0, 6.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.603515625, -0.5806732177734375, -0.557830810546875, -0.5349884033203125, -0.51214599609375, -0.4893035888671875, -0.466461181640625, -0.4436187744140625, -0.4207763671875, -0.3979339599609375, -0.375091552734375, -0.3522491455078125, -0.32940673828125, -0.3065643310546875, -0.283721923828125, -0.2608795166015625, -0.238037109375, -0.2151947021484375, -0.192352294921875, -0.1695098876953125, -0.14666748046875, -0.1238250732421875, -0.100982666015625, -0.0781402587890625, -0.0552978515625, -0.0324554443359375, -0.009613037109375, 0.0132293701171875, 0.03607177734375, 0.0589141845703125, 0.081756591796875, 0.1045989990234375, 0.12744140625, 0.1502838134765625, 0.173126220703125, 0.1959686279296875, 0.21881103515625, 0.2416534423828125, 0.264495849609375, 0.2873382568359375, 0.3101806640625, 0.3330230712890625, 0.355865478515625, 0.3787078857421875, 0.40155029296875, 0.4243927001953125, 0.447235107421875, 0.4700775146484375, 0.492919921875, 0.5157623291015625, 0.538604736328125, 0.5614471435546875, 0.58428955078125, 0.6071319580078125, 0.629974365234375, 0.6528167724609375, 0.6756591796875, 0.6985015869140625, 0.721343994140625, 0.7441864013671875, 0.76702880859375, 0.7898712158203125, 0.812713623046875, 0.8355560302734375, 0.8583984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 8.0, 13.0, 13.0, 16.0, 21.0, 35.0, 36.0, 37.0, 41.0, 44.0, 68.0, 70.0, 95.0, 122.0, 131.0, 164.0, 374.0, 1535.0, 292.0, 172.0, 126.0, 125.0, 101.0, 71.0, 70.0, 57.0, 54.0, 36.0, 26.0, 29.0, 21.0, 16.0, 8.0, 11.0, 5.0, 10.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004657745361328125, -0.004481017589569092, -0.004304289817810059, -0.004127562046051025, -0.003950834274291992, -0.003774106502532959, -0.0035973787307739258, -0.0034206509590148926, -0.0032439231872558594, -0.003067195415496826, -0.002890467643737793, -0.0027137398719787598, -0.0025370121002197266, -0.0023602843284606934, -0.00218355655670166, -0.002006828784942627, -0.0018301010131835938, -0.0016533732414245605, -0.0014766454696655273, -0.0012999176979064941, -0.001123189926147461, -0.0009464621543884277, -0.0007697343826293945, -0.0005930066108703613, -0.0004162788391113281, -0.00023955106735229492, -6.282329559326172e-05, 0.00011390447616577148, 0.0002906322479248047, 0.0004673600196838379, 0.0006440877914428711, 0.0008208155632019043, 0.0009975433349609375, 0.0011742711067199707, 0.001350998878479004, 0.0015277266502380371, 0.0017044544219970703, 0.0018811821937561035, 0.0020579099655151367, 0.00223463773727417, 0.002411365509033203, 0.0025880932807922363, 0.0027648210525512695, 0.0029415488243103027, 0.003118276596069336, 0.003295004367828369, 0.0034717321395874023, 0.0036484599113464355, 0.0038251876831054688, 0.004001915454864502, 0.004178643226623535, 0.004355370998382568, 0.0045320987701416016, 0.004708826541900635, 0.004885554313659668, 0.005062282085418701, 0.005239009857177734, 0.005415737628936768, 0.005592465400695801, 0.005769193172454834, 0.005945920944213867, 0.0061226487159729, 0.006299376487731934, 0.006476104259490967, 0.00665283203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 8.0, 14.0, 33.0, 76.0, 298.0, 359.0, 111.0, 37.0, 27.0, 10.0, 10.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.185691237449646, -0.18147197365760803, -0.17725272476673126, -0.1730334609746933, -0.16881419718265533, -0.16459494829177856, -0.1603756844997406, -0.15615642070770264, -0.15193715691566467, -0.1477178931236267, -0.14349864423274994, -0.13927938044071198, -0.135060116648674, -0.13084086775779724, -0.12662160396575928, -0.12240234017372131, -0.11818309128284454, -0.11396383494138718, -0.10974457114934921, -0.10552531480789185, -0.10130605101585388, -0.09708679467439651, -0.09286753833293915, -0.08864827454090118, -0.08442901819944382, -0.08020976185798645, -0.07599049806594849, -0.07177124172449112, -0.06755198538303375, -0.06333272159099579, -0.05911346524953842, -0.054894205182790756, -0.05067494511604309, -0.046455685049295425, -0.04223642498254776, -0.03801716864109039, -0.03379790857434273, -0.029578648507595062, -0.025359390303492546, -0.02114013209939003, -0.016920872032642365, -0.012701612897217274, -0.008482353761792183, -0.004263094626367092, -4.383549094200134e-05, 0.004175424575805664, 0.00839468277990818, 0.012613940984010696, 0.016833201050758362, 0.021052461117506027, 0.025271719321608543, 0.02949097752571106, 0.033710237592458725, 0.03792949765920639, 0.04214875400066376, 0.04636801406741142, 0.05058727413415909, 0.054806534200906754, 0.05902579426765442, 0.06324505060911179, 0.06746430695056915, 0.07168357074260712, 0.07590282708406448, 0.08012208342552185, 0.08434134721755981]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 2.0, 5.0, 9.0, 12.0, 20.0, 17.0, 24.0, 26.0, 37.0, 43.0, 41.0, 36.0, 49.0, 49.0, 47.0, 66.0, 54.0, 57.0, 62.0, 51.0, 47.0, 41.0, 44.0, 30.0, 23.0, 22.0, 21.0, 19.0, 17.0, 7.0, 5.0, 6.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04750263690948486, -0.04616200178861618, -0.0448213666677475, -0.043480727821588516, -0.04214009270071983, -0.04079945757985115, -0.03945881873369217, -0.038118183612823486, -0.0367775484919548, -0.03543691337108612, -0.03409627825021744, -0.032755639404058456, -0.031415004283189774, -0.03007436916232109, -0.02873373217880726, -0.027393095195293427, -0.026052460074424744, -0.02471182495355606, -0.02337118797004223, -0.022030550986528397, -0.020689915865659714, -0.01934928074479103, -0.0180086437612772, -0.016668006777763367, -0.015327371656894684, -0.013986735604703426, -0.012646099552512169, -0.011305463500320911, -0.009964827448129654, -0.008624191395938396, -0.007283555343747139, -0.0059429192915558815, -0.004602283239364624, -0.0032616471871733665, -0.001921011134982109, -0.0005803750827908516, 0.0007602609694004059, 0.0021008970215916634, 0.003441533073782921, 0.004782169125974178, 0.006122805178165436, 0.007463441230356693, 0.00880407728254795, 0.010144713334739208, 0.011485349386930466, 0.012825985439121723, 0.01416662149131298, 0.015507257543504238, 0.016847893595695496, 0.01818852871656418, 0.01952916570007801, 0.020869802683591843, 0.022210437804460526, 0.02355107292532921, 0.02489170990884304, 0.026232346892356873, 0.027572982013225555, 0.02891361713409424, 0.03025425411760807, 0.0315948911011219, 0.032935526221990585, 0.03427616134285927, 0.03561680018901825, 0.03695743530988693, 0.038298070430755615]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 16.0, 19.0, 33.0, 30.0, 33.0, 59.0, 100.0, 142.0, 190.0, 277.0, 423.0, 593.0, 888.0, 1414.0, 2152.0, 3574.0, 6303.0, 11994.0, 28886.0, 892565.0, 61372.0, 16804.0, 8245.0, 4574.0, 2737.0, 1682.0, 1103.0, 731.0, 498.0, 326.0, 256.0, 153.0, 106.0, 79.0, 50.0, 31.0, 28.0, 23.0, 11.0, 16.0, 8.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.047607421875, -0.04615211486816406, -0.044696807861328125, -0.04324150085449219, -0.04178619384765625, -0.04033088684082031, -0.038875579833984375, -0.03742027282714844, -0.0359649658203125, -0.03450965881347656, -0.033054351806640625, -0.03159904479980469, -0.03014373779296875, -0.028688430786132812, -0.027233123779296875, -0.025777816772460938, -0.024322509765625, -0.022867202758789062, -0.021411895751953125, -0.019956588745117188, -0.01850128173828125, -0.017045974731445312, -0.015590667724609375, -0.014135360717773438, -0.0126800537109375, -0.011224746704101562, -0.009769439697265625, -0.008314132690429688, -0.00685882568359375, -0.0054035186767578125, -0.003948211669921875, -0.0024929046630859375, -0.00103759765625, 0.0004177093505859375, 0.001873016357421875, 0.0033283233642578125, 0.00478363037109375, 0.0062389373779296875, 0.007694244384765625, 0.009149551391601562, 0.0106048583984375, 0.012060165405273438, 0.013515472412109375, 0.014970779418945312, 0.01642608642578125, 0.017881393432617188, 0.019336700439453125, 0.020792007446289062, 0.022247314453125, 0.023702621459960938, 0.025157928466796875, 0.026613235473632812, 0.02806854248046875, 0.029523849487304688, 0.030979156494140625, 0.03243446350097656, 0.0338897705078125, 0.03534507751464844, 0.036800384521484375, 0.03825569152832031, 0.03971099853515625, 0.04116630554199219, 0.042621612548828125, 0.04407691955566406, 0.0455322265625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 6.0, 8.0, 13.0, 7.0, 12.0, 13.0, 15.0, 103.0, 606.0, 111.0, 12.0, 11.0, 5.0, 12.0, 7.0, 8.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018367767333984375, -0.001764446496963501, -0.0016921162605285645, -0.001619786024093628, -0.0015474557876586914, -0.0014751255512237549, -0.0014027953147888184, -0.0013304650783538818, -0.0012581348419189453, -0.0011858046054840088, -0.0011134743690490723, -0.0010411441326141357, -0.0009688138961791992, -0.0008964836597442627, -0.0008241534233093262, -0.0007518231868743896, -0.0006794929504394531, -0.0006071627140045166, -0.0005348324775695801, -0.00046250224113464355, -0.00039017200469970703, -0.0003178417682647705, -0.000245511531829834, -0.00017318129539489746, -0.00010085105895996094, -2.8520822525024414e-05, 4.380941390991211e-05, 0.00011613965034484863, 0.00018846988677978516, 0.0002608001232147217, 0.0003331303596496582, 0.0004054605960845947, 0.00047779083251953125, 0.0005501210689544678, 0.0006224513053894043, 0.0006947815418243408, 0.0007671117782592773, 0.0008394420146942139, 0.0009117722511291504, 0.000984102487564087, 0.0010564327239990234, 0.00112876296043396, 0.0012010931968688965, 0.001273423433303833, 0.0013457536697387695, 0.001418083906173706, 0.0014904141426086426, 0.001562744379043579, 0.0016350746154785156, 0.0017074048519134521, 0.0017797350883483887, 0.0018520653247833252, 0.0019243955612182617, 0.0019967257976531982, 0.0020690560340881348, 0.0021413862705230713, 0.002213716506958008, 0.0022860467433929443, 0.002358376979827881, 0.0024307072162628174, 0.002503037452697754, 0.0025753676891326904, 0.002647697925567627, 0.0027200281620025635, 0.0027923583984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 3.0, 5.0, 7.0, 10.0, 6.0, 12.0, 13.0, 15.0, 19.0, 13.0, 19.0, 19.0, 32.0, 34.0, 59.0, 96.0, 488.0, 3904.0, 626243.0, 412766.0, 3834.0, 493.0, 125.0, 63.0, 33.0, 35.0, 30.0, 30.0, 24.0, 17.0, 21.0, 13.0, 9.0, 5.0, 8.0, 9.0, 8.0, 3.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11773681640625, -0.11381053924560547, -0.10988426208496094, -0.1059579849243164, -0.10203170776367188, -0.09810543060302734, -0.09417915344238281, -0.09025287628173828, -0.08632659912109375, -0.08240032196044922, -0.07847404479980469, -0.07454776763916016, -0.07062149047851562, -0.0666952133178711, -0.06276893615722656, -0.05884265899658203, -0.0549163818359375, -0.05099010467529297, -0.04706382751464844, -0.043137550354003906, -0.039211273193359375, -0.035284996032714844, -0.03135871887207031, -0.02743244171142578, -0.02350616455078125, -0.01957988739013672, -0.015653610229492188, -0.011727333068847656, -0.007801055908203125, -0.0038747787475585938, 5.14984130859375e-05, 0.003977775573730469, 0.007904052734375, 0.011830329895019531, 0.015756607055664062, 0.019682884216308594, 0.023609161376953125, 0.027535438537597656, 0.03146171569824219, 0.03538799285888672, 0.03931427001953125, 0.04324054718017578, 0.04716682434082031, 0.051093101501464844, 0.055019378662109375, 0.058945655822753906, 0.06287193298339844, 0.06679821014404297, 0.0707244873046875, 0.07465076446533203, 0.07857704162597656, 0.0825033187866211, 0.08642959594726562, 0.09035587310791016, 0.09428215026855469, 0.09820842742919922, 0.10213470458984375, 0.10606098175048828, 0.10998725891113281, 0.11391353607177734, 0.11783981323242188, 0.1217660903930664, 0.12569236755371094, 0.12961864471435547, 0.133544921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 2.0, 2.0, 8.0, 6.0, 5.0, 4.0, 5.0, 13.0, 11.0, 16.0, 18.0, 20.0, 19.0, 24.0, 20.0, 29.0, 22.0, 31.0, 34.0, 42.0, 36.0, 38.0, 57.0, 43.0, 37.0, 49.0, 37.0, 39.0, 46.0, 21.0, 27.0, 49.0, 29.0, 22.0, 30.0, 24.0, 15.0, 8.0, 11.0, 7.0, 12.0, 4.0, 9.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.005970001220703125, -0.005774199962615967, -0.005578398704528809, -0.00538259744644165, -0.005186796188354492, -0.004990994930267334, -0.004795193672180176, -0.004599392414093018, -0.004403591156005859, -0.004207789897918701, -0.004011988639831543, -0.0038161873817443848, -0.0036203861236572266, -0.0034245848655700684, -0.00322878360748291, -0.003032982349395752, -0.0028371810913085938, -0.0026413798332214355, -0.0024455785751342773, -0.002249777317047119, -0.002053976058959961, -0.0018581748008728027, -0.0016623735427856445, -0.0014665722846984863, -0.0012707710266113281, -0.00107496976852417, -0.0008791685104370117, -0.0006833672523498535, -0.0004875659942626953, -0.0002917647361755371, -9.59634780883789e-05, 9.98377799987793e-05, 0.0002956390380859375, 0.0004914402961730957, 0.0006872415542602539, 0.0008830428123474121, 0.0010788440704345703, 0.0012746453285217285, 0.0014704465866088867, 0.001666247844696045, 0.0018620491027832031, 0.0020578503608703613, 0.0022536516189575195, 0.0024494528770446777, 0.002645254135131836, 0.002841055393218994, 0.0030368566513061523, 0.0032326579093933105, 0.0034284591674804688, 0.003624260425567627, 0.003820061683654785, 0.004015862941741943, 0.0042116641998291016, 0.00440746545791626, 0.004603266716003418, 0.004799067974090576, 0.004994869232177734, 0.005190670490264893, 0.005386471748352051, 0.005582273006439209, 0.005778074264526367, 0.005973875522613525, 0.006169676780700684, 0.006365478038787842, 0.006561279296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 7.0, 8.0, 9.0, 27.0, 30.0, 71.0, 240.0, 3148.0, 1042781.0, 1893.0, 198.0, 73.0, 22.0, 12.0, 11.0, 11.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1365966796875, -0.1334514617919922, -0.13030624389648438, -0.12716102600097656, -0.12401580810546875, -0.12087059020996094, -0.11772537231445312, -0.11458015441894531, -0.1114349365234375, -0.10828971862792969, -0.10514450073242188, -0.10199928283691406, -0.09885406494140625, -0.09570884704589844, -0.09256362915039062, -0.08941841125488281, -0.086273193359375, -0.08312797546386719, -0.07998275756835938, -0.07683753967285156, -0.07369232177734375, -0.07054710388183594, -0.06740188598632812, -0.06425666809082031, -0.0611114501953125, -0.05796623229980469, -0.054821014404296875, -0.05167579650878906, -0.04853057861328125, -0.04538536071777344, -0.042240142822265625, -0.03909492492675781, -0.03594970703125, -0.03280448913574219, -0.029659271240234375, -0.026514053344726562, -0.02336883544921875, -0.020223617553710938, -0.017078399658203125, -0.013933181762695312, -0.0107879638671875, -0.0076427459716796875, -0.004497528076171875, -0.0013523101806640625, 0.00179290771484375, 0.0049381256103515625, 0.008083343505859375, 0.011228561401367188, 0.014373779296875, 0.017518997192382812, 0.020664215087890625, 0.023809432983398438, 0.02695465087890625, 0.030099868774414062, 0.033245086669921875, 0.03639030456542969, 0.0395355224609375, 0.04268074035644531, 0.045825958251953125, 0.04897117614746094, 0.05211639404296875, 0.05526161193847656, 0.058406829833984375, 0.06155204772949219, 0.064697265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 9.0, 13.0, 15.0, 42.0, 556.0, 255.0, 39.0, 24.0, 9.0, 12.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0045928955078125, -0.004362344741821289, -0.004131793975830078, -0.003901243209838867, -0.0036706924438476562, -0.0034401416778564453, -0.0032095909118652344, -0.0029790401458740234, -0.0027484893798828125, -0.0025179386138916016, -0.0022873878479003906, -0.0020568370819091797, -0.0018262863159179688, -0.0015957355499267578, -0.0013651847839355469, -0.001134634017944336, -0.000904083251953125, -0.0006735324859619141, -0.0004429817199707031, -0.0002124309539794922, 1.811981201171875e-05, 0.0002486705780029297, 0.0004792213439941406, 0.0007097721099853516, 0.0009403228759765625, 0.0011708736419677734, 0.0014014244079589844, 0.0016319751739501953, 0.0018625259399414062, 0.002093076705932617, 0.002323627471923828, 0.002554178237915039, 0.00278472900390625, 0.003015279769897461, 0.003245830535888672, 0.003476381301879883, 0.0037069320678710938, 0.003937482833862305, 0.004168033599853516, 0.0043985843658447266, 0.0046291351318359375, 0.0048596858978271484, 0.005090236663818359, 0.00532078742980957, 0.005551338195800781, 0.005781888961791992, 0.006012439727783203, 0.006242990493774414, 0.006473541259765625, 0.006704092025756836, 0.006934642791748047, 0.007165193557739258, 0.007395744323730469, 0.00762629508972168, 0.00785684585571289, 0.008087396621704102, 0.008317947387695312, 0.008548498153686523, 0.008779048919677734, 0.009009599685668945, 0.009240150451660156, 0.009470701217651367, 0.009701251983642578, 0.009931802749633789, 0.010162353515625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 12.0, 17.0, 51.0, 185.0, 2442.0, 1043158.0, 2382.0, 187.0, 63.0, 18.0, 6.0, 7.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09759521484375, -0.09459209442138672, -0.09158897399902344, -0.08858585357666016, -0.08558273315429688, -0.0825796127319336, -0.07957649230957031, -0.07657337188720703, -0.07357025146484375, -0.07056713104248047, -0.06756401062011719, -0.0645608901977539, -0.061557769775390625, -0.058554649353027344, -0.05555152893066406, -0.05254840850830078, -0.0495452880859375, -0.04654216766357422, -0.04353904724121094, -0.040535926818847656, -0.037532806396484375, -0.034529685974121094, -0.03152656555175781, -0.02852344512939453, -0.02552032470703125, -0.02251720428466797, -0.019514083862304688, -0.016510963439941406, -0.013507843017578125, -0.010504722595214844, -0.0075016021728515625, -0.004498481750488281, -0.001495361328125, 0.0015077590942382812, 0.0045108795166015625, 0.007513999938964844, 0.010517120361328125, 0.013520240783691406, 0.016523361206054688, 0.01952648162841797, 0.02252960205078125, 0.02553272247314453, 0.028535842895507812, 0.031538963317871094, 0.034542083740234375, 0.037545204162597656, 0.04054832458496094, 0.04355144500732422, 0.0465545654296875, 0.04955768585205078, 0.05256080627441406, 0.055563926696777344, 0.058567047119140625, 0.061570167541503906, 0.06457328796386719, 0.06757640838623047, 0.07057952880859375, 0.07358264923095703, 0.07658576965332031, 0.0795888900756836, 0.08259201049804688, 0.08559513092041016, 0.08859825134277344, 0.09160137176513672, 0.0946044921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 3.0, 7.0, 4.0, 11.0, 13.0, 16.0, 21.0, 24.0, 42.0, 85.0, 415.0, 156.0, 74.0, 33.0, 32.0, 16.0, 9.0, 10.0, 4.0, 5.0, 6.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.006862640380859375, -0.006653428077697754, -0.006444215774536133, -0.006235003471374512, -0.006025791168212891, -0.0058165788650512695, -0.0056073665618896484, -0.005398154258728027, -0.005188941955566406, -0.004979729652404785, -0.004770517349243164, -0.004561305046081543, -0.004352092742919922, -0.004142880439758301, -0.00393366813659668, -0.0037244558334350586, -0.0035152435302734375, -0.0033060312271118164, -0.0030968189239501953, -0.0028876066207885742, -0.002678394317626953, -0.002469182014465332, -0.002259969711303711, -0.00205075740814209, -0.0018415451049804688, -0.0016323328018188477, -0.0014231204986572266, -0.0012139081954956055, -0.0010046958923339844, -0.0007954835891723633, -0.0005862712860107422, -0.0003770589828491211, -0.0001678466796875, 4.1365623474121094e-05, 0.0002505779266357422, 0.0004597902297973633, 0.0006690025329589844, 0.0008782148361206055, 0.0010874271392822266, 0.0012966394424438477, 0.0015058517456054688, 0.0017150640487670898, 0.001924276351928711, 0.002133488655090332, 0.002342700958251953, 0.0025519132614135742, 0.0027611255645751953, 0.0029703378677368164, 0.0031795501708984375, 0.0033887624740600586, 0.0035979747772216797, 0.0038071870803833008, 0.004016399383544922, 0.004225611686706543, 0.004434823989868164, 0.004644036293029785, 0.004853248596191406, 0.005062460899353027, 0.0052716732025146484, 0.0054808855056762695, 0.005690097808837891, 0.005899310111999512, 0.006108522415161133, 0.006317734718322754, 0.006526947021484375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 8.0, 31.0, 199.0, 618.0, 92.0, 31.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10193368047475815, -0.09288366138935089, -0.08383363485336304, -0.07478360831737518, -0.06573358923196793, -0.05668356642127037, -0.047633543610572815, -0.03858352452516556, -0.029533497989177704, -0.02048347517848015, -0.011433452367782593, -0.0023834295570850372, 0.006666593253612518, 0.015716616064310074, 0.02476663887500763, 0.033816657960414886, 0.04286668449640274, 0.051916707307100296, 0.06096673011779785, 0.0700167566537857, 0.07906677573919296, 0.08811679482460022, 0.09716682136058807, 0.10621684044599533, 0.11526686698198318, 0.12431688606739044, 0.1333669126033783, 0.14241693913936615, 0.151466965675354, 0.16051697731018066, 0.16956700384616852, 0.17861703038215637, 0.18766707181930542, 0.19671709835529327, 0.20576712489128113, 0.2148171365261078, 0.22386716306209564, 0.2329171895980835, 0.24196720123291016, 0.2510172128677368, 0.26006725430488586, 0.2691172659397125, 0.2781673073768616, 0.28721731901168823, 0.2962673306465149, 0.30531737208366394, 0.3143673837184906, 0.32341742515563965, 0.3324674367904663, 0.34151744842529297, 0.350567489862442, 0.3596175014972687, 0.3686675429344177, 0.3777175545692444, 0.38676756620407104, 0.3958175778388977, 0.40486761927604675, 0.4139176309108734, 0.42296767234802246, 0.4320176839828491, 0.4410676956176758, 0.45011773705482483, 0.4591677486896515, 0.46821779012680054, 0.4772678017616272]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 6.0, 9.0, 16.0, 15.0, 28.0, 32.0, 27.0, 39.0, 44.0, 46.0, 56.0, 68.0, 77.0, 77.0, 74.0, 58.0, 55.0, 59.0, 37.0, 36.0, 25.0, 21.0, 14.0, 12.0, 14.0, 4.0, 5.0, 8.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.053205668926239014, -0.05142106115818024, -0.04963645339012146, -0.04785184934735298, -0.046067241579294205, -0.04428263381123543, -0.04249802976846695, -0.04071342200040817, -0.038928814232349396, -0.03714420646429062, -0.03535959869623184, -0.033574994653463364, -0.03179038688540459, -0.03000577911734581, -0.028221173211932182, -0.026436567306518555, -0.024651959538459778, -0.022867351770401, -0.021082745864987373, -0.019298139959573746, -0.01751353219151497, -0.015728924423456192, -0.013944318518042564, -0.012159711681306362, -0.01037510484457016, -0.008590498007833958, -0.006805891171097755, -0.005021284334361553, -0.003236677497625351, -0.0014520706608891487, 0.00033253617584705353, 0.0021171430125832558, 0.003901749849319458, 0.00568635668605566, 0.0074709635227918625, 0.009255570359528065, 0.011040177196264267, 0.01282478403300047, 0.014609390869736671, 0.0163939967751503, 0.018178604543209076, 0.019963212311267853, 0.02174781821668148, 0.023532424122095108, 0.025317031890153885, 0.027101639658212662, 0.02888624556362629, 0.030670851469039917, 0.032455459237098694, 0.03424006700515747, 0.03602467477321625, 0.037809278815984726, 0.0395938865840435, 0.04137849435210228, 0.04316309839487076, 0.044947706162929535, 0.04673231393098831, 0.04851692169904709, 0.050301529467105865, 0.052086133509874344, 0.05387074127793312, 0.0556553490459919, 0.057439953088760376, 0.05922456085681915, 0.06100916862487793]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 0.0, 8.0, 4.0, 8.0, 0.0, 10.0, 12.0, 8.0, 10.0, 10.0, 16.0, 26.0, 16.0, 16.0, 28.0, 24.0, 281.0, 4193482.0, 148.0, 23.0, 22.0, 24.0, 12.0, 14.0, 12.0, 16.0, 10.0, 8.0, 6.0, 0.0, 8.0, 4.0, 4.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.662109375, -2.552642822265625, -2.44317626953125, -2.333709716796875, -2.2242431640625, -2.114776611328125, -2.00531005859375, -1.895843505859375, -1.786376953125, -1.676910400390625, -1.56744384765625, -1.457977294921875, -1.3485107421875, -1.239044189453125, -1.12957763671875, -1.020111083984375, -0.91064453125, -0.801177978515625, -0.69171142578125, -0.582244873046875, -0.4727783203125, -0.363311767578125, -0.25384521484375, -0.144378662109375, -0.034912109375, 0.074554443359375, 0.18402099609375, 0.293487548828125, 0.4029541015625, 0.512420654296875, 0.62188720703125, 0.731353759765625, 0.8408203125, 0.950286865234375, 1.05975341796875, 1.169219970703125, 1.2786865234375, 1.388153076171875, 1.49761962890625, 1.607086181640625, 1.716552734375, 1.826019287109375, 1.93548583984375, 2.044952392578125, 2.1544189453125, 2.263885498046875, 2.37335205078125, 2.482818603515625, 2.59228515625, 2.701751708984375, 2.81121826171875, 2.920684814453125, 3.0301513671875, 3.139617919921875, 3.24908447265625, 3.358551025390625, 3.468017578125, 3.577484130859375, 3.68695068359375, 3.796417236328125, 3.9058837890625, 4.015350341796875, 4.12481689453125, 4.234283447265625, 4.34375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 5.0, 9.0, 5.0, 12.0, 9.0, 13.0, 12.0, 19.0, 113.0, 479.0, 203.0, 28.0, 18.0, 9.0, 7.0, 7.0, 7.0, 8.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018596649169921875, -0.0017921626567840576, -0.0017246603965759277, -0.0016571581363677979, -0.001589655876159668, -0.001522153615951538, -0.0014546513557434082, -0.0013871490955352783, -0.0013196468353271484, -0.0012521445751190186, -0.0011846423149108887, -0.0011171400547027588, -0.001049637794494629, -0.000982135534286499, -0.0009146332740783691, -0.0008471310138702393, -0.0007796287536621094, -0.0007121264934539795, -0.0006446242332458496, -0.0005771219730377197, -0.0005096197128295898, -0.00044211745262145996, -0.0003746151924133301, -0.0003071129322052002, -0.0002396106719970703, -0.00017210841178894043, -0.00010460615158081055, -3.7103891372680664e-05, 3.039836883544922e-05, 9.79006290435791e-05, 0.00016540288925170898, 0.00023290514945983887, 0.00030040740966796875, 0.00036790966987609863, 0.0004354119300842285, 0.0005029141902923584, 0.0005704164505004883, 0.0006379187107086182, 0.000705420970916748, 0.0007729232311248779, 0.0008404254913330078, 0.0009079277515411377, 0.0009754300117492676, 0.0010429322719573975, 0.0011104345321655273, 0.0011779367923736572, 0.0012454390525817871, 0.001312941312789917, 0.0013804435729980469, 0.0014479458332061768, 0.0015154480934143066, 0.0015829503536224365, 0.0016504526138305664, 0.0017179548740386963, 0.0017854571342468262, 0.001852959394454956, 0.001920461654663086, 0.001987963914871216, 0.0020554661750793457, 0.0021229684352874756, 0.0021904706954956055, 0.0022579729557037354, 0.0023254752159118652, 0.002392977476119995, 0.002460479736328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 13.0, 9.0, 12.0, 25.0, 24.0, 39.0, 34.0, 59.0, 76.0, 121.0, 203.0, 407.0, 4191991.0, 559.0, 213.0, 135.0, 78.0, 68.0, 47.0, 26.0, 29.0, 25.0, 17.0, 14.0, 14.0, 4.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58251953125, -0.5628738403320312, -0.5432281494140625, -0.5235824584960938, -0.503936767578125, -0.48429107666015625, -0.4646453857421875, -0.44499969482421875, -0.42535400390625, -0.40570831298828125, -0.3860626220703125, -0.36641693115234375, -0.346771240234375, -0.32712554931640625, -0.3074798583984375, -0.28783416748046875, -0.2681884765625, -0.24854278564453125, -0.2288970947265625, -0.20925140380859375, -0.189605712890625, -0.16996002197265625, -0.1503143310546875, -0.13066864013671875, -0.11102294921875, -0.09137725830078125, -0.0717315673828125, -0.05208587646484375, -0.032440185546875, -0.01279449462890625, 0.0068511962890625, 0.02649688720703125, 0.046142578125, 0.06578826904296875, 0.0854339599609375, 0.10507965087890625, 0.124725341796875, 0.14437103271484375, 0.1640167236328125, 0.18366241455078125, 0.20330810546875, 0.22295379638671875, 0.2425994873046875, 0.26224517822265625, 0.281890869140625, 0.30153656005859375, 0.3211822509765625, 0.34082794189453125, 0.3604736328125, 0.38011932373046875, 0.3997650146484375, 0.41941070556640625, 0.439056396484375, 0.45870208740234375, 0.4783477783203125, 0.49799346923828125, 0.51763916015625, 0.5372848510742188, 0.5569305419921875, 0.5765762329101562, 0.596221923828125, 0.6158676147460938, 0.6355133056640625, 0.6551589965820312, 0.6748046875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 13.0, 18.0, 16.0, 22.0, 36.0, 39.0, 42.0, 89.0, 123.0, 207.0, 432.0, 1612.0, 652.0, 272.0, 144.0, 91.0, 66.0, 44.0, 31.0, 30.0, 22.0, 16.0, 10.0, 6.0, 7.0, 7.0, 7.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0038471221923828125, -0.0037132203578948975, -0.0035793185234069824, -0.0034454166889190674, -0.0033115148544311523, -0.0031776130199432373, -0.0030437111854553223, -0.0029098093509674072, -0.002775907516479492, -0.002642005681991577, -0.002508103847503662, -0.002374202013015747, -0.002240300178527832, -0.002106398344039917, -0.001972496509552002, -0.001838594675064087, -0.0017046928405761719, -0.0015707910060882568, -0.0014368891716003418, -0.0013029873371124268, -0.0011690855026245117, -0.0010351836681365967, -0.0009012818336486816, -0.0007673799991607666, -0.0006334781646728516, -0.0004995763301849365, -0.0003656744956970215, -0.00023177266120910645, -9.78708267211914e-05, 3.603100776672363e-05, 0.00016993284225463867, 0.0003038346767425537, 0.00043773651123046875, 0.0005716383457183838, 0.0007055401802062988, 0.0008394420146942139, 0.0009733438491821289, 0.001107245683670044, 0.001241147518157959, 0.001375049352645874, 0.001508951187133789, 0.001642853021621704, 0.0017767548561096191, 0.0019106566905975342, 0.0020445585250854492, 0.0021784603595733643, 0.0023123621940612793, 0.0024462640285491943, 0.0025801658630371094, 0.0027140676975250244, 0.0028479695320129395, 0.0029818713665008545, 0.0031157732009887695, 0.0032496750354766846, 0.0033835768699645996, 0.0035174787044525146, 0.0036513805389404297, 0.0037852823734283447, 0.00391918420791626, 0.004053086042404175, 0.00418698787689209, 0.004320889711380005, 0.00445479154586792, 0.004588693380355835, 0.00472259521484375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 34.0, 979.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6301983594894409, -0.6192108988761902, -0.6082234978675842, -0.5972360372543335, -0.5862486362457275, -0.5752611756324768, -0.5642737150192261, -0.5532863140106201, -0.5422988533973694, -0.5313113927841187, -0.5203239917755127, -0.509336531162262, -0.4983491003513336, -0.4873616695404053, -0.47637423872947693, -0.4653868079185486, -0.4543994069099426, -0.4434119760990143, -0.43242454528808594, -0.4214370846748352, -0.41044965386390686, -0.3994622230529785, -0.38847479224205017, -0.3774873614311218, -0.3664999008178711, -0.35551247000694275, -0.3445250391960144, -0.33353757858276367, -0.3225501477718353, -0.311562716960907, -0.30057528614997864, -0.2895878553390503, -0.27860039472579956, -0.2676129639148712, -0.25662553310394287, -0.24563808739185333, -0.234650656580925, -0.22366321086883545, -0.2126757800579071, -0.20168834924697876, -0.19070091843605042, -0.17971348762512207, -0.16872604191303253, -0.1577386111021042, -0.14675118029117584, -0.1357637345790863, -0.12477630376815796, -0.11378887295722961, -0.10280143469572067, -0.09181399643421173, -0.08082656562328339, -0.06983912736177444, -0.0588516928255558, -0.04786425828933716, -0.03687682002782822, -0.025889389216899872, -0.01490195095539093, -0.003914515487849712, 0.007072919979691505, 0.018060356378555298, 0.02904779091477394, 0.040035225450992584, 0.051022663712501526, 0.06201009452342987, 0.07299753278493881]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 2.0, 12.0, 15.0, 18.0, 19.0, 39.0, 57.0, 60.0, 59.0, 97.0, 99.0, 98.0, 79.0, 78.0, 56.0, 52.0, 43.0, 27.0, 15.0, 15.0, 3.0, 8.0, 5.0, 5.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02575206756591797, -0.02501755580306053, -0.024283042177557945, -0.02354852855205536, -0.022814016789197922, -0.022079505026340485, -0.021344991400837898, -0.020610477775335312, -0.019875966012477875, -0.019141454249620438, -0.01840694062411785, -0.017672426998615265, -0.016937915235757828, -0.01620340347290039, -0.015468889847397804, -0.014734377153217793, -0.01399986445903778, -0.013265351764857769, -0.012530839070677757, -0.011796326376497746, -0.011061813682317734, -0.010327300988137722, -0.00959278829395771, -0.008858275599777699, -0.008123762905597687, -0.007389250211417675, -0.006654737517237663, -0.0059202248230576515, -0.00518571212887764, -0.004451199434697628, -0.0037166867405176163, -0.0029821740463376045, -0.0022476613521575928, -0.001513148657977581, -0.0007786359637975693, -4.4123269617557526e-05, 0.0006903894245624542, 0.001424902118742466, 0.0021594148129224777, 0.0028939275071024895, 0.0036284402012825012, 0.004362952895462513, 0.005097465589642525, 0.0058319782838225365, 0.006566490978002548, 0.00730100367218256, 0.008035516366362572, 0.008770029060542583, 0.009504541754722595, 0.010239054448902607, 0.010973567143082619, 0.01170807983726263, 0.012442592531442642, 0.013177105225622654, 0.013911617919802666, 0.014646130613982677, 0.01538064330816269, 0.016115155071020126, 0.016849668696522713, 0.0175841823220253, 0.018318694084882736, 0.019053205847740173, 0.01978771947324276, 0.020522233098745346, 0.021256744861602783]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 5.0, 8.0, 17.0, 4.0, 17.0, 23.0, 23.0, 33.0, 31.0, 31.0, 31.0, 46.0, 54.0, 119.0, 1085.0, 72374.0, 968184.0, 5801.0, 297.0, 70.0, 42.0, 41.0, 33.0, 34.0, 25.0, 26.0, 18.0, 15.0, 13.0, 10.0, 8.0, 7.0, 6.0, 10.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.059356689453125, -0.05771923065185547, -0.05608177185058594, -0.054444313049316406, -0.052806854248046875, -0.051169395446777344, -0.04953193664550781, -0.04789447784423828, -0.04625701904296875, -0.04461956024169922, -0.04298210144042969, -0.041344642639160156, -0.039707183837890625, -0.038069725036621094, -0.03643226623535156, -0.03479480743408203, -0.0331573486328125, -0.03151988983154297, -0.029882431030273438, -0.028244972229003906, -0.026607513427734375, -0.024970054626464844, -0.023332595825195312, -0.02169513702392578, -0.02005767822265625, -0.01842021942138672, -0.016782760620117188, -0.015145301818847656, -0.013507843017578125, -0.011870384216308594, -0.010232925415039062, -0.008595466613769531, -0.0069580078125, -0.005320549011230469, -0.0036830902099609375, -0.0020456314086914062, -0.000408172607421875, 0.0012292861938476562, 0.0028667449951171875, 0.004504203796386719, 0.00614166259765625, 0.007779121398925781, 0.009416580200195312, 0.011054039001464844, 0.012691497802734375, 0.014328956604003906, 0.015966415405273438, 0.01760387420654297, 0.0192413330078125, 0.02087879180908203, 0.022516250610351562, 0.024153709411621094, 0.025791168212890625, 0.027428627014160156, 0.029066085815429688, 0.03070354461669922, 0.03234100341796875, 0.03397846221923828, 0.03561592102050781, 0.037253379821777344, 0.038890838623046875, 0.040528297424316406, 0.04216575622558594, 0.04380321502685547, 0.045440673828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 2.0, 5.0, 5.0, 8.0, 16.0, 14.0, 16.0, 31.0, 30.0, 60.0, 80.0, 67.0, 102.0, 95.0, 101.0, 87.0, 73.0, 61.0, 39.0, 47.0, 20.0, 17.0, 8.0, 13.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0027484893798828125, -0.0026895254850387573, -0.002630561590194702, -0.002571597695350647, -0.002512633800506592, -0.0024536699056625366, -0.0023947060108184814, -0.0023357421159744263, -0.002276778221130371, -0.002217814326286316, -0.0021588504314422607, -0.0020998865365982056, -0.0020409226417541504, -0.001981958746910095, -0.00192299485206604, -0.0018640309572219849, -0.0018050670623779297, -0.0017461031675338745, -0.0016871392726898193, -0.0016281753778457642, -0.001569211483001709, -0.0015102475881576538, -0.0014512836933135986, -0.0013923197984695435, -0.0013333559036254883, -0.001274392008781433, -0.001215428113937378, -0.0011564642190933228, -0.0010975003242492676, -0.0010385364294052124, -0.0009795725345611572, -0.000920608639717102, -0.0008616447448730469, -0.0008026808500289917, -0.0007437169551849365, -0.0006847530603408813, -0.0006257891654968262, -0.000566825270652771, -0.0005078613758087158, -0.00044889748096466064, -0.00038993358612060547, -0.0003309696912765503, -0.0002720057964324951, -0.00021304190158843994, -0.00015407800674438477, -9.511411190032959e-05, -3.6150217056274414e-05, 2.2813677787780762e-05, 8.177757263183594e-05, 0.0001407414674758911, 0.0001997053623199463, 0.00025866925716400146, 0.00031763315200805664, 0.0003765970468521118, 0.000435560941696167, 0.0004945248365402222, 0.0005534887313842773, 0.0006124526262283325, 0.0006714165210723877, 0.0007303804159164429, 0.000789344310760498, 0.0008483082056045532, 0.0009072721004486084, 0.0009662359952926636, 0.0010251998901367188]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 10.0, 11.0, 15.0, 18.0, 20.0, 33.0, 35.0, 48.0, 91.0, 125.0, 156.0, 279.0, 469.0, 1181.0, 4984.0, 44445.0, 737244.0, 240128.0, 14980.0, 2481.0, 721.0, 321.0, 215.0, 139.0, 100.0, 72.0, 58.0, 48.0, 32.0, 22.0, 22.0, 11.0, 7.0, 10.0, 7.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026611328125, -0.025823354721069336, -0.025035381317138672, -0.024247407913208008, -0.023459434509277344, -0.02267146110534668, -0.021883487701416016, -0.02109551429748535, -0.020307540893554688, -0.019519567489624023, -0.01873159408569336, -0.017943620681762695, -0.01715564727783203, -0.016367673873901367, -0.015579700469970703, -0.014791727066040039, -0.014003753662109375, -0.013215780258178711, -0.012427806854248047, -0.011639833450317383, -0.010851860046386719, -0.010063886642456055, -0.00927591323852539, -0.008487939834594727, -0.0076999664306640625, -0.0069119930267333984, -0.006124019622802734, -0.00533604621887207, -0.004548072814941406, -0.003760099411010742, -0.002972126007080078, -0.002184152603149414, -0.00139617919921875, -0.0006082057952880859, 0.00017976760864257812, 0.0009677410125732422, 0.0017557144165039062, 0.0025436878204345703, 0.0033316612243652344, 0.0041196346282958984, 0.0049076080322265625, 0.0056955814361572266, 0.006483554840087891, 0.007271528244018555, 0.008059501647949219, 0.008847475051879883, 0.009635448455810547, 0.010423421859741211, 0.011211395263671875, 0.011999368667602539, 0.012787342071533203, 0.013575315475463867, 0.014363288879394531, 0.015151262283325195, 0.01593923568725586, 0.016727209091186523, 0.017515182495117188, 0.01830315589904785, 0.019091129302978516, 0.01987910270690918, 0.020667076110839844, 0.021455049514770508, 0.022243022918701172, 0.023030996322631836, 0.0238189697265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 8.0, 5.0, 11.0, 16.0, 17.0, 18.0, 18.0, 24.0, 32.0, 25.0, 20.0, 24.0, 36.0, 42.0, 47.0, 45.0, 42.0, 40.0, 40.0, 37.0, 46.0, 26.0, 32.0, 42.0, 29.0, 24.0, 34.0, 26.0, 27.0, 18.0, 26.0, 17.0, 17.0, 15.0, 16.0, 7.0, 7.0, 9.0, 11.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.005279541015625, -0.005106568336486816, -0.004933595657348633, -0.004760622978210449, -0.004587650299072266, -0.004414677619934082, -0.0042417049407958984, -0.004068732261657715, -0.0038957595825195312, -0.0037227869033813477, -0.003549814224243164, -0.0033768415451049805, -0.003203868865966797, -0.0030308961868286133, -0.0028579235076904297, -0.002684950828552246, -0.0025119781494140625, -0.002339005470275879, -0.0021660327911376953, -0.0019930601119995117, -0.0018200874328613281, -0.0016471147537231445, -0.001474142074584961, -0.0013011693954467773, -0.0011281967163085938, -0.0009552240371704102, -0.0007822513580322266, -0.000609278678894043, -0.0004363059997558594, -0.0002633333206176758, -9.036064147949219e-05, 8.26120376586914e-05, 0.000255584716796875, 0.0004285573959350586, 0.0006015300750732422, 0.0007745027542114258, 0.0009474754333496094, 0.001120448112487793, 0.0012934207916259766, 0.0014663934707641602, 0.0016393661499023438, 0.0018123388290405273, 0.001985311508178711, 0.0021582841873168945, 0.002331256866455078, 0.0025042295455932617, 0.0026772022247314453, 0.002850174903869629, 0.0030231475830078125, 0.003196120262145996, 0.0033690929412841797, 0.0035420656204223633, 0.003715038299560547, 0.0038880109786987305, 0.004060983657836914, 0.004233956336975098, 0.004406929016113281, 0.004579901695251465, 0.0047528743743896484, 0.004925847053527832, 0.005098819732666016, 0.005271792411804199, 0.005444765090942383, 0.005617737770080566, 0.00579071044921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 5.0, 7.0, 7.0, 7.0, 5.0, 16.0, 13.0, 22.0, 27.0, 31.0, 41.0, 60.0, 110.0, 125.0, 311.0, 791.0, 2971.0, 21981.0, 738288.0, 268003.0, 12307.0, 2146.0, 599.0, 225.0, 137.0, 78.0, 49.0, 41.0, 24.0, 21.0, 19.0, 15.0, 15.0, 11.0, 6.0, 10.0, 5.0, 3.0, 5.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02032470703125, -0.019620895385742188, -0.018917083740234375, -0.018213272094726562, -0.01750946044921875, -0.016805648803710938, -0.016101837158203125, -0.015398025512695312, -0.0146942138671875, -0.013990402221679688, -0.013286590576171875, -0.012582778930664062, -0.01187896728515625, -0.011175155639648438, -0.010471343994140625, -0.009767532348632812, -0.009063720703125, -0.008359909057617188, -0.007656097412109375, -0.0069522857666015625, -0.00624847412109375, -0.0055446624755859375, -0.004840850830078125, -0.0041370391845703125, -0.0034332275390625, -0.0027294158935546875, -0.002025604248046875, -0.0013217926025390625, -0.00061798095703125, 8.58306884765625e-05, 0.000789642333984375, 0.0014934539794921875, 0.002197265625, 0.0029010772705078125, 0.003604888916015625, 0.0043087005615234375, 0.00501251220703125, 0.0057163238525390625, 0.006420135498046875, 0.0071239471435546875, 0.0078277587890625, 0.008531570434570312, 0.009235382080078125, 0.009939193725585938, 0.01064300537109375, 0.011346817016601562, 0.012050628662109375, 0.012754440307617188, 0.013458251953125, 0.014162063598632812, 0.014865875244140625, 0.015569686889648438, 0.01627349853515625, 0.016977310180664062, 0.017681121826171875, 0.018384933471679688, 0.0190887451171875, 0.019792556762695312, 0.020496368408203125, 0.021200180053710938, 0.02190399169921875, 0.022607803344726562, 0.023311614990234375, 0.024015426635742188, 0.02471923828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 7.0, 12.0, 14.0, 25.0, 42.0, 104.0, 334.0, 262.0, 72.0, 42.0, 20.0, 7.0, 10.0, 9.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029087066650390625, -0.00028004124760627747, -0.0002692118287086487, -0.0002583824098110199, -0.0002475529909133911, -0.00023672357201576233, -0.00022589415311813354, -0.00021506473422050476, -0.00020423531532287598, -0.0001934058964252472, -0.0001825764775276184, -0.00017174705862998962, -0.00016091763973236084, -0.00015008822083473206, -0.00013925880193710327, -0.0001284293830394745, -0.0001175999641418457, -0.00010677054524421692, -9.594112634658813e-05, -8.511170744895935e-05, -7.428228855133057e-05, -6.345286965370178e-05, -5.2623450756073e-05, -4.1794031858444214e-05, -3.096461296081543e-05, -2.0135194063186646e-05, -9.305775165557861e-06, 1.5236437320709229e-06, 1.2353062629699707e-05, 2.318248152732849e-05, 3.4011900424957275e-05, 4.484131932258606e-05, 5.5670738220214844e-05, 6.650015711784363e-05, 7.732957601547241e-05, 8.81589949131012e-05, 9.898841381072998e-05, 0.00010981783270835876, 0.00012064725160598755, 0.00013147667050361633, 0.00014230608940124512, 0.0001531355082988739, 0.00016396492719650269, 0.00017479434609413147, 0.00018562376499176025, 0.00019645318388938904, 0.00020728260278701782, 0.0002181120216846466, 0.0002289414405822754, 0.00023977085947990417, 0.00025060027837753296, 0.00026142969727516174, 0.00027225911617279053, 0.0002830885350704193, 0.0002939179539680481, 0.0003047473728656769, 0.00031557679176330566, 0.00032640621066093445, 0.00033723562955856323, 0.000348065048456192, 0.0003588944673538208, 0.0003697238862514496, 0.00038055330514907837, 0.00039138272404670715, 0.00040221214294433594]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 3.0, 7.0, 5.0, 6.0, 13.0, 9.0, 19.0, 33.0, 61.0, 139.0, 461.0, 3878.0, 999612.0, 42622.0, 1247.0, 244.0, 73.0, 38.0, 26.0, 22.0, 12.0, 6.0, 10.0, 4.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0882568359375, -0.08539009094238281, -0.08252334594726562, -0.07965660095214844, -0.07678985595703125, -0.07392311096191406, -0.07105636596679688, -0.06818962097167969, -0.0653228759765625, -0.06245613098144531, -0.059589385986328125, -0.05672264099121094, -0.05385589599609375, -0.05098915100097656, -0.048122406005859375, -0.04525566101074219, -0.042388916015625, -0.03952217102050781, -0.036655426025390625, -0.03378868103027344, -0.03092193603515625, -0.028055191040039062, -0.025188446044921875, -0.022321701049804688, -0.0194549560546875, -0.016588211059570312, -0.013721466064453125, -0.010854721069335938, -0.00798797607421875, -0.0051212310791015625, -0.002254486083984375, 0.0006122589111328125, 0.00347900390625, 0.0063457489013671875, 0.009212493896484375, 0.012079238891601562, 0.01494598388671875, 0.017812728881835938, 0.020679473876953125, 0.023546218872070312, 0.0264129638671875, 0.029279708862304688, 0.032146453857421875, 0.03501319885253906, 0.03787994384765625, 0.04074668884277344, 0.043613433837890625, 0.04648017883300781, 0.049346923828125, 0.05221366882324219, 0.055080413818359375, 0.05794715881347656, 0.06081390380859375, 0.06368064880371094, 0.06654739379882812, 0.06941413879394531, 0.0722808837890625, 0.07514762878417969, 0.07801437377929688, 0.08088111877441406, 0.08374786376953125, 0.08661460876464844, 0.08948135375976562, 0.09234809875488281, 0.09521484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 17.0, 25.0, 62.0, 154.0, 375.0, 205.0, 69.0, 36.0, 14.0, 4.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.031951904296875, -0.03120255470275879, -0.030453205108642578, -0.029703855514526367, -0.028954505920410156, -0.028205156326293945, -0.027455806732177734, -0.026706457138061523, -0.025957107543945312, -0.0252077579498291, -0.02445840835571289, -0.02370905876159668, -0.02295970916748047, -0.022210359573364258, -0.021461009979248047, -0.020711660385131836, -0.019962310791015625, -0.019212961196899414, -0.018463611602783203, -0.017714262008666992, -0.01696491241455078, -0.01621556282043457, -0.01546621322631836, -0.014716863632202148, -0.013967514038085938, -0.013218164443969727, -0.012468814849853516, -0.011719465255737305, -0.010970115661621094, -0.010220766067504883, -0.009471416473388672, -0.008722066879272461, -0.00797271728515625, -0.007223367691040039, -0.006474018096923828, -0.005724668502807617, -0.004975318908691406, -0.004225969314575195, -0.0034766197204589844, -0.0027272701263427734, -0.0019779205322265625, -0.0012285709381103516, -0.0004792213439941406, 0.0002701282501220703, 0.0010194778442382812, 0.0017688274383544922, 0.002518177032470703, 0.003267526626586914, 0.004016876220703125, 0.004766225814819336, 0.005515575408935547, 0.006264925003051758, 0.007014274597167969, 0.00776362419128418, 0.00851297378540039, 0.009262323379516602, 0.010011672973632812, 0.010761022567749023, 0.011510372161865234, 0.012259721755981445, 0.013009071350097656, 0.013758420944213867, 0.014507770538330078, 0.015257120132446289, 0.0160064697265625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 20.0, 848.0, 142.0, 4.0, 1.0, 1.0], "bins": [-1.373142957687378, -1.3501344919204712, -1.3271260261535645, -1.3041174411773682, -1.2811089754104614, -1.2581005096435547, -1.235092043876648, -1.2120834589004517, -1.189074993133545, -1.1660665273666382, -1.1430580615997314, -1.1200494766235352, -1.0970410108566284, -1.0740325450897217, -1.051024079322815, -1.0280154943466187, -1.005007028579712, -0.9819985628128052, -0.9589900374412537, -0.9359815716743469, -0.9129730463027954, -0.8899645805358887, -0.8669560551643372, -0.8439475893974304, -0.8209391236305237, -0.7979306578636169, -0.7749221324920654, -0.7519136667251587, -0.7289051413536072, -0.7058966755867004, -0.6828881502151489, -0.6598796844482422, -0.6368711590766907, -0.6138626933097839, -0.5908541679382324, -0.5678457021713257, -0.5448371767997742, -0.5218287110328674, -0.4988201856613159, -0.4758117198944092, -0.45280319452285767, -0.42979469895362854, -0.4067862033843994, -0.3837777078151703, -0.36076921224594116, -0.33776071667671204, -0.3147522211074829, -0.29174375534057617, -0.26873522996902466, -0.24572673439979553, -0.2227182388305664, -0.19970974326133728, -0.17670124769210815, -0.15369275212287903, -0.1306842714548111, -0.10767577588558197, -0.08466729521751404, -0.06165879964828491, -0.038650307804346085, -0.015641815960407257, 0.007366679608821869, 0.030375175178050995, 0.053383663296699524, 0.07639215886592865, 0.09940065443515778]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 18.0, 23.0, 16.0, 32.0, 49.0, 49.0, 61.0, 63.0, 76.0, 67.0, 82.0, 59.0, 71.0, 81.0, 50.0, 54.0, 37.0, 28.0, 31.0, 16.0, 16.0, 8.0, 2.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039511680603027344, -0.03701457381248474, -0.03451746329665184, -0.03202035278081894, -0.029523245990276337, -0.027026137337088585, -0.024529028683900833, -0.02203192003071308, -0.01953481137752533, -0.017037702724337578, -0.014540594071149826, -0.012043485417962074, -0.009546376764774323, -0.007049268111586571, -0.004552159458398819, -0.002055050805211067, 0.00044205784797668457, 0.0029391665011644363, 0.005436275154352188, 0.00793338380753994, 0.010430492460727692, 0.012927601113915443, 0.015424709767103195, 0.017921818420290947, 0.0204189270734787, 0.02291603572666645, 0.025413144379854202, 0.027910253033041954, 0.030407361686229706, 0.03290446847677231, 0.03540157899260521, 0.03789868950843811, 0.04039579629898071, 0.042892903089523315, 0.045390013605356216, 0.04788712412118912, 0.05038423091173172, 0.05288133770227432, 0.055378448218107224, 0.057875558733940125, 0.06037266552448273, 0.06286977231502533, 0.06536687910556793, 0.06786399334669113, 0.07036110013723373, 0.07285820692777634, 0.07535532116889954, 0.07785242795944214, 0.08034953474998474, 0.08284664154052734, 0.08534374833106995, 0.08784086257219315, 0.09033796936273575, 0.09283507615327835, 0.09533219039440155, 0.09782929718494415, 0.10032640397548676, 0.10282351076602936, 0.10532061755657196, 0.10781773179769516, 0.11031483858823776, 0.11281194537878036, 0.11530905961990356, 0.11780616641044617, 0.12030327320098877]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 14.0, 23.0, 23.0, 49.0, 81.0, 126.0, 250.0, 513.0, 1238.0, 4178256.0, 12843.0, 545.0, 193.0, 71.0, 40.0, 11.0, 6.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.264404296875, -0.25939035415649414, -0.2543764114379883, -0.24936246871948242, -0.24434852600097656, -0.2393345832824707, -0.23432064056396484, -0.22930669784545898, -0.22429275512695312, -0.21927881240844727, -0.2142648696899414, -0.20925092697143555, -0.2042369842529297, -0.19922304153442383, -0.19420909881591797, -0.1891951560974121, -0.18418121337890625, -0.1791672706604004, -0.17415332794189453, -0.16913938522338867, -0.1641254425048828, -0.15911149978637695, -0.1540975570678711, -0.14908361434936523, -0.14406967163085938, -0.13905572891235352, -0.13404178619384766, -0.1290278434753418, -0.12401390075683594, -0.11899995803833008, -0.11398601531982422, -0.10897207260131836, -0.1039581298828125, -0.09894418716430664, -0.09393024444580078, -0.08891630172729492, -0.08390235900878906, -0.0788884162902832, -0.07387447357177734, -0.06886053085327148, -0.06384658813476562, -0.058832645416259766, -0.053818702697753906, -0.04880475997924805, -0.04379081726074219, -0.03877687454223633, -0.03376293182373047, -0.02874898910522461, -0.02373504638671875, -0.01872110366821289, -0.013707160949707031, -0.008693218231201172, -0.0036792755126953125, 0.0013346672058105469, 0.006348609924316406, 0.011362552642822266, 0.016376495361328125, 0.021390438079833984, 0.026404380798339844, 0.0314183235168457, 0.03643226623535156, 0.04144620895385742, 0.04646015167236328, 0.05147409439086914, 0.056488037109375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 4.0, 13.0, 8.0, 21.0, 28.0, 33.0, 50.0, 54.0, 78.0, 88.0, 105.0, 97.0, 99.0, 92.0, 72.0, 53.0, 36.0, 23.0, 15.0, 14.0, 8.0, 6.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.003265380859375, -0.0031944215297698975, -0.003123462200164795, -0.0030525028705596924, -0.00298154354095459, -0.0029105842113494873, -0.0028396248817443848, -0.0027686655521392822, -0.0026977062225341797, -0.002626746892929077, -0.0025557875633239746, -0.002484828233718872, -0.0024138689041137695, -0.002342909574508667, -0.0022719502449035645, -0.002200990915298462, -0.0021300315856933594, -0.002059072256088257, -0.0019881129264831543, -0.0019171535968780518, -0.0018461942672729492, -0.0017752349376678467, -0.0017042756080627441, -0.0016333162784576416, -0.001562356948852539, -0.0014913976192474365, -0.001420438289642334, -0.0013494789600372314, -0.001278519630432129, -0.0012075603008270264, -0.0011366009712219238, -0.0010656416416168213, -0.0009946823120117188, -0.0009237229824066162, -0.0008527636528015137, -0.0007818043231964111, -0.0007108449935913086, -0.0006398856639862061, -0.0005689263343811035, -0.000497967004776001, -0.00042700767517089844, -0.0003560483455657959, -0.00028508901596069336, -0.00021412968635559082, -0.00014317035675048828, -7.221102714538574e-05, -1.2516975402832031e-06, 6.970763206481934e-05, 0.00014066696166992188, 0.00021162629127502441, 0.00028258562088012695, 0.0003535449504852295, 0.00042450428009033203, 0.0004954636096954346, 0.0005664229393005371, 0.0006373822689056396, 0.0007083415985107422, 0.0007793009281158447, 0.0008502602577209473, 0.0009212195873260498, 0.0009921789169311523, 0.0010631382465362549, 0.0011340975761413574, 0.00120505690574646, 0.0012760162353515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 10.0, 13.0, 36.0, 48.0, 98.0, 128.0, 169.0, 252.0, 762.0, 4189696.0, 2360.0, 261.0, 166.0, 111.0, 69.0, 42.0, 35.0, 14.0, 10.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65185546875, -0.6372528076171875, -0.622650146484375, -0.6080474853515625, -0.59344482421875, -0.5788421630859375, -0.564239501953125, -0.5496368408203125, -0.5350341796875, -0.5204315185546875, -0.505828857421875, -0.4912261962890625, -0.47662353515625, -0.4620208740234375, -0.447418212890625, -0.4328155517578125, -0.418212890625, -0.4036102294921875, -0.389007568359375, -0.3744049072265625, -0.35980224609375, -0.3451995849609375, -0.330596923828125, -0.3159942626953125, -0.3013916015625, -0.2867889404296875, -0.272186279296875, -0.2575836181640625, -0.24298095703125, -0.2283782958984375, -0.213775634765625, -0.1991729736328125, -0.1845703125, -0.1699676513671875, -0.155364990234375, -0.1407623291015625, -0.12615966796875, -0.1115570068359375, -0.096954345703125, -0.0823516845703125, -0.0677490234375, -0.0531463623046875, -0.038543701171875, -0.0239410400390625, -0.00933837890625, 0.0052642822265625, 0.019866943359375, 0.0344696044921875, 0.049072265625, 0.0636749267578125, 0.078277587890625, 0.0928802490234375, 0.10748291015625, 0.1220855712890625, 0.136688232421875, 0.1512908935546875, 0.1658935546875, 0.1804962158203125, 0.195098876953125, 0.2097015380859375, 0.22430419921875, 0.2389068603515625, 0.253509521484375, 0.2681121826171875, 0.28271484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 18.0, 306.0, 3605.0, 138.0, 17.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.064453125, -0.06330907344818115, -0.062165021896362305, -0.06102097034454346, -0.05987691879272461, -0.05873286724090576, -0.057588815689086914, -0.056444764137268066, -0.05530071258544922, -0.05415666103363037, -0.05301260948181152, -0.051868557929992676, -0.05072450637817383, -0.04958045482635498, -0.04843640327453613, -0.047292351722717285, -0.04614830017089844, -0.04500424861907959, -0.04386019706726074, -0.042716145515441895, -0.04157209396362305, -0.0404280424118042, -0.03928399085998535, -0.038139939308166504, -0.036995887756347656, -0.03585183620452881, -0.03470778465270996, -0.03356373310089111, -0.032419681549072266, -0.03127562999725342, -0.03013157844543457, -0.028987526893615723, -0.027843475341796875, -0.026699423789978027, -0.02555537223815918, -0.024411320686340332, -0.023267269134521484, -0.022123217582702637, -0.02097916603088379, -0.01983511447906494, -0.018691062927246094, -0.017547011375427246, -0.0164029598236084, -0.01525890827178955, -0.014114856719970703, -0.012970805168151855, -0.011826753616333008, -0.01068270206451416, -0.009538650512695312, -0.008394598960876465, -0.007250547409057617, -0.0061064958572387695, -0.004962444305419922, -0.0038183927536010742, -0.0026743412017822266, -0.001530289649963379, -0.00038623809814453125, 0.0007578134536743164, 0.001901865005493164, 0.0030459165573120117, 0.004189968109130859, 0.005334019660949707, 0.006478071212768555, 0.007622122764587402, 0.00876617431640625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 13.0, 55.0, 277.0, 561.0, 80.0, 10.0, 12.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6964147090911865, -0.6833183765411377, -0.6702221035957336, -0.6571257710456848, -0.644029438495636, -0.6309331059455872, -0.6178368330001831, -0.6047405004501343, -0.5916441679000854, -0.5785478353500366, -0.5654515624046326, -0.5523552298545837, -0.5392588973045349, -0.5261625647544861, -0.513066291809082, -0.4999699592590332, -0.48687365651130676, -0.4737773537635803, -0.4606810212135315, -0.44758471846580505, -0.4344883859157562, -0.4213920831680298, -0.40829575061798096, -0.3951994478702545, -0.3821031451225281, -0.36900684237480164, -0.3559105098247528, -0.34281420707702637, -0.32971787452697754, -0.3166215717792511, -0.30352526903152466, -0.29042893648147583, -0.277332603931427, -0.26423630118370056, -0.25113996863365173, -0.2380436658859253, -0.22494733333587646, -0.21185103058815002, -0.1987547129392624, -0.18565839529037476, -0.17256207764148712, -0.1594657599925995, -0.14636944234371185, -0.13327312469482422, -0.12017681449651718, -0.10708049684762955, -0.09398418664932251, -0.08088786900043488, -0.06779155135154724, -0.05469523370265961, -0.04159891977906227, -0.028502605855464935, -0.015406288206577301, -0.0023099705576896667, 0.01078633964061737, 0.023882657289505005, 0.03697897493839264, 0.05007529258728027, 0.06317161023616791, 0.07626792043447495, 0.08936423808336258, 0.10246055573225021, 0.11555686593055725, 0.12865318357944489, 0.14174950122833252]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 14.0, 20.0, 42.0, 74.0, 104.0, 135.0, 156.0, 157.0, 108.0, 93.0, 40.0, 29.0, 18.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1467735767364502, -0.14198756217956543, -0.13720156252384186, -0.1324155479669571, -0.12762954831123352, -0.12284353375434875, -0.11805751919746399, -0.11327151209115982, -0.10848550498485565, -0.10369949787855148, -0.09891349077224731, -0.09412747621536255, -0.08934146910905838, -0.08455546200275421, -0.07976944744586945, -0.07498344033956528, -0.07019743323326111, -0.06541142612695694, -0.06062541529536247, -0.055839404463768005, -0.05105339735746384, -0.04626739025115967, -0.0414813794195652, -0.036695368587970734, -0.031909361481666565, -0.027123352512717247, -0.02233734354376793, -0.01755133457481861, -0.012765325605869293, -0.007979316636919975, -0.0031933076679706573, 0.0015927031636238098, 0.0063787102699279785, 0.011164719238877296, 0.015950728207826614, 0.020736737176775932, 0.02552274614572525, 0.030308755114674568, 0.035094764083623886, 0.03988077491521835, 0.04466678202152252, 0.04945278912782669, 0.05423879995942116, 0.059024810791015625, 0.0638108178973198, 0.06859682500362396, 0.07338283956050873, 0.0781688466668129, 0.08295485377311707, 0.08774086087942123, 0.0925268679857254, 0.09731288254261017, 0.10209888964891434, 0.1068848967552185, 0.11167091131210327, 0.11645691841840744, 0.12124292552471161, 0.12602894008159637, 0.13081493973731995, 0.1356009542942047, 0.14038696885108948, 0.14517296850681305, 0.14995898306369781, 0.1547449827194214, 0.15953099727630615]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 7.0, 4.0, 5.0, 14.0, 3.0, 12.0, 15.0, 19.0, 20.0, 29.0, 47.0, 65.0, 100.0, 172.0, 253.0, 464.0, 950.0, 2402.0, 9665.0, 64449.0, 826133.0, 123631.0, 14052.0, 3350.0, 1180.0, 581.0, 304.0, 196.0, 111.0, 79.0, 59.0, 38.0, 35.0, 27.0, 12.0, 13.0, 10.0, 11.0, 4.0, 6.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0], "bins": [-0.07342529296875, -0.07117462158203125, -0.0689239501953125, -0.06667327880859375, -0.064422607421875, -0.06217193603515625, -0.0599212646484375, -0.05767059326171875, -0.055419921875, -0.05316925048828125, -0.0509185791015625, -0.04866790771484375, -0.046417236328125, -0.04416656494140625, -0.0419158935546875, -0.03966522216796875, -0.03741455078125, -0.03516387939453125, -0.0329132080078125, -0.03066253662109375, -0.028411865234375, -0.02616119384765625, -0.0239105224609375, -0.02165985107421875, -0.0194091796875, -0.01715850830078125, -0.0149078369140625, -0.01265716552734375, -0.010406494140625, -0.00815582275390625, -0.0059051513671875, -0.00365447998046875, -0.00140380859375, 0.00084686279296875, 0.0030975341796875, 0.00534820556640625, 0.007598876953125, 0.00984954833984375, 0.0121002197265625, 0.01435089111328125, 0.0166015625, 0.01885223388671875, 0.0211029052734375, 0.02335357666015625, 0.025604248046875, 0.02785491943359375, 0.0301055908203125, 0.03235626220703125, 0.03460693359375, 0.03685760498046875, 0.0391082763671875, 0.04135894775390625, 0.043609619140625, 0.04586029052734375, 0.0481109619140625, 0.05036163330078125, 0.0526123046875, 0.05486297607421875, 0.0571136474609375, 0.05936431884765625, 0.061614990234375, 0.06386566162109375, 0.0661163330078125, 0.06836700439453125, 0.07061767578125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 14.0, 34.0, 35.0, 43.0, 76.0, 85.0, 131.0, 118.0, 117.0, 99.0, 75.0, 50.0, 38.0, 24.0, 19.0, 11.0, 6.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00800323486328125, -0.00777745246887207, -0.007551670074462891, -0.007325887680053711, -0.007100105285644531, -0.0068743228912353516, -0.006648540496826172, -0.006422758102416992, -0.0061969757080078125, -0.005971193313598633, -0.005745410919189453, -0.0055196285247802734, -0.005293846130371094, -0.005068063735961914, -0.004842281341552734, -0.004616498947143555, -0.004390716552734375, -0.004164934158325195, -0.003939151763916016, -0.003713369369506836, -0.0034875869750976562, -0.0032618045806884766, -0.003036022186279297, -0.002810239791870117, -0.0025844573974609375, -0.002358675003051758, -0.002132892608642578, -0.0019071102142333984, -0.0016813278198242188, -0.001455545425415039, -0.0012297630310058594, -0.0010039806365966797, -0.0007781982421875, -0.0005524158477783203, -0.0003266334533691406, -0.00010085105895996094, 0.00012493133544921875, 0.00035071372985839844, 0.0005764961242675781, 0.0008022785186767578, 0.0010280609130859375, 0.0012538433074951172, 0.0014796257019042969, 0.0017054080963134766, 0.0019311904907226562, 0.002156972885131836, 0.0023827552795410156, 0.0026085376739501953, 0.002834320068359375, 0.0030601024627685547, 0.0032858848571777344, 0.003511667251586914, 0.0037374496459960938, 0.0039632320404052734, 0.004189014434814453, 0.004414796829223633, 0.0046405792236328125, 0.004866361618041992, 0.005092144012451172, 0.0053179264068603516, 0.005543708801269531, 0.005769491195678711, 0.005995273590087891, 0.00622105598449707, 0.00644683837890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 11.0, 10.0, 14.0, 21.0, 26.0, 37.0, 51.0, 77.0, 152.0, 346.0, 1014.0, 4052.0, 26348.0, 568964.0, 420815.0, 21549.0, 3461.0, 892.0, 318.0, 142.0, 78.0, 49.0, 35.0, 23.0, 19.0, 11.0, 12.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05523681640625, -0.053452491760253906, -0.05166816711425781, -0.04988384246826172, -0.048099517822265625, -0.04631519317626953, -0.04453086853027344, -0.042746543884277344, -0.04096221923828125, -0.039177894592285156, -0.03739356994628906, -0.03560924530029297, -0.033824920654296875, -0.03204059600830078, -0.030256271362304688, -0.028471946716308594, -0.0266876220703125, -0.024903297424316406, -0.023118972778320312, -0.02133464813232422, -0.019550323486328125, -0.01776599884033203, -0.015981674194335938, -0.014197349548339844, -0.01241302490234375, -0.010628700256347656, -0.008844375610351562, -0.007060050964355469, -0.005275726318359375, -0.0034914016723632812, -0.0017070770263671875, 7.724761962890625e-05, 0.001861572265625, 0.0036458969116210938, 0.0054302215576171875, 0.007214546203613281, 0.008998870849609375, 0.010783195495605469, 0.012567520141601562, 0.014351844787597656, 0.01613616943359375, 0.017920494079589844, 0.019704818725585938, 0.02148914337158203, 0.023273468017578125, 0.02505779266357422, 0.026842117309570312, 0.028626441955566406, 0.0304107666015625, 0.032195091247558594, 0.03397941589355469, 0.03576374053955078, 0.037548065185546875, 0.03933238983154297, 0.04111671447753906, 0.042901039123535156, 0.04468536376953125, 0.046469688415527344, 0.04825401306152344, 0.05003833770751953, 0.051822662353515625, 0.05360698699951172, 0.05539131164550781, 0.057175636291503906, 0.0589599609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 7.0, 7.0, 8.0, 6.0, 17.0, 16.0, 26.0, 17.0, 26.0, 40.0, 40.0, 38.0, 62.0, 68.0, 63.0, 62.0, 64.0, 55.0, 57.0, 58.0, 62.0, 39.0, 34.0, 28.0, 26.0, 16.0, 14.0, 12.0, 11.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184783935546875, -0.0178835391998291, -0.017288684844970703, -0.016693830490112305, -0.016098976135253906, -0.015504121780395508, -0.01490926742553711, -0.014314413070678711, -0.013719558715820312, -0.013124704360961914, -0.012529850006103516, -0.011934995651245117, -0.011340141296386719, -0.01074528694152832, -0.010150432586669922, -0.009555578231811523, -0.008960723876953125, -0.008365869522094727, -0.007771015167236328, -0.00717616081237793, -0.006581306457519531, -0.005986452102661133, -0.005391597747802734, -0.004796743392944336, -0.0042018890380859375, -0.003607034683227539, -0.0030121803283691406, -0.002417325973510742, -0.0018224716186523438, -0.0012276172637939453, -0.0006327629089355469, -3.790855407714844e-05, 0.00055694580078125, 0.0011518001556396484, 0.0017466545104980469, 0.0023415088653564453, 0.0029363632202148438, 0.003531217575073242, 0.004126071929931641, 0.004720926284790039, 0.0053157806396484375, 0.005910634994506836, 0.006505489349365234, 0.007100343704223633, 0.007695198059082031, 0.00829005241394043, 0.008884906768798828, 0.009479761123657227, 0.010074615478515625, 0.010669469833374023, 0.011264324188232422, 0.01185917854309082, 0.012454032897949219, 0.013048887252807617, 0.013643741607666016, 0.014238595962524414, 0.014833450317382812, 0.015428304672241211, 0.01602315902709961, 0.016618013381958008, 0.017212867736816406, 0.017807722091674805, 0.018402576446533203, 0.0189974308013916, 0.01959228515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 9.0, 12.0, 15.0, 11.0, 30.0, 32.0, 47.0, 92.0, 204.0, 406.0, 891.0, 2672.0, 12909.0, 722256.0, 297016.0, 8254.0, 2157.0, 773.0, 343.0, 164.0, 92.0, 54.0, 32.0, 21.0, 10.0, 16.0, 10.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.052459716796875, -0.05095624923706055, -0.049452781677246094, -0.04794931411743164, -0.04644584655761719, -0.044942378997802734, -0.04343891143798828, -0.04193544387817383, -0.040431976318359375, -0.03892850875854492, -0.03742504119873047, -0.035921573638916016, -0.03441810607910156, -0.03291463851928711, -0.031411170959472656, -0.029907703399658203, -0.02840423583984375, -0.026900768280029297, -0.025397300720214844, -0.02389383316040039, -0.022390365600585938, -0.020886898040771484, -0.01938343048095703, -0.017879962921142578, -0.016376495361328125, -0.014873027801513672, -0.013369560241699219, -0.011866092681884766, -0.010362625122070312, -0.00885915756225586, -0.007355690002441406, -0.005852222442626953, -0.0043487548828125, -0.002845287322998047, -0.0013418197631835938, 0.00016164779663085938, 0.0016651153564453125, 0.0031685829162597656, 0.004672050476074219, 0.006175518035888672, 0.007678985595703125, 0.009182453155517578, 0.010685920715332031, 0.012189388275146484, 0.013692855834960938, 0.01519632339477539, 0.016699790954589844, 0.018203258514404297, 0.01970672607421875, 0.021210193634033203, 0.022713661193847656, 0.02421712875366211, 0.025720596313476562, 0.027224063873291016, 0.02872753143310547, 0.030230998992919922, 0.031734466552734375, 0.03323793411254883, 0.03474140167236328, 0.036244869232177734, 0.03774833679199219, 0.03925180435180664, 0.040755271911621094, 0.04225873947143555, 0.04376220703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 2.0, 11.0, 12.0, 10.0, 23.0, 16.0, 32.0, 33.0, 41.0, 51.0, 89.0, 120.0, 153.0, 131.0, 87.0, 49.0, 37.0, 40.0, 17.0, 13.0, 11.0, 11.0, 8.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011807680130004883, -0.00011302437633275986, -0.00010797195136547089, -0.00010291952639818192, -9.786710143089294e-05, -9.281467646360397e-05, -8.7762251496315e-05, -8.270982652902603e-05, -7.765740156173706e-05, -7.260497659444809e-05, -6.755255162715912e-05, -6.250012665987015e-05, -5.744770169258118e-05, -5.2395276725292206e-05, -4.7342851758003235e-05, -4.2290426790714264e-05, -3.723800182342529e-05, -3.218557685613632e-05, -2.713315188884735e-05, -2.208072692155838e-05, -1.702830195426941e-05, -1.1975876986980438e-05, -6.923452019691467e-06, -1.8710270524024963e-06, 3.1813979148864746e-06, 8.233822882175446e-06, 1.3286247849464417e-05, 1.8338672816753387e-05, 2.339109778404236e-05, 2.844352275133133e-05, 3.34959477186203e-05, 3.854837268590927e-05, 4.360079765319824e-05, 4.865322262048721e-05, 5.3705647587776184e-05, 5.8758072555065155e-05, 6.381049752235413e-05, 6.88629224896431e-05, 7.391534745693207e-05, 7.896777242422104e-05, 8.402019739151001e-05, 8.907262235879898e-05, 9.412504732608795e-05, 9.917747229337692e-05, 0.0001042298972606659, 0.00010928232222795486, 0.00011433474719524384, 0.0001193871721625328, 0.00012443959712982178, 0.00012949202209711075, 0.00013454444706439972, 0.0001395968720316887, 0.00014464929699897766, 0.00014970172196626663, 0.0001547541469335556, 0.00015980657190084457, 0.00016485899686813354, 0.00016991142183542252, 0.0001749638468027115, 0.00018001627177000046, 0.00018506869673728943, 0.0001901211217045784, 0.00019517354667186737, 0.00020022597163915634, 0.0002052783966064453]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 3.0, 8.0, 17.0, 23.0, 50.0, 91.0, 217.0, 771.0, 6566.0, 801366.0, 234682.0, 3753.0, 627.0, 192.0, 79.0, 48.0, 25.0, 8.0, 9.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.057861328125, -0.05553627014160156, -0.053211212158203125, -0.05088615417480469, -0.04856109619140625, -0.04623603820800781, -0.043910980224609375, -0.04158592224121094, -0.0392608642578125, -0.03693580627441406, -0.034610748291015625, -0.03228569030761719, -0.02996063232421875, -0.027635574340820312, -0.025310516357421875, -0.022985458374023438, -0.020660400390625, -0.018335342407226562, -0.016010284423828125, -0.013685226440429688, -0.01136016845703125, -0.009035110473632812, -0.006710052490234375, -0.0043849945068359375, -0.0020599365234375, 0.0002651214599609375, 0.002590179443359375, 0.0049152374267578125, 0.00724029541015625, 0.009565353393554688, 0.011890411376953125, 0.014215469360351562, 0.01654052734375, 0.018865585327148438, 0.021190643310546875, 0.023515701293945312, 0.02584075927734375, 0.028165817260742188, 0.030490875244140625, 0.03281593322753906, 0.0351409912109375, 0.03746604919433594, 0.039791107177734375, 0.04211616516113281, 0.04444122314453125, 0.04676628112792969, 0.049091339111328125, 0.05141639709472656, 0.053741455078125, 0.05606651306152344, 0.058391571044921875, 0.06071662902832031, 0.06304168701171875, 0.06536674499511719, 0.06769180297851562, 0.07001686096191406, 0.0723419189453125, 0.07466697692871094, 0.07699203491210938, 0.07931709289550781, 0.08164215087890625, 0.08396720886230469, 0.08629226684570312, 0.08861732482910156, 0.0909423828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 2.0, 6.0, 16.0, 17.0, 32.0, 39.0, 83.0, 137.0, 173.0, 188.0, 132.0, 63.0, 30.0, 28.0, 18.0, 11.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016326904296875, -0.015503883361816406, -0.014680862426757812, -0.013857841491699219, -0.013034820556640625, -0.012211799621582031, -0.011388778686523438, -0.010565757751464844, -0.00974273681640625, -0.008919715881347656, -0.008096694946289062, -0.007273674011230469, -0.006450653076171875, -0.005627632141113281, -0.0048046112060546875, -0.003981590270996094, -0.0031585693359375, -0.0023355484008789062, -0.0015125274658203125, -0.0006895065307617188, 0.000133514404296875, 0.0009565353393554688, 0.0017795562744140625, 0.0026025772094726562, 0.00342559814453125, 0.004248619079589844, 0.0050716400146484375, 0.005894660949707031, 0.006717681884765625, 0.007540702819824219, 0.008363723754882812, 0.009186744689941406, 0.010009765625, 0.010832786560058594, 0.011655807495117188, 0.012478828430175781, 0.013301849365234375, 0.014124870300292969, 0.014947891235351562, 0.015770912170410156, 0.01659393310546875, 0.017416954040527344, 0.018239974975585938, 0.01906299591064453, 0.019886016845703125, 0.02070903778076172, 0.021532058715820312, 0.022355079650878906, 0.0231781005859375, 0.024001121520996094, 0.024824142456054688, 0.02564716339111328, 0.026470184326171875, 0.02729320526123047, 0.028116226196289062, 0.028939247131347656, 0.02976226806640625, 0.030585289001464844, 0.03140830993652344, 0.03223133087158203, 0.033054351806640625, 0.03387737274169922, 0.03470039367675781, 0.035523414611816406, 0.036346435546875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 320.0, 605.0, 59.0, 12.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6035652160644531, -1.5738805532455444, -1.5441958904266357, -1.514511227607727, -1.4848265647888184, -1.4551417827606201, -1.4254571199417114, -1.3957724571228027, -1.366087794303894, -1.3364031314849854, -1.3067184686660767, -1.277033805847168, -1.2473490238189697, -1.217664361000061, -1.1879796981811523, -1.1582950353622437, -1.128610372543335, -1.0989257097244263, -1.0692410469055176, -1.0395563840866089, -1.0098717212677002, -0.9801869988441467, -0.9505022764205933, -0.9208176136016846, -0.8911329507827759, -0.8614482879638672, -0.8317636251449585, -0.802078902721405, -0.7723942399024963, -0.7427095770835876, -0.7130248546600342, -0.6833401918411255, -0.6536555290222168, -0.6239708662033081, -0.5942862033843994, -0.564601480960846, -0.5349168181419373, -0.5052321553230286, -0.4755474627017975, -0.4458627700805664, -0.4161781072616577, -0.386493444442749, -0.35680875182151794, -0.32712405920028687, -0.2974393963813782, -0.2677547335624695, -0.2380700409412384, -0.20838536322116852, -0.17870068550109863, -0.14901600778102875, -0.11933133006095886, -0.08964665234088898, -0.05996197462081909, -0.030277296900749207, -0.0005926191806793213, 0.029092058539390564, 0.05877673625946045, 0.08846141397953033, 0.11814609169960022, 0.1478307694196701, 0.17751544713974, 0.20720012485980988, 0.23688480257987976, 0.26656949520111084, 0.29625415802001953]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 9.0, 6.0, 12.0, 14.0, 35.0, 29.0, 37.0, 44.0, 66.0, 70.0, 64.0, 77.0, 75.0, 78.0, 75.0, 62.0, 59.0, 44.0, 40.0, 27.0, 33.0, 19.0, 11.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15021491050720215, -0.14463640749454498, -0.13905788958072662, -0.13347938656806946, -0.1279008835554123, -0.12232237309217453, -0.11674386262893677, -0.1111653596162796, -0.10558684915304184, -0.10000833868980408, -0.09442983567714691, -0.08885132521390915, -0.08327281475067139, -0.07769431173801422, -0.07211580127477646, -0.0665372908115387, -0.06095878779888153, -0.05538028106093407, -0.0498017743229866, -0.04422326385974884, -0.038644757121801376, -0.03306625038385391, -0.02748773992061615, -0.021909233182668686, -0.016330726444721222, -0.010752218775451183, -0.005173711106181145, 0.0004047974944114685, 0.0059833042323589325, 0.011561810970306396, 0.01714032143354416, 0.022718828171491623, 0.028297334909439087, 0.03387584164738655, 0.039454348385334015, 0.04503285884857178, 0.05061136558651924, 0.056189872324466705, 0.06176838278770447, 0.06734688580036163, 0.0729253962635994, 0.07850390672683716, 0.08408240973949432, 0.08966092020273209, 0.09523943066596985, 0.10081793367862701, 0.10639644414186478, 0.11197495460510254, 0.1175534576177597, 0.12313196808099747, 0.12871047854423523, 0.1342889815568924, 0.13986748456954956, 0.14544600248336792, 0.15102450549602509, 0.15660300850868225, 0.1621815264225006, 0.16776002943515778, 0.17333854734897614, 0.1789170503616333, 0.18449555337429047, 0.19007405638694763, 0.195652574300766, 0.20123107731342316, 0.20680958032608032]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 14.0, 12.0, 6.0, 9.0, 13.0, 14.0, 20.0, 19.0, 17.0, 33.0, 43.0, 50.0, 79.0, 103.0, 161.0, 310.0, 498.0, 1084.0, 3094.0, 14618.0, 235106.0, 3880559.0, 49414.0, 6590.0, 1561.0, 510.0, 179.0, 84.0, 30.0, 16.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.1549072265625, -0.1517624855041504, -0.14861774444580078, -0.14547300338745117, -0.14232826232910156, -0.13918352127075195, -0.13603878021240234, -0.13289403915405273, -0.12974929809570312, -0.12660455703735352, -0.1234598159790039, -0.1203150749206543, -0.11717033386230469, -0.11402559280395508, -0.11088085174560547, -0.10773611068725586, -0.10459136962890625, -0.10144662857055664, -0.09830188751220703, -0.09515714645385742, -0.09201240539550781, -0.0888676643371582, -0.0857229232788086, -0.08257818222045898, -0.07943344116210938, -0.07628870010375977, -0.07314395904541016, -0.06999921798706055, -0.06685447692871094, -0.06370973587036133, -0.06056499481201172, -0.05742025375366211, -0.0542755126953125, -0.05113077163696289, -0.04798603057861328, -0.04484128952026367, -0.04169654846191406, -0.03855180740356445, -0.035407066345214844, -0.032262325286865234, -0.029117584228515625, -0.025972843170166016, -0.022828102111816406, -0.019683361053466797, -0.016538619995117188, -0.013393878936767578, -0.010249137878417969, -0.007104396820068359, -0.00395965576171875, -0.0008149147033691406, 0.0023298263549804688, 0.005474567413330078, 0.008619308471679688, 0.011764049530029297, 0.014908790588378906, 0.018053531646728516, 0.021198272705078125, 0.024343013763427734, 0.027487754821777344, 0.030632495880126953, 0.03377723693847656, 0.03692197799682617, 0.04006671905517578, 0.04321146011352539, 0.046356201171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 9.0, 15.0, 22.0, 38.0, 70.0, 60.0, 115.0, 108.0, 118.0, 122.0, 100.0, 66.0, 53.0, 35.0, 27.0, 15.0, 12.0, 7.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0105438232421875, -0.010295510292053223, -0.010047197341918945, -0.009798884391784668, -0.00955057144165039, -0.009302258491516113, -0.009053945541381836, -0.008805632591247559, -0.008557319641113281, -0.008309006690979004, -0.008060693740844727, -0.007812380790710449, -0.007564067840576172, -0.0073157548904418945, -0.007067441940307617, -0.00681912899017334, -0.0065708160400390625, -0.006322503089904785, -0.006074190139770508, -0.0058258771896362305, -0.005577564239501953, -0.005329251289367676, -0.0050809383392333984, -0.004832625389099121, -0.004584312438964844, -0.004335999488830566, -0.004087686538696289, -0.0038393735885620117, -0.0035910606384277344, -0.003342747688293457, -0.0030944347381591797, -0.0028461217880249023, -0.002597808837890625, -0.0023494958877563477, -0.0021011829376220703, -0.001852869987487793, -0.0016045570373535156, -0.0013562440872192383, -0.001107931137084961, -0.0008596181869506836, -0.0006113052368164062, -0.0003629922866821289, -0.00011467933654785156, 0.00013363361358642578, 0.0003819465637207031, 0.0006302595138549805, 0.0008785724639892578, 0.0011268854141235352, 0.0013751983642578125, 0.0016235113143920898, 0.0018718242645263672, 0.0021201372146606445, 0.002368450164794922, 0.0026167631149291992, 0.0028650760650634766, 0.003113389015197754, 0.0033617019653320312, 0.0036100149154663086, 0.003858327865600586, 0.004106640815734863, 0.004354953765869141, 0.004603266716003418, 0.004851579666137695, 0.005099892616271973, 0.00534820556640625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 6.0, 9.0, 26.0, 37.0, 73.0, 164.0, 499.0, 3898.0, 4186095.0, 2940.0, 345.0, 113.0, 46.0, 22.0, 9.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83544921875, -0.8185672760009766, -0.8016853332519531, -0.7848033905029297, -0.7679214477539062, -0.7510395050048828, -0.7341575622558594, -0.7172756195068359, -0.7003936767578125, -0.6835117340087891, -0.6666297912597656, -0.6497478485107422, -0.6328659057617188, -0.6159839630126953, -0.5991020202636719, -0.5822200775146484, -0.565338134765625, -0.5484561920166016, -0.5315742492675781, -0.5146923065185547, -0.49781036376953125, -0.4809284210205078, -0.4640464782714844, -0.44716453552246094, -0.4302825927734375, -0.41340065002441406, -0.3965187072753906, -0.3796367645263672, -0.36275482177734375, -0.3458728790283203, -0.3289909362792969, -0.31210899353027344, -0.29522705078125, -0.27834510803222656, -0.2614631652832031, -0.2445812225341797, -0.22769927978515625, -0.2108173370361328, -0.19393539428710938, -0.17705345153808594, -0.1601715087890625, -0.14328956604003906, -0.12640762329101562, -0.10952568054199219, -0.09264373779296875, -0.07576179504394531, -0.058879852294921875, -0.04199790954589844, -0.025115966796875, -0.008234024047851562, 0.008647918701171875, 0.025529861450195312, 0.04241180419921875, 0.05929374694824219, 0.07617568969726562, 0.09305763244628906, 0.1099395751953125, 0.12682151794433594, 0.14370346069335938, 0.1605854034423828, 0.17746734619140625, 0.1943492889404297, 0.21123123168945312, 0.22811317443847656, 0.2449951171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 10.0, 20.0, 68.0, 365.0, 3204.0, 315.0, 61.0, 18.0, 8.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.07147216796875, -0.07018482685089111, -0.06889748573303223, -0.06761014461517334, -0.06632280349731445, -0.06503546237945557, -0.06374812126159668, -0.06246078014373779, -0.061173439025878906, -0.05988609790802002, -0.05859875679016113, -0.057311415672302246, -0.05602407455444336, -0.05473673343658447, -0.053449392318725586, -0.0521620512008667, -0.05087471008300781, -0.049587368965148926, -0.04830002784729004, -0.04701268672943115, -0.045725345611572266, -0.04443800449371338, -0.04315066337585449, -0.041863322257995605, -0.04057598114013672, -0.03928864002227783, -0.038001298904418945, -0.03671395778656006, -0.03542661666870117, -0.034139275550842285, -0.0328519344329834, -0.03156459331512451, -0.030277252197265625, -0.02898991107940674, -0.02770256996154785, -0.026415228843688965, -0.025127887725830078, -0.02384054660797119, -0.022553205490112305, -0.021265864372253418, -0.01997852325439453, -0.018691182136535645, -0.017403841018676758, -0.01611649990081787, -0.014829158782958984, -0.013541817665100098, -0.012254476547241211, -0.010967135429382324, -0.009679794311523438, -0.00839245319366455, -0.007105112075805664, -0.005817770957946777, -0.004530429840087891, -0.003243088722229004, -0.001955747604370117, -0.0006684064865112305, 0.0006189346313476562, 0.001906275749206543, 0.0031936168670654297, 0.004480957984924316, 0.005768299102783203, 0.00705564022064209, 0.008342981338500977, 0.009630322456359863, 0.01091766357421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 19.0, 23.0, 49.0, 129.0, 340.0, 266.0, 91.0, 29.0, 15.0, 9.0, 8.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.3429376482963562, -0.3360814154148102, -0.32922518253326416, -0.32236894965171814, -0.3155127167701721, -0.3086565136909485, -0.30180028080940247, -0.29494404792785645, -0.2880878150463104, -0.2812315821647644, -0.2743753492832184, -0.26751911640167236, -0.26066291332244873, -0.2538066804409027, -0.2469504475593567, -0.24009421467781067, -0.23323798179626465, -0.22638174891471863, -0.2195255160331726, -0.21266929805278778, -0.20581306517124176, -0.19895683228969574, -0.1921006143093109, -0.1852443814277649, -0.17838814854621887, -0.17153191566467285, -0.16467568278312683, -0.157819464802742, -0.15096323192119598, -0.14410699903964996, -0.13725078105926514, -0.13039454817771912, -0.1235383003950119, -0.11668206751346588, -0.10982584208250046, -0.10296961665153503, -0.09611338376998901, -0.089257150888443, -0.08240092545747757, -0.07554470002651215, -0.06868846714496613, -0.0618322379887104, -0.05497600883245468, -0.04811977967619896, -0.04126355051994324, -0.034407321363687515, -0.027551092207431793, -0.02069486305117607, -0.013838633894920349, -0.006982404738664627, -0.00012617558240890503, 0.006730053573846817, 0.013586282730102539, 0.02044251188635826, 0.027298741042613983, 0.034154970198869705, 0.04101119935512543, 0.04786742851138115, 0.05472365766763687, 0.06157988682389259, 0.06843611598014832, 0.07529234886169434, 0.08214857429265976, 0.08900479972362518, 0.0958610326051712]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 13.0, 10.0, 25.0, 25.0, 32.0, 58.0, 83.0, 82.0, 110.0, 104.0, 126.0, 78.0, 85.0, 55.0, 36.0, 35.0, 18.0, 18.0, 10.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16021275520324707, -0.15531077980995178, -0.1504087895154953, -0.1455068141222, -0.14060482382774353, -0.13570284843444824, -0.13080085813999176, -0.12589888274669647, -0.12099689990282059, -0.1160949170589447, -0.11119293421506882, -0.10629095137119293, -0.10138897597789764, -0.09648698568344116, -0.09158501029014587, -0.08668302744626999, -0.0817810446023941, -0.07687906175851822, -0.07197707891464233, -0.06707509607076645, -0.06217311695218086, -0.05727113410830498, -0.05236915498971939, -0.047467172145843506, -0.04256518930196762, -0.037663206458091736, -0.03276122361421585, -0.027859244495630264, -0.02295726165175438, -0.018055278807878494, -0.013153297826647758, -0.008251316845417023, -0.0033493340015411377, 0.0015526479110121727, 0.006454629823565483, 0.011356611736118793, 0.016258593648672104, 0.02116057649254799, 0.026062557473778725, 0.03096453845500946, 0.035866521298885345, 0.04076850414276123, 0.045670486986637115, 0.0505724661052227, 0.05547444894909859, 0.06037643179297447, 0.06527841091156006, 0.07018039375543594, 0.07508237659931183, 0.07998435944318771, 0.0848863422870636, 0.08978832513093948, 0.09469030797481537, 0.09959228336811066, 0.10449426621198654, 0.10939624905586243, 0.11429823189973831, 0.1192002147436142, 0.12410219758749008, 0.12900418043136597, 0.13390615582466125, 0.13880814611911774, 0.14371012151241302, 0.1486121118068695, 0.1535140872001648]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 6.0, 2.0, 10.0, 14.0, 21.0, 11.0, 30.0, 36.0, 41.0, 86.0, 95.0, 149.0, 233.0, 355.0, 626.0, 1446.0, 4431.0, 19117.0, 130379.0, 752462.0, 114377.0, 17479.0, 4067.0, 1291.0, 666.0, 340.0, 258.0, 163.0, 101.0, 79.0, 58.0, 35.0, 24.0, 25.0, 12.0, 11.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.087158203125, -0.08483219146728516, -0.08250617980957031, -0.08018016815185547, -0.07785415649414062, -0.07552814483642578, -0.07320213317871094, -0.0708761215209961, -0.06855010986328125, -0.0662240982055664, -0.06389808654785156, -0.06157207489013672, -0.059246063232421875, -0.05692005157470703, -0.05459403991699219, -0.052268028259277344, -0.0499420166015625, -0.047616004943847656, -0.04528999328613281, -0.04296398162841797, -0.040637969970703125, -0.03831195831298828, -0.03598594665527344, -0.033659934997558594, -0.03133392333984375, -0.029007911682128906, -0.026681900024414062, -0.02435588836669922, -0.022029876708984375, -0.01970386505126953, -0.017377853393554688, -0.015051841735839844, -0.012725830078125, -0.010399818420410156, -0.008073806762695312, -0.005747795104980469, -0.003421783447265625, -0.0010957717895507812, 0.0012302398681640625, 0.0035562515258789062, 0.00588226318359375, 0.008208274841308594, 0.010534286499023438, 0.012860298156738281, 0.015186309814453125, 0.01751232147216797, 0.019838333129882812, 0.022164344787597656, 0.0244903564453125, 0.026816368103027344, 0.029142379760742188, 0.03146839141845703, 0.033794403076171875, 0.03612041473388672, 0.03844642639160156, 0.040772438049316406, 0.04309844970703125, 0.045424461364746094, 0.04775047302246094, 0.05007648468017578, 0.052402496337890625, 0.05472850799560547, 0.05705451965332031, 0.059380531311035156, 0.06170654296875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 10.0, 12.0, 24.0, 38.0, 44.0, 83.0, 79.0, 106.0, 112.0, 94.0, 108.0, 86.0, 69.0, 51.0, 32.0, 18.0, 9.0, 9.0, 4.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013153076171875, -0.012775421142578125, -0.01239776611328125, -0.012020111083984375, -0.0116424560546875, -0.011264801025390625, -0.01088714599609375, -0.010509490966796875, -0.0101318359375, -0.009754180908203125, -0.00937652587890625, -0.008998870849609375, -0.0086212158203125, -0.008243560791015625, -0.00786590576171875, -0.007488250732421875, -0.007110595703125, -0.006732940673828125, -0.00635528564453125, -0.005977630615234375, -0.0055999755859375, -0.005222320556640625, -0.00484466552734375, -0.004467010498046875, -0.00408935546875, -0.003711700439453125, -0.00333404541015625, -0.002956390380859375, -0.0025787353515625, -0.002201080322265625, -0.00182342529296875, -0.001445770263671875, -0.001068115234375, -0.000690460205078125, -0.00031280517578125, 6.4849853515625e-05, 0.0004425048828125, 0.000820159912109375, 0.00119781494140625, 0.001575469970703125, 0.001953125, 0.002330780029296875, 0.00270843505859375, 0.003086090087890625, 0.0034637451171875, 0.003841400146484375, 0.00421905517578125, 0.004596710205078125, 0.004974365234375, 0.005352020263671875, 0.00572967529296875, 0.006107330322265625, 0.0064849853515625, 0.006862640380859375, 0.00724029541015625, 0.007617950439453125, 0.00799560546875, 0.008373260498046875, 0.00875091552734375, 0.009128570556640625, 0.0095062255859375, 0.009883880615234375, 0.01026153564453125, 0.010639190673828125, 0.011016845703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 11.0, 9.0, 13.0, 20.0, 37.0, 48.0, 96.0, 179.0, 312.0, 634.0, 1609.0, 4259.0, 14562.0, 67359.0, 593688.0, 309783.0, 40539.0, 9934.0, 3107.0, 1188.0, 522.0, 250.0, 148.0, 77.0, 47.0, 39.0, 21.0, 11.0, 9.0, 10.0, 5.0, 5.0, 2.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04681396484375, -0.04524564743041992, -0.043677330017089844, -0.042109012603759766, -0.04054069519042969, -0.03897237777709961, -0.03740406036376953, -0.03583574295043945, -0.034267425537109375, -0.0326991081237793, -0.03113079071044922, -0.02956247329711914, -0.027994155883789062, -0.026425838470458984, -0.024857521057128906, -0.023289203643798828, -0.02172088623046875, -0.020152568817138672, -0.018584251403808594, -0.017015933990478516, -0.015447616577148438, -0.01387929916381836, -0.012310981750488281, -0.010742664337158203, -0.009174346923828125, -0.007606029510498047, -0.006037712097167969, -0.004469394683837891, -0.0029010772705078125, -0.0013327598571777344, 0.00023555755615234375, 0.0018038749694824219, 0.0033721923828125, 0.004940509796142578, 0.006508827209472656, 0.008077144622802734, 0.009645462036132812, 0.01121377944946289, 0.012782096862792969, 0.014350414276123047, 0.015918731689453125, 0.017487049102783203, 0.01905536651611328, 0.02062368392944336, 0.022192001342773438, 0.023760318756103516, 0.025328636169433594, 0.026896953582763672, 0.02846527099609375, 0.030033588409423828, 0.031601905822753906, 0.033170223236083984, 0.03473854064941406, 0.03630685806274414, 0.03787517547607422, 0.0394434928894043, 0.041011810302734375, 0.04258012771606445, 0.04414844512939453, 0.04571676254272461, 0.04728507995605469, 0.048853397369384766, 0.050421714782714844, 0.05199003219604492, 0.053558349609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 10.0, 8.0, 13.0, 12.0, 18.0, 25.0, 31.0, 31.0, 40.0, 48.0, 44.0, 66.0, 51.0, 59.0, 67.0, 83.0, 61.0, 50.0, 44.0, 49.0, 34.0, 28.0, 26.0, 26.0, 17.0, 8.0, 11.0, 7.0, 8.0, 5.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0284423828125, -0.027497291564941406, -0.026552200317382812, -0.02560710906982422, -0.024662017822265625, -0.02371692657470703, -0.022771835327148438, -0.021826744079589844, -0.02088165283203125, -0.019936561584472656, -0.018991470336914062, -0.01804637908935547, -0.017101287841796875, -0.01615619659423828, -0.015211105346679688, -0.014266014099121094, -0.0133209228515625, -0.012375831604003906, -0.011430740356445312, -0.010485649108886719, -0.009540557861328125, -0.008595466613769531, -0.0076503753662109375, -0.006705284118652344, -0.00576019287109375, -0.004815101623535156, -0.0038700103759765625, -0.0029249191284179688, -0.001979827880859375, -0.0010347366333007812, -8.96453857421875e-05, 0.0008554458618164062, 0.001800537109375, 0.0027456283569335938, 0.0036907196044921875, 0.004635810852050781, 0.005580902099609375, 0.006525993347167969, 0.0074710845947265625, 0.008416175842285156, 0.00936126708984375, 0.010306358337402344, 0.011251449584960938, 0.012196540832519531, 0.013141632080078125, 0.014086723327636719, 0.015031814575195312, 0.015976905822753906, 0.0169219970703125, 0.017867088317871094, 0.018812179565429688, 0.01975727081298828, 0.020702362060546875, 0.02164745330810547, 0.022592544555664062, 0.023537635803222656, 0.02448272705078125, 0.025427818298339844, 0.026372909545898438, 0.02731800079345703, 0.028263092041015625, 0.02920818328857422, 0.030153274536132812, 0.031098365783691406, 0.03204345703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 5.0, 6.0, 13.0, 15.0, 16.0, 21.0, 31.0, 30.0, 48.0, 58.0, 74.0, 125.0, 213.0, 510.0, 1619.0, 6545.0, 83742.0, 896115.0, 51644.0, 5318.0, 1338.0, 431.0, 200.0, 117.0, 73.0, 52.0, 46.0, 26.0, 24.0, 18.0, 19.0, 17.0, 8.0, 11.0, 11.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.037078857421875, -0.03603243827819824, -0.034986019134521484, -0.03393959999084473, -0.03289318084716797, -0.03184676170349121, -0.030800342559814453, -0.029753923416137695, -0.028707504272460938, -0.02766108512878418, -0.026614665985107422, -0.025568246841430664, -0.024521827697753906, -0.02347540855407715, -0.02242898941040039, -0.021382570266723633, -0.020336151123046875, -0.019289731979370117, -0.01824331283569336, -0.0171968936920166, -0.016150474548339844, -0.015104055404663086, -0.014057636260986328, -0.01301121711730957, -0.011964797973632812, -0.010918378829956055, -0.009871959686279297, -0.008825540542602539, -0.007779121398925781, -0.0067327022552490234, -0.005686283111572266, -0.004639863967895508, -0.00359344482421875, -0.002547025680541992, -0.0015006065368652344, -0.00045418739318847656, 0.0005922317504882812, 0.001638650894165039, 0.002685070037841797, 0.0037314891815185547, 0.0047779083251953125, 0.00582432746887207, 0.006870746612548828, 0.007917165756225586, 0.008963584899902344, 0.010010004043579102, 0.01105642318725586, 0.012102842330932617, 0.013149261474609375, 0.014195680618286133, 0.01524209976196289, 0.01628851890563965, 0.017334938049316406, 0.018381357192993164, 0.019427776336669922, 0.02047419548034668, 0.021520614624023438, 0.022567033767700195, 0.023613452911376953, 0.02465987205505371, 0.02570629119873047, 0.026752710342407227, 0.027799129486083984, 0.028845548629760742, 0.0298919677734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 10.0, 10.0, 13.0, 28.0, 29.0, 32.0, 55.0, 65.0, 97.0, 99.0, 102.0, 106.0, 100.0, 70.0, 42.0, 51.0, 22.0, 17.0, 17.0, 10.0, 12.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001189112663269043, -0.0001155780628323555, -0.0001122448593378067, -0.0001089116558432579, -0.0001055784523487091, -0.00010224524885416031, -9.891204535961151e-05, -9.557884186506271e-05, -9.224563837051392e-05, -8.891243487596512e-05, -8.557923138141632e-05, -8.224602788686752e-05, -7.891282439231873e-05, -7.557962089776993e-05, -7.224641740322113e-05, -6.891321390867233e-05, -6.558001041412354e-05, -6.224680691957474e-05, -5.891360342502594e-05, -5.558039993047714e-05, -5.2247196435928345e-05, -4.891399294137955e-05, -4.558078944683075e-05, -4.224758595228195e-05, -3.8914382457733154e-05, -3.558117896318436e-05, -3.224797546863556e-05, -2.891477197408676e-05, -2.5581568479537964e-05, -2.2248364984989166e-05, -1.891516149044037e-05, -1.558195799589157e-05, -1.2248754501342773e-05, -8.915551006793976e-06, -5.582347512245178e-06, -2.2491440176963806e-06, 1.084059476852417e-06, 4.417262971401215e-06, 7.750466465950012e-06, 1.108366996049881e-05, 1.4416873455047607e-05, 1.7750076949596405e-05, 2.1083280444145203e-05, 2.4416483938694e-05, 2.7749687433242798e-05, 3.1082890927791595e-05, 3.441609442234039e-05, 3.774929791688919e-05, 4.108250141143799e-05, 4.4415704905986786e-05, 4.7748908400535583e-05, 5.108211189508438e-05, 5.441531538963318e-05, 5.7748518884181976e-05, 6.108172237873077e-05, 6.441492587327957e-05, 6.774812936782837e-05, 7.108133286237717e-05, 7.441453635692596e-05, 7.774773985147476e-05, 8.108094334602356e-05, 8.441414684057236e-05, 8.774735033512115e-05, 9.108055382966995e-05, 9.441375732421875e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 6.0, 9.0, 17.0, 37.0, 84.0, 150.0, 507.0, 2133.0, 21395.0, 809818.0, 205762.0, 7039.0, 1059.0, 292.0, 107.0, 44.0, 25.0, 13.0, 11.0, 11.0, 6.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032257080078125, -0.03105306625366211, -0.02984905242919922, -0.028645038604736328, -0.027441024780273438, -0.026237010955810547, -0.025032997131347656, -0.023828983306884766, -0.022624969482421875, -0.021420955657958984, -0.020216941833496094, -0.019012928009033203, -0.017808914184570312, -0.016604900360107422, -0.015400886535644531, -0.01419687271118164, -0.01299285888671875, -0.01178884506225586, -0.010584831237792969, -0.009380817413330078, -0.008176803588867188, -0.006972789764404297, -0.005768775939941406, -0.004564762115478516, -0.003360748291015625, -0.0021567344665527344, -0.0009527206420898438, 0.0002512931823730469, 0.0014553070068359375, 0.002659320831298828, 0.0038633346557617188, 0.005067348480224609, 0.0062713623046875, 0.007475376129150391, 0.008679389953613281, 0.009883403778076172, 0.011087417602539062, 0.012291431427001953, 0.013495445251464844, 0.014699459075927734, 0.015903472900390625, 0.017107486724853516, 0.018311500549316406, 0.019515514373779297, 0.020719528198242188, 0.021923542022705078, 0.02312755584716797, 0.02433156967163086, 0.02553558349609375, 0.02673959732055664, 0.02794361114501953, 0.029147624969482422, 0.030351638793945312, 0.0315556526184082, 0.032759666442871094, 0.033963680267333984, 0.035167694091796875, 0.036371707916259766, 0.037575721740722656, 0.03877973556518555, 0.03998374938964844, 0.04118776321411133, 0.04239177703857422, 0.04359579086303711, 0.0447998046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 4.0, 12.0, 14.0, 20.0, 43.0, 70.0, 124.0, 155.0, 155.0, 147.0, 100.0, 52.0, 33.0, 15.0, 9.0, 10.0, 3.0, 7.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0177764892578125, -0.017098665237426758, -0.016420841217041016, -0.015743017196655273, -0.015065193176269531, -0.014387369155883789, -0.013709545135498047, -0.013031721115112305, -0.012353897094726562, -0.01167607307434082, -0.010998249053955078, -0.010320425033569336, -0.009642601013183594, -0.008964776992797852, -0.00828695297241211, -0.007609128952026367, -0.006931304931640625, -0.006253480911254883, -0.005575656890869141, -0.0048978328704833984, -0.004220008850097656, -0.003542184829711914, -0.002864360809326172, -0.0021865367889404297, -0.0015087127685546875, -0.0008308887481689453, -0.00015306472778320312, 0.0005247592926025391, 0.0012025833129882812, 0.0018804073333740234, 0.0025582313537597656, 0.003236055374145508, 0.00391387939453125, 0.004591703414916992, 0.005269527435302734, 0.0059473514556884766, 0.006625175476074219, 0.007302999496459961, 0.007980823516845703, 0.008658647537231445, 0.009336471557617188, 0.01001429557800293, 0.010692119598388672, 0.011369943618774414, 0.012047767639160156, 0.012725591659545898, 0.01340341567993164, 0.014081239700317383, 0.014759063720703125, 0.015436887741088867, 0.01611471176147461, 0.01679253578186035, 0.017470359802246094, 0.018148183822631836, 0.018826007843017578, 0.01950383186340332, 0.020181655883789062, 0.020859479904174805, 0.021537303924560547, 0.02221512794494629, 0.02289295196533203, 0.023570775985717773, 0.024248600006103516, 0.024926424026489258, 0.025604248046875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 5.0, 24.0, 56.0, 261.0, 470.0, 146.0, 41.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9824375510215759, -0.9636198878288269, -0.9448022246360779, -0.9259845614433289, -0.9071669578552246, -0.8883492946624756, -0.8695316314697266, -0.8507139682769775, -0.8318963050842285, -0.8130786418914795, -0.7942609786987305, -0.7754433155059814, -0.7566256523132324, -0.7378080487251282, -0.7189903855323792, -0.7001727223396301, -0.6813550591468811, -0.6625373959541321, -0.6437197327613831, -0.624902069568634, -0.6060844659805298, -0.5872668027877808, -0.5684491395950317, -0.5496314764022827, -0.5308138132095337, -0.5119961500167847, -0.49317848682403564, -0.474360853433609, -0.45554319024086, -0.43672552704811096, -0.4179078936576843, -0.3990902304649353, -0.3802725672721863, -0.36145490407943726, -0.34263724088668823, -0.3238196074962616, -0.3050019443035126, -0.28618428111076355, -0.2673666477203369, -0.2485489845275879, -0.22973130643367767, -0.21091365814208984, -0.19209599494934082, -0.1732783317565918, -0.15446068346500397, -0.13564303517341614, -0.11682537198066711, -0.09800772368907928, -0.07919006049633026, -0.060372404754161835, -0.04155474901199341, -0.02273709326982498, -0.003919437527656555, 0.014898218214511871, 0.0337158739566803, 0.05253352224826813, 0.07135118544101715, 0.09016884118318558, 0.108986496925354, 0.12780416011810303, 0.14662180840969086, 0.1654394567012787, 0.1842571198940277, 0.20307476818561554, 0.22189243137836456]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 8.0, 9.0, 15.0, 19.0, 22.0, 24.0, 32.0, 36.0, 49.0, 59.0, 56.0, 55.0, 77.0, 69.0, 56.0, 75.0, 55.0, 46.0, 37.0, 41.0, 39.0, 27.0, 22.0, 14.0, 16.0, 11.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20135772228240967, -0.19570404291152954, -0.19005036354064941, -0.1843966841697693, -0.17874300479888916, -0.17308932542800903, -0.1674356460571289, -0.16178196668624878, -0.15612828731536865, -0.15047460794448853, -0.1448209285736084, -0.13916724920272827, -0.13351356983184814, -0.12785989046096802, -0.12220621109008789, -0.11655253171920776, -0.11089885234832764, -0.10524517297744751, -0.09959149360656738, -0.09393781423568726, -0.08828413486480713, -0.082630455493927, -0.07697677612304688, -0.07132309675216675, -0.06566941738128662, -0.060015738010406494, -0.05436205863952637, -0.04870837926864624, -0.04305469989776611, -0.037401020526885986, -0.03174734115600586, -0.026093661785125732, -0.020439982414245605, -0.014786303043365479, -0.009132623672485352, -0.0034789443016052246, 0.0021747350692749023, 0.00782841444015503, 0.013482093811035156, 0.019135773181915283, 0.02478945255279541, 0.030443131923675537, 0.036096811294555664, 0.04175049066543579, 0.04740417003631592, 0.053057849407196045, 0.05871152877807617, 0.0643652081489563, 0.07001888751983643, 0.07567256689071655, 0.08132624626159668, 0.0869799256324768, 0.09263360500335693, 0.09828728437423706, 0.10394096374511719, 0.10959464311599731, 0.11524832248687744, 0.12090200185775757, 0.1265556812286377, 0.13220936059951782, 0.13786303997039795, 0.14351671934127808, 0.1491703987121582, 0.15482407808303833, 0.16047775745391846]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 1.0, 12.0, 11.0, 12.0, 34.0, 43.0, 71.0, 105.0, 191.0, 363.0, 665.0, 1816.0, 8148.0, 175702.0, 3970799.0, 31349.0, 3541.0, 839.0, 303.0, 133.0, 67.0, 26.0, 15.0, 9.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1671142578125, -0.16333961486816406, -0.15956497192382812, -0.1557903289794922, -0.15201568603515625, -0.1482410430908203, -0.14446640014648438, -0.14069175720214844, -0.1369171142578125, -0.13314247131347656, -0.12936782836914062, -0.1255931854248047, -0.12181854248046875, -0.11804389953613281, -0.11426925659179688, -0.11049461364746094, -0.106719970703125, -0.10294532775878906, -0.09917068481445312, -0.09539604187011719, -0.09162139892578125, -0.08784675598144531, -0.08407211303710938, -0.08029747009277344, -0.0765228271484375, -0.07274818420410156, -0.06897354125976562, -0.06519889831542969, -0.06142425537109375, -0.05764961242675781, -0.053874969482421875, -0.05010032653808594, -0.04632568359375, -0.04255104064941406, -0.038776397705078125, -0.03500175476074219, -0.03122711181640625, -0.027452468872070312, -0.023677825927734375, -0.019903182983398438, -0.0161285400390625, -0.012353897094726562, -0.008579254150390625, -0.0048046112060546875, -0.00102996826171875, 0.0027446746826171875, 0.006519317626953125, 0.010293960571289062, 0.014068603515625, 0.017843246459960938, 0.021617889404296875, 0.025392532348632812, 0.02916717529296875, 0.03294181823730469, 0.036716461181640625, 0.04049110412597656, 0.0442657470703125, 0.04804039001464844, 0.051815032958984375, 0.05558967590332031, 0.05936431884765625, 0.06313896179199219, 0.06691360473632812, 0.07068824768066406, 0.074462890625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 8.0, 11.0, 14.0, 24.0, 35.0, 53.0, 57.0, 79.0, 63.0, 84.0, 90.0, 99.0, 70.0, 72.0, 57.0, 49.0, 46.0, 27.0, 20.0, 14.0, 7.0, 3.0, 6.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0124359130859375, -0.012122154235839844, -0.011808395385742188, -0.011494636535644531, -0.011180877685546875, -0.010867118835449219, -0.010553359985351562, -0.010239601135253906, -0.00992584228515625, -0.009612083435058594, -0.009298324584960938, -0.008984565734863281, -0.008670806884765625, -0.008357048034667969, -0.008043289184570312, -0.007729530334472656, -0.007415771484375, -0.007102012634277344, -0.0067882537841796875, -0.006474494934082031, -0.006160736083984375, -0.005846977233886719, -0.0055332183837890625, -0.005219459533691406, -0.00490570068359375, -0.004591941833496094, -0.0042781829833984375, -0.003964424133300781, -0.003650665283203125, -0.0033369064331054688, -0.0030231475830078125, -0.0027093887329101562, -0.0023956298828125, -0.0020818710327148438, -0.0017681121826171875, -0.0014543533325195312, -0.001140594482421875, -0.0008268356323242188, -0.0005130767822265625, -0.00019931793212890625, 0.00011444091796875, 0.00042819976806640625, 0.0007419586181640625, 0.0010557174682617188, 0.001369476318359375, 0.0016832351684570312, 0.0019969940185546875, 0.0023107528686523438, 0.00262451171875, 0.0029382705688476562, 0.0032520294189453125, 0.0035657882690429688, 0.003879547119140625, 0.004193305969238281, 0.0045070648193359375, 0.004820823669433594, 0.00513458251953125, 0.005448341369628906, 0.0057621002197265625, 0.006075859069824219, 0.006389617919921875, 0.006703376770019531, 0.0070171356201171875, 0.007330894470214844, 0.0076446533203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 13.0, 13.0, 20.0, 32.0, 36.0, 50.0, 74.0, 118.0, 237.0, 694.0, 4162881.0, 29111.0, 427.0, 203.0, 90.0, 60.0, 55.0, 29.0, 26.0, 17.0, 24.0, 25.0, 13.0, 7.0, 9.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264892578125, -0.2515449523925781, -0.23819732666015625, -0.22484970092773438, -0.2115020751953125, -0.19815444946289062, -0.18480682373046875, -0.17145919799804688, -0.158111572265625, -0.14476394653320312, -0.13141632080078125, -0.11806869506835938, -0.1047210693359375, -0.09137344360351562, -0.07802581787109375, -0.06467819213867188, -0.05133056640625, -0.037982940673828125, -0.02463531494140625, -0.011287689208984375, 0.0020599365234375, 0.015407562255859375, 0.02875518798828125, 0.042102813720703125, 0.055450439453125, 0.06879806518554688, 0.08214569091796875, 0.09549331665039062, 0.1088409423828125, 0.12218856811523438, 0.13553619384765625, 0.14888381958007812, 0.1622314453125, 0.17557907104492188, 0.18892669677734375, 0.20227432250976562, 0.2156219482421875, 0.22896957397460938, 0.24231719970703125, 0.2556648254394531, 0.269012451171875, 0.2823600769042969, 0.29570770263671875, 0.3090553283691406, 0.3224029541015625, 0.3357505798339844, 0.34909820556640625, 0.3624458312988281, 0.37579345703125, 0.3891410827636719, 0.40248870849609375, 0.4158363342285156, 0.4291839599609375, 0.4425315856933594, 0.45587921142578125, 0.4692268371582031, 0.482574462890625, 0.4959220886230469, 0.5092697143554688, 0.5226173400878906, 0.5359649658203125, 0.5493125915527344, 0.5626602172851562, 0.5760078430175781, 0.58935546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 13.0, 87.0, 3347.0, 603.0, 33.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04315185546875, -0.04085540771484375, -0.0385589599609375, -0.03626251220703125, -0.033966064453125, -0.03166961669921875, -0.0293731689453125, -0.02707672119140625, -0.0247802734375, -0.02248382568359375, -0.0201873779296875, -0.01789093017578125, -0.015594482421875, -0.01329803466796875, -0.0110015869140625, -0.00870513916015625, -0.00640869140625, -0.00411224365234375, -0.0018157958984375, 0.00048065185546875, 0.002777099609375, 0.00507354736328125, 0.0073699951171875, 0.00966644287109375, 0.011962890625, 0.01425933837890625, 0.0165557861328125, 0.01885223388671875, 0.021148681640625, 0.02344512939453125, 0.0257415771484375, 0.02803802490234375, 0.03033447265625, 0.03263092041015625, 0.0349273681640625, 0.03722381591796875, 0.039520263671875, 0.04181671142578125, 0.0441131591796875, 0.04640960693359375, 0.0487060546875, 0.05100250244140625, 0.0532989501953125, 0.05559539794921875, 0.057891845703125, 0.06018829345703125, 0.0624847412109375, 0.06478118896484375, 0.06707763671875, 0.06937408447265625, 0.0716705322265625, 0.07396697998046875, 0.076263427734375, 0.07855987548828125, 0.0808563232421875, 0.08315277099609375, 0.08544921875, 0.08774566650390625, 0.0900421142578125, 0.09233856201171875, 0.094635009765625, 0.09693145751953125, 0.0992279052734375, 0.10152435302734375, 0.10382080078125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 64.0, 740.0, 184.0, 12.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5950915813446045, -0.5774247050285339, -0.5597577691078186, -0.542090892791748, -0.5244239568710327, -0.5067570805549622, -0.4890902042388916, -0.47142329812049866, -0.4537563920021057, -0.43608948588371277, -0.4184225797653198, -0.40075570344924927, -0.3830887973308563, -0.3654218912124634, -0.3477550148963928, -0.3300881087779999, -0.31242120265960693, -0.294754296541214, -0.27708739042282104, -0.2594205141067505, -0.24175360798835754, -0.2240867018699646, -0.20641981065273285, -0.1887529194355011, -0.17108601331710815, -0.1534191071987152, -0.13575221598148346, -0.11808531731367111, -0.10041841864585876, -0.08275151997804642, -0.06508462131023407, -0.04741772264242172, -0.029750823974609375, -0.012083925306797028, 0.00558297336101532, 0.023249872028827667, 0.040916770696640015, 0.05858366936445236, 0.07625056803226471, 0.09391746670007706, 0.1115843653678894, 0.12925127148628235, 0.1469181627035141, 0.16458505392074585, 0.1822519600391388, 0.19991886615753174, 0.2175857573747635, 0.23525264859199524, 0.2529195547103882, 0.27058646082878113, 0.2882533669471741, 0.30592024326324463, 0.3235871493816376, 0.3412540555000305, 0.3589209318161011, 0.376587837934494, 0.39425474405288696, 0.4119216501712799, 0.42958855628967285, 0.4472554326057434, 0.46492233872413635, 0.4825892448425293, 0.5002561211585999, 0.5179230570793152, 0.5355899333953857]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 15.0, 33.0, 62.0, 86.0, 140.0, 155.0, 150.0, 125.0, 103.0, 59.0, 40.0, 18.0, 8.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.18072974681854248, -0.17625586688518524, -0.171781986951828, -0.16730810701847076, -0.16283422708511353, -0.1583603471517563, -0.15388646721839905, -0.14941257238388062, -0.14493870735168457, -0.14046482741832733, -0.1359909474849701, -0.13151706755161285, -0.12704318761825562, -0.12256930768489838, -0.11809542030096054, -0.1136215403676033, -0.10914765298366547, -0.10467377305030823, -0.10019989311695099, -0.09572601318359375, -0.09125213325023651, -0.08677825331687927, -0.08230436593294144, -0.0778304859995842, -0.07335660606622696, -0.06888272613286972, -0.06440884619951248, -0.059934962540864944, -0.055461082607507706, -0.05098720267415047, -0.04651331901550293, -0.04203943908214569, -0.03756555914878845, -0.03309167921543121, -0.028617797419428825, -0.024143915623426437, -0.0196700356900692, -0.01519615575671196, -0.010722273960709572, -0.006248392164707184, -0.001774512231349945, 0.0026993686333298683, 0.007173249498009682, 0.011647130362689495, 0.01612101122736931, 0.020594891160726547, 0.025068772956728935, 0.029542654752731323, 0.03401653468608856, 0.0384904146194458, 0.04296429455280304, 0.04743817821145058, 0.051912058144807816, 0.056385938078165054, 0.06085982173681259, 0.06533370167016983, 0.06980758160352707, 0.07428146153688431, 0.07875534147024155, 0.08322922140359879, 0.08770310878753662, 0.09217698872089386, 0.0966508686542511, 0.10112474858760834, 0.10559862852096558]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 9.0, 7.0, 8.0, 15.0, 23.0, 25.0, 41.0, 50.0, 81.0, 104.0, 148.0, 240.0, 361.0, 625.0, 1184.0, 2506.0, 6938.0, 21447.0, 83780.0, 471233.0, 366427.0, 65177.0, 17411.0, 5750.0, 2225.0, 1046.0, 573.0, 359.0, 230.0, 136.0, 102.0, 73.0, 62.0, 36.0, 33.0, 33.0, 16.0, 10.0, 10.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.037506103515625, -0.0362091064453125, -0.034912109375, -0.0336151123046875, -0.032318115234375, -0.0310211181640625, -0.02972412109375, -0.0284271240234375, -0.027130126953125, -0.0258331298828125, -0.0245361328125, -0.0232391357421875, -0.021942138671875, -0.0206451416015625, -0.01934814453125, -0.0180511474609375, -0.016754150390625, -0.0154571533203125, -0.01416015625, -0.0128631591796875, -0.011566162109375, -0.0102691650390625, -0.00897216796875, -0.0076751708984375, -0.006378173828125, -0.0050811767578125, -0.0037841796875, -0.0024871826171875, -0.001190185546875, 0.0001068115234375, 0.00140380859375, 0.0027008056640625, 0.003997802734375, 0.0052947998046875, 0.006591796875, 0.0078887939453125, 0.009185791015625, 0.0104827880859375, 0.01177978515625, 0.0130767822265625, 0.014373779296875, 0.0156707763671875, 0.0169677734375, 0.0182647705078125, 0.019561767578125, 0.0208587646484375, 0.02215576171875, 0.0234527587890625, 0.024749755859375, 0.0260467529296875, 0.02734375, 0.0286407470703125, 0.029937744140625, 0.0312347412109375, 0.03253173828125, 0.0338287353515625, 0.035125732421875, 0.0364227294921875, 0.0377197265625, 0.0390167236328125, 0.040313720703125, 0.0416107177734375, 0.04290771484375, 0.0442047119140625, 0.045501708984375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 10.0, 10.0, 15.0, 27.0, 49.0, 40.0, 62.0, 62.0, 74.0, 81.0, 96.0, 97.0, 72.0, 68.0, 53.0, 48.0, 32.0, 37.0, 20.0, 18.0, 11.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01052093505859375, -0.010216593742370605, -0.009912252426147461, -0.009607911109924316, -0.009303569793701172, -0.008999228477478027, -0.008694887161254883, -0.008390545845031738, -0.008086204528808594, -0.007781863212585449, -0.007477521896362305, -0.00717318058013916, -0.006868839263916016, -0.006564497947692871, -0.0062601566314697266, -0.005955815315246582, -0.0056514739990234375, -0.005347132682800293, -0.0050427913665771484, -0.004738450050354004, -0.004434108734130859, -0.004129767417907715, -0.0038254261016845703, -0.0035210847854614258, -0.0032167434692382812, -0.0029124021530151367, -0.002608060836791992, -0.0023037195205688477, -0.001999378204345703, -0.0016950368881225586, -0.001390695571899414, -0.0010863542556762695, -0.000782012939453125, -0.00047767162322998047, -0.00017333030700683594, 0.0001310110092163086, 0.0004353523254394531, 0.0007396936416625977, 0.0010440349578857422, 0.0013483762741088867, 0.0016527175903320312, 0.0019570589065551758, 0.0022614002227783203, 0.002565741539001465, 0.0028700828552246094, 0.003174424171447754, 0.0034787654876708984, 0.003783106803894043, 0.0040874481201171875, 0.004391789436340332, 0.0046961307525634766, 0.005000472068786621, 0.005304813385009766, 0.00560915470123291, 0.005913496017456055, 0.006217837333679199, 0.006522178649902344, 0.006826519966125488, 0.007130861282348633, 0.007435202598571777, 0.007739543914794922, 0.008043885231018066, 0.008348226547241211, 0.008652567863464355, 0.0089569091796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 5.0, 7.0, 9.0, 13.0, 13.0, 36.0, 37.0, 52.0, 94.0, 155.0, 304.0, 593.0, 1192.0, 2813.0, 7534.0, 27747.0, 165569.0, 682992.0, 125254.0, 22746.0, 6643.0, 2434.0, 1030.0, 534.0, 273.0, 153.0, 109.0, 73.0, 44.0, 27.0, 20.0, 18.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.057952880859375, -0.05648326873779297, -0.05501365661621094, -0.053544044494628906, -0.052074432373046875, -0.050604820251464844, -0.04913520812988281, -0.04766559600830078, -0.04619598388671875, -0.04472637176513672, -0.04325675964355469, -0.041787147521972656, -0.040317535400390625, -0.038847923278808594, -0.03737831115722656, -0.03590869903564453, -0.0344390869140625, -0.03296947479248047, -0.03149986267089844, -0.030030250549316406, -0.028560638427734375, -0.027091026306152344, -0.025621414184570312, -0.02415180206298828, -0.02268218994140625, -0.02121257781982422, -0.019742965698242188, -0.018273353576660156, -0.016803741455078125, -0.015334129333496094, -0.013864517211914062, -0.012394905090332031, -0.01092529296875, -0.009455680847167969, -0.007986068725585938, -0.006516456604003906, -0.005046844482421875, -0.0035772323608398438, -0.0021076202392578125, -0.0006380081176757812, 0.00083160400390625, 0.0023012161254882812, 0.0037708282470703125, 0.005240440368652344, 0.006710052490234375, 0.008179664611816406, 0.009649276733398438, 0.011118888854980469, 0.0125885009765625, 0.014058113098144531, 0.015527725219726562, 0.016997337341308594, 0.018466949462890625, 0.019936561584472656, 0.021406173706054688, 0.02287578582763672, 0.02434539794921875, 0.02581501007080078, 0.027284622192382812, 0.028754234313964844, 0.030223846435546875, 0.031693458557128906, 0.03316307067871094, 0.03463268280029297, 0.036102294921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 3.0, 7.0, 7.0, 8.0, 12.0, 20.0, 20.0, 37.0, 34.0, 46.0, 49.0, 54.0, 67.0, 54.0, 69.0, 70.0, 71.0, 66.0, 46.0, 49.0, 31.0, 42.0, 28.0, 22.0, 17.0, 12.0, 19.0, 5.0, 8.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.04034423828125, -0.03930783271789551, -0.038271427154541016, -0.03723502159118652, -0.03619861602783203, -0.03516221046447754, -0.03412580490112305, -0.033089399337768555, -0.03205299377441406, -0.03101658821105957, -0.029980182647705078, -0.028943777084350586, -0.027907371520996094, -0.0268709659576416, -0.02583456039428711, -0.024798154830932617, -0.023761749267578125, -0.022725343704223633, -0.02168893814086914, -0.02065253257751465, -0.019616127014160156, -0.018579721450805664, -0.017543315887451172, -0.01650691032409668, -0.015470504760742188, -0.014434099197387695, -0.013397693634033203, -0.012361288070678711, -0.011324882507324219, -0.010288476943969727, -0.009252071380615234, -0.008215665817260742, -0.00717926025390625, -0.006142854690551758, -0.005106449127197266, -0.0040700435638427734, -0.0030336380004882812, -0.001997232437133789, -0.0009608268737792969, 7.557868957519531e-05, 0.0011119842529296875, 0.0021483898162841797, 0.003184795379638672, 0.004221200942993164, 0.005257606506347656, 0.0062940120697021484, 0.007330417633056641, 0.008366823196411133, 0.009403228759765625, 0.010439634323120117, 0.01147603988647461, 0.012512445449829102, 0.013548851013183594, 0.014585256576538086, 0.015621662139892578, 0.01665806770324707, 0.017694473266601562, 0.018730878829956055, 0.019767284393310547, 0.02080368995666504, 0.02184009552001953, 0.022876501083374023, 0.023912906646728516, 0.024949312210083008, 0.0259857177734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 6.0, 17.0, 13.0, 16.0, 24.0, 26.0, 40.0, 62.0, 83.0, 106.0, 198.0, 415.0, 858.0, 2508.0, 13498.0, 237576.0, 746077.0, 39497.0, 4952.0, 1307.0, 521.0, 265.0, 146.0, 104.0, 64.0, 45.0, 33.0, 29.0, 23.0, 9.0, 11.0, 5.0, 8.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0219573974609375, -0.021150827407836914, -0.020344257354736328, -0.019537687301635742, -0.018731117248535156, -0.01792454719543457, -0.017117977142333984, -0.0163114070892334, -0.015504837036132812, -0.014698266983032227, -0.01389169692993164, -0.013085126876831055, -0.012278556823730469, -0.011471986770629883, -0.010665416717529297, -0.009858846664428711, -0.009052276611328125, -0.008245706558227539, -0.007439136505126953, -0.006632566452026367, -0.005825996398925781, -0.005019426345825195, -0.004212856292724609, -0.0034062862396240234, -0.0025997161865234375, -0.0017931461334228516, -0.0009865760803222656, -0.0001800060272216797, 0.0006265640258789062, 0.0014331340789794922, 0.002239704132080078, 0.003046274185180664, 0.00385284423828125, 0.004659414291381836, 0.005465984344482422, 0.006272554397583008, 0.007079124450683594, 0.00788569450378418, 0.008692264556884766, 0.009498834609985352, 0.010305404663085938, 0.011111974716186523, 0.01191854476928711, 0.012725114822387695, 0.013531684875488281, 0.014338254928588867, 0.015144824981689453, 0.01595139503479004, 0.016757965087890625, 0.01756453514099121, 0.018371105194091797, 0.019177675247192383, 0.01998424530029297, 0.020790815353393555, 0.02159738540649414, 0.022403955459594727, 0.023210525512695312, 0.0240170955657959, 0.024823665618896484, 0.02563023567199707, 0.026436805725097656, 0.027243375778198242, 0.028049945831298828, 0.028856515884399414, 0.0296630859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 12.0, 9.0, 10.0, 22.0, 33.0, 51.0, 74.0, 120.0, 179.0, 173.0, 121.0, 79.0, 60.0, 21.0, 15.0, 11.0, 12.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017535686492919922, -0.00017154216766357422, -0.00016772747039794922, -0.00016391277313232422, -0.00016009807586669922, -0.00015628337860107422, -0.00015246868133544922, -0.00014865398406982422, -0.00014483928680419922, -0.00014102458953857422, -0.00013720989227294922, -0.00013339519500732422, -0.00012958049774169922, -0.00012576580047607422, -0.00012195110321044922, -0.00011813640594482422, -0.00011432170867919922, -0.00011050701141357422, -0.00010669231414794922, -0.00010287761688232422, -9.906291961669922e-05, -9.524822235107422e-05, -9.143352508544922e-05, -8.761882781982422e-05, -8.380413055419922e-05, -7.998943328857422e-05, -7.617473602294922e-05, -7.236003875732422e-05, -6.854534149169922e-05, -6.473064422607422e-05, -6.091594696044922e-05, -5.710124969482422e-05, -5.328655242919922e-05, -4.947185516357422e-05, -4.565715789794922e-05, -4.184246063232422e-05, -3.802776336669922e-05, -3.421306610107422e-05, -3.039836883544922e-05, -2.658367156982422e-05, -2.276897430419922e-05, -1.895427703857422e-05, -1.5139579772949219e-05, -1.1324882507324219e-05, -7.510185241699219e-06, -3.6954879760742188e-06, 1.1920928955078125e-07, 3.933906555175781e-06, 7.748603820800781e-06, 1.1563301086425781e-05, 1.537799835205078e-05, 1.919269561767578e-05, 2.300739288330078e-05, 2.682209014892578e-05, 3.063678741455078e-05, 3.445148468017578e-05, 3.826618194580078e-05, 4.208087921142578e-05, 4.589557647705078e-05, 4.971027374267578e-05, 5.352497100830078e-05, 5.733966827392578e-05, 6.115436553955078e-05, 6.496906280517578e-05, 6.878376007080078e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 13.0, 10.0, 18.0, 41.0, 56.0, 83.0, 147.0, 348.0, 1060.0, 6410.0, 161668.0, 844594.0, 30172.0, 2745.0, 693.0, 208.0, 116.0, 60.0, 44.0, 23.0, 25.0, 10.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.046295166015625, -0.04524970054626465, -0.0442042350769043, -0.043158769607543945, -0.042113304138183594, -0.04106783866882324, -0.04002237319946289, -0.03897690773010254, -0.03793144226074219, -0.036885976791381836, -0.035840511322021484, -0.03479504585266113, -0.03374958038330078, -0.03270411491394043, -0.03165864944458008, -0.030613183975219727, -0.029567718505859375, -0.028522253036499023, -0.027476787567138672, -0.02643132209777832, -0.02538585662841797, -0.024340391159057617, -0.023294925689697266, -0.022249460220336914, -0.021203994750976562, -0.02015852928161621, -0.01911306381225586, -0.018067598342895508, -0.017022132873535156, -0.015976667404174805, -0.014931201934814453, -0.013885736465454102, -0.01284027099609375, -0.011794805526733398, -0.010749340057373047, -0.009703874588012695, -0.008658409118652344, -0.007612943649291992, -0.006567478179931641, -0.005522012710571289, -0.0044765472412109375, -0.003431081771850586, -0.0023856163024902344, -0.0013401508331298828, -0.00029468536376953125, 0.0007507801055908203, 0.0017962455749511719, 0.0028417110443115234, 0.003887176513671875, 0.0049326419830322266, 0.005978107452392578, 0.00702357292175293, 0.008069038391113281, 0.009114503860473633, 0.010159969329833984, 0.011205434799194336, 0.012250900268554688, 0.013296365737915039, 0.01434183120727539, 0.015387296676635742, 0.016432762145996094, 0.017478227615356445, 0.018523693084716797, 0.01956915855407715, 0.0206146240234375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 3.0, 10.0, 14.0, 24.0, 21.0, 48.0, 74.0, 153.0, 170.0, 157.0, 107.0, 83.0, 52.0, 29.0, 14.0, 8.0, 5.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.02655029296875, -0.025900959968566895, -0.02525162696838379, -0.024602293968200684, -0.023952960968017578, -0.023303627967834473, -0.022654294967651367, -0.02200496196746826, -0.021355628967285156, -0.02070629596710205, -0.020056962966918945, -0.01940762996673584, -0.018758296966552734, -0.01810896396636963, -0.017459630966186523, -0.016810297966003418, -0.016160964965820312, -0.015511631965637207, -0.014862298965454102, -0.014212965965270996, -0.01356363296508789, -0.012914299964904785, -0.01226496696472168, -0.011615633964538574, -0.010966300964355469, -0.010316967964172363, -0.009667634963989258, -0.009018301963806152, -0.008368968963623047, -0.007719635963439941, -0.007070302963256836, -0.0064209699630737305, -0.005771636962890625, -0.0051223039627075195, -0.004472970962524414, -0.0038236379623413086, -0.003174304962158203, -0.0025249719619750977, -0.0018756389617919922, -0.0012263059616088867, -0.0005769729614257812, 7.236003875732422e-05, 0.0007216930389404297, 0.0013710260391235352, 0.0020203590393066406, 0.002669692039489746, 0.0033190250396728516, 0.003968358039855957, 0.0046176910400390625, 0.005267024040222168, 0.0059163570404052734, 0.006565690040588379, 0.007215023040771484, 0.00786435604095459, 0.008513689041137695, 0.0091630220413208, 0.009812355041503906, 0.010461688041687012, 0.011111021041870117, 0.011760354042053223, 0.012409687042236328, 0.013059020042419434, 0.013708353042602539, 0.014357686042785645, 0.01500701904296875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 9.0, 17.0, 27.0, 56.0, 131.0, 238.0, 258.0, 134.0, 55.0, 24.0, 20.0, 14.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0], "bins": [-0.5437684655189514, -0.5331311225891113, -0.5224937796592712, -0.5118564367294312, -0.5012190937995911, -0.490581750869751, -0.4799444079399109, -0.4693070650100708, -0.4586697220802307, -0.4480323791503906, -0.43739503622055054, -0.42675769329071045, -0.41612035036087036, -0.4054830074310303, -0.3948456645011902, -0.3842083215713501, -0.37357097864151, -0.3629336357116699, -0.35229629278182983, -0.34165894985198975, -0.33102160692214966, -0.32038426399230957, -0.3097469210624695, -0.2991095781326294, -0.2884722352027893, -0.2778348922729492, -0.26719754934310913, -0.25656020641326904, -0.24592286348342896, -0.23528552055358887, -0.22464817762374878, -0.2140108346939087, -0.20337346196174622, -0.19273611903190613, -0.18209877610206604, -0.17146143317222595, -0.16082409024238586, -0.15018674731254578, -0.1395494043827057, -0.1289120614528656, -0.11827471852302551, -0.10763737559318542, -0.09700003266334534, -0.08636268973350525, -0.07572534680366516, -0.06508800387382507, -0.054450660943984985, -0.0438133180141449, -0.03317597508430481, -0.02253863215446472, -0.011901289224624634, -0.001263946294784546, 0.009373396635055542, 0.02001073956489563, 0.030648082494735718, 0.041285425424575806, 0.051922768354415894, 0.06256011128425598, 0.07319745421409607, 0.08383479714393616, 0.09447214007377625, 0.10510948300361633, 0.11574682593345642, 0.1263841688632965, 0.1370215117931366]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 9.0, 9.0, 17.0, 17.0, 22.0, 20.0, 36.0, 26.0, 24.0, 39.0, 39.0, 43.0, 36.0, 46.0, 52.0, 52.0, 53.0, 63.0, 48.0, 42.0, 34.0, 40.0, 34.0, 34.0, 36.0, 16.0, 17.0, 19.0, 16.0, 13.0, 7.0, 6.0, 10.0, 4.0, 2.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17190831899642944, -0.16710087656974792, -0.1622934341430664, -0.1574859917163849, -0.15267854928970337, -0.14787112176418304, -0.14306367933750153, -0.13825623691082, -0.1334487944841385, -0.12864135205745697, -0.12383390963077545, -0.11902647465467453, -0.11421903222799301, -0.10941158980131149, -0.10460415482521057, -0.09979671239852905, -0.09498926997184753, -0.09018182754516602, -0.0853743851184845, -0.08056695014238358, -0.07575950771570206, -0.07095206528902054, -0.06614463031291962, -0.0613371878862381, -0.05652974545955658, -0.05172230303287506, -0.04691486433148384, -0.04210742563009262, -0.0372999832034111, -0.032492540776729584, -0.027685102075338364, -0.022877663373947144, -0.018070220947265625, -0.013262780383229256, -0.008455339819192886, -0.003647899255156517, 0.0011595413088798523, 0.005966981872916222, 0.010774422436952591, 0.015581861138343811, 0.02038930356502533, 0.0251967441290617, 0.030004184693098068, 0.03481162339448929, 0.03961906582117081, 0.044426508247852325, 0.049233946949243546, 0.054041385650634766, 0.058848828077316284, 0.0636562705039978, 0.06846371293067932, 0.07327114790678024, 0.07807859033346176, 0.08288603276014328, 0.0876934677362442, 0.09250091016292572, 0.09730835258960724, 0.10211579501628876, 0.10692323744297028, 0.1117306724190712, 0.11653811484575272, 0.12134555727243423, 0.12615299224853516, 0.13096043467521667, 0.1357678771018982]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 8.0, 6.0, 8.0, 16.0, 15.0, 20.0, 28.0, 30.0, 40.0, 82.0, 90.0, 122.0, 237.0, 394.0, 625.0, 1252.0, 2817.0, 7784.0, 28793.0, 274637.0, 3705485.0, 141153.0, 20853.0, 5900.0, 2102.0, 846.0, 385.0, 220.0, 121.0, 77.0, 40.0, 39.0, 19.0, 9.0, 7.0, 6.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07012939453125, -0.0682535171508789, -0.06637763977050781, -0.06450176239013672, -0.06262588500976562, -0.06075000762939453, -0.05887413024902344, -0.056998252868652344, -0.05512237548828125, -0.053246498107910156, -0.05137062072753906, -0.04949474334716797, -0.047618865966796875, -0.04574298858642578, -0.04386711120605469, -0.041991233825683594, -0.0401153564453125, -0.038239479064941406, -0.03636360168457031, -0.03448772430419922, -0.032611846923828125, -0.03073596954345703, -0.028860092163085938, -0.026984214782714844, -0.02510833740234375, -0.023232460021972656, -0.021356582641601562, -0.01948070526123047, -0.017604827880859375, -0.01572895050048828, -0.013853073120117188, -0.011977195739746094, -0.010101318359375, -0.008225440979003906, -0.0063495635986328125, -0.004473686218261719, -0.002597808837890625, -0.0007219314575195312, 0.0011539459228515625, 0.0030298233032226562, 0.00490570068359375, 0.006781578063964844, 0.008657455444335938, 0.010533332824707031, 0.012409210205078125, 0.014285087585449219, 0.016160964965820312, 0.018036842346191406, 0.0199127197265625, 0.021788597106933594, 0.023664474487304688, 0.02554035186767578, 0.027416229248046875, 0.02929210662841797, 0.031167984008789062, 0.033043861389160156, 0.03491973876953125, 0.036795616149902344, 0.03867149353027344, 0.04054737091064453, 0.042423248291015625, 0.04429912567138672, 0.04617500305175781, 0.048050880432128906, 0.0499267578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 0.0, 11.0, 11.0, 13.0, 21.0, 37.0, 45.0, 57.0, 70.0, 80.0, 87.0, 94.0, 99.0, 60.0, 66.0, 55.0, 52.0, 38.0, 34.0, 30.0, 20.0, 4.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01041412353515625, -0.010114312171936035, -0.00981450080871582, -0.009514689445495605, -0.00921487808227539, -0.008915066719055176, -0.008615255355834961, -0.008315443992614746, -0.008015632629394531, -0.007715821266174316, -0.0074160099029541016, -0.007116198539733887, -0.006816387176513672, -0.006516575813293457, -0.006216764450073242, -0.005916953086853027, -0.0056171417236328125, -0.005317330360412598, -0.005017518997192383, -0.004717707633972168, -0.004417896270751953, -0.004118084907531738, -0.0038182735443115234, -0.0035184621810913086, -0.0032186508178710938, -0.002918839454650879, -0.002619028091430664, -0.0023192167282104492, -0.0020194053649902344, -0.0017195940017700195, -0.0014197826385498047, -0.0011199712753295898, -0.000820159912109375, -0.0005203485488891602, -0.0002205371856689453, 7.927417755126953e-05, 0.0003790855407714844, 0.0006788969039916992, 0.000978708267211914, 0.001278519630432129, 0.0015783309936523438, 0.0018781423568725586, 0.0021779537200927734, 0.0024777650833129883, 0.002777576446533203, 0.003077387809753418, 0.003377199172973633, 0.0036770105361938477, 0.0039768218994140625, 0.004276633262634277, 0.004576444625854492, 0.004876255989074707, 0.005176067352294922, 0.005475878715515137, 0.0057756900787353516, 0.006075501441955566, 0.006375312805175781, 0.006675124168395996, 0.006974935531616211, 0.007274746894836426, 0.007574558258056641, 0.007874369621276855, 0.00817418098449707, 0.008473992347717285, 0.0087738037109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 10.0, 19.0, 25.0, 32.0, 58.0, 107.0, 178.0, 343.0, 808.0, 2708.0, 12433.0, 775159.0, 3379586.0, 17422.0, 3533.0, 1089.0, 386.0, 164.0, 95.0, 44.0, 31.0, 19.0, 11.0, 5.0, 4.0, 9.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11993408203125, -0.1161947250366211, -0.11245536804199219, -0.10871601104736328, -0.10497665405273438, -0.10123729705810547, -0.09749794006347656, -0.09375858306884766, -0.09001922607421875, -0.08627986907958984, -0.08254051208496094, -0.07880115509033203, -0.07506179809570312, -0.07132244110107422, -0.06758308410644531, -0.0638437271118164, -0.0601043701171875, -0.056365013122558594, -0.05262565612792969, -0.04888629913330078, -0.045146942138671875, -0.04140758514404297, -0.03766822814941406, -0.033928871154785156, -0.03018951416015625, -0.026450157165527344, -0.022710800170898438, -0.01897144317626953, -0.015232086181640625, -0.011492729187011719, -0.0077533721923828125, -0.004014015197753906, -0.000274658203125, 0.0034646987915039062, 0.0072040557861328125, 0.010943412780761719, 0.014682769775390625, 0.01842212677001953, 0.022161483764648438, 0.025900840759277344, 0.02964019775390625, 0.033379554748535156, 0.03711891174316406, 0.04085826873779297, 0.044597625732421875, 0.04833698272705078, 0.05207633972167969, 0.055815696716308594, 0.0595550537109375, 0.0632944107055664, 0.06703376770019531, 0.07077312469482422, 0.07451248168945312, 0.07825183868408203, 0.08199119567871094, 0.08573055267333984, 0.08946990966796875, 0.09320926666259766, 0.09694862365722656, 0.10068798065185547, 0.10442733764648438, 0.10816669464111328, 0.11190605163574219, 0.1156454086303711, 0.119384765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 2.0, 11.0, 12.0, 23.0, 52.0, 150.0, 523.0, 2232.0, 743.0, 173.0, 73.0, 23.0, 12.0, 10.0, 9.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04351806640625, -0.0424959659576416, -0.0414738655090332, -0.040451765060424805, -0.039429664611816406, -0.03840756416320801, -0.03738546371459961, -0.03636336326599121, -0.03534126281738281, -0.034319162368774414, -0.033297061920166016, -0.03227496147155762, -0.03125286102294922, -0.03023076057434082, -0.029208660125732422, -0.028186559677124023, -0.027164459228515625, -0.026142358779907227, -0.025120258331298828, -0.02409815788269043, -0.02307605743408203, -0.022053956985473633, -0.021031856536865234, -0.020009756088256836, -0.018987655639648438, -0.01796555519104004, -0.01694345474243164, -0.015921354293823242, -0.014899253845214844, -0.013877153396606445, -0.012855052947998047, -0.011832952499389648, -0.01081085205078125, -0.009788751602172852, -0.008766651153564453, -0.007744550704956055, -0.006722450256347656, -0.005700349807739258, -0.004678249359130859, -0.003656148910522461, -0.0026340484619140625, -0.001611948013305664, -0.0005898475646972656, 0.0004322528839111328, 0.0014543533325195312, 0.0024764537811279297, 0.003498554229736328, 0.0045206546783447266, 0.005542755126953125, 0.0065648555755615234, 0.007586956024169922, 0.00860905647277832, 0.009631156921386719, 0.010653257369995117, 0.011675357818603516, 0.012697458267211914, 0.013719558715820312, 0.014741659164428711, 0.01576375961303711, 0.016785860061645508, 0.017807960510253906, 0.018830060958862305, 0.019852161407470703, 0.0208742618560791, 0.0218963623046875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 9.0, 29.0, 234.0, 547.0, 159.0, 20.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2559463381767273, -0.24125222861766815, -0.226558119058609, -0.21186402440071106, -0.19716991484165192, -0.18247580528259277, -0.16778171062469482, -0.15308760106563568, -0.13839349150657654, -0.1236993819475174, -0.10900527983903885, -0.0943111777305603, -0.07961706817150116, -0.06492295861244202, -0.05022885650396347, -0.035534754395484924, -0.02084064483642578, -0.006146539002656937, 0.008547566831111908, 0.023241672664880753, 0.0379357784986496, 0.05262988805770874, 0.06732399016618729, 0.08201809227466583, 0.09671220183372498, 0.11140631139278412, 0.12610042095184326, 0.1407945156097412, 0.15548862516880035, 0.1701827347278595, 0.18487682938575745, 0.1995709389448166, 0.21426504850387573, 0.22895915806293488, 0.24365326762199402, 0.25834736227989197, 0.2730414867401123, 0.28773558139801025, 0.3024296760559082, 0.31712377071380615, 0.3318178951740265, 0.34651198983192444, 0.3612061142921448, 0.3759002089500427, 0.3905943036079407, 0.405288428068161, 0.41998252272605896, 0.4346766471862793, 0.44937074184417725, 0.4640648365020752, 0.47875896096229553, 0.4934530556201935, 0.5081471800804138, 0.5228412747383118, 0.5375353693962097, 0.5522294640541077, 0.5669236183166504, 0.5816177129745483, 0.5963118076324463, 0.611005961894989, 0.625700056552887, 0.6403941512107849, 0.6550882458686829, 0.6697823405265808, 0.6844764351844788]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 12.0, 20.0, 22.0, 33.0, 38.0, 49.0, 51.0, 57.0, 79.0, 68.0, 61.0, 79.0, 70.0, 62.0, 37.0, 54.0, 44.0, 39.0, 28.0, 19.0, 10.0, 17.0, 11.0, 3.0, 7.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06843847036361694, -0.06586591899394989, -0.06329336017370224, -0.06072080880403519, -0.058148253709077835, -0.05557569861412048, -0.05300314724445343, -0.05043059214949608, -0.04785803705453873, -0.045285481959581375, -0.04271292686462402, -0.04014037549495697, -0.03756782039999962, -0.03499526530504227, -0.032422713935375214, -0.029850158840417862, -0.02727760374546051, -0.02470504865050316, -0.022132495418190956, -0.019559942185878754, -0.016987387090921402, -0.014414832927286625, -0.011842278763651848, -0.009269725531339645, -0.006697170436382294, -0.004124616272747517, -0.0015520621091127396, 0.0010204920545220375, 0.0035930462181568146, 0.006165600381791592, 0.008738154545426369, 0.011310707777738571, 0.013883262872695923, 0.016455817967653275, 0.019028371199965477, 0.02160092443227768, 0.02417347952723503, 0.026746034622192383, 0.029318587854504585, 0.03189114108681679, 0.03446369618177414, 0.03703625127673149, 0.03960880637168884, 0.042181357741355896, 0.04475391283631325, 0.0473264679312706, 0.04989901930093765, 0.052471574395895004, 0.055044129490852356, 0.05761668458580971, 0.06018923968076706, 0.06276179105043411, 0.06533434987068176, 0.06790690124034882, 0.07047945261001587, 0.07305200397968292, 0.07562456279993057, 0.07819711416959763, 0.08076967298984528, 0.08334222435951233, 0.08591477572917938, 0.08848733454942703, 0.09105988591909409, 0.09363244473934174, 0.09620499610900879]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 11.0, 14.0, 27.0, 37.0, 54.0, 82.0, 104.0, 184.0, 265.0, 448.0, 885.0, 1843.0, 4894.0, 18747.0, 102742.0, 640525.0, 230667.0, 34056.0, 7733.0, 2552.0, 1188.0, 559.0, 314.0, 215.0, 120.0, 93.0, 50.0, 41.0, 32.0, 17.0, 10.0, 10.0, 13.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04364013671875, -0.04211902618408203, -0.04059791564941406, -0.039076805114746094, -0.037555694580078125, -0.036034584045410156, -0.03451347351074219, -0.03299236297607422, -0.03147125244140625, -0.02995014190673828, -0.028429031372070312, -0.026907920837402344, -0.025386810302734375, -0.023865699768066406, -0.022344589233398438, -0.02082347869873047, -0.0193023681640625, -0.01778125762939453, -0.016260147094726562, -0.014739036560058594, -0.013217926025390625, -0.011696815490722656, -0.010175704956054688, -0.008654594421386719, -0.00713348388671875, -0.005612373352050781, -0.0040912628173828125, -0.0025701522827148438, -0.001049041748046875, 0.00047206878662109375, 0.0019931793212890625, 0.0035142898559570312, 0.005035400390625, 0.006556510925292969, 0.008077621459960938, 0.009598731994628906, 0.011119842529296875, 0.012640953063964844, 0.014162063598632812, 0.01568317413330078, 0.01720428466796875, 0.01872539520263672, 0.020246505737304688, 0.021767616271972656, 0.023288726806640625, 0.024809837341308594, 0.026330947875976562, 0.02785205841064453, 0.0293731689453125, 0.03089427947998047, 0.03241539001464844, 0.033936500549316406, 0.035457611083984375, 0.036978721618652344, 0.03849983215332031, 0.04002094268798828, 0.04154205322265625, 0.04306316375732422, 0.04458427429199219, 0.046105384826660156, 0.047626495361328125, 0.049147605895996094, 0.05066871643066406, 0.05218982696533203, 0.0537109375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 10.0, 17.0, 22.0, 26.0, 44.0, 64.0, 82.0, 82.0, 99.0, 106.0, 98.0, 78.0, 65.0, 63.0, 49.0, 34.0, 27.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01024627685546875, -0.009930729866027832, -0.009615182876586914, -0.009299635887145996, -0.008984088897705078, -0.00866854190826416, -0.008352994918823242, -0.008037447929382324, -0.007721900939941406, -0.007406353950500488, -0.00709080696105957, -0.006775259971618652, -0.006459712982177734, -0.006144165992736816, -0.0058286190032958984, -0.0055130720138549805, -0.0051975250244140625, -0.0048819780349731445, -0.0045664310455322266, -0.004250884056091309, -0.003935337066650391, -0.0036197900772094727, -0.0033042430877685547, -0.0029886960983276367, -0.0026731491088867188, -0.0023576021194458008, -0.002042055130004883, -0.0017265081405639648, -0.0014109611511230469, -0.001095414161682129, -0.0007798671722412109, -0.00046432018280029297, -0.000148773193359375, 0.00016677379608154297, 0.00048232078552246094, 0.0007978677749633789, 0.0011134147644042969, 0.0014289617538452148, 0.0017445087432861328, 0.0020600557327270508, 0.0023756027221679688, 0.0026911497116088867, 0.0030066967010498047, 0.0033222436904907227, 0.0036377906799316406, 0.003953337669372559, 0.0042688846588134766, 0.0045844316482543945, 0.0048999786376953125, 0.0052155256271362305, 0.0055310726165771484, 0.005846619606018066, 0.006162166595458984, 0.006477713584899902, 0.00679326057434082, 0.007108807563781738, 0.007424354553222656, 0.007739901542663574, 0.008055448532104492, 0.00837099552154541, 0.008686542510986328, 0.009002089500427246, 0.009317636489868164, 0.009633183479309082, 0.00994873046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 10.0, 11.0, 18.0, 19.0, 31.0, 51.0, 66.0, 122.0, 164.0, 249.0, 379.0, 590.0, 1002.0, 1685.0, 3012.0, 5252.0, 9548.0, 18160.0, 36287.0, 75553.0, 176218.0, 316742.0, 218676.0, 93922.0, 43304.0, 21537.0, 11213.0, 6139.0, 3487.0, 1945.0, 1206.0, 700.0, 445.0, 281.0, 183.0, 96.0, 66.0, 53.0, 37.0, 25.0, 23.0, 10.0, 10.0, 10.0, 3.0, 4.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.014495849609375, -0.014037609100341797, -0.013579368591308594, -0.01312112808227539, -0.012662887573242188, -0.012204647064208984, -0.011746406555175781, -0.011288166046142578, -0.010829925537109375, -0.010371685028076172, -0.009913444519042969, -0.009455204010009766, -0.008996963500976562, -0.00853872299194336, -0.008080482482910156, -0.007622241973876953, -0.00716400146484375, -0.006705760955810547, -0.006247520446777344, -0.005789279937744141, -0.0053310394287109375, -0.004872798919677734, -0.004414558410644531, -0.003956317901611328, -0.003498077392578125, -0.003039836883544922, -0.0025815963745117188, -0.0021233558654785156, -0.0016651153564453125, -0.0012068748474121094, -0.0007486343383789062, -0.0002903938293457031, 0.0001678466796875, 0.0006260871887207031, 0.0010843276977539062, 0.0015425682067871094, 0.0020008087158203125, 0.0024590492248535156, 0.0029172897338867188, 0.003375530242919922, 0.003833770751953125, 0.004292011260986328, 0.004750251770019531, 0.005208492279052734, 0.0056667327880859375, 0.006124973297119141, 0.006583213806152344, 0.007041454315185547, 0.00749969482421875, 0.007957935333251953, 0.008416175842285156, 0.00887441635131836, 0.009332656860351562, 0.009790897369384766, 0.010249137878417969, 0.010707378387451172, 0.011165618896484375, 0.011623859405517578, 0.012082099914550781, 0.012540340423583984, 0.012998580932617188, 0.01345682144165039, 0.013915061950683594, 0.014373302459716797, 0.01483154296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 7.0, 7.0, 11.0, 21.0, 10.0, 13.0, 20.0, 30.0, 28.0, 21.0, 37.0, 26.0, 36.0, 41.0, 48.0, 46.0, 54.0, 42.0, 47.0, 37.0, 31.0, 44.0, 33.0, 39.0, 31.0, 39.0, 27.0, 21.0, 26.0, 23.0, 19.0, 12.0, 13.0, 9.0, 9.0, 7.0, 2.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0189971923828125, -0.018414020538330078, -0.017830848693847656, -0.017247676849365234, -0.016664505004882812, -0.01608133316040039, -0.015498161315917969, -0.014914989471435547, -0.014331817626953125, -0.013748645782470703, -0.013165473937988281, -0.01258230209350586, -0.011999130249023438, -0.011415958404541016, -0.010832786560058594, -0.010249614715576172, -0.00966644287109375, -0.009083271026611328, -0.008500099182128906, -0.007916927337646484, -0.0073337554931640625, -0.006750583648681641, -0.006167411804199219, -0.005584239959716797, -0.005001068115234375, -0.004417896270751953, -0.0038347244262695312, -0.0032515525817871094, -0.0026683807373046875, -0.0020852088928222656, -0.0015020370483398438, -0.0009188652038574219, -0.000335693359375, 0.0002474784851074219, 0.0008306503295898438, 0.0014138221740722656, 0.0019969940185546875, 0.0025801658630371094, 0.0031633377075195312, 0.003746509552001953, 0.004329681396484375, 0.004912853240966797, 0.005496025085449219, 0.006079196929931641, 0.0066623687744140625, 0.007245540618896484, 0.007828712463378906, 0.008411884307861328, 0.00899505615234375, 0.009578227996826172, 0.010161399841308594, 0.010744571685791016, 0.011327743530273438, 0.01191091537475586, 0.012494087219238281, 0.013077259063720703, 0.013660430908203125, 0.014243602752685547, 0.014826774597167969, 0.01540994644165039, 0.015993118286132812, 0.016576290130615234, 0.017159461975097656, 0.017742633819580078, 0.0183258056640625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 12.0, 10.0, 21.0, 20.0, 30.0, 44.0, 52.0, 86.0, 111.0, 175.0, 301.0, 460.0, 912.0, 1988.0, 6060.0, 23481.0, 123450.0, 476880.0, 330899.0, 63385.0, 13233.0, 3681.0, 1386.0, 680.0, 380.0, 229.0, 153.0, 113.0, 71.0, 59.0, 46.0, 27.0, 22.0, 23.0, 16.0, 10.0, 8.0, 5.0, 5.0, 4.0, 6.0, 2.0, 1.0, 3.0], "bins": [-0.01239013671875, -0.012062430381774902, -0.011734724044799805, -0.011407017707824707, -0.01107931137084961, -0.010751605033874512, -0.010423898696899414, -0.010096192359924316, -0.009768486022949219, -0.009440779685974121, -0.009113073348999023, -0.008785367012023926, -0.008457660675048828, -0.00812995433807373, -0.007802248001098633, -0.007474541664123535, -0.0071468353271484375, -0.00681912899017334, -0.006491422653198242, -0.0061637163162231445, -0.005836009979248047, -0.005508303642272949, -0.0051805973052978516, -0.004852890968322754, -0.004525184631347656, -0.004197478294372559, -0.003869771957397461, -0.0035420656204223633, -0.0032143592834472656, -0.002886652946472168, -0.0025589466094970703, -0.0022312402725219727, -0.001903533935546875, -0.0015758275985717773, -0.0012481212615966797, -0.000920414924621582, -0.0005927085876464844, -0.0002650022506713867, 6.270408630371094e-05, 0.0003904104232788086, 0.0007181167602539062, 0.001045823097229004, 0.0013735294342041016, 0.0017012357711791992, 0.002028942108154297, 0.0023566484451293945, 0.002684354782104492, 0.00301206111907959, 0.0033397674560546875, 0.003667473793029785, 0.003995180130004883, 0.0043228864669799805, 0.004650592803955078, 0.004978299140930176, 0.0053060054779052734, 0.005633711814880371, 0.005961418151855469, 0.006289124488830566, 0.006616830825805664, 0.006944537162780762, 0.007272243499755859, 0.007599949836730957, 0.007927656173706055, 0.008255362510681152, 0.00858306884765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 9.0, 5.0, 4.0, 15.0, 22.0, 22.0, 33.0, 55.0, 62.0, 86.0, 86.0, 106.0, 100.0, 90.0, 83.0, 58.0, 54.0, 40.0, 29.0, 17.0, 14.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.56382942199707e-05, -7.303338497877121e-05, -7.042847573757172e-05, -6.782356649637222e-05, -6.521865725517273e-05, -6.261374801397324e-05, -6.000883877277374e-05, -5.740392953157425e-05, -5.4799020290374756e-05, -5.219411104917526e-05, -4.958920180797577e-05, -4.6984292566776276e-05, -4.437938332557678e-05, -4.177447408437729e-05, -3.9169564843177795e-05, -3.65646556019783e-05, -3.395974636077881e-05, -3.1354837119579315e-05, -2.8749927878379822e-05, -2.614501863718033e-05, -2.3540109395980835e-05, -2.093520015478134e-05, -1.8330290913581848e-05, -1.5725381672382355e-05, -1.3120472431182861e-05, -1.0515563189983368e-05, -7.910653948783875e-06, -5.305744707584381e-06, -2.7008354663848877e-06, -9.592622518539429e-08, 2.508983016014099e-06, 5.1138922572135925e-06, 7.718801498413086e-06, 1.032371073961258e-05, 1.2928619980812073e-05, 1.5533529222011566e-05, 1.813843846321106e-05, 2.0743347704410553e-05, 2.3348256945610046e-05, 2.595316618680954e-05, 2.8558075428009033e-05, 3.1162984669208527e-05, 3.376789391040802e-05, 3.6372803151607513e-05, 3.897771239280701e-05, 4.15826216340065e-05, 4.4187530875205994e-05, 4.679244011640549e-05, 4.939734935760498e-05, 5.2002258598804474e-05, 5.460716784000397e-05, 5.721207708120346e-05, 5.9816986322402954e-05, 6.242189556360245e-05, 6.502680480480194e-05, 6.763171404600143e-05, 7.023662328720093e-05, 7.284153252840042e-05, 7.544644176959991e-05, 7.805135101079941e-05, 8.06562602519989e-05, 8.32611694931984e-05, 8.586607873439789e-05, 8.847098797559738e-05, 9.107589721679688e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 2.0, 5.0, 7.0, 15.0, 32.0, 47.0, 61.0, 114.0, 176.0, 322.0, 588.0, 1409.0, 4172.0, 17925.0, 131465.0, 580564.0, 267140.0, 34321.0, 6508.0, 1931.0, 840.0, 407.0, 178.0, 121.0, 78.0, 48.0, 21.0, 22.0, 15.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0158538818359375, -0.015433073043823242, -0.015012264251708984, -0.014591455459594727, -0.014170646667480469, -0.013749837875366211, -0.013329029083251953, -0.012908220291137695, -0.012487411499023438, -0.01206660270690918, -0.011645793914794922, -0.011224985122680664, -0.010804176330566406, -0.010383367538452148, -0.00996255874633789, -0.009541749954223633, -0.009120941162109375, -0.008700132369995117, -0.00827932357788086, -0.007858514785766602, -0.007437705993652344, -0.007016897201538086, -0.006596088409423828, -0.00617527961730957, -0.0057544708251953125, -0.005333662033081055, -0.004912853240966797, -0.004492044448852539, -0.004071235656738281, -0.0036504268646240234, -0.0032296180725097656, -0.002808809280395508, -0.00238800048828125, -0.001967191696166992, -0.0015463829040527344, -0.0011255741119384766, -0.0007047653198242188, -0.00028395652770996094, 0.00013685226440429688, 0.0005576610565185547, 0.0009784698486328125, 0.0013992786407470703, 0.0018200874328613281, 0.002240896224975586, 0.0026617050170898438, 0.0030825138092041016, 0.0035033226013183594, 0.003924131393432617, 0.004344940185546875, 0.004765748977661133, 0.005186557769775391, 0.0056073665618896484, 0.006028175354003906, 0.006448984146118164, 0.006869792938232422, 0.00729060173034668, 0.0077114105224609375, 0.008132219314575195, 0.008553028106689453, 0.008973836898803711, 0.009394645690917969, 0.009815454483032227, 0.010236263275146484, 0.010657072067260742, 0.011077880859375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 11.0, 30.0, 27.0, 59.0, 87.0, 109.0, 143.0, 149.0, 122.0, 96.0, 46.0, 44.0, 22.0, 13.0, 11.0, 9.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0171051025390625, -0.01657271385192871, -0.016040325164794922, -0.015507936477661133, -0.014975547790527344, -0.014443159103393555, -0.013910770416259766, -0.013378381729125977, -0.012845993041992188, -0.012313604354858398, -0.01178121566772461, -0.01124882698059082, -0.010716438293457031, -0.010184049606323242, -0.009651660919189453, -0.009119272232055664, -0.008586883544921875, -0.008054494857788086, -0.007522106170654297, -0.006989717483520508, -0.006457328796386719, -0.00592494010925293, -0.005392551422119141, -0.0048601627349853516, -0.0043277740478515625, -0.0037953853607177734, -0.0032629966735839844, -0.0027306079864501953, -0.0021982192993164062, -0.0016658306121826172, -0.0011334419250488281, -0.0006010532379150391, -6.866455078125e-05, 0.00046372413635253906, 0.0009961128234863281, 0.0015285015106201172, 0.0020608901977539062, 0.0025932788848876953, 0.0031256675720214844, 0.0036580562591552734, 0.0041904449462890625, 0.0047228336334228516, 0.005255222320556641, 0.00578761100769043, 0.006319999694824219, 0.006852388381958008, 0.007384777069091797, 0.007917165756225586, 0.008449554443359375, 0.008981943130493164, 0.009514331817626953, 0.010046720504760742, 0.010579109191894531, 0.01111149787902832, 0.01164388656616211, 0.012176275253295898, 0.012708663940429688, 0.013241052627563477, 0.013773441314697266, 0.014305830001831055, 0.014838218688964844, 0.015370607376098633, 0.015902996063232422, 0.01643538475036621, 0.0169677734375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 3.0, 6.0, 13.0, 20.0, 37.0, 46.0, 59.0, 90.0, 112.0, 142.0, 121.0, 98.0, 75.0, 59.0, 37.0, 22.0, 26.0, 13.0, 5.0, 8.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07135280966758728, -0.06702051311731339, -0.06268821656703949, -0.058355916291475296, -0.0540236197412014, -0.049691323190927505, -0.04535902291536331, -0.041026726365089417, -0.03669442981481552, -0.032362133264541626, -0.02802983485162258, -0.023697536438703537, -0.01936523988842964, -0.015032943338155746, -0.010700644925236702, -0.0063683465123176575, -0.002036049962043762, 0.0022962475195527077, 0.0066285450011491776, 0.010960842482745647, 0.015293139964342117, 0.019625436514616013, 0.023957734927535057, 0.0282900333404541, 0.032622329890728, 0.03695462644100189, 0.04128692299127579, 0.04561922326683998, 0.049951519817113876, 0.05428381636738777, 0.058616116642951965, 0.06294841319322586, 0.06728069484233856, 0.07161299139261246, 0.07594528794288635, 0.08027758449316025, 0.08460988104343414, 0.08894218504428864, 0.09327448159456253, 0.09760677814483643, 0.10193907469511032, 0.10627137124538422, 0.11060366779565811, 0.114935964345932, 0.1192682683467865, 0.1236005574464798, 0.1279328614473343, 0.1322651505470276, 0.13659745454788208, 0.14092975854873657, 0.14526204764842987, 0.14959435164928436, 0.15392664074897766, 0.15825894474983215, 0.16259123384952545, 0.16692353785037994, 0.17125582695007324, 0.17558813095092773, 0.17992042005062103, 0.18425272405147552, 0.18858501315116882, 0.19291731715202332, 0.1972496062517166, 0.2015819102525711, 0.2059142142534256]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 1.0, 4.0, 4.0, 3.0, 7.0, 5.0, 14.0, 12.0, 15.0, 17.0, 15.0, 25.0, 26.0, 32.0, 34.0, 31.0, 34.0, 27.0, 50.0, 45.0, 31.0, 39.0, 43.0, 42.0, 38.0, 36.0, 42.0, 42.0, 34.0, 27.0, 32.0, 19.0, 27.0, 20.0, 17.0, 14.0, 18.0, 13.0, 7.0, 11.0, 17.0, 5.0, 9.0, 5.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.09580373764038086, -0.09271527081727982, -0.08962679654359818, -0.08653832972049713, -0.08344985544681549, -0.08036138862371445, -0.0772729218006134, -0.07418444752693176, -0.07109598070383072, -0.06800751388072968, -0.06491903960704803, -0.06183057278394699, -0.05874210223555565, -0.05565363168716431, -0.05256516486406326, -0.04947669431567192, -0.04638822376728058, -0.043299753218889236, -0.040211282670497894, -0.03712281584739685, -0.03403434529900551, -0.030945874750614166, -0.027857406064867973, -0.02476893737912178, -0.021680466830730438, -0.018591996282339096, -0.015503527596592903, -0.012415057979524136, -0.009326588362455368, -0.0062381187453866005, -0.003149649128317833, -6.118044257164001e-05, 0.003027290105819702, 0.00611575972288847, 0.009204229339957237, 0.012292698957026005, 0.015381168574094772, 0.018469639122486115, 0.021558107808232307, 0.0246465764939785, 0.027735047042369843, 0.030823517590761185, 0.03391198813915253, 0.03700045496225357, 0.04008892551064491, 0.043177396059036255, 0.0462658628821373, 0.04935433343052864, 0.05244280397891998, 0.055531274527311325, 0.05861974507570267, 0.06170821189880371, 0.06479668617248535, 0.0678851529955864, 0.07097361981868744, 0.07406209409236908, 0.07715056091547012, 0.08023902773857117, 0.08332750201225281, 0.08641596883535385, 0.0895044356584549, 0.09259290993213654, 0.09568137675523758, 0.09876984357833862, 0.10185831785202026]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 2.0, 3.0, 4.0, 12.0, 16.0, 25.0, 19.0, 31.0, 48.0, 78.0, 125.0, 185.0, 318.0, 531.0, 1214.0, 2942.0, 8911.0, 41510.0, 1063662.0, 3000141.0, 58037.0, 10746.0, 3158.0, 1250.0, 561.0, 282.0, 180.0, 113.0, 54.0, 42.0, 25.0, 26.0, 8.0, 9.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03570556640625, -0.03455686569213867, -0.033408164978027344, -0.032259464263916016, -0.031110763549804688, -0.02996206283569336, -0.02881336212158203, -0.027664661407470703, -0.026515960693359375, -0.025367259979248047, -0.02421855926513672, -0.02306985855102539, -0.021921157836914062, -0.020772457122802734, -0.019623756408691406, -0.018475055694580078, -0.01732635498046875, -0.016177654266357422, -0.015028953552246094, -0.013880252838134766, -0.012731552124023438, -0.01158285140991211, -0.010434150695800781, -0.009285449981689453, -0.008136749267578125, -0.006988048553466797, -0.005839347839355469, -0.004690647125244141, -0.0035419464111328125, -0.0023932456970214844, -0.0012445449829101562, -9.584426879882812e-05, 0.0010528564453125, 0.002201557159423828, 0.0033502578735351562, 0.004498958587646484, 0.0056476593017578125, 0.006796360015869141, 0.007945060729980469, 0.009093761444091797, 0.010242462158203125, 0.011391162872314453, 0.012539863586425781, 0.01368856430053711, 0.014837265014648438, 0.015985965728759766, 0.017134666442871094, 0.018283367156982422, 0.01943206787109375, 0.020580768585205078, 0.021729469299316406, 0.022878170013427734, 0.024026870727539062, 0.02517557144165039, 0.02632427215576172, 0.027472972869873047, 0.028621673583984375, 0.029770374298095703, 0.03091907501220703, 0.03206777572631836, 0.03321647644042969, 0.034365177154541016, 0.035513877868652344, 0.03666257858276367, 0.037811279296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 18.0, 25.0, 27.0, 34.0, 50.0, 71.0, 69.0, 66.0, 84.0, 96.0, 78.0, 99.0, 67.0, 58.0, 45.0, 26.0, 37.0, 9.0, 10.0, 9.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.009368896484375, -0.009078264236450195, -0.00878763198852539, -0.008496999740600586, -0.008206367492675781, -0.007915735244750977, -0.007625102996826172, -0.007334470748901367, -0.0070438385009765625, -0.006753206253051758, -0.006462574005126953, -0.0061719417572021484, -0.005881309509277344, -0.005590677261352539, -0.005300045013427734, -0.00500941276550293, -0.004718780517578125, -0.00442814826965332, -0.004137516021728516, -0.003846883773803711, -0.0035562515258789062, -0.0032656192779541016, -0.002974987030029297, -0.002684354782104492, -0.0023937225341796875, -0.002103090286254883, -0.0018124580383300781, -0.0015218257904052734, -0.0012311935424804688, -0.0009405612945556641, -0.0006499290466308594, -0.0003592967987060547, -6.866455078125e-05, 0.0002219676971435547, 0.0005125999450683594, 0.0008032321929931641, 0.0010938644409179688, 0.0013844966888427734, 0.0016751289367675781, 0.001965761184692383, 0.0022563934326171875, 0.002547025680541992, 0.002837657928466797, 0.0031282901763916016, 0.0034189224243164062, 0.003709554672241211, 0.004000186920166016, 0.00429081916809082, 0.004581451416015625, 0.00487208366394043, 0.005162715911865234, 0.005453348159790039, 0.005743980407714844, 0.0060346126556396484, 0.006325244903564453, 0.006615877151489258, 0.0069065093994140625, 0.007197141647338867, 0.007487773895263672, 0.0077784061431884766, 0.008069038391113281, 0.008359670639038086, 0.00865030288696289, 0.008940935134887695, 0.0092315673828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 11.0, 7.0, 11.0, 15.0, 22.0, 36.0, 49.0, 61.0, 98.0, 184.0, 282.0, 634.0, 1757.0, 6254.0, 31777.0, 698826.0, 3364615.0, 74578.0, 10566.0, 2712.0, 828.0, 400.0, 195.0, 110.0, 76.0, 55.0, 39.0, 22.0, 12.0, 17.0, 9.0, 4.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03253173828125, -0.03145408630371094, -0.030376434326171875, -0.029298782348632812, -0.02822113037109375, -0.027143478393554688, -0.026065826416015625, -0.024988174438476562, -0.0239105224609375, -0.022832870483398438, -0.021755218505859375, -0.020677566528320312, -0.01959991455078125, -0.018522262573242188, -0.017444610595703125, -0.016366958618164062, -0.015289306640625, -0.014211654663085938, -0.013134002685546875, -0.012056350708007812, -0.01097869873046875, -0.009901046752929688, -0.008823394775390625, -0.0077457427978515625, -0.0066680908203125, -0.0055904388427734375, -0.004512786865234375, -0.0034351348876953125, -0.00235748291015625, -0.0012798309326171875, -0.000202178955078125, 0.0008754730224609375, 0.001953125, 0.0030307769775390625, 0.004108428955078125, 0.0051860809326171875, 0.00626373291015625, 0.0073413848876953125, 0.008419036865234375, 0.009496688842773438, 0.0105743408203125, 0.011651992797851562, 0.012729644775390625, 0.013807296752929688, 0.01488494873046875, 0.015962600708007812, 0.017040252685546875, 0.018117904663085938, 0.019195556640625, 0.020273208618164062, 0.021350860595703125, 0.022428512573242188, 0.02350616455078125, 0.024583816528320312, 0.025661468505859375, 0.026739120483398438, 0.0278167724609375, 0.028894424438476562, 0.029972076416015625, 0.031049728393554688, 0.03212738037109375, 0.03320503234863281, 0.034282684326171875, 0.03536033630371094, 0.03643798828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 8.0, 2.0, 9.0, 10.0, 17.0, 22.0, 21.0, 52.0, 119.0, 233.0, 724.0, 1599.0, 719.0, 261.0, 141.0, 60.0, 28.0, 14.0, 13.0, 9.0, 5.0, 2.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01491546630859375, -0.014537572860717773, -0.014159679412841797, -0.01378178596496582, -0.013403892517089844, -0.013025999069213867, -0.01264810562133789, -0.012270212173461914, -0.011892318725585938, -0.011514425277709961, -0.011136531829833984, -0.010758638381958008, -0.010380744934082031, -0.010002851486206055, -0.009624958038330078, -0.009247064590454102, -0.008869171142578125, -0.008491277694702148, -0.008113384246826172, -0.007735490798950195, -0.007357597351074219, -0.006979703903198242, -0.006601810455322266, -0.006223917007446289, -0.0058460235595703125, -0.005468130111694336, -0.005090236663818359, -0.004712343215942383, -0.004334449768066406, -0.00395655632019043, -0.003578662872314453, -0.0032007694244384766, -0.0028228759765625, -0.0024449825286865234, -0.002067089080810547, -0.0016891956329345703, -0.0013113021850585938, -0.0009334087371826172, -0.0005555152893066406, -0.00017762184143066406, 0.0002002716064453125, 0.0005781650543212891, 0.0009560585021972656, 0.0013339519500732422, 0.0017118453979492188, 0.0020897388458251953, 0.002467632293701172, 0.0028455257415771484, 0.003223419189453125, 0.0036013126373291016, 0.003979206085205078, 0.004357099533081055, 0.004734992980957031, 0.005112886428833008, 0.005490779876708984, 0.005868673324584961, 0.0062465667724609375, 0.006624460220336914, 0.007002353668212891, 0.007380247116088867, 0.007758140563964844, 0.00813603401184082, 0.008513927459716797, 0.008891820907592773, 0.00926971435546875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 49.0, 340.0, 493.0, 103.0, 18.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24192523956298828, -0.23437495529651642, -0.22682467103004456, -0.2192743867635727, -0.21172410249710083, -0.20417381823062897, -0.1966235339641571, -0.18907324969768524, -0.18152296543121338, -0.17397268116474152, -0.16642239689826965, -0.1588721126317978, -0.15132182836532593, -0.14377154409885406, -0.1362212598323822, -0.12867097556591034, -0.12112069129943848, -0.11357040703296661, -0.10602012276649475, -0.09846983850002289, -0.09091955423355103, -0.08336926996707916, -0.0758189857006073, -0.06826870143413544, -0.060718417167663574, -0.05316813290119171, -0.04561784863471985, -0.038067564368247986, -0.030517280101776123, -0.02296699583530426, -0.015416711568832397, -0.007866427302360535, -0.0003161430358886719, 0.007234141230583191, 0.014784425497055054, 0.022334709763526917, 0.02988499402999878, 0.03743527829647064, 0.044985562562942505, 0.05253584682941437, 0.06008613109588623, 0.0676364153623581, 0.07518669962882996, 0.08273698389530182, 0.09028726816177368, 0.09783755242824554, 0.10538783669471741, 0.11293812096118927, 0.12048840522766113, 0.128038689494133, 0.13558897376060486, 0.14313925802707672, 0.15068954229354858, 0.15823982656002045, 0.1657901108264923, 0.17334039509296417, 0.18089067935943604, 0.1884409636259079, 0.19599124789237976, 0.20354153215885162, 0.2110918164253235, 0.21864210069179535, 0.2261923849582672, 0.23374266922473907, 0.24129295349121094]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 9.0, 5.0, 8.0, 9.0, 20.0, 18.0, 30.0, 46.0, 53.0, 59.0, 61.0, 54.0, 56.0, 73.0, 61.0, 68.0, 61.0, 52.0, 46.0, 47.0, 41.0, 34.0, 29.0, 14.0, 6.0, 13.0, 10.0, 4.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030660152435302734, -0.029400061815977097, -0.028139973059296608, -0.02687988430261612, -0.02561979368329048, -0.024359703063964844, -0.023099614307284355, -0.021839525550603867, -0.02057943493127823, -0.01931934431195259, -0.018059255555272102, -0.016799166798591614, -0.015539076179265976, -0.014278986491262913, -0.01301889680325985, -0.011758807115256786, -0.010498717427253723, -0.00923862773925066, -0.007978538051247597, -0.0067184483632445335, -0.00545835867524147, -0.004198268987238407, -0.002938179299235344, -0.0016780896112322807, -0.00041799992322921753, 0.0008420897647738457, 0.002102179452776909, 0.003362269140779972, 0.004622358828783035, 0.0058824485167860985, 0.007142538204789162, 0.008402627892792225, 0.009662717580795288, 0.010922807268798351, 0.012182896956801414, 0.013442986644804478, 0.014703076332807541, 0.01596316695213318, 0.017223255708813667, 0.018483344465494156, 0.019743435084819794, 0.02100352570414543, 0.02226361446082592, 0.02352370321750641, 0.024783793836832047, 0.026043884456157684, 0.027303973212838173, 0.02856406196951866, 0.0298241525888443, 0.031084243208169937, 0.032344333827495575, 0.033604420721530914, 0.03486451134085655, 0.03612460196018219, 0.03738468885421753, 0.03864477947354317, 0.039904870092868805, 0.04116496071219444, 0.04242505133152008, 0.04368513822555542, 0.04494522884488106, 0.046205319464206696, 0.047465406358242035, 0.04872549697756767, 0.04998558759689331]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 7.0, 3.0, 0.0, 4.0, 10.0, 10.0, 15.0, 14.0, 22.0, 30.0, 52.0, 79.0, 81.0, 128.0, 195.0, 290.0, 412.0, 732.0, 1275.0, 2494.0, 5932.0, 16201.0, 52594.0, 220383.0, 499032.0, 179790.0, 44252.0, 13941.0, 5190.0, 2275.0, 1147.0, 682.0, 414.0, 253.0, 175.0, 133.0, 94.0, 74.0, 36.0, 40.0, 19.0, 19.0, 8.0, 10.0, 7.0, 2.0, 4.0, 2.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023345947265625, -0.02252483367919922, -0.021703720092773438, -0.020882606506347656, -0.020061492919921875, -0.019240379333496094, -0.018419265747070312, -0.01759815216064453, -0.01677703857421875, -0.01595592498779297, -0.015134811401367188, -0.014313697814941406, -0.013492584228515625, -0.012671470642089844, -0.011850357055664062, -0.011029243469238281, -0.0102081298828125, -0.009387016296386719, -0.008565902709960938, -0.007744789123535156, -0.006923675537109375, -0.006102561950683594, -0.0052814483642578125, -0.004460334777832031, -0.00363922119140625, -0.0028181076049804688, -0.0019969940185546875, -0.0011758804321289062, -0.000354766845703125, 0.00046634674072265625, 0.0012874603271484375, 0.0021085739135742188, 0.0029296875, 0.0037508010864257812, 0.0045719146728515625, 0.005393028259277344, 0.006214141845703125, 0.007035255432128906, 0.007856369018554688, 0.008677482604980469, 0.00949859619140625, 0.010319709777832031, 0.011140823364257812, 0.011961936950683594, 0.012783050537109375, 0.013604164123535156, 0.014425277709960938, 0.015246391296386719, 0.0160675048828125, 0.01688861846923828, 0.017709732055664062, 0.018530845642089844, 0.019351959228515625, 0.020173072814941406, 0.020994186401367188, 0.02181529998779297, 0.02263641357421875, 0.02345752716064453, 0.024278640747070312, 0.025099754333496094, 0.025920867919921875, 0.026741981506347656, 0.027563095092773438, 0.02838420867919922, 0.029205322265625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 22.0, 32.0, 25.0, 45.0, 59.0, 67.0, 77.0, 82.0, 99.0, 96.0, 84.0, 80.0, 66.0, 48.0, 38.0, 20.0, 15.0, 10.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01035308837890625, -0.010053515434265137, -0.009753942489624023, -0.00945436954498291, -0.009154796600341797, -0.008855223655700684, -0.00855565071105957, -0.008256077766418457, -0.007956504821777344, -0.0076569318771362305, -0.007357358932495117, -0.007057785987854004, -0.006758213043212891, -0.006458640098571777, -0.006159067153930664, -0.005859494209289551, -0.0055599212646484375, -0.005260348320007324, -0.004960775375366211, -0.004661202430725098, -0.004361629486083984, -0.004062056541442871, -0.003762483596801758, -0.0034629106521606445, -0.0031633377075195312, -0.002863764762878418, -0.0025641918182373047, -0.0022646188735961914, -0.001965045928955078, -0.0016654729843139648, -0.0013659000396728516, -0.0010663270950317383, -0.000766754150390625, -0.0004671812057495117, -0.00016760826110839844, 0.00013196468353271484, 0.0004315376281738281, 0.0007311105728149414, 0.0010306835174560547, 0.001330256462097168, 0.0016298294067382812, 0.0019294023513793945, 0.002228975296020508, 0.002528548240661621, 0.0028281211853027344, 0.0031276941299438477, 0.003427267074584961, 0.0037268400192260742, 0.0040264129638671875, 0.004325985908508301, 0.004625558853149414, 0.004925131797790527, 0.005224704742431641, 0.005524277687072754, 0.005823850631713867, 0.0061234235763549805, 0.006422996520996094, 0.006722569465637207, 0.00702214241027832, 0.007321715354919434, 0.007621288299560547, 0.00792086124420166, 0.008220434188842773, 0.008520007133483887, 0.008819580078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 8.0, 9.0, 18.0, 12.0, 24.0, 54.0, 79.0, 115.0, 164.0, 313.0, 447.0, 772.0, 1397.0, 2821.0, 5248.0, 10415.0, 22571.0, 51811.0, 132114.0, 308350.0, 296456.0, 124113.0, 48887.0, 21403.0, 9916.0, 5115.0, 2564.0, 1410.0, 788.0, 413.0, 265.0, 181.0, 106.0, 68.0, 26.0, 25.0, 24.0, 17.0, 10.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01358795166015625, -0.013118863105773926, -0.012649774551391602, -0.012180685997009277, -0.011711597442626953, -0.011242508888244629, -0.010773420333862305, -0.01030433177947998, -0.009835243225097656, -0.009366154670715332, -0.008897066116333008, -0.008427977561950684, -0.00795888900756836, -0.007489800453186035, -0.007020711898803711, -0.006551623344421387, -0.0060825347900390625, -0.005613446235656738, -0.005144357681274414, -0.00467526912689209, -0.004206180572509766, -0.0037370920181274414, -0.003268003463745117, -0.002798914909362793, -0.0023298263549804688, -0.0018607378005981445, -0.0013916492462158203, -0.0009225606918334961, -0.0004534721374511719, 1.5616416931152344e-05, 0.00048470497131347656, 0.0009537935256958008, 0.001422882080078125, 0.0018919706344604492, 0.0023610591888427734, 0.0028301477432250977, 0.003299236297607422, 0.003768324851989746, 0.00423741340637207, 0.0047065019607543945, 0.005175590515136719, 0.005644679069519043, 0.006113767623901367, 0.006582856178283691, 0.007051944732666016, 0.00752103328704834, 0.007990121841430664, 0.008459210395812988, 0.008928298950195312, 0.009397387504577637, 0.009866476058959961, 0.010335564613342285, 0.01080465316772461, 0.011273741722106934, 0.011742830276489258, 0.012211918830871582, 0.012681007385253906, 0.01315009593963623, 0.013619184494018555, 0.014088273048400879, 0.014557361602783203, 0.015026450157165527, 0.015495538711547852, 0.015964627265930176, 0.0164337158203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 8.0, 2.0, 5.0, 5.0, 12.0, 11.0, 9.0, 16.0, 21.0, 21.0, 26.0, 29.0, 31.0, 38.0, 41.0, 47.0, 41.0, 31.0, 53.0, 50.0, 39.0, 51.0, 35.0, 43.0, 44.0, 30.0, 34.0, 44.0, 33.0, 21.0, 28.0, 24.0, 16.0, 13.0, 8.0, 17.0, 11.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.022216796875, -0.0215914249420166, -0.020966053009033203, -0.020340681076049805, -0.019715309143066406, -0.019089937210083008, -0.01846456527709961, -0.01783919334411621, -0.017213821411132812, -0.016588449478149414, -0.015963077545166016, -0.015337705612182617, -0.014712333679199219, -0.01408696174621582, -0.013461589813232422, -0.012836217880249023, -0.012210845947265625, -0.011585474014282227, -0.010960102081298828, -0.01033473014831543, -0.009709358215332031, -0.009083986282348633, -0.008458614349365234, -0.007833242416381836, -0.0072078704833984375, -0.006582498550415039, -0.005957126617431641, -0.005331754684448242, -0.004706382751464844, -0.004081010818481445, -0.003455638885498047, -0.0028302669525146484, -0.00220489501953125, -0.0015795230865478516, -0.0009541511535644531, -0.0003287792205810547, 0.00029659271240234375, 0.0009219646453857422, 0.0015473365783691406, 0.002172708511352539, 0.0027980804443359375, 0.003423452377319336, 0.004048824310302734, 0.004674196243286133, 0.005299568176269531, 0.00592494010925293, 0.006550312042236328, 0.0071756839752197266, 0.007801055908203125, 0.008426427841186523, 0.009051799774169922, 0.00967717170715332, 0.010302543640136719, 0.010927915573120117, 0.011553287506103516, 0.012178659439086914, 0.012804031372070312, 0.013429403305053711, 0.01405477523803711, 0.014680147171020508, 0.015305519104003906, 0.015930891036987305, 0.016556262969970703, 0.0171816349029541, 0.0178070068359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 11.0, 9.0, 18.0, 26.0, 42.0, 55.0, 72.0, 148.0, 259.0, 797.0, 2870.0, 17326.0, 275662.0, 686320.0, 56574.0, 5967.0, 1445.0, 423.0, 213.0, 128.0, 63.0, 37.0, 32.0, 15.0, 10.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.0213165283203125, -0.02082347869873047, -0.020330429077148438, -0.019837379455566406, -0.019344329833984375, -0.018851280212402344, -0.018358230590820312, -0.01786518096923828, -0.01737213134765625, -0.01687908172607422, -0.016386032104492188, -0.015892982482910156, -0.015399932861328125, -0.014906883239746094, -0.014413833618164062, -0.013920783996582031, -0.013427734375, -0.012934684753417969, -0.012441635131835938, -0.011948585510253906, -0.011455535888671875, -0.010962486267089844, -0.010469436645507812, -0.009976387023925781, -0.00948333740234375, -0.008990287780761719, -0.008497238159179688, -0.008004188537597656, -0.007511138916015625, -0.007018089294433594, -0.0065250396728515625, -0.006031990051269531, -0.0055389404296875, -0.005045890808105469, -0.0045528411865234375, -0.004059791564941406, -0.003566741943359375, -0.0030736923217773438, -0.0025806427001953125, -0.0020875930786132812, -0.00159454345703125, -0.0011014938354492188, -0.0006084442138671875, -0.00011539459228515625, 0.000377655029296875, 0.0008707046508789062, 0.0013637542724609375, 0.0018568038940429688, 0.002349853515625, 0.0028429031372070312, 0.0033359527587890625, 0.0038290023803710938, 0.004322052001953125, 0.004815101623535156, 0.0053081512451171875, 0.005801200866699219, 0.00629425048828125, 0.006787300109863281, 0.0072803497314453125, 0.007773399353027344, 0.008266448974609375, 0.008759498596191406, 0.009252548217773438, 0.009745597839355469, 0.0102386474609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 8.0, 25.0, 37.0, 90.0, 122.0, 121.0, 179.0, 156.0, 107.0, 66.0, 42.0, 27.0, 16.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.09566879272461e-05, -8.674152195453644e-05, -8.252635598182678e-05, -7.831119000911713e-05, -7.409602403640747e-05, -6.988085806369781e-05, -6.566569209098816e-05, -6.14505261182785e-05, -5.723536014556885e-05, -5.302019417285919e-05, -4.8805028200149536e-05, -4.458986222743988e-05, -4.0374696254730225e-05, -3.615953028202057e-05, -3.194436430931091e-05, -2.7729198336601257e-05, -2.35140323638916e-05, -1.9298866391181946e-05, -1.508370041847229e-05, -1.0868534445762634e-05, -6.6533684730529785e-06, -2.4382025003433228e-06, 1.776963472366333e-06, 5.992129445075989e-06, 1.0207295417785645e-05, 1.44224613904953e-05, 1.8637627363204956e-05, 2.2852793335914612e-05, 2.7067959308624268e-05, 3.128312528133392e-05, 3.549829125404358e-05, 3.9713457226753235e-05, 4.392862319946289e-05, 4.8143789172172546e-05, 5.23589551448822e-05, 5.657412111759186e-05, 6.0789287090301514e-05, 6.500445306301117e-05, 6.921961903572083e-05, 7.343478500843048e-05, 7.764995098114014e-05, 8.186511695384979e-05, 8.608028292655945e-05, 9.02954488992691e-05, 9.451061487197876e-05, 9.872578084468842e-05, 0.00010294094681739807, 0.00010715611279010773, 0.00011137127876281738, 0.00011558644473552704, 0.0001198016107082367, 0.00012401677668094635, 0.000128231942653656, 0.00013244710862636566, 0.00013666227459907532, 0.00014087744057178497, 0.00014509260654449463, 0.00014930777251720428, 0.00015352293848991394, 0.0001577381044626236, 0.00016195327043533325, 0.0001661684364080429, 0.00017038360238075256, 0.00017459876835346222, 0.00017881393432617188]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 5.0, 5.0, 6.0, 10.0, 26.0, 40.0, 37.0, 64.0, 148.0, 232.0, 392.0, 816.0, 1824.0, 5059.0, 18182.0, 94837.0, 435400.0, 390626.0, 77710.0, 15380.0, 4506.0, 1593.0, 711.0, 403.0, 209.0, 132.0, 71.0, 45.0, 24.0, 16.0, 16.0, 9.0, 6.0, 2.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00962066650390625, -0.009309768676757812, -0.008998870849609375, -0.008687973022460938, -0.0083770751953125, -0.008066177368164062, -0.007755279541015625, -0.0074443817138671875, -0.00713348388671875, -0.0068225860595703125, -0.006511688232421875, -0.0062007904052734375, -0.005889892578125, -0.0055789947509765625, -0.005268096923828125, -0.0049571990966796875, -0.00464630126953125, -0.0043354034423828125, -0.004024505615234375, -0.0037136077880859375, -0.0034027099609375, -0.0030918121337890625, -0.002780914306640625, -0.0024700164794921875, -0.00215911865234375, -0.0018482208251953125, -0.001537322998046875, -0.0012264251708984375, -0.00091552734375, -0.0006046295166015625, -0.000293731689453125, 1.71661376953125e-05, 0.00032806396484375, 0.0006389617919921875, 0.000949859619140625, 0.0012607574462890625, 0.0015716552734375, 0.0018825531005859375, 0.002193450927734375, 0.0025043487548828125, 0.00281524658203125, 0.0031261444091796875, 0.003437042236328125, 0.0037479400634765625, 0.004058837890625, 0.0043697357177734375, 0.004680633544921875, 0.0049915313720703125, 0.00530242919921875, 0.0056133270263671875, 0.005924224853515625, 0.0062351226806640625, 0.0065460205078125, 0.0068569183349609375, 0.007167816162109375, 0.0074787139892578125, 0.00778961181640625, 0.008100509643554688, 0.008411407470703125, 0.008722305297851562, 0.009033203125, 0.009344100952148438, 0.009654998779296875, 0.009965896606445312, 0.01027679443359375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 7.0, 4.0, 8.0, 13.0, 18.0, 24.0, 21.0, 31.0, 40.0, 57.0, 63.0, 82.0, 71.0, 89.0, 104.0, 75.0, 70.0, 47.0, 49.0, 27.0, 26.0, 14.0, 11.0, 15.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00922393798828125, -0.00894784927368164, -0.008671760559082031, -0.008395671844482422, -0.008119583129882812, -0.007843494415283203, -0.007567405700683594, -0.007291316986083984, -0.007015228271484375, -0.006739139556884766, -0.006463050842285156, -0.006186962127685547, -0.0059108734130859375, -0.005634784698486328, -0.005358695983886719, -0.005082607269287109, -0.0048065185546875, -0.004530429840087891, -0.004254341125488281, -0.003978252410888672, -0.0037021636962890625, -0.003426074981689453, -0.0031499862670898438, -0.0028738975524902344, -0.002597808837890625, -0.0023217201232910156, -0.0020456314086914062, -0.0017695426940917969, -0.0014934539794921875, -0.0012173652648925781, -0.0009412765502929688, -0.0006651878356933594, -0.00038909912109375, -0.00011301040649414062, 0.00016307830810546875, 0.0004391670227050781, 0.0007152557373046875, 0.0009913444519042969, 0.0012674331665039062, 0.0015435218811035156, 0.001819610595703125, 0.0020956993103027344, 0.0023717880249023438, 0.002647876739501953, 0.0029239654541015625, 0.003200054168701172, 0.0034761428833007812, 0.0037522315979003906, 0.0040283203125, 0.004304409027099609, 0.004580497741699219, 0.004856586456298828, 0.0051326751708984375, 0.005408763885498047, 0.005684852600097656, 0.005960941314697266, 0.006237030029296875, 0.006513118743896484, 0.006789207458496094, 0.007065296173095703, 0.0073413848876953125, 0.007617473602294922, 0.007893562316894531, 0.00816965103149414, 0.00844573974609375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 7.0, 13.0, 10.0, 25.0, 47.0, 71.0, 135.0, 167.0, 181.0, 152.0, 91.0, 46.0, 25.0, 11.0, 12.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17151640355587006, -0.16563548147678375, -0.15975457429885864, -0.15387365221977234, -0.14799273014068604, -0.14211180806159973, -0.13623088598251343, -0.13034997880458832, -0.12446905672550201, -0.11858813464641571, -0.11270722001791, -0.1068263053894043, -0.100945383310318, -0.09506446123123169, -0.08918354660272598, -0.08330263197422028, -0.07742170989513397, -0.07154078781604767, -0.06565987318754196, -0.059778954833745956, -0.05389803647994995, -0.048017118126153946, -0.04213619977235794, -0.036255281418561935, -0.03037436306476593, -0.024493444710969925, -0.01861252635717392, -0.012731608003377914, -0.006850689649581909, -0.0009697712957859039, 0.004911147058010101, 0.010792065411806107, 0.016672998666763306, 0.02255391702055931, 0.028434835374355316, 0.03431575372815132, 0.04019667208194733, 0.04607759043574333, 0.05195850878953934, 0.05783942714333534, 0.06372034549713135, 0.06960126757621765, 0.07548218220472336, 0.08136309683322906, 0.08724401891231537, 0.09312494099140167, 0.09900585561990738, 0.10488677024841309, 0.11076769232749939, 0.1166486144065857, 0.1225295290350914, 0.1284104436635971, 0.1342913657426834, 0.14017228782176971, 0.14605319499969482, 0.15193411707878113, 0.15781503915786743, 0.16369596123695374, 0.16957688331604004, 0.17545779049396515, 0.18133871257305145, 0.18721963465213776, 0.19310054183006287, 0.19898146390914917, 0.20486238598823547]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 9.0, 5.0, 9.0, 12.0, 16.0, 26.0, 21.0, 32.0, 34.0, 41.0, 32.0, 34.0, 44.0, 40.0, 41.0, 48.0, 70.0, 50.0, 44.0, 56.0, 41.0, 41.0, 30.0, 36.0, 34.0, 29.0, 20.0, 20.0, 13.0, 7.0, 15.0, 11.0, 10.0, 5.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1271079182624817, -0.12351687997579575, -0.1199258416891098, -0.11633481085300446, -0.11274377256631851, -0.10915273427963257, -0.10556170344352722, -0.10197066515684128, -0.09837962687015533, -0.09478858858346939, -0.09119755029678345, -0.0876065194606781, -0.08401548117399216, -0.08042444288730621, -0.07683341205120087, -0.07324237376451492, -0.06965133547782898, -0.06606029719114304, -0.06246926262974739, -0.058878228068351746, -0.0552871897816658, -0.05169615149497986, -0.04810511693358421, -0.04451408237218857, -0.040923044085502625, -0.03733200579881668, -0.033740971237421036, -0.03014993481338024, -0.026558898389339447, -0.022967861965298653, -0.01937682554125786, -0.015785789117217064, -0.01219475269317627, -0.008603716269135475, -0.005012679845094681, -0.0014216434210538864, 0.002169393002986908, 0.005760429427027702, 0.009351465851068497, 0.012942502275109291, 0.016533538699150085, 0.02012457512319088, 0.023715611547231674, 0.02730664797127247, 0.030897684395313263, 0.03448872268199921, 0.03807975724339485, 0.0416707918047905, 0.04526183009147644, 0.048852868378162384, 0.05244390293955803, 0.056034937500953674, 0.05962597578763962, 0.06321701407432556, 0.06680804491043091, 0.07039908319711685, 0.0739901214838028, 0.07758115977048874, 0.08117219805717468, 0.08476322889328003, 0.08835426717996597, 0.09194530546665192, 0.09553633630275726, 0.0991273745894432, 0.10271841287612915]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 9.0, 21.0, 46.0, 129.0, 392.0, 1756.0, 18710.0, 4050333.0, 118152.0, 3811.0, 633.0, 195.0, 68.0, 22.0, 9.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033111572265625, -0.030286312103271484, -0.02746105194091797, -0.024635791778564453, -0.021810531616210938, -0.018985271453857422, -0.016160011291503906, -0.01333475112915039, -0.010509490966796875, -0.007684230804443359, -0.004858970642089844, -0.002033710479736328, 0.0007915496826171875, 0.003616809844970703, 0.006442070007324219, 0.009267330169677734, 0.01209259033203125, 0.014917850494384766, 0.01774311065673828, 0.020568370819091797, 0.023393630981445312, 0.026218891143798828, 0.029044151306152344, 0.03186941146850586, 0.034694671630859375, 0.03751993179321289, 0.040345191955566406, 0.04317045211791992, 0.04599571228027344, 0.04882097244262695, 0.05164623260498047, 0.054471492767333984, 0.0572967529296875, 0.060122013092041016, 0.06294727325439453, 0.06577253341674805, 0.06859779357910156, 0.07142305374145508, 0.0742483139038086, 0.07707357406616211, 0.07989883422851562, 0.08272409439086914, 0.08554935455322266, 0.08837461471557617, 0.09119987487792969, 0.0940251350402832, 0.09685039520263672, 0.09967565536499023, 0.10250091552734375, 0.10532617568969727, 0.10815143585205078, 0.1109766960144043, 0.11380195617675781, 0.11662721633911133, 0.11945247650146484, 0.12227773666381836, 0.12510299682617188, 0.1279282569885254, 0.1307535171508789, 0.13357877731323242, 0.13640403747558594, 0.13922929763793945, 0.14205455780029297, 0.14487981796264648, 0.147705078125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 5.0, 20.0, 23.0, 35.0, 37.0, 36.0, 62.0, 90.0, 72.0, 77.0, 74.0, 75.0, 78.0, 68.0, 65.0, 58.0, 35.0, 32.0, 15.0, 11.0, 7.0, 5.0, 8.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0101165771484375, -0.009822249412536621, -0.009527921676635742, -0.009233593940734863, -0.008939266204833984, -0.008644938468933105, -0.008350610733032227, -0.008056282997131348, -0.007761955261230469, -0.00746762752532959, -0.007173299789428711, -0.006878972053527832, -0.006584644317626953, -0.006290316581726074, -0.005995988845825195, -0.005701661109924316, -0.0054073333740234375, -0.005113005638122559, -0.00481867790222168, -0.004524350166320801, -0.004230022430419922, -0.003935694694519043, -0.003641366958618164, -0.003347039222717285, -0.0030527114868164062, -0.0027583837509155273, -0.0024640560150146484, -0.0021697282791137695, -0.0018754005432128906, -0.0015810728073120117, -0.0012867450714111328, -0.000992417335510254, -0.000698089599609375, -0.0004037618637084961, -0.00010943412780761719, 0.00018489360809326172, 0.0004792213439941406, 0.0007735490798950195, 0.0010678768157958984, 0.0013622045516967773, 0.0016565322875976562, 0.0019508600234985352, 0.002245187759399414, 0.002539515495300293, 0.002833843231201172, 0.0031281709671020508, 0.0034224987030029297, 0.0037168264389038086, 0.0040111541748046875, 0.004305481910705566, 0.004599809646606445, 0.004894137382507324, 0.005188465118408203, 0.005482792854309082, 0.005777120590209961, 0.00607144832611084, 0.006365776062011719, 0.006660103797912598, 0.0069544315338134766, 0.0072487592697143555, 0.007543087005615234, 0.007837414741516113, 0.008131742477416992, 0.008426070213317871, 0.00872039794921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 10.0, 9.0, 19.0, 14.0, 20.0, 36.0, 53.0, 69.0, 104.0, 155.0, 260.0, 478.0, 968.0, 2444.0, 7560.0, 33018.0, 339032.0, 3566965.0, 207091.0, 25252.0, 6310.0, 2194.0, 871.0, 469.0, 260.0, 176.0, 128.0, 96.0, 56.0, 32.0, 36.0, 23.0, 10.0, 11.0, 14.0, 17.0, 4.0, 5.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.02435302734375, -0.023496150970458984, -0.02263927459716797, -0.021782398223876953, -0.020925521850585938, -0.020068645477294922, -0.019211769104003906, -0.01835489273071289, -0.017498016357421875, -0.01664113998413086, -0.015784263610839844, -0.014927387237548828, -0.014070510864257812, -0.013213634490966797, -0.012356758117675781, -0.011499881744384766, -0.01064300537109375, -0.009786128997802734, -0.008929252624511719, -0.008072376251220703, -0.0072154998779296875, -0.006358623504638672, -0.005501747131347656, -0.004644870758056641, -0.003787994384765625, -0.0029311180114746094, -0.0020742416381835938, -0.0012173652648925781, -0.0003604888916015625, 0.0004963874816894531, 0.0013532638549804688, 0.0022101402282714844, 0.0030670166015625, 0.003923892974853516, 0.004780769348144531, 0.005637645721435547, 0.0064945220947265625, 0.007351398468017578, 0.008208274841308594, 0.00906515121459961, 0.009922027587890625, 0.01077890396118164, 0.011635780334472656, 0.012492656707763672, 0.013349533081054688, 0.014206409454345703, 0.015063285827636719, 0.015920162200927734, 0.01677703857421875, 0.017633914947509766, 0.01849079132080078, 0.019347667694091797, 0.020204544067382812, 0.021061420440673828, 0.021918296813964844, 0.02277517318725586, 0.023632049560546875, 0.02448892593383789, 0.025345802307128906, 0.026202678680419922, 0.027059555053710938, 0.027916431427001953, 0.02877330780029297, 0.029630184173583984, 0.030487060546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 9.0, 13.0, 28.0, 27.0, 47.0, 59.0, 156.0, 317.0, 766.0, 1451.0, 634.0, 257.0, 119.0, 72.0, 40.0, 29.0, 18.0, 8.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00760650634765625, -0.007213711738586426, -0.0068209171295166016, -0.006428122520446777, -0.006035327911376953, -0.005642533302307129, -0.005249738693237305, -0.0048569440841674805, -0.004464149475097656, -0.004071354866027832, -0.003678560256958008, -0.0032857656478881836, -0.0028929710388183594, -0.002500176429748535, -0.002107381820678711, -0.0017145872116088867, -0.0013217926025390625, -0.0009289979934692383, -0.0005362033843994141, -0.00014340877532958984, 0.0002493858337402344, 0.0006421804428100586, 0.0010349750518798828, 0.001427769660949707, 0.0018205642700195312, 0.0022133588790893555, 0.0026061534881591797, 0.002998948097229004, 0.003391742706298828, 0.0037845373153686523, 0.0041773319244384766, 0.004570126533508301, 0.004962921142578125, 0.005355715751647949, 0.0057485103607177734, 0.006141304969787598, 0.006534099578857422, 0.006926894187927246, 0.00731968879699707, 0.0077124834060668945, 0.008105278015136719, 0.008498072624206543, 0.008890867233276367, 0.009283661842346191, 0.009676456451416016, 0.01006925106048584, 0.010462045669555664, 0.010854840278625488, 0.011247634887695312, 0.011640429496765137, 0.012033224105834961, 0.012426018714904785, 0.01281881332397461, 0.013211607933044434, 0.013604402542114258, 0.013997197151184082, 0.014389991760253906, 0.01478278636932373, 0.015175580978393555, 0.015568375587463379, 0.015961170196533203, 0.016353964805603027, 0.01674675941467285, 0.017139554023742676, 0.0175323486328125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 9.0, 100.0, 415.0, 371.0, 90.0, 13.0, 10.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.34768426418304443, -0.34057748317718506, -0.3334707021713257, -0.3263639509677887, -0.3192571699619293, -0.31215038895606995, -0.30504360795021057, -0.2979368567466736, -0.2908300757408142, -0.28372329473495483, -0.27661651372909546, -0.26950976252555847, -0.2624029815196991, -0.2552962005138397, -0.24818943440914154, -0.24108265340328217, -0.23397588729858398, -0.2268691062927246, -0.21976234018802643, -0.21265555918216705, -0.20554879307746887, -0.1984420120716095, -0.19133524596691132, -0.18422846496105194, -0.17712168395519257, -0.1700149029493332, -0.162908136844635, -0.15580135583877563, -0.14869458973407745, -0.14158780872821808, -0.1344810426235199, -0.12737426161766052, -0.12026749551296234, -0.11316072195768356, -0.10605394840240479, -0.09894717484712601, -0.09184040129184723, -0.08473362028598785, -0.07762685418128967, -0.0705200731754303, -0.06341330707073212, -0.05630653351545334, -0.04919975996017456, -0.04209298640489578, -0.034986212849617004, -0.027879435569047928, -0.02077266201376915, -0.013665888458490372, -0.006559111177921295, 0.0005476628430187702, 0.007654436863958836, 0.014761211350560188, 0.021867984905838966, 0.028974760323762894, 0.03608153387904167, 0.04318830743432045, 0.05029508098959923, 0.057401854544878006, 0.06450863182544708, 0.07161540538072586, 0.07872217893600464, 0.08582895249128342, 0.0929357260465622, 0.10004249960184097, 0.10714927315711975]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 3.0, 14.0, 10.0, 14.0, 17.0, 30.0, 35.0, 47.0, 56.0, 47.0, 61.0, 51.0, 74.0, 76.0, 69.0, 50.0, 63.0, 46.0, 50.0, 40.0, 27.0, 37.0, 22.0, 16.0, 11.0, 16.0, 10.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03694802522659302, -0.03555016219615936, -0.03415229916572571, -0.03275443613529205, -0.0313565731048584, -0.029958710074424744, -0.02856084704399109, -0.027162984013557434, -0.02576512098312378, -0.024367257952690125, -0.02296939492225647, -0.021571531891822815, -0.02017366886138916, -0.018775805830955505, -0.01737794280052185, -0.015980079770088196, -0.014582216739654541, -0.013184353709220886, -0.011786490678787231, -0.010388627648353577, -0.008990764617919922, -0.007592901587486267, -0.006195038557052612, -0.0047971755266189575, -0.0033993124961853027, -0.002001449465751648, -0.0006035864353179932, 0.0007942765951156616, 0.0021921396255493164, 0.003590002655982971, 0.004987865686416626, 0.006385728716850281, 0.0077835917472839355, 0.00918145477771759, 0.010579317808151245, 0.0119771808385849, 0.013375043869018555, 0.01477290689945221, 0.016170769929885864, 0.01756863296031952, 0.018966495990753174, 0.02036435902118683, 0.021762222051620483, 0.023160085082054138, 0.024557948112487793, 0.025955811142921448, 0.027353674173355103, 0.028751537203788757, 0.030149400234222412, 0.03154726326465607, 0.03294512629508972, 0.034342989325523376, 0.03574085235595703, 0.037138715386390686, 0.03853657841682434, 0.039934441447257996, 0.04133230447769165, 0.042730167508125305, 0.04412803053855896, 0.045525893568992615, 0.04692375659942627, 0.048321619629859924, 0.04971948266029358, 0.051117345690727234, 0.05251520872116089]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 10.0, 5.0, 9.0, 10.0, 20.0, 22.0, 31.0, 32.0, 48.0, 75.0, 116.0, 151.0, 250.0, 392.0, 731.0, 1314.0, 2555.0, 5505.0, 13615.0, 45158.0, 284295.0, 573536.0, 84667.0, 20831.0, 7721.0, 3436.0, 1637.0, 914.0, 529.0, 298.0, 178.0, 136.0, 66.0, 78.0, 43.0, 35.0, 29.0, 13.0, 13.0, 15.0, 11.0, 4.0, 7.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.048919677734375, -0.047489166259765625, -0.04605865478515625, -0.044628143310546875, -0.0431976318359375, -0.041767120361328125, -0.04033660888671875, -0.038906097412109375, -0.0374755859375, -0.036045074462890625, -0.03461456298828125, -0.033184051513671875, -0.0317535400390625, -0.030323028564453125, -0.02889251708984375, -0.027462005615234375, -0.026031494140625, -0.024600982666015625, -0.02317047119140625, -0.021739959716796875, -0.0203094482421875, -0.018878936767578125, -0.01744842529296875, -0.016017913818359375, -0.01458740234375, -0.013156890869140625, -0.01172637939453125, -0.010295867919921875, -0.0088653564453125, -0.007434844970703125, -0.00600433349609375, -0.004573822021484375, -0.003143310546875, -0.001712799072265625, -0.00028228759765625, 0.001148223876953125, 0.0025787353515625, 0.004009246826171875, 0.00543975830078125, 0.006870269775390625, 0.00830078125, 0.009731292724609375, 0.01116180419921875, 0.012592315673828125, 0.0140228271484375, 0.015453338623046875, 0.01688385009765625, 0.018314361572265625, 0.019744873046875, 0.021175384521484375, 0.02260589599609375, 0.024036407470703125, 0.0254669189453125, 0.026897430419921875, 0.02832794189453125, 0.029758453369140625, 0.03118896484375, 0.032619476318359375, 0.03404998779296875, 0.035480499267578125, 0.0369110107421875, 0.038341522216796875, 0.03977203369140625, 0.041202545166015625, 0.042633056640625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 0.0, 6.0, 6.0, 7.0, 15.0, 19.0, 32.0, 29.0, 40.0, 58.0, 62.0, 70.0, 78.0, 83.0, 60.0, 60.0, 55.0, 68.0, 63.0, 54.0, 47.0, 24.0, 19.0, 14.0, 7.0, 6.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00827789306640625, -0.008011341094970703, -0.007744789123535156, -0.007478237152099609, -0.0072116851806640625, -0.006945133209228516, -0.006678581237792969, -0.006412029266357422, -0.006145477294921875, -0.005878925323486328, -0.005612373352050781, -0.005345821380615234, -0.0050792694091796875, -0.004812717437744141, -0.004546165466308594, -0.004279613494873047, -0.0040130615234375, -0.003746509552001953, -0.0034799575805664062, -0.0032134056091308594, -0.0029468536376953125, -0.0026803016662597656, -0.0024137496948242188, -0.002147197723388672, -0.001880645751953125, -0.0016140937805175781, -0.0013475418090820312, -0.0010809898376464844, -0.0008144378662109375, -0.0005478858947753906, -0.00028133392333984375, -1.4781951904296875e-05, 0.00025177001953125, 0.0005183219909667969, 0.0007848739624023438, 0.0010514259338378906, 0.0013179779052734375, 0.0015845298767089844, 0.0018510818481445312, 0.002117633819580078, 0.002384185791015625, 0.002650737762451172, 0.0029172897338867188, 0.0031838417053222656, 0.0034503936767578125, 0.0037169456481933594, 0.003983497619628906, 0.004250049591064453, 0.0045166015625, 0.004783153533935547, 0.005049705505371094, 0.005316257476806641, 0.0055828094482421875, 0.005849361419677734, 0.006115913391113281, 0.006382465362548828, 0.006649017333984375, 0.006915569305419922, 0.007182121276855469, 0.007448673248291016, 0.0077152252197265625, 0.00798177719116211, 0.008248329162597656, 0.008514881134033203, 0.00878143310546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 3.0, 8.0, 11.0, 16.0, 18.0, 29.0, 33.0, 43.0, 80.0, 96.0, 150.0, 248.0, 356.0, 572.0, 1015.0, 1757.0, 3078.0, 5950.0, 12223.0, 28059.0, 76167.0, 250063.0, 422668.0, 155181.0, 50828.0, 20264.0, 9105.0, 4534.0, 2417.0, 1367.0, 772.0, 495.0, 313.0, 208.0, 122.0, 82.0, 71.0, 44.0, 32.0, 15.0, 18.0, 16.0, 8.0, 5.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0], "bins": [-0.020111083984375, -0.019524812698364258, -0.018938541412353516, -0.018352270126342773, -0.01776599884033203, -0.01717972755432129, -0.016593456268310547, -0.016007184982299805, -0.015420913696289062, -0.01483464241027832, -0.014248371124267578, -0.013662099838256836, -0.013075828552246094, -0.012489557266235352, -0.01190328598022461, -0.011317014694213867, -0.010730743408203125, -0.010144472122192383, -0.00955820083618164, -0.008971929550170898, -0.008385658264160156, -0.007799386978149414, -0.007213115692138672, -0.00662684440612793, -0.0060405731201171875, -0.005454301834106445, -0.004868030548095703, -0.004281759262084961, -0.0036954879760742188, -0.0031092166900634766, -0.0025229454040527344, -0.0019366741180419922, -0.00135040283203125, -0.0007641315460205078, -0.00017786026000976562, 0.00040841102600097656, 0.0009946823120117188, 0.001580953598022461, 0.002167224884033203, 0.0027534961700439453, 0.0033397674560546875, 0.00392603874206543, 0.004512310028076172, 0.005098581314086914, 0.005684852600097656, 0.0062711238861083984, 0.006857395172119141, 0.007443666458129883, 0.008029937744140625, 0.008616209030151367, 0.00920248031616211, 0.009788751602172852, 0.010375022888183594, 0.010961294174194336, 0.011547565460205078, 0.01213383674621582, 0.012720108032226562, 0.013306379318237305, 0.013892650604248047, 0.014478921890258789, 0.015065193176269531, 0.015651464462280273, 0.016237735748291016, 0.016824007034301758, 0.0174102783203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 8.0, 10.0, 6.0, 9.0, 17.0, 20.0, 25.0, 34.0, 37.0, 51.0, 36.0, 41.0, 36.0, 46.0, 48.0, 64.0, 46.0, 43.0, 52.0, 44.0, 47.0, 45.0, 35.0, 25.0, 32.0, 27.0, 25.0, 18.0, 10.0, 11.0, 6.0, 11.0, 8.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02093505859375, -0.020252227783203125, -0.01956939697265625, -0.018886566162109375, -0.0182037353515625, -0.017520904541015625, -0.01683807373046875, -0.016155242919921875, -0.015472412109375, -0.014789581298828125, -0.01410675048828125, -0.013423919677734375, -0.0127410888671875, -0.012058258056640625, -0.01137542724609375, -0.010692596435546875, -0.010009765625, -0.009326934814453125, -0.00864410400390625, -0.007961273193359375, -0.0072784423828125, -0.006595611572265625, -0.00591278076171875, -0.005229949951171875, -0.004547119140625, -0.003864288330078125, -0.00318145751953125, -0.002498626708984375, -0.0018157958984375, -0.001132965087890625, -0.00045013427734375, 0.000232696533203125, 0.00091552734375, 0.001598358154296875, 0.00228118896484375, 0.002964019775390625, 0.0036468505859375, 0.004329681396484375, 0.00501251220703125, 0.005695343017578125, 0.006378173828125, 0.007061004638671875, 0.00774383544921875, 0.008426666259765625, 0.0091094970703125, 0.009792327880859375, 0.01047515869140625, 0.011157989501953125, 0.0118408203125, 0.012523651123046875, 0.01320648193359375, 0.013889312744140625, 0.0145721435546875, 0.015254974365234375, 0.01593780517578125, 0.016620635986328125, 0.017303466796875, 0.017986297607421875, 0.01866912841796875, 0.019351959228515625, 0.0200347900390625, 0.020717620849609375, 0.02140045166015625, 0.022083282470703125, 0.02276611328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 13.0, 9.0, 13.0, 11.0, 22.0, 21.0, 19.0, 32.0, 41.0, 55.0, 87.0, 124.0, 188.0, 419.0, 931.0, 3531.0, 52239.0, 951563.0, 34519.0, 2928.0, 799.0, 368.0, 191.0, 130.0, 72.0, 56.0, 40.0, 26.0, 30.0, 17.0, 11.0, 12.0, 7.0, 3.0, 12.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.033111572265625, -0.03217744827270508, -0.031243324279785156, -0.030309200286865234, -0.029375076293945312, -0.02844095230102539, -0.02750682830810547, -0.026572704315185547, -0.025638580322265625, -0.024704456329345703, -0.02377033233642578, -0.02283620834350586, -0.021902084350585938, -0.020967960357666016, -0.020033836364746094, -0.019099712371826172, -0.01816558837890625, -0.017231464385986328, -0.016297340393066406, -0.015363216400146484, -0.014429092407226562, -0.01349496841430664, -0.012560844421386719, -0.011626720428466797, -0.010692596435546875, -0.009758472442626953, -0.008824348449707031, -0.00789022445678711, -0.0069561004638671875, -0.006021976470947266, -0.005087852478027344, -0.004153728485107422, -0.0032196044921875, -0.002285480499267578, -0.0013513565063476562, -0.0004172325134277344, 0.0005168914794921875, 0.0014510154724121094, 0.0023851394653320312, 0.003319263458251953, 0.004253387451171875, 0.005187511444091797, 0.006121635437011719, 0.007055759429931641, 0.007989883422851562, 0.008924007415771484, 0.009858131408691406, 0.010792255401611328, 0.01172637939453125, 0.012660503387451172, 0.013594627380371094, 0.014528751373291016, 0.015462875366210938, 0.01639699935913086, 0.01733112335205078, 0.018265247344970703, 0.019199371337890625, 0.020133495330810547, 0.02106761932373047, 0.02200174331665039, 0.022935867309570312, 0.023869991302490234, 0.024804115295410156, 0.025738239288330078, 0.02667236328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 14.0, 37.0, 98.0, 327.0, 358.0, 121.0, 33.0, 11.0, 10.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002512931823730469, -0.00023876875638961792, -0.00022624433040618896, -0.00021371990442276, -0.00020119547843933105, -0.0001886710524559021, -0.00017614662647247314, -0.0001636222004890442, -0.00015109777450561523, -0.00013857334852218628, -0.00012604892253875732, -0.00011352449655532837, -0.00010100007057189941, -8.847564458847046e-05, -7.59512186050415e-05, -6.342679262161255e-05, -5.0902366638183594e-05, -3.837794065475464e-05, -2.5853514671325684e-05, -1.3329088687896729e-05, -8.046627044677734e-07, 1.1719763278961182e-05, 2.4244189262390137e-05, 3.676861524581909e-05, 4.929304122924805e-05, 6.1817467212677e-05, 7.434189319610596e-05, 8.686631917953491e-05, 9.939074516296387e-05, 0.00011191517114639282, 0.00012443959712982178, 0.00013696402311325073, 0.0001494884490966797, 0.00016201287508010864, 0.0001745373010635376, 0.00018706172704696655, 0.0001995861530303955, 0.00021211057901382446, 0.00022463500499725342, 0.00023715943098068237, 0.00024968385696411133, 0.0002622082829475403, 0.00027473270893096924, 0.0002872571349143982, 0.00029978156089782715, 0.0003123059868812561, 0.00032483041286468506, 0.000337354838848114, 0.00034987926483154297, 0.0003624036908149719, 0.0003749281167984009, 0.00038745254278182983, 0.0003999769687652588, 0.00041250139474868774, 0.0004250258207321167, 0.00043755024671554565, 0.0004500746726989746, 0.00046259909868240356, 0.0004751235246658325, 0.0004876479506492615, 0.0005001723766326904, 0.0005126968026161194, 0.0005252212285995483, 0.0005377456545829773, 0.0005502700805664062]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 5.0, 1.0, 11.0, 15.0, 42.0, 69.0, 140.0, 323.0, 854.0, 3520.0, 52898.0, 946788.0, 39454.0, 3140.0, 760.0, 260.0, 123.0, 53.0, 36.0, 24.0, 16.0, 7.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033477783203125, -0.03262948989868164, -0.03178119659423828, -0.030932903289794922, -0.030084609985351562, -0.029236316680908203, -0.028388023376464844, -0.027539730072021484, -0.026691436767578125, -0.025843143463134766, -0.024994850158691406, -0.024146556854248047, -0.023298263549804688, -0.022449970245361328, -0.02160167694091797, -0.02075338363647461, -0.01990509033203125, -0.01905679702758789, -0.01820850372314453, -0.017360210418701172, -0.016511917114257812, -0.015663623809814453, -0.014815330505371094, -0.013967037200927734, -0.013118743896484375, -0.012270450592041016, -0.011422157287597656, -0.010573863983154297, -0.009725570678710938, -0.008877277374267578, -0.008028984069824219, -0.007180690765380859, -0.0063323974609375, -0.005484104156494141, -0.004635810852050781, -0.003787517547607422, -0.0029392242431640625, -0.002090930938720703, -0.0012426376342773438, -0.0003943443298339844, 0.000453948974609375, 0.0013022422790527344, 0.0021505355834960938, 0.002998828887939453, 0.0038471221923828125, 0.004695415496826172, 0.005543708801269531, 0.006392002105712891, 0.00724029541015625, 0.00808858871459961, 0.008936882019042969, 0.009785175323486328, 0.010633468627929688, 0.011481761932373047, 0.012330055236816406, 0.013178348541259766, 0.014026641845703125, 0.014874935150146484, 0.015723228454589844, 0.016571521759033203, 0.017419815063476562, 0.018268108367919922, 0.01911640167236328, 0.01996469497680664, 0.02081298828125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 7.0, 8.0, 16.0, 24.0, 42.0, 79.0, 123.0, 168.0, 181.0, 149.0, 90.0, 51.0, 26.0, 12.0, 9.0, 5.0, 4.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.032867431640625, -0.03218567371368408, -0.031503915786743164, -0.030822157859802246, -0.030140399932861328, -0.02945864200592041, -0.028776884078979492, -0.028095126152038574, -0.027413368225097656, -0.02673161029815674, -0.02604985237121582, -0.025368094444274902, -0.024686336517333984, -0.024004578590393066, -0.02332282066345215, -0.02264106273651123, -0.021959304809570312, -0.021277546882629395, -0.020595788955688477, -0.01991403102874756, -0.01923227310180664, -0.018550515174865723, -0.017868757247924805, -0.017186999320983887, -0.01650524139404297, -0.01582348346710205, -0.015141725540161133, -0.014459967613220215, -0.013778209686279297, -0.013096451759338379, -0.012414693832397461, -0.011732935905456543, -0.011051177978515625, -0.010369420051574707, -0.009687662124633789, -0.009005904197692871, -0.008324146270751953, -0.007642388343811035, -0.006960630416870117, -0.006278872489929199, -0.005597114562988281, -0.004915356636047363, -0.004233598709106445, -0.0035518407821655273, -0.0028700828552246094, -0.0021883249282836914, -0.0015065670013427734, -0.0008248090744018555, -0.0001430511474609375, 0.0005387067794799805, 0.0012204647064208984, 0.0019022226333618164, 0.0025839805603027344, 0.0032657384872436523, 0.00394749641418457, 0.004629254341125488, 0.005311012268066406, 0.005992770195007324, 0.006674528121948242, 0.00735628604888916, 0.008038043975830078, 0.008719801902770996, 0.009401559829711914, 0.010083317756652832, 0.01076507568359375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 30.0, 63.0, 222.0, 385.0, 194.0, 81.0, 17.0, 10.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24824097752571106, -0.23308803141117096, -0.21793508529663086, -0.20278215408325195, -0.18762919306755066, -0.17247626185417175, -0.15732331573963165, -0.14217036962509155, -0.12701742351055145, -0.11186447739601135, -0.09671153128147125, -0.08155859261751175, -0.06640564650297165, -0.05125270038843155, -0.036099761724472046, -0.020946815609931946, -0.005793869495391846, 0.009359074756503105, 0.024512019008398056, 0.03966496139764786, 0.05481790751218796, 0.06997085362672806, 0.08512379229068756, 0.10027673840522766, 0.11542968451976776, 0.13058263063430786, 0.14573557674884796, 0.16088852286338806, 0.17604145407676697, 0.19119441509246826, 0.20634734630584717, 0.22150029242038727, 0.23665326833724976, 0.25180619955062866, 0.26695916056632996, 0.28211209177970886, 0.29726505279541016, 0.31241798400878906, 0.32757091522216797, 0.34272387623786926, 0.35787683725357056, 0.37302976846694946, 0.38818272948265076, 0.40333566069602966, 0.41848862171173096, 0.43364155292510986, 0.44879448413848877, 0.46394744515419006, 0.47910037636756897, 0.4942533075809479, 0.5094062685966492, 0.5245591998100281, 0.539712131023407, 0.5548651218414307, 0.5700180530548096, 0.5851709842681885, 0.6003239154815674, 0.6154768466949463, 0.6306297779083252, 0.6457827687263489, 0.6609356999397278, 0.6760886311531067, 0.6912415623664856, 0.7063945531845093, 0.7215474843978882]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 11.0, 5.0, 11.0, 9.0, 15.0, 15.0, 15.0, 13.0, 18.0, 20.0, 28.0, 26.0, 31.0, 31.0, 38.0, 33.0, 36.0, 35.0, 41.0, 52.0, 42.0, 38.0, 33.0, 41.0, 41.0, 41.0, 26.0, 28.0, 27.0, 26.0, 32.0, 23.0, 18.0, 14.0, 15.0, 16.0, 8.0, 8.0, 5.0, 7.0, 9.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08281546831130981, -0.0800701454281807, -0.07732482254505157, -0.07457949221134186, -0.07183416932821274, -0.06908884644508362, -0.0663435161113739, -0.06359819322824478, -0.06085287034511566, -0.05810754746198654, -0.05536222085356712, -0.052616894245147705, -0.049871571362018585, -0.047126248478889465, -0.04438092187047005, -0.04163559526205063, -0.03889027237892151, -0.03614494949579239, -0.03339962288737297, -0.0306542981415987, -0.027908973395824432, -0.025163648650050163, -0.022418323904275894, -0.019672999158501625, -0.016927674412727356, -0.014182349666953087, -0.011437024921178818, -0.008691700175404549, -0.0059463754296302795, -0.0032010506838560104, -0.00045572593808174133, 0.0022895988076925278, 0.005034923553466797, 0.007780248299241066, 0.010525573045015335, 0.013270897790789604, 0.016016222536563873, 0.018761547282338142, 0.02150687202811241, 0.02425219677388668, 0.02699752151966095, 0.02974284626543522, 0.03248817101120949, 0.035233497619628906, 0.037978820502758026, 0.040724143385887146, 0.043469469994306564, 0.04621479660272598, 0.0489601194858551, 0.05170544236898422, 0.05445076897740364, 0.05719609558582306, 0.05994141846895218, 0.0626867413520813, 0.06543207168579102, 0.06817739456892014, 0.07092271745204926, 0.07366804033517838, 0.0764133632183075, 0.07915869355201721, 0.08190401643514633, 0.08464933931827545, 0.08739466965198517, 0.09013999253511429, 0.09288531541824341]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 4.0, 12.0, 20.0, 18.0, 48.0, 57.0, 125.0, 169.0, 341.0, 732.0, 1769.0, 6132.0, 45814.0, 3948748.0, 174330.0, 11026.0, 2826.0, 1057.0, 449.0, 255.0, 143.0, 76.0, 52.0, 24.0, 11.0, 11.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05950927734375, -0.057793617248535156, -0.05607795715332031, -0.05436229705810547, -0.052646636962890625, -0.05093097686767578, -0.04921531677246094, -0.047499656677246094, -0.04578399658203125, -0.044068336486816406, -0.04235267639160156, -0.04063701629638672, -0.038921356201171875, -0.03720569610595703, -0.03549003601074219, -0.033774375915527344, -0.0320587158203125, -0.030343055725097656, -0.028627395629882812, -0.02691173553466797, -0.025196075439453125, -0.02348041534423828, -0.021764755249023438, -0.020049095153808594, -0.01833343505859375, -0.016617774963378906, -0.014902114868164062, -0.013186454772949219, -0.011470794677734375, -0.009755134582519531, -0.008039474487304688, -0.006323814392089844, -0.004608154296875, -0.0028924942016601562, -0.0011768341064453125, 0.0005388259887695312, 0.002254486083984375, 0.003970146179199219, 0.0056858062744140625, 0.007401466369628906, 0.00911712646484375, 0.010832786560058594, 0.012548446655273438, 0.014264106750488281, 0.015979766845703125, 0.01769542694091797, 0.019411087036132812, 0.021126747131347656, 0.0228424072265625, 0.024558067321777344, 0.026273727416992188, 0.02798938751220703, 0.029705047607421875, 0.03142070770263672, 0.03313636779785156, 0.034852027893066406, 0.03656768798828125, 0.038283348083496094, 0.03999900817871094, 0.04171466827392578, 0.043430328369140625, 0.04514598846435547, 0.04686164855957031, 0.048577308654785156, 0.05029296875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 5.0, 6.0, 6.0, 7.0, 12.0, 21.0, 22.0, 36.0, 50.0, 43.0, 60.0, 70.0, 78.0, 76.0, 74.0, 78.0, 65.0, 56.0, 59.0, 55.0, 35.0, 22.0, 19.0, 11.0, 8.0, 11.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.00853729248046875, -0.008262872695922852, -0.007988452911376953, -0.007714033126831055, -0.007439613342285156, -0.007165193557739258, -0.006890773773193359, -0.006616353988647461, -0.0063419342041015625, -0.006067514419555664, -0.005793094635009766, -0.005518674850463867, -0.005244255065917969, -0.00496983528137207, -0.004695415496826172, -0.0044209957122802734, -0.004146575927734375, -0.0038721561431884766, -0.003597736358642578, -0.0033233165740966797, -0.0030488967895507812, -0.002774477005004883, -0.0025000572204589844, -0.002225637435913086, -0.0019512176513671875, -0.001676797866821289, -0.0014023780822753906, -0.0011279582977294922, -0.0008535385131835938, -0.0005791187286376953, -0.0003046989440917969, -3.0279159545898438e-05, 0.000244140625, 0.0005185604095458984, 0.0007929801940917969, 0.0010673999786376953, 0.0013418197631835938, 0.0016162395477294922, 0.0018906593322753906, 0.002165079116821289, 0.0024394989013671875, 0.002713918685913086, 0.0029883384704589844, 0.003262758255004883, 0.0035371780395507812, 0.0038115978240966797, 0.004086017608642578, 0.0043604373931884766, 0.004634857177734375, 0.0049092769622802734, 0.005183696746826172, 0.00545811653137207, 0.005732536315917969, 0.006006956100463867, 0.006281375885009766, 0.006555795669555664, 0.0068302154541015625, 0.007104635238647461, 0.007379055023193359, 0.007653474807739258, 0.007927894592285156, 0.008202314376831055, 0.008476734161376953, 0.008751153945922852, 0.00902557373046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 11.0, 9.0, 27.0, 40.0, 89.0, 172.0, 296.0, 577.0, 1353.0, 3643.0, 16714.0, 389293.0, 3726253.0, 45508.0, 6388.0, 2041.0, 906.0, 436.0, 238.0, 123.0, 80.0, 47.0, 12.0, 13.0, 7.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0335693359375, -0.032183170318603516, -0.03079700469970703, -0.029410839080810547, -0.028024673461914062, -0.026638507843017578, -0.025252342224121094, -0.02386617660522461, -0.022480010986328125, -0.02109384536743164, -0.019707679748535156, -0.018321514129638672, -0.016935348510742188, -0.015549182891845703, -0.014163017272949219, -0.012776851654052734, -0.01139068603515625, -0.010004520416259766, -0.008618354797363281, -0.007232189178466797, -0.0058460235595703125, -0.004459857940673828, -0.0030736923217773438, -0.0016875267028808594, -0.000301361083984375, 0.0010848045349121094, 0.0024709701538085938, 0.003857135772705078, 0.0052433013916015625, 0.006629467010498047, 0.008015632629394531, 0.009401798248291016, 0.0107879638671875, 0.012174129486083984, 0.013560295104980469, 0.014946460723876953, 0.016332626342773438, 0.017718791961669922, 0.019104957580566406, 0.02049112319946289, 0.021877288818359375, 0.02326345443725586, 0.024649620056152344, 0.026035785675048828, 0.027421951293945312, 0.028808116912841797, 0.03019428253173828, 0.031580448150634766, 0.03296661376953125, 0.034352779388427734, 0.03573894500732422, 0.0371251106262207, 0.03851127624511719, 0.03989744186401367, 0.041283607482910156, 0.04266977310180664, 0.044055938720703125, 0.04544210433959961, 0.046828269958496094, 0.04821443557739258, 0.04960060119628906, 0.05098676681518555, 0.05237293243408203, 0.053759098052978516, 0.055145263671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 9.0, 15.0, 26.0, 87.0, 188.0, 804.0, 2233.0, 467.0, 143.0, 51.0, 19.0, 12.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0225067138671875, -0.021919727325439453, -0.021332740783691406, -0.02074575424194336, -0.020158767700195312, -0.019571781158447266, -0.01898479461669922, -0.018397808074951172, -0.017810821533203125, -0.017223834991455078, -0.01663684844970703, -0.016049861907958984, -0.015462875366210938, -0.01487588882446289, -0.014288902282714844, -0.013701915740966797, -0.01311492919921875, -0.012527942657470703, -0.011940956115722656, -0.01135396957397461, -0.010766983032226562, -0.010179996490478516, -0.009593009948730469, -0.009006023406982422, -0.008419036865234375, -0.007832050323486328, -0.007245063781738281, -0.006658077239990234, -0.0060710906982421875, -0.005484104156494141, -0.004897117614746094, -0.004310131072998047, -0.00372314453125, -0.003136157989501953, -0.0025491714477539062, -0.0019621849060058594, -0.0013751983642578125, -0.0007882118225097656, -0.00020122528076171875, 0.0003857612609863281, 0.000972747802734375, 0.0015597343444824219, 0.0021467208862304688, 0.0027337074279785156, 0.0033206939697265625, 0.003907680511474609, 0.004494667053222656, 0.005081653594970703, 0.00566864013671875, 0.006255626678466797, 0.006842613220214844, 0.007429599761962891, 0.008016586303710938, 0.008603572845458984, 0.009190559387207031, 0.009777545928955078, 0.010364532470703125, 0.010951519012451172, 0.011538505554199219, 0.012125492095947266, 0.012712478637695312, 0.01329946517944336, 0.013886451721191406, 0.014473438262939453, 0.0150604248046875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 13.0, 36.0, 59.0, 120.0, 195.0, 216.0, 180.0, 86.0, 48.0, 15.0, 14.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09401434659957886, -0.09120509773492813, -0.0883958488702774, -0.08558660745620728, -0.08277735859155655, -0.07996810972690582, -0.0771588608622551, -0.07434961199760437, -0.07154036313295364, -0.06873111426830292, -0.06592186540365219, -0.06311261653900146, -0.06030337139964104, -0.05749412626028061, -0.05468487739562988, -0.051875628530979156, -0.04906638339161873, -0.046257134526968, -0.043447889387607574, -0.04063864052295685, -0.03782939165830612, -0.035020142793655396, -0.03221089765429497, -0.02940164878964424, -0.026592401787638664, -0.023783154785633087, -0.02097390592098236, -0.018164658918976784, -0.015355410985648632, -0.01254616305232048, -0.009736916050314903, -0.006927667185664177, -0.0041184201836586, -0.0013091724831610918, 0.0015000752173364162, 0.004309322685003281, 0.007118570618331432, 0.009927818551659584, 0.012737065553665161, 0.015546314418315887, 0.018355561420321465, 0.02116480842232704, 0.023974057286977768, 0.026783304288983345, 0.029592551290988922, 0.03240180015563965, 0.035211049020290375, 0.0380202978849411, 0.04082954302430153, 0.043638791888952255, 0.04644803702831268, 0.04925728589296341, 0.052066534757614136, 0.05487578362226486, 0.05768502876162529, 0.060494277626276016, 0.06330352276563644, 0.06611277163028717, 0.0689220204949379, 0.07173126935958862, 0.07454051077365875, 0.07734975963830948, 0.0801590085029602, 0.08296825736761093, 0.08577750623226166]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 7.0, 5.0, 14.0, 9.0, 10.0, 17.0, 31.0, 27.0, 31.0, 38.0, 41.0, 51.0, 55.0, 48.0, 55.0, 53.0, 69.0, 63.0, 52.0, 59.0, 39.0, 29.0, 51.0, 17.0, 33.0, 25.0, 20.0, 12.0, 12.0, 11.0, 4.0, 2.0, 5.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0357738733291626, -0.03460797667503357, -0.03344208002090454, -0.03227618709206581, -0.031110290437936783, -0.029944393783807755, -0.028778498992323875, -0.027612604200839996, -0.026446707546710968, -0.02528081089258194, -0.02411491610109806, -0.02294902130961418, -0.021783124655485153, -0.020617228001356125, -0.019451333209872246, -0.018285438418388367, -0.01711954176425934, -0.01595364511013031, -0.014787750318646431, -0.013621854595839977, -0.012455958873033524, -0.01129006315022707, -0.010124167427420616, -0.008958271704614162, -0.007792375981807709, -0.006626480259001255, -0.005460584536194801, -0.004294688813388348, -0.003128793090581894, -0.00196289736777544, -0.0007970016449689865, 0.0003688940778374672, 0.001534789800643921, 0.0027006855234503746, 0.0038665812462568283, 0.005032476969063282, 0.006198372691869736, 0.007364268414676189, 0.008530164137482643, 0.009696059860289097, 0.01086195558309555, 0.012027851305902004, 0.013193747028708458, 0.014359642751514912, 0.015525538474321365, 0.016691435128450394, 0.017857329919934273, 0.019023224711418152, 0.02018912136554718, 0.02135501801967621, 0.022520912811160088, 0.023686807602643967, 0.024852704256772995, 0.026018600910902023, 0.027184495702385902, 0.02835039049386978, 0.02951628714799881, 0.030682183802127838, 0.031848080456256866, 0.033013973385095596, 0.034179870039224625, 0.03534576669335365, 0.03651165962219238, 0.03767755627632141, 0.03884345293045044]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 12.0, 15.0, 20.0, 21.0, 27.0, 35.0, 66.0, 101.0, 158.0, 259.0, 490.0, 1032.0, 2381.0, 6378.0, 23540.0, 204386.0, 711946.0, 76451.0, 13482.0, 4257.0, 1706.0, 708.0, 420.0, 230.0, 144.0, 75.0, 57.0, 46.0, 22.0, 29.0, 19.0, 13.0, 8.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05413818359375, -0.05246257781982422, -0.05078697204589844, -0.049111366271972656, -0.047435760498046875, -0.045760154724121094, -0.04408454895019531, -0.04240894317626953, -0.04073333740234375, -0.03905773162841797, -0.03738212585449219, -0.035706520080566406, -0.034030914306640625, -0.032355308532714844, -0.030679702758789062, -0.02900409698486328, -0.0273284912109375, -0.02565288543701172, -0.023977279663085938, -0.022301673889160156, -0.020626068115234375, -0.018950462341308594, -0.017274856567382812, -0.015599250793457031, -0.01392364501953125, -0.012248039245605469, -0.010572433471679688, -0.008896827697753906, -0.007221221923828125, -0.005545616149902344, -0.0038700103759765625, -0.0021944046020507812, -0.000518798828125, 0.0011568069458007812, 0.0028324127197265625, 0.004508018493652344, 0.006183624267578125, 0.007859230041503906, 0.009534835815429688, 0.011210441589355469, 0.01288604736328125, 0.014561653137207031, 0.016237258911132812, 0.017912864685058594, 0.019588470458984375, 0.021264076232910156, 0.022939682006835938, 0.02461528778076172, 0.0262908935546875, 0.02796649932861328, 0.029642105102539062, 0.031317710876464844, 0.032993316650390625, 0.034668922424316406, 0.03634452819824219, 0.03802013397216797, 0.03969573974609375, 0.04137134552001953, 0.04304695129394531, 0.044722557067871094, 0.046398162841796875, 0.048073768615722656, 0.04974937438964844, 0.05142498016357422, 0.0531005859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 10.0, 12.0, 18.0, 22.0, 35.0, 48.0, 48.0, 63.0, 67.0, 77.0, 72.0, 96.0, 85.0, 58.0, 50.0, 57.0, 53.0, 26.0, 25.0, 17.0, 13.0, 11.0, 6.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.009124755859375, -0.00883948802947998, -0.008554220199584961, -0.008268952369689941, -0.007983684539794922, -0.007698416709899902, -0.007413148880004883, -0.007127881050109863, -0.006842613220214844, -0.006557345390319824, -0.006272077560424805, -0.005986809730529785, -0.005701541900634766, -0.005416274070739746, -0.0051310062408447266, -0.004845738410949707, -0.0045604705810546875, -0.004275202751159668, -0.0039899349212646484, -0.003704667091369629, -0.0034193992614746094, -0.00313413143157959, -0.0028488636016845703, -0.0025635957717895508, -0.0022783279418945312, -0.0019930601119995117, -0.0017077922821044922, -0.0014225244522094727, -0.0011372566223144531, -0.0008519887924194336, -0.0005667209625244141, -0.00028145313262939453, 3.814697265625e-06, 0.00028908252716064453, 0.0005743503570556641, 0.0008596181869506836, 0.0011448860168457031, 0.0014301538467407227, 0.0017154216766357422, 0.0020006895065307617, 0.0022859573364257812, 0.0025712251663208008, 0.0028564929962158203, 0.00314176082611084, 0.0034270286560058594, 0.003712296485900879, 0.0039975643157958984, 0.004282832145690918, 0.0045680999755859375, 0.004853367805480957, 0.0051386356353759766, 0.005423903465270996, 0.005709171295166016, 0.005994439125061035, 0.006279706954956055, 0.006564974784851074, 0.006850242614746094, 0.007135510444641113, 0.007420778274536133, 0.007706046104431152, 0.007991313934326172, 0.008276581764221191, 0.008561849594116211, 0.00884711742401123, 0.00913238525390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 6.0, 11.0, 18.0, 19.0, 23.0, 49.0, 63.0, 110.0, 130.0, 206.0, 312.0, 477.0, 831.0, 1376.0, 2174.0, 3720.0, 6636.0, 12590.0, 26632.0, 65750.0, 189221.0, 375256.0, 222853.0, 77494.0, 30539.0, 14300.0, 7359.0, 4029.0, 2374.0, 1479.0, 907.0, 570.0, 317.0, 223.0, 140.0, 108.0, 72.0, 53.0, 39.0, 22.0, 14.0, 16.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.014068603515625, -0.01362311840057373, -0.013177633285522461, -0.012732148170471191, -0.012286663055419922, -0.011841177940368652, -0.011395692825317383, -0.010950207710266113, -0.010504722595214844, -0.010059237480163574, -0.009613752365112305, -0.009168267250061035, -0.008722782135009766, -0.008277297019958496, -0.007831811904907227, -0.007386326789855957, -0.0069408416748046875, -0.006495356559753418, -0.0060498714447021484, -0.005604386329650879, -0.005158901214599609, -0.00471341609954834, -0.00426793098449707, -0.0038224458694458008, -0.0033769607543945312, -0.0029314756393432617, -0.002485990524291992, -0.0020405054092407227, -0.0015950202941894531, -0.0011495351791381836, -0.0007040500640869141, -0.00025856494903564453, 0.000186920166015625, 0.0006324052810668945, 0.001077890396118164, 0.0015233755111694336, 0.001968860626220703, 0.0024143457412719727, 0.002859830856323242, 0.0033053159713745117, 0.0037508010864257812, 0.004196286201477051, 0.00464177131652832, 0.00508725643157959, 0.005532741546630859, 0.005978226661682129, 0.0064237117767333984, 0.006869196891784668, 0.0073146820068359375, 0.007760167121887207, 0.008205652236938477, 0.008651137351989746, 0.009096622467041016, 0.009542107582092285, 0.009987592697143555, 0.010433077812194824, 0.010878562927246094, 0.011324048042297363, 0.011769533157348633, 0.012215018272399902, 0.012660503387451172, 0.013105988502502441, 0.013551473617553711, 0.01399695873260498, 0.01444244384765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 6.0, 7.0, 5.0, 15.0, 16.0, 18.0, 17.0, 27.0, 26.0, 37.0, 24.0, 32.0, 38.0, 47.0, 38.0, 47.0, 38.0, 54.0, 37.0, 34.0, 32.0, 45.0, 25.0, 37.0, 44.0, 30.0, 29.0, 36.0, 26.0, 16.0, 23.0, 16.0, 14.0, 15.0, 9.0, 9.0, 3.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0182037353515625, -0.0176239013671875, -0.0170440673828125, -0.0164642333984375, -0.0158843994140625, -0.0153045654296875, -0.0147247314453125, -0.0141448974609375, -0.0135650634765625, -0.0129852294921875, -0.0124053955078125, -0.0118255615234375, -0.0112457275390625, -0.0106658935546875, -0.0100860595703125, -0.0095062255859375, -0.0089263916015625, -0.0083465576171875, -0.0077667236328125, -0.0071868896484375, -0.0066070556640625, -0.0060272216796875, -0.0054473876953125, -0.0048675537109375, -0.0042877197265625, -0.0037078857421875, -0.0031280517578125, -0.0025482177734375, -0.0019683837890625, -0.0013885498046875, -0.0008087158203125, -0.0002288818359375, 0.0003509521484375, 0.0009307861328125, 0.0015106201171875, 0.0020904541015625, 0.0026702880859375, 0.0032501220703125, 0.0038299560546875, 0.0044097900390625, 0.0049896240234375, 0.0055694580078125, 0.0061492919921875, 0.0067291259765625, 0.0073089599609375, 0.0078887939453125, 0.0084686279296875, 0.0090484619140625, 0.0096282958984375, 0.0102081298828125, 0.0107879638671875, 0.0113677978515625, 0.0119476318359375, 0.0125274658203125, 0.0131072998046875, 0.0136871337890625, 0.0142669677734375, 0.0148468017578125, 0.0154266357421875, 0.0160064697265625, 0.0165863037109375, 0.0171661376953125, 0.0177459716796875, 0.0183258056640625, 0.0189056396484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 3.0, 2.0, 17.0, 21.0, 28.0, 47.0, 73.0, 113.0, 159.0, 288.0, 566.0, 1378.0, 6406.0, 86122.0, 852532.0, 91367.0, 6617.0, 1437.0, 591.0, 302.0, 171.0, 113.0, 89.0, 33.0, 35.0, 15.0, 11.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0264434814453125, -0.025790691375732422, -0.025137901306152344, -0.024485111236572266, -0.023832321166992188, -0.02317953109741211, -0.02252674102783203, -0.021873950958251953, -0.021221160888671875, -0.020568370819091797, -0.01991558074951172, -0.01926279067993164, -0.018610000610351562, -0.017957210540771484, -0.017304420471191406, -0.016651630401611328, -0.01599884033203125, -0.015346050262451172, -0.014693260192871094, -0.014040470123291016, -0.013387680053710938, -0.01273488998413086, -0.012082099914550781, -0.011429309844970703, -0.010776519775390625, -0.010123729705810547, -0.009470939636230469, -0.00881814956665039, -0.008165359497070312, -0.007512569427490234, -0.006859779357910156, -0.006206989288330078, -0.00555419921875, -0.004901409149169922, -0.004248619079589844, -0.0035958290100097656, -0.0029430389404296875, -0.0022902488708496094, -0.0016374588012695312, -0.0009846687316894531, -0.000331878662109375, 0.0003209114074707031, 0.0009737014770507812, 0.0016264915466308594, 0.0022792816162109375, 0.0029320716857910156, 0.0035848617553710938, 0.004237651824951172, 0.00489044189453125, 0.005543231964111328, 0.006196022033691406, 0.006848812103271484, 0.0075016021728515625, 0.00815439224243164, 0.008807182312011719, 0.009459972381591797, 0.010112762451171875, 0.010765552520751953, 0.011418342590332031, 0.01207113265991211, 0.012723922729492188, 0.013376712799072266, 0.014029502868652344, 0.014682292938232422, 0.0153350830078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 42.0, 216.0, 415.0, 238.0, 63.0, 23.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002067089080810547, -0.00019494816660881042, -0.00018318742513656616, -0.0001714266836643219, -0.00015966594219207764, -0.00014790520071983337, -0.0001361444592475891, -0.00012438371777534485, -0.00011262297630310059, -0.00010086223483085632, -8.910149335861206e-05, -7.73407518863678e-05, -6.558001041412354e-05, -5.381926894187927e-05, -4.205852746963501e-05, -3.0297785997390747e-05, -1.8537044525146484e-05, -6.776303052902222e-06, 4.984438419342041e-06, 1.6745179891586304e-05, 2.8505921363830566e-05, 4.026666283607483e-05, 5.202740430831909e-05, 6.378814578056335e-05, 7.554888725280762e-05, 8.730962872505188e-05, 9.907037019729614e-05, 0.0001108311116695404, 0.00012259185314178467, 0.00013435259461402893, 0.0001461133360862732, 0.00015787407755851746, 0.00016963481903076172, 0.00018139556050300598, 0.00019315630197525024, 0.0002049170434474945, 0.00021667778491973877, 0.00022843852639198303, 0.0002401992678642273, 0.00025196000933647156, 0.0002637207508087158, 0.0002754814922809601, 0.00028724223375320435, 0.0002990029752254486, 0.00031076371669769287, 0.00032252445816993713, 0.0003342851996421814, 0.00034604594111442566, 0.0003578066825866699, 0.0003695674240589142, 0.00038132816553115845, 0.0003930889070034027, 0.00040484964847564697, 0.00041661038994789124, 0.0004283711314201355, 0.00044013187289237976, 0.000451892614364624, 0.0004636533558368683, 0.00047541409730911255, 0.0004871748387813568, 0.0004989355802536011, 0.0005106963217258453, 0.0005224570631980896, 0.0005342178046703339, 0.0005459785461425781]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 12.0, 18.0, 21.0, 34.0, 64.0, 96.0, 236.0, 735.0, 3552.0, 53993.0, 873160.0, 109971.0, 5090.0, 984.0, 312.0, 114.0, 55.0, 37.0, 19.0, 6.0, 13.0, 7.0, 2.0, 9.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.016510009765625, -0.015838623046875, -0.015167236328125, -0.014495849609375, -0.013824462890625, -0.013153076171875, -0.012481689453125, -0.011810302734375, -0.011138916015625, -0.010467529296875, -0.009796142578125, -0.009124755859375, -0.008453369140625, -0.007781982421875, -0.007110595703125, -0.006439208984375, -0.005767822265625, -0.005096435546875, -0.004425048828125, -0.003753662109375, -0.003082275390625, -0.002410888671875, -0.001739501953125, -0.001068115234375, -0.000396728515625, 0.000274658203125, 0.000946044921875, 0.001617431640625, 0.002288818359375, 0.002960205078125, 0.003631591796875, 0.004302978515625, 0.004974365234375, 0.005645751953125, 0.006317138671875, 0.006988525390625, 0.007659912109375, 0.008331298828125, 0.009002685546875, 0.009674072265625, 0.010345458984375, 0.011016845703125, 0.011688232421875, 0.012359619140625, 0.013031005859375, 0.013702392578125, 0.014373779296875, 0.015045166015625, 0.015716552734375, 0.016387939453125, 0.017059326171875, 0.017730712890625, 0.018402099609375, 0.019073486328125, 0.019744873046875, 0.020416259765625, 0.021087646484375, 0.021759033203125, 0.022430419921875, 0.023101806640625, 0.023773193359375, 0.024444580078125, 0.025115966796875, 0.025787353515625, 0.026458740234375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 5.0, 8.0, 3.0, 9.0, 7.0, 19.0, 24.0, 39.0, 66.0, 90.0, 90.0, 120.0, 114.0, 105.0, 94.0, 73.0, 44.0, 22.0, 16.0, 17.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01251983642578125, -0.012058854103088379, -0.011597871780395508, -0.011136889457702637, -0.010675907135009766, -0.010214924812316895, -0.009753942489624023, -0.009292960166931152, -0.008831977844238281, -0.00837099552154541, -0.007910013198852539, -0.007449030876159668, -0.006988048553466797, -0.006527066230773926, -0.006066083908081055, -0.005605101585388184, -0.0051441192626953125, -0.004683136940002441, -0.00422215461730957, -0.0037611722946166992, -0.003300189971923828, -0.002839207649230957, -0.002378225326538086, -0.0019172430038452148, -0.0014562606811523438, -0.0009952783584594727, -0.0005342960357666016, -7.331371307373047e-05, 0.0003876686096191406, 0.0008486509323120117, 0.0013096332550048828, 0.001770615577697754, 0.002231597900390625, 0.002692580223083496, 0.003153562545776367, 0.0036145448684692383, 0.004075527191162109, 0.0045365095138549805, 0.0049974918365478516, 0.005458474159240723, 0.005919456481933594, 0.006380438804626465, 0.006841421127319336, 0.007302403450012207, 0.007763385772705078, 0.00822436809539795, 0.00868535041809082, 0.009146332740783691, 0.009607315063476562, 0.010068297386169434, 0.010529279708862305, 0.010990262031555176, 0.011451244354248047, 0.011912226676940918, 0.012373208999633789, 0.01283419132232666, 0.013295173645019531, 0.013756155967712402, 0.014217138290405273, 0.014678120613098145, 0.015139102935791016, 0.015600085258483887, 0.016061067581176758, 0.01652204990386963, 0.0169830322265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 27.0, 128.0, 387.0, 358.0, 82.0, 18.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2876220643520355, -0.2707435190677643, -0.25386497378349304, -0.2369864284992218, -0.22010788321495056, -0.20322933793067932, -0.1863507777452469, -0.16947223246097565, -0.1525936871767044, -0.13571514189243317, -0.11883659660816193, -0.10195804387331009, -0.08507949858903885, -0.06820095330476761, -0.05132240056991577, -0.03444385528564453, -0.01756531000137329, -0.0006867628544569016, 0.016191784292459488, 0.03307033330202103, 0.04994887858629227, 0.06682742387056351, 0.08370597660541534, 0.10058452188968658, 0.11746306717395782, 0.13434161245822906, 0.1512201577425003, 0.16809871792793274, 0.18497726321220398, 0.20185580849647522, 0.21873435378074646, 0.2356128990650177, 0.25249141454696655, 0.2693699598312378, 0.28624850511550903, 0.3031270503997803, 0.3200055956840515, 0.33688414096832275, 0.353762686252594, 0.37064123153686523, 0.3875197768211365, 0.4043983221054077, 0.42127686738967896, 0.4381554126739502, 0.45503395795822144, 0.4719125032424927, 0.4887910485267639, 0.5056695938110352, 0.5225481986999512, 0.5394267439842224, 0.5563052892684937, 0.5731838345527649, 0.5900623798370361, 0.6069409251213074, 0.6238194704055786, 0.6406980156898499, 0.6575765609741211, 0.6744551062583923, 0.6913336515426636, 0.7082121968269348, 0.725090742111206, 0.7419692873954773, 0.7588478326797485, 0.7757263779640198, 0.792604923248291]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 4.0, 6.0, 13.0, 10.0, 13.0, 10.0, 17.0, 13.0, 14.0, 22.0, 27.0, 28.0, 34.0, 36.0, 37.0, 31.0, 32.0, 30.0, 33.0, 38.0, 46.0, 32.0, 41.0, 39.0, 42.0, 31.0, 32.0, 27.0, 30.0, 29.0, 21.0, 28.0, 25.0, 10.0, 19.0, 11.0, 11.0, 10.0, 10.0, 8.0, 11.0, 7.0, 2.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0826493501663208, -0.08013132959604263, -0.07761330902576447, -0.0750952959060669, -0.07257727533578873, -0.07005925476551056, -0.06754124164581299, -0.06502322107553482, -0.06250520050525665, -0.059987179934978485, -0.057469163089990616, -0.05495114624500275, -0.05243312567472458, -0.04991510510444641, -0.04739708825945854, -0.04487907141447067, -0.042361050844192505, -0.03984303027391434, -0.03732501342892647, -0.0348069965839386, -0.03228897601366043, -0.029770957306027412, -0.027252938598394394, -0.024734919890761375, -0.022216901183128357, -0.01969888247549534, -0.01718086376786232, -0.014662845060229301, -0.012144826352596283, -0.009626807644963264, -0.007108788937330246, -0.0045907702296972275, -0.002072751522064209, 0.0004452671855688095, 0.002963285893201828, 0.0054813046008348465, 0.007999323308467865, 0.010517342016100883, 0.013035360723733902, 0.01555337943136692, 0.01807139813899994, 0.020589416846632957, 0.023107435554265976, 0.025625454261898994, 0.028143472969532013, 0.03066149167716503, 0.03317951038479805, 0.03569752722978592, 0.03821554780006409, 0.040733568370342255, 0.043251585215330124, 0.04576960206031799, 0.04828762263059616, 0.05080564320087433, 0.0533236600458622, 0.05584167689085007, 0.058359697461128235, 0.0608777180314064, 0.06339573860168457, 0.06591375172138214, 0.06843177229166031, 0.07094979286193848, 0.07346780598163605, 0.07598582655191422, 0.07850384712219238]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 10.0, 11.0, 7.0, 18.0, 29.0, 37.0, 49.0, 56.0, 91.0, 115.0, 179.0, 205.0, 320.0, 454.0, 658.0, 1010.0, 1741.0, 3376.0, 7807.0, 27939.0, 376597.0, 3690174.0, 59534.0, 12701.0, 4853.0, 2322.0, 1344.0, 840.0, 517.0, 396.0, 230.0, 183.0, 146.0, 76.0, 73.0, 51.0, 37.0, 24.0, 24.0, 14.0, 6.0, 12.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.040679931640625, -0.03955650329589844, -0.038433074951171875, -0.03730964660644531, -0.03618621826171875, -0.03506278991699219, -0.033939361572265625, -0.03281593322753906, -0.0316925048828125, -0.030569076538085938, -0.029445648193359375, -0.028322219848632812, -0.02719879150390625, -0.026075363159179688, -0.024951934814453125, -0.023828506469726562, -0.022705078125, -0.021581649780273438, -0.020458221435546875, -0.019334793090820312, -0.01821136474609375, -0.017087936401367188, -0.015964508056640625, -0.014841079711914062, -0.0137176513671875, -0.012594223022460938, -0.011470794677734375, -0.010347366333007812, -0.00922393798828125, -0.008100509643554688, -0.006977081298828125, -0.0058536529541015625, -0.004730224609375, -0.0036067962646484375, -0.002483367919921875, -0.0013599395751953125, -0.00023651123046875, 0.0008869171142578125, 0.002010345458984375, 0.0031337738037109375, 0.0042572021484375, 0.0053806304931640625, 0.006504058837890625, 0.0076274871826171875, 0.00875091552734375, 0.009874343872070312, 0.010997772216796875, 0.012121200561523438, 0.01324462890625, 0.014368057250976562, 0.015491485595703125, 0.016614913940429688, 0.01773834228515625, 0.018861770629882812, 0.019985198974609375, 0.021108627319335938, 0.0222320556640625, 0.023355484008789062, 0.024478912353515625, 0.025602340698242188, 0.02672576904296875, 0.027849197387695312, 0.028972625732421875, 0.030096054077148438, 0.031219482421875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 15.0, 16.0, 21.0, 16.0, 32.0, 39.0, 38.0, 53.0, 73.0, 69.0, 93.0, 84.0, 65.0, 67.0, 71.0, 63.0, 45.0, 35.0, 23.0, 13.0, 18.0, 15.0, 9.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.0093231201171875, -0.00903463363647461, -0.008746147155761719, -0.008457660675048828, -0.008169174194335938, -0.007880687713623047, -0.007592201232910156, -0.007303714752197266, -0.007015228271484375, -0.006726741790771484, -0.006438255310058594, -0.006149768829345703, -0.0058612823486328125, -0.005572795867919922, -0.005284309387207031, -0.004995822906494141, -0.00470733642578125, -0.004418849945068359, -0.004130363464355469, -0.003841876983642578, -0.0035533905029296875, -0.003264904022216797, -0.0029764175415039062, -0.0026879310607910156, -0.002399444580078125, -0.0021109580993652344, -0.0018224716186523438, -0.0015339851379394531, -0.0012454986572265625, -0.0009570121765136719, -0.0006685256958007812, -0.0003800392150878906, -9.1552734375e-05, 0.00019693374633789062, 0.00048542022705078125, 0.0007739067077636719, 0.0010623931884765625, 0.0013508796691894531, 0.0016393661499023438, 0.0019278526306152344, 0.002216339111328125, 0.0025048255920410156, 0.0027933120727539062, 0.003081798553466797, 0.0033702850341796875, 0.003658771514892578, 0.003947257995605469, 0.004235744476318359, 0.00452423095703125, 0.004812717437744141, 0.005101203918457031, 0.005389690399169922, 0.0056781768798828125, 0.005966663360595703, 0.006255149841308594, 0.006543636322021484, 0.006832122802734375, 0.007120609283447266, 0.007409095764160156, 0.007697582244873047, 0.007986068725585938, 0.008274555206298828, 0.008563041687011719, 0.00885152816772461, 0.0091400146484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 8.0, 19.0, 30.0, 52.0, 86.0, 145.0, 311.0, 634.0, 1478.0, 4115.0, 15039.0, 133832.0, 3918551.0, 100459.0, 13228.0, 3627.0, 1375.0, 599.0, 343.0, 154.0, 93.0, 53.0, 32.0, 12.0, 13.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.053741455078125, -0.05260896682739258, -0.051476478576660156, -0.050343990325927734, -0.04921150207519531, -0.04807901382446289, -0.04694652557373047, -0.04581403732299805, -0.044681549072265625, -0.0435490608215332, -0.04241657257080078, -0.04128408432006836, -0.04015159606933594, -0.039019107818603516, -0.037886619567871094, -0.03675413131713867, -0.03562164306640625, -0.03448915481567383, -0.033356666564941406, -0.032224178314208984, -0.031091690063476562, -0.02995920181274414, -0.02882671356201172, -0.027694225311279297, -0.026561737060546875, -0.025429248809814453, -0.02429676055908203, -0.02316427230834961, -0.022031784057617188, -0.020899295806884766, -0.019766807556152344, -0.018634319305419922, -0.0175018310546875, -0.016369342803955078, -0.015236854553222656, -0.014104366302490234, -0.012971878051757812, -0.01183938980102539, -0.010706901550292969, -0.009574413299560547, -0.008441925048828125, -0.007309436798095703, -0.006176948547363281, -0.005044460296630859, -0.0039119720458984375, -0.0027794837951660156, -0.0016469955444335938, -0.0005145072937011719, 0.00061798095703125, 0.0017504692077636719, 0.0028829574584960938, 0.004015445709228516, 0.0051479339599609375, 0.006280422210693359, 0.007412910461425781, 0.008545398712158203, 0.009677886962890625, 0.010810375213623047, 0.011942863464355469, 0.01307535171508789, 0.014207839965820312, 0.015340328216552734, 0.016472816467285156, 0.017605304718017578, 0.01873779296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 10.0, 13.0, 28.0, 36.0, 61.0, 165.0, 555.0, 2315.0, 554.0, 169.0, 66.0, 31.0, 22.0, 13.0, 11.0, 3.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009490966796875, -0.009069204330444336, -0.008647441864013672, -0.008225679397583008, -0.007803916931152344, -0.00738215446472168, -0.006960391998291016, -0.0065386295318603516, -0.0061168670654296875, -0.0056951045989990234, -0.005273342132568359, -0.004851579666137695, -0.004429817199707031, -0.004008054733276367, -0.003586292266845703, -0.003164529800415039, -0.002742767333984375, -0.002321004867553711, -0.0018992424011230469, -0.0014774799346923828, -0.0010557174682617188, -0.0006339550018310547, -0.00021219253540039062, 0.00020956993103027344, 0.0006313323974609375, 0.0010530948638916016, 0.0014748573303222656, 0.0018966197967529297, 0.0023183822631835938, 0.002740144729614258, 0.003161907196044922, 0.003583669662475586, 0.00400543212890625, 0.004427194595336914, 0.004848957061767578, 0.005270719528198242, 0.005692481994628906, 0.00611424446105957, 0.006536006927490234, 0.0069577693939208984, 0.0073795318603515625, 0.0078012943267822266, 0.00822305679321289, 0.008644819259643555, 0.009066581726074219, 0.009488344192504883, 0.009910106658935547, 0.010331869125366211, 0.010753631591796875, 0.011175394058227539, 0.011597156524658203, 0.012018918991088867, 0.012440681457519531, 0.012862443923950195, 0.01328420639038086, 0.013705968856811523, 0.014127731323242188, 0.014549493789672852, 0.014971256256103516, 0.01539301872253418, 0.015814781188964844, 0.016236543655395508, 0.016658306121826172, 0.017080068588256836, 0.0175018310546875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 25.0, 84.0, 278.0, 331.0, 167.0, 60.0, 19.0, 13.0, 5.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09847377240657806, -0.09486760944128036, -0.09126145392656326, -0.08765529096126556, -0.08404913544654846, -0.08044297248125076, -0.07683680951595306, -0.07323065400123596, -0.06962449103593826, -0.06601832807064056, -0.06241217255592346, -0.05880600959062576, -0.05519985035061836, -0.05159369111061096, -0.04798752814531326, -0.04438136890530586, -0.04077520966529846, -0.03716905042529106, -0.03356289118528366, -0.029956728219985962, -0.02635056897997856, -0.02274440973997116, -0.01913824863731861, -0.015532087534666061, -0.011925928294658661, -0.008319768123328686, -0.004713607951998711, -0.0011074477806687355, 0.0024987123906612396, 0.00610487163066864, 0.00971103273332119, 0.01331719383597374, 0.01692335307598114, 0.02052951231598854, 0.02413567341864109, 0.02774183452129364, 0.03134799376130104, 0.03495415300130844, 0.03856031596660614, 0.04216647520661354, 0.04577263444662094, 0.04937879368662834, 0.05298495292663574, 0.05659111589193344, 0.06019727513194084, 0.06380343437194824, 0.06740959733724594, 0.07101576030254364, 0.07462191581726074, 0.07822807878255844, 0.08183423429727554, 0.08544039726257324, 0.08904655277729034, 0.09265271574258804, 0.09625887870788574, 0.09986503422260284, 0.10347119718790054, 0.10707736015319824, 0.11068351566791534, 0.11428967863321304, 0.11789584159851074, 0.12150199711322784, 0.12510815262794495, 0.12871432304382324, 0.13232047855854034]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 9.0, 8.0, 15.0, 12.0, 14.0, 23.0, 37.0, 32.0, 21.0, 37.0, 33.0, 42.0, 41.0, 46.0, 43.0, 49.0, 48.0, 50.0, 50.0, 36.0, 47.0, 40.0, 38.0, 38.0, 29.0, 20.0, 24.0, 22.0, 19.0, 13.0, 12.0, 10.0, 11.0, 2.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.023458898067474365, -0.022695351392030716, -0.021931806579232216, -0.021168261766433716, -0.020404715090990067, -0.019641168415546417, -0.018877623602747917, -0.018114078789949417, -0.017350532114505768, -0.01658698543906212, -0.01582344062626362, -0.015059894882142544, -0.014296349138021469, -0.013532803393900394, -0.01276925764977932, -0.012005711905658245, -0.01124216616153717, -0.010478620417416096, -0.009715074673295021, -0.008951528929173946, -0.008187983185052872, -0.007424437440931797, -0.006660891696810722, -0.005897345952689648, -0.005133800208568573, -0.004370254464447498, -0.0036067087203264236, -0.002843162976205349, -0.0020796172320842743, -0.0013160714879631996, -0.0005525257438421249, 0.00021102000027894974, 0.0009745657444000244, 0.001738111488521099, 0.0025016572326421738, 0.0032652029767632484, 0.004028748720884323, 0.004792294465005398, 0.0055558402091264725, 0.006319385953247547, 0.007082931697368622, 0.007846477441489697, 0.008610023185610771, 0.009373568929731846, 0.01013711467385292, 0.010900660417973995, 0.01166420616209507, 0.012427751906216145, 0.01319129765033722, 0.013954843394458294, 0.014718389138579369, 0.015481934882700443, 0.016245480626821518, 0.017009027302265167, 0.017772572115063667, 0.018536116927862167, 0.019299663603305817, 0.020063210278749466, 0.020826755091547966, 0.021590299904346466, 0.022353846579790115, 0.023117393255233765, 0.023880938068032265, 0.024644482880830765, 0.025408029556274414]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 8.0, 5.0, 16.0, 20.0, 32.0, 45.0, 56.0, 100.0, 127.0, 233.0, 375.0, 583.0, 960.0, 1744.0, 3589.0, 7602.0, 18063.0, 51291.0, 164968.0, 385804.0, 272961.0, 88605.0, 29311.0, 11461.0, 4927.0, 2458.0, 1256.0, 762.0, 412.0, 284.0, 171.0, 116.0, 78.0, 47.0, 19.0, 28.0, 17.0, 9.0, 8.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0174560546875, -0.016888141632080078, -0.016320228576660156, -0.015752315521240234, -0.015184402465820312, -0.01461648941040039, -0.014048576354980469, -0.013480663299560547, -0.012912750244140625, -0.012344837188720703, -0.011776924133300781, -0.01120901107788086, -0.010641098022460938, -0.010073184967041016, -0.009505271911621094, -0.008937358856201172, -0.00836944580078125, -0.007801532745361328, -0.007233619689941406, -0.006665706634521484, -0.0060977935791015625, -0.005529880523681641, -0.004961967468261719, -0.004394054412841797, -0.003826141357421875, -0.003258228302001953, -0.0026903152465820312, -0.0021224021911621094, -0.0015544891357421875, -0.0009865760803222656, -0.00041866302490234375, 0.00014925003051757812, 0.0007171630859375, 0.0012850761413574219, 0.0018529891967773438, 0.0024209022521972656, 0.0029888153076171875, 0.0035567283630371094, 0.004124641418457031, 0.004692554473876953, 0.005260467529296875, 0.005828380584716797, 0.006396293640136719, 0.006964206695556641, 0.0075321197509765625, 0.008100032806396484, 0.008667945861816406, 0.009235858917236328, 0.00980377197265625, 0.010371685028076172, 0.010939598083496094, 0.011507511138916016, 0.012075424194335938, 0.01264333724975586, 0.013211250305175781, 0.013779163360595703, 0.014347076416015625, 0.014914989471435547, 0.015482902526855469, 0.01605081558227539, 0.016618728637695312, 0.017186641693115234, 0.017754554748535156, 0.018322467803955078, 0.018890380859375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 14.0, 12.0, 20.0, 21.0, 26.0, 44.0, 47.0, 76.0, 87.0, 72.0, 82.0, 74.0, 68.0, 71.0, 75.0, 48.0, 40.0, 36.0, 25.0, 12.0, 18.0, 7.0, 6.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0098419189453125, -0.009534358978271484, -0.009226799011230469, -0.008919239044189453, -0.008611679077148438, -0.008304119110107422, -0.007996559143066406, -0.007688999176025391, -0.007381439208984375, -0.007073879241943359, -0.006766319274902344, -0.006458759307861328, -0.0061511993408203125, -0.005843639373779297, -0.005536079406738281, -0.005228519439697266, -0.00492095947265625, -0.004613399505615234, -0.004305839538574219, -0.003998279571533203, -0.0036907196044921875, -0.003383159637451172, -0.0030755996704101562, -0.0027680397033691406, -0.002460479736328125, -0.0021529197692871094, -0.0018453598022460938, -0.0015377998352050781, -0.0012302398681640625, -0.0009226799011230469, -0.0006151199340820312, -0.0003075599670410156, 0.0, 0.0003075599670410156, 0.0006151199340820312, 0.0009226799011230469, 0.0012302398681640625, 0.0015377998352050781, 0.0018453598022460938, 0.0021529197692871094, 0.002460479736328125, 0.0027680397033691406, 0.0030755996704101562, 0.003383159637451172, 0.0036907196044921875, 0.003998279571533203, 0.004305839538574219, 0.004613399505615234, 0.00492095947265625, 0.005228519439697266, 0.005536079406738281, 0.005843639373779297, 0.0061511993408203125, 0.006458759307861328, 0.006766319274902344, 0.007073879241943359, 0.007381439208984375, 0.007688999176025391, 0.007996559143066406, 0.008304119110107422, 0.008611679077148438, 0.008919239044189453, 0.009226799011230469, 0.009534358978271484, 0.0098419189453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 2.0, 5.0, 10.0, 10.0, 14.0, 21.0, 14.0, 45.0, 22.0, 44.0, 66.0, 91.0, 150.0, 210.0, 383.0, 640.0, 1168.0, 2436.0, 5525.0, 13738.0, 37113.0, 122773.0, 388178.0, 329737.0, 95432.0, 30145.0, 11292.0, 4599.0, 2137.0, 1025.0, 554.0, 319.0, 201.0, 122.0, 78.0, 63.0, 46.0, 33.0, 33.0, 22.0, 12.0, 10.0, 10.0, 14.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.01491546630859375, -0.014432787895202637, -0.013950109481811523, -0.01346743106842041, -0.012984752655029297, -0.012502074241638184, -0.01201939582824707, -0.011536717414855957, -0.011054039001464844, -0.01057136058807373, -0.010088682174682617, -0.009606003761291504, -0.00912332534790039, -0.008640646934509277, -0.008157968521118164, -0.007675290107727051, -0.0071926116943359375, -0.006709933280944824, -0.006227254867553711, -0.005744576454162598, -0.005261898040771484, -0.004779219627380371, -0.004296541213989258, -0.0038138628005981445, -0.0033311843872070312, -0.002848505973815918, -0.0023658275604248047, -0.0018831491470336914, -0.0014004707336425781, -0.0009177923202514648, -0.00043511390686035156, 4.756450653076172e-05, 0.000530242919921875, 0.0010129213333129883, 0.0014955997467041016, 0.001978278160095215, 0.002460956573486328, 0.0029436349868774414, 0.0034263134002685547, 0.003908991813659668, 0.004391670227050781, 0.0048743486404418945, 0.005357027053833008, 0.005839705467224121, 0.006322383880615234, 0.006805062294006348, 0.007287740707397461, 0.007770419120788574, 0.008253097534179688, 0.0087357759475708, 0.009218454360961914, 0.009701132774353027, 0.01018381118774414, 0.010666489601135254, 0.011149168014526367, 0.01163184642791748, 0.012114524841308594, 0.012597203254699707, 0.01307988166809082, 0.013562560081481934, 0.014045238494873047, 0.01452791690826416, 0.015010595321655273, 0.015493273735046387, 0.0159759521484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 4.0, 2.0, 6.0, 7.0, 4.0, 7.0, 5.0, 7.0, 6.0, 20.0, 16.0, 14.0, 24.0, 15.0, 22.0, 24.0, 32.0, 29.0, 35.0, 38.0, 33.0, 36.0, 48.0, 46.0, 41.0, 42.0, 34.0, 33.0, 53.0, 38.0, 38.0, 35.0, 31.0, 21.0, 16.0, 27.0, 12.0, 19.0, 17.0, 16.0, 12.0, 5.0, 8.0, 10.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0228118896484375, -0.02215099334716797, -0.021490097045898438, -0.020829200744628906, -0.020168304443359375, -0.019507408142089844, -0.018846511840820312, -0.01818561553955078, -0.01752471923828125, -0.01686382293701172, -0.016202926635742188, -0.015542030334472656, -0.014881134033203125, -0.014220237731933594, -0.013559341430664062, -0.012898445129394531, -0.012237548828125, -0.011576652526855469, -0.010915756225585938, -0.010254859924316406, -0.009593963623046875, -0.008933067321777344, -0.008272171020507812, -0.007611274719238281, -0.00695037841796875, -0.006289482116699219, -0.0056285858154296875, -0.004967689514160156, -0.004306793212890625, -0.0036458969116210938, -0.0029850006103515625, -0.0023241043090820312, -0.0016632080078125, -0.0010023117065429688, -0.0003414154052734375, 0.00031948089599609375, 0.000980377197265625, 0.0016412734985351562, 0.0023021697998046875, 0.0029630661010742188, 0.00362396240234375, 0.004284858703613281, 0.0049457550048828125, 0.005606651306152344, 0.006267547607421875, 0.006928443908691406, 0.0075893402099609375, 0.008250236511230469, 0.0089111328125, 0.009572029113769531, 0.010232925415039062, 0.010893821716308594, 0.011554718017578125, 0.012215614318847656, 0.012876510620117188, 0.013537406921386719, 0.01419830322265625, 0.014859199523925781, 0.015520095825195312, 0.016180992126464844, 0.016841888427734375, 0.017502784729003906, 0.018163681030273438, 0.01882457733154297, 0.0194854736328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 2.0, 4.0, 6.0, 13.0, 25.0, 56.0, 141.0, 373.0, 1212.0, 4344.0, 23214.0, 330968.0, 631794.0, 46813.0, 6992.0, 1693.0, 542.0, 182.0, 91.0, 47.0, 16.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0176239013671875, -0.01714956760406494, -0.016675233840942383, -0.016200900077819824, -0.015726566314697266, -0.015252232551574707, -0.014777898788452148, -0.01430356502532959, -0.013829231262207031, -0.013354897499084473, -0.012880563735961914, -0.012406229972839355, -0.011931896209716797, -0.011457562446594238, -0.01098322868347168, -0.010508894920349121, -0.010034561157226562, -0.009560227394104004, -0.009085893630981445, -0.008611559867858887, -0.008137226104736328, -0.0076628923416137695, -0.007188558578491211, -0.006714224815368652, -0.006239891052246094, -0.005765557289123535, -0.0052912235260009766, -0.004816889762878418, -0.004342555999755859, -0.0038682222366333008, -0.003393888473510742, -0.0029195547103881836, -0.002445220947265625, -0.0019708871841430664, -0.0014965534210205078, -0.0010222196578979492, -0.0005478858947753906, -7.355213165283203e-05, 0.00040078163146972656, 0.0008751153945922852, 0.0013494491577148438, 0.0018237829208374023, 0.002298116683959961, 0.0027724504470825195, 0.003246784210205078, 0.0037211179733276367, 0.004195451736450195, 0.004669785499572754, 0.0051441192626953125, 0.005618453025817871, 0.00609278678894043, 0.006567120552062988, 0.007041454315185547, 0.0075157880783081055, 0.007990121841430664, 0.008464455604553223, 0.008938789367675781, 0.00941312313079834, 0.009887456893920898, 0.010361790657043457, 0.010836124420166016, 0.011310458183288574, 0.011784791946411133, 0.012259125709533691, 0.01273345947265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 8.0, 5.0, 22.0, 38.0, 87.0, 143.0, 223.0, 189.0, 146.0, 72.0, 45.0, 19.0, 10.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00018453598022460938, -0.00018042884767055511, -0.00017632171511650085, -0.0001722145825624466, -0.00016810745000839233, -0.00016400031745433807, -0.0001598931849002838, -0.00015578605234622955, -0.0001516789197921753, -0.00014757178723812103, -0.00014346465468406677, -0.0001393575221300125, -0.00013525038957595825, -0.000131143257021904, -0.00012703612446784973, -0.00012292899191379547, -0.00011882185935974121, -0.00011471472680568695, -0.00011060759425163269, -0.00010650046169757843, -0.00010239332914352417, -9.828619658946991e-05, -9.417906403541565e-05, -9.007193148136139e-05, -8.596479892730713e-05, -8.185766637325287e-05, -7.775053381919861e-05, -7.364340126514435e-05, -6.953626871109009e-05, -6.542913615703583e-05, -6.132200360298157e-05, -5.721487104892731e-05, -5.310773849487305e-05, -4.900060594081879e-05, -4.4893473386764526e-05, -4.0786340832710266e-05, -3.6679208278656006e-05, -3.2572075724601746e-05, -2.8464943170547485e-05, -2.4357810616493225e-05, -2.0250678062438965e-05, -1.6143545508384705e-05, -1.2036412954330444e-05, -7.929280400276184e-06, -3.822147846221924e-06, 2.849847078323364e-07, 4.392117261886597e-06, 8.499249815940857e-06, 1.2606382369995117e-05, 1.6713514924049377e-05, 2.0820647478103638e-05, 2.4927780032157898e-05, 2.9034912586212158e-05, 3.314204514026642e-05, 3.724917769432068e-05, 4.135631024837494e-05, 4.54634428024292e-05, 4.957057535648346e-05, 5.367770791053772e-05, 5.778484046459198e-05, 6.189197301864624e-05, 6.59991055727005e-05, 7.010623812675476e-05, 7.421337068080902e-05, 7.832050323486328e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 11.0, 16.0, 25.0, 38.0, 60.0, 94.0, 156.0, 327.0, 802.0, 3004.0, 20742.0, 381664.0, 599855.0, 35693.0, 4183.0, 1053.0, 360.0, 177.0, 113.0, 61.0, 38.0, 28.0, 18.0, 9.0, 8.0, 4.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0208892822265625, -0.02035510540008545, -0.0198209285736084, -0.019286751747131348, -0.018752574920654297, -0.018218398094177246, -0.017684221267700195, -0.017150044441223145, -0.016615867614746094, -0.016081690788269043, -0.015547513961791992, -0.015013337135314941, -0.01447916030883789, -0.01394498348236084, -0.013410806655883789, -0.012876629829406738, -0.012342453002929688, -0.011808276176452637, -0.011274099349975586, -0.010739922523498535, -0.010205745697021484, -0.009671568870544434, -0.009137392044067383, -0.008603215217590332, -0.008069038391113281, -0.0075348615646362305, -0.00700068473815918, -0.006466507911682129, -0.005932331085205078, -0.005398154258728027, -0.0048639774322509766, -0.004329800605773926, -0.003795623779296875, -0.0032614469528198242, -0.0027272701263427734, -0.0021930932998657227, -0.0016589164733886719, -0.001124739646911621, -0.0005905628204345703, -5.638599395751953e-05, 0.00047779083251953125, 0.001011967658996582, 0.0015461444854736328, 0.0020803213119506836, 0.0026144981384277344, 0.003148674964904785, 0.003682851791381836, 0.004217028617858887, 0.0047512054443359375, 0.005285382270812988, 0.005819559097290039, 0.00635373592376709, 0.006887912750244141, 0.007422089576721191, 0.007956266403198242, 0.008490443229675293, 0.009024620056152344, 0.009558796882629395, 0.010092973709106445, 0.010627150535583496, 0.011161327362060547, 0.011695504188537598, 0.012229681015014648, 0.0127638578414917, 0.01329803466796875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 8.0, 21.0, 25.0, 39.0, 42.0, 60.0, 84.0, 91.0, 95.0, 105.0, 109.0, 77.0, 67.0, 59.0, 35.0, 36.0, 21.0, 6.0, 11.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01519775390625, -0.01482999324798584, -0.01446223258972168, -0.01409447193145752, -0.01372671127319336, -0.0133589506149292, -0.012991189956665039, -0.012623429298400879, -0.012255668640136719, -0.011887907981872559, -0.011520147323608398, -0.011152386665344238, -0.010784626007080078, -0.010416865348815918, -0.010049104690551758, -0.009681344032287598, -0.009313583374023438, -0.008945822715759277, -0.008578062057495117, -0.008210301399230957, -0.007842540740966797, -0.007474780082702637, -0.0071070194244384766, -0.006739258766174316, -0.006371498107910156, -0.006003737449645996, -0.005635976791381836, -0.005268216133117676, -0.004900455474853516, -0.0045326948165893555, -0.004164934158325195, -0.003797173500061035, -0.003429412841796875, -0.003061652183532715, -0.0026938915252685547, -0.0023261308670043945, -0.0019583702087402344, -0.0015906095504760742, -0.001222848892211914, -0.0008550882339477539, -0.00048732757568359375, -0.0001195669174194336, 0.00024819374084472656, 0.0006159543991088867, 0.0009837150573730469, 0.001351475715637207, 0.0017192363739013672, 0.0020869970321655273, 0.0024547576904296875, 0.0028225183486938477, 0.003190279006958008, 0.003558039665222168, 0.003925800323486328, 0.004293560981750488, 0.0046613216400146484, 0.005029082298278809, 0.005396842956542969, 0.005764603614807129, 0.006132364273071289, 0.006500124931335449, 0.006867885589599609, 0.0072356462478637695, 0.00760340690612793, 0.00797116756439209, 0.00833892822265625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 10.0, 40.0, 220.0, 413.0, 249.0, 64.0, 16.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7612881064414978, -0.7459147572517395, -0.730541467666626, -0.7151681184768677, -0.6997948288917542, -0.6844214797019958, -0.6690481901168823, -0.653674840927124, -0.6383015513420105, -0.6229282021522522, -0.6075549125671387, -0.5921815633773804, -0.5768082737922668, -0.5614349246025085, -0.546061635017395, -0.5306882858276367, -0.5153149366378784, -0.4999416172504425, -0.4845682978630066, -0.4691949784755707, -0.45382165908813477, -0.43844833970069885, -0.42307502031326294, -0.40770167112350464, -0.3923283815383911, -0.3769550621509552, -0.3615817427635193, -0.3462084233760834, -0.33083510398864746, -0.31546178460121155, -0.30008846521377563, -0.28471511602401733, -0.2693418562412262, -0.2539685368537903, -0.23859521746635437, -0.22322189807891846, -0.20784857869148254, -0.19247525930404663, -0.17710192501544952, -0.1617286056280136, -0.1463552862405777, -0.13098196685314178, -0.11560864746570587, -0.10023532062768936, -0.08486200124025345, -0.06948868185281754, -0.054115355014801025, -0.03874203562736511, -0.0233687162399292, -0.007995394989848137, 0.007377926260232925, 0.022751249372959137, 0.03812456876039505, 0.05349788814783096, 0.06887121498584747, 0.08424453437328339, 0.0996178537607193, 0.11499117314815521, 0.13036449253559113, 0.14573782682418823, 0.16111114621162415, 0.17648446559906006, 0.19185778498649597, 0.20723110437393188, 0.2226044237613678]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 5.0, 6.0, 10.0, 8.0, 5.0, 11.0, 10.0, 15.0, 14.0, 12.0, 19.0, 20.0, 21.0, 20.0, 26.0, 27.0, 32.0, 28.0, 32.0, 32.0, 35.0, 44.0, 44.0, 36.0, 54.0, 46.0, 38.0, 33.0, 33.0, 27.0, 29.0, 25.0, 28.0, 25.0, 13.0, 23.0, 18.0, 12.0, 17.0, 18.0, 15.0, 6.0, 6.0, 7.0, 8.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.10703080892562866, -0.10381944477558136, -0.10060808807611465, -0.09739673137664795, -0.09418536722660065, -0.09097400307655334, -0.08776264637708664, -0.08455128967761993, -0.08133992552757263, -0.07812856137752533, -0.07491720467805862, -0.07170584797859192, -0.06849448382854462, -0.06528311967849731, -0.06207176297903061, -0.058860402554273605, -0.0556490421295166, -0.0524376817047596, -0.049226321280002594, -0.04601496085524559, -0.042803600430488586, -0.03959224000573158, -0.03638087958097458, -0.033169519156217575, -0.02995815873146057, -0.026746798306703568, -0.023535437881946564, -0.02032407745718956, -0.017112717032432556, -0.013901356607675552, -0.010689996182918549, -0.007478635758161545, -0.004267275333404541, -0.0010559149086475372, 0.0021554455161094666, 0.00536680594086647, 0.008578166365623474, 0.011789526790380478, 0.015000887215137482, 0.018212247639894485, 0.02142360806465149, 0.024634968489408493, 0.027846328914165497, 0.0310576893389225, 0.034269049763679504, 0.03748041018843651, 0.04069177061319351, 0.043903131037950516, 0.04711449146270752, 0.05032585188746452, 0.05353721231222153, 0.05674857273697853, 0.059959933161735535, 0.06317129731178284, 0.06638265401124954, 0.06959401071071625, 0.07280537486076355, 0.07601673901081085, 0.07922809571027756, 0.08243945240974426, 0.08565081655979156, 0.08886218070983887, 0.09207353740930557, 0.09528489410877228, 0.09849625825881958]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 12.0, 14.0, 10.0, 18.0, 28.0, 30.0, 38.0, 78.0, 142.0, 248.0, 400.0, 681.0, 1333.0, 2883.0, 7645.0, 34391.0, 2496242.0, 1604704.0, 31994.0, 7432.0, 2801.0, 1328.0, 684.0, 390.0, 244.0, 144.0, 108.0, 58.0, 57.0, 37.0, 21.0, 19.0, 15.0, 6.0, 11.0, 8.0, 1.0, 7.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0295867919921875, -0.028631925582885742, -0.027677059173583984, -0.026722192764282227, -0.02576732635498047, -0.02481245994567871, -0.023857593536376953, -0.022902727127075195, -0.021947860717773438, -0.02099299430847168, -0.020038127899169922, -0.019083261489868164, -0.018128395080566406, -0.01717352867126465, -0.01621866226196289, -0.015263795852661133, -0.014308929443359375, -0.013354063034057617, -0.01239919662475586, -0.011444330215454102, -0.010489463806152344, -0.009534597396850586, -0.008579730987548828, -0.00762486457824707, -0.0066699981689453125, -0.005715131759643555, -0.004760265350341797, -0.003805398941040039, -0.0028505325317382812, -0.0018956661224365234, -0.0009407997131347656, 1.4066696166992188e-05, 0.00096893310546875, 0.0019237995147705078, 0.0028786659240722656, 0.0038335323333740234, 0.004788398742675781, 0.005743265151977539, 0.006698131561279297, 0.007652997970581055, 0.008607864379882812, 0.00956273078918457, 0.010517597198486328, 0.011472463607788086, 0.012427330017089844, 0.013382196426391602, 0.01433706283569336, 0.015291929244995117, 0.016246795654296875, 0.017201662063598633, 0.01815652847290039, 0.01911139488220215, 0.020066261291503906, 0.021021127700805664, 0.021975994110107422, 0.02293086051940918, 0.023885726928710938, 0.024840593338012695, 0.025795459747314453, 0.02675032615661621, 0.02770519256591797, 0.028660058975219727, 0.029614925384521484, 0.030569791793823242, 0.031524658203125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 13.0, 16.0, 15.0, 20.0, 36.0, 40.0, 52.0, 65.0, 76.0, 60.0, 86.0, 79.0, 78.0, 63.0, 87.0, 53.0, 34.0, 33.0, 28.0, 17.0, 8.0, 12.0, 7.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0106048583984375, -0.010284423828125, -0.0099639892578125, -0.0096435546875, -0.0093231201171875, -0.009002685546875, -0.0086822509765625, -0.00836181640625, -0.0080413818359375, -0.007720947265625, -0.0074005126953125, -0.007080078125, -0.0067596435546875, -0.006439208984375, -0.0061187744140625, -0.00579833984375, -0.0054779052734375, -0.005157470703125, -0.0048370361328125, -0.0045166015625, -0.0041961669921875, -0.003875732421875, -0.0035552978515625, -0.00323486328125, -0.0029144287109375, -0.002593994140625, -0.0022735595703125, -0.001953125, -0.0016326904296875, -0.001312255859375, -0.0009918212890625, -0.00067138671875, -0.0003509521484375, -3.0517578125e-05, 0.0002899169921875, 0.0006103515625, 0.0009307861328125, 0.001251220703125, 0.0015716552734375, 0.00189208984375, 0.0022125244140625, 0.002532958984375, 0.0028533935546875, 0.003173828125, 0.0034942626953125, 0.003814697265625, 0.0041351318359375, 0.00445556640625, 0.0047760009765625, 0.005096435546875, 0.0054168701171875, 0.0057373046875, 0.0060577392578125, 0.006378173828125, 0.0066986083984375, 0.00701904296875, 0.0073394775390625, 0.007659912109375, 0.0079803466796875, 0.00830078125, 0.0086212158203125, 0.008941650390625, 0.0092620849609375, 0.00958251953125, 0.0099029541015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 15.0, 10.0, 30.0, 35.0, 48.0, 82.0, 111.0, 209.0, 377.0, 832.0, 2342.0, 8810.0, 79299.0, 3963939.0, 122603.0, 10998.0, 2618.0, 928.0, 404.0, 231.0, 125.0, 86.0, 52.0, 40.0, 16.0, 15.0, 13.0, 4.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03179931640625, -0.03075885772705078, -0.029718399047851562, -0.028677940368652344, -0.027637481689453125, -0.026597023010253906, -0.025556564331054688, -0.02451610565185547, -0.02347564697265625, -0.02243518829345703, -0.021394729614257812, -0.020354270935058594, -0.019313812255859375, -0.018273353576660156, -0.017232894897460938, -0.01619243621826172, -0.0151519775390625, -0.014111518859863281, -0.013071060180664062, -0.012030601501464844, -0.010990142822265625, -0.009949684143066406, -0.008909225463867188, -0.007868766784667969, -0.00682830810546875, -0.005787849426269531, -0.0047473907470703125, -0.0037069320678710938, -0.002666473388671875, -0.0016260147094726562, -0.0005855560302734375, 0.00045490264892578125, 0.001495361328125, 0.0025358200073242188, 0.0035762786865234375, 0.004616737365722656, 0.005657196044921875, 0.006697654724121094, 0.0077381134033203125, 0.008778572082519531, 0.00981903076171875, 0.010859489440917969, 0.011899948120117188, 0.012940406799316406, 0.013980865478515625, 0.015021324157714844, 0.016061782836914062, 0.01710224151611328, 0.0181427001953125, 0.01918315887451172, 0.020223617553710938, 0.021264076232910156, 0.022304534912109375, 0.023344993591308594, 0.024385452270507812, 0.02542591094970703, 0.02646636962890625, 0.02750682830810547, 0.028547286987304688, 0.029587745666503906, 0.030628204345703125, 0.031668663024902344, 0.03270912170410156, 0.03374958038330078, 0.0347900390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 13.0, 18.0, 44.0, 98.0, 428.0, 2772.0, 468.0, 111.0, 50.0, 28.0, 17.0, 8.0, 5.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01068115234375, -0.01007223129272461, -0.009463310241699219, -0.008854389190673828, -0.008245468139648438, -0.007636547088623047, -0.007027626037597656, -0.006418704986572266, -0.005809783935546875, -0.005200862884521484, -0.004591941833496094, -0.003983020782470703, -0.0033740997314453125, -0.002765178680419922, -0.0021562576293945312, -0.0015473365783691406, -0.00093841552734375, -0.0003294944763183594, 0.00027942657470703125, 0.0008883476257324219, 0.0014972686767578125, 0.002106189727783203, 0.0027151107788085938, 0.0033240318298339844, 0.003932952880859375, 0.004541873931884766, 0.005150794982910156, 0.005759716033935547, 0.0063686370849609375, 0.006977558135986328, 0.007586479187011719, 0.00819540023803711, 0.0088043212890625, 0.00941324234008789, 0.010022163391113281, 0.010631084442138672, 0.011240005493164062, 0.011848926544189453, 0.012457847595214844, 0.013066768646240234, 0.013675689697265625, 0.014284610748291016, 0.014893531799316406, 0.015502452850341797, 0.016111373901367188, 0.016720294952392578, 0.01732921600341797, 0.01793813705444336, 0.01854705810546875, 0.01915597915649414, 0.01976490020751953, 0.020373821258544922, 0.020982742309570312, 0.021591663360595703, 0.022200584411621094, 0.022809505462646484, 0.023418426513671875, 0.024027347564697266, 0.024636268615722656, 0.025245189666748047, 0.025854110717773438, 0.026463031768798828, 0.02707195281982422, 0.02768087387084961, 0.028289794921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 8.0, 49.0, 253.0, 471.0, 163.0, 33.0, 9.0, 1.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07124335318803787, -0.06655369699001312, -0.06186404079198837, -0.05717438459396362, -0.05248472839593887, -0.047795072197914124, -0.04310541972517967, -0.03841576352715492, -0.03372610732913017, -0.029036451131105423, -0.024346794933080673, -0.019657140597701073, -0.014967484399676323, -0.010277828201651573, -0.005588173866271973, -0.0008985176682472229, 0.003791138529777527, 0.008480794727802277, 0.013170449994504452, 0.017860105261206627, 0.022549761459231377, 0.027239417657256126, 0.03192907199263573, 0.03661872819066048, 0.041308384388685226, 0.045998040586709976, 0.050687696784734726, 0.05537734925746918, 0.06006700545549393, 0.06475666165351868, 0.06944631785154343, 0.07413597404956818, 0.07882562279701233, 0.08351527899503708, 0.08820493519306183, 0.09289459139108658, 0.09758424758911133, 0.10227390378713608, 0.10696355998516083, 0.11165320873260498, 0.11634287238121033, 0.12103252857923508, 0.12572218477725983, 0.13041183352470398, 0.13510149717330933, 0.13979114592075348, 0.14448080956935883, 0.14917045831680298, 0.15386012196540833, 0.15854977071285248, 0.16323943436145782, 0.16792908310890198, 0.17261874675750732, 0.17730839550495148, 0.18199805915355682, 0.18668770790100098, 0.19137735664844513, 0.19606700539588928, 0.20075666904449463, 0.20544631779193878, 0.21013598144054413, 0.21482563018798828, 0.21951529383659363, 0.22420494258403778, 0.22889460623264313]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 13.0, 11.0, 21.0, 34.0, 42.0, 40.0, 64.0, 67.0, 77.0, 80.0, 88.0, 82.0, 65.0, 56.0, 71.0, 48.0, 43.0, 26.0, 19.0, 11.0, 7.0, 6.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05135703086853027, -0.04979030415415764, -0.048223577439785004, -0.04665685072541237, -0.045090124011039734, -0.0435233972966671, -0.041956670582294464, -0.04038994386792183, -0.038823217153549194, -0.03725649043917656, -0.035689763724803925, -0.03412303701043129, -0.032556310296058655, -0.03098958358168602, -0.029422856867313385, -0.02785613015294075, -0.026289403438568115, -0.02472267672419548, -0.023155950009822845, -0.02158922329545021, -0.020022496581077576, -0.01845576986670494, -0.016889043152332306, -0.015322316437959671, -0.013755589723587036, -0.012188863009214401, -0.010622136294841766, -0.009055409580469131, -0.007488682866096497, -0.005921956151723862, -0.004355229437351227, -0.002788502722978592, -0.001221776008605957, 0.00034495070576667786, 0.0019116774201393127, 0.0034784041345119476, 0.0050451308488845825, 0.006611857563257217, 0.008178584277629852, 0.009745310992002487, 0.011312037706375122, 0.012878764420747757, 0.014445491135120392, 0.016012217849493027, 0.01757894456386566, 0.019145671278238297, 0.02071239799261093, 0.022279124706983566, 0.0238458514213562, 0.025412578135728836, 0.02697930485010147, 0.028546031564474106, 0.03011275827884674, 0.031679484993219376, 0.03324621170759201, 0.034812938421964645, 0.03637966513633728, 0.037946391850709915, 0.03951311856508255, 0.041079845279455185, 0.04264657199382782, 0.044213298708200455, 0.04578002542257309, 0.047346752136945724, 0.04891347885131836]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 11.0, 8.0, 30.0, 28.0, 68.0, 126.0, 245.0, 445.0, 971.0, 2325.0, 6706.0, 24331.0, 148814.0, 664139.0, 162780.0, 26040.0, 7054.0, 2429.0, 1022.0, 447.0, 231.0, 120.0, 71.0, 44.0, 19.0, 15.0, 14.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0262908935546875, -0.025429487228393555, -0.02456808090209961, -0.023706674575805664, -0.02284526824951172, -0.021983861923217773, -0.021122455596923828, -0.020261049270629883, -0.019399642944335938, -0.018538236618041992, -0.017676830291748047, -0.0168154239654541, -0.015954017639160156, -0.015092611312866211, -0.014231204986572266, -0.01336979866027832, -0.012508392333984375, -0.01164698600769043, -0.010785579681396484, -0.009924173355102539, -0.009062767028808594, -0.008201360702514648, -0.007339954376220703, -0.006478548049926758, -0.0056171417236328125, -0.004755735397338867, -0.003894329071044922, -0.0030329227447509766, -0.0021715164184570312, -0.001310110092163086, -0.0004487037658691406, 0.0004127025604248047, 0.00127410888671875, 0.0021355152130126953, 0.0029969215393066406, 0.003858327865600586, 0.004719734191894531, 0.0055811405181884766, 0.006442546844482422, 0.007303953170776367, 0.008165359497070312, 0.009026765823364258, 0.009888172149658203, 0.010749578475952148, 0.011610984802246094, 0.012472391128540039, 0.013333797454833984, 0.01419520378112793, 0.015056610107421875, 0.01591801643371582, 0.016779422760009766, 0.01764082908630371, 0.018502235412597656, 0.0193636417388916, 0.020225048065185547, 0.021086454391479492, 0.021947860717773438, 0.022809267044067383, 0.023670673370361328, 0.024532079696655273, 0.02539348602294922, 0.026254892349243164, 0.02711629867553711, 0.027977705001831055, 0.028839111328125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 17.0, 22.0, 24.0, 33.0, 49.0, 60.0, 62.0, 87.0, 78.0, 76.0, 82.0, 91.0, 76.0, 61.0, 47.0, 35.0, 21.0, 22.0, 7.0, 9.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.01198577880859375, -0.01162874698638916, -0.01127171516418457, -0.01091468334197998, -0.01055765151977539, -0.0102006196975708, -0.009843587875366211, -0.009486556053161621, -0.009129524230957031, -0.008772492408752441, -0.008415460586547852, -0.008058428764343262, -0.007701396942138672, -0.007344365119934082, -0.006987333297729492, -0.006630301475524902, -0.0062732696533203125, -0.005916237831115723, -0.005559206008911133, -0.005202174186706543, -0.004845142364501953, -0.004488110542297363, -0.0041310787200927734, -0.0037740468978881836, -0.0034170150756835938, -0.003059983253479004, -0.002702951431274414, -0.0023459196090698242, -0.0019888877868652344, -0.0016318559646606445, -0.0012748241424560547, -0.0009177923202514648, -0.000560760498046875, -0.00020372867584228516, 0.0001533031463623047, 0.0005103349685668945, 0.0008673667907714844, 0.0012243986129760742, 0.001581430435180664, 0.001938462257385254, 0.0022954940795898438, 0.0026525259017944336, 0.0030095577239990234, 0.0033665895462036133, 0.003723621368408203, 0.004080653190612793, 0.004437685012817383, 0.004794716835021973, 0.0051517486572265625, 0.005508780479431152, 0.005865812301635742, 0.006222844123840332, 0.006579875946044922, 0.006936907768249512, 0.0072939395904541016, 0.007650971412658691, 0.008008003234863281, 0.008365035057067871, 0.008722066879272461, 0.00907909870147705, 0.00943613052368164, 0.00979316234588623, 0.01015019416809082, 0.01050722599029541, 0.0108642578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 11.0, 23.0, 30.0, 21.0, 48.0, 51.0, 78.0, 103.0, 189.0, 255.0, 510.0, 1010.0, 2282.0, 6585.0, 25805.0, 147570.0, 674208.0, 152240.0, 26091.0, 6805.0, 2348.0, 962.0, 493.0, 276.0, 167.0, 114.0, 78.0, 49.0, 24.0, 29.0, 16.0, 22.0, 11.0, 8.0, 7.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0215301513671875, -0.02090620994567871, -0.020282268524169922, -0.019658327102661133, -0.019034385681152344, -0.018410444259643555, -0.017786502838134766, -0.017162561416625977, -0.016538619995117188, -0.0159146785736084, -0.01529073715209961, -0.01466679573059082, -0.014042854309082031, -0.013418912887573242, -0.012794971466064453, -0.012171030044555664, -0.011547088623046875, -0.010923147201538086, -0.010299205780029297, -0.009675264358520508, -0.009051322937011719, -0.00842738151550293, -0.007803440093994141, -0.0071794986724853516, -0.0065555572509765625, -0.0059316158294677734, -0.005307674407958984, -0.004683732986450195, -0.004059791564941406, -0.003435850143432617, -0.002811908721923828, -0.002187967300415039, -0.00156402587890625, -0.0009400844573974609, -0.0003161430358886719, 0.0003077983856201172, 0.0009317398071289062, 0.0015556812286376953, 0.0021796226501464844, 0.0028035640716552734, 0.0034275054931640625, 0.0040514469146728516, 0.004675388336181641, 0.00529932975769043, 0.005923271179199219, 0.006547212600708008, 0.007171154022216797, 0.007795095443725586, 0.008419036865234375, 0.009042978286743164, 0.009666919708251953, 0.010290861129760742, 0.010914802551269531, 0.01153874397277832, 0.01216268539428711, 0.012786626815795898, 0.013410568237304688, 0.014034509658813477, 0.014658451080322266, 0.015282392501831055, 0.015906333923339844, 0.016530275344848633, 0.017154216766357422, 0.01777815818786621, 0.018402099609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 11.0, 9.0, 6.0, 7.0, 7.0, 15.0, 18.0, 23.0, 13.0, 21.0, 24.0, 32.0, 47.0, 34.0, 51.0, 42.0, 48.0, 49.0, 49.0, 48.0, 54.0, 46.0, 49.0, 61.0, 39.0, 36.0, 34.0, 20.0, 24.0, 14.0, 11.0, 13.0, 12.0, 9.0, 4.0, 1.0, 9.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.027374267578125, -0.026536226272583008, -0.025698184967041016, -0.024860143661499023, -0.02402210235595703, -0.02318406105041504, -0.022346019744873047, -0.021507978439331055, -0.020669937133789062, -0.01983189582824707, -0.018993854522705078, -0.018155813217163086, -0.017317771911621094, -0.0164797306060791, -0.01564168930053711, -0.014803647994995117, -0.013965606689453125, -0.013127565383911133, -0.01228952407836914, -0.011451482772827148, -0.010613441467285156, -0.009775400161743164, -0.008937358856201172, -0.00809931755065918, -0.0072612762451171875, -0.006423234939575195, -0.005585193634033203, -0.004747152328491211, -0.003909111022949219, -0.0030710697174072266, -0.0022330284118652344, -0.0013949871063232422, -0.00055694580078125, 0.0002810955047607422, 0.0011191368103027344, 0.0019571781158447266, 0.0027952194213867188, 0.003633260726928711, 0.004471302032470703, 0.005309343338012695, 0.0061473846435546875, 0.00698542594909668, 0.007823467254638672, 0.008661508560180664, 0.009499549865722656, 0.010337591171264648, 0.01117563247680664, 0.012013673782348633, 0.012851715087890625, 0.013689756393432617, 0.01452779769897461, 0.015365839004516602, 0.016203880310058594, 0.017041921615600586, 0.017879962921142578, 0.01871800422668457, 0.019556045532226562, 0.020394086837768555, 0.021232128143310547, 0.02207016944885254, 0.02290821075439453, 0.023746252059936523, 0.024584293365478516, 0.025422334671020508, 0.0262603759765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 5.0, 2.0, 1.0, 4.0, 6.0, 10.0, 21.0, 31.0, 38.0, 90.0, 148.0, 306.0, 776.0, 3190.0, 55984.0, 950201.0, 33840.0, 2586.0, 689.0, 298.0, 118.0, 84.0, 52.0, 21.0, 20.0, 20.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0285491943359375, -0.027843236923217773, -0.027137279510498047, -0.02643132209777832, -0.025725364685058594, -0.025019407272338867, -0.02431344985961914, -0.023607492446899414, -0.022901535034179688, -0.02219557762145996, -0.021489620208740234, -0.020783662796020508, -0.02007770538330078, -0.019371747970581055, -0.018665790557861328, -0.0179598331451416, -0.017253875732421875, -0.01654791831970215, -0.015841960906982422, -0.015136003494262695, -0.014430046081542969, -0.013724088668823242, -0.013018131256103516, -0.012312173843383789, -0.011606216430664062, -0.010900259017944336, -0.01019430160522461, -0.009488344192504883, -0.008782386779785156, -0.00807642936706543, -0.007370471954345703, -0.0066645145416259766, -0.00595855712890625, -0.0052525997161865234, -0.004546642303466797, -0.0038406848907470703, -0.0031347274780273438, -0.002428770065307617, -0.0017228126525878906, -0.001016855239868164, -0.0003108978271484375, 0.00039505958557128906, 0.0011010169982910156, 0.0018069744110107422, 0.0025129318237304688, 0.0032188892364501953, 0.003924846649169922, 0.0046308040618896484, 0.005336761474609375, 0.0060427188873291016, 0.006748676300048828, 0.007454633712768555, 0.008160591125488281, 0.008866548538208008, 0.009572505950927734, 0.010278463363647461, 0.010984420776367188, 0.011690378189086914, 0.01239633560180664, 0.013102293014526367, 0.013808250427246094, 0.01451420783996582, 0.015220165252685547, 0.015926122665405273, 0.016632080078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 7.0, 15.0, 10.0, 20.0, 28.0, 20.0, 41.0, 44.0, 63.0, 70.0, 87.0, 92.0, 90.0, 93.0, 78.0, 55.0, 37.0, 37.0, 33.0, 25.0, 17.0, 11.0, 7.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.516145706176758e-05, -7.336307317018509e-05, -7.15646892786026e-05, -6.976630538702011e-05, -6.796792149543762e-05, -6.616953760385513e-05, -6.437115371227264e-05, -6.257276982069016e-05, -6.0774385929107666e-05, -5.897600203752518e-05, -5.717761814594269e-05, -5.53792342543602e-05, -5.358085036277771e-05, -5.178246647119522e-05, -4.998408257961273e-05, -4.818569868803024e-05, -4.6387314796447754e-05, -4.4588930904865265e-05, -4.2790547013282776e-05, -4.099216312170029e-05, -3.91937792301178e-05, -3.739539533853531e-05, -3.559701144695282e-05, -3.379862755537033e-05, -3.200024366378784e-05, -3.0201859772205353e-05, -2.8403475880622864e-05, -2.6605091989040375e-05, -2.4806708097457886e-05, -2.3008324205875397e-05, -2.1209940314292908e-05, -1.941155642271042e-05, -1.761317253112793e-05, -1.581478863954544e-05, -1.4016404747962952e-05, -1.2218020856380463e-05, -1.0419636964797974e-05, -8.621253073215485e-06, -6.822869181632996e-06, -5.024485290050507e-06, -3.2261013984680176e-06, -1.4277175068855286e-06, 3.7066638469696045e-07, 2.1690502762794495e-06, 3.9674341678619385e-06, 5.7658180594444275e-06, 7.5642019510269165e-06, 9.362585842609406e-06, 1.1160969734191895e-05, 1.2959353625774384e-05, 1.4757737517356873e-05, 1.655612140893936e-05, 1.835450530052185e-05, 2.015288919210434e-05, 2.195127308368683e-05, 2.3749656975269318e-05, 2.5548040866851807e-05, 2.7346424758434296e-05, 2.9144808650016785e-05, 3.0943192541599274e-05, 3.274157643318176e-05, 3.453996032476425e-05, 3.633834421634674e-05, 3.813672810792923e-05, 3.993511199951172e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 5.0, 4.0, 6.0, 14.0, 11.0, 22.0, 44.0, 106.0, 224.0, 571.0, 2224.0, 20108.0, 785772.0, 230656.0, 6886.0, 1214.0, 370.0, 137.0, 83.0, 39.0, 26.0, 12.0, 8.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02301025390625, -0.02240157127380371, -0.021792888641357422, -0.021184206008911133, -0.020575523376464844, -0.019966840744018555, -0.019358158111572266, -0.018749475479125977, -0.018140792846679688, -0.0175321102142334, -0.01692342758178711, -0.01631474494934082, -0.01570606231689453, -0.015097379684448242, -0.014488697052001953, -0.013880014419555664, -0.013271331787109375, -0.012662649154663086, -0.012053966522216797, -0.011445283889770508, -0.010836601257324219, -0.01022791862487793, -0.00961923599243164, -0.009010553359985352, -0.008401870727539062, -0.0077931880950927734, -0.007184505462646484, -0.006575822830200195, -0.005967140197753906, -0.005358457565307617, -0.004749774932861328, -0.004141092300415039, -0.00353240966796875, -0.002923727035522461, -0.002315044403076172, -0.0017063617706298828, -0.0010976791381835938, -0.0004889965057373047, 0.00011968612670898438, 0.0007283687591552734, 0.0013370513916015625, 0.0019457340240478516, 0.0025544166564941406, 0.0031630992889404297, 0.0037717819213867188, 0.004380464553833008, 0.004989147186279297, 0.005597829818725586, 0.006206512451171875, 0.006815195083618164, 0.007423877716064453, 0.008032560348510742, 0.008641242980957031, 0.00924992561340332, 0.00985860824584961, 0.010467290878295898, 0.011075973510742188, 0.011684656143188477, 0.012293338775634766, 0.012902021408081055, 0.013510704040527344, 0.014119386672973633, 0.014728069305419922, 0.015336751937866211, 0.0159454345703125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 9.0, 21.0, 49.0, 131.0, 240.0, 257.0, 161.0, 65.0, 26.0, 8.0, 7.0, 4.0, 5.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0288543701171875, -0.028097152709960938, -0.027339935302734375, -0.026582717895507812, -0.02582550048828125, -0.025068283081054688, -0.024311065673828125, -0.023553848266601562, -0.022796630859375, -0.022039413452148438, -0.021282196044921875, -0.020524978637695312, -0.01976776123046875, -0.019010543823242188, -0.018253326416015625, -0.017496109008789062, -0.0167388916015625, -0.015981674194335938, -0.015224456787109375, -0.014467239379882812, -0.01371002197265625, -0.012952804565429688, -0.012195587158203125, -0.011438369750976562, -0.01068115234375, -0.009923934936523438, -0.009166717529296875, -0.008409500122070312, -0.00765228271484375, -0.0068950653076171875, -0.006137847900390625, -0.0053806304931640625, -0.0046234130859375, -0.0038661956787109375, -0.003108978271484375, -0.0023517608642578125, -0.00159454345703125, -0.0008373260498046875, -8.0108642578125e-05, 0.0006771087646484375, 0.001434326171875, 0.0021915435791015625, 0.002948760986328125, 0.0037059783935546875, 0.00446319580078125, 0.0052204132080078125, 0.005977630615234375, 0.0067348480224609375, 0.0074920654296875, 0.008249282836914062, 0.009006500244140625, 0.009763717651367188, 0.01052093505859375, 0.011278152465820312, 0.012035369873046875, 0.012792587280273438, 0.0135498046875, 0.014307022094726562, 0.015064239501953125, 0.015821456909179688, 0.01657867431640625, 0.017335891723632812, 0.018093109130859375, 0.018850326538085938, 0.0196075439453125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 9.0, 14.0, 53.0, 200.0, 378.0, 254.0, 76.0, 19.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.6090952157974243, -0.5977507829666138, -0.5864062905311584, -0.5750618577003479, -0.5637174248695374, -0.5523729920387268, -0.5410284996032715, -0.5296840667724609, -0.5183396339416504, -0.5069952011108398, -0.4956507384777069, -0.484306275844574, -0.4729618430137634, -0.4616173803806305, -0.45027291774749756, -0.438928484916687, -0.4275840222835541, -0.41623955965042114, -0.4048951268196106, -0.39355066418647766, -0.3822062313556671, -0.3708617687225342, -0.35951733589172363, -0.3481728732585907, -0.33682841062545776, -0.32548394799232483, -0.3141395151615143, -0.30279505252838135, -0.2914506196975708, -0.28010615706443787, -0.26876169443130493, -0.2574172616004944, -0.24607279896736145, -0.2347283512353897, -0.22338390350341797, -0.21203944087028503, -0.2006950080394745, -0.18935054540634155, -0.1780060976743698, -0.16666164994239807, -0.15531720221042633, -0.1439727544784546, -0.13262830674648285, -0.12128385156393051, -0.10993940383195877, -0.09859495609998703, -0.08725050091743469, -0.07590605318546295, -0.06456160545349121, -0.05321715772151947, -0.04187270626425743, -0.030528254806995392, -0.01918380707502365, -0.00783935934305191, 0.0035050958395004272, 0.014849543571472168, 0.02619399130344391, 0.03753843903541565, 0.04888289049267769, 0.06022734194993973, 0.07157178968191147, 0.08291623741388321, 0.09426069259643555, 0.10560514032840729, 0.11694958806037903]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 7.0, 6.0, 7.0, 1.0, 15.0, 11.0, 13.0, 18.0, 17.0, 17.0, 23.0, 25.0, 24.0, 37.0, 34.0, 38.0, 39.0, 36.0, 28.0, 35.0, 59.0, 48.0, 45.0, 52.0, 37.0, 44.0, 37.0, 30.0, 24.0, 24.0, 17.0, 22.0, 26.0, 16.0, 18.0, 15.0, 14.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12144136428833008, -0.1178487241268158, -0.11425607651472092, -0.11066343635320663, -0.10707078874111176, -0.10347814857959747, -0.09988550841808319, -0.09629286825656891, -0.09270022064447403, -0.08910758048295975, -0.08551493287086487, -0.08192229270935059, -0.0783296525478363, -0.07473700493574142, -0.07114436477422714, -0.06755171716213226, -0.06395907700061798, -0.0603664331138134, -0.05677378922700882, -0.05318114906549454, -0.04958850517868996, -0.045995861291885376, -0.042403221130371094, -0.03881057724356651, -0.03521793335676193, -0.03162528946995735, -0.02803264744579792, -0.02444000542163849, -0.020847361534833908, -0.017254717648029327, -0.013662075623869896, -0.010069433599710464, -0.006476789712905884, -0.0028841467574238777, 0.0007084961980581284, 0.004301139153540134, 0.00789378210902214, 0.011486425995826721, 0.015079068019986153, 0.018671710044145584, 0.022264353930950165, 0.025856997817754745, 0.029449639841914177, 0.03304228186607361, 0.03663492575287819, 0.04022756963968277, 0.04382020980119705, 0.04741285368800163, 0.05100549757480621, 0.054598141461610794, 0.058190785348415375, 0.06178342550992966, 0.06537607312202454, 0.06896871328353882, 0.0725613534450531, 0.07615399360656738, 0.07974664121866226, 0.08333928138017654, 0.08693192899227142, 0.0905245691537857, 0.09411720931529999, 0.09770985692739487, 0.10130249708890915, 0.10489514470100403, 0.10848778486251831]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 10.0, 14.0, 27.0, 27.0, 51.0, 72.0, 90.0, 140.0, 196.0, 284.0, 479.0, 1079.0, 5532.0, 288604.0, 3886530.0, 8139.0, 1398.0, 592.0, 329.0, 216.0, 159.0, 92.0, 68.0, 50.0, 29.0, 24.0, 15.0, 5.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0272064208984375, -0.025915861129760742, -0.024625301361083984, -0.023334741592407227, -0.02204418182373047, -0.02075362205505371, -0.019463062286376953, -0.018172502517700195, -0.016881942749023438, -0.01559138298034668, -0.014300823211669922, -0.013010263442993164, -0.011719703674316406, -0.010429143905639648, -0.00913858413696289, -0.007848024368286133, -0.006557464599609375, -0.005266904830932617, -0.003976345062255859, -0.0026857852935791016, -0.0013952255249023438, -0.00010466575622558594, 0.0011858940124511719, 0.0024764537811279297, 0.0037670135498046875, 0.005057573318481445, 0.006348133087158203, 0.007638692855834961, 0.008929252624511719, 0.010219812393188477, 0.011510372161865234, 0.012800931930541992, 0.01409149169921875, 0.015382051467895508, 0.016672611236572266, 0.017963171005249023, 0.01925373077392578, 0.02054429054260254, 0.021834850311279297, 0.023125410079956055, 0.024415969848632812, 0.02570652961730957, 0.026997089385986328, 0.028287649154663086, 0.029578208923339844, 0.0308687686920166, 0.03215932846069336, 0.03344988822937012, 0.034740447998046875, 0.03603100776672363, 0.03732156753540039, 0.03861212730407715, 0.039902687072753906, 0.041193246841430664, 0.04248380661010742, 0.04377436637878418, 0.04506492614746094, 0.046355485916137695, 0.04764604568481445, 0.04893660545349121, 0.05022716522216797, 0.05151772499084473, 0.052808284759521484, 0.05409884452819824, 0.055389404296875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 8.0, 10.0, 17.0, 23.0, 29.0, 30.0, 53.0, 61.0, 78.0, 89.0, 73.0, 84.0, 95.0, 75.0, 63.0, 54.0, 48.0, 25.0, 28.0, 10.0, 10.0, 5.0, 14.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0119171142578125, -0.01154792308807373, -0.011178731918334961, -0.010809540748596191, -0.010440349578857422, -0.010071158409118652, -0.009701967239379883, -0.009332776069641113, -0.008963584899902344, -0.008594393730163574, -0.008225202560424805, -0.007856011390686035, -0.007486820220947266, -0.007117629051208496, -0.0067484378814697266, -0.006379246711730957, -0.0060100555419921875, -0.005640864372253418, -0.0052716732025146484, -0.004902482032775879, -0.004533290863037109, -0.00416409969329834, -0.0037949085235595703, -0.0034257173538208008, -0.0030565261840820312, -0.0026873350143432617, -0.002318143844604492, -0.0019489526748657227, -0.0015797615051269531, -0.0012105703353881836, -0.0008413791656494141, -0.00047218799591064453, -0.000102996826171875, 0.00026619434356689453, 0.0006353855133056641, 0.0010045766830444336, 0.0013737678527832031, 0.0017429590225219727, 0.002112150192260742, 0.0024813413619995117, 0.0028505325317382812, 0.0032197237014770508, 0.0035889148712158203, 0.00395810604095459, 0.004327297210693359, 0.004696488380432129, 0.0050656795501708984, 0.005434870719909668, 0.0058040618896484375, 0.006173253059387207, 0.0065424442291259766, 0.006911635398864746, 0.007280826568603516, 0.007650017738342285, 0.008019208908081055, 0.008388400077819824, 0.008757591247558594, 0.009126782417297363, 0.009495973587036133, 0.009865164756774902, 0.010234355926513672, 0.010603547096252441, 0.010972738265991211, 0.01134192943572998, 0.01171112060546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 8.0, 9.0, 11.0, 17.0, 34.0, 44.0, 70.0, 103.0, 172.0, 350.0, 846.0, 2712.0, 17414.0, 3924044.0, 235864.0, 9459.0, 1868.0, 594.0, 259.0, 135.0, 104.0, 58.0, 41.0, 25.0, 14.0, 9.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0237274169921875, -0.02284407615661621, -0.021960735321044922, -0.021077394485473633, -0.020194053649902344, -0.019310712814331055, -0.018427371978759766, -0.017544031143188477, -0.016660690307617188, -0.0157773494720459, -0.01489400863647461, -0.01401066780090332, -0.013127326965332031, -0.012243986129760742, -0.011360645294189453, -0.010477304458618164, -0.009593963623046875, -0.008710622787475586, -0.007827281951904297, -0.006943941116333008, -0.006060600280761719, -0.00517725944519043, -0.004293918609619141, -0.0034105777740478516, -0.0025272369384765625, -0.0016438961029052734, -0.0007605552673339844, 0.0001227855682373047, 0.0010061264038085938, 0.0018894672393798828, 0.002772808074951172, 0.003656148910522461, 0.00453948974609375, 0.005422830581665039, 0.006306171417236328, 0.007189512252807617, 0.008072853088378906, 0.008956193923950195, 0.009839534759521484, 0.010722875595092773, 0.011606216430664062, 0.012489557266235352, 0.01337289810180664, 0.01425623893737793, 0.015139579772949219, 0.016022920608520508, 0.016906261444091797, 0.017789602279663086, 0.018672943115234375, 0.019556283950805664, 0.020439624786376953, 0.021322965621948242, 0.02220630645751953, 0.02308964729309082, 0.02397298812866211, 0.0248563289642334, 0.025739669799804688, 0.026623010635375977, 0.027506351470947266, 0.028389692306518555, 0.029273033142089844, 0.030156373977661133, 0.031039714813232422, 0.03192305564880371, 0.032806396484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 11.0, 20.0, 37.0, 110.0, 585.0, 3111.0, 112.0, 42.0, 22.0, 12.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002635955810546875, -0.0024725794792175293, -0.0023092031478881836, -0.002145826816558838, -0.001982450485229492, -0.0018190741539001465, -0.0016556978225708008, -0.001492321491241455, -0.0013289451599121094, -0.0011655688285827637, -0.001002192497253418, -0.0008388161659240723, -0.0006754398345947266, -0.0005120635032653809, -0.00034868717193603516, -0.00018531084060668945, -2.193450927734375e-05, 0.00014144182205200195, 0.00030481815338134766, 0.00046819448471069336, 0.0006315708160400391, 0.0007949471473693848, 0.0009583234786987305, 0.0011216998100280762, 0.0012850761413574219, 0.0014484524726867676, 0.0016118288040161133, 0.001775205135345459, 0.0019385814666748047, 0.0021019577980041504, 0.002265334129333496, 0.002428710460662842, 0.0025920867919921875, 0.002755463123321533, 0.002918839454650879, 0.0030822157859802246, 0.0032455921173095703, 0.003408968448638916, 0.0035723447799682617, 0.0037357211112976074, 0.003899097442626953, 0.004062473773956299, 0.0042258501052856445, 0.00438922643661499, 0.004552602767944336, 0.004715979099273682, 0.004879355430603027, 0.005042731761932373, 0.005206108093261719, 0.0053694844245910645, 0.00553286075592041, 0.005696237087249756, 0.0058596134185791016, 0.006022989749908447, 0.006186366081237793, 0.006349742412567139, 0.006513118743896484, 0.00667649507522583, 0.006839871406555176, 0.0070032477378845215, 0.007166624069213867, 0.007330000400543213, 0.007493376731872559, 0.007656753063201904, 0.00782012939453125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 15.0, 60.0, 186.0, 283.0, 275.0, 124.0, 42.0, 12.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014445389620959759, -0.013472361490130424, -0.012499332427978516, -0.011526304297149181, -0.010553276166319847, -0.009580247104167938, -0.008607218973338604, -0.007634190376847982, -0.006661161780357361, -0.005688133183866739, -0.004715104587376118, -0.0037420764565467834, -0.002769047860056162, -0.0017960192635655403, -0.0008229911327362061, 0.0001500374637544155, 0.001123066060245037, 0.0020960946567356586, 0.0030691230203956366, 0.0040421513840556145, 0.005015179980546236, 0.005988208577036858, 0.006961236707866192, 0.007934264838695526, 0.008907293900847435, 0.00988032203167677, 0.010853351093828678, 0.011826379224658012, 0.012799408286809921, 0.013772436417639256, 0.01474546454846859, 0.0157184936106205, 0.01669152081012726, 0.017664549872279167, 0.018637577071785927, 0.019610606133937836, 0.020583635196089745, 0.021556664258241653, 0.022529691457748413, 0.023502720519900322, 0.02447574958205223, 0.02544877864420414, 0.0264218058437109, 0.027394834905862808, 0.028367863968014717, 0.029340893030166626, 0.030313920229673386, 0.031286947429180145, 0.0322599783539772, 0.03323300555348396, 0.03420603647828102, 0.03517906367778778, 0.03615209087729454, 0.0371251218020916, 0.03809814900159836, 0.03907117620110512, 0.04004420340061188, 0.04101723060011864, 0.041990261524915695, 0.042963288724422455, 0.043936315923929214, 0.04490934684872627, 0.04588237404823303, 0.04685540124773979, 0.04782843217253685]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 4.0, 6.0, 6.0, 7.0, 9.0, 18.0, 10.0, 13.0, 20.0, 27.0, 27.0, 34.0, 32.0, 25.0, 30.0, 44.0, 54.0, 39.0, 38.0, 44.0, 42.0, 31.0, 43.0, 38.0, 38.0, 21.0, 27.0, 35.0, 38.0, 17.0, 22.0, 23.0, 21.0, 16.0, 19.0, 13.0, 18.0, 13.0, 3.0, 5.0, 2.0, 4.0, 5.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.005124390125274658, -0.004947606474161148, -0.004770822823047638, -0.004594039171934128, -0.004417255520820618, -0.0042404718697071075, -0.004063688218593597, -0.0038869045674800873, -0.003710120916366577, -0.003533337265253067, -0.003356553614139557, -0.0031797699630260468, -0.0030029863119125366, -0.0028262026607990265, -0.0026494190096855164, -0.0024726353585720062, -0.002295851707458496, -0.002119068056344986, -0.0019422844052314758, -0.0017655007541179657, -0.0015887171030044556, -0.0014119334518909454, -0.0012351498007774353, -0.0010583661496639252, -0.000881582498550415, -0.0007047988474369049, -0.0005280151963233948, -0.00035123154520988464, -0.0001744478940963745, 2.33575701713562e-06, 0.00017911940813064575, 0.0003559030592441559, 0.000532686710357666, 0.0007094703614711761, 0.0008862540125846863, 0.0010630376636981964, 0.0012398213148117065, 0.0014166049659252167, 0.0015933886170387268, 0.001770172268152237, 0.001946955919265747, 0.002123739570379257, 0.0023005232214927673, 0.0024773068726062775, 0.0026540905237197876, 0.0028308741748332977, 0.003007657825946808, 0.003184441477060318, 0.003361225128173828, 0.0035380087792873383, 0.0037147924304008484, 0.0038915760815143585, 0.004068359732627869, 0.004245143383741379, 0.004421927034854889, 0.004598710685968399, 0.004775494337081909, 0.004952277988195419, 0.0051290616393089294, 0.00530584529042244, 0.00548262894153595, 0.00565941259264946, 0.00583619624376297, 0.00601297989487648, 0.00618976354598999]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 6.0, 11.0, 19.0, 31.0, 63.0, 97.0, 148.0, 307.0, 646.0, 1400.0, 3678.0, 12006.0, 51816.0, 295143.0, 526358.0, 122334.0, 23720.0, 6539.0, 2273.0, 951.0, 488.0, 207.0, 126.0, 68.0, 43.0, 20.0, 14.0, 14.0, 7.0, 5.0, 3.0, 0.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0216217041015625, -0.020929813385009766, -0.02023792266845703, -0.019546031951904297, -0.018854141235351562, -0.018162250518798828, -0.017470359802246094, -0.01677846908569336, -0.016086578369140625, -0.01539468765258789, -0.014702796936035156, -0.014010906219482422, -0.013319015502929688, -0.012627124786376953, -0.011935234069824219, -0.011243343353271484, -0.01055145263671875, -0.009859561920166016, -0.009167671203613281, -0.008475780487060547, -0.0077838897705078125, -0.007091999053955078, -0.006400108337402344, -0.005708217620849609, -0.005016326904296875, -0.004324436187744141, -0.0036325454711914062, -0.002940654754638672, -0.0022487640380859375, -0.0015568733215332031, -0.0008649826049804688, -0.00017309188842773438, 0.000518798828125, 0.0012106895446777344, 0.0019025802612304688, 0.002594470977783203, 0.0032863616943359375, 0.003978252410888672, 0.004670143127441406, 0.005362033843994141, 0.006053924560546875, 0.006745815277099609, 0.007437705993652344, 0.008129596710205078, 0.008821487426757812, 0.009513378143310547, 0.010205268859863281, 0.010897159576416016, 0.01158905029296875, 0.012280941009521484, 0.012972831726074219, 0.013664722442626953, 0.014356613159179688, 0.015048503875732422, 0.015740394592285156, 0.01643228530883789, 0.017124176025390625, 0.01781606674194336, 0.018507957458496094, 0.019199848175048828, 0.019891738891601562, 0.020583629608154297, 0.02127552032470703, 0.021967411041259766, 0.0226593017578125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 8.0, 14.0, 17.0, 23.0, 28.0, 38.0, 48.0, 64.0, 66.0, 74.0, 71.0, 100.0, 83.0, 81.0, 63.0, 57.0, 42.0, 29.0, 29.0, 10.0, 15.0, 6.0, 14.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.011871337890625, -0.011504530906677246, -0.011137723922729492, -0.010770916938781738, -0.010404109954833984, -0.01003730297088623, -0.009670495986938477, -0.009303689002990723, -0.008936882019042969, -0.008570075035095215, -0.008203268051147461, -0.007836461067199707, -0.007469654083251953, -0.007102847099304199, -0.006736040115356445, -0.006369233131408691, -0.0060024261474609375, -0.005635619163513184, -0.00526881217956543, -0.004902005195617676, -0.004535198211669922, -0.004168391227722168, -0.003801584243774414, -0.00343477725982666, -0.0030679702758789062, -0.0027011632919311523, -0.0023343563079833984, -0.0019675493240356445, -0.0016007423400878906, -0.0012339353561401367, -0.0008671283721923828, -0.0005003213882446289, -0.000133514404296875, 0.0002332925796508789, 0.0006000995635986328, 0.0009669065475463867, 0.0013337135314941406, 0.0017005205154418945, 0.0020673274993896484, 0.0024341344833374023, 0.0028009414672851562, 0.00316774845123291, 0.003534555435180664, 0.003901362419128418, 0.004268169403076172, 0.004634976387023926, 0.00500178337097168, 0.005368590354919434, 0.0057353973388671875, 0.006102204322814941, 0.006469011306762695, 0.006835818290710449, 0.007202625274658203, 0.007569432258605957, 0.007936239242553711, 0.008303046226501465, 0.008669853210449219, 0.009036660194396973, 0.009403467178344727, 0.00977027416229248, 0.010137081146240234, 0.010503888130187988, 0.010870695114135742, 0.011237502098083496, 0.01160430908203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 7.0, 9.0, 18.0, 18.0, 18.0, 32.0, 28.0, 51.0, 40.0, 69.0, 82.0, 122.0, 183.0, 293.0, 618.0, 1310.0, 3445.0, 11023.0, 44694.0, 269462.0, 574229.0, 110190.0, 22139.0, 6177.0, 2172.0, 837.0, 384.0, 260.0, 153.0, 125.0, 76.0, 64.0, 51.0, 35.0, 25.0, 23.0, 12.0, 16.0, 10.0, 11.0, 8.0, 4.0, 7.0, 0.0, 7.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.0186614990234375, -0.018132328987121582, -0.017603158950805664, -0.017073988914489746, -0.016544818878173828, -0.01601564884185791, -0.015486478805541992, -0.014957308769226074, -0.014428138732910156, -0.013898968696594238, -0.01336979866027832, -0.012840628623962402, -0.012311458587646484, -0.011782288551330566, -0.011253118515014648, -0.01072394847869873, -0.010194778442382812, -0.009665608406066895, -0.009136438369750977, -0.008607268333435059, -0.00807809829711914, -0.007548928260803223, -0.007019758224487305, -0.006490588188171387, -0.005961418151855469, -0.005432248115539551, -0.004903078079223633, -0.004373908042907715, -0.003844738006591797, -0.003315567970275879, -0.002786397933959961, -0.002257227897644043, -0.001728057861328125, -0.001198887825012207, -0.0006697177886962891, -0.0001405477523803711, 0.0003886222839355469, 0.0009177923202514648, 0.0014469623565673828, 0.0019761323928833008, 0.0025053024291992188, 0.0030344724655151367, 0.0035636425018310547, 0.004092812538146973, 0.004621982574462891, 0.005151152610778809, 0.0056803226470947266, 0.0062094926834106445, 0.0067386627197265625, 0.0072678327560424805, 0.0077970027923583984, 0.008326172828674316, 0.008855342864990234, 0.009384512901306152, 0.00991368293762207, 0.010442852973937988, 0.010972023010253906, 0.011501193046569824, 0.012030363082885742, 0.01255953311920166, 0.013088703155517578, 0.013617873191833496, 0.014147043228149414, 0.014676213264465332, 0.01520538330078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 6.0, 4.0, 13.0, 6.0, 13.0, 20.0, 21.0, 23.0, 34.0, 26.0, 39.0, 32.0, 37.0, 40.0, 53.0, 43.0, 44.0, 51.0, 46.0, 43.0, 42.0, 40.0, 49.0, 29.0, 25.0, 37.0, 31.0, 27.0, 22.0, 17.0, 13.0, 16.0, 11.0, 7.0, 5.0, 8.0, 10.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0249176025390625, -0.0241391658782959, -0.023360729217529297, -0.022582292556762695, -0.021803855895996094, -0.021025419235229492, -0.02024698257446289, -0.01946854591369629, -0.018690109252929688, -0.017911672592163086, -0.017133235931396484, -0.016354799270629883, -0.015576362609863281, -0.01479792594909668, -0.014019489288330078, -0.013241052627563477, -0.012462615966796875, -0.011684179306030273, -0.010905742645263672, -0.01012730598449707, -0.009348869323730469, -0.008570432662963867, -0.007791996002197266, -0.007013559341430664, -0.0062351226806640625, -0.005456686019897461, -0.004678249359130859, -0.003899812698364258, -0.0031213760375976562, -0.0023429393768310547, -0.0015645027160644531, -0.0007860660552978516, -7.62939453125e-06, 0.0007708072662353516, 0.0015492439270019531, 0.0023276805877685547, 0.0031061172485351562, 0.003884553909301758, 0.004662990570068359, 0.005441427230834961, 0.0062198638916015625, 0.006998300552368164, 0.007776737213134766, 0.008555173873901367, 0.009333610534667969, 0.01011204719543457, 0.010890483856201172, 0.011668920516967773, 0.012447357177734375, 0.013225793838500977, 0.014004230499267578, 0.01478266716003418, 0.015561103820800781, 0.016339540481567383, 0.017117977142333984, 0.017896413803100586, 0.018674850463867188, 0.01945328712463379, 0.02023172378540039, 0.021010160446166992, 0.021788597106933594, 0.022567033767700195, 0.023345470428466797, 0.0241239070892334, 0.02490234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 11.0, 14.0, 12.0, 26.0, 15.0, 34.0, 62.0, 95.0, 117.0, 191.0, 298.0, 512.0, 946.0, 1720.0, 3780.0, 9064.0, 25353.0, 80406.0, 279222.0, 429702.0, 147974.0, 43308.0, 14624.0, 5484.0, 2650.0, 1208.0, 637.0, 369.0, 257.0, 161.0, 87.0, 58.0, 45.0, 33.0, 22.0, 13.0, 10.0, 12.0, 2.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004711151123046875, -0.004560351371765137, -0.0044095516204833984, -0.00425875186920166, -0.004107952117919922, -0.003957152366638184, -0.0038063526153564453, -0.003655552864074707, -0.0035047531127929688, -0.0033539533615112305, -0.003203153610229492, -0.003052353858947754, -0.0029015541076660156, -0.0027507543563842773, -0.002599954605102539, -0.0024491548538208008, -0.0022983551025390625, -0.0021475553512573242, -0.001996755599975586, -0.0018459558486938477, -0.0016951560974121094, -0.001544356346130371, -0.0013935565948486328, -0.0012427568435668945, -0.0010919570922851562, -0.000941157341003418, -0.0007903575897216797, -0.0006395578384399414, -0.0004887580871582031, -0.00033795833587646484, -0.00018715858459472656, -3.635883331298828e-05, 0.00011444091796875, 0.0002652406692504883, 0.00041604042053222656, 0.0005668401718139648, 0.0007176399230957031, 0.0008684396743774414, 0.0010192394256591797, 0.001170039176940918, 0.0013208389282226562, 0.0014716386795043945, 0.0016224384307861328, 0.001773238182067871, 0.0019240379333496094, 0.0020748376846313477, 0.002225637435913086, 0.0023764371871948242, 0.0025272369384765625, 0.0026780366897583008, 0.002828836441040039, 0.0029796361923217773, 0.0031304359436035156, 0.003281235694885254, 0.003432035446166992, 0.0035828351974487305, 0.0037336349487304688, 0.003884434700012207, 0.004035234451293945, 0.004186034202575684, 0.004336833953857422, 0.00448763370513916, 0.0046384334564208984, 0.004789233207702637, 0.004940032958984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 8.0, 2.0, 14.0, 12.0, 12.0, 21.0, 20.0, 23.0, 36.0, 41.0, 47.0, 67.0, 71.0, 75.0, 64.0, 67.0, 68.0, 54.0, 47.0, 39.0, 41.0, 24.0, 33.0, 12.0, 22.0, 27.0, 10.0, 11.0, 4.0, 10.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.839897155761719e-05, -4.697777330875397e-05, -4.555657505989075e-05, -4.413537681102753e-05, -4.271417856216431e-05, -4.1292980313301086e-05, -3.9871782064437866e-05, -3.8450583815574646e-05, -3.7029385566711426e-05, -3.5608187317848206e-05, -3.4186989068984985e-05, -3.2765790820121765e-05, -3.1344592571258545e-05, -2.9923394322395325e-05, -2.8502196073532104e-05, -2.7080997824668884e-05, -2.5659799575805664e-05, -2.4238601326942444e-05, -2.2817403078079224e-05, -2.1396204829216003e-05, -1.9975006580352783e-05, -1.8553808331489563e-05, -1.7132610082626343e-05, -1.5711411833763123e-05, -1.4290213584899902e-05, -1.2869015336036682e-05, -1.1447817087173462e-05, -1.0026618838310242e-05, -8.605420589447021e-06, -7.184222340583801e-06, -5.763024091720581e-06, -4.341825842857361e-06, -2.9206275939941406e-06, -1.4994293451309204e-06, -7.82310962677002e-08, 1.34296715259552e-06, 2.7641654014587402e-06, 4.1853636503219604e-06, 5.606561899185181e-06, 7.027760148048401e-06, 8.448958396911621e-06, 9.870156645774841e-06, 1.1291354894638062e-05, 1.2712553143501282e-05, 1.4133751392364502e-05, 1.5554949641227722e-05, 1.6976147890090942e-05, 1.8397346138954163e-05, 1.9818544387817383e-05, 2.1239742636680603e-05, 2.2660940885543823e-05, 2.4082139134407043e-05, 2.5503337383270264e-05, 2.6924535632133484e-05, 2.8345733880996704e-05, 2.9766932129859924e-05, 3.1188130378723145e-05, 3.2609328627586365e-05, 3.4030526876449585e-05, 3.5451725125312805e-05, 3.6872923374176025e-05, 3.8294121623039246e-05, 3.9715319871902466e-05, 4.1136518120765686e-05, 4.2557716369628906e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 10.0, 9.0, 20.0, 40.0, 56.0, 116.0, 206.0, 454.0, 989.0, 2380.0, 6911.0, 24605.0, 119501.0, 515687.0, 300963.0, 56189.0, 13335.0, 4104.0, 1565.0, 692.0, 313.0, 155.0, 91.0, 54.0, 31.0, 20.0, 18.0, 7.0, 8.0, 7.0, 5.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00650787353515625, -0.006289303302764893, -0.006070733070373535, -0.005852162837982178, -0.00563359260559082, -0.005415022373199463, -0.0051964521408081055, -0.004977881908416748, -0.004759311676025391, -0.004540741443634033, -0.004322171211242676, -0.004103600978851318, -0.003885030746459961, -0.0036664605140686035, -0.003447890281677246, -0.0032293200492858887, -0.0030107498168945312, -0.002792179584503174, -0.0025736093521118164, -0.002355039119720459, -0.0021364688873291016, -0.0019178986549377441, -0.0016993284225463867, -0.0014807581901550293, -0.0012621879577636719, -0.0010436177253723145, -0.000825047492980957, -0.0006064772605895996, -0.0003879070281982422, -0.00016933679580688477, 4.9233436584472656e-05, 0.0002678036689758301, 0.0004863739013671875, 0.0007049441337585449, 0.0009235143661499023, 0.0011420845985412598, 0.0013606548309326172, 0.0015792250633239746, 0.001797795295715332, 0.0020163655281066895, 0.002234935760498047, 0.0024535059928894043, 0.0026720762252807617, 0.002890646457672119, 0.0031092166900634766, 0.003327786922454834, 0.0035463571548461914, 0.003764927387237549, 0.003983497619628906, 0.004202067852020264, 0.004420638084411621, 0.0046392083168029785, 0.004857778549194336, 0.005076348781585693, 0.005294919013977051, 0.005513489246368408, 0.005732059478759766, 0.005950629711151123, 0.0061691999435424805, 0.006387770175933838, 0.006606340408325195, 0.006824910640716553, 0.00704348087310791, 0.007262051105499268, 0.007480621337890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 6.0, 6.0, 9.0, 5.0, 10.0, 12.0, 22.0, 19.0, 37.0, 29.0, 41.0, 51.0, 55.0, 47.0, 86.0, 72.0, 72.0, 67.0, 67.0, 47.0, 49.0, 40.0, 34.0, 31.0, 22.0, 13.0, 13.0, 11.0, 5.0, 9.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005908966064453125, -0.005712628364562988, -0.0055162906646728516, -0.005319952964782715, -0.005123615264892578, -0.004927277565002441, -0.004730939865112305, -0.004534602165222168, -0.004338264465332031, -0.0041419267654418945, -0.003945589065551758, -0.003749251365661621, -0.0035529136657714844, -0.0033565759658813477, -0.003160238265991211, -0.0029639005661010742, -0.0027675628662109375, -0.0025712251663208008, -0.002374887466430664, -0.0021785497665405273, -0.0019822120666503906, -0.001785874366760254, -0.0015895366668701172, -0.0013931989669799805, -0.0011968612670898438, -0.001000523567199707, -0.0008041858673095703, -0.0006078481674194336, -0.0004115104675292969, -0.00021517276763916016, -1.8835067749023438e-05, 0.00017750263214111328, 0.00037384033203125, 0.0005701780319213867, 0.0007665157318115234, 0.0009628534317016602, 0.0011591911315917969, 0.0013555288314819336, 0.0015518665313720703, 0.001748204231262207, 0.0019445419311523438, 0.0021408796310424805, 0.002337217330932617, 0.002533555030822754, 0.0027298927307128906, 0.0029262304306030273, 0.003122568130493164, 0.0033189058303833008, 0.0035152435302734375, 0.0037115812301635742, 0.003907918930053711, 0.004104256629943848, 0.004300594329833984, 0.004496932029724121, 0.004693269729614258, 0.0048896074295043945, 0.005085945129394531, 0.005282282829284668, 0.005478620529174805, 0.005674958229064941, 0.005871295928955078, 0.006067633628845215, 0.0062639713287353516, 0.006460309028625488, 0.006656646728515625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 3.0, 14.0, 20.0, 26.0, 50.0, 60.0, 66.0, 102.0, 124.0, 116.0, 107.0, 81.0, 78.0, 45.0, 34.0, 29.0, 15.0, 6.0, 7.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06379878520965576, -0.06030626222491264, -0.056813742965459824, -0.053321219980716705, -0.049828700721263885, -0.04633617773652077, -0.04284365475177765, -0.03935113549232483, -0.03585861623287201, -0.03236609324812889, -0.02887357398867607, -0.025381051003932953, -0.021888531744480133, -0.018396008759737015, -0.014903487637639046, -0.011410966515541077, -0.007918443530797958, -0.004425922408699989, -0.000933400820940733, 0.0025591207668185234, 0.0060516418889164925, 0.009544163942337036, 0.013036685064435005, 0.016529206186532974, 0.020021727308630943, 0.023514248430728912, 0.02700676955282688, 0.03049929067492485, 0.03399181365966797, 0.03748433291912079, 0.04097685590386391, 0.044469378888607025, 0.047961898148059845, 0.05145442113280296, 0.05494694039225578, 0.0584394633769989, 0.06193198263645172, 0.06542450189590454, 0.06891702860593796, 0.07240954786539078, 0.0759020671248436, 0.07939458638429642, 0.08288711309432983, 0.08637963235378265, 0.08987215161323547, 0.0933646708726883, 0.09685719758272171, 0.10034971684217453, 0.10384224355220795, 0.10733476281166077, 0.11082728952169418, 0.114319808781147, 0.11781232804059982, 0.12130485475063324, 0.12479737401008606, 0.12828989326953888, 0.1317824125289917, 0.13527493178844452, 0.13876745104789734, 0.14225997030735016, 0.14575250446796417, 0.149245023727417, 0.1527375429868698, 0.15623006224632263, 0.15972258150577545]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 8.0, 3.0, 8.0, 10.0, 9.0, 18.0, 13.0, 14.0, 17.0, 20.0, 22.0, 25.0, 25.0, 24.0, 19.0, 39.0, 34.0, 33.0, 47.0, 47.0, 58.0, 37.0, 55.0, 47.0, 40.0, 37.0, 30.0, 33.0, 27.0, 30.0, 20.0, 26.0, 12.0, 16.0, 14.0, 14.0, 4.0, 12.0, 7.0, 6.0, 8.0, 5.0, 7.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.10489803552627563, -0.10159571468830109, -0.09829338639974594, -0.0949910581111908, -0.09168873727321625, -0.0883864164352417, -0.08508408814668655, -0.08178175985813141, -0.07847943902015686, -0.07517711818218231, -0.07187478989362717, -0.06857246160507202, -0.06527014076709747, -0.061967816203832626, -0.05866549164056778, -0.05536316707730293, -0.052060842514038086, -0.04875851795077324, -0.04545619338750839, -0.042153868824243546, -0.0388515442609787, -0.03554921969771385, -0.032246895134449005, -0.02894457057118416, -0.02564224600791931, -0.022339921444654465, -0.019037596881389618, -0.01573527231812477, -0.012432947754859924, -0.009130623191595078, -0.005828298628330231, -0.002525974065065384, 0.0007763504981994629, 0.00407867506146431, 0.0073809996247291565, 0.010683324187994003, 0.01398564875125885, 0.017287973314523697, 0.020590297877788544, 0.02389262244105339, 0.027194947004318237, 0.030497271567583084, 0.03379959613084793, 0.03710192069411278, 0.040404245257377625, 0.04370656982064247, 0.04700889438390732, 0.050311218947172165, 0.05361354351043701, 0.05691586807370186, 0.060218192636966705, 0.06352052092552185, 0.0668228417634964, 0.07012516260147095, 0.07342749089002609, 0.07672981917858124, 0.08003214001655579, 0.08333446085453033, 0.08663678914308548, 0.08993911743164062, 0.09324143826961517, 0.09654375910758972, 0.09984608739614487, 0.10314841568470001, 0.10645073652267456]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 9.0, 7.0, 7.0, 19.0, 24.0, 31.0, 47.0, 56.0, 70.0, 126.0, 210.0, 506.0, 1325.0, 5765.0, 70562.0, 4085396.0, 24730.0, 3433.0, 980.0, 374.0, 178.0, 105.0, 57.0, 66.0, 43.0, 25.0, 16.0, 19.0, 17.0, 16.0, 10.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.0379638671875, -0.03697371482849121, -0.03598356246948242, -0.03499341011047363, -0.034003257751464844, -0.033013105392456055, -0.032022953033447266, -0.031032800674438477, -0.030042648315429688, -0.0290524959564209, -0.02806234359741211, -0.02707219123840332, -0.02608203887939453, -0.025091886520385742, -0.024101734161376953, -0.023111581802368164, -0.022121429443359375, -0.021131277084350586, -0.020141124725341797, -0.019150972366333008, -0.01816082000732422, -0.01717066764831543, -0.01618051528930664, -0.015190362930297852, -0.014200210571289062, -0.013210058212280273, -0.012219905853271484, -0.011229753494262695, -0.010239601135253906, -0.009249448776245117, -0.008259296417236328, -0.007269144058227539, -0.00627899169921875, -0.005288839340209961, -0.004298686981201172, -0.003308534622192383, -0.0023183822631835938, -0.0013282299041748047, -0.0003380775451660156, 0.0006520748138427734, 0.0016422271728515625, 0.0026323795318603516, 0.0036225318908691406, 0.00461268424987793, 0.005602836608886719, 0.006592988967895508, 0.007583141326904297, 0.008573293685913086, 0.009563446044921875, 0.010553598403930664, 0.011543750762939453, 0.012533903121948242, 0.013524055480957031, 0.01451420783996582, 0.01550436019897461, 0.0164945125579834, 0.017484664916992188, 0.018474817276000977, 0.019464969635009766, 0.020455121994018555, 0.021445274353027344, 0.022435426712036133, 0.023425579071044922, 0.02441573143005371, 0.0254058837890625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 11.0, 11.0, 13.0, 18.0, 35.0, 36.0, 45.0, 72.0, 71.0, 69.0, 76.0, 79.0, 95.0, 84.0, 69.0, 49.0, 50.0, 21.0, 23.0, 21.0, 11.0, 10.0, 8.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.01168060302734375, -0.011319279670715332, -0.010957956314086914, -0.010596632957458496, -0.010235309600830078, -0.00987398624420166, -0.009512662887573242, -0.009151339530944824, -0.008790016174316406, -0.008428692817687988, -0.00806736946105957, -0.007706046104431152, -0.007344722747802734, -0.006983399391174316, -0.0066220760345458984, -0.0062607526779174805, -0.0058994293212890625, -0.0055381059646606445, -0.0051767826080322266, -0.004815459251403809, -0.004454135894775391, -0.004092812538146973, -0.0037314891815185547, -0.0033701658248901367, -0.0030088424682617188, -0.0026475191116333008, -0.002286195755004883, -0.0019248723983764648, -0.0015635490417480469, -0.001202225685119629, -0.0008409023284912109, -0.00047957897186279297, -0.000118255615234375, 0.00024306774139404297, 0.0006043910980224609, 0.0009657144546508789, 0.0013270378112792969, 0.0016883611679077148, 0.002049684524536133, 0.0024110078811645508, 0.0027723312377929688, 0.0031336545944213867, 0.0034949779510498047, 0.0038563013076782227, 0.004217624664306641, 0.004578948020935059, 0.0049402713775634766, 0.0053015947341918945, 0.0056629180908203125, 0.0060242414474487305, 0.0063855648040771484, 0.006746888160705566, 0.007108211517333984, 0.007469534873962402, 0.00783085823059082, 0.008192181587219238, 0.008553504943847656, 0.008914828300476074, 0.009276151657104492, 0.00963747501373291, 0.009998798370361328, 0.010360121726989746, 0.010721445083618164, 0.011082768440246582, 0.011444091796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 11.0, 8.0, 9.0, 16.0, 27.0, 34.0, 46.0, 86.0, 142.0, 189.0, 359.0, 700.0, 1467.0, 3334.0, 8996.0, 35438.0, 841806.0, 3246878.0, 38692.0, 9560.0, 3449.0, 1409.0, 699.0, 388.0, 220.0, 122.0, 68.0, 34.0, 29.0, 22.0, 17.0, 6.0, 10.0, 9.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01016998291015625, -0.009763598442077637, -0.009357213973999023, -0.00895082950592041, -0.008544445037841797, -0.008138060569763184, -0.00773167610168457, -0.007325291633605957, -0.006918907165527344, -0.0065125226974487305, -0.006106138229370117, -0.005699753761291504, -0.005293369293212891, -0.004886984825134277, -0.004480600357055664, -0.004074215888977051, -0.0036678314208984375, -0.0032614469528198242, -0.002855062484741211, -0.0024486780166625977, -0.0020422935485839844, -0.001635909080505371, -0.0012295246124267578, -0.0008231401443481445, -0.00041675567626953125, -1.0371208190917969e-05, 0.0003960132598876953, 0.0008023977279663086, 0.0012087821960449219, 0.0016151666641235352, 0.0020215511322021484, 0.0024279356002807617, 0.002834320068359375, 0.0032407045364379883, 0.0036470890045166016, 0.004053473472595215, 0.004459857940673828, 0.004866242408752441, 0.005272626876831055, 0.005679011344909668, 0.006085395812988281, 0.0064917802810668945, 0.006898164749145508, 0.007304549217224121, 0.007710933685302734, 0.008117318153381348, 0.008523702621459961, 0.008930087089538574, 0.009336471557617188, 0.0097428560256958, 0.010149240493774414, 0.010555624961853027, 0.01096200942993164, 0.011368393898010254, 0.011774778366088867, 0.01218116283416748, 0.012587547302246094, 0.012993931770324707, 0.01340031623840332, 0.013806700706481934, 0.014213085174560547, 0.01461946964263916, 0.015025854110717773, 0.015432238578796387, 0.015838623046875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 10.0, 11.0, 12.0, 11.0, 28.0, 28.0, 43.0, 82.0, 309.0, 2869.0, 396.0, 122.0, 54.0, 27.0, 16.0, 11.0, 10.0, 5.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0019426345825195312, -0.0018527060747146606, -0.00176277756690979, -0.0016728490591049194, -0.0015829205513000488, -0.0014929920434951782, -0.0014030635356903076, -0.001313135027885437, -0.0012232065200805664, -0.0011332780122756958, -0.0010433495044708252, -0.0009534209966659546, -0.000863492488861084, -0.0007735639810562134, -0.0006836354732513428, -0.0005937069654464722, -0.0005037784576416016, -0.00041384994983673096, -0.00032392144203186035, -0.00023399293422698975, -0.00014406442642211914, -5.4135918617248535e-05, 3.579258918762207e-05, 0.00012572109699249268, 0.00021564960479736328, 0.0003055781126022339, 0.0003955066204071045, 0.0004854351282119751, 0.0005753636360168457, 0.0006652921438217163, 0.0007552206516265869, 0.0008451491594314575, 0.0009350776672363281, 0.0010250061750411987, 0.0011149346828460693, 0.00120486319065094, 0.0012947916984558105, 0.0013847202062606812, 0.0014746487140655518, 0.0015645772218704224, 0.001654505729675293, 0.0017444342374801636, 0.0018343627452850342, 0.0019242912530899048, 0.0020142197608947754, 0.002104148268699646, 0.0021940767765045166, 0.002284005284309387, 0.002373933792114258, 0.0024638622999191284, 0.002553790807723999, 0.0026437193155288696, 0.0027336478233337402, 0.002823576331138611, 0.0029135048389434814, 0.003003433346748352, 0.0030933618545532227, 0.0031832903623580933, 0.003273218870162964, 0.0033631473779678345, 0.003453075885772705, 0.0035430043935775757, 0.0036329329013824463, 0.003722861409187317, 0.0038127899169921875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 11.0, 59.0, 147.0, 250.0, 244.0, 182.0, 75.0, 22.0, 7.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013111122883856297, -0.012131751514971256, -0.011152379214763641, -0.010173007845878601, -0.00919363647699356, -0.00821426510810852, -0.007234893273562193, -0.006255521439015865, -0.005276150070130825, -0.004296778701245785, -0.003317406866699457, -0.0023380352649837732, -0.0013586636632680893, -0.000379292294383049, 0.0006000795401632786, 0.0015794513747096062, 0.0025588227435946465, 0.0035381943453103304, 0.004517565947026014, 0.005496937781572342, 0.006476309150457382, 0.0074556805193424225, 0.008435051888227463, 0.009414424188435078, 0.010393795557320118, 0.011373166926205158, 0.012352539226412773, 0.013331910595297813, 0.014311281964182854, 0.015290653333067894, 0.016270024701952934, 0.017249397933483124, 0.018228769302368164, 0.019208140671253204, 0.020187512040138245, 0.021166883409023285, 0.022146254777908325, 0.023125626146793365, 0.024104999378323555, 0.025084370747208595, 0.026063742116093636, 0.027043113484978676, 0.028022484853863716, 0.029001856222748756, 0.029981229454278946, 0.030960600823163986, 0.031939972192049026, 0.03291934356093407, 0.03389871492981911, 0.03487808629870415, 0.03585745766758919, 0.03683682903647423, 0.03781620040535927, 0.03879557177424431, 0.03977494314312935, 0.04075431823730469, 0.04173368960618973, 0.04271306097507477, 0.04369243234395981, 0.04467180371284485, 0.04565117508172989, 0.04663054645061493, 0.04760991781949997, 0.04858928918838501, 0.04956866055727005]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 7.0, 9.0, 7.0, 16.0, 14.0, 12.0, 24.0, 22.0, 26.0, 28.0, 33.0, 28.0, 33.0, 31.0, 42.0, 45.0, 50.0, 37.0, 41.0, 42.0, 32.0, 32.0, 48.0, 38.0, 41.0, 39.0, 33.0, 34.0, 28.0, 22.0, 20.0, 18.0, 10.0, 9.0, 10.0, 6.0, 7.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0068076252937316895, -0.006594793871045113, -0.006381962448358536, -0.006169131025671959, -0.005956299602985382, -0.005743468180298805, -0.005530636757612228, -0.0053178053349256516, -0.005104973912239075, -0.004892142489552498, -0.004679311066865921, -0.004466479644179344, -0.004253648221492767, -0.0040408167988061905, -0.0038279853761196136, -0.003615153953433037, -0.00340232253074646, -0.003189491108059883, -0.0029766596853733063, -0.0027638282626867294, -0.0025509968400001526, -0.0023381654173135757, -0.002125333994626999, -0.001912502571940422, -0.0016996711492538452, -0.0014868397265672684, -0.0012740083038806915, -0.0010611768811941147, -0.0008483454585075378, -0.000635514035820961, -0.00042268261313438416, -0.0002098511904478073, 2.9802322387695312e-06, 0.00021581165492534637, 0.0004286430776119232, 0.0006414745002985001, 0.0008543059229850769, 0.0010671373456716537, 0.0012799687683582306, 0.0014928001910448074, 0.0017056316137313843, 0.0019184630364179611, 0.002131294459104538, 0.002344125881791115, 0.0025569573044776917, 0.0027697887271642685, 0.0029826201498508453, 0.003195451572537422, 0.003408282995223999, 0.003621114417910576, 0.0038339458405971527, 0.0040467772632837296, 0.004259608685970306, 0.004472440108656883, 0.00468527153134346, 0.004898102954030037, 0.005110934376716614, 0.005323765799403191, 0.0055365972220897675, 0.005749428644776344, 0.005962260067462921, 0.006175091490149498, 0.006387922912836075, 0.006600754335522652, 0.0068135857582092285]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 5.0, 9.0, 16.0, 21.0, 30.0, 70.0, 96.0, 188.0, 297.0, 620.0, 1269.0, 2930.0, 8025.0, 27429.0, 129946.0, 508565.0, 290458.0, 56177.0, 14161.0, 4537.0, 1838.0, 846.0, 457.0, 253.0, 135.0, 66.0, 32.0, 25.0, 23.0, 8.0, 9.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01425933837890625, -0.013726115226745605, -0.013192892074584961, -0.012659668922424316, -0.012126445770263672, -0.011593222618103027, -0.011059999465942383, -0.010526776313781738, -0.009993553161621094, -0.00946033000946045, -0.008927106857299805, -0.00839388370513916, -0.007860660552978516, -0.007327437400817871, -0.0067942142486572266, -0.006260991096496582, -0.0057277679443359375, -0.005194544792175293, -0.0046613216400146484, -0.004128098487854004, -0.0035948753356933594, -0.003061652183532715, -0.0025284290313720703, -0.0019952058792114258, -0.0014619827270507812, -0.0009287595748901367, -0.0003955364227294922, 0.00013768672943115234, 0.0006709098815917969, 0.0012041330337524414, 0.001737356185913086, 0.0022705793380737305, 0.002803802490234375, 0.0033370256423950195, 0.003870248794555664, 0.004403471946716309, 0.004936695098876953, 0.005469918251037598, 0.006003141403198242, 0.006536364555358887, 0.007069587707519531, 0.007602810859680176, 0.00813603401184082, 0.008669257164001465, 0.00920248031616211, 0.009735703468322754, 0.010268926620483398, 0.010802149772644043, 0.011335372924804688, 0.011868596076965332, 0.012401819229125977, 0.012935042381286621, 0.013468265533447266, 0.01400148868560791, 0.014534711837768555, 0.0150679349899292, 0.015601158142089844, 0.01613438129425049, 0.016667604446411133, 0.017200827598571777, 0.017734050750732422, 0.018267273902893066, 0.01880049705505371, 0.019333720207214355, 0.019866943359375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 10.0, 7.0, 13.0, 16.0, 23.0, 30.0, 39.0, 47.0, 66.0, 76.0, 65.0, 82.0, 72.0, 87.0, 73.0, 75.0, 50.0, 40.0, 37.0, 22.0, 20.0, 12.0, 13.0, 9.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.01165008544921875, -0.011289715766906738, -0.010929346084594727, -0.010568976402282715, -0.010208606719970703, -0.009848237037658691, -0.00948786735534668, -0.009127497673034668, -0.008767127990722656, -0.008406758308410645, -0.008046388626098633, -0.007686018943786621, -0.007325649261474609, -0.006965279579162598, -0.006604909896850586, -0.006244540214538574, -0.0058841705322265625, -0.005523800849914551, -0.005163431167602539, -0.004803061485290527, -0.004442691802978516, -0.004082322120666504, -0.003721952438354492, -0.0033615827560424805, -0.0030012130737304688, -0.002640843391418457, -0.0022804737091064453, -0.0019201040267944336, -0.0015597343444824219, -0.0011993646621704102, -0.0008389949798583984, -0.0004786252975463867, -0.000118255615234375, 0.00024211406707763672, 0.0006024837493896484, 0.0009628534317016602, 0.0013232231140136719, 0.0016835927963256836, 0.0020439624786376953, 0.002404332160949707, 0.0027647018432617188, 0.0031250715255737305, 0.003485441207885742, 0.003845810890197754, 0.004206180572509766, 0.004566550254821777, 0.004926919937133789, 0.005287289619445801, 0.0056476593017578125, 0.006008028984069824, 0.006368398666381836, 0.006728768348693848, 0.007089138031005859, 0.007449507713317871, 0.007809877395629883, 0.008170247077941895, 0.008530616760253906, 0.008890986442565918, 0.00925135612487793, 0.009611725807189941, 0.009972095489501953, 0.010332465171813965, 0.010692834854125977, 0.011053204536437988, 0.01141357421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 11.0, 6.0, 9.0, 18.0, 14.0, 32.0, 47.0, 73.0, 104.0, 176.0, 255.0, 482.0, 1293.0, 4566.0, 37138.0, 579583.0, 394196.0, 24748.0, 3530.0, 1072.0, 436.0, 275.0, 135.0, 92.0, 86.0, 56.0, 25.0, 20.0, 13.0, 12.0, 19.0, 9.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02362060546875, -0.022924184799194336, -0.022227764129638672, -0.021531343460083008, -0.020834922790527344, -0.02013850212097168, -0.019442081451416016, -0.01874566078186035, -0.018049240112304688, -0.017352819442749023, -0.01665639877319336, -0.015959978103637695, -0.015263557434082031, -0.014567136764526367, -0.013870716094970703, -0.013174295425415039, -0.012477874755859375, -0.011781454086303711, -0.011085033416748047, -0.010388612747192383, -0.009692192077636719, -0.008995771408081055, -0.00829935073852539, -0.0076029300689697266, -0.0069065093994140625, -0.0062100887298583984, -0.005513668060302734, -0.00481724739074707, -0.004120826721191406, -0.003424406051635742, -0.002727985382080078, -0.002031564712524414, -0.00133514404296875, -0.0006387233734130859, 5.7697296142578125e-05, 0.0007541179656982422, 0.0014505386352539062, 0.0021469593048095703, 0.0028433799743652344, 0.0035398006439208984, 0.0042362213134765625, 0.0049326419830322266, 0.005629062652587891, 0.006325483322143555, 0.007021903991699219, 0.007718324661254883, 0.008414745330810547, 0.009111166000366211, 0.009807586669921875, 0.010504007339477539, 0.011200428009033203, 0.011896848678588867, 0.012593269348144531, 0.013289690017700195, 0.01398611068725586, 0.014682531356811523, 0.015378952026367188, 0.01607537269592285, 0.016771793365478516, 0.01746821403503418, 0.018164634704589844, 0.018861055374145508, 0.019557476043701172, 0.020253896713256836, 0.0209503173828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 10.0, 9.0, 11.0, 4.0, 17.0, 13.0, 18.0, 19.0, 18.0, 20.0, 39.0, 29.0, 39.0, 39.0, 51.0, 38.0, 42.0, 45.0, 43.0, 46.0, 44.0, 37.0, 56.0, 40.0, 39.0, 24.0, 44.0, 33.0, 20.0, 23.0, 11.0, 19.0, 7.0, 17.0, 9.0, 4.0, 9.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.022735595703125, -0.021991729736328125, -0.02124786376953125, -0.020503997802734375, -0.0197601318359375, -0.019016265869140625, -0.01827239990234375, -0.017528533935546875, -0.01678466796875, -0.016040802001953125, -0.01529693603515625, -0.014553070068359375, -0.0138092041015625, -0.013065338134765625, -0.01232147216796875, -0.011577606201171875, -0.010833740234375, -0.010089874267578125, -0.00934600830078125, -0.008602142333984375, -0.0078582763671875, -0.007114410400390625, -0.00637054443359375, -0.005626678466796875, -0.0048828125, -0.004138946533203125, -0.00339508056640625, -0.002651214599609375, -0.0019073486328125, -0.001163482666015625, -0.00041961669921875, 0.000324249267578125, 0.001068115234375, 0.001811981201171875, 0.00255584716796875, 0.003299713134765625, 0.0040435791015625, 0.004787445068359375, 0.00553131103515625, 0.006275177001953125, 0.00701904296875, 0.007762908935546875, 0.00850677490234375, 0.009250640869140625, 0.0099945068359375, 0.010738372802734375, 0.01148223876953125, 0.012226104736328125, 0.012969970703125, 0.013713836669921875, 0.01445770263671875, 0.015201568603515625, 0.0159454345703125, 0.016689300537109375, 0.01743316650390625, 0.018177032470703125, 0.0189208984375, 0.019664764404296875, 0.02040863037109375, 0.021152496337890625, 0.0218963623046875, 0.022640228271484375, 0.02338409423828125, 0.024127960205078125, 0.024871826171875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 11.0, 2.0, 15.0, 18.0, 30.0, 61.0, 102.0, 223.0, 564.0, 2281.0, 24377.0, 839414.0, 173789.0, 5980.0, 1026.0, 339.0, 144.0, 71.0, 51.0, 25.0, 18.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01187896728515625, -0.011450886726379395, -0.011022806167602539, -0.010594725608825684, -0.010166645050048828, -0.009738564491271973, -0.009310483932495117, -0.008882403373718262, -0.008454322814941406, -0.00802624225616455, -0.007598161697387695, -0.00717008113861084, -0.006742000579833984, -0.006313920021057129, -0.0058858394622802734, -0.005457758903503418, -0.0050296783447265625, -0.004601597785949707, -0.0041735172271728516, -0.003745436668395996, -0.0033173561096191406, -0.002889275550842285, -0.0024611949920654297, -0.0020331144332885742, -0.0016050338745117188, -0.0011769533157348633, -0.0007488727569580078, -0.00032079219818115234, 0.00010728836059570312, 0.0005353689193725586, 0.0009634494781494141, 0.0013915300369262695, 0.001819610595703125, 0.0022476911544799805, 0.002675771713256836, 0.0031038522720336914, 0.003531932830810547, 0.003960013389587402, 0.004388093948364258, 0.004816174507141113, 0.005244255065917969, 0.005672335624694824, 0.00610041618347168, 0.006528496742248535, 0.006956577301025391, 0.007384657859802246, 0.007812738418579102, 0.008240818977355957, 0.008668899536132812, 0.009096980094909668, 0.009525060653686523, 0.009953141212463379, 0.010381221771240234, 0.01080930233001709, 0.011237382888793945, 0.0116654634475708, 0.012093544006347656, 0.012521624565124512, 0.012949705123901367, 0.013377785682678223, 0.013805866241455078, 0.014233946800231934, 0.014662027359008789, 0.015090107917785645, 0.0155181884765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 8.0, 4.0, 8.0, 13.0, 20.0, 16.0, 19.0, 28.0, 24.0, 37.0, 37.0, 73.0, 48.0, 71.0, 55.0, 73.0, 87.0, 62.0, 56.0, 32.0, 40.0, 36.0, 29.0, 27.0, 26.0, 13.0, 11.0, 8.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5643577575683594e-05, -3.442354500293732e-05, -3.320351243019104e-05, -3.198347985744476e-05, -3.0763447284698486e-05, -2.954341471195221e-05, -2.8323382139205933e-05, -2.7103349566459656e-05, -2.588331699371338e-05, -2.4663284420967102e-05, -2.3443251848220825e-05, -2.222321927547455e-05, -2.100318670272827e-05, -1.9783154129981995e-05, -1.8563121557235718e-05, -1.734308898448944e-05, -1.6123056411743164e-05, -1.4903023838996887e-05, -1.368299126625061e-05, -1.2462958693504333e-05, -1.1242926120758057e-05, -1.002289354801178e-05, -8.802860975265503e-06, -7.582828402519226e-06, -6.362795829772949e-06, -5.142763257026672e-06, -3.9227306842803955e-06, -2.7026981115341187e-06, -1.4826655387878418e-06, -2.6263296604156494e-07, 9.57399606704712e-07, 2.1774321794509888e-06, 3.3974647521972656e-06, 4.6174973249435425e-06, 5.837529897689819e-06, 7.057562470436096e-06, 8.277595043182373e-06, 9.49762761592865e-06, 1.0717660188674927e-05, 1.1937692761421204e-05, 1.315772533416748e-05, 1.4377757906913757e-05, 1.5597790479660034e-05, 1.681782305240631e-05, 1.8037855625152588e-05, 1.9257888197898865e-05, 2.047792077064514e-05, 2.169795334339142e-05, 2.2917985916137695e-05, 2.4138018488883972e-05, 2.535805106163025e-05, 2.6578083634376526e-05, 2.7798116207122803e-05, 2.901814877986908e-05, 3.0238181352615356e-05, 3.145821392536163e-05, 3.267824649810791e-05, 3.389827907085419e-05, 3.5118311643600464e-05, 3.633834421634674e-05, 3.755837678909302e-05, 3.8778409361839294e-05, 3.999844193458557e-05, 4.121847450733185e-05, 4.2438507080078125e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 11.0, 18.0, 29.0, 34.0, 89.0, 184.0, 407.0, 957.0, 3586.0, 31584.0, 735521.0, 261322.0, 11436.0, 2063.0, 717.0, 285.0, 151.0, 57.0, 37.0, 13.0, 14.0, 11.0, 7.0, 10.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.013671875, -0.013300418853759766, -0.012928962707519531, -0.012557506561279297, -0.012186050415039062, -0.011814594268798828, -0.011443138122558594, -0.01107168197631836, -0.010700225830078125, -0.01032876968383789, -0.009957313537597656, -0.009585857391357422, -0.009214401245117188, -0.008842945098876953, -0.008471488952636719, -0.008100032806396484, -0.00772857666015625, -0.007357120513916016, -0.006985664367675781, -0.006614208221435547, -0.0062427520751953125, -0.005871295928955078, -0.005499839782714844, -0.005128383636474609, -0.004756927490234375, -0.004385471343994141, -0.004014015197753906, -0.003642559051513672, -0.0032711029052734375, -0.002899646759033203, -0.0025281906127929688, -0.0021567344665527344, -0.0017852783203125, -0.0014138221740722656, -0.0010423660278320312, -0.0006709098815917969, -0.0002994537353515625, 7.200241088867188e-05, 0.00044345855712890625, 0.0008149147033691406, 0.001186370849609375, 0.0015578269958496094, 0.0019292831420898438, 0.002300739288330078, 0.0026721954345703125, 0.003043651580810547, 0.0034151077270507812, 0.0037865638732910156, 0.00415802001953125, 0.004529476165771484, 0.004900932312011719, 0.005272388458251953, 0.0056438446044921875, 0.006015300750732422, 0.006386756896972656, 0.006758213043212891, 0.007129669189453125, 0.007501125335693359, 0.007872581481933594, 0.008244037628173828, 0.008615493774414062, 0.008986949920654297, 0.009358406066894531, 0.009729862213134766, 0.010101318359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 11.0, 10.0, 22.0, 33.0, 63.0, 135.0, 168.0, 162.0, 155.0, 96.0, 63.0, 44.0, 13.0, 15.0, 3.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017608642578125, -0.017150521278381348, -0.016692399978637695, -0.016234278678894043, -0.01577615737915039, -0.015318036079406738, -0.014859914779663086, -0.014401793479919434, -0.013943672180175781, -0.013485550880432129, -0.013027429580688477, -0.012569308280944824, -0.012111186981201172, -0.01165306568145752, -0.011194944381713867, -0.010736823081970215, -0.010278701782226562, -0.00982058048248291, -0.009362459182739258, -0.008904337882995605, -0.008446216583251953, -0.0079880952835083, -0.0075299739837646484, -0.007071852684020996, -0.006613731384277344, -0.006155610084533691, -0.005697488784790039, -0.005239367485046387, -0.004781246185302734, -0.004323124885559082, -0.0038650035858154297, -0.0034068822860717773, -0.002948760986328125, -0.0024906396865844727, -0.0020325183868408203, -0.001574397087097168, -0.0011162757873535156, -0.0006581544876098633, -0.00020003318786621094, 0.0002580881118774414, 0.0007162094116210938, 0.001174330711364746, 0.0016324520111083984, 0.0020905733108520508, 0.002548694610595703, 0.0030068159103393555, 0.003464937210083008, 0.00392305850982666, 0.0043811798095703125, 0.004839301109313965, 0.005297422409057617, 0.0057555437088012695, 0.006213665008544922, 0.006671786308288574, 0.0071299076080322266, 0.007588028907775879, 0.008046150207519531, 0.008504271507263184, 0.008962392807006836, 0.009420514106750488, 0.00987863540649414, 0.010336756706237793, 0.010794878005981445, 0.011252999305725098, 0.01171112060546875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 12.0, 19.0, 28.0, 73.0, 153.0, 227.0, 205.0, 148.0, 73.0, 33.0, 15.0, 9.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06512139737606049, -0.05953649431467056, -0.05395159125328064, -0.04836668819189072, -0.04278178513050079, -0.03719688206911087, -0.03161197900772095, -0.026027075946331024, -0.0204421728849411, -0.014857269823551178, -0.009272366762161255, -0.003687463700771332, 0.0018974393606185913, 0.007482342422008514, 0.013067245483398438, 0.01865214854478836, 0.024237051606178284, 0.029821954667568207, 0.03540685772895813, 0.04099176079034805, 0.046576663851737976, 0.0521615669131279, 0.05774646997451782, 0.06333137303590775, 0.06891627609729767, 0.07450117915868759, 0.08008608222007751, 0.08567098528146744, 0.09125588834285736, 0.09684079140424728, 0.10242569446563721, 0.10801059752702713, 0.11359548568725586, 0.11918038874864578, 0.1247652918100357, 0.13035020232200623, 0.13593509793281555, 0.14151999354362488, 0.1471049040555954, 0.15268981456756592, 0.15827471017837524, 0.16385960578918457, 0.1694445163011551, 0.1750294268131256, 0.18061432242393494, 0.18619921803474426, 0.19178412854671478, 0.1973690390586853, 0.20295393466949463, 0.20853883028030396, 0.21412374079227448, 0.219708651304245, 0.22529354691505432, 0.23087844252586365, 0.23646335303783417, 0.2420482635498047, 0.247633159160614, 0.25321805477142334, 0.25880295038223267, 0.2643878757953644, 0.2699727714061737, 0.27555766701698303, 0.28114259243011475, 0.2867274880409241, 0.2923123836517334]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 9.0, 9.0, 8.0, 7.0, 8.0, 9.0, 20.0, 20.0, 18.0, 19.0, 30.0, 27.0, 38.0, 39.0, 41.0, 41.0, 46.0, 53.0, 63.0, 50.0, 41.0, 50.0, 46.0, 38.0, 43.0, 30.0, 29.0, 32.0, 22.0, 24.0, 17.0, 9.0, 11.0, 8.0, 11.0, 10.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11191123723983765, -0.10828864574432373, -0.10466606169939041, -0.10104347765445709, -0.09742088615894318, -0.09379829466342926, -0.09017571061849594, -0.08655312657356262, -0.0829305350780487, -0.07930794358253479, -0.07568535953760147, -0.07206277549266815, -0.06844018399715424, -0.06481759250164032, -0.061195008456707, -0.05757242068648338, -0.053949832916259766, -0.05032724514603615, -0.04670465737581253, -0.04308206960558891, -0.039459481835365295, -0.03583689406514168, -0.03221430629491806, -0.028591718524694443, -0.024969130754470825, -0.021346542984247208, -0.01772395521402359, -0.014101367443799973, -0.010478779673576355, -0.006856191903352737, -0.00323360413312912, 0.0003889836370944977, 0.004011571407318115, 0.007634159177541733, 0.01125674694776535, 0.014879334717988968, 0.018501922488212585, 0.022124510258436203, 0.02574709802865982, 0.029369685798883438, 0.032992273569107056, 0.03661486133933067, 0.04023744910955429, 0.04386003687977791, 0.047482624650001526, 0.05110521242022514, 0.05472780019044876, 0.05835038796067238, 0.061972975730895996, 0.06559556722640991, 0.06921815127134323, 0.07284073531627655, 0.07646332681179047, 0.08008591830730438, 0.0837085023522377, 0.08733108639717102, 0.09095367789268494, 0.09457626938819885, 0.09819885343313217, 0.10182143747806549, 0.1054440289735794, 0.10906662046909332, 0.11268920451402664, 0.11631178855895996, 0.11993438005447388]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 8.0, 5.0, 11.0, 14.0, 21.0, 29.0, 28.0, 30.0, 49.0, 62.0, 105.0, 137.0, 264.0, 1190.0, 19721.0, 4163829.0, 7350.0, 714.0, 220.0, 128.0, 84.0, 54.0, 44.0, 40.0, 24.0, 22.0, 20.0, 17.0, 11.0, 16.0, 4.0, 7.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.055572509765625, -0.05380105972290039, -0.05202960968017578, -0.05025815963745117, -0.04848670959472656, -0.04671525955200195, -0.044943809509277344, -0.043172359466552734, -0.041400909423828125, -0.039629459381103516, -0.037858009338378906, -0.0360865592956543, -0.03431510925292969, -0.03254365921020508, -0.03077220916748047, -0.02900075912475586, -0.02722930908203125, -0.02545785903930664, -0.02368640899658203, -0.021914958953857422, -0.020143508911132812, -0.018372058868408203, -0.016600608825683594, -0.014829158782958984, -0.013057708740234375, -0.011286258697509766, -0.009514808654785156, -0.007743358612060547, -0.0059719085693359375, -0.004200458526611328, -0.0024290084838867188, -0.0006575584411621094, 0.0011138916015625, 0.0028853416442871094, 0.004656791687011719, 0.006428241729736328, 0.008199691772460938, 0.009971141815185547, 0.011742591857910156, 0.013514041900634766, 0.015285491943359375, 0.017056941986083984, 0.018828392028808594, 0.020599842071533203, 0.022371292114257812, 0.024142742156982422, 0.02591419219970703, 0.02768564224243164, 0.02945709228515625, 0.03122854232788086, 0.03299999237060547, 0.03477144241333008, 0.03654289245605469, 0.0383143424987793, 0.040085792541503906, 0.041857242584228516, 0.043628692626953125, 0.045400142669677734, 0.047171592712402344, 0.04894304275512695, 0.05071449279785156, 0.05248594284057617, 0.05425739288330078, 0.05602884292602539, 0.05780029296875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 10.0, 10.0, 6.0, 26.0, 20.0, 41.0, 45.0, 52.0, 60.0, 62.0, 68.0, 79.0, 73.0, 80.0, 69.0, 71.0, 52.0, 43.0, 30.0, 17.0, 21.0, 15.0, 12.0, 11.0, 8.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0112457275390625, -0.010895609855651855, -0.010545492172241211, -0.010195374488830566, -0.009845256805419922, -0.009495139122009277, -0.009145021438598633, -0.008794903755187988, -0.008444786071777344, -0.0080946683883667, -0.007744550704956055, -0.00739443302154541, -0.007044315338134766, -0.006694197654724121, -0.0063440799713134766, -0.005993962287902832, -0.0056438446044921875, -0.005293726921081543, -0.0049436092376708984, -0.004593491554260254, -0.004243373870849609, -0.003893256187438965, -0.0035431385040283203, -0.0031930208206176758, -0.0028429031372070312, -0.0024927854537963867, -0.002142667770385742, -0.0017925500869750977, -0.0014424324035644531, -0.0010923147201538086, -0.0007421970367431641, -0.00039207935333251953, -4.1961669921875e-05, 0.00030815601348876953, 0.0006582736968994141, 0.0010083913803100586, 0.0013585090637207031, 0.0017086267471313477, 0.002058744430541992, 0.0024088621139526367, 0.0027589797973632812, 0.0031090974807739258, 0.0034592151641845703, 0.003809332847595215, 0.004159450531005859, 0.004509568214416504, 0.0048596858978271484, 0.005209803581237793, 0.0055599212646484375, 0.005910038948059082, 0.0062601566314697266, 0.006610274314880371, 0.006960391998291016, 0.00731050968170166, 0.007660627365112305, 0.00801074504852295, 0.008360862731933594, 0.008710980415344238, 0.009061098098754883, 0.009411215782165527, 0.009761333465576172, 0.010111451148986816, 0.010461568832397461, 0.010811686515808105, 0.01116180419921875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 8.0, 5.0, 6.0, 8.0, 7.0, 16.0, 19.0, 32.0, 45.0, 47.0, 60.0, 90.0, 116.0, 168.0, 250.0, 434.0, 826.0, 2021.0, 7761.0, 63252.0, 4076242.0, 33925.0, 5428.0, 1595.0, 678.0, 343.0, 259.0, 162.0, 123.0, 93.0, 60.0, 62.0, 44.0, 32.0, 18.0, 14.0, 17.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0226593017578125, -0.02193737030029297, -0.021215438842773438, -0.020493507385253906, -0.019771575927734375, -0.019049644470214844, -0.018327713012695312, -0.01760578155517578, -0.01688385009765625, -0.01616191864013672, -0.015439987182617188, -0.014718055725097656, -0.013996124267578125, -0.013274192810058594, -0.012552261352539062, -0.011830329895019531, -0.0111083984375, -0.010386466979980469, -0.009664535522460938, -0.008942604064941406, -0.008220672607421875, -0.007498741149902344, -0.0067768096923828125, -0.006054878234863281, -0.00533294677734375, -0.004611015319824219, -0.0038890838623046875, -0.0031671524047851562, -0.002445220947265625, -0.0017232894897460938, -0.0010013580322265625, -0.00027942657470703125, 0.0004425048828125, 0.0011644363403320312, 0.0018863677978515625, 0.0026082992553710938, 0.003330230712890625, 0.004052162170410156, 0.0047740936279296875, 0.005496025085449219, 0.00621795654296875, 0.006939888000488281, 0.0076618194580078125, 0.008383750915527344, 0.009105682373046875, 0.009827613830566406, 0.010549545288085938, 0.011271476745605469, 0.011993408203125, 0.012715339660644531, 0.013437271118164062, 0.014159202575683594, 0.014881134033203125, 0.015603065490722656, 0.016324996948242188, 0.01704692840576172, 0.01776885986328125, 0.01849079132080078, 0.019212722778320312, 0.019934654235839844, 0.020656585693359375, 0.021378517150878906, 0.022100448608398438, 0.02282238006591797, 0.0235443115234375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 15.0, 41.0, 276.0, 3646.0, 58.0, 26.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0102386474609375, -0.009910345077514648, -0.009582042694091797, -0.009253740310668945, -0.008925437927246094, -0.008597135543823242, -0.00826883316040039, -0.007940530776977539, -0.0076122283935546875, -0.007283926010131836, -0.006955623626708984, -0.006627321243286133, -0.006299018859863281, -0.00597071647644043, -0.005642414093017578, -0.0053141117095947266, -0.004985809326171875, -0.0046575069427490234, -0.004329204559326172, -0.00400090217590332, -0.0036725997924804688, -0.003344297409057617, -0.0030159950256347656, -0.002687692642211914, -0.0023593902587890625, -0.002031087875366211, -0.0017027854919433594, -0.0013744831085205078, -0.0010461807250976562, -0.0007178783416748047, -0.0003895759582519531, -6.127357482910156e-05, 0.00026702880859375, 0.0005953311920166016, 0.0009236335754394531, 0.0012519359588623047, 0.0015802383422851562, 0.0019085407257080078, 0.0022368431091308594, 0.002565145492553711, 0.0028934478759765625, 0.003221750259399414, 0.0035500526428222656, 0.003878355026245117, 0.004206657409667969, 0.00453495979309082, 0.004863262176513672, 0.0051915645599365234, 0.005519866943359375, 0.0058481693267822266, 0.006176471710205078, 0.00650477409362793, 0.006833076477050781, 0.007161378860473633, 0.007489681243896484, 0.007817983627319336, 0.008146286010742188, 0.008474588394165039, 0.00880289077758789, 0.009131193161010742, 0.009459495544433594, 0.009787797927856445, 0.010116100311279297, 0.010444402694702148, 0.010772705078125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 7.0, 19.0, 58.0, 241.0, 417.0, 200.0, 45.0, 9.0, 10.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043829768896102905, -0.04223943129181862, -0.040649089962244034, -0.03905875235795975, -0.03746841475367546, -0.035878077149391174, -0.03428773581981659, -0.0326973982155323, -0.031107060611248016, -0.02951672114431858, -0.027926383540034294, -0.02633604407310486, -0.024745706468820572, -0.023155367001891136, -0.0215650275349617, -0.019974689930677414, -0.018384350463747978, -0.016794010996818542, -0.015203673392534256, -0.01361333392560482, -0.012022996321320534, -0.010432656854391098, -0.008842318318784237, -0.007251979783177376, -0.005661641247570515, -0.0040713027119636536, -0.002480963943526149, -0.000890625175088644, 0.0006997133605182171, 0.0022900523617863655, 0.0038803908973932266, 0.005470729433000088, 0.007061067968606949, 0.00865140650421381, 0.010241745039820671, 0.011832084506750107, 0.013422422111034393, 0.015012761577963829, 0.016603101044893265, 0.01819343864917755, 0.019783776253461838, 0.021374115720391273, 0.02296445332467556, 0.024554792791604996, 0.026145130395889282, 0.027735469862818718, 0.029325809329748154, 0.03091614693403244, 0.032506488263607025, 0.03409682586789131, 0.0356871671974659, 0.03727750480175018, 0.03886784240603447, 0.040458180010318756, 0.04204852133989334, 0.04363885894417763, 0.045229196548461914, 0.0468195341527462, 0.048409875482320786, 0.05000021308660507, 0.05159055069088936, 0.053180888295173645, 0.05477122962474823, 0.056361567229032516, 0.0579519048333168]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 8.0, 8.0, 9.0, 13.0, 13.0, 16.0, 20.0, 22.0, 23.0, 25.0, 30.0, 34.0, 34.0, 34.0, 40.0, 39.0, 40.0, 47.0, 48.0, 35.0, 46.0, 35.0, 41.0, 40.0, 45.0, 35.0, 29.0, 24.0, 27.0, 29.0, 14.0, 23.0, 14.0, 10.0, 19.0, 7.0, 9.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007561683654785156, -0.007277561351656914, -0.006993439048528671, -0.006709316745400429, -0.006425194442272186, -0.006141072139143944, -0.005856949836015701, -0.005572827532887459, -0.005288705229759216, -0.005004582926630974, -0.004720460623502731, -0.004436338320374489, -0.004152216017246246, -0.003868093714118004, -0.0035839714109897614, -0.003299849107861519, -0.0030157268047332764, -0.002731604501605034, -0.0024474821984767914, -0.002163359895348549, -0.0018792375922203064, -0.001595115289092064, -0.0013109929859638214, -0.001026870682835579, -0.0007427483797073364, -0.00045862607657909393, -0.00017450377345085144, 0.00010961852967739105, 0.00039374083280563354, 0.000677863135933876, 0.0009619854390621185, 0.001246107742190361, 0.0015302300453186035, 0.001814352348446846, 0.0020984746515750885, 0.002382596954703331, 0.0026667192578315735, 0.002950841560959816, 0.0032349638640880585, 0.003519086167216301, 0.0038032084703445435, 0.004087330773472786, 0.0043714530766010284, 0.004655575379729271, 0.004939697682857513, 0.005223819985985756, 0.005507942289113998, 0.005792064592242241, 0.006076186895370483, 0.006360309198498726, 0.006644431501626968, 0.006928553804755211, 0.007212676107883453, 0.007496798411011696, 0.007780920714139938, 0.00806504301726818, 0.008349165320396423, 0.008633287623524666, 0.008917409926652908, 0.00920153222978115, 0.009485654532909393, 0.009769776836037636, 0.010053899139165878, 0.01033802144229412, 0.010622143745422363]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 5.0, 7.0, 4.0, 7.0, 5.0, 10.0, 14.0, 14.0, 22.0, 26.0, 41.0, 45.0, 62.0, 107.0, 161.0, 222.0, 377.0, 590.0, 961.0, 1674.0, 3019.0, 6610.0, 16765.0, 51856.0, 173009.0, 384996.0, 272527.0, 88731.0, 27354.0, 9678.0, 4222.0, 2143.0, 1199.0, 716.0, 464.0, 279.0, 220.0, 121.0, 74.0, 54.0, 40.0, 27.0, 30.0, 14.0, 10.0, 7.0, 11.0, 7.0, 2.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0], "bins": [-0.01042938232421875, -0.010100603103637695, -0.00977182388305664, -0.009443044662475586, -0.009114265441894531, -0.008785486221313477, -0.008456707000732422, -0.008127927780151367, -0.0077991485595703125, -0.007470369338989258, -0.007141590118408203, -0.0068128108978271484, -0.006484031677246094, -0.006155252456665039, -0.005826473236083984, -0.00549769401550293, -0.005168914794921875, -0.00484013557434082, -0.004511356353759766, -0.004182577133178711, -0.0038537979125976562, -0.0035250186920166016, -0.003196239471435547, -0.002867460250854492, -0.0025386810302734375, -0.002209901809692383, -0.0018811225891113281, -0.0015523433685302734, -0.0012235641479492188, -0.0008947849273681641, -0.0005660057067871094, -0.0002372264862060547, 9.1552734375e-05, 0.0004203319549560547, 0.0007491111755371094, 0.001077890396118164, 0.0014066696166992188, 0.0017354488372802734, 0.002064228057861328, 0.002393007278442383, 0.0027217864990234375, 0.003050565719604492, 0.003379344940185547, 0.0037081241607666016, 0.004036903381347656, 0.004365682601928711, 0.004694461822509766, 0.00502324104309082, 0.005352020263671875, 0.00568079948425293, 0.006009578704833984, 0.006338357925415039, 0.006667137145996094, 0.0069959163665771484, 0.007324695587158203, 0.007653474807739258, 0.007982254028320312, 0.008311033248901367, 0.008639812469482422, 0.008968591690063477, 0.009297370910644531, 0.009626150131225586, 0.00995492935180664, 0.010283708572387695, 0.01061248779296875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 8.0, 8.0, 13.0, 24.0, 23.0, 38.0, 44.0, 47.0, 61.0, 61.0, 57.0, 75.0, 78.0, 72.0, 69.0, 61.0, 61.0, 46.0, 25.0, 29.0, 27.0, 11.0, 14.0, 17.0, 9.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0114898681640625, -0.011134624481201172, -0.010779380798339844, -0.010424137115478516, -0.010068893432617188, -0.00971364974975586, -0.009358406066894531, -0.009003162384033203, -0.008647918701171875, -0.008292675018310547, -0.007937431335449219, -0.007582187652587891, -0.0072269439697265625, -0.006871700286865234, -0.006516456604003906, -0.006161212921142578, -0.00580596923828125, -0.005450725555419922, -0.005095481872558594, -0.004740238189697266, -0.0043849945068359375, -0.004029750823974609, -0.0036745071411132812, -0.003319263458251953, -0.002964019775390625, -0.002608776092529297, -0.0022535324096679688, -0.0018982887268066406, -0.0015430450439453125, -0.0011878013610839844, -0.0008325576782226562, -0.0004773139953613281, -0.0001220703125, 0.00023317337036132812, 0.0005884170532226562, 0.0009436607360839844, 0.0012989044189453125, 0.0016541481018066406, 0.0020093917846679688, 0.002364635467529297, 0.002719879150390625, 0.003075122833251953, 0.0034303665161132812, 0.0037856101989746094, 0.0041408538818359375, 0.004496097564697266, 0.004851341247558594, 0.005206584930419922, 0.00556182861328125, 0.005917072296142578, 0.006272315979003906, 0.006627559661865234, 0.0069828033447265625, 0.007338047027587891, 0.007693290710449219, 0.008048534393310547, 0.008403778076171875, 0.008759021759033203, 0.009114265441894531, 0.00946950912475586, 0.009824752807617188, 0.010179996490478516, 0.010535240173339844, 0.010890483856201172, 0.0112457275390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 10.0, 8.0, 17.0, 21.0, 39.0, 50.0, 70.0, 104.0, 150.0, 236.0, 385.0, 727.0, 1389.0, 3331.0, 10541.0, 76245.0, 724587.0, 202902.0, 18874.0, 4737.0, 1838.0, 933.0, 519.0, 280.0, 181.0, 107.0, 66.0, 55.0, 39.0, 34.0, 10.0, 15.0, 8.0, 12.0, 5.0, 3.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196685791015625, -0.01904773712158203, -0.018426895141601562, -0.017806053161621094, -0.017185211181640625, -0.016564369201660156, -0.015943527221679688, -0.015322685241699219, -0.01470184326171875, -0.014081001281738281, -0.013460159301757812, -0.012839317321777344, -0.012218475341796875, -0.011597633361816406, -0.010976791381835938, -0.010355949401855469, -0.009735107421875, -0.009114265441894531, -0.008493423461914062, -0.007872581481933594, -0.007251739501953125, -0.006630897521972656, -0.0060100555419921875, -0.005389213562011719, -0.00476837158203125, -0.004147529602050781, -0.0035266876220703125, -0.0029058456420898438, -0.002285003662109375, -0.0016641616821289062, -0.0010433197021484375, -0.00042247772216796875, 0.0001983642578125, 0.0008192062377929688, 0.0014400482177734375, 0.0020608901977539062, 0.002681732177734375, 0.0033025741577148438, 0.0039234161376953125, 0.004544258117675781, 0.00516510009765625, 0.005785942077636719, 0.0064067840576171875, 0.007027626037597656, 0.007648468017578125, 0.008269309997558594, 0.008890151977539062, 0.009510993957519531, 0.0101318359375, 0.010752677917480469, 0.011373519897460938, 0.011994361877441406, 0.012615203857421875, 0.013236045837402344, 0.013856887817382812, 0.014477729797363281, 0.01509857177734375, 0.01571941375732422, 0.016340255737304688, 0.016961097717285156, 0.017581939697265625, 0.018202781677246094, 0.018823623657226562, 0.01944446563720703, 0.0200653076171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 11.0, 8.0, 11.0, 15.0, 20.0, 21.0, 33.0, 23.0, 32.0, 35.0, 39.0, 60.0, 52.0, 62.0, 52.0, 53.0, 61.0, 57.0, 53.0, 46.0, 35.0, 41.0, 38.0, 21.0, 27.0, 23.0, 17.0, 14.0, 12.0, 3.0, 9.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0345458984375, -0.03341341018676758, -0.032280921936035156, -0.031148433685302734, -0.030015945434570312, -0.02888345718383789, -0.02775096893310547, -0.026618480682373047, -0.025485992431640625, -0.024353504180908203, -0.02322101593017578, -0.02208852767944336, -0.020956039428710938, -0.019823551177978516, -0.018691062927246094, -0.017558574676513672, -0.01642608642578125, -0.015293598175048828, -0.014161109924316406, -0.013028621673583984, -0.011896133422851562, -0.01076364517211914, -0.009631156921386719, -0.008498668670654297, -0.007366180419921875, -0.006233692169189453, -0.005101203918457031, -0.003968715667724609, -0.0028362274169921875, -0.0017037391662597656, -0.0005712509155273438, 0.0005612373352050781, 0.0016937255859375, 0.002826213836669922, 0.003958702087402344, 0.005091190338134766, 0.0062236785888671875, 0.007356166839599609, 0.008488655090332031, 0.009621143341064453, 0.010753631591796875, 0.011886119842529297, 0.013018608093261719, 0.01415109634399414, 0.015283584594726562, 0.016416072845458984, 0.017548561096191406, 0.018681049346923828, 0.01981353759765625, 0.020946025848388672, 0.022078514099121094, 0.023211002349853516, 0.024343490600585938, 0.02547597885131836, 0.02660846710205078, 0.027740955352783203, 0.028873443603515625, 0.030005931854248047, 0.03113842010498047, 0.03227090835571289, 0.03340339660644531, 0.034535884857177734, 0.035668373107910156, 0.03680086135864258, 0.037933349609375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 8.0, 4.0, 3.0, 15.0, 19.0, 18.0, 21.0, 34.0, 37.0, 72.0, 109.0, 166.0, 267.0, 440.0, 962.0, 2219.0, 6360.0, 104578.0, 912457.0, 14186.0, 3467.0, 1427.0, 710.0, 353.0, 218.0, 148.0, 72.0, 53.0, 37.0, 27.0, 14.0, 7.0, 12.0, 8.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.027862548828125, -0.027133703231811523, -0.026404857635498047, -0.02567601203918457, -0.024947166442871094, -0.024218320846557617, -0.02348947525024414, -0.022760629653930664, -0.022031784057617188, -0.02130293846130371, -0.020574092864990234, -0.019845247268676758, -0.01911640167236328, -0.018387556076049805, -0.017658710479736328, -0.01692986488342285, -0.016201019287109375, -0.015472173690795898, -0.014743328094482422, -0.014014482498168945, -0.013285636901855469, -0.012556791305541992, -0.011827945709228516, -0.011099100112915039, -0.010370254516601562, -0.009641408920288086, -0.00891256332397461, -0.008183717727661133, -0.007454872131347656, -0.00672602653503418, -0.005997180938720703, -0.0052683353424072266, -0.00453948974609375, -0.0038106441497802734, -0.003081798553466797, -0.0023529529571533203, -0.0016241073608398438, -0.0008952617645263672, -0.00016641616821289062, 0.0005624294281005859, 0.0012912750244140625, 0.002020120620727539, 0.0027489662170410156, 0.003477811813354492, 0.004206657409667969, 0.004935503005981445, 0.005664348602294922, 0.0063931941986083984, 0.007122039794921875, 0.007850885391235352, 0.008579730987548828, 0.009308576583862305, 0.010037422180175781, 0.010766267776489258, 0.011495113372802734, 0.012223958969116211, 0.012952804565429688, 0.013681650161743164, 0.01441049575805664, 0.015139341354370117, 0.015868186950683594, 0.01659703254699707, 0.017325878143310547, 0.018054723739624023, 0.0187835693359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 10.0, 10.0, 4.0, 14.0, 14.0, 27.0, 35.0, 42.0, 72.0, 85.0, 134.0, 151.0, 123.0, 79.0, 64.0, 37.0, 31.0, 23.0, 12.0, 8.0, 4.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984306335449219e-05, -5.7806260883808136e-05, -5.5769458413124084e-05, -5.373265594244003e-05, -5.169585347175598e-05, -4.965905100107193e-05, -4.762224853038788e-05, -4.558544605970383e-05, -4.3548643589019775e-05, -4.1511841118335724e-05, -3.947503864765167e-05, -3.743823617696762e-05, -3.540143370628357e-05, -3.336463123559952e-05, -3.1327828764915466e-05, -2.9291026294231415e-05, -2.7254223823547363e-05, -2.5217421352863312e-05, -2.318061888217926e-05, -2.114381641149521e-05, -1.9107013940811157e-05, -1.7070211470127106e-05, -1.5033408999443054e-05, -1.2996606528759003e-05, -1.0959804058074951e-05, -8.9230015873909e-06, -6.886199116706848e-06, -4.849396646022797e-06, -2.812594175338745e-06, -7.757917046546936e-07, 1.261010766029358e-06, 3.2978132367134094e-06, 5.334615707397461e-06, 7.3714181780815125e-06, 9.408220648765564e-06, 1.1445023119449615e-05, 1.3481825590133667e-05, 1.551862806081772e-05, 1.755543053150177e-05, 1.959223300218582e-05, 2.1629035472869873e-05, 2.3665837943553925e-05, 2.5702640414237976e-05, 2.7739442884922028e-05, 2.977624535560608e-05, 3.181304782629013e-05, 3.384985029697418e-05, 3.5886652767658234e-05, 3.7923455238342285e-05, 3.996025770902634e-05, 4.199706017971039e-05, 4.403386265039444e-05, 4.607066512107849e-05, 4.810746759176254e-05, 5.0144270062446594e-05, 5.2181072533130646e-05, 5.42178750038147e-05, 5.625467747449875e-05, 5.82914799451828e-05, 6.032828241586685e-05, 6.23650848865509e-05, 6.440188735723495e-05, 6.6438689827919e-05, 6.847549229860306e-05, 7.051229476928711e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 13.0, 12.0, 25.0, 40.0, 52.0, 92.0, 152.0, 254.0, 510.0, 981.0, 2325.0, 6759.0, 112213.0, 901373.0, 17106.0, 3597.0, 1480.0, 661.0, 341.0, 198.0, 129.0, 76.0, 35.0, 36.0, 21.0, 15.0, 5.0, 7.0, 4.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01873779296875, -0.018074512481689453, -0.017411231994628906, -0.01674795150756836, -0.016084671020507812, -0.015421390533447266, -0.014758110046386719, -0.014094829559326172, -0.013431549072265625, -0.012768268585205078, -0.012104988098144531, -0.011441707611083984, -0.010778427124023438, -0.01011514663696289, -0.009451866149902344, -0.008788585662841797, -0.00812530517578125, -0.007462024688720703, -0.006798744201660156, -0.006135463714599609, -0.0054721832275390625, -0.004808902740478516, -0.004145622253417969, -0.003482341766357422, -0.002819061279296875, -0.002155780792236328, -0.0014925003051757812, -0.0008292198181152344, -0.0001659393310546875, 0.0004973411560058594, 0.0011606216430664062, 0.0018239021301269531, 0.0024871826171875, 0.003150463104248047, 0.0038137435913085938, 0.004477024078369141, 0.0051403045654296875, 0.005803585052490234, 0.006466865539550781, 0.007130146026611328, 0.007793426513671875, 0.008456707000732422, 0.009119987487792969, 0.009783267974853516, 0.010446548461914062, 0.01110982894897461, 0.011773109436035156, 0.012436389923095703, 0.01309967041015625, 0.013762950897216797, 0.014426231384277344, 0.01508951187133789, 0.015752792358398438, 0.016416072845458984, 0.01707935333251953, 0.017742633819580078, 0.018405914306640625, 0.019069194793701172, 0.01973247528076172, 0.020395755767822266, 0.021059036254882812, 0.02172231674194336, 0.022385597229003906, 0.023048877716064453, 0.023712158203125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 9.0, 25.0, 165.0, 571.0, 155.0, 25.0, 8.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07025146484375, -0.06842756271362305, -0.0666036605834961, -0.06477975845336914, -0.06295585632324219, -0.061131954193115234, -0.05930805206298828, -0.05748414993286133, -0.055660247802734375, -0.05383634567260742, -0.05201244354248047, -0.050188541412353516, -0.04836463928222656, -0.04654073715209961, -0.044716835021972656, -0.0428929328918457, -0.04106903076171875, -0.0392451286315918, -0.037421226501464844, -0.03559732437133789, -0.03377342224121094, -0.031949520111083984, -0.03012561798095703, -0.028301715850830078, -0.026477813720703125, -0.024653911590576172, -0.02283000946044922, -0.021006107330322266, -0.019182205200195312, -0.01735830307006836, -0.015534400939941406, -0.013710498809814453, -0.0118865966796875, -0.010062694549560547, -0.008238792419433594, -0.006414890289306641, -0.0045909881591796875, -0.0027670860290527344, -0.0009431838989257812, 0.0008807182312011719, 0.002704620361328125, 0.004528522491455078, 0.006352424621582031, 0.008176326751708984, 0.010000228881835938, 0.01182413101196289, 0.013648033142089844, 0.015471935272216797, 0.01729583740234375, 0.019119739532470703, 0.020943641662597656, 0.02276754379272461, 0.024591445922851562, 0.026415348052978516, 0.02823925018310547, 0.030063152313232422, 0.031887054443359375, 0.03371095657348633, 0.03553485870361328, 0.037358760833740234, 0.03918266296386719, 0.04100656509399414, 0.042830467224121094, 0.04465436935424805, 0.046478271484375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 16.0, 22.0, 24.0, 42.0, 73.0, 125.0, 159.0, 216.0, 172.0, 88.0, 24.0, 19.0, 10.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2453514188528061, -0.23803828656673431, -0.23072515428066254, -0.22341202199459076, -0.2160988748073578, -0.208785742521286, -0.20147261023521423, -0.19415947794914246, -0.18684634566307068, -0.1795332133769989, -0.17222008109092712, -0.16490694880485535, -0.15759381651878357, -0.1502806842327118, -0.14296753704547882, -0.13565440475940704, -0.12834127247333527, -0.12102814018726349, -0.11371500790119171, -0.10640186816453934, -0.09908873587846756, -0.09177560359239578, -0.08446246385574341, -0.07714933156967163, -0.06983619928359985, -0.06252306699752808, -0.055209930986166, -0.047896794974803925, -0.04058366268873215, -0.03327053040266037, -0.025957394391298294, -0.018644258379936218, -0.011331140995025635, -0.004018006846308708, 0.0032951273024082184, 0.010608261451125145, 0.01792139559984207, 0.02523452788591385, 0.032547663897275925, 0.039860799908638, 0.04717393219470978, 0.054487064480781555, 0.06180020049214363, 0.0691133365035057, 0.07642646878957748, 0.08373960107564926, 0.09105274081230164, 0.09836587309837341, 0.10567900538444519, 0.11299213767051697, 0.12030526995658875, 0.12761840224266052, 0.1349315345287323, 0.14224466681480408, 0.14955781400203705, 0.15687094628810883, 0.1641840785741806, 0.17149721086025238, 0.17881034314632416, 0.18612347543239594, 0.1934366226196289, 0.20074975490570068, 0.20806288719177246, 0.21537601947784424, 0.22268915176391602]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 11.0, 5.0, 9.0, 11.0, 8.0, 16.0, 21.0, 25.0, 18.0, 26.0, 35.0, 43.0, 40.0, 40.0, 52.0, 53.0, 50.0, 57.0, 49.0, 46.0, 51.0, 44.0, 43.0, 43.0, 35.0, 22.0, 26.0, 14.0, 17.0, 25.0, 21.0, 12.0, 6.0, 4.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.19137269258499146, -0.1856820285320282, -0.17999134957790375, -0.1743006855249405, -0.16861000657081604, -0.16291934251785278, -0.15722867846488953, -0.15153801441192627, -0.14584733545780182, -0.14015667140483856, -0.1344659924507141, -0.12877532839775085, -0.123084656894207, -0.11739398539066315, -0.11170332133769989, -0.10601264983415604, -0.10032197833061218, -0.09463130682706833, -0.08894063532352448, -0.08324997127056122, -0.07755929976701736, -0.07186862826347351, -0.06617796421051025, -0.0604872927069664, -0.054796621203422546, -0.04910594969987869, -0.04341528192162514, -0.03772461414337158, -0.03203394263982773, -0.026343272998929024, -0.02065260335803032, -0.014961935579776764, -0.00927126407623291, -0.0035805944353342056, 0.002110075205564499, 0.007800744846463203, 0.013491414487361908, 0.019182084128260612, 0.024872753769159317, 0.030563421547412872, 0.036254093050956726, 0.04194476455450058, 0.047635432332754135, 0.05332610011100769, 0.059016771614551544, 0.0647074431180954, 0.07039810717105865, 0.07608877867460251, 0.08177945017814636, 0.08747012168169022, 0.09316079318523407, 0.09885145723819733, 0.10454212874174118, 0.11023280024528503, 0.11592346429824829, 0.12161413580179214, 0.127304807305336, 0.13299547135829926, 0.1386861503124237, 0.14437681436538696, 0.15006747841835022, 0.15575815737247467, 0.16144882142543793, 0.16713950037956238, 0.17283016443252563]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 6.0, 8.0, 9.0, 21.0, 11.0, 22.0, 28.0, 44.0, 57.0, 117.0, 128.0, 213.0, 356.0, 778.0, 1924.0, 8189.0, 130059.0, 4026011.0, 20309.0, 3491.0, 1152.0, 487.0, 277.0, 176.0, 112.0, 75.0, 60.0, 49.0, 23.0, 16.0, 21.0, 14.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.025238037109375, -0.02434396743774414, -0.02344989776611328, -0.022555828094482422, -0.021661758422851562, -0.020767688751220703, -0.019873619079589844, -0.018979549407958984, -0.018085479736328125, -0.017191410064697266, -0.016297340393066406, -0.015403270721435547, -0.014509201049804688, -0.013615131378173828, -0.012721061706542969, -0.01182699203491211, -0.01093292236328125, -0.01003885269165039, -0.009144783020019531, -0.008250713348388672, -0.0073566436767578125, -0.006462574005126953, -0.005568504333496094, -0.004674434661865234, -0.003780364990234375, -0.0028862953186035156, -0.0019922256469726562, -0.0010981559753417969, -0.0002040863037109375, 0.0006899833679199219, 0.0015840530395507812, 0.0024781227111816406, 0.0033721923828125, 0.004266262054443359, 0.005160331726074219, 0.006054401397705078, 0.0069484710693359375, 0.007842540740966797, 0.008736610412597656, 0.009630680084228516, 0.010524749755859375, 0.011418819427490234, 0.012312889099121094, 0.013206958770751953, 0.014101028442382812, 0.014995098114013672, 0.01588916778564453, 0.01678323745727539, 0.01767730712890625, 0.01857137680053711, 0.01946544647216797, 0.020359516143798828, 0.021253585815429688, 0.022147655487060547, 0.023041725158691406, 0.023935794830322266, 0.024829864501953125, 0.025723934173583984, 0.026618003845214844, 0.027512073516845703, 0.028406143188476562, 0.029300212860107422, 0.03019428253173828, 0.03108835220336914, 0.031982421875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 6.0, 8.0, 13.0, 25.0, 26.0, 25.0, 36.0, 42.0, 42.0, 61.0, 53.0, 65.0, 60.0, 75.0, 72.0, 76.0, 73.0, 54.0, 48.0, 34.0, 27.0, 15.0, 13.0, 11.0, 6.0, 9.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.011749267578125, -0.011382579803466797, -0.011015892028808594, -0.01064920425415039, -0.010282516479492188, -0.009915828704833984, -0.009549140930175781, -0.009182453155517578, -0.008815765380859375, -0.008449077606201172, -0.008082389831542969, -0.007715702056884766, -0.0073490142822265625, -0.006982326507568359, -0.006615638732910156, -0.006248950958251953, -0.00588226318359375, -0.005515575408935547, -0.005148887634277344, -0.004782199859619141, -0.0044155120849609375, -0.004048824310302734, -0.0036821365356445312, -0.003315448760986328, -0.002948760986328125, -0.002582073211669922, -0.0022153854370117188, -0.0018486976623535156, -0.0014820098876953125, -0.0011153221130371094, -0.0007486343383789062, -0.0003819465637207031, -1.52587890625e-05, 0.0003514289855957031, 0.0007181167602539062, 0.0010848045349121094, 0.0014514923095703125, 0.0018181800842285156, 0.0021848678588867188, 0.002551555633544922, 0.002918243408203125, 0.003284931182861328, 0.0036516189575195312, 0.004018306732177734, 0.0043849945068359375, 0.004751682281494141, 0.005118370056152344, 0.005485057830810547, 0.00585174560546875, 0.006218433380126953, 0.006585121154785156, 0.006951808929443359, 0.0073184967041015625, 0.007685184478759766, 0.008051872253417969, 0.008418560028076172, 0.008785247802734375, 0.009151935577392578, 0.009518623352050781, 0.009885311126708984, 0.010251998901367188, 0.01061868667602539, 0.010985374450683594, 0.011352062225341797, 0.01171875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 5.0, 10.0, 17.0, 16.0, 26.0, 35.0, 43.0, 65.0, 79.0, 106.0, 164.0, 250.0, 556.0, 2839.0, 3088217.0, 1097657.0, 2703.0, 617.0, 292.0, 161.0, 104.0, 81.0, 59.0, 48.0, 36.0, 33.0, 21.0, 8.0, 8.0, 7.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08837890625, -0.08577919006347656, -0.08317947387695312, -0.08057975769042969, -0.07798004150390625, -0.07538032531738281, -0.07278060913085938, -0.07018089294433594, -0.0675811767578125, -0.06498146057128906, -0.062381744384765625, -0.05978202819824219, -0.05718231201171875, -0.05458259582519531, -0.051982879638671875, -0.04938316345214844, -0.046783447265625, -0.04418373107910156, -0.041584014892578125, -0.03898429870605469, -0.03638458251953125, -0.03378486633300781, -0.031185150146484375, -0.028585433959960938, -0.0259857177734375, -0.023386001586914062, -0.020786285400390625, -0.018186569213867188, -0.01558685302734375, -0.012987136840820312, -0.010387420654296875, -0.0077877044677734375, -0.00518798828125, -0.0025882720947265625, 1.1444091796875e-05, 0.0026111602783203125, 0.00521087646484375, 0.0078105926513671875, 0.010410308837890625, 0.013010025024414062, 0.0156097412109375, 0.018209457397460938, 0.020809173583984375, 0.023408889770507812, 0.02600860595703125, 0.028608322143554688, 0.031208038330078125, 0.03380775451660156, 0.036407470703125, 0.03900718688964844, 0.041606903076171875, 0.04420661926269531, 0.04680633544921875, 0.04940605163574219, 0.052005767822265625, 0.05460548400878906, 0.0572052001953125, 0.05980491638183594, 0.062404632568359375, 0.06500434875488281, 0.06760406494140625, 0.07020378112792969, 0.07280349731445312, 0.07540321350097656, 0.0780029296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 27.0, 113.0, 3807.0, 95.0, 18.0, 13.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.045654296875, -0.044499874114990234, -0.04334545135498047, -0.0421910285949707, -0.04103660583496094, -0.03988218307495117, -0.038727760314941406, -0.03757333755493164, -0.036418914794921875, -0.03526449203491211, -0.034110069274902344, -0.03295564651489258, -0.03180122375488281, -0.030646800994873047, -0.02949237823486328, -0.028337955474853516, -0.02718353271484375, -0.026029109954833984, -0.02487468719482422, -0.023720264434814453, -0.022565841674804688, -0.021411418914794922, -0.020256996154785156, -0.01910257339477539, -0.017948150634765625, -0.01679372787475586, -0.015639305114746094, -0.014484882354736328, -0.013330459594726562, -0.012176036834716797, -0.011021614074707031, -0.009867191314697266, -0.0087127685546875, -0.007558345794677734, -0.006403923034667969, -0.005249500274658203, -0.0040950775146484375, -0.002940654754638672, -0.0017862319946289062, -0.0006318092346191406, 0.000522613525390625, 0.0016770362854003906, 0.0028314590454101562, 0.003985881805419922, 0.0051403045654296875, 0.006294727325439453, 0.007449150085449219, 0.008603572845458984, 0.00975799560546875, 0.010912418365478516, 0.012066841125488281, 0.013221263885498047, 0.014375686645507812, 0.015530109405517578, 0.016684532165527344, 0.01783895492553711, 0.018993377685546875, 0.02014780044555664, 0.021302223205566406, 0.022456645965576172, 0.023611068725585938, 0.024765491485595703, 0.02591991424560547, 0.027074337005615234, 0.028228759765625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 6.0, 7.0, 16.0, 24.0, 28.0, 45.0, 80.0, 112.0, 177.0, 186.0, 125.0, 95.0, 37.0, 27.0, 11.0, 11.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0940178856253624, -0.09185920655727386, -0.08970052003860474, -0.0875418409705162, -0.08538316190242767, -0.08322447538375854, -0.08106579631567001, -0.07890711724758148, -0.07674843072891235, -0.07458975166082382, -0.0724310651421547, -0.07027238607406616, -0.06811370700597763, -0.0659550279378891, -0.06379634141921997, -0.06163766235113144, -0.05947898328304291, -0.05732030048966408, -0.055161621421575546, -0.053002938628196716, -0.050844259560108185, -0.048685576766729355, -0.046526893973350525, -0.04436821490526199, -0.04220953211188316, -0.040050849318504333, -0.0378921702504158, -0.03573348745703697, -0.03357480466365814, -0.03141612559556961, -0.02925744280219078, -0.0270987618714571, -0.02494008094072342, -0.02278140000998974, -0.020622719079256058, -0.018464036285877228, -0.016305355355143547, -0.014146674424409866, -0.011987992562353611, -0.009829310700297356, -0.007670629769563675, -0.005511948373168707, -0.003353266976773739, -0.0011945855803787708, 0.0009640958160161972, 0.003122776746749878, 0.005281458608806133, 0.007440140470862389, 0.00959882140159607, 0.01175750233232975, 0.013916184194386005, 0.01607486605644226, 0.01823354698717594, 0.020392227917909622, 0.022550910711288452, 0.024709591642022133, 0.026868272572755814, 0.029026953503489494, 0.031185634434223175, 0.033344317227602005, 0.035503000020980835, 0.037661679089069366, 0.039820361882448196, 0.041979044675827026, 0.04413772374391556]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 4.0, 9.0, 3.0, 6.0, 9.0, 4.0, 10.0, 17.0, 15.0, 18.0, 30.0, 27.0, 40.0, 33.0, 34.0, 36.0, 44.0, 44.0, 56.0, 61.0, 51.0, 56.0, 35.0, 45.0, 50.0, 47.0, 39.0, 31.0, 30.0, 19.0, 15.0, 15.0, 11.0, 19.0, 11.0, 10.0, 5.0, 4.0, 0.0, 4.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.04304862022399902, -0.04181289300322533, -0.04057716578245163, -0.039341434836387634, -0.03810570761561394, -0.03686998039484024, -0.035634249448776245, -0.03439852222800255, -0.03316279500722885, -0.031927067786455154, -0.03069133870303631, -0.029455609619617462, -0.028219882398843765, -0.02698415517807007, -0.025748426094651222, -0.024512697011232376, -0.02327696979045868, -0.022041242569684982, -0.020805513486266136, -0.01956978440284729, -0.018334057182073593, -0.017098329961299896, -0.01586260087788105, -0.014626872725784779, -0.013391144573688507, -0.012155416421592236, -0.010919688269495964, -0.009683960117399693, -0.008448231965303421, -0.0072125038132071495, -0.005976775661110878, -0.0047410475090146065, -0.003505319356918335, -0.0022695912048220634, -0.001033863052725792, 0.00020186509937047958, 0.001437593251466751, 0.0026733214035630226, 0.003909049555659294, 0.005144777707755566, 0.006380505859851837, 0.007616234011948109, 0.00885196216404438, 0.010087690316140652, 0.011323418468236923, 0.012559146620333195, 0.013794874772429466, 0.015030602924525738, 0.01626633107662201, 0.017502058297395706, 0.018737787380814552, 0.0199735164642334, 0.021209243685007095, 0.022444970905780792, 0.02368069998919964, 0.024916429072618484, 0.02615215629339218, 0.02738788351416588, 0.028623612597584724, 0.02985934168100357, 0.031095068901777267, 0.032330796122550964, 0.03356652706861496, 0.03480225428938866, 0.036037981510162354]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 9.0, 8.0, 8.0, 12.0, 18.0, 29.0, 50.0, 80.0, 131.0, 228.0, 491.0, 915.0, 2146.0, 5461.0, 15966.0, 60552.0, 267183.0, 489332.0, 152906.0, 35860.0, 10434.0, 3647.0, 1510.0, 726.0, 353.0, 189.0, 133.0, 53.0, 35.0, 27.0, 16.0, 14.0, 12.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0173797607421875, -0.01687324047088623, -0.01636672019958496, -0.01586019992828369, -0.015353679656982422, -0.014847159385681152, -0.014340639114379883, -0.013834118843078613, -0.013327598571777344, -0.012821078300476074, -0.012314558029174805, -0.011808037757873535, -0.011301517486572266, -0.010794997215270996, -0.010288476943969727, -0.009781956672668457, -0.009275436401367188, -0.008768916130065918, -0.008262395858764648, -0.007755875587463379, -0.007249355316162109, -0.00674283504486084, -0.00623631477355957, -0.005729794502258301, -0.005223274230957031, -0.004716753959655762, -0.004210233688354492, -0.0037037134170532227, -0.003197193145751953, -0.0026906728744506836, -0.002184152603149414, -0.0016776323318481445, -0.001171112060546875, -0.0006645917892456055, -0.00015807151794433594, 0.0003484487533569336, 0.0008549690246582031, 0.0013614892959594727, 0.0018680095672607422, 0.0023745298385620117, 0.0028810501098632812, 0.0033875703811645508, 0.0038940906524658203, 0.00440061092376709, 0.004907131195068359, 0.005413651466369629, 0.0059201717376708984, 0.006426692008972168, 0.0069332122802734375, 0.007439732551574707, 0.007946252822875977, 0.008452773094177246, 0.008959293365478516, 0.009465813636779785, 0.009972333908081055, 0.010478854179382324, 0.010985374450683594, 0.011491894721984863, 0.011998414993286133, 0.012504935264587402, 0.013011455535888672, 0.013517975807189941, 0.014024496078491211, 0.01453101634979248, 0.01503753662109375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 8.0, 8.0, 11.0, 16.0, 28.0, 20.0, 35.0, 42.0, 46.0, 44.0, 59.0, 65.0, 58.0, 73.0, 55.0, 69.0, 70.0, 61.0, 45.0, 43.0, 36.0, 22.0, 26.0, 8.0, 9.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0116729736328125, -0.01130211353302002, -0.010931253433227539, -0.010560393333435059, -0.010189533233642578, -0.009818673133850098, -0.009447813034057617, -0.009076952934265137, -0.008706092834472656, -0.008335232734680176, -0.007964372634887695, -0.007593512535095215, -0.007222652435302734, -0.006851792335510254, -0.0064809322357177734, -0.006110072135925293, -0.0057392120361328125, -0.005368351936340332, -0.0049974918365478516, -0.004626631736755371, -0.004255771636962891, -0.00388491153717041, -0.0035140514373779297, -0.0031431913375854492, -0.0027723312377929688, -0.0024014711380004883, -0.002030611038208008, -0.0016597509384155273, -0.0012888908386230469, -0.0009180307388305664, -0.0005471706390380859, -0.00017631053924560547, 0.000194549560546875, 0.0005654096603393555, 0.0009362697601318359, 0.0013071298599243164, 0.0016779899597167969, 0.0020488500595092773, 0.002419710159301758, 0.0027905702590942383, 0.0031614303588867188, 0.0035322904586791992, 0.0039031505584716797, 0.00427401065826416, 0.004644870758056641, 0.005015730857849121, 0.0053865909576416016, 0.005757451057434082, 0.0061283111572265625, 0.006499171257019043, 0.0068700313568115234, 0.007240891456604004, 0.007611751556396484, 0.007982611656188965, 0.008353471755981445, 0.008724331855773926, 0.009095191955566406, 0.009466052055358887, 0.009836912155151367, 0.010207772254943848, 0.010578632354736328, 0.010949492454528809, 0.011320352554321289, 0.01169121265411377, 0.01206207275390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 5.0, 6.0, 11.0, 14.0, 23.0, 27.0, 48.0, 57.0, 81.0, 145.0, 177.0, 265.0, 500.0, 931.0, 2032.0, 6234.0, 32699.0, 365442.0, 574691.0, 51342.0, 8540.0, 2614.0, 1076.0, 575.0, 339.0, 188.0, 148.0, 91.0, 67.0, 51.0, 31.0, 18.0, 20.0, 14.0, 5.0, 9.0, 5.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0209197998046875, -0.020175457000732422, -0.019431114196777344, -0.018686771392822266, -0.017942428588867188, -0.01719808578491211, -0.01645374298095703, -0.015709400177001953, -0.014965057373046875, -0.014220714569091797, -0.013476371765136719, -0.01273202896118164, -0.011987686157226562, -0.011243343353271484, -0.010499000549316406, -0.009754657745361328, -0.00901031494140625, -0.008265972137451172, -0.007521629333496094, -0.006777286529541016, -0.0060329437255859375, -0.005288600921630859, -0.004544258117675781, -0.003799915313720703, -0.003055572509765625, -0.002311229705810547, -0.0015668869018554688, -0.0008225440979003906, -7.82012939453125e-05, 0.0006661415100097656, 0.0014104843139648438, 0.002154827117919922, 0.002899169921875, 0.003643512725830078, 0.004387855529785156, 0.005132198333740234, 0.0058765411376953125, 0.006620883941650391, 0.007365226745605469, 0.008109569549560547, 0.008853912353515625, 0.009598255157470703, 0.010342597961425781, 0.01108694076538086, 0.011831283569335938, 0.012575626373291016, 0.013319969177246094, 0.014064311981201172, 0.01480865478515625, 0.015552997589111328, 0.016297340393066406, 0.017041683197021484, 0.017786026000976562, 0.01853036880493164, 0.01927471160888672, 0.020019054412841797, 0.020763397216796875, 0.021507740020751953, 0.02225208282470703, 0.02299642562866211, 0.023740768432617188, 0.024485111236572266, 0.025229454040527344, 0.025973796844482422, 0.0267181396484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 14.0, 9.0, 7.0, 8.0, 19.0, 28.0, 34.0, 45.0, 45.0, 47.0, 65.0, 54.0, 52.0, 62.0, 61.0, 63.0, 59.0, 59.0, 44.0, 43.0, 36.0, 27.0, 29.0, 30.0, 18.0, 13.0, 7.0, 5.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04315185546875, -0.041759490966796875, -0.04036712646484375, -0.038974761962890625, -0.0375823974609375, -0.036190032958984375, -0.03479766845703125, -0.033405303955078125, -0.032012939453125, -0.030620574951171875, -0.02922821044921875, -0.027835845947265625, -0.0264434814453125, -0.025051116943359375, -0.02365875244140625, -0.022266387939453125, -0.0208740234375, -0.019481658935546875, -0.01808929443359375, -0.016696929931640625, -0.0153045654296875, -0.013912200927734375, -0.01251983642578125, -0.011127471923828125, -0.009735107421875, -0.008342742919921875, -0.00695037841796875, -0.005558013916015625, -0.0041656494140625, -0.002773284912109375, -0.00138092041015625, 1.1444091796875e-05, 0.00140380859375, 0.002796173095703125, 0.00418853759765625, 0.005580902099609375, 0.0069732666015625, 0.008365631103515625, 0.00975799560546875, 0.011150360107421875, 0.012542724609375, 0.013935089111328125, 0.01532745361328125, 0.016719818115234375, 0.0181121826171875, 0.019504547119140625, 0.02089691162109375, 0.022289276123046875, 0.023681640625, 0.025074005126953125, 0.02646636962890625, 0.027858734130859375, 0.0292510986328125, 0.030643463134765625, 0.03203582763671875, 0.033428192138671875, 0.034820556640625, 0.036212921142578125, 0.03760528564453125, 0.038997650146484375, 0.0403900146484375, 0.041782379150390625, 0.04317474365234375, 0.044567108154296875, 0.04595947265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 4.0, 7.0, 7.0, 20.0, 18.0, 22.0, 31.0, 44.0, 89.0, 130.0, 290.0, 678.0, 1947.0, 8825.0, 96126.0, 840866.0, 87886.0, 8382.0, 1816.0, 694.0, 272.0, 152.0, 84.0, 37.0, 30.0, 25.0, 27.0, 10.0, 9.0, 9.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.014251708984375, -0.013899683952331543, -0.013547658920288086, -0.013195633888244629, -0.012843608856201172, -0.012491583824157715, -0.012139558792114258, -0.0117875337600708, -0.011435508728027344, -0.011083483695983887, -0.01073145866394043, -0.010379433631896973, -0.010027408599853516, -0.009675383567810059, -0.009323358535766602, -0.008971333503723145, -0.008619308471679688, -0.00826728343963623, -0.007915258407592773, -0.007563233375549316, -0.007211208343505859, -0.006859183311462402, -0.006507158279418945, -0.006155133247375488, -0.005803108215332031, -0.005451083183288574, -0.005099058151245117, -0.00474703311920166, -0.004395008087158203, -0.004042983055114746, -0.003690958023071289, -0.003338932991027832, -0.002986907958984375, -0.002634882926940918, -0.002282857894897461, -0.001930832862854004, -0.0015788078308105469, -0.0012267827987670898, -0.0008747577667236328, -0.0005227327346801758, -0.00017070770263671875, 0.00018131732940673828, 0.0005333423614501953, 0.0008853673934936523, 0.0012373924255371094, 0.0015894174575805664, 0.0019414424896240234, 0.0022934675216674805, 0.0026454925537109375, 0.0029975175857543945, 0.0033495426177978516, 0.0037015676498413086, 0.004053592681884766, 0.004405617713928223, 0.00475764274597168, 0.005109667778015137, 0.005461692810058594, 0.005813717842102051, 0.006165742874145508, 0.006517767906188965, 0.006869792938232422, 0.007221817970275879, 0.007573843002319336, 0.007925868034362793, 0.00827789306640625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 11.0, 8.0, 16.0, 14.0, 24.0, 28.0, 41.0, 41.0, 70.0, 84.0, 72.0, 109.0, 99.0, 90.0, 67.0, 57.0, 34.0, 36.0, 25.0, 14.0, 18.0, 8.0, 7.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3272972106933594e-05, -4.185270518064499e-05, -4.0432438254356384e-05, -3.901217132806778e-05, -3.7591904401779175e-05, -3.617163747549057e-05, -3.4751370549201965e-05, -3.333110362291336e-05, -3.1910836696624756e-05, -3.049056977033615e-05, -2.9070302844047546e-05, -2.765003591775894e-05, -2.6229768991470337e-05, -2.4809502065181732e-05, -2.3389235138893127e-05, -2.1968968212604523e-05, -2.0548701286315918e-05, -1.9128434360027313e-05, -1.770816743373871e-05, -1.6287900507450104e-05, -1.4867633581161499e-05, -1.3447366654872894e-05, -1.202709972858429e-05, -1.0606832802295685e-05, -9.18656587600708e-06, -7.766298949718475e-06, -6.346032023429871e-06, -4.925765097141266e-06, -3.505498170852661e-06, -2.0852312445640564e-06, -6.649643182754517e-07, 7.553026080131531e-07, 2.175569534301758e-06, 3.5958364605903625e-06, 5.016103386878967e-06, 6.436370313167572e-06, 7.856637239456177e-06, 9.276904165744781e-06, 1.0697171092033386e-05, 1.2117438018321991e-05, 1.3537704944610596e-05, 1.49579718708992e-05, 1.6378238797187805e-05, 1.779850572347641e-05, 1.9218772649765015e-05, 2.063903957605362e-05, 2.2059306502342224e-05, 2.347957342863083e-05, 2.4899840354919434e-05, 2.632010728120804e-05, 2.7740374207496643e-05, 2.9160641133785248e-05, 3.058090806007385e-05, 3.200117498636246e-05, 3.342144191265106e-05, 3.484170883893967e-05, 3.626197576522827e-05, 3.7682242691516876e-05, 3.910250961780548e-05, 4.0522776544094086e-05, 4.194304347038269e-05, 4.3363310396671295e-05, 4.47835773229599e-05, 4.6203844249248505e-05, 4.762411117553711e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 8.0, 19.0, 23.0, 49.0, 65.0, 133.0, 285.0, 706.0, 2518.0, 18554.0, 719232.0, 294034.0, 10024.0, 1784.0, 572.0, 240.0, 132.0, 65.0, 36.0, 21.0, 11.0, 11.0, 10.0, 10.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0208282470703125, -0.020342469215393066, -0.019856691360473633, -0.0193709135055542, -0.018885135650634766, -0.018399357795715332, -0.0179135799407959, -0.017427802085876465, -0.01694202423095703, -0.016456246376037598, -0.015970468521118164, -0.01548469066619873, -0.014998912811279297, -0.014513134956359863, -0.01402735710144043, -0.013541579246520996, -0.013055801391601562, -0.012570023536682129, -0.012084245681762695, -0.011598467826843262, -0.011112689971923828, -0.010626912117004395, -0.010141134262084961, -0.009655356407165527, -0.009169578552246094, -0.00868380069732666, -0.008198022842407227, -0.007712244987487793, -0.007226467132568359, -0.006740689277648926, -0.006254911422729492, -0.005769133567810059, -0.005283355712890625, -0.004797577857971191, -0.004311800003051758, -0.0038260221481323242, -0.0033402442932128906, -0.002854466438293457, -0.0023686885833740234, -0.0018829107284545898, -0.0013971328735351562, -0.0009113550186157227, -0.00042557716369628906, 6.020069122314453e-05, 0.0005459785461425781, 0.0010317564010620117, 0.0015175342559814453, 0.002003312110900879, 0.0024890899658203125, 0.002974867820739746, 0.0034606456756591797, 0.003946423530578613, 0.004432201385498047, 0.0049179792404174805, 0.005403757095336914, 0.005889534950256348, 0.006375312805175781, 0.006861090660095215, 0.0073468685150146484, 0.007832646369934082, 0.008318424224853516, 0.00880420207977295, 0.009289979934692383, 0.009775757789611816, 0.01026153564453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 5.0, 6.0, 12.0, 11.0, 21.0, 38.0, 33.0, 71.0, 80.0, 117.0, 165.0, 151.0, 102.0, 73.0, 47.0, 31.0, 16.0, 10.0, 11.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007404327392578125, -0.006900966167449951, -0.006397604942321777, -0.0058942437171936035, -0.00539088249206543, -0.004887521266937256, -0.004384160041809082, -0.003880798816680908, -0.0033774375915527344, -0.0028740763664245605, -0.0023707151412963867, -0.0018673539161682129, -0.001363992691040039, -0.0008606314659118652, -0.0003572702407836914, 0.00014609098434448242, 0.0006494522094726562, 0.00115281343460083, 0.001656174659729004, 0.0021595358848571777, 0.0026628971099853516, 0.0031662583351135254, 0.0036696195602416992, 0.004172980785369873, 0.004676342010498047, 0.005179703235626221, 0.0056830644607543945, 0.006186425685882568, 0.006689786911010742, 0.007193148136138916, 0.00769650936126709, 0.008199870586395264, 0.008703231811523438, 0.009206593036651611, 0.009709954261779785, 0.010213315486907959, 0.010716676712036133, 0.011220037937164307, 0.01172339916229248, 0.012226760387420654, 0.012730121612548828, 0.013233482837677002, 0.013736844062805176, 0.01424020528793335, 0.014743566513061523, 0.015246927738189697, 0.01575028896331787, 0.016253650188446045, 0.01675701141357422, 0.017260372638702393, 0.017763733863830566, 0.01826709508895874, 0.018770456314086914, 0.019273817539215088, 0.01977717876434326, 0.020280539989471436, 0.02078390121459961, 0.021287262439727783, 0.021790623664855957, 0.02229398488998413, 0.022797346115112305, 0.02330070734024048, 0.023804068565368652, 0.024307429790496826, 0.024810791015625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 4.0, 2.0, 4.0, 10.0, 12.0, 26.0, 38.0, 69.0, 106.0, 159.0, 164.0, 165.0, 113.0, 56.0, 37.0, 12.0, 12.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13776442408561707, -0.13234345614910126, -0.12692247331142426, -0.12150149792432785, -0.11608052253723145, -0.11065954715013504, -0.10523857176303864, -0.09981760382652283, -0.09439662098884583, -0.08897564560174942, -0.08355467021465302, -0.07813369482755661, -0.0727127194404602, -0.0672917440533638, -0.061870772391557693, -0.05644979700446129, -0.05102882534265518, -0.04560784995555878, -0.04018687456846237, -0.03476589918136597, -0.02934492565691471, -0.023923950269818306, -0.01850297674536705, -0.013082001358270645, -0.00766102597117424, -0.0022400510497391224, 0.0031809238716959953, 0.008601898327469826, 0.01402287371456623, 0.019443849101662636, 0.02486482262611389, 0.030285798013210297, 0.0357067734003067, 0.04112774878740311, 0.04654872417449951, 0.05196969956159592, 0.05739067494869232, 0.06281165033578873, 0.06823262572288513, 0.07365359365940094, 0.07907457649707794, 0.08449555188417435, 0.08991652727127075, 0.09533750265836716, 0.10075847804546356, 0.10617945343255997, 0.11160042881965637, 0.11702139675617218, 0.12244237214326859, 0.127863347530365, 0.1332843154668808, 0.1387052983045578, 0.1441262662410736, 0.1495472490787506, 0.15496821701526642, 0.16038919985294342, 0.16581016778945923, 0.17123113572597504, 0.17665211856365204, 0.18207308650016785, 0.18749406933784485, 0.19291503727436066, 0.19833602011203766, 0.20375698804855347, 0.20917797088623047]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 6.0, 4.0, 6.0, 11.0, 8.0, 17.0, 15.0, 18.0, 21.0, 41.0, 26.0, 49.0, 47.0, 48.0, 57.0, 55.0, 51.0, 47.0, 50.0, 40.0, 59.0, 57.0, 38.0, 30.0, 29.0, 34.0, 28.0, 20.0, 15.0, 13.0, 18.0, 7.0, 13.0, 10.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15233856439590454, -0.1469634473323822, -0.14158833026885986, -0.13621321320533752, -0.13083809614181519, -0.12546297907829285, -0.12008786201477051, -0.11471274495124817, -0.10933762788772583, -0.10396251082420349, -0.09858739376068115, -0.09321227669715881, -0.08783715963363647, -0.08246204257011414, -0.0770869255065918, -0.07171180844306946, -0.06633669137954712, -0.06096157431602478, -0.05558645725250244, -0.0502113401889801, -0.044836223125457764, -0.039461106061935425, -0.034085988998413086, -0.028710871934890747, -0.023335754871368408, -0.01796063780784607, -0.01258552074432373, -0.007210403680801392, -0.0018352866172790527, 0.003539830446243286, 0.008914947509765625, 0.014290064573287964, 0.019665181636810303, 0.02504029870033264, 0.03041541576385498, 0.03579053282737732, 0.04116564989089966, 0.046540766954422, 0.051915884017944336, 0.057291001081466675, 0.06266611814498901, 0.06804123520851135, 0.07341635227203369, 0.07879146933555603, 0.08416658639907837, 0.08954170346260071, 0.09491682052612305, 0.10029193758964539, 0.10566705465316772, 0.11104217171669006, 0.1164172887802124, 0.12179240584373474, 0.12716752290725708, 0.13254263997077942, 0.13791775703430176, 0.1432928740978241, 0.14866799116134644, 0.15404310822486877, 0.1594182252883911, 0.16479334235191345, 0.1701684594154358, 0.17554357647895813, 0.18091869354248047, 0.1862938106060028, 0.19166892766952515]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [7.0, 8.0, 17.0, 40.0, 77.0, 121.0, 285.0, 672.0, 1619.0, 4491.0, 17174.0, 131301.0, 3785033.0, 223609.0, 20859.0, 5392.0, 1946.0, 758.0, 392.0, 196.0, 111.0, 78.0, 55.0, 23.0, 14.0, 10.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0088653564453125, -0.008160829544067383, -0.007456302642822266, -0.0067517757415771484, -0.006047248840332031, -0.005342721939086914, -0.004638195037841797, -0.00393366813659668, -0.0032291412353515625, -0.0025246143341064453, -0.0018200874328613281, -0.001115560531616211, -0.00041103363037109375, 0.00029349327087402344, 0.0009980201721191406, 0.0017025470733642578, 0.002407073974609375, 0.003111600875854492, 0.0038161277770996094, 0.0045206546783447266, 0.005225181579589844, 0.005929708480834961, 0.006634235382080078, 0.007338762283325195, 0.008043289184570312, 0.00874781608581543, 0.009452342987060547, 0.010156869888305664, 0.010861396789550781, 0.011565923690795898, 0.012270450592041016, 0.012974977493286133, 0.01367950439453125, 0.014384031295776367, 0.015088558197021484, 0.0157930850982666, 0.01649761199951172, 0.017202138900756836, 0.017906665802001953, 0.01861119270324707, 0.019315719604492188, 0.020020246505737305, 0.020724773406982422, 0.02142930030822754, 0.022133827209472656, 0.022838354110717773, 0.02354288101196289, 0.024247407913208008, 0.024951934814453125, 0.025656461715698242, 0.02636098861694336, 0.027065515518188477, 0.027770042419433594, 0.02847456932067871, 0.029179096221923828, 0.029883623123168945, 0.030588150024414062, 0.03129267692565918, 0.0319972038269043, 0.032701730728149414, 0.03340625762939453, 0.03411078453063965, 0.034815311431884766, 0.03551983833312988, 0.036224365234375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 9.0, 6.0, 4.0, 6.0, 17.0, 15.0, 21.0, 35.0, 34.0, 43.0, 66.0, 79.0, 68.0, 69.0, 80.0, 84.0, 75.0, 76.0, 49.0, 31.0, 39.0, 34.0, 21.0, 12.0, 16.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010650634765625, -0.010231256484985352, -0.009811878204345703, -0.009392499923706055, -0.008973121643066406, -0.008553743362426758, -0.00813436508178711, -0.007714986801147461, -0.0072956085205078125, -0.006876230239868164, -0.006456851959228516, -0.006037473678588867, -0.005618095397949219, -0.00519871711730957, -0.004779338836669922, -0.0043599605560302734, -0.003940582275390625, -0.0035212039947509766, -0.003101825714111328, -0.0026824474334716797, -0.0022630691528320312, -0.0018436908721923828, -0.0014243125915527344, -0.001004934310913086, -0.0005855560302734375, -0.00016617774963378906, 0.0002532005310058594, 0.0006725788116455078, 0.0010919570922851562, 0.0015113353729248047, 0.0019307136535644531, 0.0023500919342041016, 0.00276947021484375, 0.0031888484954833984, 0.003608226776123047, 0.004027605056762695, 0.004446983337402344, 0.004866361618041992, 0.005285739898681641, 0.005705118179321289, 0.0061244964599609375, 0.006543874740600586, 0.006963253021240234, 0.007382631301879883, 0.007802009582519531, 0.00822138786315918, 0.008640766143798828, 0.009060144424438477, 0.009479522705078125, 0.009898900985717773, 0.010318279266357422, 0.01073765754699707, 0.011157035827636719, 0.011576414108276367, 0.011995792388916016, 0.012415170669555664, 0.012834548950195312, 0.013253927230834961, 0.01367330551147461, 0.014092683792114258, 0.014512062072753906, 0.014931440353393555, 0.015350818634033203, 0.01577019691467285, 0.0161895751953125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 19.0, 14.0, 26.0, 29.0, 49.0, 88.0, 163.0, 363.0, 1428.0, 9925.0, 158524.0, 3965390.0, 51900.0, 4863.0, 874.0, 282.0, 107.0, 73.0, 40.0, 32.0, 16.0, 17.0, 13.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.035736083984375, -0.03455781936645508, -0.033379554748535156, -0.032201290130615234, -0.031023025512695312, -0.02984476089477539, -0.02866649627685547, -0.027488231658935547, -0.026309967041015625, -0.025131702423095703, -0.02395343780517578, -0.02277517318725586, -0.021596908569335938, -0.020418643951416016, -0.019240379333496094, -0.018062114715576172, -0.01688385009765625, -0.015705585479736328, -0.014527320861816406, -0.013349056243896484, -0.012170791625976562, -0.01099252700805664, -0.009814262390136719, -0.008635997772216797, -0.007457733154296875, -0.006279468536376953, -0.005101203918457031, -0.003922939300537109, -0.0027446746826171875, -0.0015664100646972656, -0.00038814544677734375, 0.0007901191711425781, 0.0019683837890625, 0.003146648406982422, 0.004324913024902344, 0.005503177642822266, 0.0066814422607421875, 0.00785970687866211, 0.009037971496582031, 0.010216236114501953, 0.011394500732421875, 0.012572765350341797, 0.013751029968261719, 0.01492929458618164, 0.016107559204101562, 0.017285823822021484, 0.018464088439941406, 0.019642353057861328, 0.02082061767578125, 0.021998882293701172, 0.023177146911621094, 0.024355411529541016, 0.025533676147460938, 0.02671194076538086, 0.02789020538330078, 0.029068470001220703, 0.030246734619140625, 0.03142499923706055, 0.03260326385498047, 0.03378152847290039, 0.03495979309082031, 0.036138057708740234, 0.037316322326660156, 0.03849458694458008, 0.0396728515625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 8.0, 3.0, 3.0, 13.0, 13.0, 17.0, 27.0, 42.0, 67.0, 165.0, 457.0, 1282.0, 1158.0, 361.0, 172.0, 82.0, 42.0, 36.0, 31.0, 16.0, 17.0, 12.0, 9.0, 9.0, 2.0, 6.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022491455078125, -0.021789073944091797, -0.021086692810058594, -0.02038431167602539, -0.019681930541992188, -0.018979549407958984, -0.01827716827392578, -0.017574787139892578, -0.016872406005859375, -0.016170024871826172, -0.015467643737792969, -0.014765262603759766, -0.014062881469726562, -0.01336050033569336, -0.012658119201660156, -0.011955738067626953, -0.01125335693359375, -0.010550975799560547, -0.009848594665527344, -0.00914621353149414, -0.008443832397460938, -0.007741451263427734, -0.007039070129394531, -0.006336688995361328, -0.005634307861328125, -0.004931926727294922, -0.004229545593261719, -0.0035271644592285156, -0.0028247833251953125, -0.0021224021911621094, -0.0014200210571289062, -0.0007176399230957031, -1.52587890625e-05, 0.0006871223449707031, 0.0013895034790039062, 0.0020918846130371094, 0.0027942657470703125, 0.0034966468811035156, 0.004199028015136719, 0.004901409149169922, 0.005603790283203125, 0.006306171417236328, 0.007008552551269531, 0.007710933685302734, 0.008413314819335938, 0.00911569595336914, 0.009818077087402344, 0.010520458221435547, 0.01122283935546875, 0.011925220489501953, 0.012627601623535156, 0.01332998275756836, 0.014032363891601562, 0.014734745025634766, 0.015437126159667969, 0.016139507293701172, 0.016841888427734375, 0.017544269561767578, 0.01824665069580078, 0.018949031829833984, 0.019651412963867188, 0.02035379409790039, 0.021056175231933594, 0.021758556365966797, 0.0224609375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 14.0, 36.0, 125.0, 278.0, 325.0, 148.0, 38.0, 10.0, 7.0, 3.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1583833396434784, -0.14961114525794983, -0.14083895087242126, -0.1320667564868927, -0.12329456210136414, -0.11452236771583557, -0.105750173330307, -0.09697797894477844, -0.08820578455924988, -0.07943359017372131, -0.07066139578819275, -0.061889201402664185, -0.05311700701713562, -0.044344812631607056, -0.03557261824607849, -0.026800423860549927, -0.018028229475021362, -0.009256035089492798, -0.0004838407039642334, 0.008288353681564331, 0.017060548067092896, 0.02583274245262146, 0.034604936838150024, 0.04337713122367859, 0.05214932560920715, 0.06092151999473572, 0.06969371438026428, 0.07846590876579285, 0.08723810315132141, 0.09601029753684998, 0.10478249192237854, 0.1135546863079071, 0.12232691049575806, 0.13109910488128662, 0.13987129926681519, 0.14864349365234375, 0.15741568803787231, 0.16618788242340088, 0.17496007680892944, 0.183732271194458, 0.19250446557998657, 0.20127665996551514, 0.2100488543510437, 0.21882104873657227, 0.22759324312210083, 0.2363654375076294, 0.24513763189315796, 0.2539098262786865, 0.2626820206642151, 0.27145421504974365, 0.2802264094352722, 0.2889986038208008, 0.29777079820632935, 0.3065429925918579, 0.3153151869773865, 0.32408738136291504, 0.3328595757484436, 0.34163177013397217, 0.35040396451950073, 0.3591761589050293, 0.36794835329055786, 0.3767205476760864, 0.385492742061615, 0.39426493644714355, 0.4030371308326721]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 8.0, 17.0, 12.0, 10.0, 13.0, 18.0, 36.0, 31.0, 30.0, 44.0, 53.0, 64.0, 46.0, 52.0, 52.0, 61.0, 46.0, 50.0, 56.0, 44.0, 45.0, 46.0, 30.0, 28.0, 28.0, 24.0, 11.0, 14.0, 7.0, 6.0, 8.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10541015863418579, -0.1023077666759491, -0.0992053747177124, -0.09610298275947571, -0.09300059080123901, -0.08989819884300232, -0.08679580688476562, -0.08369341492652893, -0.08059102296829224, -0.07748863101005554, -0.07438623905181885, -0.07128384709358215, -0.06818145513534546, -0.06507906317710876, -0.06197667121887207, -0.058874279260635376, -0.05577188730239868, -0.05266949534416199, -0.04956710338592529, -0.0464647114276886, -0.043362319469451904, -0.04025992751121521, -0.037157535552978516, -0.03405514359474182, -0.030952751636505127, -0.027850359678268433, -0.02474796772003174, -0.021645575761795044, -0.01854318380355835, -0.015440791845321655, -0.012338399887084961, -0.009236007928848267, -0.006133615970611572, -0.003031224012374878, 7.11679458618164e-05, 0.0031735599040985107, 0.006275951862335205, 0.0093783438205719, 0.012480735778808594, 0.015583127737045288, 0.018685519695281982, 0.021787911653518677, 0.02489030361175537, 0.027992695569992065, 0.03109508752822876, 0.034197479486465454, 0.03729987144470215, 0.04040226340293884, 0.04350465536117554, 0.04660704731941223, 0.049709439277648926, 0.05281183123588562, 0.055914223194122314, 0.05901661515235901, 0.0621190071105957, 0.0652213990688324, 0.06832379102706909, 0.07142618298530579, 0.07452857494354248, 0.07763096690177917, 0.08073335886001587, 0.08383575081825256, 0.08693814277648926, 0.09004053473472595, 0.09314292669296265]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 15.0, 21.0, 28.0, 39.0, 55.0, 89.0, 121.0, 194.0, 263.0, 426.0, 748.0, 1243.0, 2160.0, 3930.0, 7568.0, 15461.0, 35413.0, 83618.0, 200074.0, 324560.0, 211293.0, 89665.0, 37650.0, 16361.0, 7959.0, 4086.0, 2201.0, 1263.0, 730.0, 446.0, 275.0, 198.0, 140.0, 83.0, 55.0, 39.0, 27.0, 21.0, 7.0, 2.0, 5.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0097808837890625, -0.00946056842803955, -0.009140253067016602, -0.008819937705993652, -0.008499622344970703, -0.008179306983947754, -0.007858991622924805, -0.0075386762619018555, -0.007218360900878906, -0.006898045539855957, -0.006577730178833008, -0.006257414817810059, -0.005937099456787109, -0.00561678409576416, -0.005296468734741211, -0.004976153373718262, -0.0046558380126953125, -0.004335522651672363, -0.004015207290649414, -0.003694891929626465, -0.0033745765686035156, -0.0030542612075805664, -0.002733945846557617, -0.002413630485534668, -0.0020933151245117188, -0.0017729997634887695, -0.0014526844024658203, -0.001132369041442871, -0.0008120536804199219, -0.0004917383193969727, -0.00017142295837402344, 0.00014889240264892578, 0.000469207763671875, 0.0007895231246948242, 0.0011098384857177734, 0.0014301538467407227, 0.0017504692077636719, 0.002070784568786621, 0.0023910999298095703, 0.0027114152908325195, 0.0030317306518554688, 0.003352046012878418, 0.003672361373901367, 0.003992676734924316, 0.004312992095947266, 0.004633307456970215, 0.004953622817993164, 0.005273938179016113, 0.0055942535400390625, 0.005914568901062012, 0.006234884262084961, 0.00655519962310791, 0.006875514984130859, 0.007195830345153809, 0.007516145706176758, 0.007836461067199707, 0.008156776428222656, 0.008477091789245605, 0.008797407150268555, 0.009117722511291504, 0.009438037872314453, 0.009758353233337402, 0.010078668594360352, 0.0103989839553833, 0.01071929931640625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 4.0, 6.0, 14.0, 10.0, 27.0, 32.0, 39.0, 37.0, 43.0, 60.0, 50.0, 67.0, 63.0, 66.0, 73.0, 64.0, 74.0, 54.0, 38.0, 46.0, 35.0, 18.0, 21.0, 14.0, 10.0, 11.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.01113128662109375, -0.01076650619506836, -0.010401725769042969, -0.010036945343017578, -0.009672164916992188, -0.009307384490966797, -0.008942604064941406, -0.008577823638916016, -0.008213043212890625, -0.007848262786865234, -0.007483482360839844, -0.007118701934814453, -0.0067539215087890625, -0.006389141082763672, -0.006024360656738281, -0.005659580230712891, -0.0052947998046875, -0.004930019378662109, -0.004565238952636719, -0.004200458526611328, -0.0038356781005859375, -0.003470897674560547, -0.0031061172485351562, -0.0027413368225097656, -0.002376556396484375, -0.0020117759704589844, -0.0016469955444335938, -0.0012822151184082031, -0.0009174346923828125, -0.0005526542663574219, -0.00018787384033203125, 0.00017690658569335938, 0.00054168701171875, 0.0009064674377441406, 0.0012712478637695312, 0.0016360282897949219, 0.0020008087158203125, 0.002365589141845703, 0.0027303695678710938, 0.0030951499938964844, 0.003459930419921875, 0.0038247108459472656, 0.004189491271972656, 0.004554271697998047, 0.0049190521240234375, 0.005283832550048828, 0.005648612976074219, 0.006013393402099609, 0.006378173828125, 0.006742954254150391, 0.007107734680175781, 0.007472515106201172, 0.007837295532226562, 0.008202075958251953, 0.008566856384277344, 0.008931636810302734, 0.009296417236328125, 0.009661197662353516, 0.010025978088378906, 0.010390758514404297, 0.010755538940429688, 0.011120319366455078, 0.011485099792480469, 0.01184988021850586, 0.01221466064453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 10.0, 7.0, 12.0, 29.0, 43.0, 69.0, 115.0, 201.0, 360.0, 672.0, 1335.0, 3707.0, 19807.0, 378063.0, 608874.0, 27551.0, 4390.0, 1571.0, 760.0, 384.0, 237.0, 140.0, 73.0, 57.0, 27.0, 23.0, 14.0, 8.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.039215087890625, -0.03821134567260742, -0.037207603454589844, -0.036203861236572266, -0.03520011901855469, -0.03419637680053711, -0.03319263458251953, -0.03218889236450195, -0.031185150146484375, -0.030181407928466797, -0.02917766571044922, -0.02817392349243164, -0.027170181274414062, -0.026166439056396484, -0.025162696838378906, -0.024158954620361328, -0.02315521240234375, -0.022151470184326172, -0.021147727966308594, -0.020143985748291016, -0.019140243530273438, -0.01813650131225586, -0.01713275909423828, -0.016129016876220703, -0.015125274658203125, -0.014121532440185547, -0.013117790222167969, -0.01211404800415039, -0.011110305786132812, -0.010106563568115234, -0.009102821350097656, -0.008099079132080078, -0.0070953369140625, -0.006091594696044922, -0.005087852478027344, -0.004084110260009766, -0.0030803680419921875, -0.0020766258239746094, -0.0010728836059570312, -6.914138793945312e-05, 0.000934600830078125, 0.0019383430480957031, 0.0029420852661132812, 0.003945827484130859, 0.0049495697021484375, 0.005953311920166016, 0.006957054138183594, 0.007960796356201172, 0.00896453857421875, 0.009968280792236328, 0.010972023010253906, 0.011975765228271484, 0.012979507446289062, 0.01398324966430664, 0.014986991882324219, 0.015990734100341797, 0.016994476318359375, 0.017998218536376953, 0.01900196075439453, 0.02000570297241211, 0.021009445190429688, 0.022013187408447266, 0.023016929626464844, 0.024020671844482422, 0.0250244140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 6.0, 13.0, 6.0, 15.0, 22.0, 23.0, 15.0, 22.0, 34.0, 44.0, 41.0, 31.0, 58.0, 41.0, 51.0, 38.0, 37.0, 46.0, 38.0, 47.0, 47.0, 59.0, 27.0, 45.0, 23.0, 27.0, 23.0, 22.0, 16.0, 10.0, 14.0, 10.0, 7.0, 6.0, 4.0, 3.0, 13.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0308837890625, -0.029927968978881836, -0.028972148895263672, -0.028016328811645508, -0.027060508728027344, -0.02610468864440918, -0.025148868560791016, -0.02419304847717285, -0.023237228393554688, -0.022281408309936523, -0.02132558822631836, -0.020369768142700195, -0.01941394805908203, -0.018458127975463867, -0.017502307891845703, -0.01654648780822754, -0.015590667724609375, -0.014634847640991211, -0.013679027557373047, -0.012723207473754883, -0.011767387390136719, -0.010811567306518555, -0.00985574722290039, -0.008899927139282227, -0.007944107055664062, -0.0069882869720458984, -0.006032466888427734, -0.00507664680480957, -0.004120826721191406, -0.003165006637573242, -0.002209186553955078, -0.001253366470336914, -0.00029754638671875, 0.0006582736968994141, 0.0016140937805175781, 0.002569913864135742, 0.0035257339477539062, 0.00448155403137207, 0.005437374114990234, 0.0063931941986083984, 0.0073490142822265625, 0.008304834365844727, 0.00926065444946289, 0.010216474533081055, 0.011172294616699219, 0.012128114700317383, 0.013083934783935547, 0.014039754867553711, 0.014995574951171875, 0.01595139503479004, 0.016907215118408203, 0.017863035202026367, 0.01881885528564453, 0.019774675369262695, 0.02073049545288086, 0.021686315536499023, 0.022642135620117188, 0.02359795570373535, 0.024553775787353516, 0.02550959587097168, 0.026465415954589844, 0.027421236038208008, 0.028377056121826172, 0.029332876205444336, 0.0302886962890625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 12.0, 11.0, 17.0, 24.0, 16.0, 41.0, 40.0, 77.0, 121.0, 250.0, 373.0, 747.0, 1545.0, 4424.0, 30148.0, 985486.0, 18566.0, 3685.0, 1380.0, 631.0, 352.0, 210.0, 133.0, 67.0, 66.0, 27.0, 24.0, 17.0, 15.0, 4.0, 9.0, 4.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.037750244140625, -0.03665351867675781, -0.035556793212890625, -0.03446006774902344, -0.03336334228515625, -0.03226661682128906, -0.031169891357421875, -0.030073165893554688, -0.0289764404296875, -0.027879714965820312, -0.026782989501953125, -0.025686264038085938, -0.02458953857421875, -0.023492813110351562, -0.022396087646484375, -0.021299362182617188, -0.02020263671875, -0.019105911254882812, -0.018009185791015625, -0.016912460327148438, -0.01581573486328125, -0.014719009399414062, -0.013622283935546875, -0.012525558471679688, -0.0114288330078125, -0.010332107543945312, -0.009235382080078125, -0.008138656616210938, -0.00704193115234375, -0.0059452056884765625, -0.004848480224609375, -0.0037517547607421875, -0.002655029296875, -0.0015583038330078125, -0.000461578369140625, 0.0006351470947265625, 0.00173187255859375, 0.0028285980224609375, 0.003925323486328125, 0.0050220489501953125, 0.0061187744140625, 0.0072154998779296875, 0.008312225341796875, 0.009408950805664062, 0.01050567626953125, 0.011602401733398438, 0.012699127197265625, 0.013795852661132812, 0.014892578125, 0.015989303588867188, 0.017086029052734375, 0.018182754516601562, 0.01927947998046875, 0.020376205444335938, 0.021472930908203125, 0.022569656372070312, 0.0236663818359375, 0.024763107299804688, 0.025859832763671875, 0.026956558227539062, 0.02805328369140625, 0.029150009155273438, 0.030246734619140625, 0.03134346008300781, 0.032440185546875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 9.0, 8.0, 14.0, 8.0, 19.0, 18.0, 23.0, 41.0, 37.0, 62.0, 62.0, 59.0, 87.0, 87.0, 65.0, 63.0, 57.0, 62.0, 33.0, 31.0, 35.0, 28.0, 8.0, 12.0, 9.0, 10.0, 7.0, 7.0, 3.0, 1.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6716461181640625e-05, -3.55355441570282e-05, -3.435462713241577e-05, -3.3173710107803345e-05, -3.199279308319092e-05, -3.081187605857849e-05, -2.9630959033966064e-05, -2.8450042009353638e-05, -2.726912498474121e-05, -2.6088207960128784e-05, -2.4907290935516357e-05, -2.372637391090393e-05, -2.2545456886291504e-05, -2.1364539861679077e-05, -2.018362283706665e-05, -1.9002705812454224e-05, -1.7821788787841797e-05, -1.664087176322937e-05, -1.5459954738616943e-05, -1.4279037714004517e-05, -1.309812068939209e-05, -1.1917203664779663e-05, -1.0736286640167236e-05, -9.55536961555481e-06, -8.374452590942383e-06, -7.193535566329956e-06, -6.012618541717529e-06, -4.8317015171051025e-06, -3.6507844924926758e-06, -2.469867467880249e-06, -1.2889504432678223e-06, -1.0803341865539551e-07, 1.0728836059570312e-06, 2.253800630569458e-06, 3.4347176551818848e-06, 4.6156346797943115e-06, 5.796551704406738e-06, 6.977468729019165e-06, 8.158385753631592e-06, 9.339302778244019e-06, 1.0520219802856445e-05, 1.1701136827468872e-05, 1.2882053852081299e-05, 1.4062970876693726e-05, 1.5243887901306152e-05, 1.642480492591858e-05, 1.7605721950531006e-05, 1.8786638975143433e-05, 1.996755599975586e-05, 2.1148473024368286e-05, 2.2329390048980713e-05, 2.351030707359314e-05, 2.4691224098205566e-05, 2.5872141122817993e-05, 2.705305814743042e-05, 2.8233975172042847e-05, 2.9414892196655273e-05, 3.05958092212677e-05, 3.177672624588013e-05, 3.2957643270492554e-05, 3.413856029510498e-05, 3.531947731971741e-05, 3.6500394344329834e-05, 3.768131136894226e-05, 3.886222839355469e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 10.0, 9.0, 11.0, 15.0, 21.0, 32.0, 39.0, 58.0, 109.0, 224.0, 674.0, 2017.0, 12253.0, 979585.0, 48095.0, 3717.0, 944.0, 334.0, 143.0, 102.0, 50.0, 19.0, 25.0, 9.0, 13.0, 7.0, 10.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0418701171875, -0.04069709777832031, -0.039524078369140625, -0.03835105895996094, -0.03717803955078125, -0.03600502014160156, -0.034832000732421875, -0.03365898132324219, -0.0324859619140625, -0.03131294250488281, -0.030139923095703125, -0.028966903686523438, -0.02779388427734375, -0.026620864868164062, -0.025447845458984375, -0.024274826049804688, -0.023101806640625, -0.021928787231445312, -0.020755767822265625, -0.019582748413085938, -0.01840972900390625, -0.017236709594726562, -0.016063690185546875, -0.014890670776367188, -0.0137176513671875, -0.012544631958007812, -0.011371612548828125, -0.010198593139648438, -0.00902557373046875, -0.007852554321289062, -0.006679534912109375, -0.0055065155029296875, -0.00433349609375, -0.0031604766845703125, -0.001987457275390625, -0.0008144378662109375, 0.00035858154296875, 0.0015316009521484375, 0.002704620361328125, 0.0038776397705078125, 0.0050506591796875, 0.0062236785888671875, 0.007396697998046875, 0.008569717407226562, 0.00974273681640625, 0.010915756225585938, 0.012088775634765625, 0.013261795043945312, 0.014434814453125, 0.015607833862304688, 0.016780853271484375, 0.017953872680664062, 0.01912689208984375, 0.020299911499023438, 0.021472930908203125, 0.022645950317382812, 0.0238189697265625, 0.024991989135742188, 0.026165008544921875, 0.027338027954101562, 0.02851104736328125, 0.029684066772460938, 0.030857086181640625, 0.03203010559082031, 0.033203125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 14.0, 20.0, 59.0, 106.0, 251.0, 246.0, 155.0, 71.0, 24.0, 18.0, 8.0, 0.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0364990234375, -0.03554248809814453, -0.03458595275878906, -0.033629417419433594, -0.032672882080078125, -0.031716346740722656, -0.030759811401367188, -0.02980327606201172, -0.02884674072265625, -0.02789020538330078, -0.026933670043945312, -0.025977134704589844, -0.025020599365234375, -0.024064064025878906, -0.023107528686523438, -0.02215099334716797, -0.0211944580078125, -0.02023792266845703, -0.019281387329101562, -0.018324851989746094, -0.017368316650390625, -0.016411781311035156, -0.015455245971679688, -0.014498710632324219, -0.01354217529296875, -0.012585639953613281, -0.011629104614257812, -0.010672569274902344, -0.009716033935546875, -0.008759498596191406, -0.0078029632568359375, -0.006846427917480469, -0.005889892578125, -0.004933357238769531, -0.0039768218994140625, -0.0030202865600585938, -0.002063751220703125, -0.0011072158813476562, -0.0001506805419921875, 0.0008058547973632812, 0.00176239013671875, 0.0027189254760742188, 0.0036754608154296875, 0.004631996154785156, 0.005588531494140625, 0.006545066833496094, 0.0075016021728515625, 0.008458137512207031, 0.0094146728515625, 0.010371208190917969, 0.011327743530273438, 0.012284278869628906, 0.013240814208984375, 0.014197349548339844, 0.015153884887695312, 0.01611042022705078, 0.01706695556640625, 0.01802349090576172, 0.018980026245117188, 0.019936561584472656, 0.020893096923828125, 0.021849632263183594, 0.022806167602539062, 0.02376270294189453, 0.02471923828125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 9.0, 14.0, 51.0, 206.0, 455.0, 217.0, 32.0, 9.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.1172791719436646, -1.0975604057312012, -1.0778415203094482, -1.0581227540969849, -1.038403868675232, -1.0186851024627686, -0.9989662170410156, -0.9792473912239075, -0.9595285654067993, -0.9398097395896912, -0.920090913772583, -0.9003720879554749, -0.8806532621383667, -0.8609344363212585, -0.8412156105041504, -0.8214967846870422, -0.8017779588699341, -0.7820591330528259, -0.7623403072357178, -0.7426214814186096, -0.7229026556015015, -0.7031838297843933, -0.6834650039672852, -0.663746178150177, -0.6440274119377136, -0.6243085861206055, -0.6045897603034973, -0.5848709344863892, -0.565152108669281, -0.5454332828521729, -0.5257144570350647, -0.5059956312179565, -0.486276775598526, -0.46655794978141785, -0.4468391239643097, -0.42712029814720154, -0.4074014723300934, -0.38768264651298523, -0.36796385049819946, -0.3482450246810913, -0.32852619886398315, -0.308807373046875, -0.28908854722976685, -0.2693697214126587, -0.24965089559555054, -0.22993206977844238, -0.21021325886249542, -0.19049443304538727, -0.17077559232711792, -0.15105676651000977, -0.1313379406929016, -0.11161912232637405, -0.0919002965092659, -0.07218147069215775, -0.05246265232563019, -0.032743826508522034, -0.01302500069141388, 0.006693823263049126, 0.02641264721751213, 0.04613146930932999, 0.06585029512643814, 0.0855691209435463, 0.10528793931007385, 0.125006765127182, 0.14472559094429016]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 7.0, 11.0, 11.0, 18.0, 18.0, 16.0, 23.0, 23.0, 27.0, 31.0, 38.0, 39.0, 51.0, 58.0, 51.0, 58.0, 46.0, 49.0, 45.0, 36.0, 46.0, 40.0, 42.0, 44.0, 15.0, 17.0, 20.0, 15.0, 18.0, 17.0, 18.0, 10.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12390303611755371, -0.11959967762231827, -0.11529632657766342, -0.11099296808242798, -0.10668961703777313, -0.10238625854253769, -0.09808290004730225, -0.0937795490026474, -0.08947619050741196, -0.08517283201217651, -0.08086948096752167, -0.07656612247228622, -0.07226276397705078, -0.06795941293239594, -0.06365605443716049, -0.05935269966721535, -0.0550493448972702, -0.05074599012732506, -0.04644263535737991, -0.04213927686214447, -0.037835922092199326, -0.03353256732225418, -0.029229210689663887, -0.024925854057073593, -0.02062249928712845, -0.016319144517183304, -0.01201578788459301, -0.007712432183325291, -0.0034090764820575714, 0.0008942782878875732, 0.005197634920477867, 0.009500991553068161, 0.013804346323013306, 0.01810770109295845, 0.022411057725548744, 0.026714414358139038, 0.031017769128084183, 0.03532112389802933, 0.03962448239326477, 0.043927837163209915, 0.04823119193315506, 0.052534546703100204, 0.05683790147304535, 0.06114125996828079, 0.06544461846351624, 0.06974796950817108, 0.07405132800340652, 0.07835468649864197, 0.08265803754329681, 0.08696139603853226, 0.0912647470831871, 0.09556810557842255, 0.09987145662307739, 0.10417481511831284, 0.10847817361354828, 0.11278152465820312, 0.11708488315343857, 0.12138824164867401, 0.12569159269332886, 0.1299949437379837, 0.13429830968379974, 0.1386016607284546, 0.14290501177310944, 0.14720837771892548, 0.15151172876358032]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 30.0, 97.0, 315.0, 3732431.0, 461009.0, 299.0, 81.0, 22.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09100341796875, -0.07580280303955078, -0.06060218811035156, -0.045401573181152344, -0.030200958251953125, -0.015000343322753906, 0.0002002716064453125, 0.015400886535644531, 0.03060150146484375, 0.04580211639404297, 0.06100273132324219, 0.0762033462524414, 0.09140396118164062, 0.10660457611083984, 0.12180519104003906, 0.13700580596923828, 0.1522064208984375, 0.16740703582763672, 0.18260765075683594, 0.19780826568603516, 0.21300888061523438, 0.2282094955444336, 0.2434101104736328, 0.25861072540283203, 0.27381134033203125, 0.28901195526123047, 0.3042125701904297, 0.3194131851196289, 0.3346138000488281, 0.34981441497802734, 0.36501502990722656, 0.3802156448364258, 0.395416259765625, 0.4106168746948242, 0.42581748962402344, 0.44101810455322266, 0.4562187194824219, 0.4714193344116211, 0.4866199493408203, 0.5018205642700195, 0.5170211791992188, 0.532221794128418, 0.5474224090576172, 0.5626230239868164, 0.5778236389160156, 0.5930242538452148, 0.6082248687744141, 0.6234254837036133, 0.6386260986328125, 0.6538267135620117, 0.6690273284912109, 0.6842279434204102, 0.6994285583496094, 0.7146291732788086, 0.7298297882080078, 0.745030403137207, 0.7602310180664062, 0.7754316329956055, 0.7906322479248047, 0.8058328628540039, 0.8210334777832031, 0.8362340927124023, 0.8514347076416016, 0.8666353225708008, 0.8818359375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 8.0, 5.0, 13.0, 14.0, 16.0, 33.0, 39.0, 54.0, 57.0, 74.0, 68.0, 63.0, 67.0, 91.0, 78.0, 71.0, 40.0, 44.0, 39.0, 27.0, 25.0, 27.0, 14.0, 12.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01158905029296875, -0.0111846923828125, -0.01078033447265625, -0.0103759765625, -0.00997161865234375, -0.0095672607421875, -0.00916290283203125, -0.008758544921875, -0.00835418701171875, -0.0079498291015625, -0.00754547119140625, -0.00714111328125, -0.00673675537109375, -0.0063323974609375, -0.00592803955078125, -0.005523681640625, -0.00511932373046875, -0.0047149658203125, -0.00431060791015625, -0.00390625, -0.00350189208984375, -0.0030975341796875, -0.00269317626953125, -0.002288818359375, -0.00188446044921875, -0.0014801025390625, -0.00107574462890625, -0.00067138671875, -0.00026702880859375, 0.0001373291015625, 0.00054168701171875, 0.000946044921875, 0.00135040283203125, 0.0017547607421875, 0.00215911865234375, 0.0025634765625, 0.00296783447265625, 0.0033721923828125, 0.00377655029296875, 0.004180908203125, 0.00458526611328125, 0.0049896240234375, 0.00539398193359375, 0.00579833984375, 0.00620269775390625, 0.0066070556640625, 0.00701141357421875, 0.007415771484375, 0.00782012939453125, 0.0082244873046875, 0.00862884521484375, 0.009033203125, 0.00943756103515625, 0.0098419189453125, 0.01024627685546875, 0.010650634765625, 0.01105499267578125, 0.0114593505859375, 0.01186370849609375, 0.01226806640625, 0.01267242431640625, 0.0130767822265625, 0.01348114013671875, 0.013885498046875, 0.01428985595703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 14.0, 21.0, 39.0, 75.0, 120.0, 288.0, 993.0, 10205.0, 3995052.0, 182189.0, 4138.0, 726.0, 217.0, 114.0, 48.0, 20.0, 10.0, 7.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07452392578125, -0.07238340377807617, -0.07024288177490234, -0.06810235977172852, -0.06596183776855469, -0.06382131576538086, -0.06168079376220703, -0.0595402717590332, -0.057399749755859375, -0.05525922775268555, -0.05311870574951172, -0.05097818374633789, -0.04883766174316406, -0.046697139739990234, -0.044556617736816406, -0.04241609573364258, -0.04027557373046875, -0.03813505172729492, -0.035994529724121094, -0.033854007720947266, -0.03171348571777344, -0.02957296371459961, -0.02743244171142578, -0.025291919708251953, -0.023151397705078125, -0.021010875701904297, -0.01887035369873047, -0.01672983169555664, -0.014589309692382812, -0.012448787689208984, -0.010308265686035156, -0.008167743682861328, -0.0060272216796875, -0.003886699676513672, -0.0017461776733398438, 0.0003943443298339844, 0.0025348663330078125, 0.004675388336181641, 0.006815910339355469, 0.008956432342529297, 0.011096954345703125, 0.013237476348876953, 0.015377998352050781, 0.01751852035522461, 0.019659042358398438, 0.021799564361572266, 0.023940086364746094, 0.026080608367919922, 0.02822113037109375, 0.030361652374267578, 0.032502174377441406, 0.034642696380615234, 0.03678321838378906, 0.03892374038696289, 0.04106426239013672, 0.04320478439331055, 0.045345306396484375, 0.0474858283996582, 0.04962635040283203, 0.05176687240600586, 0.05390739440917969, 0.056047916412353516, 0.058188438415527344, 0.06032896041870117, 0.062469482421875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 14.0, 26.0, 50.0, 126.0, 602.0, 2282.0, 687.0, 158.0, 59.0, 28.0, 9.0, 12.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047454833984375, -0.04615640640258789, -0.04485797882080078, -0.04355955123901367, -0.04226112365722656, -0.04096269607543945, -0.039664268493652344, -0.038365840911865234, -0.037067413330078125, -0.035768985748291016, -0.034470558166503906, -0.0331721305847168, -0.03187370300292969, -0.030575275421142578, -0.02927684783935547, -0.02797842025756836, -0.02667999267578125, -0.02538156509399414, -0.02408313751220703, -0.022784709930419922, -0.021486282348632812, -0.020187854766845703, -0.018889427185058594, -0.017590999603271484, -0.016292572021484375, -0.014994144439697266, -0.013695716857910156, -0.012397289276123047, -0.011098861694335938, -0.009800434112548828, -0.008502006530761719, -0.007203578948974609, -0.0059051513671875, -0.004606723785400391, -0.0033082962036132812, -0.002009868621826172, -0.0007114410400390625, 0.0005869865417480469, 0.0018854141235351562, 0.0031838417053222656, 0.004482269287109375, 0.005780696868896484, 0.007079124450683594, 0.008377552032470703, 0.009675979614257812, 0.010974407196044922, 0.012272834777832031, 0.01357126235961914, 0.01486968994140625, 0.01616811752319336, 0.01746654510498047, 0.018764972686767578, 0.020063400268554688, 0.021361827850341797, 0.022660255432128906, 0.023958683013916016, 0.025257110595703125, 0.026555538177490234, 0.027853965759277344, 0.029152393341064453, 0.030450820922851562, 0.03174924850463867, 0.03304767608642578, 0.03434610366821289, 0.03564453125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 7.0, 31.0, 106.0, 325.0, 335.0, 119.0, 41.0, 13.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28381311893463135, -0.27367180585861206, -0.2635304927825928, -0.2533891499042511, -0.2432478368282318, -0.23310652375221252, -0.22296521067619324, -0.21282389760017395, -0.20268256962299347, -0.19254125654697418, -0.1823999285697937, -0.17225861549377441, -0.16211730241775513, -0.15197597444057465, -0.14183466136455536, -0.13169333338737488, -0.12155202031135559, -0.1114106997847557, -0.10126937925815582, -0.09112806618213654, -0.08098674565553665, -0.07084542512893677, -0.06070410832762718, -0.050562791526317596, -0.04042147099971771, -0.030280152335762978, -0.020138833671808243, -0.009997515007853508, 0.0001438036561012268, 0.01028512418270111, 0.020426440984010696, 0.030567757785320282, 0.040709108114242554, 0.05085042864084244, 0.06099174544215202, 0.07113306224346161, 0.08127438277006149, 0.09141570329666138, 0.10155701637268066, 0.11169833689928055, 0.12183965742588043, 0.13198097050189972, 0.1421222984790802, 0.1522636115550995, 0.16240492463111877, 0.17254625260829926, 0.18268756568431854, 0.19282889366149902, 0.2029702067375183, 0.2131115198135376, 0.22325284779071808, 0.23339416086673737, 0.24353548884391785, 0.25367680191993713, 0.2638181149959564, 0.2739594280719757, 0.2841007709503174, 0.29424208402633667, 0.30438339710235596, 0.31452473998069763, 0.3246660530567169, 0.3348073661327362, 0.3449486792087555, 0.3550899922847748, 0.36523130536079407]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 8.0, 4.0, 12.0, 23.0, 25.0, 36.0, 41.0, 61.0, 47.0, 55.0, 67.0, 76.0, 66.0, 73.0, 75.0, 63.0, 52.0, 48.0, 39.0, 33.0, 27.0, 18.0, 18.0, 14.0, 8.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.13489288091659546, -0.13153484463691711, -0.12817679345607758, -0.12481874972581863, -0.12146070599555969, -0.11810266226530075, -0.11474461853504181, -0.11138657480478287, -0.10802853107452393, -0.10467048734426498, -0.10131244361400604, -0.0979543998837471, -0.09459635615348816, -0.09123831242322922, -0.08788026869297028, -0.08452222496271133, -0.08116418123245239, -0.07780613750219345, -0.07444809377193451, -0.07109005004167557, -0.06773200631141663, -0.06437396258115768, -0.06101591885089874, -0.0576578751206398, -0.05429983139038086, -0.05094178766012192, -0.047583743929862976, -0.044225700199604034, -0.04086765646934509, -0.03750961273908615, -0.03415156900882721, -0.030793525278568268, -0.027435481548309326, -0.024077437818050385, -0.020719394087791443, -0.0173613503575325, -0.01400330662727356, -0.010645262897014618, -0.007287219166755676, -0.003929175436496735, -0.000571131706237793, 0.0027869120240211487, 0.00614495575428009, 0.009502999484539032, 0.012861043214797974, 0.016219086945056915, 0.019577130675315857, 0.0229351744055748, 0.02629321813583374, 0.029651261866092682, 0.033009305596351624, 0.036367349326610565, 0.03972539305686951, 0.04308343678712845, 0.04644148051738739, 0.04979952424764633, 0.05315756797790527, 0.056515611708164215, 0.05987365543842316, 0.0632316991686821, 0.06658974289894104, 0.06994778662919998, 0.07330583035945892, 0.07666387408971786, 0.0800219178199768]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 9.0, 16.0, 47.0, 113.0, 360.0, 1297.0, 5971.0, 38052.0, 374656.0, 556760.0, 60301.0, 8454.0, 1820.0, 451.0, 141.0, 56.0, 18.0, 12.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0295867919921875, -0.028453588485717773, -0.027320384979248047, -0.02618718147277832, -0.025053977966308594, -0.023920774459838867, -0.02278757095336914, -0.021654367446899414, -0.020521163940429688, -0.01938796043395996, -0.018254756927490234, -0.017121553421020508, -0.01598834991455078, -0.014855146408081055, -0.013721942901611328, -0.012588739395141602, -0.011455535888671875, -0.010322332382202148, -0.009189128875732422, -0.008055925369262695, -0.006922721862792969, -0.005789518356323242, -0.004656314849853516, -0.003523111343383789, -0.0023899078369140625, -0.001256704330444336, -0.00012350082397460938, 0.0010097026824951172, 0.0021429061889648438, 0.0032761096954345703, 0.004409313201904297, 0.0055425167083740234, 0.00667572021484375, 0.0078089237213134766, 0.008942127227783203, 0.01007533073425293, 0.011208534240722656, 0.012341737747192383, 0.01347494125366211, 0.014608144760131836, 0.015741348266601562, 0.01687455177307129, 0.018007755279541016, 0.019140958786010742, 0.02027416229248047, 0.021407365798950195, 0.022540569305419922, 0.02367377281188965, 0.024806976318359375, 0.0259401798248291, 0.027073383331298828, 0.028206586837768555, 0.02933979034423828, 0.030472993850708008, 0.031606197357177734, 0.03273940086364746, 0.03387260437011719, 0.035005807876586914, 0.03613901138305664, 0.03727221488952637, 0.038405418395996094, 0.03953862190246582, 0.04067182540893555, 0.04180502891540527, 0.042938232421875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 10.0, 6.0, 3.0, 2.0, 7.0, 10.0, 14.0, 19.0, 33.0, 28.0, 36.0, 47.0, 60.0, 51.0, 56.0, 53.0, 65.0, 71.0, 76.0, 43.0, 51.0, 46.0, 43.0, 47.0, 30.0, 16.0, 24.0, 19.0, 13.0, 10.0, 5.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01038360595703125, -0.010024189949035645, -0.009664773941040039, -0.009305357933044434, -0.008945941925048828, -0.008586525917053223, -0.008227109909057617, -0.007867693901062012, -0.007508277893066406, -0.007148861885070801, -0.006789445877075195, -0.00643002986907959, -0.006070613861083984, -0.005711197853088379, -0.0053517818450927734, -0.004992365837097168, -0.0046329498291015625, -0.004273533821105957, -0.0039141178131103516, -0.003554701805114746, -0.0031952857971191406, -0.002835869789123535, -0.0024764537811279297, -0.0021170377731323242, -0.0017576217651367188, -0.0013982057571411133, -0.0010387897491455078, -0.0006793737411499023, -0.0003199577331542969, 3.9458274841308594e-05, 0.00039887428283691406, 0.0007582902908325195, 0.001117706298828125, 0.0014771223068237305, 0.001836538314819336, 0.0021959543228149414, 0.002555370330810547, 0.0029147863388061523, 0.003274202346801758, 0.0036336183547973633, 0.003993034362792969, 0.004352450370788574, 0.00471186637878418, 0.005071282386779785, 0.005430698394775391, 0.005790114402770996, 0.0061495304107666016, 0.006508946418762207, 0.0068683624267578125, 0.007227778434753418, 0.0075871944427490234, 0.007946610450744629, 0.008306026458740234, 0.00866544246673584, 0.009024858474731445, 0.00938427448272705, 0.009743690490722656, 0.010103106498718262, 0.010462522506713867, 0.010821938514709473, 0.011181354522705078, 0.011540770530700684, 0.011900186538696289, 0.012259602546691895, 0.0126190185546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 8.0, 2.0, 7.0, 9.0, 11.0, 17.0, 23.0, 25.0, 47.0, 57.0, 77.0, 111.0, 159.0, 260.0, 429.0, 681.0, 1369.0, 2992.0, 8699.0, 37126.0, 223505.0, 622363.0, 118215.0, 21723.0, 5794.0, 2150.0, 1037.0, 618.0, 360.0, 228.0, 134.0, 94.0, 59.0, 47.0, 28.0, 18.0, 14.0, 14.0, 15.0, 4.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0235595703125, -0.022807598114013672, -0.022055625915527344, -0.021303653717041016, -0.020551681518554688, -0.01979970932006836, -0.01904773712158203, -0.018295764923095703, -0.017543792724609375, -0.016791820526123047, -0.01603984832763672, -0.01528787612915039, -0.014535903930664062, -0.013783931732177734, -0.013031959533691406, -0.012279987335205078, -0.01152801513671875, -0.010776042938232422, -0.010024070739746094, -0.009272098541259766, -0.008520126342773438, -0.007768154144287109, -0.007016181945800781, -0.006264209747314453, -0.005512237548828125, -0.004760265350341797, -0.004008293151855469, -0.0032563209533691406, -0.0025043487548828125, -0.0017523765563964844, -0.0010004043579101562, -0.0002484321594238281, 0.0005035400390625, 0.0012555122375488281, 0.0020074844360351562, 0.0027594566345214844, 0.0035114288330078125, 0.004263401031494141, 0.005015373229980469, 0.005767345428466797, 0.006519317626953125, 0.007271289825439453, 0.008023262023925781, 0.00877523422241211, 0.009527206420898438, 0.010279178619384766, 0.011031150817871094, 0.011783123016357422, 0.01253509521484375, 0.013287067413330078, 0.014039039611816406, 0.014791011810302734, 0.015542984008789062, 0.01629495620727539, 0.01704692840576172, 0.017798900604248047, 0.018550872802734375, 0.019302845001220703, 0.02005481719970703, 0.02080678939819336, 0.021558761596679688, 0.022310733795166016, 0.023062705993652344, 0.023814678192138672, 0.024566650390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 7.0, 7.0, 11.0, 11.0, 15.0, 18.0, 10.0, 28.0, 44.0, 25.0, 38.0, 42.0, 41.0, 49.0, 53.0, 66.0, 53.0, 68.0, 57.0, 59.0, 47.0, 42.0, 31.0, 31.0, 36.0, 23.0, 26.0, 12.0, 18.0, 9.0, 15.0, 5.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036529541015625, -0.035308837890625, -0.034088134765625, -0.032867431640625, -0.031646728515625, -0.030426025390625, -0.029205322265625, -0.027984619140625, -0.026763916015625, -0.025543212890625, -0.024322509765625, -0.023101806640625, -0.021881103515625, -0.020660400390625, -0.019439697265625, -0.018218994140625, -0.016998291015625, -0.015777587890625, -0.014556884765625, -0.013336181640625, -0.012115478515625, -0.010894775390625, -0.009674072265625, -0.008453369140625, -0.007232666015625, -0.006011962890625, -0.004791259765625, -0.003570556640625, -0.002349853515625, -0.001129150390625, 9.1552734375e-05, 0.001312255859375, 0.002532958984375, 0.003753662109375, 0.004974365234375, 0.006195068359375, 0.007415771484375, 0.008636474609375, 0.009857177734375, 0.011077880859375, 0.012298583984375, 0.013519287109375, 0.014739990234375, 0.015960693359375, 0.017181396484375, 0.018402099609375, 0.019622802734375, 0.020843505859375, 0.022064208984375, 0.023284912109375, 0.024505615234375, 0.025726318359375, 0.026947021484375, 0.028167724609375, 0.029388427734375, 0.030609130859375, 0.031829833984375, 0.033050537109375, 0.034271240234375, 0.035491943359375, 0.036712646484375, 0.037933349609375, 0.039154052734375, 0.040374755859375, 0.041595458984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 13.0, 16.0, 35.0, 54.0, 115.0, 285.0, 1018.0, 9019.0, 1021959.0, 14256.0, 1198.0, 315.0, 125.0, 63.0, 35.0, 15.0, 16.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07177734375, -0.0694284439086914, -0.06707954406738281, -0.06473064422607422, -0.062381744384765625, -0.06003284454345703, -0.05768394470214844, -0.055335044860839844, -0.05298614501953125, -0.050637245178222656, -0.04828834533691406, -0.04593944549560547, -0.043590545654296875, -0.04124164581298828, -0.03889274597167969, -0.036543846130371094, -0.0341949462890625, -0.031846046447753906, -0.029497146606445312, -0.02714824676513672, -0.024799346923828125, -0.02245044708251953, -0.020101547241210938, -0.017752647399902344, -0.01540374755859375, -0.013054847717285156, -0.010705947875976562, -0.008357048034667969, -0.006008148193359375, -0.0036592483520507812, -0.0013103485107421875, 0.0010385513305664062, 0.003387451171875, 0.005736351013183594, 0.008085250854492188, 0.010434150695800781, 0.012783050537109375, 0.015131950378417969, 0.017480850219726562, 0.019829750061035156, 0.02217864990234375, 0.024527549743652344, 0.026876449584960938, 0.02922534942626953, 0.031574249267578125, 0.03392314910888672, 0.03627204895019531, 0.038620948791503906, 0.0409698486328125, 0.043318748474121094, 0.04566764831542969, 0.04801654815673828, 0.050365447998046875, 0.05271434783935547, 0.05506324768066406, 0.057412147521972656, 0.05976104736328125, 0.062109947204589844, 0.06445884704589844, 0.06680774688720703, 0.06915664672851562, 0.07150554656982422, 0.07385444641113281, 0.0762033462524414, 0.07855224609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 9.0, 9.0, 6.0, 16.0, 18.0, 31.0, 64.0, 90.0, 154.0, 187.0, 157.0, 102.0, 54.0, 31.0, 21.0, 16.0, 9.0, 7.0, 9.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.716085433959961e-05, -5.463138222694397e-05, -5.210191011428833e-05, -4.957243800163269e-05, -4.704296588897705e-05, -4.451349377632141e-05, -4.198402166366577e-05, -3.945454955101013e-05, -3.692507743835449e-05, -3.439560532569885e-05, -3.186613321304321e-05, -2.9336661100387573e-05, -2.6807188987731934e-05, -2.4277716875076294e-05, -2.1748244762420654e-05, -1.9218772649765015e-05, -1.6689300537109375e-05, -1.4159828424453735e-05, -1.1630356311798096e-05, -9.100884199142456e-06, -6.571412086486816e-06, -4.041939973831177e-06, -1.5124678611755371e-06, 1.0170042514801025e-06, 3.546476364135742e-06, 6.075948476791382e-06, 8.605420589447021e-06, 1.1134892702102661e-05, 1.36643648147583e-05, 1.619383692741394e-05, 1.872330904006958e-05, 2.125278115272522e-05, 2.378225326538086e-05, 2.63117253780365e-05, 2.884119749069214e-05, 3.137066960334778e-05, 3.390014171600342e-05, 3.642961382865906e-05, 3.89590859413147e-05, 4.148855805397034e-05, 4.4018030166625977e-05, 4.6547502279281616e-05, 4.9076974391937256e-05, 5.1606446504592896e-05, 5.4135918617248535e-05, 5.6665390729904175e-05, 5.9194862842559814e-05, 6.172433495521545e-05, 6.42538070678711e-05, 6.678327918052673e-05, 6.931275129318237e-05, 7.184222340583801e-05, 7.437169551849365e-05, 7.690116763114929e-05, 7.943063974380493e-05, 8.196011185646057e-05, 8.448958396911621e-05, 8.701905608177185e-05, 8.954852819442749e-05, 9.207800030708313e-05, 9.460747241973877e-05, 9.713694453239441e-05, 9.966641664505005e-05, 0.00010219588875770569, 0.00010472536087036133]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 6.0, 18.0, 20.0, 34.0, 64.0, 129.0, 240.0, 621.0, 2007.0, 10558.0, 610759.0, 411721.0, 9510.0, 1818.0, 557.0, 220.0, 105.0, 56.0, 41.0, 18.0, 13.0, 11.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04248046875, -0.04136180877685547, -0.04024314880371094, -0.039124488830566406, -0.038005828857421875, -0.036887168884277344, -0.03576850891113281, -0.03464984893798828, -0.03353118896484375, -0.03241252899169922, -0.03129386901855469, -0.030175209045410156, -0.029056549072265625, -0.027937889099121094, -0.026819229125976562, -0.02570056915283203, -0.0245819091796875, -0.02346324920654297, -0.022344589233398438, -0.021225929260253906, -0.020107269287109375, -0.018988609313964844, -0.017869949340820312, -0.01675128936767578, -0.01563262939453125, -0.014513969421386719, -0.013395309448242188, -0.012276649475097656, -0.011157989501953125, -0.010039329528808594, -0.008920669555664062, -0.007802009582519531, -0.006683349609375, -0.005564689636230469, -0.0044460296630859375, -0.0033273696899414062, -0.002208709716796875, -0.0010900497436523438, 2.86102294921875e-05, 0.0011472702026367188, 0.00226593017578125, 0.0033845901489257812, 0.0045032501220703125, 0.005621910095214844, 0.006740570068359375, 0.007859230041503906, 0.008977890014648438, 0.010096549987792969, 0.0112152099609375, 0.012333869934082031, 0.013452529907226562, 0.014571189880371094, 0.015689849853515625, 0.016808509826660156, 0.017927169799804688, 0.01904582977294922, 0.02016448974609375, 0.02128314971923828, 0.022401809692382812, 0.023520469665527344, 0.024639129638671875, 0.025757789611816406, 0.026876449584960938, 0.02799510955810547, 0.02911376953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 11.0, 18.0, 21.0, 35.0, 44.0, 67.0, 121.0, 142.0, 152.0, 120.0, 92.0, 54.0, 37.0, 23.0, 15.0, 9.0, 9.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0221099853515625, -0.021422863006591797, -0.020735740661621094, -0.02004861831665039, -0.019361495971679688, -0.018674373626708984, -0.01798725128173828, -0.017300128936767578, -0.016613006591796875, -0.015925884246826172, -0.015238761901855469, -0.014551639556884766, -0.013864517211914062, -0.01317739486694336, -0.012490272521972656, -0.011803150177001953, -0.01111602783203125, -0.010428905487060547, -0.009741783142089844, -0.00905466079711914, -0.008367538452148438, -0.007680416107177734, -0.006993293762207031, -0.006306171417236328, -0.005619049072265625, -0.004931926727294922, -0.004244804382324219, -0.0035576820373535156, -0.0028705596923828125, -0.0021834373474121094, -0.0014963150024414062, -0.0008091926574707031, -0.0001220703125, 0.0005650520324707031, 0.0012521743774414062, 0.0019392967224121094, 0.0026264190673828125, 0.0033135414123535156, 0.004000663757324219, 0.004687786102294922, 0.005374908447265625, 0.006062030792236328, 0.006749153137207031, 0.007436275482177734, 0.008123397827148438, 0.00881052017211914, 0.009497642517089844, 0.010184764862060547, 0.01087188720703125, 0.011559009552001953, 0.012246131896972656, 0.01293325424194336, 0.013620376586914062, 0.014307498931884766, 0.014994621276855469, 0.015681743621826172, 0.016368865966796875, 0.017055988311767578, 0.01774311065673828, 0.018430233001708984, 0.019117355346679688, 0.01980447769165039, 0.020491600036621094, 0.021178722381591797, 0.0218658447265625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 8.0, 27.0, 50.0, 226.0, 432.0, 192.0, 44.0, 11.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6043671369552612, -0.5868990421295166, -0.5694310069084167, -0.5519629120826721, -0.5344948768615723, -0.5170267820358276, -0.4995587170124054, -0.48209065198898315, -0.4646225869655609, -0.44715452194213867, -0.42968645691871643, -0.4122183918952942, -0.39475029706954956, -0.3772822618484497, -0.3598141670227051, -0.34234610199928284, -0.3248780369758606, -0.30740997195243835, -0.2899419069290161, -0.27247384190559387, -0.25500577688217163, -0.2375376969575882, -0.22006961703300476, -0.20260155200958252, -0.18513348698616028, -0.16766542196273804, -0.1501973569393158, -0.13272927701473236, -0.11526121199131012, -0.09779314696788788, -0.08032507449388504, -0.0628570020198822, -0.04538893699645996, -0.02792086824774742, -0.010452799499034882, 0.007015269249677658, 0.024483337998390198, 0.04195140302181244, 0.05941947549581528, 0.07688754796981812, 0.09435561299324036, 0.1118236780166626, 0.12929174304008484, 0.14675982296466827, 0.16422788798809052, 0.18169595301151276, 0.1991640329360962, 0.21663209795951843, 0.23410016298294067, 0.2515682280063629, 0.26903629302978516, 0.2865043580532074, 0.30397242307662964, 0.32144051790237427, 0.3389085829257965, 0.35637664794921875, 0.373844712972641, 0.39131277799606323, 0.4087808430194855, 0.4262489080429077, 0.44371700286865234, 0.4611850380897522, 0.4786531329154968, 0.49612119793891907, 0.5135892629623413]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 7.0, 10.0, 12.0, 27.0, 13.0, 26.0, 29.0, 45.0, 59.0, 39.0, 49.0, 63.0, 65.0, 84.0, 64.0, 65.0, 49.0, 51.0, 44.0, 37.0, 45.0, 28.0, 20.0, 21.0, 12.0, 10.0, 6.0, 9.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20341086387634277, -0.1973525434732437, -0.19129422307014465, -0.1852359175682068, -0.17917759716510773, -0.17311927676200867, -0.1670609712600708, -0.16100265085697174, -0.15494433045387268, -0.14888601005077362, -0.14282768964767456, -0.1367693841457367, -0.13071106374263763, -0.12465274333953857, -0.11859443038702011, -0.11253611743450165, -0.10647779703140259, -0.10041947662830353, -0.09436116367578506, -0.0883028507232666, -0.08224453032016754, -0.07618620991706848, -0.07012789696455002, -0.06406958401203156, -0.058011263608932495, -0.051952946931123734, -0.04589463025331497, -0.03983631357550621, -0.03377799689769745, -0.027719680219888687, -0.021661363542079926, -0.015603046864271164, -0.009544730186462402, -0.0034864135086536407, 0.002571903169155121, 0.008630219846963882, 0.014688536524772644, 0.020746853202581406, 0.026805169880390167, 0.03286348655819893, 0.03892180323600769, 0.04498011991381645, 0.051038436591625214, 0.057096753269433975, 0.06315506994724274, 0.0692133903503418, 0.07527170330286026, 0.08133001625537872, 0.08738833665847778, 0.09344665706157684, 0.0995049700140953, 0.10556328296661377, 0.11162160336971283, 0.11767992377281189, 0.12373823672533035, 0.12979654967784882, 0.13585487008094788, 0.14191319048404694, 0.147971510887146, 0.15402981638908386, 0.16008813679218292, 0.16614645719528198, 0.17220476269721985, 0.1782630831003189, 0.18432140350341797]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 5.0, 21.0, 32.0, 89.0, 251.0, 1931.0, 854319.0, 3334114.0, 3082.0, 308.0, 81.0, 31.0, 16.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0271148681640625, -0.024419546127319336, -0.021724224090576172, -0.019028902053833008, -0.016333580017089844, -0.01363825798034668, -0.010942935943603516, -0.008247613906860352, -0.0055522918701171875, -0.0028569698333740234, -0.00016164779663085938, 0.0025336742401123047, 0.005228996276855469, 0.007924318313598633, 0.010619640350341797, 0.013314962387084961, 0.016010284423828125, 0.01870560646057129, 0.021400928497314453, 0.024096250534057617, 0.02679157257080078, 0.029486894607543945, 0.03218221664428711, 0.03487753868103027, 0.03757286071777344, 0.0402681827545166, 0.042963504791259766, 0.04565882682800293, 0.048354148864746094, 0.05104947090148926, 0.05374479293823242, 0.056440114974975586, 0.05913543701171875, 0.061830759048461914, 0.06452608108520508, 0.06722140312194824, 0.0699167251586914, 0.07261204719543457, 0.07530736923217773, 0.0780026912689209, 0.08069801330566406, 0.08339333534240723, 0.08608865737915039, 0.08878397941589355, 0.09147930145263672, 0.09417462348937988, 0.09686994552612305, 0.09956526756286621, 0.10226058959960938, 0.10495591163635254, 0.1076512336730957, 0.11034655570983887, 0.11304187774658203, 0.1157371997833252, 0.11843252182006836, 0.12112784385681152, 0.12382316589355469, 0.12651848793029785, 0.12921380996704102, 0.13190913200378418, 0.13460445404052734, 0.1372997760772705, 0.13999509811401367, 0.14269042015075684, 0.1453857421875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 4.0, 10.0, 18.0, 20.0, 53.0, 53.0, 82.0, 107.0, 103.0, 131.0, 123.0, 80.0, 68.0, 56.0, 30.0, 18.0, 16.0, 13.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.025299072265625, -0.024700641632080078, -0.024102210998535156, -0.023503780364990234, -0.022905349731445312, -0.02230691909790039, -0.02170848846435547, -0.021110057830810547, -0.020511627197265625, -0.019913196563720703, -0.01931476593017578, -0.01871633529663086, -0.018117904663085938, -0.017519474029541016, -0.016921043395996094, -0.016322612762451172, -0.01572418212890625, -0.015125751495361328, -0.014527320861816406, -0.013928890228271484, -0.013330459594726562, -0.01273202896118164, -0.012133598327636719, -0.011535167694091797, -0.010936737060546875, -0.010338306427001953, -0.009739875793457031, -0.00914144515991211, -0.008543014526367188, -0.007944583892822266, -0.007346153259277344, -0.006747722625732422, -0.0061492919921875, -0.005550861358642578, -0.004952430725097656, -0.004354000091552734, -0.0037555694580078125, -0.0031571388244628906, -0.0025587081909179688, -0.001960277557373047, -0.001361846923828125, -0.0007634162902832031, -0.00016498565673828125, 0.0004334449768066406, 0.0010318756103515625, 0.0016303062438964844, 0.0022287368774414062, 0.002827167510986328, 0.00342559814453125, 0.004024028778076172, 0.004622459411621094, 0.005220890045166016, 0.0058193206787109375, 0.006417751312255859, 0.007016181945800781, 0.007614612579345703, 0.008213043212890625, 0.008811473846435547, 0.009409904479980469, 0.01000833511352539, 0.010606765747070312, 0.011205196380615234, 0.011803627014160156, 0.012402057647705078, 0.01300048828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 10.0, 4.0, 4.0, 10.0, 10.0, 32.0, 29.0, 51.0, 75.0, 109.0, 172.0, 333.0, 783.0, 2320.0, 10972.0, 98863.0, 3742569.0, 306755.0, 23892.0, 4566.0, 1448.0, 551.0, 227.0, 164.0, 95.0, 71.0, 46.0, 33.0, 22.0, 15.0, 17.0, 7.0, 13.0, 5.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0285186767578125, -0.02752375602722168, -0.02652883529663086, -0.02553391456604004, -0.02453899383544922, -0.0235440731048584, -0.022549152374267578, -0.021554231643676758, -0.020559310913085938, -0.019564390182495117, -0.018569469451904297, -0.017574548721313477, -0.016579627990722656, -0.015584707260131836, -0.014589786529541016, -0.013594865798950195, -0.012599945068359375, -0.011605024337768555, -0.010610103607177734, -0.009615182876586914, -0.008620262145996094, -0.0076253414154052734, -0.006630420684814453, -0.005635499954223633, -0.0046405792236328125, -0.003645658493041992, -0.002650737762451172, -0.0016558170318603516, -0.0006608963012695312, 0.00033402442932128906, 0.0013289451599121094, 0.0023238658905029297, 0.00331878662109375, 0.00431370735168457, 0.005308628082275391, 0.006303548812866211, 0.007298469543457031, 0.008293390274047852, 0.009288311004638672, 0.010283231735229492, 0.011278152465820312, 0.012273073196411133, 0.013267993927001953, 0.014262914657592773, 0.015257835388183594, 0.016252756118774414, 0.017247676849365234, 0.018242597579956055, 0.019237518310546875, 0.020232439041137695, 0.021227359771728516, 0.022222280502319336, 0.023217201232910156, 0.024212121963500977, 0.025207042694091797, 0.026201963424682617, 0.027196884155273438, 0.028191804885864258, 0.029186725616455078, 0.0301816463470459, 0.03117656707763672, 0.03217148780822754, 0.03316640853881836, 0.03416132926940918, 0.03515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 9.0, 10.0, 8.0, 13.0, 21.0, 31.0, 43.0, 87.0, 171.0, 322.0, 747.0, 1140.0, 723.0, 310.0, 157.0, 70.0, 64.0, 36.0, 24.0, 22.0, 12.0, 11.0, 14.0, 8.0, 6.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0191497802734375, -0.01833367347717285, -0.017517566680908203, -0.016701459884643555, -0.015885353088378906, -0.015069246292114258, -0.01425313949584961, -0.013437032699584961, -0.012620925903320312, -0.011804819107055664, -0.010988712310791016, -0.010172605514526367, -0.009356498718261719, -0.00854039192199707, -0.007724285125732422, -0.0069081783294677734, -0.006092071533203125, -0.0052759647369384766, -0.004459857940673828, -0.0036437511444091797, -0.0028276443481445312, -0.002011537551879883, -0.0011954307556152344, -0.00037932395935058594, 0.0004367828369140625, 0.001252889633178711, 0.0020689964294433594, 0.002885103225708008, 0.0037012100219726562, 0.004517316818237305, 0.005333423614501953, 0.0061495304107666016, 0.00696563720703125, 0.0077817440032958984, 0.008597850799560547, 0.009413957595825195, 0.010230064392089844, 0.011046171188354492, 0.01186227798461914, 0.012678384780883789, 0.013494491577148438, 0.014310598373413086, 0.015126705169677734, 0.015942811965942383, 0.01675891876220703, 0.01757502555847168, 0.018391132354736328, 0.019207239151000977, 0.020023345947265625, 0.020839452743530273, 0.021655559539794922, 0.02247166633605957, 0.02328777313232422, 0.024103879928588867, 0.024919986724853516, 0.025736093521118164, 0.026552200317382812, 0.02736830711364746, 0.02818441390991211, 0.029000520706176758, 0.029816627502441406, 0.030632734298706055, 0.0314488410949707, 0.03226494789123535, 0.0330810546875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 16.0, 27.0, 59.0, 154.0, 244.0, 269.0, 116.0, 54.0, 20.0, 15.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38885754346847534, -0.377643883228302, -0.3664301931858063, -0.35521653294563293, -0.3440028429031372, -0.33278918266296387, -0.32157549262046814, -0.3103618323802948, -0.2991481423377991, -0.28793448209762573, -0.27672079205513, -0.26550713181495667, -0.25429344177246094, -0.2430797666311264, -0.23186609148979187, -0.22065243124961853, -0.209438756108284, -0.19822508096694946, -0.18701140582561493, -0.1757977306842804, -0.16458405554294586, -0.15337038040161133, -0.142156720161438, -0.13094303011894226, -0.11972936242818832, -0.10851568728685379, -0.09730201214551926, -0.08608834445476532, -0.07487466931343079, -0.06366099417209625, -0.05244731903076172, -0.041233643889427185, -0.03001996874809265, -0.018806293606758118, -0.007592620328068733, 0.0036210529506206512, 0.014834728091955185, 0.02604840323328972, 0.037262074649333954, 0.04847574979066849, 0.05968942493200302, 0.07090310007333755, 0.08211677521467209, 0.09333044290542603, 0.10454411804676056, 0.11575779318809509, 0.12697146832942963, 0.13818514347076416, 0.1493988186120987, 0.16061249375343323, 0.17182616889476776, 0.1830398440361023, 0.19425351917743683, 0.20546719431877136, 0.2166808545589447, 0.22789454460144043, 0.23910820484161377, 0.2503218650817871, 0.26153555512428284, 0.2727492153644562, 0.2839629054069519, 0.29517656564712524, 0.30639025568962097, 0.3176039159297943, 0.32881760597229004]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 10.0, 11.0, 16.0, 9.0, 32.0, 32.0, 29.0, 42.0, 46.0, 56.0, 62.0, 74.0, 65.0, 69.0, 63.0, 59.0, 61.0, 49.0, 39.0, 34.0, 31.0, 23.0, 26.0, 19.0, 11.0, 7.0, 9.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0763278603553772, -0.07244311273097992, -0.06855837255716324, -0.06467363238334656, -0.06078888475894928, -0.0569041408598423, -0.05301939696073532, -0.04913465306162834, -0.04524990916252136, -0.04136516526341438, -0.037480421364307404, -0.033595677465200424, -0.029710933566093445, -0.025826189666986465, -0.021941445767879486, -0.018056701868772507, -0.014171957969665527, -0.010287214070558548, -0.006402470171451569, -0.0025177262723445892, 0.0013670176267623901, 0.0052517615258693695, 0.009136505424976349, 0.013021249324083328, 0.016905993223190308, 0.020790737122297287, 0.024675481021404266, 0.028560224920511246, 0.032444968819618225, 0.036329712718725204, 0.040214456617832184, 0.04409920051693916, 0.04798394441604614, 0.05186868831515312, 0.0557534322142601, 0.05963817611336708, 0.06352292001247406, 0.06740766763687134, 0.07129240781068802, 0.0751771479845047, 0.07906189560890198, 0.08294664323329926, 0.08683138340711594, 0.09071612358093262, 0.0946008712053299, 0.09848561882972717, 0.10237035900354385, 0.10625509917736053, 0.11013984680175781, 0.11402459442615509, 0.11790933459997177, 0.12179407477378845, 0.12567882239818573, 0.129563570022583, 0.1334483027458191, 0.13733305037021637, 0.14121779799461365, 0.14510254561901093, 0.1489872932434082, 0.1528720259666443, 0.15675677359104156, 0.16064152121543884, 0.16452625393867493, 0.1684110015630722, 0.17229574918746948]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 7.0, 9.0, 12.0, 21.0, 39.0, 51.0, 81.0, 138.0, 295.0, 477.0, 818.0, 1563.0, 3449.0, 7411.0, 18769.0, 49220.0, 133941.0, 315071.0, 308639.0, 129113.0, 47218.0, 18033.0, 7430.0, 3299.0, 1541.0, 828.0, 488.0, 238.0, 131.0, 69.0, 49.0, 39.0, 29.0, 8.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01456451416015625, -0.014078736305236816, -0.013592958450317383, -0.01310718059539795, -0.012621402740478516, -0.012135624885559082, -0.011649847030639648, -0.011164069175720215, -0.010678291320800781, -0.010192513465881348, -0.009706735610961914, -0.00922095775604248, -0.008735179901123047, -0.008249402046203613, -0.00776362419128418, -0.007277846336364746, -0.0067920684814453125, -0.006306290626525879, -0.005820512771606445, -0.005334734916687012, -0.004848957061767578, -0.0043631792068481445, -0.003877401351928711, -0.0033916234970092773, -0.0029058456420898438, -0.00242006778717041, -0.0019342899322509766, -0.001448512077331543, -0.0009627342224121094, -0.0004769563674926758, 8.821487426757812e-06, 0.0004945993423461914, 0.000980377197265625, 0.0014661550521850586, 0.0019519329071044922, 0.0024377107620239258, 0.0029234886169433594, 0.003409266471862793, 0.0038950443267822266, 0.00438082218170166, 0.004866600036621094, 0.005352377891540527, 0.005838155746459961, 0.0063239336013793945, 0.006809711456298828, 0.007295489311218262, 0.007781267166137695, 0.008267045021057129, 0.008752822875976562, 0.009238600730895996, 0.00972437858581543, 0.010210156440734863, 0.010695934295654297, 0.01118171215057373, 0.011667490005493164, 0.012153267860412598, 0.012639045715332031, 0.013124823570251465, 0.013610601425170898, 0.014096379280090332, 0.014582157135009766, 0.0150679349899292, 0.015553712844848633, 0.016039490699768066, 0.0165252685546875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 11.0, 7.0, 15.0, 22.0, 20.0, 53.0, 44.0, 49.0, 54.0, 52.0, 82.0, 75.0, 66.0, 73.0, 71.0, 59.0, 57.0, 41.0, 34.0, 21.0, 19.0, 16.0, 14.0, 5.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01149749755859375, -0.011115193367004395, -0.010732889175415039, -0.010350584983825684, -0.009968280792236328, -0.009585976600646973, -0.009203672409057617, -0.008821368217468262, -0.008439064025878906, -0.00805675983428955, -0.007674455642700195, -0.00729215145111084, -0.006909847259521484, -0.006527543067932129, -0.0061452388763427734, -0.005762934684753418, -0.0053806304931640625, -0.004998326301574707, -0.0046160221099853516, -0.004233717918395996, -0.0038514137268066406, -0.003469109535217285, -0.0030868053436279297, -0.0027045011520385742, -0.0023221969604492188, -0.0019398927688598633, -0.0015575885772705078, -0.0011752843856811523, -0.0007929801940917969, -0.0004106760025024414, -2.8371810913085938e-05, 0.00035393238067626953, 0.000736236572265625, 0.0011185407638549805, 0.001500844955444336, 0.0018831491470336914, 0.002265453338623047, 0.0026477575302124023, 0.003030061721801758, 0.0034123659133911133, 0.0037946701049804688, 0.004176974296569824, 0.00455927848815918, 0.004941582679748535, 0.005323886871337891, 0.005706191062927246, 0.0060884952545166016, 0.006470799446105957, 0.0068531036376953125, 0.007235407829284668, 0.0076177120208740234, 0.008000016212463379, 0.008382320404052734, 0.00876462459564209, 0.009146928787231445, 0.0095292329788208, 0.009911537170410156, 0.010293841361999512, 0.010676145553588867, 0.011058449745178223, 0.011440753936767578, 0.011823058128356934, 0.012205362319946289, 0.012587666511535645, 0.012969970703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 3.0, 12.0, 21.0, 34.0, 49.0, 61.0, 75.0, 123.0, 200.0, 302.0, 420.0, 733.0, 1309.0, 2703.0, 8259.0, 47312.0, 572006.0, 364614.0, 37598.0, 7153.0, 2396.0, 1169.0, 660.0, 425.0, 282.0, 200.0, 135.0, 90.0, 48.0, 35.0, 32.0, 23.0, 13.0, 10.0, 14.0, 4.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029754638671875, -0.028689861297607422, -0.027625083923339844, -0.026560306549072266, -0.025495529174804688, -0.02443075180053711, -0.02336597442626953, -0.022301197052001953, -0.021236419677734375, -0.020171642303466797, -0.01910686492919922, -0.01804208755493164, -0.016977310180664062, -0.015912532806396484, -0.014847755432128906, -0.013782978057861328, -0.01271820068359375, -0.011653423309326172, -0.010588645935058594, -0.009523868560791016, -0.008459091186523438, -0.007394313812255859, -0.006329536437988281, -0.005264759063720703, -0.004199981689453125, -0.003135204315185547, -0.0020704269409179688, -0.0010056495666503906, 5.91278076171875e-05, 0.0011239051818847656, 0.0021886825561523438, 0.003253459930419922, 0.0043182373046875, 0.005383014678955078, 0.006447792053222656, 0.007512569427490234, 0.008577346801757812, 0.00964212417602539, 0.010706901550292969, 0.011771678924560547, 0.012836456298828125, 0.013901233673095703, 0.014966011047363281, 0.01603078842163086, 0.017095565795898438, 0.018160343170166016, 0.019225120544433594, 0.020289897918701172, 0.02135467529296875, 0.022419452667236328, 0.023484230041503906, 0.024549007415771484, 0.025613784790039062, 0.02667856216430664, 0.02774333953857422, 0.028808116912841797, 0.029872894287109375, 0.030937671661376953, 0.03200244903564453, 0.03306722640991211, 0.03413200378417969, 0.035196781158447266, 0.036261558532714844, 0.03732633590698242, 0.03839111328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 8.0, 1.0, 5.0, 9.0, 8.0, 11.0, 14.0, 12.0, 17.0, 25.0, 23.0, 35.0, 39.0, 38.0, 43.0, 50.0, 56.0, 43.0, 43.0, 56.0, 56.0, 40.0, 59.0, 45.0, 33.0, 43.0, 28.0, 36.0, 28.0, 15.0, 19.0, 18.0, 5.0, 15.0, 10.0, 4.0, 5.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034759521484375, -0.03357553482055664, -0.03239154815673828, -0.031207561492919922, -0.030023574829101562, -0.028839588165283203, -0.027655601501464844, -0.026471614837646484, -0.025287628173828125, -0.024103641510009766, -0.022919654846191406, -0.021735668182373047, -0.020551681518554688, -0.019367694854736328, -0.01818370819091797, -0.01699972152709961, -0.01581573486328125, -0.01463174819946289, -0.013447761535644531, -0.012263774871826172, -0.011079788208007812, -0.009895801544189453, -0.008711814880371094, -0.007527828216552734, -0.006343841552734375, -0.005159854888916016, -0.003975868225097656, -0.002791881561279297, -0.0016078948974609375, -0.0004239082336425781, 0.0007600784301757812, 0.0019440650939941406, 0.0031280517578125, 0.004312038421630859, 0.005496025085449219, 0.006680011749267578, 0.007863998413085938, 0.009047985076904297, 0.010231971740722656, 0.011415958404541016, 0.012599945068359375, 0.013783931732177734, 0.014967918395996094, 0.016151905059814453, 0.017335891723632812, 0.018519878387451172, 0.01970386505126953, 0.02088785171508789, 0.02207183837890625, 0.02325582504272461, 0.02443981170654297, 0.025623798370361328, 0.026807785034179688, 0.027991771697998047, 0.029175758361816406, 0.030359745025634766, 0.031543731689453125, 0.032727718353271484, 0.033911705017089844, 0.0350956916809082, 0.03627967834472656, 0.03746366500854492, 0.03864765167236328, 0.03983163833618164, 0.041015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 4.0, 10.0, 25.0, 19.0, 41.0, 57.0, 77.0, 132.0, 200.0, 349.0, 534.0, 997.0, 2023.0, 4055.0, 9874.0, 32661.0, 809053.0, 155283.0, 19701.0, 6889.0, 3005.0, 1488.0, 845.0, 439.0, 288.0, 159.0, 123.0, 59.0, 61.0, 25.0, 18.0, 24.0, 8.0, 8.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029693603515625, -0.028760194778442383, -0.027826786041259766, -0.02689337730407715, -0.02595996856689453, -0.025026559829711914, -0.024093151092529297, -0.02315974235534668, -0.022226333618164062, -0.021292924880981445, -0.020359516143798828, -0.01942610740661621, -0.018492698669433594, -0.017559289932250977, -0.01662588119506836, -0.015692472457885742, -0.014759063720703125, -0.013825654983520508, -0.01289224624633789, -0.011958837509155273, -0.011025428771972656, -0.010092020034790039, -0.009158611297607422, -0.008225202560424805, -0.0072917938232421875, -0.00635838508605957, -0.005424976348876953, -0.004491567611694336, -0.0035581588745117188, -0.0026247501373291016, -0.0016913414001464844, -0.0007579326629638672, 0.00017547607421875, 0.0011088848114013672, 0.0020422935485839844, 0.0029757022857666016, 0.003909111022949219, 0.004842519760131836, 0.005775928497314453, 0.00670933723449707, 0.0076427459716796875, 0.008576154708862305, 0.009509563446044922, 0.010442972183227539, 0.011376380920410156, 0.012309789657592773, 0.01324319839477539, 0.014176607131958008, 0.015110015869140625, 0.016043424606323242, 0.01697683334350586, 0.017910242080688477, 0.018843650817871094, 0.01977705955505371, 0.020710468292236328, 0.021643877029418945, 0.022577285766601562, 0.02351069450378418, 0.024444103240966797, 0.025377511978149414, 0.02631092071533203, 0.02724432945251465, 0.028177738189697266, 0.029111146926879883, 0.0300445556640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 5.0, 1.0, 10.0, 5.0, 2.0, 9.0, 12.0, 12.0, 15.0, 25.0, 23.0, 19.0, 22.0, 26.0, 52.0, 48.0, 46.0, 82.0, 64.0, 66.0, 84.0, 59.0, 53.0, 39.0, 31.0, 30.0, 24.0, 11.0, 14.0, 18.0, 12.0, 11.0, 12.0, 8.0, 11.0, 6.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.731250762939453e-05, -3.618840128183365e-05, -3.5064294934272766e-05, -3.3940188586711884e-05, -3.2816082239151e-05, -3.169197589159012e-05, -3.0567869544029236e-05, -2.9443763196468353e-05, -2.831965684890747e-05, -2.7195550501346588e-05, -2.6071444153785706e-05, -2.4947337806224823e-05, -2.382323145866394e-05, -2.2699125111103058e-05, -2.1575018763542175e-05, -2.0450912415981293e-05, -1.932680606842041e-05, -1.8202699720859528e-05, -1.7078593373298645e-05, -1.5954487025737762e-05, -1.483038067817688e-05, -1.3706274330615997e-05, -1.2582167983055115e-05, -1.1458061635494232e-05, -1.033395528793335e-05, -9.209848940372467e-06, -8.085742592811584e-06, -6.961636245250702e-06, -5.837529897689819e-06, -4.713423550128937e-06, -3.589317202568054e-06, -2.4652108550071716e-06, -1.341104507446289e-06, -2.169981598854065e-07, 9.071081876754761e-07, 2.0312145352363586e-06, 3.155320882797241e-06, 4.279427230358124e-06, 5.403533577919006e-06, 6.527639925479889e-06, 7.651746273040771e-06, 8.775852620601654e-06, 9.899958968162537e-06, 1.102406531572342e-05, 1.2148171663284302e-05, 1.3272278010845184e-05, 1.4396384358406067e-05, 1.552049070596695e-05, 1.6644597053527832e-05, 1.7768703401088715e-05, 1.8892809748649597e-05, 2.001691609621048e-05, 2.1141022443771362e-05, 2.2265128791332245e-05, 2.3389235138893127e-05, 2.451334148645401e-05, 2.5637447834014893e-05, 2.6761554181575775e-05, 2.7885660529136658e-05, 2.900976687669754e-05, 3.0133873224258423e-05, 3.1257979571819305e-05, 3.238208591938019e-05, 3.350619226694107e-05, 3.463029861450195e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 8.0, 5.0, 3.0, 6.0, 7.0, 17.0, 37.0, 42.0, 68.0, 109.0, 142.0, 244.0, 435.0, 894.0, 1984.0, 4529.0, 12148.0, 43350.0, 878638.0, 78943.0, 16224.0, 5979.0, 2360.0, 1019.0, 540.0, 283.0, 188.0, 125.0, 74.0, 47.0, 31.0, 16.0, 16.0, 10.0, 11.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0281524658203125, -0.027202367782592773, -0.026252269744873047, -0.02530217170715332, -0.024352073669433594, -0.023401975631713867, -0.02245187759399414, -0.021501779556274414, -0.020551681518554688, -0.01960158348083496, -0.018651485443115234, -0.017701387405395508, -0.01675128936767578, -0.015801191329956055, -0.014851093292236328, -0.013900995254516602, -0.012950897216796875, -0.012000799179077148, -0.011050701141357422, -0.010100603103637695, -0.009150505065917969, -0.008200407028198242, -0.007250308990478516, -0.006300210952758789, -0.0053501129150390625, -0.004400014877319336, -0.0034499168395996094, -0.002499818801879883, -0.0015497207641601562, -0.0005996227264404297, 0.0003504753112792969, 0.0013005733489990234, 0.00225067138671875, 0.0032007694244384766, 0.004150867462158203, 0.00510096549987793, 0.006051063537597656, 0.007001161575317383, 0.00795125961303711, 0.008901357650756836, 0.009851455688476562, 0.010801553726196289, 0.011751651763916016, 0.012701749801635742, 0.013651847839355469, 0.014601945877075195, 0.015552043914794922, 0.01650214195251465, 0.017452239990234375, 0.0184023380279541, 0.019352436065673828, 0.020302534103393555, 0.02125263214111328, 0.022202730178833008, 0.023152828216552734, 0.02410292625427246, 0.025053024291992188, 0.026003122329711914, 0.02695322036743164, 0.027903318405151367, 0.028853416442871094, 0.02980351448059082, 0.030753612518310547, 0.03170371055603027, 0.03265380859375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 4.0, 5.0, 8.0, 3.0, 5.0, 7.0, 14.0, 12.0, 18.0, 22.0, 38.0, 84.0, 132.0, 143.0, 153.0, 100.0, 76.0, 38.0, 31.0, 24.0, 5.0, 10.0, 9.0, 13.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.02227783203125, -0.021637916564941406, -0.020998001098632812, -0.02035808563232422, -0.019718170166015625, -0.01907825469970703, -0.018438339233398438, -0.017798423767089844, -0.01715850830078125, -0.016518592834472656, -0.015878677368164062, -0.015238761901855469, -0.014598846435546875, -0.013958930969238281, -0.013319015502929688, -0.012679100036621094, -0.0120391845703125, -0.011399269104003906, -0.010759353637695312, -0.010119438171386719, -0.009479522705078125, -0.008839607238769531, -0.008199691772460938, -0.007559776306152344, -0.00691986083984375, -0.006279945373535156, -0.0056400299072265625, -0.005000114440917969, -0.004360198974609375, -0.0037202835083007812, -0.0030803680419921875, -0.0024404525756835938, -0.001800537109375, -0.0011606216430664062, -0.0005207061767578125, 0.00011920928955078125, 0.000759124755859375, 0.0013990402221679688, 0.0020389556884765625, 0.0026788711547851562, 0.00331878662109375, 0.003958702087402344, 0.0045986175537109375, 0.005238533020019531, 0.005878448486328125, 0.006518363952636719, 0.0071582794189453125, 0.007798194885253906, 0.0084381103515625, 0.009078025817871094, 0.009717941284179688, 0.010357856750488281, 0.010997772216796875, 0.011637687683105469, 0.012277603149414062, 0.012917518615722656, 0.01355743408203125, 0.014197349548339844, 0.014837265014648438, 0.015477180480957031, 0.016117095947265625, 0.01675701141357422, 0.017396926879882812, 0.018036842346191406, 0.0186767578125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 3.0, 13.0, 14.0, 33.0, 64.0, 106.0, 217.0, 250.0, 149.0, 79.0, 38.0, 14.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34992358088493347, -0.33544108271598816, -0.32095855474472046, -0.30647605657577515, -0.29199355840682983, -0.2775110602378845, -0.2630285620689392, -0.2485460340976715, -0.2340635359287262, -0.21958103775978088, -0.20509852468967438, -0.19061601161956787, -0.17613351345062256, -0.16165101528167725, -0.14716850221157074, -0.13268598914146423, -0.11820349097251892, -0.10372098535299301, -0.0892384797334671, -0.07475597411394119, -0.06027346849441528, -0.045790962874889374, -0.031308457255363464, -0.016825951635837555, -0.0023434460163116455, 0.012139059603214264, 0.026621565222740173, 0.04110407084226608, 0.05558657646179199, 0.0700690820813179, 0.08455158770084381, 0.09903409332036972, 0.11351662874221802, 0.12799912691116333, 0.14248163998126984, 0.15696415305137634, 0.17144665122032166, 0.18592914938926697, 0.20041166245937347, 0.21489417552947998, 0.2293766736984253, 0.2438591718673706, 0.2583416700363159, 0.2728241980075836, 0.28730669617652893, 0.30178919434547424, 0.31627172231674194, 0.33075422048568726, 0.34523671865463257, 0.3597192168235779, 0.3742017149925232, 0.3886842429637909, 0.4031667411327362, 0.4176492393016815, 0.4321317672729492, 0.44661426544189453, 0.46109676361083984, 0.47557926177978516, 0.49006175994873047, 0.5045442581176758, 0.5190267562866211, 0.5335093140602112, 0.5479918122291565, 0.5624743103981018, 0.5769568085670471]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 4.0, 6.0, 7.0, 7.0, 12.0, 5.0, 17.0, 9.0, 18.0, 25.0, 16.0, 24.0, 21.0, 24.0, 34.0, 30.0, 42.0, 49.0, 53.0, 72.0, 64.0, 55.0, 51.0, 37.0, 37.0, 33.0, 30.0, 28.0, 17.0, 27.0, 24.0, 25.0, 19.0, 18.0, 7.0, 11.0, 7.0, 10.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.1523405909538269, -0.14789266884326935, -0.1434447467327118, -0.13899683952331543, -0.13454891741275787, -0.13010099530220032, -0.12565307319164276, -0.1212051510810852, -0.11675723642110825, -0.11230931431055069, -0.10786139965057373, -0.10341347754001617, -0.09896555542945862, -0.09451764076948166, -0.0900697186589241, -0.08562180399894714, -0.08117388188838959, -0.07672595977783203, -0.07227804511785507, -0.06783012300729752, -0.06338220834732056, -0.058934286236763, -0.054486364126205444, -0.05003844574093819, -0.04559052735567093, -0.04114260897040367, -0.036694690585136414, -0.03224676847457886, -0.0277988500893116, -0.023350931704044342, -0.018903011456131935, -0.014455091208219528, -0.01000717282295227, -0.005559253506362438, -0.001111334189772606, 0.0033365851268172264, 0.007784504443407059, 0.012232422828674316, 0.016680343076586723, 0.02112826332449913, 0.025576181709766388, 0.030024100095033646, 0.0344720184803009, 0.03891994059085846, 0.04336785897612572, 0.047815777361392975, 0.05226369947195053, 0.05671161785721779, 0.061159536242485046, 0.0656074583530426, 0.07005537301301956, 0.07450329512357712, 0.07895120978355408, 0.08339913189411163, 0.08784705400466919, 0.09229497611522675, 0.0967428907752037, 0.10119081288576126, 0.10563872754573822, 0.11008664965629578, 0.11453457176685333, 0.11898248642683029, 0.12343040853738785, 0.1278783231973648, 0.13232624530792236]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 5.0, 7.0, 13.0, 9.0, 17.0, 23.0, 37.0, 49.0, 97.0, 157.0, 390.0, 923.0, 3225.0, 16037.0, 222408.0, 3701788.0, 226687.0, 17071.0, 3444.0, 1057.0, 369.0, 189.0, 85.0, 57.0, 28.0, 26.0, 16.0, 10.0, 8.0, 7.0, 9.0, 6.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028961181640625, -0.028011798858642578, -0.027062416076660156, -0.026113033294677734, -0.025163650512695312, -0.02421426773071289, -0.02326488494873047, -0.022315502166748047, -0.021366119384765625, -0.020416736602783203, -0.01946735382080078, -0.01851797103881836, -0.017568588256835938, -0.016619205474853516, -0.015669822692871094, -0.014720439910888672, -0.01377105712890625, -0.012821674346923828, -0.011872291564941406, -0.010922908782958984, -0.009973526000976562, -0.00902414321899414, -0.008074760437011719, -0.007125377655029297, -0.006175994873046875, -0.005226612091064453, -0.004277229309082031, -0.0033278465270996094, -0.0023784637451171875, -0.0014290809631347656, -0.00047969818115234375, 0.0004696846008300781, 0.0014190673828125, 0.002368450164794922, 0.0033178329467773438, 0.004267215728759766, 0.0052165985107421875, 0.006165981292724609, 0.007115364074707031, 0.008064746856689453, 0.009014129638671875, 0.009963512420654297, 0.010912895202636719, 0.01186227798461914, 0.012811660766601562, 0.013761043548583984, 0.014710426330566406, 0.015659809112548828, 0.01660919189453125, 0.017558574676513672, 0.018507957458496094, 0.019457340240478516, 0.020406723022460938, 0.02135610580444336, 0.02230548858642578, 0.023254871368408203, 0.024204254150390625, 0.025153636932373047, 0.02610301971435547, 0.02705240249633789, 0.028001785278320312, 0.028951168060302734, 0.029900550842285156, 0.030849933624267578, 0.03179931640625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 4.0, 6.0, 12.0, 7.0, 17.0, 17.0, 19.0, 17.0, 32.0, 41.0, 47.0, 40.0, 50.0, 49.0, 62.0, 78.0, 52.0, 58.0, 53.0, 44.0, 38.0, 56.0, 38.0, 30.0, 25.0, 22.0, 16.0, 20.0, 15.0, 9.0, 12.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.010162353515625, -0.009826183319091797, -0.009490013122558594, -0.00915384292602539, -0.008817672729492188, -0.008481502532958984, -0.008145332336425781, -0.007809162139892578, -0.007472991943359375, -0.007136821746826172, -0.006800651550292969, -0.006464481353759766, -0.0061283111572265625, -0.005792140960693359, -0.005455970764160156, -0.005119800567626953, -0.00478363037109375, -0.004447460174560547, -0.004111289978027344, -0.0037751197814941406, -0.0034389495849609375, -0.0031027793884277344, -0.0027666091918945312, -0.002430438995361328, -0.002094268798828125, -0.0017580986022949219, -0.0014219284057617188, -0.0010857582092285156, -0.0007495880126953125, -0.0004134178161621094, -7.724761962890625e-05, 0.0002589225769042969, 0.0005950927734375, 0.0009312629699707031, 0.0012674331665039062, 0.0016036033630371094, 0.0019397735595703125, 0.0022759437561035156, 0.0026121139526367188, 0.002948284149169922, 0.003284454345703125, 0.003620624542236328, 0.003956794738769531, 0.004292964935302734, 0.0046291351318359375, 0.004965305328369141, 0.005301475524902344, 0.005637645721435547, 0.00597381591796875, 0.006309986114501953, 0.006646156311035156, 0.006982326507568359, 0.0073184967041015625, 0.007654666900634766, 0.007990837097167969, 0.008327007293701172, 0.008663177490234375, 0.008999347686767578, 0.009335517883300781, 0.009671688079833984, 0.010007858276367188, 0.01034402847290039, 0.010680198669433594, 0.011016368865966797, 0.0113525390625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 7.0, 5.0, 5.0, 4.0, 4.0, 12.0, 14.0, 12.0, 19.0, 21.0, 24.0, 35.0, 47.0, 56.0, 74.0, 115.0, 179.0, 234.0, 394.0, 750.0, 1820.0, 7063.0, 72126.0, 3873252.0, 220439.0, 12747.0, 2381.0, 913.0, 454.0, 269.0, 162.0, 139.0, 105.0, 81.0, 71.0, 59.0, 40.0, 30.0, 24.0, 22.0, 20.0, 15.0, 12.0, 14.0, 4.0, 8.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.040985107421875, -0.03950309753417969, -0.038021087646484375, -0.03653907775878906, -0.03505706787109375, -0.03357505798339844, -0.032093048095703125, -0.030611038208007812, -0.0291290283203125, -0.027647018432617188, -0.026165008544921875, -0.024682998657226562, -0.02320098876953125, -0.021718978881835938, -0.020236968994140625, -0.018754959106445312, -0.01727294921875, -0.015790939331054688, -0.014308929443359375, -0.012826919555664062, -0.01134490966796875, -0.009862899780273438, -0.008380889892578125, -0.0068988800048828125, -0.0054168701171875, -0.0039348602294921875, -0.002452850341796875, -0.0009708404541015625, 0.00051116943359375, 0.0019931793212890625, 0.003475189208984375, 0.0049571990966796875, 0.006439208984375, 0.007921218872070312, 0.009403228759765625, 0.010885238647460938, 0.01236724853515625, 0.013849258422851562, 0.015331268310546875, 0.016813278198242188, 0.0182952880859375, 0.019777297973632812, 0.021259307861328125, 0.022741317749023438, 0.02422332763671875, 0.025705337524414062, 0.027187347412109375, 0.028669357299804688, 0.0301513671875, 0.03163337707519531, 0.033115386962890625, 0.03459739685058594, 0.03607940673828125, 0.03756141662597656, 0.039043426513671875, 0.04052543640136719, 0.0420074462890625, 0.04348945617675781, 0.044971466064453125, 0.04645347595214844, 0.04793548583984375, 0.04941749572753906, 0.050899505615234375, 0.05238151550292969, 0.053863525390625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 10.0, 18.0, 42.0, 57.0, 105.0, 191.0, 660.0, 1452.0, 947.0, 306.0, 119.0, 62.0, 33.0, 22.0, 13.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.041717529296875, -0.04035615921020508, -0.038994789123535156, -0.037633419036865234, -0.03627204895019531, -0.03491067886352539, -0.03354930877685547, -0.03218793869018555, -0.030826568603515625, -0.029465198516845703, -0.02810382843017578, -0.02674245834350586, -0.025381088256835938, -0.024019718170166016, -0.022658348083496094, -0.021296977996826172, -0.01993560791015625, -0.018574237823486328, -0.017212867736816406, -0.015851497650146484, -0.014490127563476562, -0.01312875747680664, -0.011767387390136719, -0.010406017303466797, -0.009044647216796875, -0.007683277130126953, -0.006321907043457031, -0.004960536956787109, -0.0035991668701171875, -0.0022377967834472656, -0.0008764266967773438, 0.0004849433898925781, 0.0018463134765625, 0.003207683563232422, 0.004569053649902344, 0.005930423736572266, 0.0072917938232421875, 0.00865316390991211, 0.010014533996582031, 0.011375904083251953, 0.012737274169921875, 0.014098644256591797, 0.015460014343261719, 0.01682138442993164, 0.018182754516601562, 0.019544124603271484, 0.020905494689941406, 0.022266864776611328, 0.02362823486328125, 0.024989604949951172, 0.026350975036621094, 0.027712345123291016, 0.029073715209960938, 0.03043508529663086, 0.03179645538330078, 0.0331578254699707, 0.034519195556640625, 0.03588056564331055, 0.03724193572998047, 0.03860330581665039, 0.03996467590332031, 0.041326045989990234, 0.042687416076660156, 0.04404878616333008, 0.04541015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 2.0, 3.0, 6.0, 1.0, 7.0, 12.0, 19.0, 49.0, 86.0, 143.0, 196.0, 186.0, 125.0, 58.0, 52.0, 20.0, 9.0, 11.0, 10.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26120105385780334, -0.2501150965690613, -0.2390291690826416, -0.22794322669506073, -0.21685728430747986, -0.205771341919899, -0.19468539953231812, -0.18359945714473724, -0.17251351475715637, -0.1614275723695755, -0.15034162998199463, -0.13925568759441376, -0.12816974520683289, -0.11708380281925201, -0.10599786043167114, -0.09491191804409027, -0.0838259756565094, -0.07274003326892853, -0.061654090881347656, -0.050568148493766785, -0.03948220610618591, -0.02839626371860504, -0.01731032133102417, -0.006224378943443298, 0.004861563444137573, 0.015947505831718445, 0.027033448219299316, 0.03811939060688019, 0.04920533299446106, 0.06029127538204193, 0.0713772177696228, 0.08246316015720367, 0.09354913234710693, 0.1046350747346878, 0.11572101712226868, 0.12680695950984955, 0.13789290189743042, 0.1489788442850113, 0.16006478667259216, 0.17115072906017303, 0.1822366714477539, 0.19332261383533478, 0.20440855622291565, 0.21549449861049652, 0.2265804409980774, 0.23766638338565826, 0.24875232577323914, 0.2598382830619812, 0.2709242105484009, 0.28201013803482056, 0.2930960953235626, 0.3041820526123047, 0.31526798009872437, 0.32635390758514404, 0.3374398648738861, 0.3485258221626282, 0.35961174964904785, 0.37069767713546753, 0.3817836344242096, 0.39286959171295166, 0.40395551919937134, 0.415041446685791, 0.4261274039745331, 0.43721336126327515, 0.4482992887496948]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 1.0, 11.0, 17.0, 18.0, 29.0, 32.0, 40.0, 79.0, 81.0, 103.0, 98.0, 79.0, 110.0, 62.0, 82.0, 42.0, 34.0, 32.0, 27.0, 10.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21377688646316528, -0.2059030681848526, -0.19802924990653992, -0.19015543162822723, -0.18228161334991455, -0.17440779507160187, -0.16653397679328918, -0.1586601436138153, -0.15078634023666382, -0.14291252195835114, -0.13503870368003845, -0.12716488540172577, -0.11929106712341309, -0.1114172488451004, -0.10354342311620712, -0.09566960483789444, -0.08779577910900116, -0.07992196083068848, -0.0720481425523758, -0.06417432427406311, -0.05630050227046013, -0.048426683992147446, -0.040552861988544464, -0.03267904371023178, -0.024805225431919098, -0.016931407153606415, -0.009057587012648582, -0.0011837668716907501, 0.006690051406621933, 0.014563869684934616, 0.022437691688537598, 0.03031150996685028, 0.038185328245162964, 0.04605914652347565, 0.05393296480178833, 0.06180678680539131, 0.0696806013584137, 0.07755441963672638, 0.08542824536561966, 0.09330206364393234, 0.10117588192224503, 0.10904970020055771, 0.11692351847887039, 0.12479734420776367, 0.13267116248607635, 0.14054498076438904, 0.14841879904270172, 0.1562926173210144, 0.1641664355993271, 0.17204025387763977, 0.17991407215595245, 0.18778789043426514, 0.19566170871257782, 0.2035355269908905, 0.21140936017036438, 0.21928316354751587, 0.22715699672698975, 0.23503081500530243, 0.2429046332836151, 0.250778466463089, 0.2586522698402405, 0.26652610301971436, 0.27439990639686584, 0.2822737395763397, 0.2901475429534912]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 8.0, 9.0, 18.0, 22.0, 28.0, 49.0, 66.0, 126.0, 195.0, 264.0, 479.0, 831.0, 1393.0, 2662.0, 5221.0, 11265.0, 26559.0, 66984.0, 179805.0, 368039.0, 234540.0, 88095.0, 34003.0, 14207.0, 6417.0, 3289.0, 1639.0, 898.0, 560.0, 349.0, 185.0, 112.0, 66.0, 58.0, 32.0, 20.0, 16.0, 11.0, 8.0, 6.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169677734375, -0.016375303268432617, -0.015782833099365234, -0.015190362930297852, -0.014597892761230469, -0.014005422592163086, -0.013412952423095703, -0.01282048225402832, -0.012228012084960938, -0.011635541915893555, -0.011043071746826172, -0.010450601577758789, -0.009858131408691406, -0.009265661239624023, -0.00867319107055664, -0.008080720901489258, -0.007488250732421875, -0.006895780563354492, -0.006303310394287109, -0.0057108402252197266, -0.005118370056152344, -0.004525899887084961, -0.003933429718017578, -0.0033409595489501953, -0.0027484893798828125, -0.0021560192108154297, -0.0015635490417480469, -0.0009710788726806641, -0.00037860870361328125, 0.00021386146545410156, 0.0008063316345214844, 0.0013988018035888672, 0.00199127197265625, 0.002583742141723633, 0.0031762123107910156, 0.0037686824798583984, 0.004361152648925781, 0.004953622817993164, 0.005546092987060547, 0.00613856315612793, 0.0067310333251953125, 0.007323503494262695, 0.007915973663330078, 0.008508443832397461, 0.009100914001464844, 0.009693384170532227, 0.01028585433959961, 0.010878324508666992, 0.011470794677734375, 0.012063264846801758, 0.01265573501586914, 0.013248205184936523, 0.013840675354003906, 0.014433145523071289, 0.015025615692138672, 0.015618085861206055, 0.016210556030273438, 0.01680302619934082, 0.017395496368408203, 0.017987966537475586, 0.01858043670654297, 0.01917290687561035, 0.019765377044677734, 0.020357847213745117, 0.0209503173828125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 10.0, 4.0, 11.0, 15.0, 13.0, 18.0, 20.0, 30.0, 23.0, 30.0, 32.0, 34.0, 40.0, 49.0, 59.0, 59.0, 49.0, 64.0, 45.0, 50.0, 39.0, 49.0, 32.0, 34.0, 25.0, 31.0, 31.0, 21.0, 16.0, 16.0, 11.0, 8.0, 6.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00959014892578125, -0.009249091148376465, -0.00890803337097168, -0.008566975593566895, -0.00822591781616211, -0.007884860038757324, -0.007543802261352539, -0.007202744483947754, -0.006861686706542969, -0.006520628929138184, -0.0061795711517333984, -0.005838513374328613, -0.005497455596923828, -0.005156397819519043, -0.004815340042114258, -0.004474282264709473, -0.0041332244873046875, -0.0037921667098999023, -0.003451108932495117, -0.003110051155090332, -0.002768993377685547, -0.0024279356002807617, -0.0020868778228759766, -0.0017458200454711914, -0.0014047622680664062, -0.001063704490661621, -0.0007226467132568359, -0.0003815889358520508, -4.0531158447265625e-05, 0.00030052661895751953, 0.0006415843963623047, 0.0009826421737670898, 0.001323699951171875, 0.0016647577285766602, 0.0020058155059814453, 0.0023468732833862305, 0.0026879310607910156, 0.0030289888381958008, 0.003370046615600586, 0.003711104393005371, 0.004052162170410156, 0.004393219947814941, 0.0047342777252197266, 0.005075335502624512, 0.005416393280029297, 0.005757451057434082, 0.006098508834838867, 0.006439566612243652, 0.0067806243896484375, 0.007121682167053223, 0.007462739944458008, 0.007803797721862793, 0.008144855499267578, 0.008485913276672363, 0.008826971054077148, 0.009168028831481934, 0.009509086608886719, 0.009850144386291504, 0.010191202163696289, 0.010532259941101074, 0.01087331771850586, 0.011214375495910645, 0.01155543327331543, 0.011896491050720215, 0.012237548828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 7.0, 3.0, 12.0, 12.0, 10.0, 16.0, 16.0, 40.0, 57.0, 77.0, 85.0, 177.0, 243.0, 361.0, 563.0, 979.0, 2043.0, 5293.0, 21134.0, 160722.0, 746464.0, 88120.0, 13964.0, 4103.0, 1682.0, 807.0, 536.0, 352.0, 199.0, 123.0, 88.0, 73.0, 46.0, 42.0, 30.0, 27.0, 12.0, 10.0, 11.0, 5.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.050445556640625, -0.04897785186767578, -0.04751014709472656, -0.046042442321777344, -0.044574737548828125, -0.043107032775878906, -0.04163932800292969, -0.04017162322998047, -0.03870391845703125, -0.03723621368408203, -0.03576850891113281, -0.034300804138183594, -0.032833099365234375, -0.031365394592285156, -0.029897689819335938, -0.02842998504638672, -0.0269622802734375, -0.02549457550048828, -0.024026870727539062, -0.022559165954589844, -0.021091461181640625, -0.019623756408691406, -0.018156051635742188, -0.01668834686279297, -0.01522064208984375, -0.013752937316894531, -0.012285232543945312, -0.010817527770996094, -0.009349822998046875, -0.007882118225097656, -0.0064144134521484375, -0.004946708679199219, -0.00347900390625, -0.0020112991333007812, -0.0005435943603515625, 0.0009241104125976562, 0.002391815185546875, 0.0038595199584960938, 0.0053272247314453125, 0.006794929504394531, 0.00826263427734375, 0.009730339050292969, 0.011198043823242188, 0.012665748596191406, 0.014133453369140625, 0.015601158142089844, 0.017068862915039062, 0.01853656768798828, 0.0200042724609375, 0.02147197723388672, 0.022939682006835938, 0.024407386779785156, 0.025875091552734375, 0.027342796325683594, 0.028810501098632812, 0.03027820587158203, 0.03174591064453125, 0.03321361541748047, 0.03468132019042969, 0.036149024963378906, 0.037616729736328125, 0.039084434509277344, 0.04055213928222656, 0.04201984405517578, 0.043487548828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 1.0, 6.0, 4.0, 7.0, 12.0, 15.0, 15.0, 20.0, 24.0, 19.0, 29.0, 32.0, 32.0, 49.0, 50.0, 43.0, 58.0, 60.0, 55.0, 64.0, 37.0, 48.0, 36.0, 39.0, 37.0, 34.0, 34.0, 19.0, 17.0, 25.0, 17.0, 13.0, 12.0, 6.0, 5.0, 2.0, 7.0, 3.0, 6.0, 4.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04266357421875, -0.04126167297363281, -0.039859771728515625, -0.03845787048339844, -0.03705596923828125, -0.03565406799316406, -0.034252166748046875, -0.03285026550292969, -0.0314483642578125, -0.030046463012695312, -0.028644561767578125, -0.027242660522460938, -0.02584075927734375, -0.024438858032226562, -0.023036956787109375, -0.021635055541992188, -0.020233154296875, -0.018831253051757812, -0.017429351806640625, -0.016027450561523438, -0.01462554931640625, -0.013223648071289062, -0.011821746826171875, -0.010419845581054688, -0.0090179443359375, -0.0076160430908203125, -0.006214141845703125, -0.0048122406005859375, -0.00341033935546875, -0.0020084381103515625, -0.000606536865234375, 0.0007953643798828125, 0.002197265625, 0.0035991668701171875, 0.005001068115234375, 0.0064029693603515625, 0.00780487060546875, 0.009206771850585938, 0.010608673095703125, 0.012010574340820312, 0.0134124755859375, 0.014814376831054688, 0.016216278076171875, 0.017618179321289062, 0.01902008056640625, 0.020421981811523438, 0.021823883056640625, 0.023225784301757812, 0.024627685546875, 0.026029586791992188, 0.027431488037109375, 0.028833389282226562, 0.03023529052734375, 0.03163719177246094, 0.033039093017578125, 0.03444099426269531, 0.0358428955078125, 0.03724479675292969, 0.038646697998046875, 0.04004859924316406, 0.04145050048828125, 0.04285240173339844, 0.044254302978515625, 0.04565620422363281, 0.04705810546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 12.0, 14.0, 37.0, 46.0, 79.0, 171.0, 332.0, 832.0, 2329.0, 8283.0, 38475.0, 716601.0, 248560.0, 24152.0, 5619.0, 1762.0, 671.0, 267.0, 130.0, 78.0, 49.0, 24.0, 9.0, 6.0, 4.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.03802490234375, -0.037137746810913086, -0.03625059127807617, -0.03536343574523926, -0.034476280212402344, -0.03358912467956543, -0.032701969146728516, -0.0318148136138916, -0.030927658081054688, -0.030040502548217773, -0.02915334701538086, -0.028266191482543945, -0.02737903594970703, -0.026491880416870117, -0.025604724884033203, -0.02471756935119629, -0.023830413818359375, -0.02294325828552246, -0.022056102752685547, -0.021168947219848633, -0.02028179168701172, -0.019394636154174805, -0.01850748062133789, -0.017620325088500977, -0.016733169555664062, -0.01584601402282715, -0.014958858489990234, -0.01407170295715332, -0.013184547424316406, -0.012297391891479492, -0.011410236358642578, -0.010523080825805664, -0.00963592529296875, -0.008748769760131836, -0.007861614227294922, -0.006974458694458008, -0.006087303161621094, -0.00520014762878418, -0.004312992095947266, -0.0034258365631103516, -0.0025386810302734375, -0.0016515254974365234, -0.0007643699645996094, 0.0001227855682373047, 0.0010099411010742188, 0.0018970966339111328, 0.002784252166748047, 0.003671407699584961, 0.004558563232421875, 0.005445718765258789, 0.006332874298095703, 0.007220029830932617, 0.008107185363769531, 0.008994340896606445, 0.00988149642944336, 0.010768651962280273, 0.011655807495117188, 0.012542963027954102, 0.013430118560791016, 0.01431727409362793, 0.015204429626464844, 0.016091585159301758, 0.016978740692138672, 0.017865896224975586, 0.0187530517578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 7.0, 5.0, 7.0, 4.0, 9.0, 11.0, 8.0, 15.0, 9.0, 24.0, 17.0, 19.0, 35.0, 45.0, 78.0, 79.0, 84.0, 103.0, 76.0, 70.0, 58.0, 48.0, 28.0, 33.0, 26.0, 10.0, 16.0, 10.0, 6.0, 12.0, 11.0, 8.0, 8.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.9577484130859375e-05, -3.827642649412155e-05, -3.697536885738373e-05, -3.5674311220645905e-05, -3.437325358390808e-05, -3.307219594717026e-05, -3.1771138310432434e-05, -3.047008067369461e-05, -2.9169023036956787e-05, -2.7867965400218964e-05, -2.656690776348114e-05, -2.5265850126743317e-05, -2.3964792490005493e-05, -2.266373485326767e-05, -2.1362677216529846e-05, -2.0061619579792023e-05, -1.87605619430542e-05, -1.7459504306316376e-05, -1.6158446669578552e-05, -1.4857389032840729e-05, -1.3556331396102905e-05, -1.2255273759365082e-05, -1.0954216122627258e-05, -9.653158485889435e-06, -8.352100849151611e-06, -7.051043212413788e-06, -5.749985575675964e-06, -4.448927938938141e-06, -3.1478703022003174e-06, -1.846812665462494e-06, -5.457550287246704e-07, 7.553026080131531e-07, 2.0563602447509766e-06, 3.3574178814888e-06, 4.6584755182266235e-06, 5.959533154964447e-06, 7.2605907917022705e-06, 8.561648428440094e-06, 9.862706065177917e-06, 1.1163763701915741e-05, 1.2464821338653564e-05, 1.3765878975391388e-05, 1.5066936612129211e-05, 1.6367994248867035e-05, 1.766905188560486e-05, 1.8970109522342682e-05, 2.0271167159080505e-05, 2.157222479581833e-05, 2.2873282432556152e-05, 2.4174340069293976e-05, 2.54753977060318e-05, 2.6776455342769623e-05, 2.8077512979507446e-05, 2.937857061624527e-05, 3.067962825298309e-05, 3.198068588972092e-05, 3.328174352645874e-05, 3.4582801163196564e-05, 3.588385879993439e-05, 3.718491643667221e-05, 3.8485974073410034e-05, 3.978703171014786e-05, 4.108808934688568e-05, 4.2389146983623505e-05, 4.369020462036133e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 16.0, 22.0, 34.0, 48.0, 72.0, 113.0, 236.0, 458.0, 902.0, 2177.0, 6422.0, 26110.0, 201963.0, 728515.0, 62507.0, 12449.0, 3782.0, 1331.0, 642.0, 306.0, 182.0, 98.0, 57.0, 33.0, 26.0, 20.0, 9.0, 6.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01611328125, -0.015420198440551758, -0.014727115631103516, -0.014034032821655273, -0.013340950012207031, -0.012647867202758789, -0.011954784393310547, -0.011261701583862305, -0.010568618774414062, -0.00987553596496582, -0.009182453155517578, -0.008489370346069336, -0.007796287536621094, -0.0071032047271728516, -0.006410121917724609, -0.005717039108276367, -0.005023956298828125, -0.004330873489379883, -0.0036377906799316406, -0.0029447078704833984, -0.0022516250610351562, -0.001558542251586914, -0.0008654594421386719, -0.0001723766326904297, 0.0005207061767578125, 0.0012137889862060547, 0.0019068717956542969, 0.002599954605102539, 0.0032930374145507812, 0.0039861202239990234, 0.004679203033447266, 0.005372285842895508, 0.00606536865234375, 0.006758451461791992, 0.007451534271240234, 0.008144617080688477, 0.008837699890136719, 0.009530782699584961, 0.010223865509033203, 0.010916948318481445, 0.011610031127929688, 0.01230311393737793, 0.012996196746826172, 0.013689279556274414, 0.014382362365722656, 0.015075445175170898, 0.01576852798461914, 0.016461610794067383, 0.017154693603515625, 0.017847776412963867, 0.01854085922241211, 0.01923394203186035, 0.019927024841308594, 0.020620107650756836, 0.021313190460205078, 0.02200627326965332, 0.022699356079101562, 0.023392438888549805, 0.024085521697998047, 0.02477860450744629, 0.02547168731689453, 0.026164770126342773, 0.026857852935791016, 0.027550935745239258, 0.0282440185546875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 7.0, 4.0, 10.0, 13.0, 26.0, 33.0, 42.0, 64.0, 81.0, 104.0, 145.0, 128.0, 92.0, 84.0, 51.0, 36.0, 22.0, 19.0, 16.0, 12.0, 1.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0260162353515625, -0.02534627914428711, -0.02467632293701172, -0.024006366729736328, -0.023336410522460938, -0.022666454315185547, -0.021996498107910156, -0.021326541900634766, -0.020656585693359375, -0.019986629486083984, -0.019316673278808594, -0.018646717071533203, -0.017976760864257812, -0.017306804656982422, -0.01663684844970703, -0.01596689224243164, -0.01529693603515625, -0.01462697982788086, -0.013957023620605469, -0.013287067413330078, -0.012617111206054688, -0.011947154998779297, -0.011277198791503906, -0.010607242584228516, -0.009937286376953125, -0.009267330169677734, -0.008597373962402344, -0.007927417755126953, -0.0072574615478515625, -0.006587505340576172, -0.005917549133300781, -0.005247592926025391, -0.00457763671875, -0.003907680511474609, -0.0032377243041992188, -0.002567768096923828, -0.0018978118896484375, -0.0012278556823730469, -0.0005578994750976562, 0.00011205673217773438, 0.000782012939453125, 0.0014519691467285156, 0.0021219253540039062, 0.002791881561279297, 0.0034618377685546875, 0.004131793975830078, 0.004801750183105469, 0.005471706390380859, 0.00614166259765625, 0.006811618804931641, 0.007481575012207031, 0.008151531219482422, 0.008821487426757812, 0.009491443634033203, 0.010161399841308594, 0.010831356048583984, 0.011501312255859375, 0.012171268463134766, 0.012841224670410156, 0.013511180877685547, 0.014181137084960938, 0.014851093292236328, 0.015521049499511719, 0.01619100570678711, 0.0168609619140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 14.0, 33.0, 73.0, 161.0, 294.0, 196.0, 99.0, 54.0, 26.0, 11.0, 7.0, 4.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40993165969848633, -0.396430641412735, -0.38292965292930603, -0.3694286346435547, -0.35592764616012573, -0.3424266278743744, -0.32892560958862305, -0.3154246211051941, -0.30192360281944275, -0.2884225845336914, -0.27492159605026245, -0.2614205777645111, -0.24791957437992096, -0.2344185709953308, -0.22091755270957947, -0.20741654932498932, -0.19391554594039917, -0.18041454255580902, -0.16691353917121887, -0.15341252088546753, -0.13991151750087738, -0.12641051411628723, -0.11290950328111649, -0.09940849244594574, -0.08590748906135559, -0.07240648567676544, -0.058905474841594696, -0.04540446773171425, -0.0319034606218338, -0.018402457237243652, -0.0049014464020729065, 0.00859956443309784, 0.022100597620010376, 0.03560160472989082, 0.04910261183977127, 0.06260362267494202, 0.07610462605953217, 0.08960562944412231, 0.10310664027929306, 0.1166076511144638, 0.13010865449905396, 0.1436096578836441, 0.15711066126823425, 0.1706116795539856, 0.18411268293857574, 0.1976136863231659, 0.21111470460891724, 0.22461570799350739, 0.23811671137809753, 0.2516177296638489, 0.26511871814727783, 0.2786197364330292, 0.2921207547187805, 0.3056217432022095, 0.3191227614879608, 0.33262377977371216, 0.3461247682571411, 0.35962578654289246, 0.3731267750263214, 0.38662779331207275, 0.4001287817955017, 0.41362980008125305, 0.4271308183670044, 0.44063180685043335, 0.4541328251361847]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 9.0, 5.0, 8.0, 9.0, 18.0, 15.0, 21.0, 19.0, 18.0, 19.0, 30.0, 25.0, 39.0, 32.0, 63.0, 75.0, 77.0, 82.0, 67.0, 48.0, 46.0, 29.0, 26.0, 27.0, 25.0, 18.0, 17.0, 17.0, 24.0, 14.0, 14.0, 9.0, 9.0, 8.0, 10.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18436723947525024, -0.17846879363059998, -0.1725703328847885, -0.16667188704013824, -0.16077342629432678, -0.1548749804496765, -0.14897653460502625, -0.14307808876037598, -0.13717962801456451, -0.13128118216991425, -0.12538272142410278, -0.11948427557945251, -0.11358582228422165, -0.10768736898899078, -0.10178892314434052, -0.09589046984910965, -0.08999201655387878, -0.08409356325864792, -0.07819510996341705, -0.07229666411876678, -0.06639821082353592, -0.060499757528305054, -0.05460130795836449, -0.04870285838842392, -0.042804405093193054, -0.03690595179796219, -0.03100750222802162, -0.025109050795435905, -0.01921059936285019, -0.013312147930264473, -0.007413696497678757, -0.0015152469277381897, 0.004383206367492676, 0.010281657800078392, 0.01618010923266411, 0.022078560665249825, 0.02797701209783554, 0.033875465393066406, 0.03977391496300697, 0.04567236453294754, 0.051570817828178406, 0.05746927112340927, 0.06336772441864014, 0.0692661702632904, 0.07516462355852127, 0.08106307685375214, 0.0869615226984024, 0.09285997599363327, 0.09875842928886414, 0.104656882584095, 0.11055533587932587, 0.11645378172397614, 0.122352235019207, 0.12825068831443787, 0.13414913415908813, 0.1400475800037384, 0.14594604074954987, 0.15184448659420013, 0.1577429473400116, 0.16364139318466187, 0.16953983902931213, 0.1754382997751236, 0.18133674561977386, 0.18723520636558533, 0.1931336522102356]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 8.0, 10.0, 10.0, 25.0, 25.0, 40.0, 70.0, 116.0, 224.0, 460.0, 1090.0, 2679.0, 9222.0, 50327.0, 1202807.0, 2811959.0, 94845.0, 14009.0, 3845.0, 1340.0, 537.0, 257.0, 126.0, 87.0, 52.0, 32.0, 23.0, 17.0, 6.0, 8.0, 3.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0276031494140625, -0.026655912399291992, -0.025708675384521484, -0.024761438369750977, -0.02381420135498047, -0.02286696434020996, -0.021919727325439453, -0.020972490310668945, -0.020025253295898438, -0.01907801628112793, -0.018130779266357422, -0.017183542251586914, -0.016236305236816406, -0.015289068222045898, -0.01434183120727539, -0.013394594192504883, -0.012447357177734375, -0.011500120162963867, -0.01055288314819336, -0.009605646133422852, -0.008658409118652344, -0.007711172103881836, -0.006763935089111328, -0.00581669807434082, -0.0048694610595703125, -0.003922224044799805, -0.002974987030029297, -0.002027750015258789, -0.0010805130004882812, -0.00013327598571777344, 0.0008139610290527344, 0.0017611980438232422, 0.00270843505859375, 0.003655672073364258, 0.004602909088134766, 0.0055501461029052734, 0.006497383117675781, 0.007444620132446289, 0.008391857147216797, 0.009339094161987305, 0.010286331176757812, 0.01123356819152832, 0.012180805206298828, 0.013128042221069336, 0.014075279235839844, 0.015022516250610352, 0.01596975326538086, 0.016916990280151367, 0.017864227294921875, 0.018811464309692383, 0.01975870132446289, 0.0207059383392334, 0.021653175354003906, 0.022600412368774414, 0.023547649383544922, 0.02449488639831543, 0.025442123413085938, 0.026389360427856445, 0.027336597442626953, 0.02828383445739746, 0.02923107147216797, 0.030178308486938477, 0.031125545501708984, 0.03207278251647949, 0.03302001953125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 8.0, 5.0, 13.0, 12.0, 11.0, 22.0, 23.0, 38.0, 38.0, 27.0, 42.0, 47.0, 50.0, 51.0, 60.0, 52.0, 53.0, 65.0, 48.0, 60.0, 40.0, 41.0, 38.0, 27.0, 27.0, 20.0, 18.0, 14.0, 9.0, 8.0, 6.0, 7.0, 2.0, 3.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01012420654296875, -0.00977480411529541, -0.00942540168762207, -0.00907599925994873, -0.00872659683227539, -0.00837719440460205, -0.008027791976928711, -0.007678389549255371, -0.007328987121582031, -0.006979584693908691, -0.0066301822662353516, -0.006280779838562012, -0.005931377410888672, -0.005581974983215332, -0.005232572555541992, -0.004883170127868652, -0.0045337677001953125, -0.004184365272521973, -0.003834962844848633, -0.003485560417175293, -0.003136157989501953, -0.0027867555618286133, -0.0024373531341552734, -0.0020879507064819336, -0.0017385482788085938, -0.001389145851135254, -0.001039743423461914, -0.0006903409957885742, -0.0003409385681152344, 8.463859558105469e-06, 0.0003578662872314453, 0.0007072687149047852, 0.001056671142578125, 0.0014060735702514648, 0.0017554759979248047, 0.0021048784255981445, 0.0024542808532714844, 0.0028036832809448242, 0.003153085708618164, 0.003502488136291504, 0.0038518905639648438, 0.004201292991638184, 0.0045506954193115234, 0.004900097846984863, 0.005249500274658203, 0.005598902702331543, 0.005948305130004883, 0.006297707557678223, 0.0066471099853515625, 0.006996512413024902, 0.007345914840698242, 0.007695317268371582, 0.008044719696044922, 0.008394122123718262, 0.008743524551391602, 0.009092926979064941, 0.009442329406738281, 0.009791731834411621, 0.010141134262084961, 0.0104905366897583, 0.01083993911743164, 0.01118934154510498, 0.01153874397277832, 0.01188814640045166, 0.012237548828125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 8.0, 8.0, 20.0, 13.0, 17.0, 28.0, 34.0, 43.0, 58.0, 88.0, 96.0, 130.0, 207.0, 317.0, 469.0, 872.0, 2513.0, 40351.0, 4107131.0, 36695.0, 2488.0, 878.0, 537.0, 352.0, 234.0, 175.0, 123.0, 98.0, 82.0, 55.0, 37.0, 29.0, 18.0, 22.0, 18.0, 7.0, 7.0, 5.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09112548828125, -0.08792686462402344, -0.08472824096679688, -0.08152961730957031, -0.07833099365234375, -0.07513236999511719, -0.07193374633789062, -0.06873512268066406, -0.0655364990234375, -0.06233787536621094, -0.059139251708984375, -0.05594062805175781, -0.05274200439453125, -0.04954338073730469, -0.046344757080078125, -0.04314613342285156, -0.039947509765625, -0.03674888610839844, -0.033550262451171875, -0.030351638793945312, -0.02715301513671875, -0.023954391479492188, -0.020755767822265625, -0.017557144165039062, -0.0143585205078125, -0.011159896850585938, -0.007961273193359375, -0.0047626495361328125, -0.00156402587890625, 0.0016345977783203125, 0.004833221435546875, 0.008031845092773438, 0.01123046875, 0.014429092407226562, 0.017627716064453125, 0.020826339721679688, 0.02402496337890625, 0.027223587036132812, 0.030422210693359375, 0.03362083435058594, 0.0368194580078125, 0.04001808166503906, 0.043216705322265625, 0.04641532897949219, 0.04961395263671875, 0.05281257629394531, 0.056011199951171875, 0.05920982360839844, 0.062408447265625, 0.06560707092285156, 0.06880569458007812, 0.07200431823730469, 0.07520294189453125, 0.07840156555175781, 0.08160018920898438, 0.08479881286621094, 0.0879974365234375, 0.09119606018066406, 0.09439468383789062, 0.09759330749511719, 0.10079193115234375, 0.10399055480957031, 0.10718917846679688, 0.11038780212402344, 0.11358642578125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 12.0, 43.0, 91.0, 330.0, 1937.0, 1369.0, 185.0, 63.0, 20.0, 6.0, 10.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0833740234375, -0.08037853240966797, -0.07738304138183594, -0.0743875503540039, -0.07139205932617188, -0.06839656829833984, -0.06540107727050781, -0.06240558624267578, -0.05941009521484375, -0.05641460418701172, -0.05341911315917969, -0.050423622131347656, -0.047428131103515625, -0.044432640075683594, -0.04143714904785156, -0.03844165802001953, -0.0354461669921875, -0.03245067596435547, -0.029455184936523438, -0.026459693908691406, -0.023464202880859375, -0.020468711853027344, -0.017473220825195312, -0.014477729797363281, -0.01148223876953125, -0.008486747741699219, -0.0054912567138671875, -0.0024957656860351562, 0.000499725341796875, 0.0034952163696289062, 0.0064907073974609375, 0.009486198425292969, 0.012481689453125, 0.015477180480957031, 0.018472671508789062, 0.021468162536621094, 0.024463653564453125, 0.027459144592285156, 0.030454635620117188, 0.03345012664794922, 0.03644561767578125, 0.03944110870361328, 0.04243659973144531, 0.045432090759277344, 0.048427581787109375, 0.051423072814941406, 0.05441856384277344, 0.05741405487060547, 0.0604095458984375, 0.06340503692626953, 0.06640052795410156, 0.0693960189819336, 0.07239151000976562, 0.07538700103759766, 0.07838249206542969, 0.08137798309326172, 0.08437347412109375, 0.08736896514892578, 0.09036445617675781, 0.09335994720458984, 0.09635543823242188, 0.0993509292602539, 0.10234642028808594, 0.10534191131591797, 0.10833740234375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 16.0, 33.0, 113.0, 247.0, 349.0, 134.0, 56.0, 14.0, 8.0, 9.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4741882085800171, -0.44468289613723755, -0.4151776134967804, -0.38567230105400085, -0.3561669886112213, -0.32666170597076416, -0.2971563935279846, -0.2676510810852051, -0.23814578354358673, -0.20864048600196838, -0.17913517355918884, -0.1496298760175705, -0.12012457102537155, -0.09061926603317261, -0.06111396849155426, -0.03160865604877472, -0.002103358507156372, 0.027401944622397423, 0.05690724775195122, 0.08641254901885986, 0.11591785401105881, 0.14542315900325775, 0.1749284565448761, 0.20443376898765564, 0.233939066529274, 0.26344436407089233, 0.2929496765136719, 0.3224549889564514, 0.35196027159690857, 0.3814655840396881, 0.41097086668014526, 0.4404761791229248, 0.46998149156570435, 0.4994868040084839, 0.5289921164512634, 0.558497428894043, 0.5880026817321777, 0.6175079941749573, 0.6470133066177368, 0.6765186190605164, 0.7060239315032959, 0.7355292439460754, 0.765034556388855, 0.7945398092269897, 0.8240451216697693, 0.8535504341125488, 0.8830557465553284, 0.9125610589981079, 0.9420663118362427, 0.9715716242790222, 1.0010769367218018, 1.0305821895599365, 1.0600875616073608, 1.0895928144454956, 1.11909818649292, 1.1486034393310547, 1.178108811378479, 1.2076140642166138, 1.237119436264038, 1.2666246891021729, 1.2961300611495972, 1.325635313987732, 1.3551406860351562, 1.384645938873291, 1.4141511917114258]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 8.0, 6.0, 9.0, 8.0, 11.0, 13.0, 19.0, 20.0, 30.0, 37.0, 41.0, 54.0, 49.0, 55.0, 64.0, 73.0, 45.0, 50.0, 43.0, 56.0, 49.0, 54.0, 39.0, 25.0, 21.0, 20.0, 24.0, 14.0, 16.0, 13.0, 11.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2241661548614502, -0.21562409400939941, -0.20708203315734863, -0.19853997230529785, -0.18999791145324707, -0.1814558506011963, -0.1729138046503067, -0.16437174379825592, -0.15582968294620514, -0.14728762209415436, -0.13874556124210358, -0.1302035003900528, -0.12166144698858261, -0.11311938613653183, -0.10457733273506165, -0.09603527188301086, -0.08749321103096008, -0.0789511501789093, -0.07040908932685852, -0.061867035925388336, -0.053324975073337555, -0.044782914221286774, -0.03624085709452629, -0.027698799967765808, -0.019156739115715027, -0.010614680126309395, -0.002072621136903763, 0.006469437852501869, 0.015011496841907501, 0.023553557693958282, 0.032095614820718765, 0.04063767194747925, 0.04917973279953003, 0.05772179365158081, 0.06626385450363159, 0.07480590790510178, 0.08334796875715256, 0.09189002960920334, 0.10043208301067352, 0.1089741438627243, 0.11751620471477509, 0.12605826556682587, 0.13460032641887665, 0.14314238727092743, 0.15168443322181702, 0.1602264940738678, 0.16876855492591858, 0.17731061577796936, 0.18585267663002014, 0.19439473748207092, 0.2029367983341217, 0.21147885918617249, 0.22002092003822327, 0.22856298089027405, 0.23710502684116364, 0.24564708769321442, 0.254189133644104, 0.2627311944961548, 0.27127325534820557, 0.27981531620025635, 0.28835737705230713, 0.2968994379043579, 0.3054414987564087, 0.3139835596084595, 0.32252562046051025]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 6.0, 13.0, 20.0, 17.0, 45.0, 56.0, 97.0, 122.0, 201.0, 355.0, 605.0, 1058.0, 2053.0, 4155.0, 9560.0, 24353.0, 75055.0, 259993.0, 429047.0, 162863.0, 48184.0, 16926.0, 7000.0, 3100.0, 1533.0, 853.0, 491.0, 266.0, 175.0, 106.0, 75.0, 40.0, 43.0, 23.0, 15.0, 13.0, 7.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.032196044921875, -0.031229496002197266, -0.03026294708251953, -0.029296398162841797, -0.028329849243164062, -0.027363300323486328, -0.026396751403808594, -0.02543020248413086, -0.024463653564453125, -0.02349710464477539, -0.022530555725097656, -0.021564006805419922, -0.020597457885742188, -0.019630908966064453, -0.01866436004638672, -0.017697811126708984, -0.01673126220703125, -0.015764713287353516, -0.014798164367675781, -0.013831615447998047, -0.012865066528320312, -0.011898517608642578, -0.010931968688964844, -0.00996541976928711, -0.008998870849609375, -0.00803232192993164, -0.007065773010253906, -0.006099224090576172, -0.0051326751708984375, -0.004166126251220703, -0.0031995773315429688, -0.0022330284118652344, -0.0012664794921875, -0.0002999305725097656, 0.0006666183471679688, 0.0016331672668457031, 0.0025997161865234375, 0.003566265106201172, 0.004532814025878906, 0.005499362945556641, 0.006465911865234375, 0.007432460784912109, 0.008399009704589844, 0.009365558624267578, 0.010332107543945312, 0.011298656463623047, 0.012265205383300781, 0.013231754302978516, 0.01419830322265625, 0.015164852142333984, 0.01613140106201172, 0.017097949981689453, 0.018064498901367188, 0.019031047821044922, 0.019997596740722656, 0.02096414566040039, 0.021930694580078125, 0.02289724349975586, 0.023863792419433594, 0.024830341339111328, 0.025796890258789062, 0.026763439178466797, 0.02772998809814453, 0.028696537017822266, 0.0296630859375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 3.0, 10.0, 4.0, 10.0, 9.0, 25.0, 25.0, 11.0, 21.0, 22.0, 26.0, 41.0, 26.0, 36.0, 29.0, 45.0, 58.0, 51.0, 52.0, 55.0, 45.0, 45.0, 40.0, 39.0, 23.0, 37.0, 42.0, 25.0, 13.0, 20.0, 21.0, 16.0, 12.0, 15.0, 11.0, 7.0, 12.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.01372528076171875, -0.01329505443572998, -0.012864828109741211, -0.012434601783752441, -0.012004375457763672, -0.011574149131774902, -0.011143922805786133, -0.010713696479797363, -0.010283470153808594, -0.009853243827819824, -0.009423017501831055, -0.008992791175842285, -0.008562564849853516, -0.008132338523864746, -0.0077021121978759766, -0.007271885871887207, -0.0068416595458984375, -0.006411433219909668, -0.0059812068939208984, -0.005550980567932129, -0.005120754241943359, -0.00469052791595459, -0.00426030158996582, -0.0038300752639770508, -0.0033998489379882812, -0.0029696226119995117, -0.002539396286010742, -0.0021091699600219727, -0.0016789436340332031, -0.0012487173080444336, -0.0008184909820556641, -0.00038826465606689453, 4.1961669921875e-05, 0.00047218799591064453, 0.0009024143218994141, 0.0013326406478881836, 0.0017628669738769531, 0.0021930932998657227, 0.002623319625854492, 0.0030535459518432617, 0.0034837722778320312, 0.003913998603820801, 0.00434422492980957, 0.00477445125579834, 0.005204677581787109, 0.005634903907775879, 0.0060651302337646484, 0.006495356559753418, 0.0069255828857421875, 0.007355809211730957, 0.0077860355377197266, 0.008216261863708496, 0.008646488189697266, 0.009076714515686035, 0.009506940841674805, 0.009937167167663574, 0.010367393493652344, 0.010797619819641113, 0.011227846145629883, 0.011658072471618652, 0.012088298797607422, 0.012518525123596191, 0.012948751449584961, 0.01337897777557373, 0.0138092041015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 12.0, 6.0, 13.0, 13.0, 21.0, 36.0, 40.0, 75.0, 119.0, 229.0, 452.0, 874.0, 1746.0, 4621.0, 18179.0, 145191.0, 775161.0, 82439.0, 12538.0, 3629.0, 1544.0, 720.0, 364.0, 196.0, 123.0, 73.0, 35.0, 27.0, 18.0, 18.0, 6.0, 7.0, 4.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07696533203125, -0.07458877563476562, -0.07221221923828125, -0.06983566284179688, -0.0674591064453125, -0.06508255004882812, -0.06270599365234375, -0.060329437255859375, -0.057952880859375, -0.055576324462890625, -0.05319976806640625, -0.050823211669921875, -0.0484466552734375, -0.046070098876953125, -0.04369354248046875, -0.041316986083984375, -0.0389404296875, -0.036563873291015625, -0.03418731689453125, -0.031810760498046875, -0.0294342041015625, -0.027057647705078125, -0.02468109130859375, -0.022304534912109375, -0.019927978515625, -0.017551422119140625, -0.01517486572265625, -0.012798309326171875, -0.0104217529296875, -0.008045196533203125, -0.00566864013671875, -0.003292083740234375, -0.00091552734375, 0.001461029052734375, 0.00383758544921875, 0.006214141845703125, 0.0085906982421875, 0.010967254638671875, 0.01334381103515625, 0.015720367431640625, 0.018096923828125, 0.020473480224609375, 0.02285003662109375, 0.025226593017578125, 0.0276031494140625, 0.029979705810546875, 0.03235626220703125, 0.034732818603515625, 0.037109375, 0.039485931396484375, 0.04186248779296875, 0.044239044189453125, 0.0466156005859375, 0.048992156982421875, 0.05136871337890625, 0.053745269775390625, 0.056121826171875, 0.058498382568359375, 0.06087493896484375, 0.06325149536132812, 0.0656280517578125, 0.06800460815429688, 0.07038116455078125, 0.07275772094726562, 0.07513427734375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 12.0, 14.0, 10.0, 23.0, 35.0, 23.0, 35.0, 30.0, 52.0, 63.0, 84.0, 71.0, 84.0, 80.0, 65.0, 74.0, 49.0, 47.0, 40.0, 25.0, 18.0, 15.0, 8.0, 13.0, 10.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0633544921875, -0.06029510498046875, -0.0572357177734375, -0.05417633056640625, -0.051116943359375, -0.04805755615234375, -0.0449981689453125, -0.04193878173828125, -0.03887939453125, -0.03582000732421875, -0.0327606201171875, -0.02970123291015625, -0.026641845703125, -0.02358245849609375, -0.0205230712890625, -0.01746368408203125, -0.014404296875, -0.01134490966796875, -0.0082855224609375, -0.00522613525390625, -0.002166748046875, 0.00089263916015625, 0.0039520263671875, 0.00701141357421875, 0.01007080078125, 0.01313018798828125, 0.0161895751953125, 0.01924896240234375, 0.022308349609375, 0.02536773681640625, 0.0284271240234375, 0.03148651123046875, 0.0345458984375, 0.03760528564453125, 0.0406646728515625, 0.04372406005859375, 0.046783447265625, 0.04984283447265625, 0.0529022216796875, 0.05596160888671875, 0.05902099609375, 0.06208038330078125, 0.0651397705078125, 0.06819915771484375, 0.071258544921875, 0.07431793212890625, 0.0773773193359375, 0.08043670654296875, 0.08349609375, 0.08655548095703125, 0.0896148681640625, 0.09267425537109375, 0.095733642578125, 0.09879302978515625, 0.1018524169921875, 0.10491180419921875, 0.10797119140625, 0.11103057861328125, 0.1140899658203125, 0.11714935302734375, 0.120208740234375, 0.12326812744140625, 0.1263275146484375, 0.12938690185546875, 0.1324462890625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 23.0, 24.0, 24.0, 34.0, 52.0, 89.0, 124.0, 195.0, 304.0, 445.0, 721.0, 1274.0, 2110.0, 4122.0, 8420.0, 21594.0, 82501.0, 701314.0, 168395.0, 33037.0, 11686.0, 5277.0, 2749.0, 1583.0, 893.0, 517.0, 356.0, 214.0, 141.0, 97.0, 65.0, 44.0, 37.0, 24.0, 16.0, 13.0, 2.0, 9.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.032012939453125, -0.031062602996826172, -0.030112266540527344, -0.029161930084228516, -0.028211593627929688, -0.02726125717163086, -0.02631092071533203, -0.025360584259033203, -0.024410247802734375, -0.023459911346435547, -0.02250957489013672, -0.02155923843383789, -0.020608901977539062, -0.019658565521240234, -0.018708229064941406, -0.017757892608642578, -0.01680755615234375, -0.015857219696044922, -0.014906883239746094, -0.013956546783447266, -0.013006210327148438, -0.01205587387084961, -0.011105537414550781, -0.010155200958251953, -0.009204864501953125, -0.008254528045654297, -0.007304191589355469, -0.006353855133056641, -0.0054035186767578125, -0.004453182220458984, -0.0035028457641601562, -0.002552509307861328, -0.0016021728515625, -0.0006518363952636719, 0.00029850006103515625, 0.0012488365173339844, 0.0021991729736328125, 0.0031495094299316406, 0.004099845886230469, 0.005050182342529297, 0.006000518798828125, 0.006950855255126953, 0.007901191711425781, 0.00885152816772461, 0.009801864624023438, 0.010752201080322266, 0.011702537536621094, 0.012652873992919922, 0.01360321044921875, 0.014553546905517578, 0.015503883361816406, 0.016454219818115234, 0.017404556274414062, 0.01835489273071289, 0.01930522918701172, 0.020255565643310547, 0.021205902099609375, 0.022156238555908203, 0.02310657501220703, 0.02405691146850586, 0.025007247924804688, 0.025957584381103516, 0.026907920837402344, 0.027858257293701172, 0.02880859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 12.0, 14.0, 19.0, 24.0, 30.0, 39.0, 63.0, 76.0, 74.0, 98.0, 94.0, 98.0, 87.0, 57.0, 50.0, 46.0, 31.0, 24.0, 23.0, 13.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0067901611328125e-05, -4.876870661973953e-05, -4.746951162815094e-05, -4.617031663656235e-05, -4.4871121644973755e-05, -4.357192665338516e-05, -4.227273166179657e-05, -4.097353667020798e-05, -3.9674341678619385e-05, -3.837514668703079e-05, -3.70759516954422e-05, -3.577675670385361e-05, -3.4477561712265015e-05, -3.317836672067642e-05, -3.187917172908783e-05, -3.057997673749924e-05, -2.9280781745910645e-05, -2.7981586754322052e-05, -2.668239176273346e-05, -2.5383196771144867e-05, -2.4084001779556274e-05, -2.2784806787967682e-05, -2.148561179637909e-05, -2.0186416804790497e-05, -1.8887221813201904e-05, -1.7588026821613312e-05, -1.628883183002472e-05, -1.4989636838436127e-05, -1.3690441846847534e-05, -1.2391246855258942e-05, -1.1092051863670349e-05, -9.792856872081757e-06, -8.493661880493164e-06, -7.1944668889045715e-06, -5.895271897315979e-06, -4.5960769057273865e-06, -3.296881914138794e-06, -1.9976869225502014e-06, -6.984919309616089e-07, 6.007030606269836e-07, 1.8998980522155762e-06, 3.1990930438041687e-06, 4.498288035392761e-06, 5.797483026981354e-06, 7.096678018569946e-06, 8.395873010158539e-06, 9.695068001747131e-06, 1.0994262993335724e-05, 1.2293457984924316e-05, 1.3592652976512909e-05, 1.4891847968101501e-05, 1.6191042959690094e-05, 1.7490237951278687e-05, 1.878943294286728e-05, 2.008862793445587e-05, 2.1387822926044464e-05, 2.2687017917633057e-05, 2.398621290922165e-05, 2.5285407900810242e-05, 2.6584602892398834e-05, 2.7883797883987427e-05, 2.918299287557602e-05, 3.0482187867164612e-05, 3.1781382858753204e-05, 3.30805778503418e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 9.0, 9.0, 4.0, 20.0, 22.0, 22.0, 55.0, 71.0, 93.0, 183.0, 343.0, 629.0, 1225.0, 2911.0, 7396.0, 25433.0, 157855.0, 750720.0, 75801.0, 16178.0, 5298.0, 2085.0, 1013.0, 492.0, 284.0, 171.0, 81.0, 38.0, 36.0, 16.0, 14.0, 18.0, 4.0, 8.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.036468505859375, -0.03530454635620117, -0.034140586853027344, -0.032976627349853516, -0.03181266784667969, -0.03064870834350586, -0.02948474884033203, -0.028320789337158203, -0.027156829833984375, -0.025992870330810547, -0.02482891082763672, -0.02366495132446289, -0.022500991821289062, -0.021337032318115234, -0.020173072814941406, -0.019009113311767578, -0.01784515380859375, -0.016681194305419922, -0.015517234802246094, -0.014353275299072266, -0.013189315795898438, -0.01202535629272461, -0.010861396789550781, -0.009697437286376953, -0.008533477783203125, -0.007369518280029297, -0.006205558776855469, -0.005041599273681641, -0.0038776397705078125, -0.0027136802673339844, -0.0015497207641601562, -0.0003857612609863281, 0.0007781982421875, 0.0019421577453613281, 0.0031061172485351562, 0.004270076751708984, 0.0054340362548828125, 0.006597995758056641, 0.007761955261230469, 0.008925914764404297, 0.010089874267578125, 0.011253833770751953, 0.012417793273925781, 0.01358175277709961, 0.014745712280273438, 0.015909671783447266, 0.017073631286621094, 0.018237590789794922, 0.01940155029296875, 0.020565509796142578, 0.021729469299316406, 0.022893428802490234, 0.024057388305664062, 0.02522134780883789, 0.02638530731201172, 0.027549266815185547, 0.028713226318359375, 0.029877185821533203, 0.03104114532470703, 0.03220510482788086, 0.03336906433105469, 0.034533023834228516, 0.035696983337402344, 0.03686094284057617, 0.03802490234375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 8.0, 23.0, 23.0, 23.0, 25.0, 50.0, 54.0, 72.0, 113.0, 131.0, 108.0, 77.0, 68.0, 56.0, 34.0, 21.0, 22.0, 10.0, 7.0, 8.0, 5.0, 8.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0350341796875, -0.03402376174926758, -0.033013343811035156, -0.032002925872802734, -0.030992507934570312, -0.02998208999633789, -0.02897167205810547, -0.027961254119873047, -0.026950836181640625, -0.025940418243408203, -0.02493000030517578, -0.02391958236694336, -0.022909164428710938, -0.021898746490478516, -0.020888328552246094, -0.019877910614013672, -0.01886749267578125, -0.017857074737548828, -0.016846656799316406, -0.015836238861083984, -0.014825820922851562, -0.01381540298461914, -0.012804985046386719, -0.011794567108154297, -0.010784149169921875, -0.009773731231689453, -0.008763313293457031, -0.007752895355224609, -0.0067424774169921875, -0.005732059478759766, -0.004721641540527344, -0.003711223602294922, -0.0027008056640625, -0.0016903877258300781, -0.0006799697875976562, 0.0003304481506347656, 0.0013408660888671875, 0.0023512840270996094, 0.0033617019653320312, 0.004372119903564453, 0.005382537841796875, 0.006392955780029297, 0.007403373718261719, 0.00841379165649414, 0.009424209594726562, 0.010434627532958984, 0.011445045471191406, 0.012455463409423828, 0.01346588134765625, 0.014476299285888672, 0.015486717224121094, 0.016497135162353516, 0.017507553100585938, 0.01851797103881836, 0.01952838897705078, 0.020538806915283203, 0.021549224853515625, 0.022559642791748047, 0.02357006072998047, 0.02458047866821289, 0.025590896606445312, 0.026601314544677734, 0.027611732482910156, 0.028622150421142578, 0.029632568359375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 3.0, 8.0, 4.0, 20.0, 18.0, 33.0, 65.0, 108.0, 145.0, 316.0, 143.0, 62.0, 32.0, 16.0, 7.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.09871506690979, -1.0755971670150757, -1.0524792671203613, -1.0293612480163574, -1.006243348121643, -0.9831254482269287, -0.9600075483322144, -0.9368896484375, -0.9137716889381409, -0.8906537890434265, -0.8675358295440674, -0.844417929649353, -0.8213000297546387, -0.7981820702552795, -0.7750641703605652, -0.751946210861206, -0.7288283109664917, -0.7057104110717773, -0.6825924515724182, -0.6594745516777039, -0.6363565921783447, -0.6132386922836304, -0.590120792388916, -0.5670028924942017, -0.5438849329948425, -0.5207670331001282, -0.49764907360076904, -0.4745311737060547, -0.45141324400901794, -0.4282953143119812, -0.40517741441726685, -0.3820594847202301, -0.35894155502319336, -0.3358236253261566, -0.3127056956291199, -0.2895877957344055, -0.2664698660373688, -0.24335193634033203, -0.22023402154445648, -0.19711610674858093, -0.1739981770515442, -0.15088024735450745, -0.1277623325586319, -0.10464441031217575, -0.0815264880657196, -0.05840856581926346, -0.03529064357280731, -0.012172728776931763, 0.01094520092010498, 0.03406312316656113, 0.05718104541301727, 0.08029896765947342, 0.10341688990592957, 0.1265348196029663, 0.14965273439884186, 0.1727706491947174, 0.19588857889175415, 0.2190065085887909, 0.24212442338466644, 0.265242338180542, 0.28836026787757874, 0.3114781975746155, 0.33459609746932983, 0.3577140271663666, 0.3808319568634033]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 11.0, 10.0, 2.0, 9.0, 14.0, 13.0, 20.0, 14.0, 26.0, 32.0, 22.0, 20.0, 28.0, 23.0, 29.0, 47.0, 59.0, 82.0, 94.0, 81.0, 47.0, 44.0, 36.0, 31.0, 28.0, 22.0, 18.0, 21.0, 20.0, 18.0, 10.0, 8.0, 15.0, 12.0, 6.0, 6.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.392331600189209, -0.3809349834918976, -0.3695383369922638, -0.3581417202949524, -0.3467450737953186, -0.3353484570980072, -0.3239518404006958, -0.312555193901062, -0.3011585772037506, -0.2897619605064392, -0.2783653140068054, -0.266968697309494, -0.25557205080986023, -0.24417543411254883, -0.23277880251407623, -0.22138217091560364, -0.20998553931713104, -0.19858890771865845, -0.18719227612018585, -0.17579564452171326, -0.16439902782440186, -0.15300239622592926, -0.14160576462745667, -0.13020914793014526, -0.11881250888109207, -0.10741587728261948, -0.09601925313472748, -0.08462262153625488, -0.07322598993778229, -0.06182936578989029, -0.050432734191417694, -0.039036110043525696, -0.0276394784450531, -0.016242850571870804, -0.004846220836043358, 0.006550408899784088, 0.017947036772966385, 0.02934366464614868, 0.04074029624462128, 0.052136920392513275, 0.06353355199098587, 0.07493018358945847, 0.08632680773735046, 0.09772343933582306, 0.10912007093429565, 0.12051669508218765, 0.13191333413124084, 0.14330995082855225, 0.15470658242702484, 0.16610321402549744, 0.17749984562397003, 0.18889647722244263, 0.20029309391975403, 0.21168972551822662, 0.22308635711669922, 0.23448297381401062, 0.2458796203136444, 0.2572762370109558, 0.2686728835105896, 0.280069500207901, 0.2914661467075348, 0.3028627634048462, 0.31425940990448, 0.3256560266017914, 0.3370526432991028]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 2.0, 6.0, 8.0, 16.0, 16.0, 31.0, 38.0, 51.0, 67.0, 117.0, 149.0, 218.0, 352.0, 496.0, 881.0, 1499.0, 2864.0, 6477.0, 17613.0, 68809.0, 507979.0, 2823147.0, 648314.0, 81105.0, 19679.0, 6936.0, 3176.0, 1598.0, 949.0, 543.0, 364.0, 231.0, 166.0, 107.0, 76.0, 60.0, 36.0, 31.0, 24.0, 8.0, 16.0, 7.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.026611328125, -0.025793790817260742, -0.024976253509521484, -0.024158716201782227, -0.02334117889404297, -0.02252364158630371, -0.021706104278564453, -0.020888566970825195, -0.020071029663085938, -0.01925349235534668, -0.018435955047607422, -0.017618417739868164, -0.016800880432128906, -0.01598334312438965, -0.01516580581665039, -0.014348268508911133, -0.013530731201171875, -0.012713193893432617, -0.01189565658569336, -0.011078119277954102, -0.010260581970214844, -0.009443044662475586, -0.008625507354736328, -0.00780797004699707, -0.0069904327392578125, -0.006172895431518555, -0.005355358123779297, -0.004537820816040039, -0.0037202835083007812, -0.0029027462005615234, -0.0020852088928222656, -0.0012676715850830078, -0.00045013427734375, 0.0003674030303955078, 0.0011849403381347656, 0.0020024776458740234, 0.0028200149536132812, 0.003637552261352539, 0.004455089569091797, 0.005272626876831055, 0.0060901641845703125, 0.00690770149230957, 0.007725238800048828, 0.008542776107788086, 0.009360313415527344, 0.010177850723266602, 0.01099538803100586, 0.011812925338745117, 0.012630462646484375, 0.013447999954223633, 0.01426553726196289, 0.015083074569702148, 0.015900611877441406, 0.016718149185180664, 0.017535686492919922, 0.01835322380065918, 0.019170761108398438, 0.019988298416137695, 0.020805835723876953, 0.02162337303161621, 0.02244091033935547, 0.023258447647094727, 0.024075984954833984, 0.024893522262573242, 0.0257110595703125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 6.0, 2.0, 9.0, 16.0, 9.0, 23.0, 21.0, 31.0, 28.0, 31.0, 38.0, 43.0, 40.0, 54.0, 51.0, 61.0, 55.0, 62.0, 58.0, 52.0, 43.0, 39.0, 40.0, 21.0, 28.0, 29.0, 15.0, 17.0, 20.0, 12.0, 6.0, 8.0, 11.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.018829345703125, -0.018265247344970703, -0.017701148986816406, -0.01713705062866211, -0.016572952270507812, -0.016008853912353516, -0.015444755554199219, -0.014880657196044922, -0.014316558837890625, -0.013752460479736328, -0.013188362121582031, -0.012624263763427734, -0.012060165405273438, -0.01149606704711914, -0.010931968688964844, -0.010367870330810547, -0.00980377197265625, -0.009239673614501953, -0.008675575256347656, -0.00811147689819336, -0.0075473785400390625, -0.006983280181884766, -0.006419181823730469, -0.005855083465576172, -0.005290985107421875, -0.004726886749267578, -0.004162788391113281, -0.0035986900329589844, -0.0030345916748046875, -0.0024704933166503906, -0.0019063949584960938, -0.0013422966003417969, -0.0007781982421875, -0.00021409988403320312, 0.00034999847412109375, 0.0009140968322753906, 0.0014781951904296875, 0.0020422935485839844, 0.0026063919067382812, 0.003170490264892578, 0.003734588623046875, 0.004298686981201172, 0.004862785339355469, 0.005426883697509766, 0.0059909820556640625, 0.006555080413818359, 0.007119178771972656, 0.007683277130126953, 0.00824737548828125, 0.008811473846435547, 0.009375572204589844, 0.00993967056274414, 0.010503768920898438, 0.011067867279052734, 0.011631965637207031, 0.012196063995361328, 0.012760162353515625, 0.013324260711669922, 0.013888359069824219, 0.014452457427978516, 0.015016555786132812, 0.01558065414428711, 0.016144752502441406, 0.016708850860595703, 0.01727294921875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 17.0, 33.0, 74.0, 185.0, 518.0, 2669.0, 2584356.0, 1603086.0, 2467.0, 535.0, 209.0, 75.0, 36.0, 15.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3236846923828125, -0.313873291015625, -0.3040618896484375, -0.29425048828125, -0.2844390869140625, -0.274627685546875, -0.2648162841796875, -0.2550048828125, -0.2451934814453125, -0.235382080078125, -0.2255706787109375, -0.21575927734375, -0.2059478759765625, -0.196136474609375, -0.1863250732421875, -0.176513671875, -0.1667022705078125, -0.156890869140625, -0.1470794677734375, -0.13726806640625, -0.1274566650390625, -0.117645263671875, -0.1078338623046875, -0.0980224609375, -0.0882110595703125, -0.078399658203125, -0.0685882568359375, -0.05877685546875, -0.0489654541015625, -0.039154052734375, -0.0293426513671875, -0.01953125, -0.0097198486328125, 9.1552734375e-05, 0.0099029541015625, 0.01971435546875, 0.0295257568359375, 0.039337158203125, 0.0491485595703125, 0.0589599609375, 0.0687713623046875, 0.078582763671875, 0.0883941650390625, 0.09820556640625, 0.1080169677734375, 0.117828369140625, 0.1276397705078125, 0.137451171875, 0.1472625732421875, 0.157073974609375, 0.1668853759765625, 0.17669677734375, 0.1865081787109375, 0.196319580078125, 0.2061309814453125, 0.2159423828125, 0.2257537841796875, 0.235565185546875, 0.2453765869140625, 0.25518798828125, 0.2649993896484375, 0.274810791015625, 0.2846221923828125, 0.29443359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 21.0, 43.0, 94.0, 491.0, 2556.0, 673.0, 114.0, 35.0, 20.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1182861328125, -0.11326789855957031, -0.10824966430664062, -0.10323143005371094, -0.09821319580078125, -0.09319496154785156, -0.08817672729492188, -0.08315849304199219, -0.0781402587890625, -0.07312202453613281, -0.06810379028320312, -0.06308555603027344, -0.05806732177734375, -0.05304908752441406, -0.048030853271484375, -0.04301261901855469, -0.037994384765625, -0.03297615051269531, -0.027957916259765625, -0.022939682006835938, -0.01792144775390625, -0.012903213500976562, -0.007884979248046875, -0.0028667449951171875, 0.0021514892578125, 0.0071697235107421875, 0.012187957763671875, 0.017206192016601562, 0.02222442626953125, 0.027242660522460938, 0.032260894775390625, 0.03727912902832031, 0.04229736328125, 0.04731559753417969, 0.052333831787109375, 0.05735206604003906, 0.06237030029296875, 0.06738853454589844, 0.07240676879882812, 0.07742500305175781, 0.0824432373046875, 0.08746147155761719, 0.09247970581054688, 0.09749794006347656, 0.10251617431640625, 0.10753440856933594, 0.11255264282226562, 0.11757087707519531, 0.122589111328125, 0.1276073455810547, 0.13262557983398438, 0.13764381408691406, 0.14266204833984375, 0.14768028259277344, 0.15269851684570312, 0.1577167510986328, 0.1627349853515625, 0.1677532196044922, 0.17277145385742188, 0.17778968811035156, 0.18280792236328125, 0.18782615661621094, 0.19284439086914062, 0.1978626251220703, 0.202880859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 11.0, 18.0, 26.0, 49.0, 85.0, 120.0, 183.0, 160.0, 124.0, 101.0, 51.0, 25.0, 15.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3671375513076782, -0.3498218059539795, -0.33250606060028076, -0.31519031524658203, -0.2978745698928833, -0.28055882453918457, -0.26324307918548584, -0.2459273487329483, -0.22861160337924957, -0.21129585802555084, -0.1939801126718521, -0.17666438221931458, -0.15934863686561584, -0.14203289151191711, -0.12471714615821838, -0.10740140080451965, -0.09008565545082092, -0.07276991009712219, -0.05545416846871376, -0.03813842684030533, -0.020822681486606598, -0.0035069361329078674, 0.013808801770210266, 0.031124547123908997, 0.04844029247760773, 0.06575603783130646, 0.08307178318500519, 0.10038752108812332, 0.11770326644182205, 0.13501900434494019, 0.15233474969863892, 0.16965049505233765, 0.18696624040603638, 0.2042819857597351, 0.22159773111343384, 0.23891347646713257, 0.2562292218208313, 0.27354496717453003, 0.29086071252822876, 0.3081764578819275, 0.3254922032356262, 0.34280794858932495, 0.3601236939430237, 0.3774394392967224, 0.39475518465042114, 0.4120709300041199, 0.4293866753578186, 0.44670242071151733, 0.4640181362628937, 0.4813338816165924, 0.49864962697029114, 0.5159653425216675, 0.5332810878753662, 0.5505968332290649, 0.5679125785827637, 0.5852283239364624, 0.6025440692901611, 0.6198598146438599, 0.6371755599975586, 0.6544913053512573, 0.671807050704956, 0.6891227960586548, 0.7064385414123535, 0.7237542867660522, 0.741070032119751]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 7.0, 5.0, 6.0, 12.0, 7.0, 15.0, 15.0, 15.0, 15.0, 15.0, 17.0, 22.0, 43.0, 31.0, 39.0, 37.0, 35.0, 42.0, 46.0, 45.0, 47.0, 53.0, 46.0, 38.0, 38.0, 40.0, 28.0, 40.0, 35.0, 30.0, 26.0, 22.0, 14.0, 16.0, 13.0, 8.0, 6.0, 7.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.26610541343688965, -0.2573443651199341, -0.2485833317041397, -0.23982229828834534, -0.23106126487255096, -0.2223002314567566, -0.21353918313980103, -0.20477814972400665, -0.19601711630821228, -0.1872560828924179, -0.17849503457546234, -0.16973400115966797, -0.1609729677438736, -0.15221193432807922, -0.14345088601112366, -0.13468985259532928, -0.12592880427837372, -0.11716776341199875, -0.10840672999620438, -0.0996456891298294, -0.09088465571403503, -0.08212361484766006, -0.0733625739812851, -0.06460154056549072, -0.05584049969911575, -0.04707946255803108, -0.03831842541694641, -0.02955738455057144, -0.02079634740948677, -0.0120353102684021, -0.00327426940202713, 0.005486767739057541, 0.014247804880142212, 0.023008842021226883, 0.031769879162311554, 0.04053092002868652, 0.049291957169771194, 0.058052994310855865, 0.06681403517723083, 0.07557506859302521, 0.08433610945940018, 0.09309715032577515, 0.10185818374156952, 0.11061922460794449, 0.11938026547431946, 0.12814129889011383, 0.1369023323059082, 0.14566338062286377, 0.15442441403865814, 0.16318544745445251, 0.17194649577140808, 0.18070752918720245, 0.18946856260299683, 0.1982296109199524, 0.20699064433574677, 0.21575167775154114, 0.2245127260684967, 0.23327375948429108, 0.24203480780124664, 0.250795841217041, 0.2595568895339966, 0.26831790804862976, 0.2770789563655853, 0.2858400046825409, 0.2946010231971741]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 10.0, 8.0, 15.0, 19.0, 35.0, 53.0, 75.0, 132.0, 217.0, 434.0, 808.0, 1722.0, 3671.0, 8857.0, 23093.0, 69371.0, 244115.0, 452873.0, 165279.0, 48846.0, 16588.0, 6480.0, 2939.0, 1287.0, 705.0, 385.0, 215.0, 123.0, 69.0, 42.0, 27.0, 25.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0303497314453125, -0.029239892959594727, -0.028130054473876953, -0.02702021598815918, -0.025910377502441406, -0.024800539016723633, -0.02369070053100586, -0.022580862045288086, -0.021471023559570312, -0.02036118507385254, -0.019251346588134766, -0.018141508102416992, -0.01703166961669922, -0.015921831130981445, -0.014811992645263672, -0.013702154159545898, -0.012592315673828125, -0.011482477188110352, -0.010372638702392578, -0.009262800216674805, -0.008152961730957031, -0.007043123245239258, -0.005933284759521484, -0.004823446273803711, -0.0037136077880859375, -0.002603769302368164, -0.0014939308166503906, -0.0003840923309326172, 0.0007257461547851562, 0.0018355846405029297, 0.002945423126220703, 0.0040552616119384766, 0.00516510009765625, 0.0062749385833740234, 0.007384777069091797, 0.00849461555480957, 0.009604454040527344, 0.010714292526245117, 0.01182413101196289, 0.012933969497680664, 0.014043807983398438, 0.015153646469116211, 0.016263484954833984, 0.017373323440551758, 0.01848316192626953, 0.019593000411987305, 0.020702838897705078, 0.02181267738342285, 0.022922515869140625, 0.0240323543548584, 0.025142192840576172, 0.026252031326293945, 0.02736186981201172, 0.028471708297729492, 0.029581546783447266, 0.03069138526916504, 0.03180122375488281, 0.032911062240600586, 0.03402090072631836, 0.03513073921203613, 0.036240577697753906, 0.03735041618347168, 0.03846025466918945, 0.03957009315490723, 0.040679931640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 6.0, 11.0, 13.0, 18.0, 15.0, 13.0, 18.0, 20.0, 35.0, 30.0, 35.0, 59.0, 50.0, 53.0, 63.0, 66.0, 63.0, 53.0, 54.0, 56.0, 45.0, 38.0, 35.0, 29.0, 28.0, 21.0, 17.0, 9.0, 15.0, 9.0, 3.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0231475830078125, -0.022438526153564453, -0.021729469299316406, -0.02102041244506836, -0.020311355590820312, -0.019602298736572266, -0.01889324188232422, -0.018184185028076172, -0.017475128173828125, -0.016766071319580078, -0.01605701446533203, -0.015347957611083984, -0.014638900756835938, -0.01392984390258789, -0.013220787048339844, -0.012511730194091797, -0.01180267333984375, -0.011093616485595703, -0.010384559631347656, -0.00967550277709961, -0.008966445922851562, -0.008257389068603516, -0.007548332214355469, -0.006839275360107422, -0.006130218505859375, -0.005421161651611328, -0.004712104797363281, -0.004003047943115234, -0.0032939910888671875, -0.0025849342346191406, -0.0018758773803710938, -0.0011668205261230469, -0.000457763671875, 0.0002512931823730469, 0.0009603500366210938, 0.0016694068908691406, 0.0023784637451171875, 0.0030875205993652344, 0.0037965774536132812, 0.004505634307861328, 0.005214691162109375, 0.005923748016357422, 0.006632804870605469, 0.007341861724853516, 0.008050918579101562, 0.00875997543334961, 0.009469032287597656, 0.010178089141845703, 0.01088714599609375, 0.011596202850341797, 0.012305259704589844, 0.01301431655883789, 0.013723373413085938, 0.014432430267333984, 0.015141487121582031, 0.015850543975830078, 0.016559600830078125, 0.017268657684326172, 0.01797771453857422, 0.018686771392822266, 0.019395828247070312, 0.02010488510131836, 0.020813941955566406, 0.021522998809814453, 0.0222320556640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 4.0, 9.0, 8.0, 11.0, 24.0, 27.0, 36.0, 41.0, 64.0, 59.0, 93.0, 145.0, 228.0, 362.0, 440.0, 945.0, 2134.0, 6123.0, 25575.0, 187258.0, 731433.0, 73006.0, 13064.0, 3806.0, 1500.0, 740.0, 420.0, 260.0, 208.0, 144.0, 105.0, 59.0, 52.0, 31.0, 32.0, 20.0, 23.0, 17.0, 10.0, 9.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0], "bins": [-0.07611083984375, -0.07389068603515625, -0.0716705322265625, -0.06945037841796875, -0.067230224609375, -0.06501007080078125, -0.0627899169921875, -0.06056976318359375, -0.058349609375, -0.05612945556640625, -0.0539093017578125, -0.05168914794921875, -0.049468994140625, -0.04724884033203125, -0.0450286865234375, -0.04280853271484375, -0.04058837890625, -0.03836822509765625, -0.0361480712890625, -0.03392791748046875, -0.031707763671875, -0.02948760986328125, -0.0272674560546875, -0.02504730224609375, -0.0228271484375, -0.02060699462890625, -0.0183868408203125, -0.01616668701171875, -0.013946533203125, -0.01172637939453125, -0.0095062255859375, -0.00728607177734375, -0.00506591796875, -0.00284576416015625, -0.0006256103515625, 0.00159454345703125, 0.003814697265625, 0.00603485107421875, 0.0082550048828125, 0.01047515869140625, 0.0126953125, 0.01491546630859375, 0.0171356201171875, 0.01935577392578125, 0.021575927734375, 0.02379608154296875, 0.0260162353515625, 0.02823638916015625, 0.03045654296875, 0.03267669677734375, 0.0348968505859375, 0.03711700439453125, 0.039337158203125, 0.04155731201171875, 0.0437774658203125, 0.04599761962890625, 0.0482177734375, 0.05043792724609375, 0.0526580810546875, 0.05487823486328125, 0.057098388671875, 0.05931854248046875, 0.0615386962890625, 0.06375885009765625, 0.06597900390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 8.0, 5.0, 11.0, 10.0, 10.0, 14.0, 10.0, 14.0, 16.0, 27.0, 21.0, 44.0, 20.0, 35.0, 50.0, 46.0, 36.0, 53.0, 54.0, 46.0, 51.0, 57.0, 40.0, 52.0, 46.0, 37.0, 28.0, 26.0, 20.0, 19.0, 20.0, 13.0, 6.0, 14.0, 5.0, 9.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0831298828125, -0.08056926727294922, -0.07800865173339844, -0.07544803619384766, -0.07288742065429688, -0.0703268051147461, -0.06776618957519531, -0.06520557403564453, -0.06264495849609375, -0.06008434295654297, -0.05752372741699219, -0.054963111877441406, -0.052402496337890625, -0.049841880798339844, -0.04728126525878906, -0.04472064971923828, -0.0421600341796875, -0.03959941864013672, -0.03703880310058594, -0.034478187561035156, -0.031917572021484375, -0.029356956481933594, -0.026796340942382812, -0.02423572540283203, -0.02167510986328125, -0.01911449432373047, -0.016553878784179688, -0.013993263244628906, -0.011432647705078125, -0.008872032165527344, -0.0063114166259765625, -0.0037508010864257812, -0.001190185546875, 0.0013704299926757812, 0.0039310455322265625, 0.006491661071777344, 0.009052276611328125, 0.011612892150878906, 0.014173507690429688, 0.01673412322998047, 0.01929473876953125, 0.02185535430908203, 0.024415969848632812, 0.026976585388183594, 0.029537200927734375, 0.032097816467285156, 0.03465843200683594, 0.03721904754638672, 0.0397796630859375, 0.04234027862548828, 0.04490089416503906, 0.047461509704589844, 0.050022125244140625, 0.052582740783691406, 0.05514335632324219, 0.05770397186279297, 0.06026458740234375, 0.06282520294189453, 0.06538581848144531, 0.0679464340209961, 0.07050704956054688, 0.07306766510009766, 0.07562828063964844, 0.07818889617919922, 0.08074951171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 9.0, 11.0, 12.0, 11.0, 31.0, 18.0, 63.0, 93.0, 190.0, 300.0, 776.0, 1934.0, 6042.0, 25309.0, 172434.0, 764960.0, 59278.0, 11684.0, 3222.0, 1145.0, 479.0, 232.0, 125.0, 69.0, 41.0, 26.0, 13.0, 10.0, 10.0, 4.0, 4.0, 5.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02838134765625, -0.027210712432861328, -0.026040077209472656, -0.024869441986083984, -0.023698806762695312, -0.02252817153930664, -0.02135753631591797, -0.020186901092529297, -0.019016265869140625, -0.017845630645751953, -0.01667499542236328, -0.01550436019897461, -0.014333724975585938, -0.013163089752197266, -0.011992454528808594, -0.010821819305419922, -0.00965118408203125, -0.008480548858642578, -0.007309913635253906, -0.006139278411865234, -0.0049686431884765625, -0.0037980079650878906, -0.0026273727416992188, -0.0014567375183105469, -0.000286102294921875, 0.0008845329284667969, 0.0020551681518554688, 0.0032258033752441406, 0.0043964385986328125, 0.005567073822021484, 0.006737709045410156, 0.007908344268798828, 0.0090789794921875, 0.010249614715576172, 0.011420249938964844, 0.012590885162353516, 0.013761520385742188, 0.01493215560913086, 0.01610279083251953, 0.017273426055908203, 0.018444061279296875, 0.019614696502685547, 0.02078533172607422, 0.02195596694946289, 0.023126602172851562, 0.024297237396240234, 0.025467872619628906, 0.026638507843017578, 0.02780914306640625, 0.028979778289794922, 0.030150413513183594, 0.031321048736572266, 0.03249168395996094, 0.03366231918334961, 0.03483295440673828, 0.03600358963012695, 0.037174224853515625, 0.0383448600769043, 0.03951549530029297, 0.04068613052368164, 0.04185676574707031, 0.043027400970458984, 0.044198036193847656, 0.04536867141723633, 0.046539306640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 1.0, 7.0, 7.0, 14.0, 21.0, 29.0, 41.0, 53.0, 60.0, 88.0, 90.0, 94.0, 99.0, 87.0, 73.0, 51.0, 50.0, 35.0, 25.0, 13.0, 12.0, 7.0, 7.0, 7.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.035234451293945e-05, -3.919471055269241e-05, -3.8037076592445374e-05, -3.6879442632198334e-05, -3.5721808671951294e-05, -3.4564174711704254e-05, -3.3406540751457214e-05, -3.2248906791210175e-05, -3.1091272830963135e-05, -2.9933638870716095e-05, -2.8776004910469055e-05, -2.7618370950222015e-05, -2.6460736989974976e-05, -2.5303103029727936e-05, -2.4145469069480896e-05, -2.2987835109233856e-05, -2.1830201148986816e-05, -2.0672567188739777e-05, -1.9514933228492737e-05, -1.8357299268245697e-05, -1.7199665307998657e-05, -1.6042031347751617e-05, -1.4884397387504578e-05, -1.3726763427257538e-05, -1.2569129467010498e-05, -1.1411495506763458e-05, -1.0253861546516418e-05, -9.096227586269379e-06, -7.938593626022339e-06, -6.780959665775299e-06, -5.623325705528259e-06, -4.4656917452812195e-06, -3.3080577850341797e-06, -2.15042382478714e-06, -9.927898645401e-07, 1.648440957069397e-07, 1.3224780559539795e-06, 2.4801120162010193e-06, 3.637745976448059e-06, 4.795379936695099e-06, 5.953013896942139e-06, 7.1106478571891785e-06, 8.268281817436218e-06, 9.425915777683258e-06, 1.0583549737930298e-05, 1.1741183698177338e-05, 1.2898817658424377e-05, 1.4056451618671417e-05, 1.5214085578918457e-05, 1.6371719539165497e-05, 1.7529353499412537e-05, 1.8686987459659576e-05, 1.9844621419906616e-05, 2.1002255380153656e-05, 2.2159889340400696e-05, 2.3317523300647736e-05, 2.4475157260894775e-05, 2.5632791221141815e-05, 2.6790425181388855e-05, 2.7948059141635895e-05, 2.9105693101882935e-05, 3.0263327062129974e-05, 3.1420961022377014e-05, 3.2578594982624054e-05, 3.3736228942871094e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 15.0, 21.0, 28.0, 63.0, 95.0, 158.0, 319.0, 659.0, 1820.0, 5634.0, 25978.0, 254355.0, 708372.0, 39510.0, 7682.0, 2226.0, 831.0, 373.0, 170.0, 88.0, 48.0, 36.0, 23.0, 13.0, 10.0, 7.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04168701171875, -0.04034709930419922, -0.03900718688964844, -0.037667274475097656, -0.036327362060546875, -0.034987449645996094, -0.03364753723144531, -0.03230762481689453, -0.03096771240234375, -0.02962779998779297, -0.028287887573242188, -0.026947975158691406, -0.025608062744140625, -0.024268150329589844, -0.022928237915039062, -0.02158832550048828, -0.0202484130859375, -0.01890850067138672, -0.017568588256835938, -0.016228675842285156, -0.014888763427734375, -0.013548851013183594, -0.012208938598632812, -0.010869026184082031, -0.00952911376953125, -0.008189201354980469, -0.0068492889404296875, -0.005509376525878906, -0.004169464111328125, -0.0028295516967773438, -0.0014896392822265625, -0.00014972686767578125, 0.001190185546875, 0.0025300979614257812, 0.0038700103759765625, 0.005209922790527344, 0.006549835205078125, 0.007889747619628906, 0.009229660034179688, 0.010569572448730469, 0.01190948486328125, 0.013249397277832031, 0.014589309692382812, 0.015929222106933594, 0.017269134521484375, 0.018609046936035156, 0.019948959350585938, 0.02128887176513672, 0.0226287841796875, 0.02396869659423828, 0.025308609008789062, 0.026648521423339844, 0.027988433837890625, 0.029328346252441406, 0.030668258666992188, 0.03200817108154297, 0.03334808349609375, 0.03468799591064453, 0.03602790832519531, 0.037367820739746094, 0.038707733154296875, 0.040047645568847656, 0.04138755798339844, 0.04272747039794922, 0.0440673828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 4.0, 5.0, 14.0, 13.0, 12.0, 22.0, 27.0, 43.0, 66.0, 84.0, 98.0, 166.0, 143.0, 75.0, 66.0, 42.0, 29.0, 27.0, 19.0, 8.0, 7.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0261993408203125, -0.0251767635345459, -0.024154186248779297, -0.023131608963012695, -0.022109031677246094, -0.021086454391479492, -0.02006387710571289, -0.01904129981994629, -0.018018722534179688, -0.016996145248413086, -0.015973567962646484, -0.014950990676879883, -0.013928413391113281, -0.01290583610534668, -0.011883258819580078, -0.010860681533813477, -0.009838104248046875, -0.008815526962280273, -0.007792949676513672, -0.00677037239074707, -0.005747795104980469, -0.004725217819213867, -0.0037026405334472656, -0.002680063247680664, -0.0016574859619140625, -0.0006349086761474609, 0.0003876686096191406, 0.0014102458953857422, 0.0024328231811523438, 0.0034554004669189453, 0.004477977752685547, 0.0055005550384521484, 0.00652313232421875, 0.0075457096099853516, 0.008568286895751953, 0.009590864181518555, 0.010613441467285156, 0.011636018753051758, 0.01265859603881836, 0.013681173324584961, 0.014703750610351562, 0.015726327896118164, 0.016748905181884766, 0.017771482467651367, 0.01879405975341797, 0.01981663703918457, 0.020839214324951172, 0.021861791610717773, 0.022884368896484375, 0.023906946182250977, 0.024929523468017578, 0.02595210075378418, 0.02697467803955078, 0.027997255325317383, 0.029019832611083984, 0.030042409896850586, 0.031064987182617188, 0.03208756446838379, 0.03311014175415039, 0.03413271903991699, 0.035155296325683594, 0.036177873611450195, 0.0372004508972168, 0.0382230281829834, 0.03924560546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 8.0, 11.0, 32.0, 61.0, 120.0, 277.0, 291.0, 107.0, 38.0, 21.0, 7.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.2841212749481201, -1.25989830493927, -1.23567533493042, -1.2114523649215698, -1.1872293949127197, -1.1630065441131592, -1.138783574104309, -1.114560604095459, -1.0903376340866089, -1.0661146640777588, -1.0418916940689087, -1.0176687240600586, -0.9934458136558533, -0.9692228436470032, -0.9449999332427979, -0.9207769632339478, -0.8965539932250977, -0.8723310232162476, -0.8481080532073975, -0.8238851428031921, -0.799662172794342, -0.7754392027854919, -0.7512162923812866, -0.7269933223724365, -0.7027703523635864, -0.6785473823547363, -0.6543244123458862, -0.6301015019416809, -0.6058785319328308, -0.5816555619239807, -0.5574326515197754, -0.5332096815109253, -0.5089866518974304, -0.4847636818885803, -0.4605407416820526, -0.4363178014755249, -0.4120948314666748, -0.3878718614578247, -0.363648921251297, -0.3394259810447693, -0.3152030110359192, -0.2909800410270691, -0.2667571008205414, -0.24253414571285248, -0.21831119060516357, -0.19408823549747467, -0.16986528038978577, -0.14564232528209686, -0.12141937017440796, -0.09719641506671906, -0.07297345995903015, -0.04875050485134125, -0.024527549743652344, -0.00030459463596343994, 0.023918360471725464, 0.04814131557941437, 0.07236427068710327, 0.09658722579479218, 0.12081018090248108, 0.14503313601016998, 0.1692560911178589, 0.1934790462255478, 0.2177020013332367, 0.2419249564409256, 0.2661479115486145]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 2.0, 4.0, 7.0, 2.0, 7.0, 7.0, 11.0, 8.0, 8.0, 15.0, 21.0, 19.0, 21.0, 22.0, 32.0, 30.0, 23.0, 35.0, 28.0, 62.0, 115.0, 113.0, 61.0, 42.0, 32.0, 40.0, 22.0, 25.0, 27.0, 22.0, 22.0, 19.0, 8.0, 11.0, 11.0, 11.0, 6.0, 12.0, 7.0, 6.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.3943328261375427, -0.38268956542015076, -0.3710463345050812, -0.3594030737876892, -0.34775984287261963, -0.33611658215522766, -0.3244733214378357, -0.3128300905227661, -0.30118682980537415, -0.2895435690879822, -0.2779003381729126, -0.26625707745552063, -0.25461381673812866, -0.24297058582305908, -0.23132732510566711, -0.21968407928943634, -0.20804083347320557, -0.1963975876569748, -0.18475434184074402, -0.17311108112335205, -0.16146783530712128, -0.1498245894908905, -0.13818132877349854, -0.12653808295726776, -0.11489483714103699, -0.10325159132480621, -0.09160833805799484, -0.07996508479118347, -0.0683218389749527, -0.056678589433431625, -0.04503533989191055, -0.03339208662509918, -0.021748840808868408, -0.010105591267347336, 0.0015376582741737366, 0.013180907815694809, 0.02482415735721588, 0.036467406898736954, 0.048110656440258026, 0.0597539097070694, 0.07139715552330017, 0.08304040133953094, 0.09468365460634232, 0.10632690787315369, 0.11797015368938446, 0.12961339950561523, 0.1412566602230072, 0.15289990603923798, 0.16454315185546875, 0.17618639767169952, 0.1878296434879303, 0.19947290420532227, 0.21111615002155304, 0.2227593958377838, 0.23440265655517578, 0.24604590237140656, 0.25768914818763733, 0.2693324089050293, 0.2809756398200989, 0.29261890053749084, 0.3042621612548828, 0.3159053921699524, 0.32754865288734436, 0.33919191360473633, 0.3508351445198059]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 10.0, 11.0, 14.0, 18.0, 17.0, 27.0, 38.0, 49.0, 70.0, 105.0, 147.0, 247.0, 342.0, 557.0, 900.0, 1594.0, 3057.0, 6366.0, 16977.0, 74818.0, 715767.0, 2893330.0, 404477.0, 50916.0, 13207.0, 5143.0, 2496.0, 1326.0, 791.0, 465.0, 310.0, 194.0, 143.0, 89.0, 65.0, 44.0, 31.0, 28.0, 22.0, 26.0, 10.0, 9.0, 11.0, 3.0, 4.0, 2.0, 0.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03668212890625, -0.03551340103149414, -0.03434467315673828, -0.03317594528198242, -0.03200721740722656, -0.030838489532470703, -0.029669761657714844, -0.028501033782958984, -0.027332305908203125, -0.026163578033447266, -0.024994850158691406, -0.023826122283935547, -0.022657394409179688, -0.021488666534423828, -0.02031993865966797, -0.01915121078491211, -0.01798248291015625, -0.01681375503540039, -0.01564502716064453, -0.014476299285888672, -0.013307571411132812, -0.012138843536376953, -0.010970115661621094, -0.009801387786865234, -0.008632659912109375, -0.007463932037353516, -0.006295204162597656, -0.005126476287841797, -0.0039577484130859375, -0.002789020538330078, -0.0016202926635742188, -0.0004515647888183594, 0.0007171630859375, 0.0018858909606933594, 0.0030546188354492188, 0.004223346710205078, 0.0053920745849609375, 0.006560802459716797, 0.007729530334472656, 0.008898258209228516, 0.010066986083984375, 0.011235713958740234, 0.012404441833496094, 0.013573169708251953, 0.014741897583007812, 0.015910625457763672, 0.01707935333251953, 0.01824808120727539, 0.01941680908203125, 0.02058553695678711, 0.02175426483154297, 0.022922992706298828, 0.024091720581054688, 0.025260448455810547, 0.026429176330566406, 0.027597904205322266, 0.028766632080078125, 0.029935359954833984, 0.031104087829589844, 0.0322728157043457, 0.03344154357910156, 0.03461027145385742, 0.03577899932861328, 0.03694772720336914, 0.038116455078125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 4.0, 7.0, 9.0, 13.0, 4.0, 24.0, 18.0, 22.0, 30.0, 35.0, 32.0, 47.0, 54.0, 54.0, 51.0, 59.0, 66.0, 46.0, 52.0, 39.0, 46.0, 47.0, 36.0, 40.0, 29.0, 23.0, 20.0, 18.0, 13.0, 14.0, 8.0, 7.0, 6.0, 5.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02337646484375, -0.02267765998840332, -0.02197885513305664, -0.02128005027770996, -0.02058124542236328, -0.0198824405670166, -0.019183635711669922, -0.018484830856323242, -0.017786026000976562, -0.017087221145629883, -0.016388416290283203, -0.015689611434936523, -0.014990806579589844, -0.014292001724243164, -0.013593196868896484, -0.012894392013549805, -0.012195587158203125, -0.011496782302856445, -0.010797977447509766, -0.010099172592163086, -0.009400367736816406, -0.008701562881469727, -0.008002758026123047, -0.007303953170776367, -0.0066051483154296875, -0.005906343460083008, -0.005207538604736328, -0.0045087337493896484, -0.0038099288940429688, -0.003111124038696289, -0.0024123191833496094, -0.0017135143280029297, -0.00101470947265625, -0.0003159046173095703, 0.0003829002380371094, 0.001081705093383789, 0.0017805099487304688, 0.0024793148040771484, 0.003178119659423828, 0.003876924514770508, 0.0045757293701171875, 0.005274534225463867, 0.005973339080810547, 0.0066721439361572266, 0.007370948791503906, 0.008069753646850586, 0.008768558502197266, 0.009467363357543945, 0.010166168212890625, 0.010864973068237305, 0.011563777923583984, 0.012262582778930664, 0.012961387634277344, 0.013660192489624023, 0.014358997344970703, 0.015057802200317383, 0.015756607055664062, 0.016455411911010742, 0.017154216766357422, 0.0178530216217041, 0.01855182647705078, 0.01925063133239746, 0.01994943618774414, 0.02064824104309082, 0.0213470458984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 9.0, 12.0, 32.0, 61.0, 105.0, 304.0, 716.0, 2384.0, 19290.0, 4144639.0, 22623.0, 2683.0, 862.0, 312.0, 137.0, 63.0, 15.0, 13.0, 7.0, 8.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28515625, -0.2763862609863281, -0.26761627197265625, -0.2588462829589844, -0.2500762939453125, -0.24130630493164062, -0.23253631591796875, -0.22376632690429688, -0.214996337890625, -0.20622634887695312, -0.19745635986328125, -0.18868637084960938, -0.1799163818359375, -0.17114639282226562, -0.16237640380859375, -0.15360641479492188, -0.14483642578125, -0.13606643676757812, -0.12729644775390625, -0.11852645874023438, -0.1097564697265625, -0.10098648071289062, -0.09221649169921875, -0.08344650268554688, -0.074676513671875, -0.06590652465820312, -0.05713653564453125, -0.048366546630859375, -0.0395965576171875, -0.030826568603515625, -0.02205657958984375, -0.013286590576171875, -0.0045166015625, 0.004253387451171875, 0.01302337646484375, 0.021793365478515625, 0.0305633544921875, 0.039333343505859375, 0.04810333251953125, 0.056873321533203125, 0.065643310546875, 0.07441329956054688, 0.08318328857421875, 0.09195327758789062, 0.1007232666015625, 0.10949325561523438, 0.11826324462890625, 0.12703323364257812, 0.13580322265625, 0.14457321166992188, 0.15334320068359375, 0.16211318969726562, 0.1708831787109375, 0.17965316772460938, 0.18842315673828125, 0.19719314575195312, 0.205963134765625, 0.21473312377929688, 0.22350311279296875, 0.23227310180664062, 0.2410430908203125, 0.24981307983398438, 0.25858306884765625, 0.2673530578613281, 0.276123046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 18.0, 58.0, 123.0, 599.0, 2263.0, 746.0, 150.0, 53.0, 23.0, 14.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.188720703125, -0.1827392578125, -0.1767578125, -0.1707763671875, -0.164794921875, -0.1588134765625, -0.15283203125, -0.1468505859375, -0.140869140625, -0.1348876953125, -0.12890625, -0.1229248046875, -0.116943359375, -0.1109619140625, -0.10498046875, -0.0989990234375, -0.093017578125, -0.0870361328125, -0.0810546875, -0.0750732421875, -0.069091796875, -0.0631103515625, -0.05712890625, -0.0511474609375, -0.045166015625, -0.0391845703125, -0.033203125, -0.0272216796875, -0.021240234375, -0.0152587890625, -0.00927734375, -0.0032958984375, 0.002685546875, 0.0086669921875, 0.0146484375, 0.0206298828125, 0.026611328125, 0.0325927734375, 0.03857421875, 0.0445556640625, 0.050537109375, 0.0565185546875, 0.0625, 0.0684814453125, 0.074462890625, 0.0804443359375, 0.08642578125, 0.0924072265625, 0.098388671875, 0.1043701171875, 0.1103515625, 0.1163330078125, 0.122314453125, 0.1282958984375, 0.13427734375, 0.1402587890625, 0.146240234375, 0.1522216796875, 0.158203125, 0.1641845703125, 0.170166015625, 0.1761474609375, 0.18212890625, 0.1881103515625, 0.194091796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 23.0, 57.0, 139.0, 308.0, 245.0, 120.0, 43.0, 25.0, 15.0, 7.0, 2.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5114376544952393, -0.4679955840110779, -0.4245535135269165, -0.3811114430427551, -0.33766937255859375, -0.2942273020744324, -0.2507852017879486, -0.20734313130378723, -0.16390106081962585, -0.12045899033546448, -0.0770169124007225, -0.03357483446598053, 0.009867236018180847, 0.053309306502342224, 0.0967513918876648, 0.14019346237182617, 0.18363553285598755, 0.22707760334014893, 0.2705196738243103, 0.3139617443084717, 0.35740381479263306, 0.40084588527679443, 0.4442879855632782, 0.4877300560474396, 0.5311721563339233, 0.5746142268180847, 0.6180562973022461, 0.6614983677864075, 0.7049404382705688, 0.7483825087547302, 0.7918245792388916, 0.8352667093276978, 0.8787087202072144, 0.9221507906913757, 0.9655928611755371, 1.0090349912643433, 1.0524770021438599, 1.095919132232666, 1.1393611431121826, 1.1828032732009888, 1.2262452840805054, 1.2696874141693115, 1.3131294250488281, 1.3565715551376343, 1.4000135660171509, 1.443455696105957, 1.4868977069854736, 1.5303398370742798, 1.573781967163086, 1.617224097251892, 1.6606661081314087, 1.7041082382202148, 1.7475502490997314, 1.7909923791885376, 1.8344343900680542, 1.8778765201568604, 1.921318531036377, 1.964760661125183, 2.0082027912139893, 2.051644802093506, 2.0950868129730225, 2.138528823852539, 2.1819710731506348, 2.2254130840301514, 2.268855094909668]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 12.0, 15.0, 12.0, 17.0, 22.0, 26.0, 37.0, 41.0, 41.0, 83.0, 51.0, 61.0, 50.0, 70.0, 55.0, 56.0, 58.0, 48.0, 40.0, 46.0, 37.0, 39.0, 21.0, 20.0, 11.0, 10.0, 5.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.693741500377655, -0.6767563819885254, -0.6597713232040405, -0.6427862048149109, -0.6258010864257812, -0.6088159680366516, -0.591830849647522, -0.5748457908630371, -0.5578606724739075, -0.5408755540847778, -0.523890495300293, -0.5069053769111633, -0.4899202585220337, -0.47293514013290405, -0.4559500515460968, -0.43896496295928955, -0.4219798445701599, -0.4049947261810303, -0.388009637594223, -0.37102454900741577, -0.35403943061828613, -0.3370543122291565, -0.32006922364234924, -0.303084135055542, -0.28609901666641235, -0.2691138982772827, -0.25212880969047546, -0.23514370620250702, -0.21815860271453857, -0.20117349922657013, -0.18418839573860168, -0.16720329225063324, -0.15021824836730957, -0.13323314487934113, -0.11624804139137268, -0.09926293790340424, -0.08227783441543579, -0.06529273092746735, -0.0483076274394989, -0.03132252395153046, -0.014337420463562012, 0.002647683024406433, 0.019632786512374878, 0.03661789000034332, 0.05360299348831177, 0.07058809697628021, 0.08757320046424866, 0.1045583039522171, 0.12154340744018555, 0.138528510928154, 0.15551361441612244, 0.17249871790409088, 0.18948382139205933, 0.20646892488002777, 0.22345402836799622, 0.24043913185596466, 0.2574242353439331, 0.27440935373306274, 0.29139444231987, 0.30837953090667725, 0.3253646492958069, 0.3423497676849365, 0.3593348562717438, 0.376319944858551, 0.39330506324768066]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 9.0, 10.0, 15.0, 14.0, 36.0, 72.0, 115.0, 183.0, 354.0, 660.0, 1340.0, 2893.0, 7600.0, 23547.0, 92293.0, 467965.0, 352607.0, 68905.0, 18717.0, 6279.0, 2462.0, 1134.0, 605.0, 306.0, 165.0, 112.0, 62.0, 36.0, 28.0, 7.0, 10.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0584716796875, -0.05657958984375, -0.0546875, -0.05279541015625, -0.0509033203125, -0.04901123046875, -0.047119140625, -0.04522705078125, -0.0433349609375, -0.04144287109375, -0.03955078125, -0.03765869140625, -0.0357666015625, -0.03387451171875, -0.031982421875, -0.03009033203125, -0.0281982421875, -0.02630615234375, -0.0244140625, -0.02252197265625, -0.0206298828125, -0.01873779296875, -0.016845703125, -0.01495361328125, -0.0130615234375, -0.01116943359375, -0.00927734375, -0.00738525390625, -0.0054931640625, -0.00360107421875, -0.001708984375, 0.00018310546875, 0.0020751953125, 0.00396728515625, 0.005859375, 0.00775146484375, 0.0096435546875, 0.01153564453125, 0.013427734375, 0.01531982421875, 0.0172119140625, 0.01910400390625, 0.02099609375, 0.02288818359375, 0.0247802734375, 0.02667236328125, 0.028564453125, 0.03045654296875, 0.0323486328125, 0.03424072265625, 0.0361328125, 0.03802490234375, 0.0399169921875, 0.04180908203125, 0.043701171875, 0.04559326171875, 0.0474853515625, 0.04937744140625, 0.05126953125, 0.05316162109375, 0.0550537109375, 0.05694580078125, 0.058837890625, 0.06072998046875, 0.0626220703125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 5.0, 8.0, 6.0, 11.0, 10.0, 19.0, 16.0, 21.0, 17.0, 22.0, 34.0, 28.0, 31.0, 34.0, 54.0, 43.0, 47.0, 52.0, 45.0, 64.0, 61.0, 42.0, 43.0, 28.0, 38.0, 32.0, 34.0, 25.0, 21.0, 17.0, 13.0, 9.0, 9.0, 13.0, 11.0, 4.0, 7.0, 7.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0236358642578125, -0.022861242294311523, -0.022086620330810547, -0.02131199836730957, -0.020537376403808594, -0.019762754440307617, -0.01898813247680664, -0.018213510513305664, -0.017438888549804688, -0.01666426658630371, -0.015889644622802734, -0.015115022659301758, -0.014340400695800781, -0.013565778732299805, -0.012791156768798828, -0.012016534805297852, -0.011241912841796875, -0.010467290878295898, -0.009692668914794922, -0.008918046951293945, -0.008143424987792969, -0.007368803024291992, -0.006594181060791016, -0.005819559097290039, -0.0050449371337890625, -0.004270315170288086, -0.0034956932067871094, -0.002721071243286133, -0.0019464492797851562, -0.0011718273162841797, -0.0003972053527832031, 0.00037741661071777344, 0.00115203857421875, 0.0019266605377197266, 0.002701282501220703, 0.0034759044647216797, 0.004250526428222656, 0.005025148391723633, 0.005799770355224609, 0.006574392318725586, 0.0073490142822265625, 0.008123636245727539, 0.008898258209228516, 0.009672880172729492, 0.010447502136230469, 0.011222124099731445, 0.011996746063232422, 0.012771368026733398, 0.013545989990234375, 0.014320611953735352, 0.015095233917236328, 0.015869855880737305, 0.01664447784423828, 0.017419099807739258, 0.018193721771240234, 0.01896834373474121, 0.019742965698242188, 0.020517587661743164, 0.02129220962524414, 0.022066831588745117, 0.022841453552246094, 0.02361607551574707, 0.024390697479248047, 0.025165319442749023, 0.02593994140625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 7.0, 4.0, 8.0, 6.0, 17.0, 21.0, 26.0, 53.0, 58.0, 77.0, 85.0, 132.0, 166.0, 288.0, 454.0, 758.0, 1310.0, 3275.0, 11348.0, 98363.0, 859900.0, 58055.0, 8281.0, 2572.0, 1252.0, 670.0, 403.0, 281.0, 192.0, 124.0, 98.0, 58.0, 43.0, 42.0, 31.0, 15.0, 15.0, 11.0, 8.0, 7.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.096435546875, -0.09304046630859375, -0.0896453857421875, -0.08625030517578125, -0.082855224609375, -0.07946014404296875, -0.0760650634765625, -0.07266998291015625, -0.06927490234375, -0.06587982177734375, -0.0624847412109375, -0.05908966064453125, -0.055694580078125, -0.05229949951171875, -0.0489044189453125, -0.04550933837890625, -0.0421142578125, -0.03871917724609375, -0.0353240966796875, -0.03192901611328125, -0.028533935546875, -0.02513885498046875, -0.0217437744140625, -0.01834869384765625, -0.01495361328125, -0.01155853271484375, -0.0081634521484375, -0.00476837158203125, -0.001373291015625, 0.00202178955078125, 0.0054168701171875, 0.00881195068359375, 0.01220703125, 0.01560211181640625, 0.0189971923828125, 0.02239227294921875, 0.025787353515625, 0.02918243408203125, 0.0325775146484375, 0.03597259521484375, 0.03936767578125, 0.04276275634765625, 0.0461578369140625, 0.04955291748046875, 0.052947998046875, 0.05634307861328125, 0.0597381591796875, 0.06313323974609375, 0.0665283203125, 0.06992340087890625, 0.0733184814453125, 0.07671356201171875, 0.080108642578125, 0.08350372314453125, 0.0868988037109375, 0.09029388427734375, 0.09368896484375, 0.09708404541015625, 0.1004791259765625, 0.10387420654296875, 0.107269287109375, 0.11066436767578125, 0.1140594482421875, 0.11745452880859375, 0.120849609375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 2.0, 3.0, 7.0, 8.0, 14.0, 11.0, 18.0, 17.0, 29.0, 26.0, 37.0, 50.0, 54.0, 51.0, 69.0, 63.0, 69.0, 64.0, 55.0, 67.0, 46.0, 49.0, 37.0, 25.0, 28.0, 20.0, 15.0, 15.0, 6.0, 11.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.13761138916015625, -0.1337432861328125, -0.12987518310546875, -0.126007080078125, -0.12213897705078125, -0.1182708740234375, -0.11440277099609375, -0.11053466796875, -0.10666656494140625, -0.1027984619140625, -0.09893035888671875, -0.095062255859375, -0.09119415283203125, -0.0873260498046875, -0.08345794677734375, -0.07958984375, -0.07572174072265625, -0.0718536376953125, -0.06798553466796875, -0.064117431640625, -0.06024932861328125, -0.0563812255859375, -0.05251312255859375, -0.04864501953125, -0.04477691650390625, -0.0409088134765625, -0.03704071044921875, -0.033172607421875, -0.02930450439453125, -0.0254364013671875, -0.02156829833984375, -0.0177001953125, -0.01383209228515625, -0.0099639892578125, -0.00609588623046875, -0.002227783203125, 0.00164031982421875, 0.0055084228515625, 0.00937652587890625, 0.01324462890625, 0.01711273193359375, 0.0209808349609375, 0.02484893798828125, 0.028717041015625, 0.03258514404296875, 0.0364532470703125, 0.04032135009765625, 0.044189453125, 0.04805755615234375, 0.0519256591796875, 0.05579376220703125, 0.059661865234375, 0.06352996826171875, 0.0673980712890625, 0.07126617431640625, 0.07513427734375, 0.07900238037109375, 0.0828704833984375, 0.08673858642578125, 0.090606689453125, 0.09447479248046875, 0.0983428955078125, 0.10221099853515625, 0.1060791015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 6.0, 22.0, 24.0, 42.0, 102.0, 250.0, 810.0, 4070.0, 47007.0, 947486.0, 43478.0, 3954.0, 829.0, 264.0, 102.0, 45.0, 23.0, 11.0, 8.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0501708984375, -0.04827690124511719, -0.046382904052734375, -0.04448890686035156, -0.04259490966796875, -0.04070091247558594, -0.038806915283203125, -0.03691291809082031, -0.0350189208984375, -0.03312492370605469, -0.031230926513671875, -0.029336929321289062, -0.02744293212890625, -0.025548934936523438, -0.023654937744140625, -0.021760940551757812, -0.019866943359375, -0.017972946166992188, -0.016078948974609375, -0.014184951782226562, -0.01229095458984375, -0.010396957397460938, -0.008502960205078125, -0.0066089630126953125, -0.0047149658203125, -0.0028209686279296875, -0.000926971435546875, 0.0009670257568359375, 0.00286102294921875, 0.0047550201416015625, 0.006649017333984375, 0.008543014526367188, 0.01043701171875, 0.012331008911132812, 0.014225006103515625, 0.016119003295898438, 0.01801300048828125, 0.019906997680664062, 0.021800994873046875, 0.023694992065429688, 0.0255889892578125, 0.027482986450195312, 0.029376983642578125, 0.03127098083496094, 0.03316497802734375, 0.03505897521972656, 0.036952972412109375, 0.03884696960449219, 0.040740966796875, 0.04263496398925781, 0.044528961181640625, 0.04642295837402344, 0.04831695556640625, 0.05021095275878906, 0.052104949951171875, 0.05399894714355469, 0.0558929443359375, 0.05778694152832031, 0.059680938720703125, 0.06157493591308594, 0.06346893310546875, 0.06536293029785156, 0.06725692749023438, 0.06915092468261719, 0.071044921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 7.0, 20.0, 26.0, 25.0, 41.0, 55.0, 93.0, 92.0, 147.0, 128.0, 106.0, 78.0, 48.0, 29.0, 30.0, 21.0, 17.0, 6.0, 8.0, 6.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6803226470947266e-05, -5.496945232152939e-05, -5.313567817211151e-05, -5.1301904022693634e-05, -4.946812987327576e-05, -4.763435572385788e-05, -4.580058157444e-05, -4.3966807425022125e-05, -4.213303327560425e-05, -4.029925912618637e-05, -3.8465484976768494e-05, -3.6631710827350616e-05, -3.479793667793274e-05, -3.296416252851486e-05, -3.1130388379096985e-05, -2.9296614229679108e-05, -2.746284008026123e-05, -2.5629065930843353e-05, -2.3795291781425476e-05, -2.19615176320076e-05, -2.012774348258972e-05, -1.8293969333171844e-05, -1.6460195183753967e-05, -1.462642103433609e-05, -1.2792646884918213e-05, -1.0958872735500336e-05, -9.125098586082458e-06, -7.291324436664581e-06, -5.457550287246704e-06, -3.623776137828827e-06, -1.7900019884109497e-06, 4.377216100692749e-08, 1.8775463104248047e-06, 3.711320459842682e-06, 5.545094609260559e-06, 7.378868758678436e-06, 9.212642908096313e-06, 1.104641705751419e-05, 1.2880191206932068e-05, 1.4713965356349945e-05, 1.6547739505767822e-05, 1.83815136551857e-05, 2.0215287804603577e-05, 2.2049061954021454e-05, 2.388283610343933e-05, 2.5716610252857208e-05, 2.7550384402275085e-05, 2.9384158551692963e-05, 3.121793270111084e-05, 3.305170685052872e-05, 3.4885480999946594e-05, 3.671925514936447e-05, 3.855302929878235e-05, 4.0386803448200226e-05, 4.22205775976181e-05, 4.405435174703598e-05, 4.588812589645386e-05, 4.7721900045871735e-05, 4.955567419528961e-05, 5.138944834470749e-05, 5.3223222494125366e-05, 5.5056996643543243e-05, 5.689077079296112e-05, 5.8724544942379e-05, 6.0558319091796875e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 3.0, 0.0, 4.0, 6.0, 6.0, 10.0, 11.0, 20.0, 27.0, 44.0, 61.0, 92.0, 114.0, 191.0, 295.0, 498.0, 1092.0, 2437.0, 7127.0, 32042.0, 479452.0, 480584.0, 32005.0, 7333.0, 2543.0, 1075.0, 574.0, 334.0, 183.0, 134.0, 72.0, 59.0, 34.0, 19.0, 24.0, 17.0, 10.0, 3.0, 4.0, 8.0, 1.0, 2.0, 0.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034637451171875, -0.033555030822753906, -0.03247261047363281, -0.03139019012451172, -0.030307769775390625, -0.02922534942626953, -0.028142929077148438, -0.027060508728027344, -0.02597808837890625, -0.024895668029785156, -0.023813247680664062, -0.02273082733154297, -0.021648406982421875, -0.02056598663330078, -0.019483566284179688, -0.018401145935058594, -0.0173187255859375, -0.016236305236816406, -0.015153884887695312, -0.014071464538574219, -0.012989044189453125, -0.011906623840332031, -0.010824203491210938, -0.009741783142089844, -0.00865936279296875, -0.007576942443847656, -0.0064945220947265625, -0.005412101745605469, -0.004329681396484375, -0.0032472610473632812, -0.0021648406982421875, -0.0010824203491210938, 0.0, 0.0010824203491210938, 0.0021648406982421875, 0.0032472610473632812, 0.004329681396484375, 0.005412101745605469, 0.0064945220947265625, 0.007576942443847656, 0.00865936279296875, 0.009741783142089844, 0.010824203491210938, 0.011906623840332031, 0.012989044189453125, 0.014071464538574219, 0.015153884887695312, 0.016236305236816406, 0.0173187255859375, 0.018401145935058594, 0.019483566284179688, 0.02056598663330078, 0.021648406982421875, 0.02273082733154297, 0.023813247680664062, 0.024895668029785156, 0.02597808837890625, 0.027060508728027344, 0.028142929077148438, 0.02922534942626953, 0.030307769775390625, 0.03139019012451172, 0.03247261047363281, 0.033555030822753906, 0.034637451171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 8.0, 6.0, 14.0, 12.0, 28.0, 34.0, 41.0, 61.0, 81.0, 109.0, 155.0, 121.0, 77.0, 76.0, 51.0, 27.0, 17.0, 23.0, 12.0, 10.0, 2.0, 9.0, 11.0, 8.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03265380859375, -0.03165006637573242, -0.030646324157714844, -0.029642581939697266, -0.028638839721679688, -0.02763509750366211, -0.02663135528564453, -0.025627613067626953, -0.024623870849609375, -0.023620128631591797, -0.02261638641357422, -0.02161264419555664, -0.020608901977539062, -0.019605159759521484, -0.018601417541503906, -0.017597675323486328, -0.01659393310546875, -0.015590190887451172, -0.014586448669433594, -0.013582706451416016, -0.012578964233398438, -0.01157522201538086, -0.010571479797363281, -0.009567737579345703, -0.008563995361328125, -0.007560253143310547, -0.006556510925292969, -0.005552768707275391, -0.0045490264892578125, -0.0035452842712402344, -0.0025415420532226562, -0.0015377998352050781, -0.0005340576171875, 0.0004696846008300781, 0.0014734268188476562, 0.0024771690368652344, 0.0034809112548828125, 0.004484653472900391, 0.005488395690917969, 0.006492137908935547, 0.007495880126953125, 0.008499622344970703, 0.009503364562988281, 0.01050710678100586, 0.011510848999023438, 0.012514591217041016, 0.013518333435058594, 0.014522075653076172, 0.01552581787109375, 0.016529560089111328, 0.017533302307128906, 0.018537044525146484, 0.019540786743164062, 0.02054452896118164, 0.02154827117919922, 0.022552013397216797, 0.023555755615234375, 0.024559497833251953, 0.02556324005126953, 0.02656698226928711, 0.027570724487304688, 0.028574466705322266, 0.029578208923339844, 0.030581951141357422, 0.031585693359375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 17.0, 76.0, 567.0, 271.0, 47.0, 17.0, 8.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193838596343994, -1.25588858127594, -1.1923933029174805, -1.1288981437683105, -1.065402865409851, -1.0019075870513916, -0.9384123682975769, -0.8749171495437622, -0.8114218711853027, -0.7479265928268433, -0.6844313740730286, -0.6209361553192139, -0.5574408769607544, -0.4939456284046173, -0.4304503798484802, -0.36695513129234314, -0.30345988273620605, -0.23996463418006897, -0.17646938562393188, -0.1129741370677948, -0.049478888511657715, 0.01401636004447937, 0.07751160860061646, 0.14100685715675354, 0.20450210571289062, 0.2679973542690277, 0.3314926028251648, 0.3949878513813019, 0.45848309993743896, 0.5219783782958984, 0.5854735970497131, 0.6489688158035278, 0.7124638557434082, 0.7759591341018677, 0.8394543528556824, 0.9029495716094971, 0.9664448499679565, 1.029940128326416, 1.093435287475586, 1.1569305658340454, 1.2204258441925049, 1.2839211225509644, 1.3474164009094238, 1.4109115600585938, 1.4744068384170532, 1.5379021167755127, 1.6013972759246826, 1.664892554283142, 1.7283878326416016, 1.791883111000061, 1.8553783893585205, 1.9188735485076904, 1.98236882686615, 2.0458641052246094, 2.1093592643737793, 2.1728546619415283, 2.2363498210906982, 2.299844980239868, 2.363340377807617, 2.426835536956787, 2.490330696105957, 2.553826093673706, 2.617321252822876, 2.680816650390625, 2.744311809539795]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 2.0, 2.0, 7.0, 5.0, 8.0, 12.0, 15.0, 8.0, 18.0, 18.0, 19.0, 20.0, 29.0, 30.0, 29.0, 41.0, 40.0, 69.0, 132.0, 132.0, 61.0, 28.0, 36.0, 30.0, 24.0, 25.0, 18.0, 22.0, 25.0, 16.0, 11.0, 9.0, 12.0, 11.0, 10.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.48429399728775024, -0.4708324074745178, -0.457370787858963, -0.4439091980457306, -0.4304475784301758, -0.41698598861694336, -0.40352439880371094, -0.3900628089904785, -0.3766011893749237, -0.3631395995616913, -0.3496779799461365, -0.33621639013290405, -0.32275480031967163, -0.3092931807041168, -0.2958315908908844, -0.2823699712753296, -0.26890838146209717, -0.25544679164886475, -0.24198517203330994, -0.22852358222007751, -0.2150619775056839, -0.20160037279129028, -0.18813878297805786, -0.17467717826366425, -0.16121557354927063, -0.14775396883487701, -0.1342923641204834, -0.12083077430725098, -0.10736916959285736, -0.09390756487846375, -0.08044596761465073, -0.06698437035083771, -0.05352276563644409, -0.040061164647340775, -0.026599563658237457, -0.01313796266913414, 0.00032363831996917725, 0.013785243034362793, 0.027246840298175812, 0.04070843756198883, 0.054170042276382446, 0.06763164699077606, 0.08109324425458908, 0.0945548415184021, 0.10801644623279572, 0.12147805094718933, 0.13493964076042175, 0.14840124547481537, 0.16186285018920898, 0.1753244549036026, 0.18878605961799622, 0.20224764943122864, 0.21570925414562225, 0.22917085886001587, 0.2426324486732483, 0.2560940384864807, 0.2695556581020355, 0.28301724791526794, 0.29647886753082275, 0.3099404573440552, 0.3234020471572876, 0.3368636667728424, 0.35032525658607483, 0.36378687620162964, 0.37724846601486206]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 10.0, 8.0, 12.0, 14.0, 18.0, 24.0, 22.0, 42.0, 55.0, 73.0, 111.0, 134.0, 220.0, 319.0, 437.0, 709.0, 1031.0, 1725.0, 2976.0, 5783.0, 12320.0, 34171.0, 146050.0, 914523.0, 2302571.0, 619008.0, 102839.0, 26839.0, 10447.0, 4915.0, 2528.0, 1486.0, 960.0, 572.0, 395.0, 268.0, 218.0, 121.0, 97.0, 65.0, 54.0, 40.0, 22.0, 16.0, 16.0, 10.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04571533203125, -0.04430389404296875, -0.0428924560546875, -0.04148101806640625, -0.040069580078125, -0.03865814208984375, -0.0372467041015625, -0.03583526611328125, -0.034423828125, -0.03301239013671875, -0.0316009521484375, -0.03018951416015625, -0.028778076171875, -0.02736663818359375, -0.0259552001953125, -0.02454376220703125, -0.02313232421875, -0.02172088623046875, -0.0203094482421875, -0.01889801025390625, -0.017486572265625, -0.01607513427734375, -0.0146636962890625, -0.01325225830078125, -0.0118408203125, -0.01042938232421875, -0.0090179443359375, -0.00760650634765625, -0.006195068359375, -0.00478363037109375, -0.0033721923828125, -0.00196075439453125, -0.00054931640625, 0.00086212158203125, 0.0022735595703125, 0.00368499755859375, 0.005096435546875, 0.00650787353515625, 0.0079193115234375, 0.00933074951171875, 0.0107421875, 0.01215362548828125, 0.0135650634765625, 0.01497650146484375, 0.016387939453125, 0.01779937744140625, 0.0192108154296875, 0.02062225341796875, 0.02203369140625, 0.02344512939453125, 0.0248565673828125, 0.02626800537109375, 0.027679443359375, 0.02909088134765625, 0.0305023193359375, 0.03191375732421875, 0.0333251953125, 0.03473663330078125, 0.0361480712890625, 0.03755950927734375, 0.038970947265625, 0.04038238525390625, 0.0417938232421875, 0.04320526123046875, 0.04461669921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 2.0, 9.0, 8.0, 9.0, 8.0, 19.0, 17.0, 17.0, 23.0, 28.0, 29.0, 31.0, 26.0, 28.0, 41.0, 36.0, 43.0, 47.0, 54.0, 36.0, 53.0, 50.0, 45.0, 37.0, 35.0, 36.0, 28.0, 34.0, 31.0, 22.0, 15.0, 12.0, 13.0, 13.0, 11.0, 14.0, 10.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0208740234375, -0.0202028751373291, -0.019531726837158203, -0.018860578536987305, -0.018189430236816406, -0.017518281936645508, -0.01684713363647461, -0.01617598533630371, -0.015504837036132812, -0.014833688735961914, -0.014162540435791016, -0.013491392135620117, -0.012820243835449219, -0.01214909553527832, -0.011477947235107422, -0.010806798934936523, -0.010135650634765625, -0.009464502334594727, -0.008793354034423828, -0.00812220573425293, -0.007451057434082031, -0.006779909133911133, -0.006108760833740234, -0.005437612533569336, -0.0047664642333984375, -0.004095315933227539, -0.0034241676330566406, -0.002753019332885742, -0.0020818710327148438, -0.0014107227325439453, -0.0007395744323730469, -6.842613220214844e-05, 0.00060272216796875, 0.0012738704681396484, 0.0019450187683105469, 0.0026161670684814453, 0.0032873153686523438, 0.003958463668823242, 0.004629611968994141, 0.005300760269165039, 0.0059719085693359375, 0.006643056869506836, 0.007314205169677734, 0.007985353469848633, 0.008656501770019531, 0.00932765007019043, 0.009998798370361328, 0.010669946670532227, 0.011341094970703125, 0.012012243270874023, 0.012683391571044922, 0.01335453987121582, 0.014025688171386719, 0.014696836471557617, 0.015367984771728516, 0.016039133071899414, 0.016710281372070312, 0.01738142967224121, 0.01805257797241211, 0.018723726272583008, 0.019394874572753906, 0.020066022872924805, 0.020737171173095703, 0.0214083194732666, 0.0220794677734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 11.0, 27.0, 43.0, 75.0, 123.0, 303.0, 709.0, 2084.0, 22637.0, 4139692.0, 25199.0, 2100.0, 684.0, 271.0, 132.0, 74.0, 42.0, 22.0, 16.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3798828125, -0.3681983947753906, -0.35651397705078125, -0.3448295593261719, -0.3331451416015625, -0.3214607238769531, -0.30977630615234375, -0.2980918884277344, -0.286407470703125, -0.2747230529785156, -0.26303863525390625, -0.2513542175292969, -0.2396697998046875, -0.22798538208007812, -0.21630096435546875, -0.20461654663085938, -0.19293212890625, -0.18124771118164062, -0.16956329345703125, -0.15787887573242188, -0.1461944580078125, -0.13451004028320312, -0.12282562255859375, -0.11114120483398438, -0.099456787109375, -0.08777236938476562, -0.07608795166015625, -0.06440353393554688, -0.0527191162109375, -0.041034698486328125, -0.02935028076171875, -0.017665863037109375, -0.0059814453125, 0.005702972412109375, 0.01738739013671875, 0.029071807861328125, 0.0407562255859375, 0.052440643310546875, 0.06412506103515625, 0.07580947875976562, 0.087493896484375, 0.09917831420898438, 0.11086273193359375, 0.12254714965820312, 0.1342315673828125, 0.14591598510742188, 0.15760040283203125, 0.16928482055664062, 0.18096923828125, 0.19265365600585938, 0.20433807373046875, 0.21602249145507812, 0.2277069091796875, 0.23939132690429688, 0.25107574462890625, 0.2627601623535156, 0.274444580078125, 0.2861289978027344, 0.29781341552734375, 0.3094978332519531, 0.3211822509765625, 0.3328666687011719, 0.34455108642578125, 0.3562355041503906, 0.367919921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 12.0, 21.0, 45.0, 70.0, 159.0, 449.0, 1259.0, 1291.0, 437.0, 181.0, 75.0, 35.0, 14.0, 10.0, 9.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2127685546875, -0.20542335510253906, -0.19807815551757812, -0.1907329559326172, -0.18338775634765625, -0.1760425567626953, -0.16869735717773438, -0.16135215759277344, -0.1540069580078125, -0.14666175842285156, -0.13931655883789062, -0.1319713592529297, -0.12462615966796875, -0.11728096008300781, -0.10993576049804688, -0.10259056091308594, -0.095245361328125, -0.08790016174316406, -0.08055496215820312, -0.07320976257324219, -0.06586456298828125, -0.05851936340332031, -0.051174163818359375, -0.04382896423339844, -0.0364837646484375, -0.029138565063476562, -0.021793365478515625, -0.014448165893554688, -0.00710296630859375, 0.0002422332763671875, 0.007587432861328125, 0.014932632446289062, 0.02227783203125, 0.029623031616210938, 0.036968231201171875, 0.04431343078613281, 0.05165863037109375, 0.05900382995605469, 0.06634902954101562, 0.07369422912597656, 0.0810394287109375, 0.08838462829589844, 0.09572982788085938, 0.10307502746582031, 0.11042022705078125, 0.11776542663574219, 0.12511062622070312, 0.13245582580566406, 0.139801025390625, 0.14714622497558594, 0.15449142456054688, 0.1618366241455078, 0.16918182373046875, 0.1765270233154297, 0.18387222290039062, 0.19121742248535156, 0.1985626220703125, 0.20590782165527344, 0.21325302124023438, 0.2205982208251953, 0.22794342041015625, 0.2352886199951172, 0.24263381958007812, 0.24997901916503906, 0.25732421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 9.0, 10.0, 11.0, 28.0, 58.0, 94.0, 186.0, 231.0, 147.0, 90.0, 50.0, 23.0, 23.0, 16.0, 3.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.906980037689209, -1.858508825302124, -1.8100374937057495, -1.761566162109375, -1.71309494972229, -1.664623737335205, -1.6161524057388306, -1.567681074142456, -1.519209861755371, -1.4707386493682861, -1.4222673177719116, -1.373795986175537, -1.3253247737884521, -1.2768535614013672, -1.2283822298049927, -1.1799108982086182, -1.1314396858215332, -1.0829684734344482, -1.0344971418380737, -0.986025869846344, -0.9375545978546143, -0.8890833258628845, -0.8406120538711548, -0.792140781879425, -0.7436695098876953, -0.6951982378959656, -0.6467269659042358, -0.5982556939125061, -0.5497844219207764, -0.5013131499290466, -0.4528418779373169, -0.40437060594558716, -0.3558993339538574, -0.3074280619621277, -0.25895678997039795, -0.2104855179786682, -0.16201424598693848, -0.11354297399520874, -0.065071702003479, -0.016600430011749268, 0.03187084197998047, 0.0803421139717102, 0.12881338596343994, 0.17728465795516968, 0.22575592994689941, 0.27422720193862915, 0.3226984739303589, 0.3711697459220886, 0.41964101791381836, 0.4681122899055481, 0.5165835618972778, 0.5650548338890076, 0.6135261058807373, 0.661997377872467, 0.7104686498641968, 0.7589399218559265, 0.8074111938476562, 0.855882465839386, 0.9043537378311157, 0.9528250098228455, 1.0012962818145752, 1.0497674942016602, 1.0982388257980347, 1.1467101573944092, 1.1951813697814941]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 16.0, 10.0, 9.0, 16.0, 16.0, 21.0, 31.0, 42.0, 44.0, 46.0, 71.0, 82.0, 84.0, 73.0, 70.0, 48.0, 43.0, 34.0, 39.0, 39.0, 43.0, 35.0, 11.0, 22.0, 12.0, 16.0, 7.0, 1.0, 7.0, 0.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7830135822296143, -0.7581965327262878, -0.7333794832229614, -0.708562433719635, -0.6837453842163086, -0.658928394317627, -0.6341113448143005, -0.6092942953109741, -0.5844772458076477, -0.5596601963043213, -0.5348431468009949, -0.5100260972976685, -0.48520907759666443, -0.460392028093338, -0.435575008392334, -0.41075795888900757, -0.38594090938568115, -0.36112385988235474, -0.3363068103790283, -0.3114897906780243, -0.2866727411746979, -0.26185569167137146, -0.23703865706920624, -0.21222162246704102, -0.1874045729637146, -0.16258752346038818, -0.13777048885822296, -0.11295344680547714, -0.08813640475273132, -0.0633193626999855, -0.038502320647239685, -0.013685286045074463, 0.011131763458251953, 0.03594880551099777, 0.06076584756374359, 0.08558288961648941, 0.11039993166923523, 0.13521698117256165, 0.16003401577472687, 0.1848510503768921, 0.2096680998802185, 0.23448514938354492, 0.25930219888687134, 0.28411921858787537, 0.3089362680912018, 0.3337533175945282, 0.3585703372955322, 0.38338738679885864, 0.40820443630218506, 0.4330214858055115, 0.4578385353088379, 0.4826555550098419, 0.5074726343154907, 0.5322896242141724, 0.5571066737174988, 0.5819237232208252, 0.6067407727241516, 0.631557822227478, 0.6563748717308044, 0.6811919212341309, 0.7060089111328125, 0.7308259606361389, 0.7556430101394653, 0.7804600596427917, 0.8052771091461182]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 11.0, 14.0, 23.0, 26.0, 45.0, 65.0, 109.0, 146.0, 207.0, 384.0, 584.0, 1050.0, 1622.0, 3131.0, 6303.0, 13667.0, 34567.0, 110591.0, 599656.0, 190814.0, 49594.0, 18355.0, 8398.0, 3907.0, 2174.0, 1188.0, 708.0, 398.0, 300.0, 175.0, 119.0, 59.0, 43.0, 29.0, 24.0, 17.0, 17.0, 9.0, 6.0, 1.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04937744140625, -0.04791116714477539, -0.04644489288330078, -0.04497861862182617, -0.04351234436035156, -0.04204607009887695, -0.040579795837402344, -0.039113521575927734, -0.037647247314453125, -0.036180973052978516, -0.034714698791503906, -0.0332484245300293, -0.03178215026855469, -0.030315876007080078, -0.02884960174560547, -0.02738332748413086, -0.02591705322265625, -0.02445077896118164, -0.02298450469970703, -0.021518230438232422, -0.020051956176757812, -0.018585681915283203, -0.017119407653808594, -0.015653133392333984, -0.014186859130859375, -0.012720584869384766, -0.011254310607910156, -0.009788036346435547, -0.008321762084960938, -0.006855487823486328, -0.005389213562011719, -0.003922939300537109, -0.0024566650390625, -0.0009903907775878906, 0.00047588348388671875, 0.0019421577453613281, 0.0034084320068359375, 0.004874706268310547, 0.006340980529785156, 0.007807254791259766, 0.009273529052734375, 0.010739803314208984, 0.012206077575683594, 0.013672351837158203, 0.015138626098632812, 0.016604900360107422, 0.01807117462158203, 0.01953744888305664, 0.02100372314453125, 0.02246999740600586, 0.02393627166748047, 0.025402545928955078, 0.026868820190429688, 0.028335094451904297, 0.029801368713378906, 0.031267642974853516, 0.032733917236328125, 0.034200191497802734, 0.035666465759277344, 0.03713274002075195, 0.03859901428222656, 0.04006528854370117, 0.04153156280517578, 0.04299783706665039, 0.044464111328125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 7.0, 8.0, 14.0, 16.0, 13.0, 17.0, 21.0, 19.0, 24.0, 35.0, 48.0, 53.0, 50.0, 74.0, 69.0, 64.0, 74.0, 58.0, 52.0, 36.0, 38.0, 45.0, 27.0, 31.0, 25.0, 16.0, 10.0, 10.0, 6.0, 5.0, 5.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039276123046875, -0.03801727294921875, -0.0367584228515625, -0.03549957275390625, -0.03424072265625, -0.03298187255859375, -0.0317230224609375, -0.03046417236328125, -0.029205322265625, -0.02794647216796875, -0.0266876220703125, -0.02542877197265625, -0.024169921875, -0.02291107177734375, -0.0216522216796875, -0.02039337158203125, -0.019134521484375, -0.01787567138671875, -0.0166168212890625, -0.01535797119140625, -0.01409912109375, -0.01284027099609375, -0.0115814208984375, -0.01032257080078125, -0.009063720703125, -0.00780487060546875, -0.0065460205078125, -0.00528717041015625, -0.0040283203125, -0.00276947021484375, -0.0015106201171875, -0.00025177001953125, 0.001007080078125, 0.00226593017578125, 0.0035247802734375, 0.00478363037109375, 0.00604248046875, 0.00730133056640625, 0.0085601806640625, 0.00981903076171875, 0.011077880859375, 0.01233673095703125, 0.0135955810546875, 0.01485443115234375, 0.01611328125, 0.01737213134765625, 0.0186309814453125, 0.01988983154296875, 0.021148681640625, 0.02240753173828125, 0.0236663818359375, 0.02492523193359375, 0.02618408203125, 0.02744293212890625, 0.0287017822265625, 0.02996063232421875, 0.031219482421875, 0.03247833251953125, 0.0337371826171875, 0.03499603271484375, 0.0362548828125, 0.03751373291015625, 0.0387725830078125, 0.04003143310546875, 0.041290283203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 5.0, 13.0, 17.0, 18.0, 28.0, 51.0, 66.0, 100.0, 126.0, 206.0, 324.0, 679.0, 1731.0, 6224.0, 42306.0, 926645.0, 58738.0, 7588.0, 1948.0, 721.0, 394.0, 191.0, 117.0, 83.0, 61.0, 36.0, 28.0, 17.0, 22.0, 15.0, 7.0, 7.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0982666015625, -0.09542369842529297, -0.09258079528808594, -0.0897378921508789, -0.08689498901367188, -0.08405208587646484, -0.08120918273925781, -0.07836627960205078, -0.07552337646484375, -0.07268047332763672, -0.06983757019042969, -0.06699466705322266, -0.06415176391601562, -0.061308860778808594, -0.05846595764160156, -0.05562305450439453, -0.0527801513671875, -0.04993724822998047, -0.04709434509277344, -0.044251441955566406, -0.041408538818359375, -0.038565635681152344, -0.03572273254394531, -0.03287982940673828, -0.03003692626953125, -0.02719402313232422, -0.024351119995117188, -0.021508216857910156, -0.018665313720703125, -0.015822410583496094, -0.012979507446289062, -0.010136604309082031, -0.007293701171875, -0.004450798034667969, -0.0016078948974609375, 0.0012350082397460938, 0.004077911376953125, 0.006920814514160156, 0.009763717651367188, 0.012606620788574219, 0.01544952392578125, 0.01829242706298828, 0.021135330200195312, 0.023978233337402344, 0.026821136474609375, 0.029664039611816406, 0.03250694274902344, 0.03534984588623047, 0.0381927490234375, 0.04103565216064453, 0.04387855529785156, 0.046721458435058594, 0.049564361572265625, 0.052407264709472656, 0.05525016784667969, 0.05809307098388672, 0.06093597412109375, 0.06377887725830078, 0.06662178039550781, 0.06946468353271484, 0.07230758666992188, 0.0751504898071289, 0.07799339294433594, 0.08083629608154297, 0.08367919921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 8.0, 4.0, 2.0, 7.0, 13.0, 8.0, 11.0, 10.0, 7.0, 9.0, 15.0, 15.0, 21.0, 29.0, 25.0, 29.0, 18.0, 41.0, 48.0, 66.0, 57.0, 63.0, 66.0, 48.0, 69.0, 49.0, 34.0, 35.0, 33.0, 23.0, 25.0, 20.0, 10.0, 11.0, 12.0, 14.0, 11.0, 8.0, 10.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10498046875, -0.10138893127441406, -0.09779739379882812, -0.09420585632324219, -0.09061431884765625, -0.08702278137207031, -0.08343124389648438, -0.07983970642089844, -0.0762481689453125, -0.07265663146972656, -0.06906509399414062, -0.06547355651855469, -0.06188201904296875, -0.05829048156738281, -0.054698944091796875, -0.05110740661621094, -0.047515869140625, -0.04392433166503906, -0.040332794189453125, -0.03674125671386719, -0.03314971923828125, -0.029558181762695312, -0.025966644287109375, -0.022375106811523438, -0.0187835693359375, -0.015192031860351562, -0.011600494384765625, -0.008008956909179688, -0.00441741943359375, -0.0008258819580078125, 0.002765655517578125, 0.0063571929931640625, 0.00994873046875, 0.013540267944335938, 0.017131805419921875, 0.020723342895507812, 0.02431488037109375, 0.027906417846679688, 0.031497955322265625, 0.03508949279785156, 0.0386810302734375, 0.04227256774902344, 0.045864105224609375, 0.04945564270019531, 0.05304718017578125, 0.05663871765136719, 0.060230255126953125, 0.06382179260253906, 0.067413330078125, 0.07100486755371094, 0.07459640502929688, 0.07818794250488281, 0.08177947998046875, 0.08537101745605469, 0.08896255493164062, 0.09255409240722656, 0.0961456298828125, 0.09973716735839844, 0.10332870483398438, 0.10692024230957031, 0.11051177978515625, 0.11410331726074219, 0.11769485473632812, 0.12128639221191406, 0.1248779296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 11.0, 10.0, 16.0, 12.0, 18.0, 24.0, 19.0, 31.0, 35.0, 69.0, 75.0, 149.0, 233.0, 373.0, 850.0, 1991.0, 5816.0, 21517.0, 234638.0, 747798.0, 24342.0, 6239.0, 2169.0, 916.0, 499.0, 228.0, 148.0, 82.0, 48.0, 41.0, 22.0, 24.0, 16.0, 25.0, 14.0, 10.0, 10.0, 9.0, 5.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0124969482421875, -0.01206660270690918, -0.01163625717163086, -0.011205911636352539, -0.010775566101074219, -0.010345220565795898, -0.009914875030517578, -0.009484529495239258, -0.009054183959960938, -0.008623838424682617, -0.008193492889404297, -0.0077631473541259766, -0.007332801818847656, -0.006902456283569336, -0.006472110748291016, -0.006041765213012695, -0.005611419677734375, -0.005181074142456055, -0.004750728607177734, -0.004320383071899414, -0.0038900375366210938, -0.0034596920013427734, -0.003029346466064453, -0.002599000930786133, -0.0021686553955078125, -0.0017383098602294922, -0.0013079643249511719, -0.0008776187896728516, -0.00044727325439453125, -1.6927719116210938e-05, 0.0004134178161621094, 0.0008437633514404297, 0.00127410888671875, 0.0017044544219970703, 0.0021347999572753906, 0.002565145492553711, 0.0029954910278320312, 0.0034258365631103516, 0.003856182098388672, 0.004286527633666992, 0.0047168731689453125, 0.005147218704223633, 0.005577564239501953, 0.0060079097747802734, 0.006438255310058594, 0.006868600845336914, 0.007298946380615234, 0.007729291915893555, 0.008159637451171875, 0.008589982986450195, 0.009020328521728516, 0.009450674057006836, 0.009881019592285156, 0.010311365127563477, 0.010741710662841797, 0.011172056198120117, 0.011602401733398438, 0.012032747268676758, 0.012463092803955078, 0.012893438339233398, 0.013323783874511719, 0.013754129409790039, 0.01418447494506836, 0.01461482048034668, 0.015045166015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 7.0, 5.0, 3.0, 5.0, 4.0, 0.0, 0.0, 7.0, 3.0, 6.0, 3.0, 7.0, 5.0, 11.0, 9.0, 8.0, 14.0, 7.0, 25.0, 17.0, 17.0, 24.0, 22.0, 35.0, 62.0, 52.0, 72.0, 67.0, 63.0, 72.0, 64.0, 51.0, 37.0, 28.0, 22.0, 16.0, 19.0, 15.0, 14.0, 11.0, 9.0, 12.0, 11.0, 7.0, 4.0, 10.0, 5.0, 4.0, 8.0, 3.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-3.1828880310058594e-05, -3.0780211091041565e-05, -2.9731541872024536e-05, -2.8682872653007507e-05, -2.763420343399048e-05, -2.658553421497345e-05, -2.553686499595642e-05, -2.4488195776939392e-05, -2.3439526557922363e-05, -2.2390857338905334e-05, -2.1342188119888306e-05, -2.0293518900871277e-05, -1.9244849681854248e-05, -1.819618046283722e-05, -1.714751124382019e-05, -1.609884202480316e-05, -1.5050172805786133e-05, -1.4001503586769104e-05, -1.2952834367752075e-05, -1.1904165148735046e-05, -1.0855495929718018e-05, -9.806826710700989e-06, -8.75815749168396e-06, -7.709488272666931e-06, -6.660819053649902e-06, -5.6121498346328735e-06, -4.563480615615845e-06, -3.514811396598816e-06, -2.466142177581787e-06, -1.4174729585647583e-06, -3.688037395477295e-07, 6.798654794692993e-07, 1.7285346984863281e-06, 2.777203917503357e-06, 3.825873136520386e-06, 4.8745423555374146e-06, 5.923211574554443e-06, 6.971880793571472e-06, 8.020550012588501e-06, 9.06921923160553e-06, 1.0117888450622559e-05, 1.1166557669639587e-05, 1.2215226888656616e-05, 1.3263896107673645e-05, 1.4312565326690674e-05, 1.5361234545707703e-05, 1.640990376472473e-05, 1.745857298374176e-05, 1.850724220275879e-05, 1.9555911421775818e-05, 2.0604580640792847e-05, 2.1653249859809875e-05, 2.2701919078826904e-05, 2.3750588297843933e-05, 2.4799257516860962e-05, 2.584792673587799e-05, 2.689659595489502e-05, 2.794526517391205e-05, 2.8993934392929077e-05, 3.0042603611946106e-05, 3.1091272830963135e-05, 3.2139942049980164e-05, 3.318861126899719e-05, 3.423728048801422e-05, 3.528594970703125e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 6.0, 15.0, 28.0, 42.0, 76.0, 121.0, 258.0, 512.0, 1013.0, 2219.0, 5824.0, 18446.0, 123960.0, 844511.0, 35796.0, 9439.0, 3340.0, 1477.0, 660.0, 347.0, 206.0, 94.0, 49.0, 48.0, 17.0, 10.0, 10.0, 10.0, 10.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0118408203125, -0.011371374130249023, -0.010901927947998047, -0.01043248176574707, -0.009963035583496094, -0.009493589401245117, -0.00902414321899414, -0.008554697036743164, -0.008085250854492188, -0.007615804672241211, -0.007146358489990234, -0.006676912307739258, -0.006207466125488281, -0.005738019943237305, -0.005268573760986328, -0.0047991275787353516, -0.004329681396484375, -0.0038602352142333984, -0.003390789031982422, -0.0029213428497314453, -0.0024518966674804688, -0.001982450485229492, -0.0015130043029785156, -0.001043558120727539, -0.0005741119384765625, -0.00010466575622558594, 0.0003647804260253906, 0.0008342266082763672, 0.0013036727905273438, 0.0017731189727783203, 0.002242565155029297, 0.0027120113372802734, 0.00318145751953125, 0.0036509037017822266, 0.004120349884033203, 0.00458979606628418, 0.005059242248535156, 0.005528688430786133, 0.005998134613037109, 0.006467580795288086, 0.0069370269775390625, 0.007406473159790039, 0.007875919342041016, 0.008345365524291992, 0.008814811706542969, 0.009284257888793945, 0.009753704071044922, 0.010223150253295898, 0.010692596435546875, 0.011162042617797852, 0.011631488800048828, 0.012100934982299805, 0.012570381164550781, 0.013039827346801758, 0.013509273529052734, 0.013978719711303711, 0.014448165893554688, 0.014917612075805664, 0.01538705825805664, 0.015856504440307617, 0.016325950622558594, 0.01679539680480957, 0.017264842987060547, 0.017734289169311523, 0.0182037353515625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 4.0, 1.0, 4.0, 13.0, 15.0, 12.0, 22.0, 15.0, 40.0, 56.0, 75.0, 118.0, 174.0, 158.0, 71.0, 58.0, 40.0, 19.0, 19.0, 13.0, 12.0, 9.0, 8.0, 8.0, 8.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01062774658203125, -0.010226130485534668, -0.009824514389038086, -0.009422898292541504, -0.009021282196044922, -0.00861966609954834, -0.008218050003051758, -0.007816433906555176, -0.007414817810058594, -0.007013201713562012, -0.00661158561706543, -0.006209969520568848, -0.005808353424072266, -0.005406737327575684, -0.0050051212310791016, -0.0046035051345825195, -0.0042018890380859375, -0.0038002729415893555, -0.0033986568450927734, -0.0029970407485961914, -0.0025954246520996094, -0.0021938085556030273, -0.0017921924591064453, -0.0013905763626098633, -0.0009889602661132812, -0.0005873441696166992, -0.0001857280731201172, 0.00021588802337646484, 0.0006175041198730469, 0.001019120216369629, 0.001420736312866211, 0.001822352409362793, 0.002223968505859375, 0.002625584602355957, 0.003027200698852539, 0.003428816795349121, 0.003830432891845703, 0.004232048988342285, 0.004633665084838867, 0.005035281181335449, 0.005436897277832031, 0.005838513374328613, 0.006240129470825195, 0.006641745567321777, 0.007043361663818359, 0.007444977760314941, 0.007846593856811523, 0.008248209953308105, 0.008649826049804688, 0.00905144214630127, 0.009453058242797852, 0.009854674339294434, 0.010256290435791016, 0.010657906532287598, 0.01105952262878418, 0.011461138725280762, 0.011862754821777344, 0.012264370918273926, 0.012665987014770508, 0.01306760311126709, 0.013469219207763672, 0.013870835304260254, 0.014272451400756836, 0.014674067497253418, 0.01507568359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 11.0, 23.0, 37.0, 62.0, 98.0, 530.0, 105.0, 59.0, 21.0, 28.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5285054445266724, -0.5099209547042847, -0.4913364350795746, -0.4727519154548645, -0.4541674256324768, -0.4355829060077667, -0.41699838638305664, -0.39841389656066895, -0.37982940673828125, -0.36124488711357117, -0.34266039729118347, -0.3240758776664734, -0.3054913878440857, -0.2869068682193756, -0.2683223485946655, -0.24973785877227783, -0.23115333914756775, -0.21256883442401886, -0.19398432970046997, -0.1753998100757599, -0.1568153202533722, -0.1382308006286621, -0.11964629590511322, -0.10106179118156433, -0.08247728645801544, -0.06389278173446655, -0.045308273285627365, -0.026723764836788177, -0.008139260113239288, 0.0104452446103096, 0.029029756784439087, 0.047614261507987976, 0.06619876623153687, 0.08478327095508575, 0.10336777567863464, 0.12195228785276413, 0.14053678512573242, 0.1591213047504425, 0.1777058094739914, 0.19629031419754028, 0.21487481892108917, 0.23345932364463806, 0.25204384326934814, 0.27062833309173584, 0.2892128527164459, 0.3077973425388336, 0.3263818621635437, 0.3449663519859314, 0.3635508716106415, 0.38213539123535156, 0.40071988105773926, 0.41930440068244934, 0.43788889050483704, 0.4564734101295471, 0.4750578999519348, 0.4936424195766449, 0.512226939201355, 0.5308114290237427, 0.5493959784507751, 0.5679804682731628, 0.5865649580955505, 0.6051494479179382, 0.6237339973449707, 0.6423184871673584, 0.6609029769897461]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 0.0, 3.0, 2.0, 6.0, 10.0, 2.0, 5.0, 6.0, 6.0, 8.0, 8.0, 9.0, 10.0, 14.0, 12.0, 21.0, 27.0, 19.0, 33.0, 26.0, 47.0, 247.0, 186.0, 49.0, 31.0, 33.0, 16.0, 17.0, 20.0, 19.0, 18.0, 16.0, 12.0, 8.0, 5.0, 11.0, 14.0, 10.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3634147047996521, -0.35235968232154846, -0.3413046598434448, -0.3302496075630188, -0.31919458508491516, -0.3081395626068115, -0.2970845401287079, -0.28602951765060425, -0.2749744653701782, -0.2639194428920746, -0.25286442041397095, -0.24180938303470612, -0.23075434565544128, -0.21969932317733765, -0.208644300699234, -0.19758926331996918, -0.18653424084186554, -0.1754792183637619, -0.16442418098449707, -0.15336915850639343, -0.1423141211271286, -0.13125909864902496, -0.12020406872034073, -0.1091490387916565, -0.09809400886297226, -0.08703897893428802, -0.07598394900560379, -0.06492891907691956, -0.05387389287352562, -0.042818862944841385, -0.03176383674144745, -0.020708806812763214, -0.00965377688407898, 0.0014012521132826805, 0.01245628111064434, 0.023511309176683426, 0.03456633910536766, 0.045621369034051895, 0.05667639523744583, 0.06773142516613007, 0.0787864550948143, 0.08984148502349854, 0.10089651495218277, 0.111951544880867, 0.12300656735897064, 0.13406160473823547, 0.1451166272163391, 0.15617164969444275, 0.16722668707370758, 0.17828170955181122, 0.18933674693107605, 0.2003917694091797, 0.21144680678844452, 0.22250182926654816, 0.233556866645813, 0.24461188912391663, 0.25566691160202026, 0.2667219340801239, 0.27777695655822754, 0.28883200883865356, 0.2998870313167572, 0.31094205379486084, 0.3219970762729645, 0.3330520987510681, 0.34410715103149414]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 3.0, 6.0, 9.0, 14.0, 12.0, 15.0, 19.0, 30.0, 31.0, 30.0, 36.0, 52.0, 278.0, 179.0, 50.0, 50.0, 44.0, 30.0, 27.0, 19.0, 16.0, 11.0, 8.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05078125, -0.04928159713745117, -0.047781944274902344, -0.046282291412353516, -0.04478263854980469, -0.04328298568725586, -0.04178333282470703, -0.0402836799621582, -0.038784027099609375, -0.03728437423706055, -0.03578472137451172, -0.03428506851196289, -0.03278541564941406, -0.031285762786865234, -0.029786109924316406, -0.028286457061767578, -0.02678680419921875, -0.025287151336669922, -0.023787498474121094, -0.022287845611572266, -0.020788192749023438, -0.01928853988647461, -0.01778888702392578, -0.016289234161376953, -0.014789581298828125, -0.013289928436279297, -0.011790275573730469, -0.01029062271118164, -0.008790969848632812, -0.007291316986083984, -0.005791664123535156, -0.004292011260986328, -0.0027923583984375, -0.0012927055358886719, 0.00020694732666015625, 0.0017066001892089844, 0.0032062530517578125, 0.004705905914306641, 0.006205558776855469, 0.007705211639404297, 0.009204864501953125, 0.010704517364501953, 0.012204170227050781, 0.01370382308959961, 0.015203475952148438, 0.016703128814697266, 0.018202781677246094, 0.019702434539794922, 0.02120208740234375, 0.022701740264892578, 0.024201393127441406, 0.025701045989990234, 0.027200698852539062, 0.02870035171508789, 0.03020000457763672, 0.03169965744018555, 0.033199310302734375, 0.0346989631652832, 0.03619861602783203, 0.03769826889038086, 0.03919792175292969, 0.040697574615478516, 0.042197227478027344, 0.04369688034057617, 0.045196533203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 12.0, 12.0, 17.0, 36.0, 51.0, 108.0, 222.0, 566.0, 2161.0, 17307.0, 8355371.0, 10165.0, 1615.0, 448.0, 230.0, 100.0, 58.0, 42.0, 16.0, 10.0, 5.0, 8.0, 10.0, 2.0, 5.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35434266924858093, -0.33778855204582214, -0.32123440504074097, -0.3046802878379822, -0.2881261706352234, -0.2715720534324646, -0.2550179064273834, -0.23846378922462463, -0.22190965712070465, -0.20535552501678467, -0.18880140781402588, -0.1722472757101059, -0.1556931436061859, -0.13913902640342712, -0.12258489429950714, -0.10603076964616776, -0.08947664499282837, -0.07292252033948898, -0.0563683919608593, -0.039814263582229614, -0.02326013892889023, -0.006706014275550842, 0.00984811782836914, 0.026402242481708527, 0.04295636713504791, 0.0595104917883873, 0.07606461644172668, 0.09261874854564667, 0.10917287319898605, 0.12572699785232544, 0.14228112995624542, 0.1588352620601654, 0.1753893494606018, 0.1919434815645218, 0.20849759876728058, 0.22505173087120056, 0.24160584807395935, 0.2581599950790405, 0.2747141122817993, 0.2912682294845581, 0.3078223466873169, 0.3243764638900757, 0.34093061089515686, 0.35748472809791565, 0.37403884530067444, 0.3905929923057556, 0.4071471095085144, 0.4237012267112732, 0.44025537371635437, 0.45680949091911316, 0.47336363792419434, 0.4899177551269531, 0.5064718723297119, 0.5230259895324707, 0.5395801067352295, 0.5561342835426331, 0.5726884007453918, 0.5892425179481506, 0.6057966351509094, 0.622350811958313, 0.6389049291610718, 0.6554590463638306, 0.6720131635665894, 0.6885672807693481, 0.7051213979721069]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 5.0, 4.0, 4.0, 0.0, 4.0, 7.0, 2.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 5.0, 2.0, 5.0, 4.0, 5.0, 3.0, 2.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5080909729003906, -0.4912363290786743, -0.474381685256958, -0.4575270414352417, -0.4406723976135254, -0.4238177537918091, -0.4069631099700928, -0.39010846614837646, -0.37325382232666016, -0.35639917850494385, -0.33954453468322754, -0.32268989086151123, -0.3058352470397949, -0.2889806032180786, -0.2721259593963623, -0.255271315574646, -0.2384166717529297, -0.22156202793121338, -0.20470738410949707, -0.18785274028778076, -0.17099809646606445, -0.15414345264434814, -0.13728880882263184, -0.12043416500091553, -0.10357952117919922, -0.08672487735748291, -0.0698702335357666, -0.05301558971405029, -0.036160945892333984, -0.019306302070617676, -0.002451658248901367, 0.014402985572814941, 0.03125762939453125, 0.04811227321624756, 0.06496691703796387, 0.08182156085968018, 0.09867620468139648, 0.11553084850311279, 0.1323854923248291, 0.1492401361465454, 0.16609477996826172, 0.18294942378997803, 0.19980406761169434, 0.21665871143341064, 0.23351335525512695, 0.25036799907684326, 0.26722264289855957, 0.2840772867202759, 0.3009319305419922, 0.3177865743637085, 0.3346412181854248, 0.3514958620071411, 0.3683505058288574, 0.38520514965057373, 0.40205979347229004, 0.41891443729400635, 0.43576908111572266, 0.45262372493743896, 0.4694783687591553, 0.4863330125808716, 0.5031876564025879, 0.5200423002243042, 0.5368969440460205, 0.5537515878677368, 0.5706062316894531]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 19.0, 23.0, 27.0, 50.0, 74.0, 113.0, 212.0, 357.0, 640.0, 1372.0, 3283.0, 10211.0, 46988.0, 264898.0, 159290.0, 26047.0, 6291.0, 2188.0, 940.0, 503.0, 249.0, 170.0, 101.0, 59.0, 38.0, 27.0, 19.0, 13.0, 8.0, 8.0, 6.0, 7.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.465087890625, -0.4500007629394531, -0.43491363525390625, -0.4198265075683594, -0.4047393798828125, -0.3896522521972656, -0.37456512451171875, -0.3594779968261719, -0.344390869140625, -0.3293037414550781, -0.31421661376953125, -0.2991294860839844, -0.2840423583984375, -0.2689552307128906, -0.25386810302734375, -0.23878097534179688, -0.22369384765625, -0.20860671997070312, -0.19351959228515625, -0.17843246459960938, -0.1633453369140625, -0.14825820922851562, -0.13317108154296875, -0.11808395385742188, -0.102996826171875, -0.08790969848632812, -0.07282257080078125, -0.057735443115234375, -0.0426483154296875, -0.027561187744140625, -0.01247406005859375, 0.002613067626953125, 0.0177001953125, 0.032787322998046875, 0.04787445068359375, 0.06296157836914062, 0.0780487060546875, 0.09313583374023438, 0.10822296142578125, 0.12331008911132812, 0.138397216796875, 0.15348434448242188, 0.16857147216796875, 0.18365859985351562, 0.1987457275390625, 0.21383285522460938, 0.22891998291015625, 0.24400711059570312, 0.25909423828125, 0.2741813659667969, 0.28926849365234375, 0.3043556213378906, 0.3194427490234375, 0.3345298767089844, 0.34961700439453125, 0.3647041320800781, 0.379791259765625, 0.3948783874511719, 0.40996551513671875, 0.4250526428222656, 0.4401397705078125, 0.4552268981933594, 0.47031402587890625, 0.4854011535644531, 0.50048828125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 8.0, 7.0, 11.0, 16.0, 16.0, 19.0, 23.0, 33.0, 43.0, 40.0, 59.0, 67.0, 56.0, 71.0, 56.0, 75.0, 66.0, 72.0, 56.0, 37.0, 34.0, 26.0, 21.0, 15.0, 9.0, 13.0, 6.0, 8.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.04473876953125, -0.043469905853271484, -0.04220104217529297, -0.04093217849731445, -0.03966331481933594, -0.03839445114135742, -0.037125587463378906, -0.03585672378540039, -0.034587860107421875, -0.03331899642944336, -0.032050132751464844, -0.030781269073486328, -0.029512405395507812, -0.028243541717529297, -0.02697467803955078, -0.025705814361572266, -0.02443695068359375, -0.023168087005615234, -0.02189922332763672, -0.020630359649658203, -0.019361495971679688, -0.018092632293701172, -0.016823768615722656, -0.01555490493774414, -0.014286041259765625, -0.01301717758178711, -0.011748313903808594, -0.010479450225830078, -0.009210586547851562, -0.007941722869873047, -0.006672859191894531, -0.005403995513916016, -0.0041351318359375, -0.0028662681579589844, -0.0015974044799804688, -0.0003285408020019531, 0.0009403228759765625, 0.002209186553955078, 0.0034780502319335938, 0.004746913909912109, 0.006015777587890625, 0.007284641265869141, 0.008553504943847656, 0.009822368621826172, 0.011091232299804688, 0.012360095977783203, 0.013628959655761719, 0.014897823333740234, 0.01616668701171875, 0.017435550689697266, 0.01870441436767578, 0.019973278045654297, 0.021242141723632812, 0.022511005401611328, 0.023779869079589844, 0.02504873275756836, 0.026317596435546875, 0.02758646011352539, 0.028855323791503906, 0.030124187469482422, 0.03139305114746094, 0.03266191482543945, 0.03393077850341797, 0.035199642181396484, 0.036468505859375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 6.0, 4.0, 3.0, 2.0, 2.0, 8.0, 11.0, 6.0, 11.0, 24.0, 26.0, 43.0, 57.0, 37.0, 54.0, 38.0, 38.0, 27.0, 18.0, 13.0, 10.0, 12.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2834893763065338, -0.27606239914894104, -0.26863542199134827, -0.2612084448337555, -0.2537814676761627, -0.24635447561740875, -0.23892749845981598, -0.2315005213022232, -0.22407352924346924, -0.21664655208587646, -0.2092195749282837, -0.20179259777069092, -0.19436560571193695, -0.18693862855434418, -0.1795116513967514, -0.17208467423915863, -0.16465769708156586, -0.15723071992397308, -0.1498037427663803, -0.14237675070762634, -0.13494977355003357, -0.1275227963924408, -0.12009581923484802, -0.11266884207725525, -0.10524185746908188, -0.0978148803114891, -0.09038789570331573, -0.08296091854572296, -0.07553394138813019, -0.06810695677995682, -0.060679979622364044, -0.05325299873948097, -0.04582600295543671, -0.038399022072553635, -0.030972043052315712, -0.02354506403207779, -0.016118083149194717, -0.008691102266311646, -0.001264125108718872, 0.0061628557741642, 0.013589836657047272, 0.021016817539930344, 0.028443796560168266, 0.03587077558040619, 0.04329775646328926, 0.05072473734617233, 0.058151714503765106, 0.06557869911193848, 0.07300567626953125, 0.08043265342712402, 0.0878596380352974, 0.09528661519289017, 0.10271359980106354, 0.11014057695865631, 0.11756755411624908, 0.12499453127384186, 0.13242152333259583, 0.1398485004901886, 0.14727547764778137, 0.15470245480537415, 0.1621294468641281, 0.1695564240217209, 0.17698340117931366, 0.18441037833690643, 0.1918373554944992]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 6.0, 2.0, 5.0, 7.0, 4.0, 10.0, 25.0, 39.0, 75.0, 86.0, 102.0, 58.0, 20.0, 6.0, 6.0, 11.0, 4.0, 7.0, 2.0, 4.0, 0.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2557032108306885, -0.24675419926643372, -0.23780518770217896, -0.2288561761379242, -0.21990716457366943, -0.21095815300941467, -0.2020091414451599, -0.19306012988090515, -0.1841111183166504, -0.17516210675239563, -0.16621309518814087, -0.1572640836238861, -0.14831507205963135, -0.1393660604953766, -0.13041704893112183, -0.12146802991628647, -0.11251901090145111, -0.10356999933719635, -0.09462098777294159, -0.08567197620868683, -0.07672296464443207, -0.06777395308017731, -0.05882493406534195, -0.04987592250108719, -0.04092691093683243, -0.03197789937257767, -0.023028885945677757, -0.014079872518777847, -0.0051308609545230865, 0.003818150609731674, 0.012767165899276733, 0.021716177463531494, 0.030665189027786255, 0.039614200592041016, 0.048563212156295776, 0.057512227445840836, 0.0664612352848053, 0.07541024684906006, 0.08435926586389542, 0.09330827742815018, 0.10225728899240494, 0.1112063005566597, 0.12015531212091446, 0.12910433113574982, 0.13805334270000458, 0.14700235426425934, 0.1559513658285141, 0.16490037739276886, 0.17384938895702362, 0.18279840052127838, 0.19174741208553314, 0.2006964236497879, 0.20964543521404266, 0.21859444677829742, 0.22754347324371338, 0.23649248480796814, 0.2454414963722229, 0.25439050793647766, 0.2633395195007324, 0.2722885310649872, 0.28123754262924194, 0.2901865541934967, 0.29913556575775146, 0.3080845773220062, 0.317033588886261]}, "train/train_runtime": 4778.2339, "train/train_samples_per_second": 5.972, "train/train_steps_per_second": 0.062, "train/total_flos": 0.0, "train/train_loss": 4.439775107284186} \ No newline at end of file +{"train/loss": 4.5598, "train/learning_rate": 5.92e-06, "train/epoch": 1.0, "train/global_step": 297, "_runtime": 6078, "_timestamp": 1646087417, "_step": 298, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 18.0, 136.0, 307.0, 339.0, 165.0, 40.0, 8.0, 3.0], "bins": [-198.99710083007812, -195.63198852539062, -192.26686096191406, -188.90174865722656, -185.53662109375, -182.1715087890625, -178.80638122558594, -175.44126892089844, -172.07614135742188, -168.71102905273438, -165.3459014892578, -161.9807891845703, -158.61566162109375, -155.25054931640625, -151.8854217529297, -148.5203094482422, -145.15518188476562, -141.79006958007812, -138.42494201660156, -135.05982971191406, -131.6947021484375, -128.32958984375, -124.96446228027344, -121.5993423461914, -118.2342300415039, -114.86911010742188, -111.50399017333984, -108.13887023925781, -104.77375030517578, -101.40863037109375, -98.04351043701172, -94.67839050292969, -91.31327056884766, -87.94815063476562, -84.5830307006836, -81.21791076660156, -77.85279083251953, -74.4876708984375, -71.12255096435547, -67.75743103027344, -64.3923110961914, -61.027191162109375, -57.662071228027344, -54.29695129394531, -50.93183135986328, -47.56671142578125, -44.20159149169922, -40.83647155761719, -37.47135543823242, -34.10623550415039, -30.74111557006836, -27.375995635986328, -24.010875701904297, -20.6457576751709, -17.280637741088867, -13.915517807006836, -10.550397872924805, -7.185277938842773, -3.8201584815979004, -0.45503902435302734, 2.910080909729004, 6.275199890136719, 9.64031982421875, 13.005439758300781, 16.370559692382812]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 7.0, 12.0, 9.0, 18.0, 17.0, 20.0, 20.0, 29.0, 35.0, 31.0, 40.0, 38.0, 43.0, 50.0, 42.0, 31.0, 38.0, 44.0, 42.0, 45.0, 48.0, 45.0, 39.0, 37.0, 19.0, 26.0, 26.0, 19.0, 16.0, 20.0, 11.0, 13.0, 11.0, 9.0, 11.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-48.525508880615234, -47.09046173095703, -45.65541458129883, -44.22036361694336, -42.785316467285156, -41.35026931762695, -39.91522216796875, -38.48017120361328, -37.04512405395508, -35.610076904296875, -34.17502975463867, -32.7399787902832, -31.304931640625, -29.869884490966797, -28.434837341308594, -26.999788284301758, -25.564741134643555, -24.12969398498535, -22.694644927978516, -21.259597778320312, -19.824548721313477, -18.389501571655273, -16.954452514648438, -15.519405364990234, -14.084357261657715, -12.649309158325195, -11.214261054992676, -9.779212951660156, -8.344165802001953, -6.909117221832275, -5.474069595336914, -4.0390214920043945, -2.603973388671875, -1.168925404548645, 0.26612257957458496, 1.7011704444885254, 3.136218547821045, 4.5712666511535645, 6.006314277648926, 7.441362380981445, 8.876410484313965, 10.311458587646484, 11.746506690979004, 13.181554794311523, 14.616601943969727, 16.051651000976562, 17.486698150634766, 18.92174530029297, 20.356794357299805, 21.791841506958008, 23.226890563964844, 24.661937713623047, 26.096986770629883, 27.532033920288086, 28.967082977294922, 30.402130126953125, 31.837177276611328, 33.27222442626953, 34.707271575927734, 36.1423225402832, 37.577369689941406, 39.01241683959961, 40.44746398925781, 41.88251495361328, 43.317562103271484]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 1.0, 6.0, 5.0, 16.0, 11.0, 22.0, 14.0, 19.0, 24.0, 27.0, 25.0, 34.0, 47.0, 43.0, 51.0, 56.0, 46.0, 41.0, 54.0, 57.0, 35.0, 44.0, 46.0, 30.0, 37.0, 32.0, 32.0, 28.0, 17.0, 15.0, 21.0, 16.0, 9.0, 11.0, 4.0, 4.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.906402587890625, -2.80303955078125, -2.699676513671875, -2.5963134765625, -2.492950439453125, -2.38958740234375, -2.286224365234375, -2.182861328125, -2.079498291015625, -1.97613525390625, -1.872772216796875, -1.7694091796875, -1.666046142578125, -1.56268310546875, -1.459320068359375, -1.35595703125, -1.252593994140625, -1.14923095703125, -1.045867919921875, -0.9425048828125, -0.839141845703125, -0.73577880859375, -0.632415771484375, -0.529052734375, -0.425689697265625, -0.32232666015625, -0.218963623046875, -0.1156005859375, -0.012237548828125, 0.09112548828125, 0.194488525390625, 0.2978515625, 0.401214599609375, 0.50457763671875, 0.607940673828125, 0.7113037109375, 0.814666748046875, 0.91802978515625, 1.021392822265625, 1.124755859375, 1.228118896484375, 1.33148193359375, 1.434844970703125, 1.5382080078125, 1.641571044921875, 1.74493408203125, 1.848297119140625, 1.95166015625, 2.055023193359375, 2.15838623046875, 2.261749267578125, 2.3651123046875, 2.468475341796875, 2.57183837890625, 2.675201416015625, 2.778564453125, 2.881927490234375, 2.98529052734375, 3.088653564453125, 3.1920166015625, 3.295379638671875, 3.39874267578125, 3.502105712890625, 3.60546875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 11.0, 16.0, 23.0, 45.0, 77.0, 101.0, 196.0, 245.0, 457.0, 802.0, 1606.0, 3407.0, 10055.0, 47288.0, 504506.0, 2939452.0, 612538.0, 54358.0, 11380.0, 3863.0, 1744.0, 862.0, 478.0, 267.0, 203.0, 107.0, 72.0, 45.0, 35.0, 16.0, 13.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2421875, -12.889404296875, -12.53662109375, -12.183837890625, -11.8310546875, -11.478271484375, -11.12548828125, -10.772705078125, -10.419921875, -10.067138671875, -9.71435546875, -9.361572265625, -9.0087890625, -8.656005859375, -8.30322265625, -7.950439453125, -7.59765625, -7.244873046875, -6.89208984375, -6.539306640625, -6.1865234375, -5.833740234375, -5.48095703125, -5.128173828125, -4.775390625, -4.422607421875, -4.06982421875, -3.717041015625, -3.3642578125, -3.011474609375, -2.65869140625, -2.305908203125, -1.953125, -1.600341796875, -1.24755859375, -0.894775390625, -0.5419921875, -0.189208984375, 0.16357421875, 0.516357421875, 0.869140625, 1.221923828125, 1.57470703125, 1.927490234375, 2.2802734375, 2.633056640625, 2.98583984375, 3.338623046875, 3.69140625, 4.044189453125, 4.39697265625, 4.749755859375, 5.1025390625, 5.455322265625, 5.80810546875, 6.160888671875, 6.513671875, 6.866455078125, 7.21923828125, 7.572021484375, 7.9248046875, 8.277587890625, 8.63037109375, 8.983154296875, 9.3359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 17.0, 16.0, 20.0, 36.0, 40.0, 53.0, 75.0, 136.0, 162.0, 249.0, 364.0, 529.0, 570.0, 520.0, 368.0, 282.0, 203.0, 123.0, 94.0, 61.0, 41.0, 25.0, 21.0, 18.0, 8.0, 5.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.515625, -13.111328125, -12.70703125, -12.302734375, -11.8984375, -11.494140625, -11.08984375, -10.685546875, -10.28125, -9.876953125, -9.47265625, -9.068359375, -8.6640625, -8.259765625, -7.85546875, -7.451171875, -7.046875, -6.642578125, -6.23828125, -5.833984375, -5.4296875, -5.025390625, -4.62109375, -4.216796875, -3.8125, -3.408203125, -3.00390625, -2.599609375, -2.1953125, -1.791015625, -1.38671875, -0.982421875, -0.578125, -0.173828125, 0.23046875, 0.634765625, 1.0390625, 1.443359375, 1.84765625, 2.251953125, 2.65625, 3.060546875, 3.46484375, 3.869140625, 4.2734375, 4.677734375, 5.08203125, 5.486328125, 5.890625, 6.294921875, 6.69921875, 7.103515625, 7.5078125, 7.912109375, 8.31640625, 8.720703125, 9.125, 9.529296875, 9.93359375, 10.337890625, 10.7421875, 11.146484375, 11.55078125, 11.955078125, 12.359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 11.0, 11.0, 17.0, 37.0, 49.0, 53.0, 101.0, 154.0, 271.0, 461.0, 957.0, 2154.0, 9341.0, 857523.0, 3298325.0, 19224.0, 3053.0, 1146.0, 591.0, 283.0, 182.0, 102.0, 69.0, 43.0, 32.0, 26.0, 15.0, 8.0, 7.0, 6.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.46875, -40.04541015625, -38.6220703125, -37.19873046875, -35.775390625, -34.35205078125, -32.9287109375, -31.50537109375, -30.08203125, -28.65869140625, -27.2353515625, -25.81201171875, -24.388671875, -22.96533203125, -21.5419921875, -20.11865234375, -18.6953125, -17.27197265625, -15.8486328125, -14.42529296875, -13.001953125, -11.57861328125, -10.1552734375, -8.73193359375, -7.30859375, -5.88525390625, -4.4619140625, -3.03857421875, -1.615234375, -0.19189453125, 1.2314453125, 2.65478515625, 4.078125, 5.50146484375, 6.9248046875, 8.34814453125, 9.771484375, 11.19482421875, 12.6181640625, 14.04150390625, 15.46484375, 16.88818359375, 18.3115234375, 19.73486328125, 21.158203125, 22.58154296875, 24.0048828125, 25.42822265625, 26.8515625, 28.27490234375, 29.6982421875, 31.12158203125, 32.544921875, 33.96826171875, 35.3916015625, 36.81494140625, 38.23828125, 39.66162109375, 41.0849609375, 42.50830078125, 43.931640625, 45.35498046875, 46.7783203125, 48.20166015625, 49.625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 42.0, 245.0, 426.0, 241.0, 41.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.0782012939453, -156.39073181152344, -152.70327758789062, -149.01580810546875, -145.32833862304688, -141.640869140625, -137.9534149169922, -134.2659454345703, -130.57847595214844, -126.8910140991211, -123.20354461669922, -119.51608276367188, -115.82861328125, -112.14115142822266, -108.45368957519531, -104.76622009277344, -101.0787582397461, -97.39129638671875, -93.70382690429688, -90.01636505126953, -86.32889556884766, -82.64143371582031, -78.95396423339844, -75.2665023803711, -71.57904052734375, -67.8915786743164, -64.20410919189453, -60.51664733886719, -56.82917785644531, -53.14171600341797, -49.45425033569336, -45.76678466796875, -42.079315185546875, -38.391849517822266, -34.704383850097656, -31.01692008972168, -27.32945442199707, -23.64198875427246, -19.954524993896484, -16.267059326171875, -12.579593658447266, -8.892127990722656, -5.204663276672363, -1.5171985626220703, 2.170267105102539, 5.857732772827148, 9.545196533203125, 13.232662200927734, 16.920127868652344, 20.607593536376953, 24.295059204101562, 27.98252296447754, 31.66998863220215, 35.357452392578125, 39.044918060302734, 42.732383728027344, 46.41984939575195, 50.10731506347656, 53.79478073120117, 57.48224639892578, 61.169708251953125, 64.857177734375, 68.54463958740234, 72.23210144042969, 75.91957092285156]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 7.0, 4.0, 3.0, 7.0, 7.0, 14.0, 12.0, 8.0, 11.0, 15.0, 13.0, 14.0, 27.0, 25.0, 30.0, 30.0, 35.0, 33.0, 29.0, 32.0, 38.0, 31.0, 32.0, 33.0, 38.0, 43.0, 30.0, 35.0, 38.0, 26.0, 39.0, 29.0, 34.0, 26.0, 22.0, 32.0, 16.0, 20.0, 15.0, 15.0, 13.0, 13.0, 7.0, 7.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.028709411621094, -33.95008850097656, -32.8714714050293, -31.7928524017334, -30.7142333984375, -29.6356143951416, -28.556995391845703, -27.478376388549805, -26.399757385253906, -25.321138381958008, -24.24251937866211, -23.16390037536621, -22.085281372070312, -21.006662368774414, -19.928043365478516, -18.849424362182617, -17.77080535888672, -16.69218635559082, -15.613567352294922, -14.534948348999023, -13.456329345703125, -12.377710342407227, -11.299091339111328, -10.22047233581543, -9.141853332519531, -8.063234329223633, -6.984615325927734, -5.905996322631836, -4.8273773193359375, -3.748758316040039, -2.6701393127441406, -1.5915203094482422, -0.5129051208496094, 0.5657138824462891, 1.6443328857421875, 2.722951889038086, 3.8015708923339844, 4.880189895629883, 5.958808898925781, 7.03742790222168, 8.116046905517578, 9.194665908813477, 10.273284912109375, 11.351903915405273, 12.430522918701172, 13.50914192199707, 14.587760925292969, 15.666379928588867, 16.744998931884766, 17.823617935180664, 18.902236938476562, 19.98085594177246, 21.05947494506836, 22.138093948364258, 23.216712951660156, 24.295331954956055, 25.373950958251953, 26.45256996154785, 27.53118896484375, 28.60980796813965, 29.688426971435547, 30.767045974731445, 31.845664978027344, 32.924285888671875, 34.00290298461914]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 2.0, 3.0, 9.0, 9.0, 4.0, 15.0, 19.0, 24.0, 24.0, 21.0, 26.0, 21.0, 30.0, 38.0, 39.0, 24.0, 42.0, 50.0, 46.0, 58.0, 41.0, 39.0, 35.0, 41.0, 37.0, 33.0, 35.0, 26.0, 28.0, 22.0, 20.0, 32.0, 11.0, 27.0, 10.0, 11.0, 14.0, 7.0, 3.0, 4.0, 5.0, 3.0, 4.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.333984375, -3.230377197265625, -3.12677001953125, -3.023162841796875, -2.9195556640625, -2.815948486328125, -2.71234130859375, -2.608734130859375, -2.505126953125, -2.401519775390625, -2.29791259765625, -2.194305419921875, -2.0906982421875, -1.987091064453125, -1.88348388671875, -1.779876708984375, -1.67626953125, -1.572662353515625, -1.46905517578125, -1.365447998046875, -1.2618408203125, -1.158233642578125, -1.05462646484375, -0.951019287109375, -0.847412109375, -0.743804931640625, -0.64019775390625, -0.536590576171875, -0.4329833984375, -0.329376220703125, -0.22576904296875, -0.122161865234375, -0.0185546875, 0.085052490234375, 0.18865966796875, 0.292266845703125, 0.3958740234375, 0.499481201171875, 0.60308837890625, 0.706695556640625, 0.810302734375, 0.913909912109375, 1.01751708984375, 1.121124267578125, 1.2247314453125, 1.328338623046875, 1.43194580078125, 1.535552978515625, 1.63916015625, 1.742767333984375, 1.84637451171875, 1.949981689453125, 2.0535888671875, 2.157196044921875, 2.26080322265625, 2.364410400390625, 2.468017578125, 2.571624755859375, 2.67523193359375, 2.778839111328125, 2.8824462890625, 2.986053466796875, 3.08966064453125, 3.193267822265625, 3.296875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 10.0, 18.0, 19.0, 25.0, 61.0, 62.0, 94.0, 120.0, 178.0, 277.0, 385.0, 589.0, 847.0, 1214.0, 1797.0, 2721.0, 4127.0, 6333.0, 9428.0, 14927.0, 22528.0, 35128.0, 55721.0, 94655.0, 192169.0, 302736.0, 117237.0, 66796.0, 41349.0, 26443.0, 17349.0, 11065.0, 7401.0, 4896.0, 3089.0, 2174.0, 1434.0, 955.0, 693.0, 471.0, 299.0, 211.0, 158.0, 98.0, 85.0, 58.0, 28.0, 33.0, 24.0, 10.0, 3.0, 9.0, 4.0, 3.0, 5.0, 0.0, 2.0], "bins": [-0.85986328125, -0.8331451416015625, -0.806427001953125, -0.7797088623046875, -0.75299072265625, -0.7262725830078125, -0.699554443359375, -0.6728363037109375, -0.6461181640625, -0.6194000244140625, -0.592681884765625, -0.5659637451171875, -0.53924560546875, -0.5125274658203125, -0.485809326171875, -0.4590911865234375, -0.432373046875, -0.4056549072265625, -0.378936767578125, -0.3522186279296875, -0.32550048828125, -0.2987823486328125, -0.272064208984375, -0.2453460693359375, -0.2186279296875, -0.1919097900390625, -0.165191650390625, -0.1384735107421875, -0.11175537109375, -0.0850372314453125, -0.058319091796875, -0.0316009521484375, -0.0048828125, 0.0218353271484375, 0.048553466796875, 0.0752716064453125, 0.10198974609375, 0.1287078857421875, 0.155426025390625, 0.1821441650390625, 0.2088623046875, 0.2355804443359375, 0.262298583984375, 0.2890167236328125, 0.31573486328125, 0.3424530029296875, 0.369171142578125, 0.3958892822265625, 0.422607421875, 0.4493255615234375, 0.476043701171875, 0.5027618408203125, 0.52947998046875, 0.5561981201171875, 0.582916259765625, 0.6096343994140625, 0.6363525390625, 0.6630706787109375, 0.689788818359375, 0.7165069580078125, 0.74322509765625, 0.7699432373046875, 0.796661376953125, 0.8233795166015625, 0.85009765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 5.0, 4.0, 6.0, 10.0, 9.0, 13.0, 16.0, 12.0, 22.0, 21.0, 14.0, 27.0, 24.0, 28.0, 42.0, 27.0, 42.0, 38.0, 44.0, 40.0, 38.0, 1060.0, 40.0, 37.0, 37.0, 31.0, 36.0, 30.0, 33.0, 33.0, 31.0, 20.0, 24.0, 27.0, 15.0, 12.0, 13.0, 7.0, 14.0, 9.0, 5.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9912109375, -1.9278717041015625, -1.864532470703125, -1.8011932373046875, -1.73785400390625, -1.6745147705078125, -1.611175537109375, -1.5478363037109375, -1.4844970703125, -1.4211578369140625, -1.357818603515625, -1.2944793701171875, -1.23114013671875, -1.1678009033203125, -1.104461669921875, -1.0411224365234375, -0.977783203125, -0.9144439697265625, -0.851104736328125, -0.7877655029296875, -0.72442626953125, -0.6610870361328125, -0.597747802734375, -0.5344085693359375, -0.4710693359375, -0.4077301025390625, -0.344390869140625, -0.2810516357421875, -0.21771240234375, -0.1543731689453125, -0.091033935546875, -0.0276947021484375, 0.03564453125, 0.0989837646484375, 0.162322998046875, 0.2256622314453125, 0.28900146484375, 0.3523406982421875, 0.415679931640625, 0.4790191650390625, 0.5423583984375, 0.6056976318359375, 0.669036865234375, 0.7323760986328125, 0.79571533203125, 0.8590545654296875, 0.922393798828125, 0.9857330322265625, 1.049072265625, 1.1124114990234375, 1.175750732421875, 1.2390899658203125, 1.30242919921875, 1.3657684326171875, 1.429107666015625, 1.4924468994140625, 1.5557861328125, 1.6191253662109375, 1.682464599609375, 1.7458038330078125, 1.80914306640625, 1.8724822998046875, 1.935821533203125, 1.9991607666015625, 2.0625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 6.0, 6.0, 19.0, 11.0, 24.0, 34.0, 59.0, 68.0, 114.0, 204.0, 272.0, 328.0, 533.0, 825.0, 1191.0, 1688.0, 2309.0, 3432.0, 4891.0, 7135.0, 10551.0, 15548.0, 23368.0, 35620.0, 54642.0, 86991.0, 156070.0, 1343173.0, 127896.0, 75728.0, 48120.0, 31549.0, 20589.0, 14036.0, 9282.0, 6342.0, 4438.0, 3083.0, 2188.0, 1493.0, 967.0, 751.0, 536.0, 344.0, 231.0, 155.0, 103.0, 76.0, 40.0, 38.0, 19.0, 9.0, 7.0, 5.0, 2.0, 7.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.74755859375, -0.7237167358398438, -0.6998748779296875, -0.6760330200195312, -0.652191162109375, -0.6283493041992188, -0.6045074462890625, -0.5806655883789062, -0.55682373046875, -0.5329818725585938, -0.5091400146484375, -0.48529815673828125, -0.461456298828125, -0.43761444091796875, -0.4137725830078125, -0.38993072509765625, -0.3660888671875, -0.34224700927734375, -0.3184051513671875, -0.29456329345703125, -0.270721435546875, -0.24687957763671875, -0.2230377197265625, -0.19919586181640625, -0.17535400390625, -0.15151214599609375, -0.1276702880859375, -0.10382843017578125, -0.079986572265625, -0.05614471435546875, -0.0323028564453125, -0.00846099853515625, 0.015380859375, 0.03922271728515625, 0.0630645751953125, 0.08690643310546875, 0.110748291015625, 0.13459014892578125, 0.1584320068359375, 0.18227386474609375, 0.20611572265625, 0.22995758056640625, 0.2537994384765625, 0.27764129638671875, 0.301483154296875, 0.32532501220703125, 0.3491668701171875, 0.37300872802734375, 0.3968505859375, 0.42069244384765625, 0.4445343017578125, 0.46837615966796875, 0.492218017578125, 0.5160598754882812, 0.5399017333984375, 0.5637435913085938, 0.58758544921875, 0.6114273071289062, 0.6352691650390625, 0.6591110229492188, 0.682952880859375, 0.7067947387695312, 0.7306365966796875, 0.7544784545898438, 0.7783203125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 7.0, 10.0, 12.0, 15.0, 16.0, 23.0, 18.0, 38.0, 29.0, 38.0, 62.0, 66.0, 62.0, 69.0, 81.0, 60.0, 55.0, 51.0, 48.0, 36.0, 30.0, 27.0, 15.0, 15.0, 15.0, 17.0, 17.0, 6.0, 5.0, 7.0, 5.0, 1.0, 7.0, 5.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00011390447616577148, -0.00011033192276954651, -0.00010675936937332153, -0.00010318681597709656, -9.961426258087158e-05, -9.60417091846466e-05, -9.246915578842163e-05, -8.889660239219666e-05, -8.532404899597168e-05, -8.17514955997467e-05, -7.817894220352173e-05, -7.460638880729675e-05, -7.103383541107178e-05, -6.74612820148468e-05, -6.388872861862183e-05, -6.031617522239685e-05, -5.6743621826171875e-05, -5.31710684299469e-05, -4.9598515033721924e-05, -4.602596163749695e-05, -4.245340824127197e-05, -3.8880854845047e-05, -3.530830144882202e-05, -3.1735748052597046e-05, -2.816319465637207e-05, -2.4590641260147095e-05, -2.101808786392212e-05, -1.7445534467697144e-05, -1.3872981071472168e-05, -1.0300427675247192e-05, -6.727874279022217e-06, -3.155320882797241e-06, 4.172325134277344e-07, 3.98978590965271e-06, 7.5623393058776855e-06, 1.1134892702102661e-05, 1.4707446098327637e-05, 1.8279999494552612e-05, 2.1852552890777588e-05, 2.5425106287002563e-05, 2.899765968322754e-05, 3.2570213079452515e-05, 3.614276647567749e-05, 3.9715319871902466e-05, 4.328787326812744e-05, 4.686042666435242e-05, 5.043298006057739e-05, 5.400553345680237e-05, 5.7578086853027344e-05, 6.115064024925232e-05, 6.47231936454773e-05, 6.829574704170227e-05, 7.186830043792725e-05, 7.544085383415222e-05, 7.90134072303772e-05, 8.258596062660217e-05, 8.615851402282715e-05, 8.973106741905212e-05, 9.33036208152771e-05, 9.687617421150208e-05, 0.00010044872760772705, 0.00010402128100395203, 0.000107593834400177, 0.00011116638779640198, 0.00011473894119262695]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 10.0, 11.0, 6.0, 10.0, 8.0, 15.0, 17.0, 30.0, 31.0, 32.0, 42.0, 53.0, 94.0, 78.0, 127.0, 147.0, 200.0, 306.0, 443.0, 717.0, 3361.0, 1032620.0, 7675.0, 736.0, 470.0, 326.0, 211.0, 179.0, 126.0, 89.0, 61.0, 80.0, 44.0, 40.0, 31.0, 16.0, 20.0, 10.0, 11.0, 19.0, 10.0, 9.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0018186569213867188, -0.001759156584739685, -0.0016996562480926514, -0.0016401559114456177, -0.001580655574798584, -0.0015211552381515503, -0.0014616549015045166, -0.001402154564857483, -0.0013426542282104492, -0.0012831538915634155, -0.0012236535549163818, -0.0011641532182693481, -0.0011046528816223145, -0.0010451525449752808, -0.000985652208328247, -0.0009261518716812134, -0.0008666515350341797, -0.000807151198387146, -0.0007476508617401123, -0.0006881505250930786, -0.0006286501884460449, -0.0005691498517990112, -0.0005096495151519775, -0.00045014917850494385, -0.00039064884185791016, -0.00033114850521087646, -0.0002716481685638428, -0.00021214783191680908, -0.0001526474952697754, -9.31471586227417e-05, -3.364682197570801e-05, 2.5853514671325684e-05, 8.535385131835938e-05, 0.00014485418796539307, 0.00020435452461242676, 0.00026385486125946045, 0.00032335519790649414, 0.00038285553455352783, 0.0004423558712005615, 0.0005018562078475952, 0.0005613565444946289, 0.0006208568811416626, 0.0006803572177886963, 0.00073985755443573, 0.0007993578910827637, 0.0008588582277297974, 0.0009183585643768311, 0.0009778589010238647, 0.0010373592376708984, 0.0010968595743179321, 0.0011563599109649658, 0.0012158602476119995, 0.0012753605842590332, 0.001334860920906067, 0.0013943612575531006, 0.0014538615942001343, 0.001513361930847168, 0.0015728622674942017, 0.0016323626041412354, 0.001691862940788269, 0.0017513632774353027, 0.0018108636140823364, 0.0018703639507293701, 0.0019298642873764038, 0.0019893646240234375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 727.0, 289.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007530585280619562, -0.0007320598233491182, -0.0007110611186362803, -0.0006900624139234424, -0.0006690637674182653, -0.0006480650627054274, -0.0006270663579925895, -0.0006060676532797515, -0.0005850689485669136, -0.0005640702438540757, -0.0005430715391412377, -0.0005220728926360607, -0.0005010741879232228, -0.00048007548321038485, -0.0004590767784975469, -0.000438078073784709, -0.00041707942727953196, -0.000396080722566694, -0.00037508204695768654, -0.0003540833422448486, -0.00033308466663584113, -0.0003120859619230032, -0.00029108725721016526, -0.00027008855249732733, -0.00024908987688831985, -0.00022809118672739714, -0.00020709249656647444, -0.0001860937918536365, -0.0001650951016927138, -0.0001440964115317911, -0.00012309770681895316, -0.00010209901665803045, -8.110032649710774e-05, -6.010163269820623e-05, -3.910293889930472e-05, -1.8104241462424397e-05, 2.8944486984983087e-06, 2.3893138859421015e-05, 4.489184357225895e-05, 6.589053373318166e-05, 8.688922389410436e-05, 0.00010788791405502707, 0.00012888660421594977, 0.0001498853089287877, 0.00017088399908971041, 0.00019188268925063312, 0.00021288139396347106, 0.00023388008412439376, 0.00025487877428531647, 0.0002758774789981544, 0.0002968761546071619, 0.0003178748593199998, 0.0003388735349290073, 0.0003598722396418452, 0.00038087094435468316, 0.0004018696490675211, 0.0004228683246765286, 0.0004438670293893665, 0.000464865704998374, 0.0004858644097112119, 0.0005068631144240499, 0.0005278617609292269, 0.0005488605238497257, 0.0005698591703549027, 0.0005908578750677407]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 12.0, 5.0, 12.0, 9.0, 17.0, 12.0, 15.0, 18.0, 25.0, 30.0, 31.0, 29.0, 22.0, 36.0, 43.0, 30.0, 50.0, 38.0, 29.0, 51.0, 42.0, 31.0, 39.0, 41.0, 39.0, 30.0, 32.0, 29.0, 29.0, 17.0, 19.0, 19.0, 19.0, 17.0, 8.0, 10.0, 11.0, 10.0, 7.0, 9.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.358457565307617e-05, -5.179643630981445e-05, -5.0008296966552734e-05, -4.8220157623291016e-05, -4.64320182800293e-05, -4.464387893676758e-05, -4.285573959350586e-05, -4.106760025024414e-05, -3.927946090698242e-05, -3.74913215637207e-05, -3.5703182220458984e-05, -3.3915042877197266e-05, -3.212690353393555e-05, -3.0338764190673828e-05, -2.855062484741211e-05, -2.676248550415039e-05, -2.4974346160888672e-05, -2.3186206817626953e-05, -2.1398067474365234e-05, -1.9609928131103516e-05, -1.7821788787841797e-05, -1.6033649444580078e-05, -1.424551010131836e-05, -1.245737075805664e-05, -1.0669231414794922e-05, -8.881092071533203e-06, -7.092952728271484e-06, -5.304813385009766e-06, -3.516674041748047e-06, -1.7285346984863281e-06, 5.960464477539063e-08, 1.8477439880371094e-06, 3.635883331298828e-06, 5.424022674560547e-06, 7.212162017822266e-06, 9.000301361083984e-06, 1.0788440704345703e-05, 1.2576580047607422e-05, 1.436471939086914e-05, 1.615285873413086e-05, 1.7940998077392578e-05, 1.9729137420654297e-05, 2.1517276763916016e-05, 2.3305416107177734e-05, 2.5093555450439453e-05, 2.6881694793701172e-05, 2.866983413696289e-05, 3.045797348022461e-05, 3.224611282348633e-05, 3.403425216674805e-05, 3.5822391510009766e-05, 3.7610530853271484e-05, 3.93986701965332e-05, 4.118680953979492e-05, 4.297494888305664e-05, 4.476308822631836e-05, 4.655122756958008e-05, 4.83393669128418e-05, 5.0127506256103516e-05, 5.1915645599365234e-05, 5.370378494262695e-05, 5.549192428588867e-05, 5.728006362915039e-05, 5.906820297241211e-05, 6.085634231567383e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 2.0, 3.0, 9.0, 9.0, 4.0, 15.0, 19.0, 24.0, 24.0, 21.0, 26.0, 21.0, 30.0, 38.0, 39.0, 24.0, 42.0, 50.0, 46.0, 58.0, 41.0, 39.0, 35.0, 41.0, 37.0, 33.0, 35.0, 26.0, 28.0, 22.0, 20.0, 32.0, 11.0, 27.0, 10.0, 11.0, 14.0, 7.0, 3.0, 4.0, 5.0, 3.0, 4.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.333984375, -3.230377197265625, -3.12677001953125, -3.023162841796875, -2.9195556640625, -2.815948486328125, -2.71234130859375, -2.608734130859375, -2.505126953125, -2.401519775390625, -2.29791259765625, -2.194305419921875, -2.0906982421875, -1.987091064453125, -1.88348388671875, -1.779876708984375, -1.67626953125, -1.572662353515625, -1.46905517578125, -1.365447998046875, -1.2618408203125, -1.158233642578125, -1.05462646484375, -0.951019287109375, -0.847412109375, -0.743804931640625, -0.64019775390625, -0.536590576171875, -0.4329833984375, -0.329376220703125, -0.22576904296875, -0.122161865234375, -0.0185546875, 0.085052490234375, 0.18865966796875, 0.292266845703125, 0.3958740234375, 0.499481201171875, 0.60308837890625, 0.706695556640625, 0.810302734375, 0.913909912109375, 1.01751708984375, 1.121124267578125, 1.2247314453125, 1.328338623046875, 1.43194580078125, 1.535552978515625, 1.63916015625, 1.742767333984375, 1.84637451171875, 1.949981689453125, 2.0535888671875, 2.157196044921875, 2.26080322265625, 2.364410400390625, 2.468017578125, 2.571624755859375, 2.67523193359375, 2.778839111328125, 2.8824462890625, 2.986053466796875, 3.08966064453125, 3.193267822265625, 3.296875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 15.0, 15.0, 19.0, 15.0, 39.0, 41.0, 68.0, 56.0, 91.0, 126.0, 162.0, 221.0, 298.0, 387.0, 503.0, 673.0, 995.0, 1241.0, 1882.0, 2874.0, 4343.0, 7787.0, 16292.0, 59243.0, 560990.0, 320525.0, 37650.0, 12833.0, 6636.0, 3788.0, 2428.0, 1682.0, 1184.0, 895.0, 666.0, 453.0, 351.0, 263.0, 200.0, 145.0, 114.0, 92.0, 65.0, 48.0, 39.0, 26.0, 24.0, 15.0, 13.0, 11.0, 8.0, 8.0, 5.0, 1.0, 1.0, 3.0, 3.0], "bins": [-15.1171875, -14.6427001953125, -14.168212890625, -13.6937255859375, -13.21923828125, -12.7447509765625, -12.270263671875, -11.7957763671875, -11.3212890625, -10.8468017578125, -10.372314453125, -9.8978271484375, -9.42333984375, -8.9488525390625, -8.474365234375, -7.9998779296875, -7.525390625, -7.0509033203125, -6.576416015625, -6.1019287109375, -5.62744140625, -5.1529541015625, -4.678466796875, -4.2039794921875, -3.7294921875, -3.2550048828125, -2.780517578125, -2.3060302734375, -1.83154296875, -1.3570556640625, -0.882568359375, -0.4080810546875, 0.06640625, 0.5408935546875, 1.015380859375, 1.4898681640625, 1.96435546875, 2.4388427734375, 2.913330078125, 3.3878173828125, 3.8623046875, 4.3367919921875, 4.811279296875, 5.2857666015625, 5.76025390625, 6.2347412109375, 6.709228515625, 7.1837158203125, 7.658203125, 8.1326904296875, 8.607177734375, 9.0816650390625, 9.55615234375, 10.0306396484375, 10.505126953125, 10.9796142578125, 11.4541015625, 11.9285888671875, 12.403076171875, 12.8775634765625, 13.35205078125, 13.8265380859375, 14.301025390625, 14.7755126953125, 15.25]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 1.0, 6.0, 6.0, 12.0, 6.0, 12.0, 9.0, 18.0, 17.0, 14.0, 26.0, 19.0, 23.0, 37.0, 32.0, 26.0, 36.0, 52.0, 79.0, 119.0, 214.0, 1337.0, 301.0, 165.0, 83.0, 64.0, 43.0, 38.0, 34.0, 34.0, 34.0, 37.0, 23.0, 16.0, 6.0, 14.0, 10.0, 8.0, 7.0, 5.0, 2.0, 11.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.6875, -11.370849609375, -11.05419921875, -10.737548828125, -10.4208984375, -10.104248046875, -9.78759765625, -9.470947265625, -9.154296875, -8.837646484375, -8.52099609375, -8.204345703125, -7.8876953125, -7.571044921875, -7.25439453125, -6.937744140625, -6.62109375, -6.304443359375, -5.98779296875, -5.671142578125, -5.3544921875, -5.037841796875, -4.72119140625, -4.404541015625, -4.087890625, -3.771240234375, -3.45458984375, -3.137939453125, -2.8212890625, -2.504638671875, -2.18798828125, -1.871337890625, -1.5546875, -1.238037109375, -0.92138671875, -0.604736328125, -0.2880859375, 0.028564453125, 0.34521484375, 0.661865234375, 0.978515625, 1.295166015625, 1.61181640625, 1.928466796875, 2.2451171875, 2.561767578125, 2.87841796875, 3.195068359375, 3.51171875, 3.828369140625, 4.14501953125, 4.461669921875, 4.7783203125, 5.094970703125, 5.41162109375, 5.728271484375, 6.044921875, 6.361572265625, 6.67822265625, 6.994873046875, 7.3115234375, 7.628173828125, 7.94482421875, 8.261474609375, 8.578125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 5.0, 3.0, 3.0, 10.0, 4.0, 12.0, 11.0, 7.0, 13.0, 23.0, 23.0, 40.0, 38.0, 47.0, 50.0, 112.0, 170.0, 495.0, 1884.0, 261235.0, 2876437.0, 3566.0, 751.0, 282.0, 123.0, 69.0, 59.0, 31.0, 31.0, 32.0, 24.0, 24.0, 14.0, 19.0, 12.0, 7.0, 7.0, 7.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.28125, -36.92138671875, -35.5615234375, -34.20166015625, -32.841796875, -31.48193359375, -30.1220703125, -28.76220703125, -27.40234375, -26.04248046875, -24.6826171875, -23.32275390625, -21.962890625, -20.60302734375, -19.2431640625, -17.88330078125, -16.5234375, -15.16357421875, -13.8037109375, -12.44384765625, -11.083984375, -9.72412109375, -8.3642578125, -7.00439453125, -5.64453125, -4.28466796875, -2.9248046875, -1.56494140625, -0.205078125, 1.15478515625, 2.5146484375, 3.87451171875, 5.234375, 6.59423828125, 7.9541015625, 9.31396484375, 10.673828125, 12.03369140625, 13.3935546875, 14.75341796875, 16.11328125, 17.47314453125, 18.8330078125, 20.19287109375, 21.552734375, 22.91259765625, 24.2724609375, 25.63232421875, 26.9921875, 28.35205078125, 29.7119140625, 31.07177734375, 32.431640625, 33.79150390625, 35.1513671875, 36.51123046875, 37.87109375, 39.23095703125, 40.5908203125, 41.95068359375, 43.310546875, 44.67041015625, 46.0302734375, 47.39013671875, 48.75]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 36.0, 978.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.64373779296875, -133.6239013671875, -120.60406494140625, -107.584228515625, -94.56439208984375, -81.54454803466797, -68.52471160888672, -55.50487518310547, -42.48503875732422, -29.46520233154297, -16.445363998413086, -3.425525665283203, 9.594310760498047, 22.614151000976562, 35.63398742675781, 48.65382385253906, 61.67366027832031, 74.69349670410156, 87.71333312988281, 100.73316955566406, 113.75300598144531, 126.7728500366211, 139.79269409179688, 152.81253051757812, 165.83236694335938, 178.85220336914062, 191.87203979492188, 204.89187622070312, 217.91171264648438, 230.93154907226562, 243.95138549804688, 256.9712219238281, 269.9910583496094, 283.0108947753906, 296.0307312011719, 309.0505676269531, 322.0704040527344, 335.0902404785156, 348.1100769042969, 361.1299133300781, 374.1497497558594, 387.1695861816406, 400.1894226074219, 413.2092590332031, 426.2290954589844, 439.2489318847656, 452.2687683105469, 465.2886047363281, 478.3084716796875, 491.32830810546875, 504.34814453125, 517.3679809570312, 530.3878173828125, 543.4076538085938, 556.427490234375, 569.4473266601562, 582.4671630859375, 595.4869995117188, 608.5068359375, 621.5266723632812, 634.5465087890625, 647.5663452148438, 660.586181640625, 673.6060180664062, 686.6258544921875]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 1.0, 11.0, 6.0, 6.0, 8.0, 11.0, 15.0, 15.0, 22.0, 19.0, 15.0, 14.0, 30.0, 25.0, 26.0, 23.0, 40.0, 31.0, 40.0, 38.0, 42.0, 42.0, 40.0, 36.0, 36.0, 38.0, 45.0, 37.0, 33.0, 31.0, 25.0, 21.0, 27.0, 16.0, 21.0, 15.0, 15.0, 16.0, 15.0, 11.0, 7.0, 13.0, 5.0, 7.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.29164695739746, -30.18182373046875, -29.071998596191406, -27.962175369262695, -26.852352142333984, -25.74252700805664, -24.63270378112793, -23.52288055419922, -22.413055419921875, -21.303232192993164, -20.19340705871582, -19.08358383178711, -17.973758697509766, -16.863935470581055, -15.754112243652344, -14.644288063049316, -13.534463882446289, -12.424639701843262, -11.314815521240234, -10.204992294311523, -9.095168113708496, -7.985343933105469, -6.8755202293396, -5.7656965255737305, -4.655872344970703, -3.546048402786255, -2.4362244606018066, -1.3264005184173584, -0.21657657623291016, 0.8932476043701172, 2.0030713081359863, 3.1128950119018555, 4.222721099853516, 5.332545280456543, 6.442368984222412, 7.552192687988281, 8.662016868591309, 9.771841049194336, 10.881664276123047, 11.991488456726074, 13.101312637329102, 14.211136817932129, 15.320960998535156, 16.430784225463867, 17.540607452392578, 18.650432586669922, 19.760255813598633, 20.870079040527344, 21.979904174804688, 23.0897274017334, 24.199552536010742, 25.309375762939453, 26.419200897216797, 27.529024124145508, 28.63884735107422, 29.748672485351562, 30.858495712280273, 31.968318939208984, 33.07814407348633, 34.18796920776367, 35.29779052734375, 36.407615661621094, 37.51744079589844, 38.627262115478516, 39.73708724975586]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 10.0, 8.0, 5.0, 8.0, 10.0, 15.0, 20.0, 25.0, 12.0, 27.0, 36.0, 19.0, 20.0, 31.0, 50.0, 44.0, 41.0, 43.0, 49.0, 58.0, 35.0, 27.0, 40.0, 37.0, 36.0, 26.0, 33.0, 35.0, 33.0, 24.0, 21.0, 21.0, 17.0, 17.0, 11.0, 7.0, 12.0, 12.0, 4.0, 5.0, 7.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.298828125, -3.188140869140625, -3.07745361328125, -2.966766357421875, -2.8560791015625, -2.745391845703125, -2.63470458984375, -2.524017333984375, -2.413330078125, -2.302642822265625, -2.19195556640625, -2.081268310546875, -1.9705810546875, -1.859893798828125, -1.74920654296875, -1.638519287109375, -1.52783203125, -1.417144775390625, -1.30645751953125, -1.195770263671875, -1.0850830078125, -0.974395751953125, -0.86370849609375, -0.753021240234375, -0.642333984375, -0.531646728515625, -0.42095947265625, -0.310272216796875, -0.1995849609375, -0.088897705078125, 0.02178955078125, 0.132476806640625, 0.2431640625, 0.353851318359375, 0.46453857421875, 0.575225830078125, 0.6859130859375, 0.796600341796875, 0.90728759765625, 1.017974853515625, 1.128662109375, 1.239349365234375, 1.35003662109375, 1.460723876953125, 1.5714111328125, 1.682098388671875, 1.79278564453125, 1.903472900390625, 2.01416015625, 2.124847412109375, 2.23553466796875, 2.346221923828125, 2.4569091796875, 2.567596435546875, 2.67828369140625, 2.788970947265625, 2.899658203125, 3.010345458984375, 3.12103271484375, 3.231719970703125, 3.3424072265625, 3.453094482421875, 3.56378173828125, 3.674468994140625, 3.78515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 11.0, 11.0, 9.0, 30.0, 22.0, 38.0, 44.0, 70.0, 71.0, 138.0, 165.0, 318.0, 481.0, 772.0, 1411.0, 2662.0, 5556.0, 12726.0, 38588.0, 278339.0, 2982182.0, 770815.0, 66083.0, 18015.0, 7503.0, 3554.0, 1839.0, 1039.0, 584.0, 365.0, 247.0, 174.0, 111.0, 71.0, 50.0, 50.0, 31.0, 24.0, 18.0, 16.0, 14.0, 7.0, 9.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-15.4296875, -14.9425048828125, -14.455322265625, -13.9681396484375, -13.48095703125, -12.9937744140625, -12.506591796875, -12.0194091796875, -11.5322265625, -11.0450439453125, -10.557861328125, -10.0706787109375, -9.58349609375, -9.0963134765625, -8.609130859375, -8.1219482421875, -7.634765625, -7.1475830078125, -6.660400390625, -6.1732177734375, -5.68603515625, -5.1988525390625, -4.711669921875, -4.2244873046875, -3.7373046875, -3.2501220703125, -2.762939453125, -2.2757568359375, -1.78857421875, -1.3013916015625, -0.814208984375, -0.3270263671875, 0.16015625, 0.6473388671875, 1.134521484375, 1.6217041015625, 2.10888671875, 2.5960693359375, 3.083251953125, 3.5704345703125, 4.0576171875, 4.5447998046875, 5.031982421875, 5.5191650390625, 6.00634765625, 6.4935302734375, 6.980712890625, 7.4678955078125, 7.955078125, 8.4422607421875, 8.929443359375, 9.4166259765625, 9.90380859375, 10.3909912109375, 10.878173828125, 11.3653564453125, 11.8525390625, 12.3397216796875, 12.826904296875, 13.3140869140625, 13.80126953125, 14.2884521484375, 14.775634765625, 15.2628173828125, 15.75]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 9.0, 10.0, 16.0, 22.0, 31.0, 41.0, 53.0, 82.0, 117.0, 143.0, 256.0, 337.0, 469.0, 555.0, 528.0, 439.0, 323.0, 194.0, 126.0, 110.0, 62.0, 49.0, 28.0, 22.0, 15.0, 15.0, 8.0, 8.0, 1.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.40625, -20.86962890625, -20.3330078125, -19.79638671875, -19.259765625, -18.72314453125, -18.1865234375, -17.64990234375, -17.11328125, -16.57666015625, -16.0400390625, -15.50341796875, -14.966796875, -14.43017578125, -13.8935546875, -13.35693359375, -12.8203125, -12.28369140625, -11.7470703125, -11.21044921875, -10.673828125, -10.13720703125, -9.6005859375, -9.06396484375, -8.52734375, -7.99072265625, -7.4541015625, -6.91748046875, -6.380859375, -5.84423828125, -5.3076171875, -4.77099609375, -4.234375, -3.69775390625, -3.1611328125, -2.62451171875, -2.087890625, -1.55126953125, -1.0146484375, -0.47802734375, 0.05859375, 0.59521484375, 1.1318359375, 1.66845703125, 2.205078125, 2.74169921875, 3.2783203125, 3.81494140625, 4.3515625, 4.88818359375, 5.4248046875, 5.96142578125, 6.498046875, 7.03466796875, 7.5712890625, 8.10791015625, 8.64453125, 9.18115234375, 9.7177734375, 10.25439453125, 10.791015625, 11.32763671875, 11.8642578125, 12.40087890625, 12.9375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 11.0, 7.0, 11.0, 12.0, 19.0, 27.0, 33.0, 34.0, 61.0, 64.0, 115.0, 182.0, 285.0, 854.0, 6765.0, 3666562.0, 515396.0, 2512.0, 542.0, 271.0, 162.0, 118.0, 67.0, 52.0, 30.0, 30.0, 13.0, 10.0, 12.0, 8.0, 4.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.78125, -43.68505859375, -41.5888671875, -39.49267578125, -37.396484375, -35.30029296875, -33.2041015625, -31.10791015625, -29.01171875, -26.91552734375, -24.8193359375, -22.72314453125, -20.626953125, -18.53076171875, -16.4345703125, -14.33837890625, -12.2421875, -10.14599609375, -8.0498046875, -5.95361328125, -3.857421875, -1.76123046875, 0.3349609375, 2.43115234375, 4.52734375, 6.62353515625, 8.7197265625, 10.81591796875, 12.912109375, 15.00830078125, 17.1044921875, 19.20068359375, 21.296875, 23.39306640625, 25.4892578125, 27.58544921875, 29.681640625, 31.77783203125, 33.8740234375, 35.97021484375, 38.06640625, 40.16259765625, 42.2587890625, 44.35498046875, 46.451171875, 48.54736328125, 50.6435546875, 52.73974609375, 54.8359375, 56.93212890625, 59.0283203125, 61.12451171875, 63.220703125, 65.31689453125, 67.4130859375, 69.50927734375, 71.60546875, 73.70166015625, 75.7978515625, 77.89404296875, 79.990234375, 82.08642578125, 84.1826171875, 86.27880859375, 88.375]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 64.0, 780.0, 169.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.50341033935547, -53.95943069458008, -44.41545104980469, -34.87147521972656, -25.327495574951172, -15.783515930175781, -6.239540100097656, 3.304443359375, 12.848419189453125, 22.392398834228516, 31.936376571655273, 41.48035430908203, 51.02433395385742, 60.56831359863281, 70.11228942871094, 79.6562728881836, 89.20024871826172, 98.74422454833984, 108.2882080078125, 117.83218383789062, 127.37615966796875, 136.92013549804688, 146.464111328125, 156.0081024169922, 165.5520782470703, 175.09605407714844, 184.64002990722656, 194.18402099609375, 203.72799682617188, 213.27197265625, 222.81594848632812, 232.35992431640625, 241.90390014648438, 251.4478759765625, 260.9918518066406, 270.53582763671875, 280.0798034667969, 289.623779296875, 299.16778564453125, 308.7117614746094, 318.2557373046875, 327.7997131347656, 337.34368896484375, 346.8876647949219, 356.431640625, 365.97564697265625, 375.51959228515625, 385.0635986328125, 394.6075439453125, 404.1515197753906, 413.69549560546875, 423.2394714355469, 432.783447265625, 442.32745361328125, 451.87139892578125, 461.4154052734375, 470.9593811035156, 480.50335693359375, 490.0473327636719, 499.59130859375, 509.1352844238281, 518.6792602539062, 528.2232666015625, 537.7672119140625, 547.3112182617188]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 7.0, 4.0, 10.0, 8.0, 10.0, 11.0, 11.0, 20.0, 18.0, 15.0, 19.0, 29.0, 36.0, 24.0, 35.0, 31.0, 35.0, 34.0, 22.0, 40.0, 42.0, 29.0, 45.0, 33.0, 34.0, 31.0, 38.0, 30.0, 33.0, 31.0, 28.0, 16.0, 22.0, 22.0, 20.0, 15.0, 22.0, 10.0, 19.0, 7.0, 6.0, 2.0, 9.0, 6.0, 3.0, 9.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-42.270423889160156, -40.95475387573242, -39.63908386230469, -38.32341384887695, -37.00774383544922, -35.692073822021484, -34.37640380859375, -33.06072998046875, -31.74506187438965, -30.429391860961914, -29.11372184753418, -27.798051834106445, -26.482379913330078, -25.166709899902344, -23.85103988647461, -22.535369873046875, -21.21969985961914, -19.904029846191406, -18.588359832763672, -17.272689819335938, -15.957018852233887, -14.641348838806152, -13.325677871704102, -12.010007858276367, -10.694337844848633, -9.378667831420898, -8.062997817993164, -6.747326850891113, -5.431656837463379, -4.1159868240356445, -2.800316333770752, -1.4846458435058594, -0.168975830078125, 1.1466944217681885, 2.462364673614502, 3.7780349254608154, 5.093705177307129, 6.409375190734863, 7.725045680999756, 9.040716171264648, 10.356386184692383, 11.672056198120117, 12.987726211547852, 14.303397178649902, 15.619067192077637, 16.934738159179688, 18.250408172607422, 19.566078186035156, 20.88174819946289, 22.197418212890625, 23.51308822631836, 24.828758239746094, 26.144428253173828, 27.460098266601562, 28.77577018737793, 30.091440200805664, 31.4071102142334, 32.722782135009766, 34.0384521484375, 35.354122161865234, 36.66979217529297, 37.9854621887207, 39.30113220214844, 40.61680221557617, 41.932472229003906]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 6.0, 2.0, 2.0, 16.0, 15.0, 13.0, 23.0, 18.0, 6.0, 18.0, 24.0, 20.0, 27.0, 31.0, 30.0, 31.0, 44.0, 37.0, 43.0, 44.0, 34.0, 39.0, 52.0, 25.0, 32.0, 31.0, 30.0, 29.0, 24.0, 24.0, 30.0, 23.0, 32.0, 20.0, 19.0, 14.0, 11.0, 9.0, 12.0, 6.0, 8.0, 10.0, 8.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.25, -3.14715576171875, -3.0443115234375, -2.94146728515625, -2.838623046875, -2.73577880859375, -2.6329345703125, -2.53009033203125, -2.42724609375, -2.32440185546875, -2.2215576171875, -2.11871337890625, -2.015869140625, -1.91302490234375, -1.8101806640625, -1.70733642578125, -1.6044921875, -1.50164794921875, -1.3988037109375, -1.29595947265625, -1.193115234375, -1.09027099609375, -0.9874267578125, -0.88458251953125, -0.78173828125, -0.67889404296875, -0.5760498046875, -0.47320556640625, -0.370361328125, -0.26751708984375, -0.1646728515625, -0.06182861328125, 0.041015625, 0.14385986328125, 0.2467041015625, 0.34954833984375, 0.452392578125, 0.55523681640625, 0.6580810546875, 0.76092529296875, 0.86376953125, 0.96661376953125, 1.0694580078125, 1.17230224609375, 1.275146484375, 1.37799072265625, 1.4808349609375, 1.58367919921875, 1.6865234375, 1.78936767578125, 1.8922119140625, 1.99505615234375, 2.097900390625, 2.20074462890625, 2.3035888671875, 2.40643310546875, 2.50927734375, 2.61212158203125, 2.7149658203125, 2.81781005859375, 2.920654296875, 3.02349853515625, 3.1263427734375, 3.22918701171875, 3.33203125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 2.0, 5.0, 4.0, 12.0, 18.0, 36.0, 33.0, 38.0, 66.0, 122.0, 116.0, 172.0, 264.0, 380.0, 512.0, 698.0, 994.0, 1296.0, 1743.0, 2424.0, 3374.0, 4762.0, 6478.0, 9266.0, 13340.0, 18666.0, 27201.0, 41229.0, 64518.0, 107018.0, 256166.0, 203177.0, 98931.0, 59962.0, 38630.0, 25858.0, 17721.0, 12247.0, 8490.0, 6252.0, 4581.0, 3313.0, 2344.0, 1711.0, 1232.0, 931.0, 639.0, 453.0, 353.0, 220.0, 153.0, 129.0, 93.0, 50.0, 44.0, 34.0, 26.0, 17.0, 8.0, 7.0, 5.0, 2.0, 4.0], "bins": [-0.7900390625, -0.765289306640625, -0.74053955078125, -0.715789794921875, -0.6910400390625, -0.666290283203125, -0.64154052734375, -0.616790771484375, -0.592041015625, -0.567291259765625, -0.54254150390625, -0.517791748046875, -0.4930419921875, -0.468292236328125, -0.44354248046875, -0.418792724609375, -0.39404296875, -0.369293212890625, -0.34454345703125, -0.319793701171875, -0.2950439453125, -0.270294189453125, -0.24554443359375, -0.220794677734375, -0.196044921875, -0.171295166015625, -0.14654541015625, -0.121795654296875, -0.0970458984375, -0.072296142578125, -0.04754638671875, -0.022796630859375, 0.001953125, 0.026702880859375, 0.05145263671875, 0.076202392578125, 0.1009521484375, 0.125701904296875, 0.15045166015625, 0.175201416015625, 0.199951171875, 0.224700927734375, 0.24945068359375, 0.274200439453125, 0.2989501953125, 0.323699951171875, 0.34844970703125, 0.373199462890625, 0.39794921875, 0.422698974609375, 0.44744873046875, 0.472198486328125, 0.4969482421875, 0.521697998046875, 0.54644775390625, 0.571197509765625, 0.595947265625, 0.620697021484375, 0.64544677734375, 0.670196533203125, 0.6949462890625, 0.719696044921875, 0.74444580078125, 0.769195556640625, 0.7939453125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 10.0, 7.0, 8.0, 7.0, 6.0, 15.0, 18.0, 16.0, 20.0, 24.0, 27.0, 25.0, 26.0, 36.0, 42.0, 47.0, 54.0, 39.0, 44.0, 1060.0, 32.0, 42.0, 42.0, 34.0, 32.0, 23.0, 35.0, 30.0, 25.0, 28.0, 22.0, 23.0, 20.0, 19.0, 17.0, 16.0, 12.0, 11.0, 6.0, 5.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.23828125, -2.163482666015625, -2.08868408203125, -2.013885498046875, -1.9390869140625, -1.864288330078125, -1.78948974609375, -1.714691162109375, -1.639892578125, -1.565093994140625, -1.49029541015625, -1.415496826171875, -1.3406982421875, -1.265899658203125, -1.19110107421875, -1.116302490234375, -1.04150390625, -0.966705322265625, -0.89190673828125, -0.817108154296875, -0.7423095703125, -0.667510986328125, -0.59271240234375, -0.517913818359375, -0.443115234375, -0.368316650390625, -0.29351806640625, -0.218719482421875, -0.1439208984375, -0.069122314453125, 0.00567626953125, 0.080474853515625, 0.1552734375, 0.230072021484375, 0.30487060546875, 0.379669189453125, 0.4544677734375, 0.529266357421875, 0.60406494140625, 0.678863525390625, 0.753662109375, 0.828460693359375, 0.90325927734375, 0.978057861328125, 1.0528564453125, 1.127655029296875, 1.20245361328125, 1.277252197265625, 1.35205078125, 1.426849365234375, 1.50164794921875, 1.576446533203125, 1.6512451171875, 1.726043701171875, 1.80084228515625, 1.875640869140625, 1.950439453125, 2.025238037109375, 2.10003662109375, 2.174835205078125, 2.2496337890625, 2.324432373046875, 2.39923095703125, 2.474029541015625, 2.548828125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 0.0, 4.0, 4.0, 7.0, 8.0, 14.0, 20.0, 44.0, 38.0, 66.0, 97.0, 119.0, 212.0, 299.0, 457.0, 647.0, 1020.0, 1495.0, 2223.0, 3179.0, 4570.0, 6797.0, 10323.0, 15437.0, 23050.0, 35779.0, 55869.0, 91366.0, 174691.0, 1341643.0, 123395.0, 71856.0, 45241.0, 29295.0, 19148.0, 12478.0, 8482.0, 5762.0, 3910.0, 2559.0, 1819.0, 1209.0, 822.0, 536.0, 382.0, 241.0, 180.0, 122.0, 88.0, 46.0, 30.0, 23.0, 18.0, 8.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.86328125, -0.8347549438476562, -0.8062286376953125, -0.7777023315429688, -0.749176025390625, -0.7206497192382812, -0.6921234130859375, -0.6635971069335938, -0.63507080078125, -0.6065444946289062, -0.5780181884765625, -0.5494918823242188, -0.520965576171875, -0.49243927001953125, -0.4639129638671875, -0.43538665771484375, -0.4068603515625, -0.37833404541015625, -0.3498077392578125, -0.32128143310546875, -0.292755126953125, -0.26422882080078125, -0.2357025146484375, -0.20717620849609375, -0.17864990234375, -0.15012359619140625, -0.1215972900390625, -0.09307098388671875, -0.064544677734375, -0.03601837158203125, -0.0074920654296875, 0.02103424072265625, 0.049560546875, 0.07808685302734375, 0.1066131591796875, 0.13513946533203125, 0.163665771484375, 0.19219207763671875, 0.2207183837890625, 0.24924468994140625, 0.27777099609375, 0.30629730224609375, 0.3348236083984375, 0.36334991455078125, 0.391876220703125, 0.42040252685546875, 0.4489288330078125, 0.47745513916015625, 0.5059814453125, 0.5345077514648438, 0.5630340576171875, 0.5915603637695312, 0.620086669921875, 0.6486129760742188, 0.6771392822265625, 0.7056655883789062, 0.73419189453125, 0.7627182006835938, 0.7912445068359375, 0.8197708129882812, 0.848297119140625, 0.8768234252929688, 0.9053497314453125, 0.9338760375976562, 0.96240234375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 12.0, 15.0, 20.0, 30.0, 24.0, 27.0, 38.0, 39.0, 46.0, 57.0, 63.0, 73.0, 61.0, 75.0, 57.0, 49.0, 49.0, 44.0, 24.0, 29.0, 19.0, 12.0, 27.0, 18.0, 11.0, 12.0, 13.0, 3.0, 6.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00011473894119262695, -0.00011072959750890732, -0.00010672025382518768, -0.00010271091014146805, -9.870156645774841e-05, -9.469222277402878e-05, -9.068287909030914e-05, -8.667353540658951e-05, -8.266419172286987e-05, -7.865484803915024e-05, -7.46455043554306e-05, -7.063616067171097e-05, -6.662681698799133e-05, -6.26174733042717e-05, -5.860812962055206e-05, -5.459878593683243e-05, -5.058944225311279e-05, -4.658009856939316e-05, -4.257075488567352e-05, -3.856141120195389e-05, -3.455206751823425e-05, -3.054272383451462e-05, -2.6533380150794983e-05, -2.2524036467075348e-05, -1.8514692783355713e-05, -1.4505349099636078e-05, -1.0496005415916443e-05, -6.486661732196808e-06, -2.477318048477173e-06, 1.5320256352424622e-06, 5.541369318962097e-06, 9.550713002681732e-06, 1.3560056686401367e-05, 1.7569400370121002e-05, 2.1578744053840637e-05, 2.5588087737560272e-05, 2.9597431421279907e-05, 3.360677510499954e-05, 3.761611878871918e-05, 4.162546247243881e-05, 4.563480615615845e-05, 4.964414983987808e-05, 5.365349352359772e-05, 5.766283720731735e-05, 6.167218089103699e-05, 6.568152457475662e-05, 6.969086825847626e-05, 7.370021194219589e-05, 7.770955562591553e-05, 8.171889930963516e-05, 8.57282429933548e-05, 8.973758667707443e-05, 9.374693036079407e-05, 9.77562740445137e-05, 0.00010176561772823334, 0.00010577496141195297, 0.00010978430509567261, 0.00011379364877939224, 0.00011780299246311188, 0.00012181233614683151, 0.00012582167983055115, 0.00012983102351427078, 0.00013384036719799042, 0.00013784971088171005, 0.0001418590545654297]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 9.0, 16.0, 16.0, 21.0, 15.0, 28.0, 43.0, 59.0, 65.0, 104.0, 106.0, 169.0, 254.0, 549.0, 1401.0, 994990.0, 48751.0, 764.0, 388.0, 213.0, 142.0, 115.0, 98.0, 57.0, 43.0, 33.0, 14.0, 14.0, 12.0, 9.0, 10.0, 7.0, 6.0, 5.0, 5.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0030956268310546875, -0.003004014492034912, -0.0029124021530151367, -0.0028207898139953613, -0.002729177474975586, -0.0026375651359558105, -0.002545952796936035, -0.0024543404579162598, -0.0023627281188964844, -0.002271115779876709, -0.0021795034408569336, -0.002087891101837158, -0.001996278762817383, -0.0019046664237976074, -0.001813054084777832, -0.0017214417457580566, -0.0016298294067382812, -0.0015382170677185059, -0.0014466047286987305, -0.001354992389678955, -0.0012633800506591797, -0.0011717677116394043, -0.001080155372619629, -0.0009885430335998535, -0.0008969306945800781, -0.0008053183555603027, -0.0007137060165405273, -0.000622093677520752, -0.0005304813385009766, -0.00043886899948120117, -0.0003472566604614258, -0.0002556443214416504, -0.000164031982421875, -7.241964340209961e-05, 1.919269561767578e-05, 0.00011080503463745117, 0.00020241737365722656, 0.00029402971267700195, 0.00038564205169677734, 0.00047725439071655273, 0.0005688667297363281, 0.0006604790687561035, 0.0007520914077758789, 0.0008437037467956543, 0.0009353160858154297, 0.001026928424835205, 0.0011185407638549805, 0.0012101531028747559, 0.0013017654418945312, 0.0013933777809143066, 0.001484990119934082, 0.0015766024589538574, 0.0016682147979736328, 0.0017598271369934082, 0.0018514394760131836, 0.001943051815032959, 0.0020346641540527344, 0.0021262764930725098, 0.002217888832092285, 0.0023095011711120605, 0.002401113510131836, 0.0024927258491516113, 0.0025843381881713867, 0.002675950527191162, 0.0027675628662109375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 9.0, 44.0, 146.0, 341.0, 295.0, 145.0, 29.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.087855869438499e-05, -8.47978371893987e-05, -7.871711568441242e-05, -7.263638690346852e-05, -6.655566539848223e-05, -6.047494389349595e-05, -5.4394218750530854e-05, -4.831349360756576e-05, -4.2232772102579474e-05, -3.615205059759319e-05, -3.0071325454628095e-05, -2.3990602130652405e-05, -1.7909878806676716e-05, -1.1829155482701026e-05, -5.748432158725336e-06, 3.3229298423975706e-07, 6.413014489226043e-06, 1.2493737813201733e-05, 1.8574461137177423e-05, 2.4655184461153112e-05, 3.07359077851288e-05, 3.681662929011509e-05, 4.289735443308018e-05, 4.8978079576045275e-05, 5.505880108103156e-05, 6.113952258601785e-05, 6.722024409100413e-05, 7.330097287194803e-05, 7.938169437693432e-05, 8.54624158819206e-05, 9.15431446628645e-05, 9.762386616785079e-05, 0.00010370457312092185, 0.00010978529462590814, 0.00011586601613089442, 0.00012194674491183832, 0.000128027459140867, 0.0001341081951977685, 0.0001401889167027548, 0.00014626963820774108, 0.00015235035971272737, 0.00015843108121771365, 0.00016451180272269994, 0.00017059252422768623, 0.00017667326028458774, 0.00018275398178957403, 0.0001888347032945603, 0.0001949154247995466, 0.00020099614630453289, 0.00020707686780951917, 0.00021315758931450546, 0.00021923831081949174, 0.00022531903232447803, 0.00023139976838137954, 0.00023748048988636583, 0.00024356121139135212, 0.00024964194744825363, 0.0002557226689532399, 0.0002618033904582262, 0.0002678841119632125, 0.0002739648334681988, 0.00028004555497318506, 0.00028612627647817135, 0.00029220699798315763, 0.0002982877194881439]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 8.0, 4.0, 4.0, 3.0, 8.0, 13.0, 10.0, 7.0, 10.0, 21.0, 19.0, 28.0, 21.0, 25.0, 27.0, 41.0, 46.0, 33.0, 35.0, 50.0, 41.0, 50.0, 33.0, 37.0, 31.0, 27.0, 44.0, 31.0, 33.0, 26.0, 35.0, 35.0, 16.0, 22.0, 22.0, 16.0, 17.0, 14.0, 13.0, 11.0, 6.0, 6.0, 2.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.878376007080078e-05, -6.67748972773552e-05, -6.476603448390961e-05, -6.275717169046402e-05, -6.074830889701843e-05, -5.8739446103572845e-05, -5.673058331012726e-05, -5.472172051668167e-05, -5.2712857723236084e-05, -5.07039949297905e-05, -4.869513213634491e-05, -4.668626934289932e-05, -4.4677406549453735e-05, -4.266854375600815e-05, -4.065968096256256e-05, -3.8650818169116974e-05, -3.664195537567139e-05, -3.46330925822258e-05, -3.262422978878021e-05, -3.0615366995334625e-05, -2.8606504201889038e-05, -2.659764140844345e-05, -2.4588778614997864e-05, -2.2579915821552277e-05, -2.057105302810669e-05, -1.8562190234661102e-05, -1.6553327441215515e-05, -1.4544464647769928e-05, -1.253560185432434e-05, -1.0526739060878754e-05, -8.517876267433167e-06, -6.509013473987579e-06, -4.500150680541992e-06, -2.491287887096405e-06, -4.824250936508179e-07, 1.5264376997947693e-06, 3.5353004932403564e-06, 5.544163286685944e-06, 7.553026080131531e-06, 9.561888873577118e-06, 1.1570751667022705e-05, 1.3579614460468292e-05, 1.558847725391388e-05, 1.7597340047359467e-05, 1.9606202840805054e-05, 2.161506563425064e-05, 2.3623928427696228e-05, 2.5632791221141815e-05, 2.7641654014587402e-05, 2.965051680803299e-05, 3.165937960147858e-05, 3.3668242394924164e-05, 3.567710518836975e-05, 3.768596798181534e-05, 3.9694830775260925e-05, 4.170369356870651e-05, 4.37125563621521e-05, 4.572141915559769e-05, 4.7730281949043274e-05, 4.973914474248886e-05, 5.174800753593445e-05, 5.3756870329380035e-05, 5.576573312282562e-05, 5.777459591627121e-05, 5.97834587097168e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 6.0, 2.0, 2.0, 16.0, 15.0, 13.0, 23.0, 18.0, 6.0, 18.0, 24.0, 20.0, 27.0, 31.0, 30.0, 31.0, 44.0, 37.0, 43.0, 44.0, 34.0, 39.0, 52.0, 25.0, 32.0, 31.0, 30.0, 29.0, 24.0, 24.0, 30.0, 23.0, 32.0, 20.0, 19.0, 14.0, 11.0, 9.0, 12.0, 6.0, 8.0, 10.0, 8.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.25, -3.14715576171875, -3.0443115234375, -2.94146728515625, -2.838623046875, -2.73577880859375, -2.6329345703125, -2.53009033203125, -2.42724609375, -2.32440185546875, -2.2215576171875, -2.11871337890625, -2.015869140625, -1.91302490234375, -1.8101806640625, -1.70733642578125, -1.6044921875, -1.50164794921875, -1.3988037109375, -1.29595947265625, -1.193115234375, -1.09027099609375, -0.9874267578125, -0.88458251953125, -0.78173828125, -0.67889404296875, -0.5760498046875, -0.47320556640625, -0.370361328125, -0.26751708984375, -0.1646728515625, -0.06182861328125, 0.041015625, 0.14385986328125, 0.2467041015625, 0.34954833984375, 0.452392578125, 0.55523681640625, 0.6580810546875, 0.76092529296875, 0.86376953125, 0.96661376953125, 1.0694580078125, 1.17230224609375, 1.275146484375, 1.37799072265625, 1.4808349609375, 1.58367919921875, 1.6865234375, 1.78936767578125, 1.8922119140625, 1.99505615234375, 2.097900390625, 2.20074462890625, 2.3035888671875, 2.40643310546875, 2.50927734375, 2.61212158203125, 2.7149658203125, 2.81781005859375, 2.920654296875, 3.02349853515625, 3.1263427734375, 3.22918701171875, 3.33203125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 10.0, 11.0, 7.0, 11.0, 17.0, 33.0, 45.0, 48.0, 76.0, 97.0, 106.0, 193.0, 240.0, 382.0, 536.0, 958.0, 1571.0, 2864.0, 5414.0, 11324.0, 25337.0, 60278.0, 144792.0, 276952.0, 272063.0, 139933.0, 57820.0, 24250.0, 10893.0, 5277.0, 2753.0, 1478.0, 927.0, 550.0, 391.0, 248.0, 186.0, 126.0, 98.0, 69.0, 50.0, 40.0, 26.0, 19.0, 16.0, 9.0, 9.0, 7.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.921875, -3.802947998046875, -3.68402099609375, -3.565093994140625, -3.4461669921875, -3.327239990234375, -3.20831298828125, -3.089385986328125, -2.970458984375, -2.851531982421875, -2.73260498046875, -2.613677978515625, -2.4947509765625, -2.375823974609375, -2.25689697265625, -2.137969970703125, -2.01904296875, -1.900115966796875, -1.78118896484375, -1.662261962890625, -1.5433349609375, -1.424407958984375, -1.30548095703125, -1.186553955078125, -1.067626953125, -0.948699951171875, -0.82977294921875, -0.710845947265625, -0.5919189453125, -0.472991943359375, -0.35406494140625, -0.235137939453125, -0.1162109375, 0.002716064453125, 0.12164306640625, 0.240570068359375, 0.3594970703125, 0.478424072265625, 0.59735107421875, 0.716278076171875, 0.835205078125, 0.954132080078125, 1.07305908203125, 1.191986083984375, 1.3109130859375, 1.429840087890625, 1.54876708984375, 1.667694091796875, 1.78662109375, 1.905548095703125, 2.02447509765625, 2.143402099609375, 2.2623291015625, 2.381256103515625, 2.50018310546875, 2.619110107421875, 2.738037109375, 2.856964111328125, 2.97589111328125, 3.094818115234375, 3.2137451171875, 3.332672119140625, 3.45159912109375, 3.570526123046875, 3.689453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 9.0, 4.0, 5.0, 11.0, 19.0, 10.0, 11.0, 9.0, 22.0, 20.0, 31.0, 27.0, 29.0, 29.0, 30.0, 49.0, 36.0, 76.0, 114.0, 257.0, 1425.0, 243.0, 105.0, 75.0, 60.0, 44.0, 45.0, 40.0, 32.0, 22.0, 21.0, 18.0, 17.0, 18.0, 17.0, 17.0, 12.0, 15.0, 3.0, 4.0, 12.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.875, -13.483642578125, -13.09228515625, -12.700927734375, -12.3095703125, -11.918212890625, -11.52685546875, -11.135498046875, -10.744140625, -10.352783203125, -9.96142578125, -9.570068359375, -9.1787109375, -8.787353515625, -8.39599609375, -8.004638671875, -7.61328125, -7.221923828125, -6.83056640625, -6.439208984375, -6.0478515625, -5.656494140625, -5.26513671875, -4.873779296875, -4.482421875, -4.091064453125, -3.69970703125, -3.308349609375, -2.9169921875, -2.525634765625, -2.13427734375, -1.742919921875, -1.3515625, -0.960205078125, -0.56884765625, -0.177490234375, 0.2138671875, 0.605224609375, 0.99658203125, 1.387939453125, 1.779296875, 2.170654296875, 2.56201171875, 2.953369140625, 3.3447265625, 3.736083984375, 4.12744140625, 4.518798828125, 4.91015625, 5.301513671875, 5.69287109375, 6.084228515625, 6.4755859375, 6.866943359375, 7.25830078125, 7.649658203125, 8.041015625, 8.432373046875, 8.82373046875, 9.215087890625, 9.6064453125, 9.997802734375, 10.38916015625, 10.780517578125, 11.171875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 6.0, 0.0, 4.0, 4.0, 5.0, 12.0, 7.0, 8.0, 15.0, 15.0, 16.0, 15.0, 21.0, 27.0, 34.0, 29.0, 48.0, 71.0, 102.0, 160.0, 295.0, 643.0, 2562.0, 115445.0, 2995505.0, 27837.0, 1603.0, 504.0, 210.0, 138.0, 91.0, 49.0, 44.0, 30.0, 36.0, 13.0, 21.0, 11.0, 11.0, 19.0, 15.0, 6.0, 7.0, 8.0, 7.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.703125, -21.87353515625, -21.0439453125, -20.21435546875, -19.384765625, -18.55517578125, -17.7255859375, -16.89599609375, -16.06640625, -15.23681640625, -14.4072265625, -13.57763671875, -12.748046875, -11.91845703125, -11.0888671875, -10.25927734375, -9.4296875, -8.60009765625, -7.7705078125, -6.94091796875, -6.111328125, -5.28173828125, -4.4521484375, -3.62255859375, -2.79296875, -1.96337890625, -1.1337890625, -0.30419921875, 0.525390625, 1.35498046875, 2.1845703125, 3.01416015625, 3.84375, 4.67333984375, 5.5029296875, 6.33251953125, 7.162109375, 7.99169921875, 8.8212890625, 9.65087890625, 10.48046875, 11.31005859375, 12.1396484375, 12.96923828125, 13.798828125, 14.62841796875, 15.4580078125, 16.28759765625, 17.1171875, 17.94677734375, 18.7763671875, 19.60595703125, 20.435546875, 21.26513671875, 22.0947265625, 22.92431640625, 23.75390625, 24.58349609375, 25.4130859375, 26.24267578125, 27.072265625, 27.90185546875, 28.7314453125, 29.56103515625, 30.390625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 42.0, 949.0, 25.0, 0.0, 1.0], "bins": [-371.7919006347656, -365.6394348144531, -359.48699951171875, -353.33453369140625, -347.1820983886719, -341.0296325683594, -334.877197265625, -328.7247314453125, -322.5722961425781, -316.4198303222656, -310.26739501953125, -304.11492919921875, -297.9624938964844, -291.8100280761719, -285.6575927734375, -279.505126953125, -273.3526916503906, -267.2002258300781, -261.04779052734375, -254.8953399658203, -248.74288940429688, -242.59043884277344, -236.43798828125, -230.28553771972656, -224.13307189941406, -217.98062133789062, -211.8281707763672, -205.67572021484375, -199.5232696533203, -193.37081909179688, -187.21836853027344, -181.06591796875, -174.91348266601562, -168.7610321044922, -162.60858154296875, -156.4561309814453, -150.30368041992188, -144.15122985839844, -137.998779296875, -131.84632873535156, -125.6938705444336, -119.54141998291016, -113.38896942138672, -107.23651885986328, -101.08406829833984, -94.9316177368164, -88.77915954589844, -82.626708984375, -76.47425842285156, -70.32180786132812, -64.16935729980469, -58.01690673828125, -51.86445617675781, -45.712005615234375, -39.55955123901367, -33.407100677490234, -27.25465202331543, -21.102201461791992, -14.949749946594238, -8.797298431396484, -2.644847869873047, 3.5076026916503906, 9.660055160522461, 15.812505722045898, 21.964956283569336]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 4.0, 4.0, 7.0, 5.0, 10.0, 12.0, 23.0, 17.0, 14.0, 21.0, 28.0, 20.0, 29.0, 35.0, 31.0, 36.0, 38.0, 48.0, 39.0, 48.0, 39.0, 36.0, 44.0, 46.0, 32.0, 39.0, 44.0, 27.0, 27.0, 26.0, 22.0, 15.0, 29.0, 17.0, 12.0, 15.0, 15.0, 8.0, 4.0, 7.0, 6.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.935726165771484, -38.70370864868164, -37.4716911315918, -36.23966979980469, -35.007652282714844, -33.775634765625, -32.543617248535156, -31.311599731445312, -30.079580307006836, -28.847562789916992, -27.615543365478516, -26.383525848388672, -25.151508331298828, -23.91948890686035, -22.687471389770508, -21.45545196533203, -20.223434448242188, -18.991416931152344, -17.759397506713867, -16.527379989624023, -15.295361518859863, -14.063343048095703, -12.83132553100586, -11.5993070602417, -10.367288589477539, -9.135270118713379, -7.903252124786377, -6.671234130859375, -5.439215660095215, -4.207197189331055, -2.9751791954040527, -1.7431612014770508, -0.5111465454101562, 0.7208716869354248, 1.9528899192810059, 3.184908151626587, 4.416926383972168, 5.648944854736328, 6.88096284866333, 8.112980842590332, 9.344999313354492, 10.577017784118652, 11.809036254882812, 13.041053771972656, 14.273072242736816, 15.505090713500977, 16.73710823059082, 17.969127655029297, 19.20114517211914, 20.433162689208984, 21.66518211364746, 22.897199630737305, 24.12921905517578, 25.361236572265625, 26.59325408935547, 27.825271606445312, 29.05729103088379, 30.289308547973633, 31.52132797241211, 32.75334548950195, 33.9853630065918, 35.217384338378906, 36.44940185546875, 37.681419372558594, 38.91343688964844]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 9.0, 12.0, 13.0, 16.0, 14.0, 15.0, 19.0, 15.0, 18.0, 23.0, 28.0, 19.0, 34.0, 27.0, 29.0, 47.0, 39.0, 39.0, 37.0, 35.0, 49.0, 45.0, 29.0, 33.0, 34.0, 31.0, 22.0, 32.0, 25.0, 29.0, 13.0, 24.0, 24.0, 21.0, 15.0, 10.0, 8.0, 8.0, 9.0, 8.0, 7.0, 7.0, 7.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.33984375, -3.23284912109375, -3.1258544921875, -3.01885986328125, -2.911865234375, -2.80487060546875, -2.6978759765625, -2.59088134765625, -2.48388671875, -2.37689208984375, -2.2698974609375, -2.16290283203125, -2.055908203125, -1.94891357421875, -1.8419189453125, -1.73492431640625, -1.6279296875, -1.52093505859375, -1.4139404296875, -1.30694580078125, -1.199951171875, -1.09295654296875, -0.9859619140625, -0.87896728515625, -0.77197265625, -0.66497802734375, -0.5579833984375, -0.45098876953125, -0.343994140625, -0.23699951171875, -0.1300048828125, -0.02301025390625, 0.083984375, 0.19097900390625, 0.2979736328125, 0.40496826171875, 0.511962890625, 0.61895751953125, 0.7259521484375, 0.83294677734375, 0.93994140625, 1.04693603515625, 1.1539306640625, 1.26092529296875, 1.367919921875, 1.47491455078125, 1.5819091796875, 1.68890380859375, 1.7958984375, 1.90289306640625, 2.0098876953125, 2.11688232421875, 2.223876953125, 2.33087158203125, 2.4378662109375, 2.54486083984375, 2.65185546875, 2.75885009765625, 2.8658447265625, 2.97283935546875, 3.079833984375, 3.18682861328125, 3.2938232421875, 3.40081787109375, 3.5078125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 4.0, 8.0, 7.0, 8.0, 11.0, 22.0, 24.0, 27.0, 37.0, 39.0, 52.0, 66.0, 109.0, 171.0, 334.0, 781.0, 2591.0, 16538.0, 289811.0, 2990276.0, 848806.0, 38028.0, 4293.0, 1102.0, 412.0, 223.0, 94.0, 87.0, 67.0, 49.0, 54.0, 24.0, 24.0, 15.0, 17.0, 11.0, 12.0, 6.0, 5.0, 3.0, 10.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-13.9296875, -13.5032958984375, -13.076904296875, -12.6505126953125, -12.22412109375, -11.7977294921875, -11.371337890625, -10.9449462890625, -10.5185546875, -10.0921630859375, -9.665771484375, -9.2393798828125, -8.81298828125, -8.3865966796875, -7.960205078125, -7.5338134765625, -7.107421875, -6.6810302734375, -6.254638671875, -5.8282470703125, -5.40185546875, -4.9754638671875, -4.549072265625, -4.1226806640625, -3.6962890625, -3.2698974609375, -2.843505859375, -2.4171142578125, -1.99072265625, -1.5643310546875, -1.137939453125, -0.7115478515625, -0.28515625, 0.1412353515625, 0.567626953125, 0.9940185546875, 1.42041015625, 1.8468017578125, 2.273193359375, 2.6995849609375, 3.1259765625, 3.5523681640625, 3.978759765625, 4.4051513671875, 4.83154296875, 5.2579345703125, 5.684326171875, 6.1107177734375, 6.537109375, 6.9635009765625, 7.389892578125, 7.8162841796875, 8.24267578125, 8.6690673828125, 9.095458984375, 9.5218505859375, 9.9482421875, 10.3746337890625, 10.801025390625, 11.2274169921875, 11.65380859375, 12.0802001953125, 12.506591796875, 12.9329833984375, 13.359375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 4.0, 10.0, 14.0, 18.0, 26.0, 40.0, 60.0, 81.0, 131.0, 168.0, 221.0, 316.0, 444.0, 506.0, 541.0, 433.0, 293.0, 232.0, 155.0, 118.0, 75.0, 63.0, 36.0, 35.0, 16.0, 9.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.585693359375, -16.12451171875, -15.663330078125, -15.2021484375, -14.740966796875, -14.27978515625, -13.818603515625, -13.357421875, -12.896240234375, -12.43505859375, -11.973876953125, -11.5126953125, -11.051513671875, -10.59033203125, -10.129150390625, -9.66796875, -9.206787109375, -8.74560546875, -8.284423828125, -7.8232421875, -7.362060546875, -6.90087890625, -6.439697265625, -5.978515625, -5.517333984375, -5.05615234375, -4.594970703125, -4.1337890625, -3.672607421875, -3.21142578125, -2.750244140625, -2.2890625, -1.827880859375, -1.36669921875, -0.905517578125, -0.4443359375, 0.016845703125, 0.47802734375, 0.939208984375, 1.400390625, 1.861572265625, 2.32275390625, 2.783935546875, 3.2451171875, 3.706298828125, 4.16748046875, 4.628662109375, 5.08984375, 5.551025390625, 6.01220703125, 6.473388671875, 6.9345703125, 7.395751953125, 7.85693359375, 8.318115234375, 8.779296875, 9.240478515625, 9.70166015625, 10.162841796875, 10.6240234375, 11.085205078125, 11.54638671875, 12.007568359375, 12.46875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 13.0, 21.0, 25.0, 34.0, 65.0, 106.0, 160.0, 305.0, 703.0, 2678.0, 114570.0, 4006486.0, 65466.0, 2268.0, 624.0, 280.0, 163.0, 110.0, 65.0, 46.0, 17.0, 23.0, 11.0, 10.0, 8.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.9375, -29.4248046875, -27.912109375, -26.3994140625, -24.88671875, -23.3740234375, -21.861328125, -20.3486328125, -18.8359375, -17.3232421875, -15.810546875, -14.2978515625, -12.78515625, -11.2724609375, -9.759765625, -8.2470703125, -6.734375, -5.2216796875, -3.708984375, -2.1962890625, -0.68359375, 0.8291015625, 2.341796875, 3.8544921875, 5.3671875, 6.8798828125, 8.392578125, 9.9052734375, 11.41796875, 12.9306640625, 14.443359375, 15.9560546875, 17.46875, 18.9814453125, 20.494140625, 22.0068359375, 23.51953125, 25.0322265625, 26.544921875, 28.0576171875, 29.5703125, 31.0830078125, 32.595703125, 34.1083984375, 35.62109375, 37.1337890625, 38.646484375, 40.1591796875, 41.671875, 43.1845703125, 44.697265625, 46.2099609375, 47.72265625, 49.2353515625, 50.748046875, 52.2607421875, 53.7734375, 55.2861328125, 56.798828125, 58.3115234375, 59.82421875, 61.3369140625, 62.849609375, 64.3623046875, 65.875]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 19.0, 14.0, 24.0, 42.0, 42.0, 60.0, 91.0, 88.0, 96.0, 80.0, 99.0, 82.0, 81.0, 56.0, 48.0, 41.0, 15.0, 12.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.902835845947266, -35.79629898071289, -34.68975830078125, -33.583221435546875, -32.476680755615234, -31.370141983032227, -30.26360321044922, -29.157066345214844, -28.050525665283203, -26.943986892700195, -25.837448120117188, -24.73090934753418, -23.624370574951172, -22.517831802368164, -21.411293029785156, -20.30475616455078, -19.198217391967773, -18.091678619384766, -16.985139846801758, -15.87860107421875, -14.772062301635742, -13.665523529052734, -12.558985710144043, -11.452446937561035, -10.345908164978027, -9.23936939239502, -8.132830619812012, -7.026292324066162, -5.919753551483154, -4.8132147789001465, -3.706676483154297, -2.600137710571289, -1.4935989379882812, -0.387060284614563, 0.7194783687591553, 1.826016902923584, 2.932555675506592, 4.0390944480896, 5.145632743835449, 6.252171516418457, 7.358710289001465, 8.465249061584473, 9.57178783416748, 10.678325653076172, 11.78486442565918, 12.891403198242188, 13.997941970825195, 15.104480743408203, 16.21101951599121, 17.31755828857422, 18.424097061157227, 19.530635833740234, 20.637174606323242, 21.74371337890625, 22.850250244140625, 23.956790924072266, 25.06332778930664, 26.16986656188965, 27.276405334472656, 28.382944107055664, 29.489482879638672, 30.59602165222168, 31.702560424804688, 32.80909729003906, 33.9156379699707]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 8.0, 3.0, 6.0, 10.0, 8.0, 18.0, 20.0, 21.0, 16.0, 26.0, 25.0, 25.0, 38.0, 31.0, 32.0, 26.0, 40.0, 46.0, 44.0, 41.0, 54.0, 37.0, 35.0, 34.0, 37.0, 43.0, 28.0, 38.0, 35.0, 27.0, 30.0, 25.0, 14.0, 21.0, 12.0, 7.0, 9.0, 16.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.34829330444336, -39.93910598754883, -38.5299186706543, -37.120731353759766, -35.711544036865234, -34.3023567199707, -32.893165588378906, -31.483980178833008, -30.074792861938477, -28.665605545043945, -27.256418228149414, -25.84722900390625, -24.43804168701172, -23.028854370117188, -21.619667053222656, -20.210479736328125, -18.801292419433594, -17.392105102539062, -15.982917785644531, -14.573729515075684, -13.164542198181152, -11.755354881286621, -10.346166610717773, -8.936979293823242, -7.527791976928711, -6.11860466003418, -4.70941686630249, -3.300229072570801, -1.8910417556762695, -0.4818544387817383, 0.9273338317871094, 2.3365211486816406, 3.7457122802734375, 5.154899597167969, 6.564087390899658, 7.973275184631348, 9.382462501525879, 10.79164981842041, 12.200838088989258, 13.610025405883789, 15.01921272277832, 16.42840003967285, 17.837587356567383, 19.246776580810547, 20.655963897705078, 22.06515121459961, 23.47433853149414, 24.883525848388672, 26.292713165283203, 27.701900482177734, 29.111087799072266, 30.520275115966797, 31.929462432861328, 33.33864974975586, 34.747840881347656, 36.15702819824219, 37.56621551513672, 38.97540283203125, 40.38459014892578, 41.79377746582031, 43.202964782714844, 44.612152099609375, 46.021339416503906, 47.43052673339844, 48.83971405029297]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 9.0, 4.0, 10.0, 8.0, 10.0, 8.0, 13.0, 7.0, 12.0, 23.0, 18.0, 12.0, 32.0, 23.0, 25.0, 35.0, 29.0, 35.0, 46.0, 50.0, 38.0, 33.0, 46.0, 35.0, 37.0, 35.0, 35.0, 38.0, 35.0, 25.0, 25.0, 31.0, 23.0, 26.0, 10.0, 23.0, 19.0, 15.0, 14.0, 8.0, 8.0, 6.0, 3.0, 8.0, 6.0, 4.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.740234375, -3.625640869140625, -3.51104736328125, -3.396453857421875, -3.2818603515625, -3.167266845703125, -3.05267333984375, -2.938079833984375, -2.823486328125, -2.708892822265625, -2.59429931640625, -2.479705810546875, -2.3651123046875, -2.250518798828125, -2.13592529296875, -2.021331787109375, -1.90673828125, -1.792144775390625, -1.67755126953125, -1.562957763671875, -1.4483642578125, -1.333770751953125, -1.21917724609375, -1.104583740234375, -0.989990234375, -0.875396728515625, -0.76080322265625, -0.646209716796875, -0.5316162109375, -0.417022705078125, -0.30242919921875, -0.187835693359375, -0.0732421875, 0.041351318359375, 0.15594482421875, 0.270538330078125, 0.3851318359375, 0.499725341796875, 0.61431884765625, 0.728912353515625, 0.843505859375, 0.958099365234375, 1.07269287109375, 1.187286376953125, 1.3018798828125, 1.416473388671875, 1.53106689453125, 1.645660400390625, 1.76025390625, 1.874847412109375, 1.98944091796875, 2.104034423828125, 2.2186279296875, 2.333221435546875, 2.44781494140625, 2.562408447265625, 2.677001953125, 2.791595458984375, 2.90618896484375, 3.020782470703125, 3.1353759765625, 3.249969482421875, 3.36456298828125, 3.479156494140625, 3.59375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 5.0, 10.0, 18.0, 21.0, 40.0, 47.0, 71.0, 90.0, 153.0, 208.0, 311.0, 384.0, 528.0, 769.0, 1046.0, 1504.0, 2107.0, 2929.0, 4087.0, 5725.0, 7937.0, 11207.0, 16164.0, 23541.0, 33897.0, 51865.0, 84670.0, 153878.0, 291938.0, 130878.0, 73617.0, 46370.0, 30945.0, 20790.0, 14718.0, 10530.0, 7288.0, 5183.0, 3692.0, 2696.0, 1919.0, 1363.0, 964.0, 707.0, 502.0, 381.0, 266.0, 191.0, 127.0, 98.0, 65.0, 46.0, 22.0, 21.0, 17.0, 10.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.87646484375, -0.8485260009765625, -0.820587158203125, -0.7926483154296875, -0.76470947265625, -0.7367706298828125, -0.708831787109375, -0.6808929443359375, -0.6529541015625, -0.6250152587890625, -0.597076416015625, -0.5691375732421875, -0.54119873046875, -0.5132598876953125, -0.485321044921875, -0.4573822021484375, -0.429443359375, -0.4015045166015625, -0.373565673828125, -0.3456268310546875, -0.31768798828125, -0.2897491455078125, -0.261810302734375, -0.2338714599609375, -0.2059326171875, -0.1779937744140625, -0.150054931640625, -0.1221160888671875, -0.09417724609375, -0.0662384033203125, -0.038299560546875, -0.0103607177734375, 0.017578125, 0.0455169677734375, 0.073455810546875, 0.1013946533203125, 0.12933349609375, 0.1572723388671875, 0.185211181640625, 0.2131500244140625, 0.2410888671875, 0.2690277099609375, 0.296966552734375, 0.3249053955078125, 0.35284423828125, 0.3807830810546875, 0.408721923828125, 0.4366607666015625, 0.464599609375, 0.4925384521484375, 0.520477294921875, 0.5484161376953125, 0.57635498046875, 0.6042938232421875, 0.632232666015625, 0.6601715087890625, 0.6881103515625, 0.7160491943359375, 0.743988037109375, 0.7719268798828125, 0.79986572265625, 0.8278045654296875, 0.855743408203125, 0.8836822509765625, 0.91162109375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 7.0, 8.0, 3.0, 13.0, 14.0, 15.0, 20.0, 20.0, 21.0, 22.0, 29.0, 31.0, 35.0, 39.0, 39.0, 44.0, 57.0, 37.0, 1052.0, 39.0, 51.0, 50.0, 46.0, 48.0, 29.0, 40.0, 28.0, 29.0, 18.0, 19.0, 24.0, 19.0, 10.0, 13.0, 10.0, 9.0, 6.0, 6.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.453125, -2.37060546875, -2.2880859375, -2.20556640625, -2.123046875, -2.04052734375, -1.9580078125, -1.87548828125, -1.79296875, -1.71044921875, -1.6279296875, -1.54541015625, -1.462890625, -1.38037109375, -1.2978515625, -1.21533203125, -1.1328125, -1.05029296875, -0.9677734375, -0.88525390625, -0.802734375, -0.72021484375, -0.6376953125, -0.55517578125, -0.47265625, -0.39013671875, -0.3076171875, -0.22509765625, -0.142578125, -0.06005859375, 0.0224609375, 0.10498046875, 0.1875, 0.27001953125, 0.3525390625, 0.43505859375, 0.517578125, 0.60009765625, 0.6826171875, 0.76513671875, 0.84765625, 0.93017578125, 1.0126953125, 1.09521484375, 1.177734375, 1.26025390625, 1.3427734375, 1.42529296875, 1.5078125, 1.59033203125, 1.6728515625, 1.75537109375, 1.837890625, 1.92041015625, 2.0029296875, 2.08544921875, 2.16796875, 2.25048828125, 2.3330078125, 2.41552734375, 2.498046875, 2.58056640625, 2.6630859375, 2.74560546875, 2.828125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 3.0, 8.0, 5.0, 15.0, 22.0, 20.0, 54.0, 57.0, 106.0, 151.0, 247.0, 350.0, 576.0, 788.0, 1168.0, 1673.0, 2618.0, 3694.0, 5801.0, 8552.0, 13183.0, 20213.0, 32419.0, 52329.0, 89079.0, 175469.0, 1358702.0, 134339.0, 73282.0, 43702.0, 27561.0, 17211.0, 11290.0, 7447.0, 4923.0, 3258.0, 2170.0, 1557.0, 1058.0, 671.0, 466.0, 300.0, 199.0, 136.0, 98.0, 63.0, 39.0, 27.0, 16.0, 13.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95751953125, -0.9259414672851562, -0.8943634033203125, -0.8627853393554688, -0.831207275390625, -0.7996292114257812, -0.7680511474609375, -0.7364730834960938, -0.70489501953125, -0.6733169555664062, -0.6417388916015625, -0.6101608276367188, -0.578582763671875, -0.5470046997070312, -0.5154266357421875, -0.48384857177734375, -0.4522705078125, -0.42069244384765625, -0.3891143798828125, -0.35753631591796875, -0.325958251953125, -0.29438018798828125, -0.2628021240234375, -0.23122406005859375, -0.19964599609375, -0.16806793212890625, -0.1364898681640625, -0.10491180419921875, -0.073333740234375, -0.04175567626953125, -0.0101776123046875, 0.02140045166015625, 0.052978515625, 0.08455657958984375, 0.1161346435546875, 0.14771270751953125, 0.179290771484375, 0.21086883544921875, 0.2424468994140625, 0.27402496337890625, 0.30560302734375, 0.33718109130859375, 0.3687591552734375, 0.40033721923828125, 0.431915283203125, 0.46349334716796875, 0.4950714111328125, 0.5266494750976562, 0.5582275390625, 0.5898056030273438, 0.6213836669921875, 0.6529617309570312, 0.684539794921875, 0.7161178588867188, 0.7476959228515625, 0.7792739868164062, 0.81085205078125, 0.8424301147460938, 0.8740081787109375, 0.9055862426757812, 0.937164306640625, 0.9687423706054688, 1.0003204345703125, 1.0318984985351562, 1.0634765625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 11.0, 7.0, 9.0, 6.0, 9.0, 23.0, 20.0, 17.0, 29.0, 36.0, 27.0, 41.0, 32.0, 37.0, 48.0, 64.0, 68.0, 67.0, 52.0, 64.0, 55.0, 37.0, 37.0, 29.0, 34.0, 19.0, 21.0, 23.0, 22.0, 10.0, 6.0, 4.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00016391277313232422, -0.0001583937555551529, -0.00015287473797798157, -0.00014735572040081024, -0.00014183670282363892, -0.0001363176852464676, -0.00013079866766929626, -0.00012527965009212494, -0.00011976063251495361, -0.00011424161493778229, -0.00010872259736061096, -0.00010320357978343964, -9.768456220626831e-05, -9.216554462909698e-05, -8.664652705192566e-05, -8.112750947475433e-05, -7.560849189758301e-05, -7.008947432041168e-05, -6.457045674324036e-05, -5.905143916606903e-05, -5.3532421588897705e-05, -4.801340401172638e-05, -4.2494386434555054e-05, -3.697536885738373e-05, -3.14563512802124e-05, -2.5937333703041077e-05, -2.041831612586975e-05, -1.4899298548698425e-05, -9.3802809715271e-06, -3.861263394355774e-06, 1.6577541828155518e-06, 7.1767717599868774e-06, 1.2695789337158203e-05, 1.821480691432953e-05, 2.3733824491500854e-05, 2.925284206867218e-05, 3.4771859645843506e-05, 4.029087722301483e-05, 4.580989480018616e-05, 5.132891237735748e-05, 5.684792995452881e-05, 6.236694753170013e-05, 6.788596510887146e-05, 7.340498268604279e-05, 7.892400026321411e-05, 8.444301784038544e-05, 8.996203541755676e-05, 9.548105299472809e-05, 0.00010100007057189941, 0.00010651908814907074, 0.00011203810572624207, 0.00011755712330341339, 0.00012307614088058472, 0.00012859515845775604, 0.00013411417603492737, 0.0001396331936120987, 0.00014515221118927002, 0.00015067122876644135, 0.00015619024634361267, 0.000161709263920784, 0.00016722828149795532, 0.00017274729907512665, 0.00017826631665229797, 0.0001837853342294693, 0.00018930435180664062]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 5.0, 6.0, 13.0, 16.0, 17.0, 30.0, 37.0, 57.0, 62.0, 81.0, 103.0, 169.0, 236.0, 449.0, 1205.0, 1001830.0, 42440.0, 694.0, 323.0, 228.0, 146.0, 119.0, 61.0, 52.0, 40.0, 28.0, 23.0, 13.0, 11.0, 14.0, 5.0, 8.0, 8.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0044403076171875, -0.004316240549087524, -0.004192173480987549, -0.004068106412887573, -0.003944039344787598, -0.003819972276687622, -0.0036959052085876465, -0.003571838140487671, -0.0034477710723876953, -0.0033237040042877197, -0.003199636936187744, -0.0030755698680877686, -0.002951502799987793, -0.0028274357318878174, -0.002703368663787842, -0.002579301595687866, -0.0024552345275878906, -0.002331167459487915, -0.0022071003913879395, -0.002083033323287964, -0.0019589662551879883, -0.0018348991870880127, -0.0017108321189880371, -0.0015867650508880615, -0.001462697982788086, -0.0013386309146881104, -0.0012145638465881348, -0.0010904967784881592, -0.0009664297103881836, -0.000842362642288208, -0.0007182955741882324, -0.0005942285060882568, -0.00047016143798828125, -0.00034609436988830566, -0.00022202730178833008, -9.796023368835449e-05, 2.6106834411621094e-05, 0.00015017390251159668, 0.00027424097061157227, 0.00039830803871154785, 0.0005223751068115234, 0.000646442174911499, 0.0007705092430114746, 0.0008945763111114502, 0.0010186433792114258, 0.0011427104473114014, 0.001266777515411377, 0.0013908445835113525, 0.0015149116516113281, 0.0016389787197113037, 0.0017630457878112793, 0.0018871128559112549, 0.0020111799240112305, 0.002135246992111206, 0.0022593140602111816, 0.0023833811283111572, 0.002507448196411133, 0.0026315152645111084, 0.002755582332611084, 0.0028796494007110596, 0.003003716468811035, 0.0031277835369110107, 0.0032518506050109863, 0.003375917673110962, 0.0034999847412109375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 88.0, 563.0, 331.0, 29.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003600680211093277, -0.0003455566184129566, -0.000331045244820416, -0.0003165338421240449, -0.0003020224685315043, -0.0002875110658351332, -0.0002729996922425926, -0.0002584882895462215, -0.00024397690140176564, -0.0002294655132573098, -0.00021495412511285394, -0.0002004427369683981, -0.00018593133427202702, -0.0001714199606794864, -0.00015690855798311532, -0.00014239716983865947, -0.00012788578169420362, -0.00011337439354974777, -9.886300540529191e-05, -8.435160998487845e-05, -6.98402218404226e-05, -5.532883369596675e-05, -4.0817438275553286e-05, -2.6306050131097436e-05, -1.1794661986641586e-05, 2.716727976803668e-06, 1.722811794024892e-05, 3.173950972268358e-05, 4.625089786713943e-05, 6.076228601159528e-05, 7.527368143200874e-05, 8.97850695764646e-05, 0.0001042964868247509, 0.00011880787496920675, 0.0001333192631136626, 0.00014783066581003368, 0.0001623420394025743, 0.00017685344209894538, 0.00019136483024340123, 0.00020587621838785708, 0.00022038760653231293, 0.00023489899467676878, 0.00024941039737313986, 0.0002639217709656805, 0.00027843317366205156, 0.0002929445472545922, 0.00030745594995096326, 0.00032196735264733434, 0.00033647872623987496, 0.00035099012893624604, 0.00036550150252878666, 0.00038001290522515774, 0.00039452427881769836, 0.00040903568151406944, 0.00042354705510661006, 0.00043805845780298114, 0.0004525698604993522, 0.0004670812631957233, 0.0004815926367882639, 0.0004961040103808045, 0.0005106154130771756, 0.0005251268157735467, 0.0005396382184699178, 0.0005541496211662889, 0.000568660965654999]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 6.0, 14.0, 15.0, 12.0, 16.0, 17.0, 19.0, 22.0, 15.0, 32.0, 24.0, 25.0, 30.0, 37.0, 39.0, 39.0, 41.0, 27.0, 36.0, 39.0, 40.0, 43.0, 32.0, 38.0, 33.0, 35.0, 25.0, 33.0, 21.0, 25.0, 26.0, 20.0, 15.0, 20.0, 11.0, 7.0, 9.0, 14.0, 3.0, 3.0, 8.0, 2.0, 2.0, 8.0, 0.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-8.505582809448242e-05, -8.240249007940292e-05, -7.974915206432343e-05, -7.709581404924393e-05, -7.444247603416443e-05, -7.178913801908493e-05, -6.913580000400543e-05, -6.648246198892593e-05, -6.382912397384644e-05, -6.117578595876694e-05, -5.852244794368744e-05, -5.586910992860794e-05, -5.321577191352844e-05, -5.0562433898448944e-05, -4.7909095883369446e-05, -4.525575786828995e-05, -4.260241985321045e-05, -3.994908183813095e-05, -3.729574382305145e-05, -3.4642405807971954e-05, -3.1989067792892456e-05, -2.9335729777812958e-05, -2.668239176273346e-05, -2.402905374765396e-05, -2.1375715732574463e-05, -1.8722377717494965e-05, -1.6069039702415466e-05, -1.3415701687335968e-05, -1.076236367225647e-05, -8.109025657176971e-06, -5.455687642097473e-06, -2.802349627017975e-06, -1.4901161193847656e-07, 2.5043264031410217e-06, 5.15766441822052e-06, 7.811002433300018e-06, 1.0464340448379517e-05, 1.3117678463459015e-05, 1.5771016478538513e-05, 1.842435449361801e-05, 2.107769250869751e-05, 2.3731030523777008e-05, 2.6384368538856506e-05, 2.9037706553936005e-05, 3.16910445690155e-05, 3.4344382584095e-05, 3.69977205991745e-05, 3.9651058614254e-05, 4.2304396629333496e-05, 4.4957734644412994e-05, 4.761107265949249e-05, 5.026441067457199e-05, 5.291774868965149e-05, 5.557108670473099e-05, 5.8224424719810486e-05, 6.0877762734889984e-05, 6.353110074996948e-05, 6.618443876504898e-05, 6.883777678012848e-05, 7.149111479520798e-05, 7.414445281028748e-05, 7.679779082536697e-05, 7.945112884044647e-05, 8.210446685552597e-05, 8.475780487060547e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 9.0, 4.0, 10.0, 8.0, 10.0, 8.0, 13.0, 7.0, 12.0, 23.0, 18.0, 12.0, 31.0, 24.0, 25.0, 35.0, 29.0, 35.0, 46.0, 50.0, 38.0, 33.0, 46.0, 35.0, 37.0, 35.0, 35.0, 38.0, 35.0, 25.0, 25.0, 31.0, 23.0, 26.0, 10.0, 23.0, 19.0, 15.0, 14.0, 8.0, 8.0, 6.0, 3.0, 8.0, 6.0, 4.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.740234375, -3.625640869140625, -3.51104736328125, -3.396453857421875, -3.2818603515625, -3.167266845703125, -3.05267333984375, -2.938079833984375, -2.823486328125, -2.708892822265625, -2.59429931640625, -2.479705810546875, -2.3651123046875, -2.250518798828125, -2.13592529296875, -2.021331787109375, -1.90673828125, -1.792144775390625, -1.67755126953125, -1.562957763671875, -1.4483642578125, -1.333770751953125, -1.21917724609375, -1.104583740234375, -0.989990234375, -0.875396728515625, -0.76080322265625, -0.646209716796875, -0.5316162109375, -0.417022705078125, -0.30242919921875, -0.187835693359375, -0.0732421875, 0.041351318359375, 0.15594482421875, 0.270538330078125, 0.3851318359375, 0.499725341796875, 0.61431884765625, 0.728912353515625, 0.843505859375, 0.958099365234375, 1.07269287109375, 1.187286376953125, 1.3018798828125, 1.416473388671875, 1.53106689453125, 1.645660400390625, 1.76025390625, 1.874847412109375, 1.98944091796875, 2.104034423828125, 2.2186279296875, 2.333221435546875, 2.44781494140625, 2.562408447265625, 2.677001953125, 2.791595458984375, 2.90618896484375, 3.020782470703125, 3.1353759765625, 3.249969482421875, 3.36456298828125, 3.479156494140625, 3.59375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 12.0, 13.0, 13.0, 16.0, 36.0, 33.0, 61.0, 100.0, 131.0, 143.0, 221.0, 309.0, 455.0, 765.0, 1187.0, 2145.0, 4054.0, 7966.0, 17579.0, 43229.0, 123231.0, 351894.0, 316682.0, 107639.0, 38341.0, 15848.0, 7404.0, 3717.0, 2017.0, 1129.0, 672.0, 441.0, 286.0, 233.0, 152.0, 120.0, 81.0, 56.0, 37.0, 29.0, 28.0, 19.0, 13.0, 7.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.078125, -3.950439453125, -3.82275390625, -3.695068359375, -3.5673828125, -3.439697265625, -3.31201171875, -3.184326171875, -3.056640625, -2.928955078125, -2.80126953125, -2.673583984375, -2.5458984375, -2.418212890625, -2.29052734375, -2.162841796875, -2.03515625, -1.907470703125, -1.77978515625, -1.652099609375, -1.5244140625, -1.396728515625, -1.26904296875, -1.141357421875, -1.013671875, -0.885986328125, -0.75830078125, -0.630615234375, -0.5029296875, -0.375244140625, -0.24755859375, -0.119873046875, 0.0078125, 0.135498046875, 0.26318359375, 0.390869140625, 0.5185546875, 0.646240234375, 0.77392578125, 0.901611328125, 1.029296875, 1.156982421875, 1.28466796875, 1.412353515625, 1.5400390625, 1.667724609375, 1.79541015625, 1.923095703125, 2.05078125, 2.178466796875, 2.30615234375, 2.433837890625, 2.5615234375, 2.689208984375, 2.81689453125, 2.944580078125, 3.072265625, 3.199951171875, 3.32763671875, 3.455322265625, 3.5830078125, 3.710693359375, 3.83837890625, 3.966064453125, 4.09375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 3.0, 6.0, 12.0, 17.0, 13.0, 22.0, 16.0, 22.0, 25.0, 34.0, 46.0, 36.0, 36.0, 49.0, 54.0, 98.0, 309.0, 1660.0, 157.0, 58.0, 57.0, 50.0, 39.0, 41.0, 31.0, 31.0, 20.0, 15.0, 21.0, 14.0, 14.0, 15.0, 6.0, 10.0, 6.0, 8.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6328125, -14.1151123046875, -13.597412109375, -13.0797119140625, -12.56201171875, -12.0443115234375, -11.526611328125, -11.0089111328125, -10.4912109375, -9.9735107421875, -9.455810546875, -8.9381103515625, -8.42041015625, -7.9027099609375, -7.385009765625, -6.8673095703125, -6.349609375, -5.8319091796875, -5.314208984375, -4.7965087890625, -4.27880859375, -3.7611083984375, -3.243408203125, -2.7257080078125, -2.2080078125, -1.6903076171875, -1.172607421875, -0.6549072265625, -0.13720703125, 0.3804931640625, 0.898193359375, 1.4158935546875, 1.93359375, 2.4512939453125, 2.968994140625, 3.4866943359375, 4.00439453125, 4.5220947265625, 5.039794921875, 5.5574951171875, 6.0751953125, 6.5928955078125, 7.110595703125, 7.6282958984375, 8.14599609375, 8.6636962890625, 9.181396484375, 9.6990966796875, 10.216796875, 10.7344970703125, 11.252197265625, 11.7698974609375, 12.28759765625, 12.8052978515625, 13.322998046875, 13.8406982421875, 14.3583984375, 14.8760986328125, 15.393798828125, 15.9114990234375, 16.42919921875, 16.9468994140625, 17.464599609375, 17.9822998046875, 18.5]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 8.0, 11.0, 9.0, 21.0, 16.0, 25.0, 19.0, 32.0, 29.0, 36.0, 62.0, 104.0, 134.0, 248.0, 493.0, 1911.0, 26974.0, 2978397.0, 131574.0, 3925.0, 801.0, 293.0, 158.0, 106.0, 65.0, 51.0, 43.0, 32.0, 27.0, 24.0, 16.0, 14.0, 14.0, 9.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.21875, -27.380859375, -26.54296875, -25.705078125, -24.8671875, -24.029296875, -23.19140625, -22.353515625, -21.515625, -20.677734375, -19.83984375, -19.001953125, -18.1640625, -17.326171875, -16.48828125, -15.650390625, -14.8125, -13.974609375, -13.13671875, -12.298828125, -11.4609375, -10.623046875, -9.78515625, -8.947265625, -8.109375, -7.271484375, -6.43359375, -5.595703125, -4.7578125, -3.919921875, -3.08203125, -2.244140625, -1.40625, -0.568359375, 0.26953125, 1.107421875, 1.9453125, 2.783203125, 3.62109375, 4.458984375, 5.296875, 6.134765625, 6.97265625, 7.810546875, 8.6484375, 9.486328125, 10.32421875, 11.162109375, 12.0, 12.837890625, 13.67578125, 14.513671875, 15.3515625, 16.189453125, 17.02734375, 17.865234375, 18.703125, 19.541015625, 20.37890625, 21.216796875, 22.0546875, 22.892578125, 23.73046875, 24.568359375, 25.40625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 30.0, 91.0, 196.0, 262.0, 243.0, 114.0, 45.0, 10.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.3444709777832, -31.17164421081543, -29.998817443847656, -28.825990676879883, -27.65316390991211, -26.480337142944336, -25.307510375976562, -24.13468360900879, -22.961856842041016, -21.789030075073242, -20.61620330810547, -19.443376541137695, -18.270549774169922, -17.09772300720215, -15.924896240234375, -14.752069473266602, -13.579242706298828, -12.406415939331055, -11.233589172363281, -10.060762405395508, -8.887935638427734, -7.715108871459961, -6.5422821044921875, -5.369455337524414, -4.196628570556641, -3.023801803588867, -1.8509750366210938, -0.6781482696533203, 0.4946784973144531, 1.6675052642822266, 2.84033203125, 4.013158798217773, 5.185985565185547, 6.35881233215332, 7.531639099121094, 8.704465866088867, 9.87729263305664, 11.050119400024414, 12.222946166992188, 13.395772933959961, 14.568599700927734, 15.741426467895508, 16.91425323486328, 18.087080001831055, 19.259906768798828, 20.4327335357666, 21.605560302734375, 22.77838706970215, 23.951213836669922, 25.124040603637695, 26.29686737060547, 27.469694137573242, 28.642520904541016, 29.81534767150879, 30.988174438476562, 32.16100311279297, 33.33382797241211, 34.50665283203125, 35.679481506347656, 36.85231018066406, 38.0251350402832, 39.197959899902344, 40.37078857421875, 41.543617248535156, 42.7164421081543]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 11.0, 2.0, 13.0, 9.0, 12.0, 19.0, 12.0, 22.0, 18.0, 31.0, 35.0, 33.0, 45.0, 35.0, 32.0, 48.0, 30.0, 46.0, 36.0, 38.0, 46.0, 36.0, 43.0, 40.0, 30.0, 50.0, 26.0, 33.0, 27.0, 14.0, 23.0, 23.0, 19.0, 11.0, 10.0, 5.0, 10.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.25399398803711, -45.81037139892578, -44.36674499511719, -42.92312240600586, -41.479496002197266, -40.03587341308594, -38.592247009277344, -37.148624420166016, -35.70500183105469, -34.26137924194336, -32.817752838134766, -31.374130249023438, -29.930503845214844, -28.486881256103516, -27.043256759643555, -25.599632263183594, -24.156005859375, -22.71238136291504, -21.268756866455078, -19.82513427734375, -18.381507873535156, -16.937885284423828, -15.494260787963867, -14.050636291503906, -12.607011795043945, -11.163387298583984, -9.719762802124023, -8.276139259338379, -6.832514762878418, -5.388890266418457, -3.9452667236328125, -2.5016422271728516, -1.0580215454101562, 0.3856027126312256, 1.8292269706726074, 3.27285099029541, 4.716475486755371, 6.160099983215332, 7.603723526000977, 9.047348022460938, 10.490972518920898, 11.93459701538086, 13.37822151184082, 14.821845054626465, 16.26546859741211, 17.709095001220703, 19.15271759033203, 20.596342086791992, 22.039966583251953, 23.483591079711914, 24.927215576171875, 26.370838165283203, 27.814464569091797, 29.258087158203125, 30.701711654663086, 32.14533615112305, 33.588958740234375, 35.0325813293457, 36.4762077331543, 37.919830322265625, 39.36345672607422, 40.80707931518555, 42.250701904296875, 43.69432830810547, 45.13795471191406]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 11.0, 7.0, 12.0, 14.0, 11.0, 7.0, 11.0, 14.0, 21.0, 20.0, 23.0, 25.0, 38.0, 24.0, 32.0, 41.0, 47.0, 42.0, 36.0, 44.0, 46.0, 44.0, 41.0, 33.0, 45.0, 29.0, 35.0, 31.0, 34.0, 23.0, 27.0, 12.0, 26.0, 22.0, 17.0, 5.0, 9.0, 9.0, 6.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.15234375, -4.02435302734375, -3.8963623046875, -3.76837158203125, -3.640380859375, -3.51239013671875, -3.3843994140625, -3.25640869140625, -3.12841796875, -3.00042724609375, -2.8724365234375, -2.74444580078125, -2.616455078125, -2.48846435546875, -2.3604736328125, -2.23248291015625, -2.1044921875, -1.97650146484375, -1.8485107421875, -1.72052001953125, -1.592529296875, -1.46453857421875, -1.3365478515625, -1.20855712890625, -1.08056640625, -0.95257568359375, -0.8245849609375, -0.69659423828125, -0.568603515625, -0.44061279296875, -0.3126220703125, -0.18463134765625, -0.056640625, 0.07135009765625, 0.1993408203125, 0.32733154296875, 0.455322265625, 0.58331298828125, 0.7113037109375, 0.83929443359375, 0.96728515625, 1.09527587890625, 1.2232666015625, 1.35125732421875, 1.479248046875, 1.60723876953125, 1.7352294921875, 1.86322021484375, 1.9912109375, 2.11920166015625, 2.2471923828125, 2.37518310546875, 2.503173828125, 2.63116455078125, 2.7591552734375, 2.88714599609375, 3.01513671875, 3.14312744140625, 3.2711181640625, 3.39910888671875, 3.527099609375, 3.65509033203125, 3.7830810546875, 3.91107177734375, 4.0390625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 9.0, 5.0, 7.0, 7.0, 6.0, 9.0, 15.0, 6.0, 14.0, 21.0, 19.0, 25.0, 20.0, 24.0, 39.0, 34.0, 49.0, 64.0, 148.0, 503.0, 3762.0, 132521.0, 3683712.0, 365488.0, 6481.0, 750.0, 158.0, 71.0, 33.0, 39.0, 31.0, 18.0, 24.0, 27.0, 16.0, 22.0, 11.0, 16.0, 10.0, 11.0, 11.0, 8.0, 7.0, 4.0, 7.0, 4.0, 3.0, 7.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-20.53125, -19.8603515625, -19.189453125, -18.5185546875, -17.84765625, -17.1767578125, -16.505859375, -15.8349609375, -15.1640625, -14.4931640625, -13.822265625, -13.1513671875, -12.48046875, -11.8095703125, -11.138671875, -10.4677734375, -9.796875, -9.1259765625, -8.455078125, -7.7841796875, -7.11328125, -6.4423828125, -5.771484375, -5.1005859375, -4.4296875, -3.7587890625, -3.087890625, -2.4169921875, -1.74609375, -1.0751953125, -0.404296875, 0.2666015625, 0.9375, 1.6083984375, 2.279296875, 2.9501953125, 3.62109375, 4.2919921875, 4.962890625, 5.6337890625, 6.3046875, 6.9755859375, 7.646484375, 8.3173828125, 8.98828125, 9.6591796875, 10.330078125, 11.0009765625, 11.671875, 12.3427734375, 13.013671875, 13.6845703125, 14.35546875, 15.0263671875, 15.697265625, 16.3681640625, 17.0390625, 17.7099609375, 18.380859375, 19.0517578125, 19.72265625, 20.3935546875, 21.064453125, 21.7353515625, 22.40625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 2.0, 4.0, 7.0, 4.0, 9.0, 8.0, 24.0, 25.0, 34.0, 46.0, 76.0, 95.0, 143.0, 159.0, 252.0, 380.0, 477.0, 475.0, 461.0, 364.0, 285.0, 233.0, 146.0, 93.0, 72.0, 56.0, 49.0, 34.0, 16.0, 17.0, 12.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.9765625, -15.5733642578125, -15.170166015625, -14.7669677734375, -14.36376953125, -13.9605712890625, -13.557373046875, -13.1541748046875, -12.7509765625, -12.3477783203125, -11.944580078125, -11.5413818359375, -11.13818359375, -10.7349853515625, -10.331787109375, -9.9285888671875, -9.525390625, -9.1221923828125, -8.718994140625, -8.3157958984375, -7.91259765625, -7.5093994140625, -7.106201171875, -6.7030029296875, -6.2998046875, -5.8966064453125, -5.493408203125, -5.0902099609375, -4.68701171875, -4.2838134765625, -3.880615234375, -3.4774169921875, -3.07421875, -2.6710205078125, -2.267822265625, -1.8646240234375, -1.46142578125, -1.0582275390625, -0.655029296875, -0.2518310546875, 0.1513671875, 0.5545654296875, 0.957763671875, 1.3609619140625, 1.76416015625, 2.1673583984375, 2.570556640625, 2.9737548828125, 3.376953125, 3.7801513671875, 4.183349609375, 4.5865478515625, 4.98974609375, 5.3929443359375, 5.796142578125, 6.1993408203125, 6.6025390625, 7.0057373046875, 7.408935546875, 7.8121337890625, 8.21533203125, 8.6185302734375, 9.021728515625, 9.4249267578125, 9.828125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 12.0, 7.0, 20.0, 23.0, 44.0, 77.0, 107.0, 187.0, 307.0, 801.0, 10213.0, 3796067.0, 382954.0, 2372.0, 458.0, 223.0, 156.0, 94.0, 61.0, 46.0, 13.0, 9.0, 6.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.5, -44.6240234375, -42.748046875, -40.8720703125, -38.99609375, -37.1201171875, -35.244140625, -33.3681640625, -31.4921875, -29.6162109375, -27.740234375, -25.8642578125, -23.98828125, -22.1123046875, -20.236328125, -18.3603515625, -16.484375, -14.6083984375, -12.732421875, -10.8564453125, -8.98046875, -7.1044921875, -5.228515625, -3.3525390625, -1.4765625, 0.3994140625, 2.275390625, 4.1513671875, 6.02734375, 7.9033203125, 9.779296875, 11.6552734375, 13.53125, 15.4072265625, 17.283203125, 19.1591796875, 21.03515625, 22.9111328125, 24.787109375, 26.6630859375, 28.5390625, 30.4150390625, 32.291015625, 34.1669921875, 36.04296875, 37.9189453125, 39.794921875, 41.6708984375, 43.546875, 45.4228515625, 47.298828125, 49.1748046875, 51.05078125, 52.9267578125, 54.802734375, 56.6787109375, 58.5546875, 60.4306640625, 62.306640625, 64.1826171875, 66.05859375, 67.9345703125, 69.810546875, 71.6865234375, 73.5625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 8.0, 105.0, 377.0, 403.0, 118.0, 5.0, 1.0], "bins": [-367.355224609375, -361.2361755371094, -355.1170959472656, -348.998046875, -342.87896728515625, -336.7599182128906, -330.640869140625, -324.52178955078125, -318.4027404785156, -312.28369140625, -306.16461181640625, -300.0455627441406, -293.9264831542969, -287.80743408203125, -281.6883544921875, -275.5693054199219, -269.45025634765625, -263.3312072753906, -257.2121276855469, -251.09307861328125, -244.97401428222656, -238.85494995117188, -232.7358856201172, -226.6168212890625, -220.49774169921875, -214.37867736816406, -208.25961303710938, -202.14056396484375, -196.02149963378906, -189.90243530273438, -183.7833709716797, -177.664306640625, -171.54525756835938, -165.4261932373047, -159.30712890625, -153.18807983398438, -147.0690155029297, -140.949951171875, -134.8308868408203, -128.71182250976562, -122.59275817871094, -116.47369384765625, -110.3546371459961, -104.2355728149414, -98.11651611328125, -91.99745178222656, -85.87838745117188, -79.75932312011719, -73.64026641845703, -67.52120208740234, -61.40214538574219, -55.2830810546875, -49.16402053833008, -43.044960021972656, -36.92589569091797, -30.806835174560547, -24.687776565551758, -18.568714141845703, -12.449653625488281, -6.330591201782227, -0.2115306854248047, 5.907529830932617, 12.026594161987305, 18.145654678344727, 24.26471519470215]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 8.0, 3.0, 7.0, 7.0, 15.0, 11.0, 19.0, 18.0, 15.0, 23.0, 24.0, 22.0, 29.0, 38.0, 41.0, 31.0, 32.0, 41.0, 33.0, 32.0, 52.0, 54.0, 53.0, 39.0, 50.0, 37.0, 32.0, 26.0, 31.0, 33.0, 31.0, 20.0, 16.0, 19.0, 12.0, 7.0, 18.0, 6.0, 4.0, 1.0, 5.0, 3.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.64929962158203, -40.31341552734375, -38.97753143310547, -37.64164733886719, -36.305763244628906, -34.969879150390625, -33.633995056152344, -32.2981071472168, -30.962223052978516, -29.626338958740234, -28.290454864501953, -26.954570770263672, -25.618684768676758, -24.282800674438477, -22.946916580200195, -21.61103057861328, -20.275148391723633, -18.93926429748535, -17.60338020324707, -16.267494201660156, -14.931610107421875, -13.595726013183594, -12.259841918945312, -10.923956871032715, -9.588072776794434, -8.252188682556152, -6.916303634643555, -5.580419540405273, -4.244534969329834, -2.9086503982543945, -1.5727663040161133, -0.23688125610351562, 1.0990028381347656, 2.434887409210205, 3.7707717418670654, 5.106656074523926, 6.442540645599365, 7.778425216674805, 9.114309310913086, 10.450194358825684, 11.786078453063965, 13.121962547302246, 14.457847595214844, 15.793731689453125, 17.129615783691406, 18.465499877929688, 19.80138397216797, 21.137269973754883, 22.473154067993164, 23.809038162231445, 25.144922256469727, 26.48080825805664, 27.816692352294922, 29.152576446533203, 30.488460540771484, 31.824344635009766, 33.16022872924805, 34.49611282348633, 35.83199691772461, 37.16788101196289, 38.50376510620117, 39.83965301513672, 41.175537109375, 42.51142120361328, 43.84730529785156]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 6.0, 9.0, 14.0, 12.0, 15.0, 19.0, 9.0, 20.0, 29.0, 30.0, 34.0, 35.0, 37.0, 33.0, 40.0, 46.0, 54.0, 40.0, 54.0, 44.0, 45.0, 29.0, 37.0, 32.0, 42.0, 29.0, 37.0, 23.0, 20.0, 21.0, 17.0, 12.0, 11.0, 11.0, 10.0, 9.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.4609375, -4.3212890625, -4.181640625, -4.0419921875, -3.90234375, -3.7626953125, -3.623046875, -3.4833984375, -3.34375, -3.2041015625, -3.064453125, -2.9248046875, -2.78515625, -2.6455078125, -2.505859375, -2.3662109375, -2.2265625, -2.0869140625, -1.947265625, -1.8076171875, -1.66796875, -1.5283203125, -1.388671875, -1.2490234375, -1.109375, -0.9697265625, -0.830078125, -0.6904296875, -0.55078125, -0.4111328125, -0.271484375, -0.1318359375, 0.0078125, 0.1474609375, 0.287109375, 0.4267578125, 0.56640625, 0.7060546875, 0.845703125, 0.9853515625, 1.125, 1.2646484375, 1.404296875, 1.5439453125, 1.68359375, 1.8232421875, 1.962890625, 2.1025390625, 2.2421875, 2.3818359375, 2.521484375, 2.6611328125, 2.80078125, 2.9404296875, 3.080078125, 3.2197265625, 3.359375, 3.4990234375, 3.638671875, 3.7783203125, 3.91796875, 4.0576171875, 4.197265625, 4.3369140625, 4.4765625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 7.0, 12.0, 8.0, 10.0, 23.0, 26.0, 38.0, 47.0, 67.0, 110.0, 149.0, 213.0, 288.0, 407.0, 563.0, 782.0, 1263.0, 1637.0, 2417.0, 3477.0, 5134.0, 7222.0, 11024.0, 16826.0, 25656.0, 39433.0, 63233.0, 107331.0, 275627.0, 218528.0, 98133.0, 58873.0, 37028.0, 24209.0, 15780.0, 10280.0, 7029.0, 4762.0, 3247.0, 2263.0, 1617.0, 1123.0, 763.0, 540.0, 368.0, 287.0, 202.0, 157.0, 98.0, 81.0, 49.0, 28.0, 27.0, 19.0, 13.0, 11.0, 7.0, 4.0, 4.0, 5.0, 2.0], "bins": [-1.060546875, -1.0273284912109375, -0.994110107421875, -0.9608917236328125, -0.92767333984375, -0.8944549560546875, -0.861236572265625, -0.8280181884765625, -0.7947998046875, -0.7615814208984375, -0.728363037109375, -0.6951446533203125, -0.66192626953125, -0.6287078857421875, -0.595489501953125, -0.5622711181640625, -0.529052734375, -0.4958343505859375, -0.462615966796875, -0.4293975830078125, -0.39617919921875, -0.3629608154296875, -0.329742431640625, -0.2965240478515625, -0.2633056640625, -0.2300872802734375, -0.196868896484375, -0.1636505126953125, -0.13043212890625, -0.0972137451171875, -0.063995361328125, -0.0307769775390625, 0.00244140625, 0.0356597900390625, 0.068878173828125, 0.1020965576171875, 0.13531494140625, 0.1685333251953125, 0.201751708984375, 0.2349700927734375, 0.2681884765625, 0.3014068603515625, 0.334625244140625, 0.3678436279296875, 0.40106201171875, 0.4342803955078125, 0.467498779296875, 0.5007171630859375, 0.533935546875, 0.5671539306640625, 0.600372314453125, 0.6335906982421875, 0.66680908203125, 0.7000274658203125, 0.733245849609375, 0.7664642333984375, 0.7996826171875, 0.8329010009765625, 0.866119384765625, 0.8993377685546875, 0.93255615234375, 0.9657745361328125, 0.998992919921875, 1.0322113037109375, 1.0654296875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 7.0, 7.0, 15.0, 14.0, 22.0, 18.0, 27.0, 19.0, 25.0, 38.0, 35.0, 35.0, 34.0, 38.0, 53.0, 40.0, 40.0, 1074.0, 41.0, 38.0, 45.0, 41.0, 35.0, 56.0, 35.0, 27.0, 27.0, 28.0, 22.0, 26.0, 16.0, 8.0, 9.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.111328125, -3.011627197265625, -2.91192626953125, -2.812225341796875, -2.7125244140625, -2.612823486328125, -2.51312255859375, -2.413421630859375, -2.313720703125, -2.214019775390625, -2.11431884765625, -2.014617919921875, -1.9149169921875, -1.815216064453125, -1.71551513671875, -1.615814208984375, -1.51611328125, -1.416412353515625, -1.31671142578125, -1.217010498046875, -1.1173095703125, -1.017608642578125, -0.91790771484375, -0.818206787109375, -0.718505859375, -0.618804931640625, -0.51910400390625, -0.419403076171875, -0.3197021484375, -0.220001220703125, -0.12030029296875, -0.020599365234375, 0.0791015625, 0.178802490234375, 0.27850341796875, 0.378204345703125, 0.4779052734375, 0.577606201171875, 0.67730712890625, 0.777008056640625, 0.876708984375, 0.976409912109375, 1.07611083984375, 1.175811767578125, 1.2755126953125, 1.375213623046875, 1.47491455078125, 1.574615478515625, 1.67431640625, 1.774017333984375, 1.87371826171875, 1.973419189453125, 2.0731201171875, 2.172821044921875, 2.27252197265625, 2.372222900390625, 2.471923828125, 2.571624755859375, 2.67132568359375, 2.771026611328125, 2.8707275390625, 2.970428466796875, 3.07012939453125, 3.169830322265625, 3.26953125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 9.0, 4.0, 3.0, 23.0, 28.0, 32.0, 47.0, 69.0, 119.0, 148.0, 267.0, 356.0, 524.0, 864.0, 1427.0, 2235.0, 3483.0, 5524.0, 8604.0, 13629.0, 22037.0, 36267.0, 59150.0, 98070.0, 192716.0, 1350466.0, 118615.0, 70058.0, 42998.0, 25796.0, 15841.0, 10043.0, 6442.0, 4032.0, 2566.0, 1654.0, 1003.0, 707.0, 439.0, 244.0, 189.0, 125.0, 93.0, 74.0, 30.0, 30.0, 17.0, 21.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1708984375, -1.133331298828125, -1.09576416015625, -1.058197021484375, -1.0206298828125, -0.983062744140625, -0.94549560546875, -0.907928466796875, -0.870361328125, -0.832794189453125, -0.79522705078125, -0.757659912109375, -0.7200927734375, -0.682525634765625, -0.64495849609375, -0.607391357421875, -0.56982421875, -0.532257080078125, -0.49468994140625, -0.457122802734375, -0.4195556640625, -0.381988525390625, -0.34442138671875, -0.306854248046875, -0.269287109375, -0.231719970703125, -0.19415283203125, -0.156585693359375, -0.1190185546875, -0.081451416015625, -0.04388427734375, -0.006317138671875, 0.03125, 0.068817138671875, 0.10638427734375, 0.143951416015625, 0.1815185546875, 0.219085693359375, 0.25665283203125, 0.294219970703125, 0.331787109375, 0.369354248046875, 0.40692138671875, 0.444488525390625, 0.4820556640625, 0.519622802734375, 0.55718994140625, 0.594757080078125, 0.63232421875, 0.669891357421875, 0.70745849609375, 0.745025634765625, 0.7825927734375, 0.820159912109375, 0.85772705078125, 0.895294189453125, 0.932861328125, 0.970428466796875, 1.00799560546875, 1.045562744140625, 1.0831298828125, 1.120697021484375, 1.15826416015625, 1.195831298828125, 1.2333984375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 10.0, 7.0, 13.0, 9.0, 14.0, 11.0, 18.0, 33.0, 28.0, 41.0, 61.0, 65.0, 78.0, 66.0, 86.0, 73.0, 80.0, 65.0, 57.0, 41.0, 26.0, 22.0, 16.0, 14.0, 12.0, 10.0, 7.0, 6.0, 8.0, 3.0, 4.0, 6.0, 7.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00024437904357910156, -0.0002376846969127655, -0.00023099035024642944, -0.00022429600358009338, -0.00021760165691375732, -0.00021090731024742126, -0.0002042129635810852, -0.00019751861691474915, -0.00019082427024841309, -0.00018412992358207703, -0.00017743557691574097, -0.0001707412302494049, -0.00016404688358306885, -0.0001573525369167328, -0.00015065819025039673, -0.00014396384358406067, -0.0001372694969177246, -0.00013057515025138855, -0.0001238808035850525, -0.00011718645691871643, -0.00011049211025238037, -0.00010379776358604431, -9.710341691970825e-05, -9.040907025337219e-05, -8.371472358703613e-05, -7.702037692070007e-05, -7.032603025436401e-05, -6.363168358802795e-05, -5.6937336921691895e-05, -5.0242990255355835e-05, -4.3548643589019775e-05, -3.6854296922683716e-05, -3.0159950256347656e-05, -2.3465603590011597e-05, -1.6771256923675537e-05, -1.0076910257339478e-05, -3.382563591003418e-06, 3.3117830753326416e-06, 1.0006129741668701e-05, 1.670047640800476e-05, 2.339482307434082e-05, 3.008916974067688e-05, 3.678351640701294e-05, 4.3477863073349e-05, 5.017220973968506e-05, 5.686655640602112e-05, 6.356090307235718e-05, 7.025524973869324e-05, 7.69495964050293e-05, 8.364394307136536e-05, 9.033828973770142e-05, 9.703263640403748e-05, 0.00010372698307037354, 0.0001104213297367096, 0.00011711567640304565, 0.00012381002306938171, 0.00013050436973571777, 0.00013719871640205383, 0.0001438930630683899, 0.00015058740973472595, 0.000157281756401062, 0.00016397610306739807, 0.00017067044973373413, 0.0001773647964000702, 0.00018405914306640625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 5.0, 15.0, 9.0, 11.0, 13.0, 27.0, 35.0, 43.0, 75.0, 104.0, 192.0, 322.0, 608.0, 22483.0, 1022206.0, 1301.0, 411.0, 231.0, 172.0, 77.0, 58.0, 32.0, 40.0, 17.0, 19.0, 9.0, 5.0, 6.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0047454833984375, -0.0045937299728393555, -0.004441976547241211, -0.004290223121643066, -0.004138469696044922, -0.003986716270446777, -0.003834962844848633, -0.0036832094192504883, -0.0035314559936523438, -0.0033797025680541992, -0.0032279491424560547, -0.00307619571685791, -0.0029244422912597656, -0.002772688865661621, -0.0026209354400634766, -0.002469182014465332, -0.0023174285888671875, -0.002165675163269043, -0.0020139217376708984, -0.001862168312072754, -0.0017104148864746094, -0.0015586614608764648, -0.0014069080352783203, -0.0012551546096801758, -0.0011034011840820312, -0.0009516477584838867, -0.0007998943328857422, -0.0006481409072875977, -0.0004963874816894531, -0.0003446340560913086, -0.00019288063049316406, -4.112720489501953e-05, 0.000110626220703125, 0.00026237964630126953, 0.00041413307189941406, 0.0005658864974975586, 0.0007176399230957031, 0.0008693933486938477, 0.0010211467742919922, 0.0011729001998901367, 0.0013246536254882812, 0.0014764070510864258, 0.0016281604766845703, 0.0017799139022827148, 0.0019316673278808594, 0.002083420753479004, 0.0022351741790771484, 0.002386927604675293, 0.0025386810302734375, 0.002690434455871582, 0.0028421878814697266, 0.002993941307067871, 0.0031456947326660156, 0.00329744815826416, 0.0034492015838623047, 0.0036009550094604492, 0.0037527084350585938, 0.0039044618606567383, 0.004056215286254883, 0.004207968711853027, 0.004359722137451172, 0.004511475563049316, 0.004663228988647461, 0.0048149824142456055, 0.00496673583984375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 20.0, 61.0, 258.0, 405.0, 197.0, 62.0, 12.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004406581283546984, -0.0004297544073779136, -0.0004188506572972983, -0.0004079469363205135, -0.00039704321534372866, -0.00038613949436694384, -0.00037523574428632855, -0.00036433202330954373, -0.0003534283023327589, -0.0003425245813559741, -0.0003316208312753588, -0.00032071711029857397, -0.00030981338932178915, -0.0002989096683450043, -0.00028800591826438904, -0.0002771021972876042, -0.00026619844720698893, -0.0002552947262302041, -0.0002443909761495888, -0.000233487255172804, -0.00022258353419601917, -0.00021167979866731912, -0.00020077606313861907, -0.00018987234216183424, -0.00017896860663313419, -0.00016806487110443413, -0.0001571611501276493, -0.00014625741459894925, -0.0001353536790702492, -0.00012444995809346437, -0.00011354622256476432, -0.00010264249431202188, -9.173873695544899e-05, -8.083500870270655e-05, -6.99312804499641e-05, -5.902754492126405e-05, -4.812381666852161e-05, -3.722008841577917e-05, -2.631635288707912e-05, -1.541262463433668e-05, -4.508896381594241e-06, 6.394833690137602e-06, 1.7298563761869445e-05, 2.8202295652590692e-05, 3.910602390533313e-05, 5.000975215807557e-05, 6.0913487686775625e-05, 7.181721593951806e-05, 8.27209441922605e-05, 9.362467244500294e-05, 0.00010452840069774538, 0.00011543213622644544, 0.00012633585720323026, 0.00013723959273193032, 0.00014814332826063037, 0.0001590470492374152, 0.00016995078476611525, 0.0001808545202948153, 0.00019175824127160013, 0.00020266197680030018, 0.00021356571232900023, 0.00022446943330578506, 0.00023537316883448511, 0.00024627690436318517, 0.00025718062533997]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 0.0, 7.0, 6.0, 3.0, 5.0, 5.0, 14.0, 8.0, 15.0, 15.0, 12.0, 15.0, 21.0, 28.0, 29.0, 23.0, 32.0, 26.0, 33.0, 27.0, 32.0, 37.0, 38.0, 41.0, 37.0, 41.0, 36.0, 33.0, 33.0, 36.0, 29.0, 28.0, 32.0, 42.0, 25.0, 21.0, 20.0, 23.0, 12.0, 18.0, 16.0, 6.0, 6.0, 11.0, 7.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.147954940795898e-05, -7.885601371526718e-05, -7.623247802257538e-05, -7.360894232988358e-05, -7.098540663719177e-05, -6.836187094449997e-05, -6.573833525180817e-05, -6.311479955911636e-05, -6.049126386642456e-05, -5.786772817373276e-05, -5.5244192481040955e-05, -5.262065678834915e-05, -4.999712109565735e-05, -4.7373585402965546e-05, -4.475004971027374e-05, -4.212651401758194e-05, -3.950297832489014e-05, -3.6879442632198334e-05, -3.425590693950653e-05, -3.163237124681473e-05, -2.9008835554122925e-05, -2.6385299861431122e-05, -2.376176416873932e-05, -2.1138228476047516e-05, -1.8514692783355713e-05, -1.589115709066391e-05, -1.3267621397972107e-05, -1.0644085705280304e-05, -8.020550012588501e-06, -5.397014319896698e-06, -2.773478627204895e-06, -1.4994293451309204e-07, 2.473592758178711e-06, 5.097128450870514e-06, 7.720664143562317e-06, 1.034419983625412e-05, 1.2967735528945923e-05, 1.5591271221637726e-05, 1.821480691432953e-05, 2.0838342607021332e-05, 2.3461878299713135e-05, 2.6085413992404938e-05, 2.870894968509674e-05, 3.1332485377788544e-05, 3.395602107048035e-05, 3.657955676317215e-05, 3.920309245586395e-05, 4.1826628148555756e-05, 4.445016384124756e-05, 4.707369953393936e-05, 4.9697235226631165e-05, 5.232077091932297e-05, 5.494430661201477e-05, 5.7567842304706573e-05, 6.0191377997398376e-05, 6.281491369009018e-05, 6.543844938278198e-05, 6.806198507547379e-05, 7.068552076816559e-05, 7.330905646085739e-05, 7.59325921535492e-05, 7.8556127846241e-05, 8.11796635389328e-05, 8.38031992316246e-05, 8.64267349243164e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 6.0, 9.0, 14.0, 12.0, 15.0, 19.0, 9.0, 20.0, 29.0, 30.0, 34.0, 35.0, 37.0, 33.0, 40.0, 46.0, 54.0, 40.0, 54.0, 44.0, 45.0, 29.0, 37.0, 32.0, 42.0, 29.0, 37.0, 23.0, 20.0, 21.0, 17.0, 12.0, 11.0, 11.0, 10.0, 9.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.4609375, -4.3212890625, -4.181640625, -4.0419921875, -3.90234375, -3.7626953125, -3.623046875, -3.4833984375, -3.34375, -3.2041015625, -3.064453125, -2.9248046875, -2.78515625, -2.6455078125, -2.505859375, -2.3662109375, -2.2265625, -2.0869140625, -1.947265625, -1.8076171875, -1.66796875, -1.5283203125, -1.388671875, -1.2490234375, -1.109375, -0.9697265625, -0.830078125, -0.6904296875, -0.55078125, -0.4111328125, -0.271484375, -0.1318359375, 0.0078125, 0.1474609375, 0.287109375, 0.4267578125, 0.56640625, 0.7060546875, 0.845703125, 0.9853515625, 1.125, 1.2646484375, 1.404296875, 1.5439453125, 1.68359375, 1.8232421875, 1.962890625, 2.1025390625, 2.2421875, 2.3818359375, 2.521484375, 2.6611328125, 2.80078125, 2.9404296875, 3.080078125, 3.2197265625, 3.359375, 3.4990234375, 3.638671875, 3.7783203125, 3.91796875, 4.0576171875, 4.197265625, 4.3369140625, 4.4765625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 10.0, 19.0, 20.0, 15.0, 33.0, 46.0, 58.0, 62.0, 119.0, 185.0, 226.0, 373.0, 626.0, 1044.0, 1964.0, 4041.0, 9956.0, 27780.0, 110545.0, 456058.0, 329090.0, 70941.0, 20447.0, 7600.0, 3197.0, 1577.0, 896.0, 534.0, 355.0, 227.0, 133.0, 106.0, 74.0, 61.0, 35.0, 21.0, 18.0, 13.0, 9.0, 12.0, 8.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16796875, -5.0057373046875, -4.843505859375, -4.6812744140625, -4.51904296875, -4.3568115234375, -4.194580078125, -4.0323486328125, -3.8701171875, -3.7078857421875, -3.545654296875, -3.3834228515625, -3.22119140625, -3.0589599609375, -2.896728515625, -2.7344970703125, -2.572265625, -2.4100341796875, -2.247802734375, -2.0855712890625, -1.92333984375, -1.7611083984375, -1.598876953125, -1.4366455078125, -1.2744140625, -1.1121826171875, -0.949951171875, -0.7877197265625, -0.62548828125, -0.4632568359375, -0.301025390625, -0.1387939453125, 0.0234375, 0.1856689453125, 0.347900390625, 0.5101318359375, 0.67236328125, 0.8345947265625, 0.996826171875, 1.1590576171875, 1.3212890625, 1.4835205078125, 1.645751953125, 1.8079833984375, 1.97021484375, 2.1324462890625, 2.294677734375, 2.4569091796875, 2.619140625, 2.7813720703125, 2.943603515625, 3.1058349609375, 3.26806640625, 3.4302978515625, 3.592529296875, 3.7547607421875, 3.9169921875, 4.0792236328125, 4.241455078125, 4.4036865234375, 4.56591796875, 4.7281494140625, 4.890380859375, 5.0526123046875, 5.21484375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 4.0, 9.0, 5.0, 11.0, 10.0, 17.0, 13.0, 25.0, 19.0, 39.0, 38.0, 46.0, 40.0, 53.0, 68.0, 115.0, 1657.0, 383.0, 91.0, 66.0, 54.0, 60.0, 36.0, 37.0, 33.0, 26.0, 16.0, 20.0, 22.0, 16.0, 9.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.984375, -21.35400390625, -20.7236328125, -20.09326171875, -19.462890625, -18.83251953125, -18.2021484375, -17.57177734375, -16.94140625, -16.31103515625, -15.6806640625, -15.05029296875, -14.419921875, -13.78955078125, -13.1591796875, -12.52880859375, -11.8984375, -11.26806640625, -10.6376953125, -10.00732421875, -9.376953125, -8.74658203125, -8.1162109375, -7.48583984375, -6.85546875, -6.22509765625, -5.5947265625, -4.96435546875, -4.333984375, -3.70361328125, -3.0732421875, -2.44287109375, -1.8125, -1.18212890625, -0.5517578125, 0.07861328125, 0.708984375, 1.33935546875, 1.9697265625, 2.60009765625, 3.23046875, 3.86083984375, 4.4912109375, 5.12158203125, 5.751953125, 6.38232421875, 7.0126953125, 7.64306640625, 8.2734375, 8.90380859375, 9.5341796875, 10.16455078125, 10.794921875, 11.42529296875, 12.0556640625, 12.68603515625, 13.31640625, 13.94677734375, 14.5771484375, 15.20751953125, 15.837890625, 16.46826171875, 17.0986328125, 17.72900390625, 18.359375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 4.0, 5.0, 12.0, 14.0, 15.0, 19.0, 21.0, 22.0, 31.0, 37.0, 60.0, 76.0, 124.0, 184.0, 398.0, 1204.0, 10614.0, 2760720.0, 365540.0, 4932.0, 800.0, 320.0, 170.0, 91.0, 70.0, 47.0, 37.0, 25.0, 24.0, 12.0, 20.0, 11.0, 12.0, 6.0, 7.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.234375, -22.336181640625, -21.43798828125, -20.539794921875, -19.6416015625, -18.743408203125, -17.84521484375, -16.947021484375, -16.048828125, -15.150634765625, -14.25244140625, -13.354248046875, -12.4560546875, -11.557861328125, -10.65966796875, -9.761474609375, -8.86328125, -7.965087890625, -7.06689453125, -6.168701171875, -5.2705078125, -4.372314453125, -3.47412109375, -2.575927734375, -1.677734375, -0.779541015625, 0.11865234375, 1.016845703125, 1.9150390625, 2.813232421875, 3.71142578125, 4.609619140625, 5.5078125, 6.406005859375, 7.30419921875, 8.202392578125, 9.1005859375, 9.998779296875, 10.89697265625, 11.795166015625, 12.693359375, 13.591552734375, 14.48974609375, 15.387939453125, 16.2861328125, 17.184326171875, 18.08251953125, 18.980712890625, 19.87890625, 20.777099609375, 21.67529296875, 22.573486328125, 23.4716796875, 24.369873046875, 25.26806640625, 26.166259765625, 27.064453125, 27.962646484375, 28.86083984375, 29.759033203125, 30.6572265625, 31.555419921875, 32.45361328125, 33.351806640625, 34.25]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 12.0, 159.0, 634.0, 205.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.68896484375, -126.63888549804688, -123.58880615234375, -120.53873443603516, -117.48865509033203, -114.4385757446289, -111.38850402832031, -108.33842468261719, -105.28834533691406, -102.23826599121094, -99.18818664550781, -96.13811492919922, -93.0880355834961, -90.03795623779297, -86.98788452148438, -83.93780517578125, -80.88772583007812, -77.837646484375, -74.78756713867188, -71.73749542236328, -68.68741607666016, -65.63733673095703, -62.58726119995117, -59.53718566894531, -56.48710632324219, -53.43702697753906, -50.3869514465332, -47.336875915527344, -44.28679656982422, -41.236717224121094, -38.186641693115234, -35.136566162109375, -32.08648681640625, -29.036409378051758, -25.986331939697266, -22.936254501342773, -19.88617706298828, -16.83609962463379, -13.786022186279297, -10.735944747924805, -7.6858673095703125, -4.63578987121582, -1.5857124328613281, 1.464365005493164, 4.514442443847656, 7.564519882202148, 10.61459732055664, 13.664674758911133, 16.714752197265625, 19.764829635620117, 22.81490707397461, 25.8649845123291, 28.915061950683594, 31.965139389038086, 35.01521682739258, 38.06529235839844, 41.11537170410156, 44.16545104980469, 47.21552658081055, 50.265602111816406, 53.31568145751953, 56.365760803222656, 59.415836334228516, 62.465911865234375, 65.5159912109375]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 2.0, 10.0, 8.0, 9.0, 8.0, 13.0, 20.0, 18.0, 24.0, 24.0, 32.0, 32.0, 33.0, 46.0, 34.0, 46.0, 43.0, 53.0, 43.0, 39.0, 52.0, 32.0, 51.0, 43.0, 42.0, 28.0, 27.0, 20.0, 33.0, 20.0, 14.0, 17.0, 17.0, 10.0, 5.0, 12.0, 5.0, 9.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.86970901489258, -51.22285079956055, -49.575992584228516, -47.929134368896484, -46.28227615356445, -44.63541793823242, -42.988563537597656, -41.341705322265625, -39.694847106933594, -38.04798889160156, -36.40113067626953, -34.7542724609375, -33.10741424560547, -31.460556030273438, -29.81369972229004, -28.166841506958008, -26.519981384277344, -24.873123168945312, -23.22626495361328, -21.57940673828125, -19.93254852294922, -18.285690307617188, -16.63883399963379, -14.991975784301758, -13.345117568969727, -11.698259353637695, -10.051401138305664, -8.40454387664795, -6.757685661315918, -5.110827445983887, -3.463970184326172, -1.8171119689941406, -0.170257568359375, 1.4766004085540771, 3.1234583854675293, 4.770316123962402, 6.417174339294434, 8.064032554626465, 9.71088981628418, 11.357748031616211, 13.004606246948242, 14.651464462280273, 16.298322677612305, 17.945178985595703, 19.592037200927734, 21.238895416259766, 22.885753631591797, 24.532611846923828, 26.17947006225586, 27.82632827758789, 29.473186492919922, 31.120044708251953, 32.766902923583984, 34.413761138916016, 36.06061553955078, 37.70747375488281, 39.354331970214844, 41.001190185546875, 42.648048400878906, 44.29490661621094, 45.94176483154297, 47.588623046875, 49.23548126220703, 50.88233947753906, 52.529197692871094]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 14.0, 10.0, 9.0, 9.0, 13.0, 19.0, 20.0, 25.0, 15.0, 29.0, 27.0, 31.0, 43.0, 43.0, 43.0, 40.0, 40.0, 49.0, 52.0, 45.0, 35.0, 35.0, 35.0, 30.0, 54.0, 37.0, 23.0, 24.0, 24.0, 14.0, 21.0, 17.0, 10.0, 14.0, 3.0, 10.0, 14.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.47265625, -4.3291015625, -4.185546875, -4.0419921875, -3.8984375, -3.7548828125, -3.611328125, -3.4677734375, -3.32421875, -3.1806640625, -3.037109375, -2.8935546875, -2.75, -2.6064453125, -2.462890625, -2.3193359375, -2.17578125, -2.0322265625, -1.888671875, -1.7451171875, -1.6015625, -1.4580078125, -1.314453125, -1.1708984375, -1.02734375, -0.8837890625, -0.740234375, -0.5966796875, -0.453125, -0.3095703125, -0.166015625, -0.0224609375, 0.12109375, 0.2646484375, 0.408203125, 0.5517578125, 0.6953125, 0.8388671875, 0.982421875, 1.1259765625, 1.26953125, 1.4130859375, 1.556640625, 1.7001953125, 1.84375, 1.9873046875, 2.130859375, 2.2744140625, 2.41796875, 2.5615234375, 2.705078125, 2.8486328125, 2.9921875, 3.1357421875, 3.279296875, 3.4228515625, 3.56640625, 3.7099609375, 3.853515625, 3.9970703125, 4.140625, 4.2841796875, 4.427734375, 4.5712890625, 4.71484375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 7.0, 10.0, 7.0, 11.0, 12.0, 12.0, 17.0, 19.0, 25.0, 45.0, 51.0, 82.0, 148.0, 231.0, 516.0, 1293.0, 3907.0, 16092.0, 96723.0, 717160.0, 2234878.0, 962300.0, 132323.0, 20904.0, 4796.0, 1496.0, 510.0, 265.0, 129.0, 69.0, 49.0, 36.0, 30.0, 30.0, 17.0, 16.0, 13.0, 5.0, 9.0, 10.0, 5.0, 7.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.2296142578125, -7.951416015625, -7.6732177734375, -7.39501953125, -7.1168212890625, -6.838623046875, -6.5604248046875, -6.2822265625, -6.0040283203125, -5.725830078125, -5.4476318359375, -5.16943359375, -4.8912353515625, -4.613037109375, -4.3348388671875, -4.056640625, -3.7784423828125, -3.500244140625, -3.2220458984375, -2.94384765625, -2.6656494140625, -2.387451171875, -2.1092529296875, -1.8310546875, -1.5528564453125, -1.274658203125, -0.9964599609375, -0.71826171875, -0.4400634765625, -0.161865234375, 0.1163330078125, 0.39453125, 0.6727294921875, 0.950927734375, 1.2291259765625, 1.50732421875, 1.7855224609375, 2.063720703125, 2.3419189453125, 2.6201171875, 2.8983154296875, 3.176513671875, 3.4547119140625, 3.73291015625, 4.0111083984375, 4.289306640625, 4.5675048828125, 4.845703125, 5.1239013671875, 5.402099609375, 5.6802978515625, 5.95849609375, 6.2366943359375, 6.514892578125, 6.7930908203125, 7.0712890625, 7.3494873046875, 7.627685546875, 7.9058837890625, 8.18408203125, 8.4622802734375, 8.740478515625, 9.0186767578125, 9.296875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 1.0, 10.0, 5.0, 19.0, 26.0, 36.0, 55.0, 97.0, 131.0, 166.0, 256.0, 336.0, 460.0, 517.0, 526.0, 433.0, 296.0, 207.0, 174.0, 90.0, 77.0, 68.0, 23.0, 19.0, 18.0, 12.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5390625, -13.085693359375, -12.63232421875, -12.178955078125, -11.7255859375, -11.272216796875, -10.81884765625, -10.365478515625, -9.912109375, -9.458740234375, -9.00537109375, -8.552001953125, -8.0986328125, -7.645263671875, -7.19189453125, -6.738525390625, -6.28515625, -5.831787109375, -5.37841796875, -4.925048828125, -4.4716796875, -4.018310546875, -3.56494140625, -3.111572265625, -2.658203125, -2.204833984375, -1.75146484375, -1.298095703125, -0.8447265625, -0.391357421875, 0.06201171875, 0.515380859375, 0.96875, 1.422119140625, 1.87548828125, 2.328857421875, 2.7822265625, 3.235595703125, 3.68896484375, 4.142333984375, 4.595703125, 5.049072265625, 5.50244140625, 5.955810546875, 6.4091796875, 6.862548828125, 7.31591796875, 7.769287109375, 8.22265625, 8.676025390625, 9.12939453125, 9.582763671875, 10.0361328125, 10.489501953125, 10.94287109375, 11.396240234375, 11.849609375, 12.302978515625, 12.75634765625, 13.209716796875, 13.6630859375, 14.116455078125, 14.56982421875, 15.023193359375, 15.4765625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 16.0, 12.0, 26.0, 34.0, 44.0, 80.0, 132.0, 224.0, 568.0, 2617.0, 385589.0, 3788994.0, 14177.0, 955.0, 340.0, 182.0, 91.0, 56.0, 50.0, 30.0, 19.0, 17.0, 11.0, 5.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.8125, -56.07275390625, -54.3330078125, -52.59326171875, -50.853515625, -49.11376953125, -47.3740234375, -45.63427734375, -43.89453125, -42.15478515625, -40.4150390625, -38.67529296875, -36.935546875, -35.19580078125, -33.4560546875, -31.71630859375, -29.9765625, -28.23681640625, -26.4970703125, -24.75732421875, -23.017578125, -21.27783203125, -19.5380859375, -17.79833984375, -16.05859375, -14.31884765625, -12.5791015625, -10.83935546875, -9.099609375, -7.35986328125, -5.6201171875, -3.88037109375, -2.140625, -0.40087890625, 1.3388671875, 3.07861328125, 4.818359375, 6.55810546875, 8.2978515625, 10.03759765625, 11.77734375, 13.51708984375, 15.2568359375, 16.99658203125, 18.736328125, 20.47607421875, 22.2158203125, 23.95556640625, 25.6953125, 27.43505859375, 29.1748046875, 30.91455078125, 32.654296875, 34.39404296875, 36.1337890625, 37.87353515625, 39.61328125, 41.35302734375, 43.0927734375, 44.83251953125, 46.572265625, 48.31201171875, 50.0517578125, 51.79150390625, 53.53125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 111.0, 378.0, 402.0, 113.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-282.3742370605469, -275.4939880371094, -268.6137390136719, -261.7334899902344, -254.85325622558594, -247.97300720214844, -241.0927734375, -234.2125244140625, -227.332275390625, -220.4520263671875, -213.57177734375, -206.69154357910156, -199.81129455566406, -192.93104553222656, -186.05081176757812, -179.17056274414062, -172.29031372070312, -165.41006469726562, -158.52981567382812, -151.6495819091797, -144.7693328857422, -137.8890838623047, -131.00885009765625, -124.12860107421875, -117.24835205078125, -110.36810302734375, -103.48786163330078, -96.60762023925781, -89.72737121582031, -82.84712219238281, -75.96688079833984, -69.08663940429688, -62.20637512207031, -55.32612991333008, -48.445884704589844, -41.56563949584961, -34.685394287109375, -27.80514907836914, -20.924903869628906, -14.044658660888672, -7.1644134521484375, -0.2841682434082031, 6.596076965332031, 13.476322174072266, 20.3565673828125, 27.236812591552734, 34.11705780029297, 40.9973030090332, 47.87754821777344, 54.75779342651367, 61.638038635253906, 68.51828002929688, 75.39852905273438, 82.27877807617188, 89.15901947021484, 96.03926086425781, 102.91950988769531, 109.79975891113281, 116.68000030517578, 123.56024169921875, 130.44049072265625, 137.32073974609375, 144.20098876953125, 151.0812225341797, 157.9614715576172]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 3.0, 8.0, 9.0, 12.0, 13.0, 8.0, 20.0, 21.0, 19.0, 23.0, 27.0, 19.0, 35.0, 37.0, 26.0, 41.0, 41.0, 49.0, 39.0, 46.0, 40.0, 40.0, 31.0, 25.0, 42.0, 29.0, 44.0, 38.0, 40.0, 24.0, 24.0, 12.0, 15.0, 16.0, 10.0, 16.0, 9.0, 14.0, 7.0, 10.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.73896408081055, -39.46942138671875, -38.19987869262695, -36.930335998535156, -35.66079330444336, -34.39125061035156, -33.121707916259766, -31.85216522216797, -30.582622528076172, -29.313079833984375, -28.043537139892578, -26.77399444580078, -25.504451751708984, -24.234909057617188, -22.96536636352539, -21.695823669433594, -20.426280975341797, -19.15673828125, -17.887195587158203, -16.617652893066406, -15.34811019897461, -14.078567504882812, -12.809024810791016, -11.539482116699219, -10.269939422607422, -9.000396728515625, -7.730854034423828, -6.461311340332031, -5.191768646240234, -3.9222259521484375, -2.6526832580566406, -1.3831405639648438, -0.1136016845703125, 1.1559410095214844, 2.4254837036132812, 3.695026397705078, 4.964569091796875, 6.234111785888672, 7.503654479980469, 8.773197174072266, 10.042739868164062, 11.31228256225586, 12.581825256347656, 13.851367950439453, 15.12091064453125, 16.390453338623047, 17.659996032714844, 18.92953872680664, 20.199081420898438, 21.468624114990234, 22.73816680908203, 24.007709503173828, 25.277252197265625, 26.546794891357422, 27.81633758544922, 29.085880279541016, 30.355422973632812, 31.62496566772461, 32.894508361816406, 34.1640510559082, 35.43359375, 36.7031364440918, 37.972679138183594, 39.24222183227539, 40.51176452636719]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 10.0, 9.0, 8.0, 5.0, 14.0, 9.0, 13.0, 20.0, 21.0, 22.0, 21.0, 27.0, 31.0, 40.0, 41.0, 42.0, 38.0, 39.0, 42.0, 34.0, 50.0, 49.0, 43.0, 34.0, 45.0, 31.0, 35.0, 30.0, 28.0, 28.0, 25.0, 20.0, 12.0, 25.0, 14.0, 13.0, 8.0, 5.0, 2.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.60546875, -4.4609375, -4.31640625, -4.171875, -4.02734375, -3.8828125, -3.73828125, -3.59375, -3.44921875, -3.3046875, -3.16015625, -3.015625, -2.87109375, -2.7265625, -2.58203125, -2.4375, -2.29296875, -2.1484375, -2.00390625, -1.859375, -1.71484375, -1.5703125, -1.42578125, -1.28125, -1.13671875, -0.9921875, -0.84765625, -0.703125, -0.55859375, -0.4140625, -0.26953125, -0.125, 0.01953125, 0.1640625, 0.30859375, 0.453125, 0.59765625, 0.7421875, 0.88671875, 1.03125, 1.17578125, 1.3203125, 1.46484375, 1.609375, 1.75390625, 1.8984375, 2.04296875, 2.1875, 2.33203125, 2.4765625, 2.62109375, 2.765625, 2.91015625, 3.0546875, 3.19921875, 3.34375, 3.48828125, 3.6328125, 3.77734375, 3.921875, 4.06640625, 4.2109375, 4.35546875, 4.5, 4.64453125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 2.0, 3.0, 9.0, 6.0, 7.0, 9.0, 27.0, 38.0, 47.0, 76.0, 100.0, 140.0, 186.0, 260.0, 393.0, 550.0, 935.0, 1324.0, 1816.0, 2910.0, 4409.0, 6682.0, 10136.0, 15556.0, 24445.0, 39063.0, 65111.0, 116630.0, 292731.0, 211639.0, 99001.0, 56776.0, 34774.0, 21770.0, 13975.0, 9166.0, 5763.0, 4006.0, 2610.0, 1761.0, 1145.0, 822.0, 542.0, 393.0, 252.0, 179.0, 130.0, 77.0, 58.0, 32.0, 28.0, 15.0, 16.0, 11.0, 11.0, 4.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.2177734375, -1.1795654296875, -1.141357421875, -1.1031494140625, -1.06494140625, -1.0267333984375, -0.988525390625, -0.9503173828125, -0.912109375, -0.8739013671875, -0.835693359375, -0.7974853515625, -0.75927734375, -0.7210693359375, -0.682861328125, -0.6446533203125, -0.6064453125, -0.5682373046875, -0.530029296875, -0.4918212890625, -0.45361328125, -0.4154052734375, -0.377197265625, -0.3389892578125, -0.30078125, -0.2625732421875, -0.224365234375, -0.1861572265625, -0.14794921875, -0.1097412109375, -0.071533203125, -0.0333251953125, 0.0048828125, 0.0430908203125, 0.081298828125, 0.1195068359375, 0.15771484375, 0.1959228515625, 0.234130859375, 0.2723388671875, 0.310546875, 0.3487548828125, 0.386962890625, 0.4251708984375, 0.46337890625, 0.5015869140625, 0.539794921875, 0.5780029296875, 0.6162109375, 0.6544189453125, 0.692626953125, 0.7308349609375, 0.76904296875, 0.8072509765625, 0.845458984375, 0.8836669921875, 0.921875, 0.9600830078125, 0.998291015625, 1.0364990234375, 1.07470703125, 1.1129150390625, 1.151123046875, 1.1893310546875, 1.2275390625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 13.0, 4.0, 7.0, 10.0, 8.0, 21.0, 14.0, 12.0, 9.0, 15.0, 27.0, 28.0, 28.0, 30.0, 33.0, 35.0, 36.0, 36.0, 41.0, 52.0, 44.0, 1061.0, 27.0, 45.0, 48.0, 37.0, 34.0, 41.0, 30.0, 20.0, 23.0, 25.0, 13.0, 17.0, 10.0, 13.0, 12.0, 12.0, 11.0, 6.0, 8.0, 6.0, 2.0, 7.0, 2.0, 2.0, 3.0, 5.0], "bins": [-3.224609375, -3.138519287109375, -3.05242919921875, -2.966339111328125, -2.8802490234375, -2.794158935546875, -2.70806884765625, -2.621978759765625, -2.535888671875, -2.449798583984375, -2.36370849609375, -2.277618408203125, -2.1915283203125, -2.105438232421875, -2.01934814453125, -1.933258056640625, -1.84716796875, -1.761077880859375, -1.67498779296875, -1.588897705078125, -1.5028076171875, -1.416717529296875, -1.33062744140625, -1.244537353515625, -1.158447265625, -1.072357177734375, -0.98626708984375, -0.900177001953125, -0.8140869140625, -0.727996826171875, -0.64190673828125, -0.555816650390625, -0.4697265625, -0.383636474609375, -0.29754638671875, -0.211456298828125, -0.1253662109375, -0.039276123046875, 0.04681396484375, 0.132904052734375, 0.218994140625, 0.305084228515625, 0.39117431640625, 0.477264404296875, 0.5633544921875, 0.649444580078125, 0.73553466796875, 0.821624755859375, 0.90771484375, 0.993804931640625, 1.07989501953125, 1.165985107421875, 1.2520751953125, 1.338165283203125, 1.42425537109375, 1.510345458984375, 1.596435546875, 1.682525634765625, 1.76861572265625, 1.854705810546875, 1.9407958984375, 2.026885986328125, 2.11297607421875, 2.199066162109375, 2.28515625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 9.0, 10.0, 29.0, 27.0, 56.0, 89.0, 123.0, 172.0, 328.0, 453.0, 700.0, 1106.0, 1740.0, 2517.0, 3534.0, 5161.0, 7542.0, 11625.0, 18031.0, 28001.0, 44346.0, 73368.0, 135262.0, 1373899.0, 164981.0, 83852.0, 49797.0, 30991.0, 20323.0, 12779.0, 8577.0, 5611.0, 3962.0, 2644.0, 1838.0, 1261.0, 915.0, 517.0, 342.0, 219.0, 140.0, 89.0, 48.0, 46.0, 23.0, 15.0, 16.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-1.212890625, -1.17681884765625, -1.1407470703125, -1.10467529296875, -1.068603515625, -1.03253173828125, -0.9964599609375, -0.96038818359375, -0.92431640625, -0.88824462890625, -0.8521728515625, -0.81610107421875, -0.780029296875, -0.74395751953125, -0.7078857421875, -0.67181396484375, -0.6357421875, -0.59967041015625, -0.5635986328125, -0.52752685546875, -0.491455078125, -0.45538330078125, -0.4193115234375, -0.38323974609375, -0.34716796875, -0.31109619140625, -0.2750244140625, -0.23895263671875, -0.202880859375, -0.16680908203125, -0.1307373046875, -0.09466552734375, -0.05859375, -0.02252197265625, 0.0135498046875, 0.04962158203125, 0.085693359375, 0.12176513671875, 0.1578369140625, 0.19390869140625, 0.22998046875, 0.26605224609375, 0.3021240234375, 0.33819580078125, 0.374267578125, 0.41033935546875, 0.4464111328125, 0.48248291015625, 0.5185546875, 0.55462646484375, 0.5906982421875, 0.62677001953125, 0.662841796875, 0.69891357421875, 0.7349853515625, 0.77105712890625, 0.80712890625, 0.84320068359375, 0.8792724609375, 0.91534423828125, 0.951416015625, 0.98748779296875, 1.0235595703125, 1.05963134765625, 1.095703125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 6.0, 8.0, 9.0, 15.0, 16.0, 19.0, 21.0, 15.0, 20.0, 18.0, 43.0, 44.0, 44.0, 71.0, 82.0, 84.0, 82.0, 60.0, 47.0, 65.0, 38.0, 31.0, 37.0, 22.0, 20.0, 19.0, 7.0, 14.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00020885467529296875, -0.0002026595175266266, -0.00019646435976028442, -0.00019026920199394226, -0.0001840740442276001, -0.00017787888646125793, -0.00017168372869491577, -0.0001654885709285736, -0.00015929341316223145, -0.00015309825539588928, -0.00014690309762954712, -0.00014070793986320496, -0.0001345127820968628, -0.00012831762433052063, -0.00012212246656417847, -0.0001159273087978363, -0.00010973215103149414, -0.00010353699326515198, -9.734183549880981e-05, -9.114667773246765e-05, -8.495151996612549e-05, -7.875636219978333e-05, -7.256120443344116e-05, -6.6366046667099e-05, -6.0170888900756836e-05, -5.397573113441467e-05, -4.778057336807251e-05, -4.158541560173035e-05, -3.5390257835388184e-05, -2.919510006904602e-05, -2.2999942302703857e-05, -1.6804784536361694e-05, -1.0609626770019531e-05, -4.414469003677368e-06, 1.780688762664795e-06, 7.975846529006958e-06, 1.4171004295349121e-05, 2.0366162061691284e-05, 2.6561319828033447e-05, 3.275647759437561e-05, 3.8951635360717773e-05, 4.5146793127059937e-05, 5.13419508934021e-05, 5.753710865974426e-05, 6.373226642608643e-05, 6.992742419242859e-05, 7.612258195877075e-05, 8.231773972511292e-05, 8.851289749145508e-05, 9.470805525779724e-05, 0.0001009032130241394, 0.00010709837079048157, 0.00011329352855682373, 0.0001194886863231659, 0.00012568384408950806, 0.00013187900185585022, 0.00013807415962219238, 0.00014426931738853455, 0.0001504644751548767, 0.00015665963292121887, 0.00016285479068756104, 0.0001690499484539032, 0.00017524510622024536, 0.00018144026398658752, 0.0001876354217529297]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 18.0, 12.0, 19.0, 28.0, 29.0, 44.0, 70.0, 98.0, 136.0, 185.0, 260.0, 437.0, 1432.0, 798005.0, 245391.0, 1048.0, 461.0, 296.0, 179.0, 109.0, 72.0, 56.0, 40.0, 41.0, 28.0, 9.0, 13.0, 6.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0040283203125, -0.003898024559020996, -0.003767728805541992, -0.0036374330520629883, -0.0035071372985839844, -0.0033768415451049805, -0.0032465457916259766, -0.0031162500381469727, -0.0029859542846679688, -0.002855658531188965, -0.002725362777709961, -0.002595067024230957, -0.002464771270751953, -0.0023344755172729492, -0.0022041797637939453, -0.0020738840103149414, -0.0019435882568359375, -0.0018132925033569336, -0.0016829967498779297, -0.0015527009963989258, -0.0014224052429199219, -0.001292109489440918, -0.001161813735961914, -0.0010315179824829102, -0.0009012222290039062, -0.0007709264755249023, -0.0006406307220458984, -0.0005103349685668945, -0.0003800392150878906, -0.0002497434616088867, -0.00011944770812988281, 1.0848045349121094e-05, 0.000141143798828125, 0.0002714395523071289, 0.0004017353057861328, 0.0005320310592651367, 0.0006623268127441406, 0.0007926225662231445, 0.0009229183197021484, 0.0010532140731811523, 0.0011835098266601562, 0.0013138055801391602, 0.001444101333618164, 0.001574397087097168, 0.0017046928405761719, 0.0018349885940551758, 0.0019652843475341797, 0.0020955801010131836, 0.0022258758544921875, 0.0023561716079711914, 0.0024864673614501953, 0.0026167631149291992, 0.002747058868408203, 0.002877354621887207, 0.003007650375366211, 0.003137946128845215, 0.0032682418823242188, 0.0033985376358032227, 0.0035288333892822266, 0.0036591291427612305, 0.0037894248962402344, 0.003919720649719238, 0.004050016403198242, 0.004180312156677246, 0.00431060791015625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 35.0, 245.0, 465.0, 230.0, 35.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000203538074856624, -0.00018842345161829144, -0.00017330881382804364, -0.00015819419058971107, -0.00014307955279946327, -0.0001279649295611307, -0.00011285030632279813, -9.773567580850795e-05, -8.262104529421777e-05, -6.750641477992758e-05, -5.2391787903616205e-05, -3.727716102730483e-05, -2.2162530513014644e-05, -7.047899998724461e-06, 8.066723239608109e-06, 2.3181353753898293e-05, 3.8295984268188477e-05, 5.341061478247866e-05, 6.852524529676884e-05, 8.363986853510141e-05, 9.87544990493916e-05, 0.00011386912956368178, 0.00012898375280201435, 0.00014409839059226215, 0.00015921301383059472, 0.0001743276370689273, 0.00018944227485917509, 0.00020455689809750766, 0.00021967152133584023, 0.00023478615912608802, 0.0002499007969163358, 0.00026501540560275316, 0.0002801300142891705, 0.0002952446520794183, 0.00031035926076583564, 0.00032547389855608344, 0.00034058853634633124, 0.00035570317413657904, 0.0003708177828229964, 0.0003859324206132442, 0.000401047058403492, 0.00041616169619373977, 0.0004312763048801571, 0.0004463909426704049, 0.0004615055804606527, 0.0004766202182509005, 0.0004917348269373178, 0.0005068494356237352, 0.0005219640443101525, 0.0005370786529965699, 0.0005521933198906481, 0.0005673079285770655, 0.0005824225372634828, 0.0005975372041575611, 0.0006126518128439784, 0.0006277664215303957, 0.000642881088424474, 0.0006579956971108913, 0.0006731103640049696, 0.0006882249726913869, 0.0007033395813778043, 0.0007184542482718825, 0.0007335688569582999, 0.0007486834656447172, 0.0007637981325387955]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 6.0, 10.0, 7.0, 10.0, 8.0, 18.0, 16.0, 24.0, 10.0, 30.0, 22.0, 24.0, 28.0, 42.0, 40.0, 43.0, 40.0, 35.0, 36.0, 50.0, 39.0, 38.0, 40.0, 34.0, 36.0, 40.0, 27.0, 24.0, 27.0, 29.0, 23.0, 20.0, 18.0, 20.0, 22.0, 11.0, 13.0, 11.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.626150131225586e-05, -9.333807975053787e-05, -9.041465818881989e-05, -8.74912366271019e-05, -8.456781506538391e-05, -8.164439350366592e-05, -7.872097194194794e-05, -7.579755038022995e-05, -7.287412881851196e-05, -6.995070725679398e-05, -6.702728569507599e-05, -6.4103864133358e-05, -6.118044257164001e-05, -5.825702100992203e-05, -5.533359944820404e-05, -5.2410177886486053e-05, -4.9486756324768066e-05, -4.656333476305008e-05, -4.363991320133209e-05, -4.0716491639614105e-05, -3.779307007789612e-05, -3.486964851617813e-05, -3.1946226954460144e-05, -2.9022805392742157e-05, -2.609938383102417e-05, -2.3175962269306183e-05, -2.0252540707588196e-05, -1.732911914587021e-05, -1.4405697584152222e-05, -1.1482276022434235e-05, -8.558854460716248e-06, -5.6354328989982605e-06, -2.7120113372802734e-06, 2.1141022443771362e-07, 3.1348317861557007e-06, 6.058253347873688e-06, 8.981674909591675e-06, 1.1905096471309662e-05, 1.4828518033027649e-05, 1.7751939594745636e-05, 2.0675361156463623e-05, 2.359878271818161e-05, 2.6522204279899597e-05, 2.9445625841617584e-05, 3.236904740333557e-05, 3.529246896505356e-05, 3.8215890526771545e-05, 4.113931208848953e-05, 4.406273365020752e-05, 4.6986155211925507e-05, 4.9909576773643494e-05, 5.283299833536148e-05, 5.575641989707947e-05, 5.8679841458797455e-05, 6.160326302051544e-05, 6.452668458223343e-05, 6.745010614395142e-05, 7.03735277056694e-05, 7.329694926738739e-05, 7.622037082910538e-05, 7.914379239082336e-05, 8.206721395254135e-05, 8.499063551425934e-05, 8.791405707597733e-05, 9.083747863769531e-05]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 10.0, 9.0, 8.0, 5.0, 14.0, 9.0, 13.0, 20.0, 21.0, 22.0, 21.0, 27.0, 31.0, 40.0, 41.0, 42.0, 38.0, 39.0, 42.0, 34.0, 50.0, 49.0, 43.0, 34.0, 45.0, 31.0, 35.0, 30.0, 28.0, 28.0, 25.0, 20.0, 12.0, 25.0, 14.0, 13.0, 8.0, 5.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.60546875, -4.4609375, -4.31640625, -4.171875, -4.02734375, -3.8828125, -3.73828125, -3.59375, -3.44921875, -3.3046875, -3.16015625, -3.015625, -2.87109375, -2.7265625, -2.58203125, -2.4375, -2.29296875, -2.1484375, -2.00390625, -1.859375, -1.71484375, -1.5703125, -1.42578125, -1.28125, -1.13671875, -0.9921875, -0.84765625, -0.703125, -0.55859375, -0.4140625, -0.26953125, -0.125, 0.01953125, 0.1640625, 0.30859375, 0.453125, 0.59765625, 0.7421875, 0.88671875, 1.03125, 1.17578125, 1.3203125, 1.46484375, 1.609375, 1.75390625, 1.8984375, 2.04296875, 2.1875, 2.33203125, 2.4765625, 2.62109375, 2.765625, 2.91015625, 3.0546875, 3.19921875, 3.34375, 3.48828125, 3.6328125, 3.77734375, 3.921875, 4.06640625, 4.2109375, 4.35546875, 4.5, 4.64453125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 12.0, 12.0, 12.0, 18.0, 22.0, 48.0, 63.0, 136.0, 203.0, 311.0, 516.0, 965.0, 1779.0, 3374.0, 6440.0, 13461.0, 28829.0, 66449.0, 150012.0, 267217.0, 257463.0, 138308.0, 61261.0, 26297.0, 12174.0, 6093.0, 3054.0, 1785.0, 900.0, 479.0, 293.0, 183.0, 123.0, 91.0, 50.0, 36.0, 22.0, 13.0, 14.0, 7.0, 8.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8359375, -2.741241455078125, -2.64654541015625, -2.551849365234375, -2.4571533203125, -2.362457275390625, -2.26776123046875, -2.173065185546875, -2.078369140625, -1.983673095703125, -1.88897705078125, -1.794281005859375, -1.6995849609375, -1.604888916015625, -1.51019287109375, -1.415496826171875, -1.32080078125, -1.226104736328125, -1.13140869140625, -1.036712646484375, -0.9420166015625, -0.847320556640625, -0.75262451171875, -0.657928466796875, -0.563232421875, -0.468536376953125, -0.37384033203125, -0.279144287109375, -0.1844482421875, -0.089752197265625, 0.00494384765625, 0.099639892578125, 0.1943359375, 0.289031982421875, 0.38372802734375, 0.478424072265625, 0.5731201171875, 0.667816162109375, 0.76251220703125, 0.857208251953125, 0.951904296875, 1.046600341796875, 1.14129638671875, 1.235992431640625, 1.3306884765625, 1.425384521484375, 1.52008056640625, 1.614776611328125, 1.70947265625, 1.804168701171875, 1.89886474609375, 1.993560791015625, 2.0882568359375, 2.182952880859375, 2.27764892578125, 2.372344970703125, 2.467041015625, 2.561737060546875, 2.65643310546875, 2.751129150390625, 2.8458251953125, 2.940521240234375, 3.03521728515625, 3.129913330078125, 3.224609375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 2.0, 9.0, 2.0, 8.0, 10.0, 9.0, 13.0, 18.0, 17.0, 12.0, 17.0, 26.0, 27.0, 33.0, 36.0, 29.0, 39.0, 39.0, 44.0, 110.0, 302.0, 1565.0, 198.0, 69.0, 47.0, 50.0, 36.0, 34.0, 27.0, 25.0, 14.0, 20.0, 26.0, 30.0, 29.0, 16.0, 10.0, 9.0, 9.0, 7.0, 9.0, 1.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-17.328125, -16.8375244140625, -16.346923828125, -15.8563232421875, -15.36572265625, -14.8751220703125, -14.384521484375, -13.8939208984375, -13.4033203125, -12.9127197265625, -12.422119140625, -11.9315185546875, -11.44091796875, -10.9503173828125, -10.459716796875, -9.9691162109375, -9.478515625, -8.9879150390625, -8.497314453125, -8.0067138671875, -7.51611328125, -7.0255126953125, -6.534912109375, -6.0443115234375, -5.5537109375, -5.0631103515625, -4.572509765625, -4.0819091796875, -3.59130859375, -3.1007080078125, -2.610107421875, -2.1195068359375, -1.62890625, -1.1383056640625, -0.647705078125, -0.1571044921875, 0.33349609375, 0.8240966796875, 1.314697265625, 1.8052978515625, 2.2958984375, 2.7864990234375, 3.277099609375, 3.7677001953125, 4.25830078125, 4.7489013671875, 5.239501953125, 5.7301025390625, 6.220703125, 6.7113037109375, 7.201904296875, 7.6925048828125, 8.18310546875, 8.6737060546875, 9.164306640625, 9.6549072265625, 10.1455078125, 10.6361083984375, 11.126708984375, 11.6173095703125, 12.10791015625, 12.5985107421875, 13.089111328125, 13.5797119140625, 14.0703125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 10.0, 2.0, 13.0, 9.0, 8.0, 16.0, 14.0, 22.0, 29.0, 30.0, 33.0, 41.0, 39.0, 60.0, 79.0, 131.0, 213.0, 319.0, 675.0, 3518.0, 116719.0, 2978677.0, 41290.0, 2220.0, 568.0, 280.0, 172.0, 116.0, 82.0, 74.0, 52.0, 42.0, 18.0, 11.0, 26.0, 15.0, 10.0, 16.0, 11.0, 9.0, 6.0, 2.0, 7.0, 9.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-21.453125, -20.697509765625, -19.94189453125, -19.186279296875, -18.4306640625, -17.675048828125, -16.91943359375, -16.163818359375, -15.408203125, -14.652587890625, -13.89697265625, -13.141357421875, -12.3857421875, -11.630126953125, -10.87451171875, -10.118896484375, -9.36328125, -8.607666015625, -7.85205078125, -7.096435546875, -6.3408203125, -5.585205078125, -4.82958984375, -4.073974609375, -3.318359375, -2.562744140625, -1.80712890625, -1.051513671875, -0.2958984375, 0.459716796875, 1.21533203125, 1.970947265625, 2.7265625, 3.482177734375, 4.23779296875, 4.993408203125, 5.7490234375, 6.504638671875, 7.26025390625, 8.015869140625, 8.771484375, 9.527099609375, 10.28271484375, 11.038330078125, 11.7939453125, 12.549560546875, 13.30517578125, 14.060791015625, 14.81640625, 15.572021484375, 16.32763671875, 17.083251953125, 17.8388671875, 18.594482421875, 19.35009765625, 20.105712890625, 20.861328125, 21.616943359375, 22.37255859375, 23.128173828125, 23.8837890625, 24.639404296875, 25.39501953125, 26.150634765625, 26.90625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 33.0, 217.0, 444.0, 277.0, 41.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.92256927490234, -100.5626449584961, -98.20271301269531, -95.84278869628906, -93.48286437988281, -91.12293243408203, -88.76300811767578, -86.403076171875, -84.04315185546875, -81.6832275390625, -79.32329559326172, -76.96337127685547, -74.60343933105469, -72.24351501464844, -69.88359069824219, -67.52366638183594, -65.16373443603516, -62.80380630493164, -60.443878173828125, -58.083953857421875, -55.72402572631836, -53.364097595214844, -51.004173278808594, -48.64424514770508, -46.28431701660156, -43.92438888549805, -41.56446075439453, -39.20453643798828, -36.844608306884766, -34.48468017578125, -32.124755859375, -29.764827728271484, -27.4049072265625, -25.044979095458984, -22.6850528717041, -20.32512664794922, -17.965198516845703, -15.605271339416504, -13.245344161987305, -10.885417938232422, -8.525489807128906, -6.165562629699707, -3.805635452270508, -1.4457082748413086, 0.9142189025878906, 3.27414608001709, 5.634073257446289, 7.993999481201172, 10.353927612304688, 12.713854789733887, 15.073781967163086, 17.43370819091797, 19.793636322021484, 22.153564453125, 24.513490676879883, 26.873416900634766, 29.23334503173828, 31.593273162841797, 33.95320129394531, 36.31312561035156, 38.67305374145508, 41.032981872558594, 43.392906188964844, 45.75283432006836, 48.112762451171875]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 7.0, 5.0, 5.0, 8.0, 8.0, 14.0, 20.0, 16.0, 21.0, 23.0, 31.0, 33.0, 27.0, 32.0, 35.0, 37.0, 35.0, 45.0, 49.0, 62.0, 51.0, 47.0, 45.0, 36.0, 36.0, 36.0, 32.0, 31.0, 26.0, 21.0, 27.0, 16.0, 13.0, 14.0, 10.0, 14.0, 9.0, 10.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.56816482543945, -49.88494110107422, -48.20171356201172, -46.518489837646484, -44.835262298583984, -43.15203857421875, -41.46881103515625, -39.785587310791016, -38.10236358642578, -36.41913986206055, -34.73591232299805, -33.05268859863281, -31.369461059570312, -29.686237335205078, -28.00301170349121, -26.319786071777344, -24.636558532714844, -22.953332901000977, -21.27010726928711, -19.586883544921875, -17.903656005859375, -16.22043228149414, -14.537206649780273, -12.853981018066406, -11.170755386352539, -9.487529754638672, -7.804304599761963, -6.121079444885254, -4.437853813171387, -2.7546281814575195, -1.0714035034179688, 0.6118221282958984, 2.2950515747070312, 3.9782769680023193, 5.661502361297607, 7.344727516174316, 9.027953147888184, 10.71117877960205, 12.394403457641602, 14.077629089355469, 15.760854721069336, 17.444080352783203, 19.12730598449707, 20.810531616210938, 22.493755340576172, 24.176982879638672, 25.860206604003906, 27.543432235717773, 29.22665786743164, 30.909883499145508, 32.593109130859375, 34.27633285522461, 35.95956039428711, 37.642784118652344, 39.326011657714844, 41.00923538208008, 42.69245910644531, 44.37568283081055, 46.05891036987305, 47.74213409423828, 49.42536163330078, 51.108585357666016, 52.79180908203125, 54.47503662109375, 56.15826416015625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 9.0, 8.0, 7.0, 6.0, 8.0, 13.0, 16.0, 24.0, 22.0, 19.0, 21.0, 20.0, 33.0, 37.0, 45.0, 44.0, 31.0, 34.0, 45.0, 43.0, 40.0, 49.0, 38.0, 35.0, 33.0, 40.0, 40.0, 29.0, 33.0, 26.0, 27.0, 20.0, 17.0, 19.0, 8.0, 17.0, 8.0, 8.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.37713623046875, -4.2308349609375, -4.08453369140625, -3.938232421875, -3.79193115234375, -3.6456298828125, -3.49932861328125, -3.35302734375, -3.20672607421875, -3.0604248046875, -2.91412353515625, -2.767822265625, -2.62152099609375, -2.4752197265625, -2.32891845703125, -2.1826171875, -2.03631591796875, -1.8900146484375, -1.74371337890625, -1.597412109375, -1.45111083984375, -1.3048095703125, -1.15850830078125, -1.01220703125, -0.86590576171875, -0.7196044921875, -0.57330322265625, -0.427001953125, -0.28070068359375, -0.1343994140625, 0.01190185546875, 0.158203125, 0.30450439453125, 0.4508056640625, 0.59710693359375, 0.743408203125, 0.88970947265625, 1.0360107421875, 1.18231201171875, 1.32861328125, 1.47491455078125, 1.6212158203125, 1.76751708984375, 1.913818359375, 2.06011962890625, 2.2064208984375, 2.35272216796875, 2.4990234375, 2.64532470703125, 2.7916259765625, 2.93792724609375, 3.084228515625, 3.23052978515625, 3.3768310546875, 3.52313232421875, 3.66943359375, 3.81573486328125, 3.9620361328125, 4.10833740234375, 4.254638671875, 4.40093994140625, 4.5472412109375, 4.69354248046875, 4.83984375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 5.0, 3.0, 7.0, 8.0, 9.0, 10.0, 14.0, 15.0, 14.0, 19.0, 20.0, 31.0, 29.0, 47.0, 61.0, 64.0, 114.0, 230.0, 457.0, 1386.0, 6868.0, 54600.0, 679689.0, 2670003.0, 713895.0, 56938.0, 7179.0, 1406.0, 492.0, 175.0, 118.0, 93.0, 55.0, 41.0, 28.0, 26.0, 17.0, 29.0, 8.0, 16.0, 15.0, 8.0, 9.0, 7.0, 4.0, 0.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-11.96875, -11.6005859375, -11.232421875, -10.8642578125, -10.49609375, -10.1279296875, -9.759765625, -9.3916015625, -9.0234375, -8.6552734375, -8.287109375, -7.9189453125, -7.55078125, -7.1826171875, -6.814453125, -6.4462890625, -6.078125, -5.7099609375, -5.341796875, -4.9736328125, -4.60546875, -4.2373046875, -3.869140625, -3.5009765625, -3.1328125, -2.7646484375, -2.396484375, -2.0283203125, -1.66015625, -1.2919921875, -0.923828125, -0.5556640625, -0.1875, 0.1806640625, 0.548828125, 0.9169921875, 1.28515625, 1.6533203125, 2.021484375, 2.3896484375, 2.7578125, 3.1259765625, 3.494140625, 3.8623046875, 4.23046875, 4.5986328125, 4.966796875, 5.3349609375, 5.703125, 6.0712890625, 6.439453125, 6.8076171875, 7.17578125, 7.5439453125, 7.912109375, 8.2802734375, 8.6484375, 9.0166015625, 9.384765625, 9.7529296875, 10.12109375, 10.4892578125, 10.857421875, 11.2255859375, 11.59375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 3.0, 10.0, 6.0, 13.0, 11.0, 17.0, 17.0, 35.0, 35.0, 49.0, 58.0, 83.0, 89.0, 125.0, 160.0, 195.0, 248.0, 285.0, 304.0, 380.0, 348.0, 281.0, 303.0, 217.0, 168.0, 151.0, 98.0, 84.0, 72.0, 60.0, 38.0, 34.0, 25.0, 17.0, 15.0, 8.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.1328125, -9.8231201171875, -9.513427734375, -9.2037353515625, -8.89404296875, -8.5843505859375, -8.274658203125, -7.9649658203125, -7.6552734375, -7.3455810546875, -7.035888671875, -6.7261962890625, -6.41650390625, -6.1068115234375, -5.797119140625, -5.4874267578125, -5.177734375, -4.8680419921875, -4.558349609375, -4.2486572265625, -3.93896484375, -3.6292724609375, -3.319580078125, -3.0098876953125, -2.7001953125, -2.3905029296875, -2.080810546875, -1.7711181640625, -1.46142578125, -1.1517333984375, -0.842041015625, -0.5323486328125, -0.22265625, 0.0870361328125, 0.396728515625, 0.7064208984375, 1.01611328125, 1.3258056640625, 1.635498046875, 1.9451904296875, 2.2548828125, 2.5645751953125, 2.874267578125, 3.1839599609375, 3.49365234375, 3.8033447265625, 4.113037109375, 4.4227294921875, 4.732421875, 5.0421142578125, 5.351806640625, 5.6614990234375, 5.97119140625, 6.2808837890625, 6.590576171875, 6.9002685546875, 7.2099609375, 7.5196533203125, 7.829345703125, 8.1390380859375, 8.44873046875, 8.7584228515625, 9.068115234375, 9.3778076171875, 9.6875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 4.0, 10.0, 7.0, 10.0, 24.0, 24.0, 30.0, 44.0, 66.0, 86.0, 92.0, 133.0, 226.0, 382.0, 937.0, 7494.0, 340927.0, 3703003.0, 134710.0, 4354.0, 676.0, 276.0, 204.0, 139.0, 89.0, 68.0, 61.0, 50.0, 44.0, 34.0, 20.0, 16.0, 13.0, 4.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.78125, -32.669921875, -31.55859375, -30.447265625, -29.3359375, -28.224609375, -27.11328125, -26.001953125, -24.890625, -23.779296875, -22.66796875, -21.556640625, -20.4453125, -19.333984375, -18.22265625, -17.111328125, -16.0, -14.888671875, -13.77734375, -12.666015625, -11.5546875, -10.443359375, -9.33203125, -8.220703125, -7.109375, -5.998046875, -4.88671875, -3.775390625, -2.6640625, -1.552734375, -0.44140625, 0.669921875, 1.78125, 2.892578125, 4.00390625, 5.115234375, 6.2265625, 7.337890625, 8.44921875, 9.560546875, 10.671875, 11.783203125, 12.89453125, 14.005859375, 15.1171875, 16.228515625, 17.33984375, 18.451171875, 19.5625, 20.673828125, 21.78515625, 22.896484375, 24.0078125, 25.119140625, 26.23046875, 27.341796875, 28.453125, 29.564453125, 30.67578125, 31.787109375, 32.8984375, 34.009765625, 35.12109375, 36.232421875, 37.34375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 16.0, 38.0, 62.0, 125.0, 170.0, 191.0, 143.0, 129.0, 76.0, 34.0, 14.0, 12.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.45832443237305, -29.862314224243164, -27.26630401611328, -24.6702938079834, -22.074283599853516, -19.478273391723633, -16.88226318359375, -14.286252975463867, -11.690242767333984, -9.094232559204102, -6.498222351074219, -3.902212142944336, -1.3062019348144531, 1.2898082733154297, 3.8858184814453125, 6.481828689575195, 9.077838897705078, 11.673849105834961, 14.269859313964844, 16.865869522094727, 19.46187973022461, 22.057889938354492, 24.653900146484375, 27.249910354614258, 29.84592056274414, 32.441932678222656, 35.037940979003906, 37.633949279785156, 40.22996139526367, 42.82597351074219, 45.42198181152344, 48.01799011230469, 50.61399841308594, 53.21000671386719, 55.8060188293457, 58.40203094482422, 60.99803924560547, 63.59404754638672, 66.1900634765625, 68.78607177734375, 71.382080078125, 73.97808837890625, 76.5740966796875, 79.17011260986328, 81.76612091064453, 84.36212921142578, 86.95814514160156, 89.55415344238281, 92.15016174316406, 94.74617004394531, 97.34217834472656, 99.93819427490234, 102.5342025756836, 105.13021087646484, 107.72622680664062, 110.32223510742188, 112.91824340820312, 115.51425170898438, 118.11026000976562, 120.7062759399414, 123.30228424072266, 125.8982925415039, 128.4943084716797, 131.09031677246094, 133.6863250732422]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 7.0, 5.0, 7.0, 19.0, 12.0, 14.0, 16.0, 20.0, 27.0, 23.0, 15.0, 26.0, 26.0, 30.0, 24.0, 24.0, 37.0, 28.0, 47.0, 40.0, 51.0, 30.0, 40.0, 22.0, 46.0, 32.0, 33.0, 32.0, 26.0, 36.0, 23.0, 19.0, 19.0, 20.0, 18.0, 17.0, 10.0, 12.0, 4.0, 10.0, 6.0, 8.0, 6.0, 1.0, 3.0, 9.0, 5.0, 5.0, 1.0, 4.0, 4.0, 0.0, 2.0], "bins": [-35.34066390991211, -34.23487091064453, -33.12907791137695, -32.023284912109375, -30.91749382019043, -29.81170082092285, -28.705907821655273, -27.600114822387695, -26.49432373046875, -25.388530731201172, -24.282737731933594, -23.176944732666016, -22.07115364074707, -20.965360641479492, -19.859567642211914, -18.753774642944336, -17.647981643676758, -16.54218864440918, -15.436396598815918, -14.33060359954834, -13.224811553955078, -12.1190185546875, -11.013225555419922, -9.907432556152344, -8.801640510559082, -7.695847988128662, -6.590055465698242, -5.484262466430664, -4.378469944000244, -3.272677421569824, -2.166884422302246, -1.0610918998718262, 0.04470062255859375, 1.1504932641983032, 2.2562859058380127, 3.3620786666870117, 4.467871189117432, 5.573663711547852, 6.67945671081543, 7.78524923324585, 8.89104175567627, 9.996834754943848, 11.10262680053711, 12.208419799804688, 13.314212799072266, 14.420004844665527, 15.525797843933105, 16.631589889526367, 17.737382888793945, 18.843175888061523, 19.9489688873291, 21.054759979248047, 22.160552978515625, 23.266345977783203, 24.37213897705078, 25.47793197631836, 26.583724975585938, 27.689517974853516, 28.795310974121094, 29.901103973388672, 31.006895065307617, 32.11268615722656, 33.218482971191406, 34.32427215576172, 35.4300651550293]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 8.0, 11.0, 9.0, 10.0, 15.0, 19.0, 21.0, 17.0, 27.0, 41.0, 35.0, 33.0, 33.0, 28.0, 36.0, 43.0, 44.0, 51.0, 35.0, 45.0, 42.0, 36.0, 39.0, 36.0, 30.0, 26.0, 29.0, 27.0, 31.0, 20.0, 21.0, 18.0, 12.0, 10.0, 10.0, 10.0, 6.0, 10.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.953125, -4.8038330078125, -4.654541015625, -4.5052490234375, -4.35595703125, -4.2066650390625, -4.057373046875, -3.9080810546875, -3.7587890625, -3.6094970703125, -3.460205078125, -3.3109130859375, -3.16162109375, -3.0123291015625, -2.863037109375, -2.7137451171875, -2.564453125, -2.4151611328125, -2.265869140625, -2.1165771484375, -1.96728515625, -1.8179931640625, -1.668701171875, -1.5194091796875, -1.3701171875, -1.2208251953125, -1.071533203125, -0.9222412109375, -0.77294921875, -0.6236572265625, -0.474365234375, -0.3250732421875, -0.17578125, -0.0264892578125, 0.122802734375, 0.2720947265625, 0.42138671875, 0.5706787109375, 0.719970703125, 0.8692626953125, 1.0185546875, 1.1678466796875, 1.317138671875, 1.4664306640625, 1.61572265625, 1.7650146484375, 1.914306640625, 2.0635986328125, 2.212890625, 2.3621826171875, 2.511474609375, 2.6607666015625, 2.81005859375, 2.9593505859375, 3.108642578125, 3.2579345703125, 3.4072265625, 3.5565185546875, 3.705810546875, 3.8551025390625, 4.00439453125, 4.1536865234375, 4.302978515625, 4.4522705078125, 4.6015625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 5.0, 16.0, 11.0, 15.0, 26.0, 36.0, 56.0, 63.0, 111.0, 177.0, 218.0, 315.0, 491.0, 626.0, 924.0, 1449.0, 1953.0, 3003.0, 4234.0, 6386.0, 9337.0, 14247.0, 21350.0, 32555.0, 50620.0, 82282.0, 160251.0, 316283.0, 133531.0, 73427.0, 45529.0, 29662.0, 19520.0, 12816.0, 8582.0, 5792.0, 3971.0, 2623.0, 1960.0, 1234.0, 873.0, 618.0, 377.0, 339.0, 218.0, 129.0, 95.0, 87.0, 30.0, 30.0, 27.0, 19.0, 16.0, 7.0, 5.0, 4.0, 6.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.0901031494140625, -1.054229736328125, -1.0183563232421875, -0.98248291015625, -0.9466094970703125, -0.910736083984375, -0.8748626708984375, -0.8389892578125, -0.8031158447265625, -0.767242431640625, -0.7313690185546875, -0.69549560546875, -0.6596221923828125, -0.623748779296875, -0.5878753662109375, -0.552001953125, -0.5161285400390625, -0.480255126953125, -0.4443817138671875, -0.40850830078125, -0.3726348876953125, -0.336761474609375, -0.3008880615234375, -0.2650146484375, -0.2291412353515625, -0.193267822265625, -0.1573944091796875, -0.12152099609375, -0.0856475830078125, -0.049774169921875, -0.0139007568359375, 0.02197265625, 0.0578460693359375, 0.093719482421875, 0.1295928955078125, 0.16546630859375, 0.2013397216796875, 0.237213134765625, 0.2730865478515625, 0.3089599609375, 0.3448333740234375, 0.380706787109375, 0.4165802001953125, 0.45245361328125, 0.4883270263671875, 0.524200439453125, 0.5600738525390625, 0.595947265625, 0.6318206787109375, 0.667694091796875, 0.7035675048828125, 0.73944091796875, 0.7753143310546875, 0.811187744140625, 0.8470611572265625, 0.8829345703125, 0.9188079833984375, 0.954681396484375, 0.9905548095703125, 1.02642822265625, 1.0623016357421875, 1.098175048828125, 1.1340484619140625, 1.169921875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 7.0, 6.0, 11.0, 16.0, 11.0, 11.0, 20.0, 19.0, 20.0, 25.0, 26.0, 28.0, 33.0, 39.0, 38.0, 55.0, 33.0, 39.0, 1059.0, 39.0, 47.0, 45.0, 48.0, 33.0, 38.0, 36.0, 37.0, 29.0, 30.0, 22.0, 18.0, 26.0, 20.0, 12.0, 4.0, 11.0, 4.0, 5.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.30859375, -3.210418701171875, -3.11224365234375, -3.014068603515625, -2.9158935546875, -2.817718505859375, -2.71954345703125, -2.621368408203125, -2.523193359375, -2.425018310546875, -2.32684326171875, -2.228668212890625, -2.1304931640625, -2.032318115234375, -1.93414306640625, -1.835968017578125, -1.73779296875, -1.639617919921875, -1.54144287109375, -1.443267822265625, -1.3450927734375, -1.246917724609375, -1.14874267578125, -1.050567626953125, -0.952392578125, -0.854217529296875, -0.75604248046875, -0.657867431640625, -0.5596923828125, -0.461517333984375, -0.36334228515625, -0.265167236328125, -0.1669921875, -0.068817138671875, 0.02935791015625, 0.127532958984375, 0.2257080078125, 0.323883056640625, 0.42205810546875, 0.520233154296875, 0.618408203125, 0.716583251953125, 0.81475830078125, 0.912933349609375, 1.0111083984375, 1.109283447265625, 1.20745849609375, 1.305633544921875, 1.40380859375, 1.501983642578125, 1.60015869140625, 1.698333740234375, 1.7965087890625, 1.894683837890625, 1.99285888671875, 2.091033935546875, 2.189208984375, 2.287384033203125, 2.38555908203125, 2.483734130859375, 2.5819091796875, 2.680084228515625, 2.77825927734375, 2.876434326171875, 2.974609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 10.0, 21.0, 18.0, 35.0, 52.0, 82.0, 122.0, 162.0, 247.0, 325.0, 483.0, 715.0, 1118.0, 1617.0, 2436.0, 3535.0, 5385.0, 7885.0, 12058.0, 18497.0, 28877.0, 45698.0, 74449.0, 131042.0, 1352486.0, 168382.0, 89775.0, 54219.0, 34204.0, 21460.0, 13831.0, 9338.0, 6073.0, 3995.0, 2706.0, 1885.0, 1244.0, 832.0, 604.0, 376.0, 260.0, 204.0, 103.0, 91.0, 63.0, 45.0, 25.0, 17.0, 18.0, 9.0, 6.0, 4.0, 4.0, 0.0, 4.0], "bins": [-1.24609375, -1.2090911865234375, -1.172088623046875, -1.1350860595703125, -1.09808349609375, -1.0610809326171875, -1.024078369140625, -0.9870758056640625, -0.9500732421875, -0.9130706787109375, -0.876068115234375, -0.8390655517578125, -0.80206298828125, -0.7650604248046875, -0.728057861328125, -0.6910552978515625, -0.654052734375, -0.6170501708984375, -0.580047607421875, -0.5430450439453125, -0.50604248046875, -0.4690399169921875, -0.432037353515625, -0.3950347900390625, -0.3580322265625, -0.3210296630859375, -0.284027099609375, -0.2470245361328125, -0.21002197265625, -0.1730194091796875, -0.136016845703125, -0.0990142822265625, -0.06201171875, -0.0250091552734375, 0.011993408203125, 0.0489959716796875, 0.08599853515625, 0.1230010986328125, 0.160003662109375, 0.1970062255859375, 0.2340087890625, 0.2710113525390625, 0.308013916015625, 0.3450164794921875, 0.38201904296875, 0.4190216064453125, 0.456024169921875, 0.4930267333984375, 0.530029296875, 0.5670318603515625, 0.604034423828125, 0.6410369873046875, 0.67803955078125, 0.7150421142578125, 0.752044677734375, 0.7890472412109375, 0.8260498046875, 0.8630523681640625, 0.900054931640625, 0.9370574951171875, 0.97406005859375, 1.0110626220703125, 1.048065185546875, 1.0850677490234375, 1.1220703125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 19.0, 9.0, 17.0, 20.0, 19.0, 20.0, 39.0, 44.0, 47.0, 58.0, 83.0, 98.0, 85.0, 87.0, 81.0, 62.0, 45.0, 33.0, 18.0, 22.0, 19.0, 11.0, 15.0, 6.0, 6.0, 6.0, 6.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0002275705337524414, -0.00022162310779094696, -0.00021567568182945251, -0.00020972825586795807, -0.00020378082990646362, -0.00019783340394496918, -0.00019188597798347473, -0.00018593855202198029, -0.00017999112606048584, -0.0001740437000989914, -0.00016809627413749695, -0.0001621488481760025, -0.00015620142221450806, -0.0001502539962530136, -0.00014430657029151917, -0.00013835914433002472, -0.00013241171836853027, -0.00012646429240703583, -0.00012051686644554138, -0.00011456944048404694, -0.00010862201452255249, -0.00010267458856105804, -9.67271625995636e-05, -9.077973663806915e-05, -8.483231067657471e-05, -7.888488471508026e-05, -7.293745875358582e-05, -6.699003279209137e-05, -6.104260683059692e-05, -5.509518086910248e-05, -4.914775490760803e-05, -4.3200328946113586e-05, -3.725290298461914e-05, -3.1305477023124695e-05, -2.535805106163025e-05, -1.9410625100135803e-05, -1.3463199138641357e-05, -7.515773177146912e-06, -1.5683472156524658e-06, 4.37907874584198e-06, 1.0326504707336426e-05, 1.627393066883087e-05, 2.2221356630325317e-05, 2.8168782591819763e-05, 3.411620855331421e-05, 4.0063634514808655e-05, 4.60110604763031e-05, 5.1958486437797546e-05, 5.790591239929199e-05, 6.385333836078644e-05, 6.980076432228088e-05, 7.574819028377533e-05, 8.169561624526978e-05, 8.764304220676422e-05, 9.359046816825867e-05, 9.953789412975311e-05, 0.00010548532009124756, 0.000111432746052742, 0.00011738017201423645, 0.0001233275979757309, 0.00012927502393722534, 0.0001352224498987198, 0.00014116987586021423, 0.00014711730182170868, 0.00015306472778320312]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 9.0, 5.0, 17.0, 17.0, 23.0, 21.0, 47.0, 71.0, 106.0, 164.0, 290.0, 563.0, 5043.0, 1030815.0, 9979.0, 601.0, 292.0, 163.0, 117.0, 69.0, 38.0, 40.0, 22.0, 17.0, 10.0, 4.0, 1.0, 6.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003307342529296875, -0.0031669139862060547, -0.0030264854431152344, -0.002886056900024414, -0.0027456283569335938, -0.0026051998138427734, -0.002464771270751953, -0.002324342727661133, -0.0021839141845703125, -0.002043485641479492, -0.0019030570983886719, -0.0017626285552978516, -0.0016222000122070312, -0.001481771469116211, -0.0013413429260253906, -0.0012009143829345703, -0.00106048583984375, -0.0009200572967529297, -0.0007796287536621094, -0.0006392002105712891, -0.0004987716674804688, -0.00035834312438964844, -0.00021791458129882812, -7.748603820800781e-05, 6.29425048828125e-05, 0.0002033710479736328, 0.0003437995910644531, 0.00048422813415527344, 0.0006246566772460938, 0.0007650852203369141, 0.0009055137634277344, 0.0010459423065185547, 0.001186370849609375, 0.0013267993927001953, 0.0014672279357910156, 0.001607656478881836, 0.0017480850219726562, 0.0018885135650634766, 0.002028942108154297, 0.002169370651245117, 0.0023097991943359375, 0.002450227737426758, 0.002590656280517578, 0.0027310848236083984, 0.0028715133666992188, 0.003011941909790039, 0.0031523704528808594, 0.0032927989959716797, 0.0034332275390625, 0.0035736560821533203, 0.0037140846252441406, 0.003854513168334961, 0.003994941711425781, 0.0041353702545166016, 0.004275798797607422, 0.004416227340698242, 0.0045566558837890625, 0.004697084426879883, 0.004837512969970703, 0.0049779415130615234, 0.005118370056152344, 0.005258798599243164, 0.005399227142333984, 0.005539655685424805, 0.005680084228515625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 13.0, 44.0, 91.0, 189.0, 238.0, 195.0, 156.0, 54.0, 21.0, 9.0, 1.0], "bins": [-0.0004177834198344499, -0.0004105457628611475, -0.0004033081349916756, -0.00039607047801837325, -0.00038883285014890134, -0.000381595193175599, -0.00037435756530612707, -0.0003671199083328247, -0.0003598822804633528, -0.00035264462349005044, -0.00034540699562057853, -0.00033816933864727616, -0.00033093171077780426, -0.0003236940538045019, -0.00031645642593503, -0.0003092187689617276, -0.00030198111198842525, -0.0002947434550151229, -0.000287505827145651, -0.0002802681701723486, -0.0002730305423028767, -0.00026579288532957435, -0.00025855525746010244, -0.0002513176004868001, -0.00024407997261732817, -0.00023684233019594103, -0.0002296046877745539, -0.00022236704535316676, -0.00021512940293177962, -0.00020789174595847726, -0.00020065411808900535, -0.000193416461115703, -0.00018617883324623108, -0.00017894119082484394, -0.0001717035484034568, -0.00016446590598206967, -0.00015722826356068254, -0.00014999060658738017, -0.00014275297871790826, -0.0001355153217446059, -0.00012827767932321876, -0.00012104003690183163, -0.00011380239448044449, -0.00010656475205905735, -9.93271023617126e-05, -9.208945994032547e-05, -8.485181751893833e-05, -7.761416782159358e-05, -7.037652540020645e-05, -6.313888297881931e-05, -5.590123691945337e-05, -4.866359449806623e-05, -4.142594843870029e-05, -3.418830601731315e-05, -2.6950663595926017e-05, -1.9713017536560073e-05, -1.2475378753151745e-05, -5.237734967522556e-06, 1.9999088181066327e-06, 9.23755214898847e-06, 1.647519638936501e-05, 2.371284062974155e-05, 3.0950483051128685e-05, 3.818812911049463e-05, 4.5425771531881765e-05]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 4.0, 6.0, 7.0, 7.0, 12.0, 12.0, 13.0, 20.0, 22.0, 25.0, 26.0, 29.0, 37.0, 36.0, 30.0, 34.0, 29.0, 45.0, 51.0, 41.0, 65.0, 42.0, 43.0, 58.0, 43.0, 36.0, 25.0, 21.0, 26.0, 26.0, 24.0, 25.0, 14.0, 10.0, 12.0, 10.0, 9.0, 5.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.903575897216797e-05, -7.644761353731155e-05, -7.385946810245514e-05, -7.127132266759872e-05, -6.868317723274231e-05, -6.60950317978859e-05, -6.350688636302948e-05, -6.0918740928173065e-05, -5.833059549331665e-05, -5.5742450058460236e-05, -5.315430462360382e-05, -5.0566159188747406e-05, -4.797801375389099e-05, -4.5389868319034576e-05, -4.280172288417816e-05, -4.021357744932175e-05, -3.762543201446533e-05, -3.503728657960892e-05, -3.24491411447525e-05, -2.9860995709896088e-05, -2.7272850275039673e-05, -2.4684704840183258e-05, -2.2096559405326843e-05, -1.950841397047043e-05, -1.6920268535614014e-05, -1.4332123100757599e-05, -1.1743977665901184e-05, -9.15583223104477e-06, -6.5676867961883545e-06, -3.97954136133194e-06, -1.391395926475525e-06, 1.1967495083808899e-06, 3.7848949432373047e-06, 6.3730403780937195e-06, 8.961185812950134e-06, 1.1549331247806549e-05, 1.4137476682662964e-05, 1.672562211751938e-05, 1.9313767552375793e-05, 2.1901912987232208e-05, 2.4490058422088623e-05, 2.7078203856945038e-05, 2.9666349291801453e-05, 3.225449472665787e-05, 3.484264016151428e-05, 3.74307855963707e-05, 4.001893103122711e-05, 4.2607076466083527e-05, 4.519522190093994e-05, 4.7783367335796356e-05, 5.037151277065277e-05, 5.2959658205509186e-05, 5.55478036403656e-05, 5.8135949075222015e-05, 6.072409451007843e-05, 6.331223994493484e-05, 6.590038537979126e-05, 6.848853081464767e-05, 7.107667624950409e-05, 7.36648216843605e-05, 7.625296711921692e-05, 7.884111255407333e-05, 8.142925798892975e-05, 8.401740342378616e-05, 8.660554885864258e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 8.0, 11.0, 9.0, 10.0, 15.0, 19.0, 21.0, 17.0, 27.0, 41.0, 35.0, 33.0, 33.0, 28.0, 36.0, 43.0, 44.0, 51.0, 35.0, 45.0, 42.0, 36.0, 39.0, 36.0, 30.0, 26.0, 29.0, 27.0, 31.0, 20.0, 21.0, 18.0, 12.0, 10.0, 10.0, 10.0, 6.0, 10.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.953125, -4.8038330078125, -4.654541015625, -4.5052490234375, -4.35595703125, -4.2066650390625, -4.057373046875, -3.9080810546875, -3.7587890625, -3.6094970703125, -3.460205078125, -3.3109130859375, -3.16162109375, -3.0123291015625, -2.863037109375, -2.7137451171875, -2.564453125, -2.4151611328125, -2.265869140625, -2.1165771484375, -1.96728515625, -1.8179931640625, -1.668701171875, -1.5194091796875, -1.3701171875, -1.2208251953125, -1.071533203125, -0.9222412109375, -0.77294921875, -0.6236572265625, -0.474365234375, -0.3250732421875, -0.17578125, -0.0264892578125, 0.122802734375, 0.2720947265625, 0.42138671875, 0.5706787109375, 0.719970703125, 0.8692626953125, 1.0185546875, 1.1678466796875, 1.317138671875, 1.4664306640625, 1.61572265625, 1.7650146484375, 1.914306640625, 2.0635986328125, 2.212890625, 2.3621826171875, 2.511474609375, 2.6607666015625, 2.81005859375, 2.9593505859375, 3.108642578125, 3.2579345703125, 3.4072265625, 3.5565185546875, 3.705810546875, 3.8551025390625, 4.00439453125, 4.1536865234375, 4.302978515625, 4.4522705078125, 4.6015625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 5.0, 12.0, 18.0, 18.0, 32.0, 43.0, 46.0, 66.0, 94.0, 175.0, 203.0, 272.0, 352.0, 679.0, 761.0, 1199.0, 1825.0, 2682.0, 3995.0, 6393.0, 10328.0, 19616.0, 42917.0, 113328.0, 317537.0, 319703.0, 114012.0, 43478.0, 19405.0, 10469.0, 6347.0, 3960.0, 2679.0, 1828.0, 1257.0, 830.0, 568.0, 401.0, 279.0, 180.0, 149.0, 120.0, 77.0, 57.0, 39.0, 33.0, 27.0, 18.0, 15.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0], "bins": [-4.70703125, -4.568603515625, -4.43017578125, -4.291748046875, -4.1533203125, -4.014892578125, -3.87646484375, -3.738037109375, -3.599609375, -3.461181640625, -3.32275390625, -3.184326171875, -3.0458984375, -2.907470703125, -2.76904296875, -2.630615234375, -2.4921875, -2.353759765625, -2.21533203125, -2.076904296875, -1.9384765625, -1.800048828125, -1.66162109375, -1.523193359375, -1.384765625, -1.246337890625, -1.10791015625, -0.969482421875, -0.8310546875, -0.692626953125, -0.55419921875, -0.415771484375, -0.27734375, -0.138916015625, -0.00048828125, 0.137939453125, 0.2763671875, 0.414794921875, 0.55322265625, 0.691650390625, 0.830078125, 0.968505859375, 1.10693359375, 1.245361328125, 1.3837890625, 1.522216796875, 1.66064453125, 1.799072265625, 1.9375, 2.075927734375, 2.21435546875, 2.352783203125, 2.4912109375, 2.629638671875, 2.76806640625, 2.906494140625, 3.044921875, 3.183349609375, 3.32177734375, 3.460205078125, 3.5986328125, 3.737060546875, 3.87548828125, 4.013916015625, 4.15234375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 6.0, 8.0, 8.0, 14.0, 9.0, 16.0, 16.0, 19.0, 19.0, 32.0, 26.0, 26.0, 33.0, 37.0, 36.0, 30.0, 43.0, 61.0, 109.0, 213.0, 1501.0, 218.0, 120.0, 59.0, 54.0, 29.0, 33.0, 26.0, 28.0, 30.0, 22.0, 24.0, 21.0, 20.0, 10.0, 15.0, 11.0, 13.0, 6.0, 8.0, 4.0, 4.0, 7.0, 3.0, 4.0, 1.0, 7.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.3203125, -14.86328125, -14.40625, -13.94921875, -13.4921875, -13.03515625, -12.578125, -12.12109375, -11.6640625, -11.20703125, -10.75, -10.29296875, -9.8359375, -9.37890625, -8.921875, -8.46484375, -8.0078125, -7.55078125, -7.09375, -6.63671875, -6.1796875, -5.72265625, -5.265625, -4.80859375, -4.3515625, -3.89453125, -3.4375, -2.98046875, -2.5234375, -2.06640625, -1.609375, -1.15234375, -0.6953125, -0.23828125, 0.21875, 0.67578125, 1.1328125, 1.58984375, 2.046875, 2.50390625, 2.9609375, 3.41796875, 3.875, 4.33203125, 4.7890625, 5.24609375, 5.703125, 6.16015625, 6.6171875, 7.07421875, 7.53125, 7.98828125, 8.4453125, 8.90234375, 9.359375, 9.81640625, 10.2734375, 10.73046875, 11.1875, 11.64453125, 12.1015625, 12.55859375, 13.015625, 13.47265625, 13.9296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 7.0, 11.0, 17.0, 16.0, 13.0, 23.0, 38.0, 45.0, 68.0, 100.0, 200.0, 289.0, 703.0, 5273.0, 2348123.0, 785297.0, 4003.0, 616.0, 320.0, 155.0, 116.0, 68.0, 59.0, 35.0, 33.0, 17.0, 19.0, 14.0, 7.0, 9.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.5, -47.0712890625, -45.642578125, -44.2138671875, -42.78515625, -41.3564453125, -39.927734375, -38.4990234375, -37.0703125, -35.6416015625, -34.212890625, -32.7841796875, -31.35546875, -29.9267578125, -28.498046875, -27.0693359375, -25.640625, -24.2119140625, -22.783203125, -21.3544921875, -19.92578125, -18.4970703125, -17.068359375, -15.6396484375, -14.2109375, -12.7822265625, -11.353515625, -9.9248046875, -8.49609375, -7.0673828125, -5.638671875, -4.2099609375, -2.78125, -1.3525390625, 0.076171875, 1.5048828125, 2.93359375, 4.3623046875, 5.791015625, 7.2197265625, 8.6484375, 10.0771484375, 11.505859375, 12.9345703125, 14.36328125, 15.7919921875, 17.220703125, 18.6494140625, 20.078125, 21.5068359375, 22.935546875, 24.3642578125, 25.79296875, 27.2216796875, 28.650390625, 30.0791015625, 31.5078125, 32.9365234375, 34.365234375, 35.7939453125, 37.22265625, 38.6513671875, 40.080078125, 41.5087890625, 42.9375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 41.0, 551.0, 406.0, 16.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.082496643066406, -14.234087944030762, -9.385679244995117, -4.537270545959473, 0.3111381530761719, 5.1595458984375, 10.007955551147461, 14.856365203857422, 19.70477294921875, 24.553180694580078, 29.40159034729004, 34.25, 39.09840774536133, 43.946815490722656, 48.79522705078125, 53.64363479614258, 58.492042541503906, 63.340450286865234, 68.18885803222656, 73.03726959228516, 77.88568115234375, 82.73408508300781, 87.5824966430664, 92.430908203125, 97.27931213378906, 102.12772369384766, 106.97612762451172, 111.82453918457031, 116.67294311523438, 121.52135467529297, 126.36976623535156, 131.21817016601562, 136.06658935546875, 140.9149932861328, 145.76341247558594, 150.61181640625, 155.46022033691406, 160.30862426757812, 165.15704345703125, 170.0054473876953, 174.85385131835938, 179.70225524902344, 184.55067443847656, 189.39907836914062, 194.2474822998047, 199.09588623046875, 203.94430541992188, 208.79270935058594, 213.64112854003906, 218.48953247070312, 223.33795166015625, 228.1863555908203, 233.03475952148438, 237.8831787109375, 242.73158264160156, 247.57998657226562, 252.42840576171875, 257.2768249511719, 262.1252136230469, 266.9736328125, 271.8220520019531, 276.6704406738281, 281.51885986328125, 286.3672790527344, 291.2156677246094]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 12.0, 9.0, 11.0, 15.0, 9.0, 13.0, 21.0, 20.0, 22.0, 38.0, 32.0, 32.0, 26.0, 39.0, 39.0, 38.0, 38.0, 35.0, 62.0, 50.0, 41.0, 27.0, 40.0, 34.0, 31.0, 35.0, 25.0, 28.0, 26.0, 13.0, 15.0, 17.0, 9.0, 23.0, 11.0, 13.0, 4.0, 13.0, 4.0, 3.0, 10.0, 4.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.79249572753906, -46.234886169433594, -44.677276611328125, -43.119667053222656, -41.56205749511719, -40.00444412231445, -38.446834564208984, -36.889225006103516, -35.33161544799805, -33.77400588989258, -32.21639633178711, -30.658784866333008, -29.10117530822754, -27.54356575012207, -25.98595428466797, -24.4283447265625, -22.87073516845703, -21.313125610351562, -19.755516052246094, -18.197904586791992, -16.640295028686523, -15.082685470581055, -13.52507495880127, -11.967464447021484, -10.409854888916016, -8.852245330810547, -7.294634819030762, -5.737024784088135, -4.179414749145508, -2.621804714202881, -1.064194679260254, 0.49341583251953125, 2.0510292053222656, 3.6086392402648926, 5.1662492752075195, 6.7238593101501465, 8.281469345092773, 9.839078903198242, 11.396689414978027, 12.954299926757812, 14.511909484863281, 16.06951904296875, 17.62712860107422, 19.18474006652832, 20.74234962463379, 22.299959182739258, 23.85757064819336, 25.415180206298828, 26.972789764404297, 28.530399322509766, 30.088008880615234, 31.645620346069336, 33.20323181152344, 34.760841369628906, 36.318450927734375, 37.876060485839844, 39.43367004394531, 40.99127960205078, 42.54888916015625, 44.10649871826172, 45.66410827636719, 47.22172164916992, 48.77933120727539, 50.33694076538086, 51.89455032348633]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 5.0, 13.0, 9.0, 7.0, 14.0, 13.0, 21.0, 16.0, 29.0, 31.0, 35.0, 35.0, 26.0, 33.0, 44.0, 40.0, 51.0, 37.0, 43.0, 47.0, 47.0, 47.0, 39.0, 38.0, 19.0, 27.0, 28.0, 39.0, 28.0, 22.0, 17.0, 15.0, 13.0, 14.0, 16.0, 6.0, 8.0, 5.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.1796875, -5.02056884765625, -4.8614501953125, -4.70233154296875, -4.543212890625, -4.38409423828125, -4.2249755859375, -4.06585693359375, -3.90673828125, -3.74761962890625, -3.5885009765625, -3.42938232421875, -3.270263671875, -3.11114501953125, -2.9520263671875, -2.79290771484375, -2.6337890625, -2.47467041015625, -2.3155517578125, -2.15643310546875, -1.997314453125, -1.83819580078125, -1.6790771484375, -1.51995849609375, -1.36083984375, -1.20172119140625, -1.0426025390625, -0.88348388671875, -0.724365234375, -0.56524658203125, -0.4061279296875, -0.24700927734375, -0.087890625, 0.07122802734375, 0.2303466796875, 0.38946533203125, 0.548583984375, 0.70770263671875, 0.8668212890625, 1.02593994140625, 1.18505859375, 1.34417724609375, 1.5032958984375, 1.66241455078125, 1.821533203125, 1.98065185546875, 2.1397705078125, 2.29888916015625, 2.4580078125, 2.61712646484375, 2.7762451171875, 2.93536376953125, 3.094482421875, 3.25360107421875, 3.4127197265625, 3.57183837890625, 3.73095703125, 3.89007568359375, 4.0491943359375, 4.20831298828125, 4.367431640625, 4.52655029296875, 4.6856689453125, 4.84478759765625, 5.00390625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 8.0, 11.0, 13.0, 15.0, 19.0, 25.0, 32.0, 50.0, 62.0, 112.0, 169.0, 255.0, 543.0, 908.0, 1941.0, 4589.0, 12152.0, 37635.0, 133844.0, 473881.0, 1216369.0, 1399336.0, 643836.0, 189762.0, 52056.0, 16018.0, 5777.0, 2337.0, 1138.0, 522.0, 300.0, 198.0, 113.0, 81.0, 51.0, 34.0, 26.0, 19.0, 10.0, 12.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.90032958984375, -5.7108154296875, -5.52130126953125, -5.331787109375, -5.14227294921875, -4.9527587890625, -4.76324462890625, -4.57373046875, -4.38421630859375, -4.1947021484375, -4.00518798828125, -3.815673828125, -3.62615966796875, -3.4366455078125, -3.24713134765625, -3.0576171875, -2.86810302734375, -2.6785888671875, -2.48907470703125, -2.299560546875, -2.11004638671875, -1.9205322265625, -1.73101806640625, -1.54150390625, -1.35198974609375, -1.1624755859375, -0.97296142578125, -0.783447265625, -0.59393310546875, -0.4044189453125, -0.21490478515625, -0.025390625, 0.16412353515625, 0.3536376953125, 0.54315185546875, 0.732666015625, 0.92218017578125, 1.1116943359375, 1.30120849609375, 1.49072265625, 1.68023681640625, 1.8697509765625, 2.05926513671875, 2.248779296875, 2.43829345703125, 2.6278076171875, 2.81732177734375, 3.0068359375, 3.19635009765625, 3.3858642578125, 3.57537841796875, 3.764892578125, 3.95440673828125, 4.1439208984375, 4.33343505859375, 4.52294921875, 4.71246337890625, 4.9019775390625, 5.09149169921875, 5.281005859375, 5.47052001953125, 5.6600341796875, 5.84954833984375, 6.0390625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 6.0, 14.0, 15.0, 20.0, 22.0, 32.0, 45.0, 64.0, 86.0, 122.0, 160.0, 229.0, 296.0, 368.0, 400.0, 400.0, 406.0, 352.0, 270.0, 202.0, 145.0, 108.0, 96.0, 58.0, 52.0, 37.0, 20.0, 15.0, 12.0, 10.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.171875, -13.781982421875, -13.39208984375, -13.002197265625, -12.6123046875, -12.222412109375, -11.83251953125, -11.442626953125, -11.052734375, -10.662841796875, -10.27294921875, -9.883056640625, -9.4931640625, -9.103271484375, -8.71337890625, -8.323486328125, -7.93359375, -7.543701171875, -7.15380859375, -6.763916015625, -6.3740234375, -5.984130859375, -5.59423828125, -5.204345703125, -4.814453125, -4.424560546875, -4.03466796875, -3.644775390625, -3.2548828125, -2.864990234375, -2.47509765625, -2.085205078125, -1.6953125, -1.305419921875, -0.91552734375, -0.525634765625, -0.1357421875, 0.254150390625, 0.64404296875, 1.033935546875, 1.423828125, 1.813720703125, 2.20361328125, 2.593505859375, 2.9833984375, 3.373291015625, 3.76318359375, 4.153076171875, 4.54296875, 4.932861328125, 5.32275390625, 5.712646484375, 6.1025390625, 6.492431640625, 6.88232421875, 7.272216796875, 7.662109375, 8.052001953125, 8.44189453125, 8.831787109375, 9.2216796875, 9.611572265625, 10.00146484375, 10.391357421875, 10.78125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 3.0, 7.0, 11.0, 9.0, 13.0, 14.0, 32.0, 41.0, 40.0, 58.0, 66.0, 114.0, 171.0, 298.0, 829.0, 5661.0, 259857.0, 3775228.0, 146096.0, 4098.0, 716.0, 263.0, 188.0, 135.0, 82.0, 51.0, 50.0, 30.0, 24.0, 27.0, 21.0, 15.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.375, -24.19140625, -23.0078125, -21.82421875, -20.640625, -19.45703125, -18.2734375, -17.08984375, -15.90625, -14.72265625, -13.5390625, -12.35546875, -11.171875, -9.98828125, -8.8046875, -7.62109375, -6.4375, -5.25390625, -4.0703125, -2.88671875, -1.703125, -0.51953125, 0.6640625, 1.84765625, 3.03125, 4.21484375, 5.3984375, 6.58203125, 7.765625, 8.94921875, 10.1328125, 11.31640625, 12.5, 13.68359375, 14.8671875, 16.05078125, 17.234375, 18.41796875, 19.6015625, 20.78515625, 21.96875, 23.15234375, 24.3359375, 25.51953125, 26.703125, 27.88671875, 29.0703125, 30.25390625, 31.4375, 32.62109375, 33.8046875, 34.98828125, 36.171875, 37.35546875, 38.5390625, 39.72265625, 40.90625, 42.08984375, 43.2734375, 44.45703125, 45.640625, 46.82421875, 48.0078125, 49.19140625, 50.375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 30.0, 69.0, 157.0, 206.0, 252.0, 152.0, 89.0, 38.0, 11.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-181.41685485839844, -177.7894287109375, -174.16201782226562, -170.53460693359375, -166.9071807861328, -163.27975463867188, -159.65234375, -156.02493286132812, -152.3975067138672, -148.77008056640625, -145.14266967773438, -141.5152587890625, -137.88783264160156, -134.26040649414062, -130.63299560546875, -127.00557708740234, -123.37815856933594, -119.75074005126953, -116.12332153320312, -112.49590301513672, -108.86848449707031, -105.2410659790039, -101.6136474609375, -97.9862289428711, -94.35881042480469, -90.73139190673828, -87.10397338867188, -83.47655487060547, -79.84913635253906, -76.22171783447266, -72.59429931640625, -68.96688079833984, -65.33946228027344, -61.71204376220703, -58.084625244140625, -54.45720672607422, -50.82978820800781, -47.202369689941406, -43.574951171875, -39.947532653808594, -36.32011413574219, -32.69269561767578, -29.065277099609375, -25.43785858154297, -21.810440063476562, -18.183021545410156, -14.55560302734375, -10.928184509277344, -7.3007659912109375, -3.6733474731445312, -0.045928955078125, 3.5814895629882812, 7.2089080810546875, 10.836326599121094, 14.4637451171875, 18.091163635253906, 21.718582153320312, 25.34600067138672, 28.973419189453125, 32.60083770751953, 36.22825622558594, 39.855674743652344, 43.48309326171875, 47.110511779785156, 50.73793029785156]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 9.0, 5.0, 6.0, 8.0, 11.0, 14.0, 14.0, 12.0, 15.0, 14.0, 18.0, 23.0, 26.0, 33.0, 33.0, 43.0, 28.0, 33.0, 33.0, 48.0, 38.0, 50.0, 44.0, 40.0, 47.0, 37.0, 28.0, 40.0, 24.0, 25.0, 29.0, 21.0, 28.0, 28.0, 21.0, 17.0, 18.0, 11.0, 7.0, 7.0, 8.0, 6.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.00314712524414, -39.75244140625, -38.501731872558594, -37.25102615356445, -36.00032043457031, -34.74961471557617, -33.49890899658203, -32.248199462890625, -30.997493743896484, -29.746788024902344, -28.49608039855957, -27.245372772216797, -25.994667053222656, -24.743961334228516, -23.493253707885742, -22.24254608154297, -20.991840362548828, -19.741134643554688, -18.490427017211914, -17.23971939086914, -15.989013671875, -14.738306999206543, -13.487600326538086, -12.236893653869629, -10.986186981201172, -9.735480308532715, -8.484773635864258, -7.234066963195801, -5.983360290527344, -4.732653617858887, -3.4819469451904297, -2.2312402725219727, -0.9805335998535156, 0.2701730728149414, 1.5208797454833984, 2.7715864181518555, 4.0222930908203125, 5.2729997634887695, 6.523706436157227, 7.774413108825684, 9.02511978149414, 10.275826454162598, 11.526533126831055, 12.777239799499512, 14.027946472167969, 15.278653144836426, 16.529359817504883, 17.780067443847656, 19.030773162841797, 20.281478881835938, 21.53218650817871, 22.782894134521484, 24.033599853515625, 25.284305572509766, 26.53501319885254, 27.785720825195312, 29.036426544189453, 30.287132263183594, 31.537839889526367, 32.78854751586914, 34.03925323486328, 35.28995895385742, 36.54066467285156, 37.79137420654297, 39.04207992553711]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 10.0, 12.0, 10.0, 16.0, 10.0, 24.0, 19.0, 24.0, 29.0, 24.0, 26.0, 36.0, 38.0, 42.0, 50.0, 38.0, 41.0, 46.0, 44.0, 50.0, 30.0, 34.0, 29.0, 33.0, 39.0, 27.0, 29.0, 21.0, 25.0, 21.0, 20.0, 12.0, 18.0, 9.0, 14.0, 10.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.0, -4.84271240234375, -4.6854248046875, -4.52813720703125, -4.370849609375, -4.21356201171875, -4.0562744140625, -3.89898681640625, -3.74169921875, -3.58441162109375, -3.4271240234375, -3.26983642578125, -3.112548828125, -2.95526123046875, -2.7979736328125, -2.64068603515625, -2.4833984375, -2.32611083984375, -2.1688232421875, -2.01153564453125, -1.854248046875, -1.69696044921875, -1.5396728515625, -1.38238525390625, -1.22509765625, -1.06781005859375, -0.9105224609375, -0.75323486328125, -0.595947265625, -0.43865966796875, -0.2813720703125, -0.12408447265625, 0.033203125, 0.19049072265625, 0.3477783203125, 0.50506591796875, 0.662353515625, 0.81964111328125, 0.9769287109375, 1.13421630859375, 1.29150390625, 1.44879150390625, 1.6060791015625, 1.76336669921875, 1.920654296875, 2.07794189453125, 2.2352294921875, 2.39251708984375, 2.5498046875, 2.70709228515625, 2.8643798828125, 3.02166748046875, 3.178955078125, 3.33624267578125, 3.4935302734375, 3.65081787109375, 3.80810546875, 3.96539306640625, 4.1226806640625, 4.27996826171875, 4.437255859375, 4.59454345703125, 4.7518310546875, 4.90911865234375, 5.06640625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 5.0, 3.0, 5.0, 7.0, 10.0, 13.0, 15.0, 33.0, 38.0, 69.0, 89.0, 142.0, 157.0, 256.0, 401.0, 545.0, 752.0, 1017.0, 1459.0, 2029.0, 2879.0, 4052.0, 5593.0, 8202.0, 11536.0, 16502.0, 23920.0, 35964.0, 54944.0, 89435.0, 175801.0, 293101.0, 115176.0, 67327.0, 42948.0, 28711.0, 19480.0, 13444.0, 9498.0, 6726.0, 4724.0, 3354.0, 2428.0, 1705.0, 1207.0, 858.0, 583.0, 416.0, 295.0, 206.0, 163.0, 92.0, 71.0, 54.0, 32.0, 34.0, 28.0, 12.0, 10.0, 5.0, 3.0, 2.0, 5.0], "bins": [-1.1376953125, -1.102386474609375, -1.06707763671875, -1.031768798828125, -0.9964599609375, -0.961151123046875, -0.92584228515625, -0.890533447265625, -0.855224609375, -0.819915771484375, -0.78460693359375, -0.749298095703125, -0.7139892578125, -0.678680419921875, -0.64337158203125, -0.608062744140625, -0.57275390625, -0.537445068359375, -0.50213623046875, -0.466827392578125, -0.4315185546875, -0.396209716796875, -0.36090087890625, -0.325592041015625, -0.290283203125, -0.254974365234375, -0.21966552734375, -0.184356689453125, -0.1490478515625, -0.113739013671875, -0.07843017578125, -0.043121337890625, -0.0078125, 0.027496337890625, 0.06280517578125, 0.098114013671875, 0.1334228515625, 0.168731689453125, 0.20404052734375, 0.239349365234375, 0.274658203125, 0.309967041015625, 0.34527587890625, 0.380584716796875, 0.4158935546875, 0.451202392578125, 0.48651123046875, 0.521820068359375, 0.55712890625, 0.592437744140625, 0.62774658203125, 0.663055419921875, 0.6983642578125, 0.733673095703125, 0.76898193359375, 0.804290771484375, 0.839599609375, 0.874908447265625, 0.91021728515625, 0.945526123046875, 0.9808349609375, 1.016143798828125, 1.05145263671875, 1.086761474609375, 1.1220703125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 6.0, 5.0, 9.0, 9.0, 7.0, 14.0, 9.0, 17.0, 21.0, 22.0, 25.0, 27.0, 22.0, 33.0, 26.0, 42.0, 38.0, 45.0, 36.0, 42.0, 54.0, 1061.0, 36.0, 45.0, 36.0, 26.0, 40.0, 39.0, 33.0, 29.0, 22.0, 25.0, 26.0, 11.0, 17.0, 17.0, 9.0, 14.0, 8.0, 5.0, 5.0, 5.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.833984375, -2.733123779296875, -2.63226318359375, -2.531402587890625, -2.4305419921875, -2.329681396484375, -2.22882080078125, -2.127960205078125, -2.027099609375, -1.926239013671875, -1.82537841796875, -1.724517822265625, -1.6236572265625, -1.522796630859375, -1.42193603515625, -1.321075439453125, -1.22021484375, -1.119354248046875, -1.01849365234375, -0.917633056640625, -0.8167724609375, -0.715911865234375, -0.61505126953125, -0.514190673828125, -0.413330078125, -0.312469482421875, -0.21160888671875, -0.110748291015625, -0.0098876953125, 0.090972900390625, 0.19183349609375, 0.292694091796875, 0.3935546875, 0.494415283203125, 0.59527587890625, 0.696136474609375, 0.7969970703125, 0.897857666015625, 0.99871826171875, 1.099578857421875, 1.200439453125, 1.301300048828125, 1.40216064453125, 1.503021240234375, 1.6038818359375, 1.704742431640625, 1.80560302734375, 1.906463623046875, 2.00732421875, 2.108184814453125, 2.20904541015625, 2.309906005859375, 2.4107666015625, 2.511627197265625, 2.61248779296875, 2.713348388671875, 2.814208984375, 2.915069580078125, 3.01593017578125, 3.116790771484375, 3.2176513671875, 3.318511962890625, 3.41937255859375, 3.520233154296875, 3.62109375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 11.0, 22.0, 22.0, 47.0, 53.0, 72.0, 134.0, 201.0, 297.0, 483.0, 688.0, 1059.0, 1643.0, 2479.0, 3610.0, 5542.0, 8550.0, 13231.0, 20661.0, 32892.0, 52681.0, 86139.0, 158249.0, 1373625.0, 130964.0, 75709.0, 46642.0, 28957.0, 18241.0, 11732.0, 7799.0, 4956.0, 3271.0, 2213.0, 1444.0, 987.0, 654.0, 405.0, 267.0, 178.0, 109.0, 76.0, 55.0, 18.0, 29.0, 6.0, 10.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1871185302734375, -1.146697998046875, -1.1062774658203125, -1.06585693359375, -1.0254364013671875, -0.985015869140625, -0.9445953369140625, -0.9041748046875, -0.8637542724609375, -0.823333740234375, -0.7829132080078125, -0.74249267578125, -0.7020721435546875, -0.661651611328125, -0.6212310791015625, -0.580810546875, -0.5403900146484375, -0.499969482421875, -0.4595489501953125, -0.41912841796875, -0.3787078857421875, -0.338287353515625, -0.2978668212890625, -0.2574462890625, -0.2170257568359375, -0.176605224609375, -0.1361846923828125, -0.09576416015625, -0.0553436279296875, -0.014923095703125, 0.0254974365234375, 0.06591796875, 0.1063385009765625, 0.146759033203125, 0.1871795654296875, 0.22760009765625, 0.2680206298828125, 0.308441162109375, 0.3488616943359375, 0.3892822265625, 0.4297027587890625, 0.470123291015625, 0.5105438232421875, 0.55096435546875, 0.5913848876953125, 0.631805419921875, 0.6722259521484375, 0.712646484375, 0.7530670166015625, 0.793487548828125, 0.8339080810546875, 0.87432861328125, 0.9147491455078125, 0.955169677734375, 0.9955902099609375, 1.0360107421875, 1.0764312744140625, 1.116851806640625, 1.1572723388671875, 1.19769287109375, 1.2381134033203125, 1.278533935546875, 1.3189544677734375, 1.359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 6.0, 10.0, 10.0, 14.0, 16.0, 14.0, 10.0, 27.0, 30.0, 47.0, 42.0, 47.0, 68.0, 60.0, 82.0, 68.0, 72.0, 76.0, 44.0, 54.0, 32.0, 28.0, 21.0, 23.0, 23.0, 13.0, 8.0, 9.0, 8.0, 9.0, 8.0, 0.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001659393310546875, -0.00016040727496147156, -0.00015487521886825562, -0.00014934316277503967, -0.00014381110668182373, -0.0001382790505886078, -0.00013274699449539185, -0.0001272149384021759, -0.00012168288230895996, -0.00011615082621574402, -0.00011061877012252808, -0.00010508671402931213, -9.955465793609619e-05, -9.402260184288025e-05, -8.84905457496643e-05, -8.295848965644836e-05, -7.742643356323242e-05, -7.189437747001648e-05, -6.636232137680054e-05, -6.0830265283584595e-05, -5.529820919036865e-05, -4.976615309715271e-05, -4.423409700393677e-05, -3.8702040910720825e-05, -3.316998481750488e-05, -2.763792872428894e-05, -2.2105872631072998e-05, -1.6573816537857056e-05, -1.1041760444641113e-05, -5.509704351425171e-06, 2.2351741790771484e-08, 5.554407835006714e-06, 1.1086463928222656e-05, 1.66185200214386e-05, 2.215057611465454e-05, 2.7682632207870483e-05, 3.3214688301086426e-05, 3.874674439430237e-05, 4.427880048751831e-05, 4.981085658073425e-05, 5.5342912673950195e-05, 6.087496876716614e-05, 6.640702486038208e-05, 7.193908095359802e-05, 7.747113704681396e-05, 8.300319314002991e-05, 8.853524923324585e-05, 9.406730532646179e-05, 9.959936141967773e-05, 0.00010513141751289368, 0.00011066347360610962, 0.00011619552969932556, 0.0001217275857925415, 0.00012725964188575745, 0.0001327916979789734, 0.00013832375407218933, 0.00014385581016540527, 0.00014938786625862122, 0.00015491992235183716, 0.0001604519784450531, 0.00016598403453826904, 0.00017151609063148499, 0.00017704814672470093, 0.00018258020281791687, 0.0001881122589111328]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 2.0, 14.0, 10.0, 13.0, 11.0, 14.0, 10.0, 25.0, 36.0, 46.0, 62.0, 108.0, 186.0, 275.0, 503.0, 2242.0, 807225.0, 235229.0, 1306.0, 469.0, 248.0, 173.0, 90.0, 65.0, 54.0, 29.0, 25.0, 11.0, 23.0, 13.0, 12.0, 9.0, 5.0, 3.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003971099853515625, -0.003853917121887207, -0.003736734390258789, -0.003619551658630371, -0.003502368927001953, -0.003385186195373535, -0.003268003463745117, -0.0031508207321166992, -0.0030336380004882812, -0.0029164552688598633, -0.0027992725372314453, -0.0026820898056030273, -0.0025649070739746094, -0.0024477243423461914, -0.0023305416107177734, -0.0022133588790893555, -0.0020961761474609375, -0.0019789934158325195, -0.0018618106842041016, -0.0017446279525756836, -0.0016274452209472656, -0.0015102624893188477, -0.0013930797576904297, -0.0012758970260620117, -0.0011587142944335938, -0.0010415315628051758, -0.0009243488311767578, -0.0008071660995483398, -0.0006899833679199219, -0.0005728006362915039, -0.00045561790466308594, -0.00033843517303466797, -0.00022125244140625, -0.00010406970977783203, 1.3113021850585938e-05, 0.0001302957534790039, 0.0002474784851074219, 0.00036466121673583984, 0.0004818439483642578, 0.0005990266799926758, 0.0007162094116210938, 0.0008333921432495117, 0.0009505748748779297, 0.0010677576065063477, 0.0011849403381347656, 0.0013021230697631836, 0.0014193058013916016, 0.0015364885330200195, 0.0016536712646484375, 0.0017708539962768555, 0.0018880367279052734, 0.0020052194595336914, 0.0021224021911621094, 0.0022395849227905273, 0.0023567676544189453, 0.0024739503860473633, 0.0025911331176757812, 0.0027083158493041992, 0.002825498580932617, 0.002942681312561035, 0.003059864044189453, 0.003177046775817871, 0.003294229507446289, 0.003411412239074707, 0.003528594970703125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 15.0, 24.0, 43.0, 80.0, 91.0, 131.0, 157.0, 137.0, 105.0, 72.0, 57.0, 49.0, 24.0, 11.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017996500537265092, -0.00017478116205893457, -0.000169597304193303, -0.00016441346087958664, -0.00015922961756587029, -0.0001540457597002387, -0.00014886191638652235, -0.000143678073072806, -0.00013849421520717442, -0.00013331037189345807, -0.0001281265140278265, -0.00012294267071411014, -0.00011775882740039378, -0.00011257497681071982, -0.00010739112622104585, -0.0001022072829073295, -9.702343959361315e-05, -9.183958900393918e-05, -8.665574569022283e-05, -8.147189510054886e-05, -7.628805178683251e-05, -7.110420119715855e-05, -6.592035060748458e-05, -6.073650365578942e-05, -5.555265670409426e-05, -5.03688097523991e-05, -4.518496280070394e-05, -4.0001112211029977e-05, -3.481726525933482e-05, -2.963341830763966e-05, -2.4449567717965692e-05, -1.9265720766270533e-05, -1.4081859262660146e-05, -8.898011401470285e-06, -3.714163540280424e-06, 1.4696852304041386e-06, 6.653532182099298e-06, 1.1837379133794457e-05, 1.7021229723468423e-05, 2.2205076675163582e-05, 2.738892362685874e-05, 3.25727705785539e-05, 3.775661753024906e-05, 4.2940468119923025e-05, 4.8124315071618184e-05, 5.3308162023313344e-05, 5.849201261298731e-05, 6.367586320266128e-05, 6.885970651637763e-05, 7.40435571060516e-05, 7.922740041976795e-05, 8.441125100944191e-05, 8.959509432315826e-05, 9.477894491283223e-05, 9.99627955025062e-05, 0.00010514663881622255, 0.00011033048940589651, 0.00011551433999557048, 0.00012069818330928683, 0.0001258820411749184, 0.00013106588448863477, 0.00013624972780235112, 0.0001414335856679827, 0.00014661742898169905, 0.0001518012722954154]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 6.0, 6.0, 4.0, 12.0, 12.0, 13.0, 18.0, 18.0, 15.0, 29.0, 32.0, 30.0, 29.0, 40.0, 29.0, 33.0, 50.0, 38.0, 56.0, 48.0, 30.0, 39.0, 36.0, 40.0, 36.0, 48.0, 39.0, 30.0, 30.0, 25.0, 22.0, 17.0, 20.0, 9.0, 18.0, 12.0, 10.0, 7.0, 5.0, 3.0, 1.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010561943054199219, -0.00010267645120620728, -9.973347187042236e-05, -9.679049253463745e-05, -9.384751319885254e-05, -9.090453386306763e-05, -8.796155452728271e-05, -8.50185751914978e-05, -8.207559585571289e-05, -7.913261651992798e-05, -7.618963718414307e-05, -7.324665784835815e-05, -7.030367851257324e-05, -6.736069917678833e-05, -6.441771984100342e-05, -6.14747405052185e-05, -5.8531761169433594e-05, -5.558878183364868e-05, -5.264580249786377e-05, -4.970282316207886e-05, -4.6759843826293945e-05, -4.381686449050903e-05, -4.087388515472412e-05, -3.793090581893921e-05, -3.49879264831543e-05, -3.2044947147369385e-05, -2.9101967811584473e-05, -2.615898847579956e-05, -2.321600914001465e-05, -2.0273029804229736e-05, -1.7330050468444824e-05, -1.4387071132659912e-05, -1.1444091796875e-05, -8.501112461090088e-06, -5.558133125305176e-06, -2.6151537895202637e-06, 3.2782554626464844e-07, 3.2708048820495605e-06, 6.213784217834473e-06, 9.156763553619385e-06, 1.2099742889404297e-05, 1.5042722225189209e-05, 1.798570156097412e-05, 2.0928680896759033e-05, 2.3871660232543945e-05, 2.6814639568328857e-05, 2.975761890411377e-05, 3.270059823989868e-05, 3.5643577575683594e-05, 3.8586556911468506e-05, 4.152953624725342e-05, 4.447251558303833e-05, 4.741549491882324e-05, 5.0358474254608154e-05, 5.3301453590393066e-05, 5.624443292617798e-05, 5.918741226196289e-05, 6.21303915977478e-05, 6.507337093353271e-05, 6.801635026931763e-05, 7.095932960510254e-05, 7.390230894088745e-05, 7.684528827667236e-05, 7.978826761245728e-05, 8.273124694824219e-05]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 10.0, 12.0, 10.0, 16.0, 10.0, 24.0, 19.0, 24.0, 29.0, 24.0, 26.0, 36.0, 38.0, 42.0, 50.0, 38.0, 41.0, 46.0, 44.0, 50.0, 30.0, 34.0, 29.0, 33.0, 39.0, 27.0, 29.0, 21.0, 25.0, 21.0, 20.0, 12.0, 18.0, 9.0, 14.0, 10.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.0, -4.84271240234375, -4.6854248046875, -4.52813720703125, -4.370849609375, -4.21356201171875, -4.0562744140625, -3.89898681640625, -3.74169921875, -3.58441162109375, -3.4271240234375, -3.26983642578125, -3.112548828125, -2.95526123046875, -2.7979736328125, -2.64068603515625, -2.4833984375, -2.32611083984375, -2.1688232421875, -2.01153564453125, -1.854248046875, -1.69696044921875, -1.5396728515625, -1.38238525390625, -1.22509765625, -1.06781005859375, -0.9105224609375, -0.75323486328125, -0.595947265625, -0.43865966796875, -0.2813720703125, -0.12408447265625, 0.033203125, 0.19049072265625, 0.3477783203125, 0.50506591796875, 0.662353515625, 0.81964111328125, 0.9769287109375, 1.13421630859375, 1.29150390625, 1.44879150390625, 1.6060791015625, 1.76336669921875, 1.920654296875, 2.07794189453125, 2.2352294921875, 2.39251708984375, 2.5498046875, 2.70709228515625, 2.8643798828125, 3.02166748046875, 3.178955078125, 3.33624267578125, 3.4935302734375, 3.65081787109375, 3.80810546875, 3.96539306640625, 4.1226806640625, 4.27996826171875, 4.437255859375, 4.59454345703125, 4.7518310546875, 4.90911865234375, 5.06640625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 3.0, 0.0, 8.0, 7.0, 12.0, 19.0, 18.0, 40.0, 41.0, 58.0, 89.0, 143.0, 240.0, 496.0, 998.0, 1928.0, 4042.0, 8728.0, 20259.0, 52217.0, 163947.0, 397031.0, 262655.0, 82634.0, 29658.0, 12368.0, 5536.0, 2550.0, 1259.0, 678.0, 337.0, 200.0, 109.0, 45.0, 56.0, 35.0, 27.0, 25.0, 15.0, 15.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.1903076171875, -5.009521484375, -4.8287353515625, -4.64794921875, -4.4671630859375, -4.286376953125, -4.1055908203125, -3.9248046875, -3.7440185546875, -3.563232421875, -3.3824462890625, -3.20166015625, -3.0208740234375, -2.840087890625, -2.6593017578125, -2.478515625, -2.2977294921875, -2.116943359375, -1.9361572265625, -1.75537109375, -1.5745849609375, -1.393798828125, -1.2130126953125, -1.0322265625, -0.8514404296875, -0.670654296875, -0.4898681640625, -0.30908203125, -0.1282958984375, 0.052490234375, 0.2332763671875, 0.4140625, 0.5948486328125, 0.775634765625, 0.9564208984375, 1.13720703125, 1.3179931640625, 1.498779296875, 1.6795654296875, 1.8603515625, 2.0411376953125, 2.221923828125, 2.4027099609375, 2.58349609375, 2.7642822265625, 2.945068359375, 3.1258544921875, 3.306640625, 3.4874267578125, 3.668212890625, 3.8489990234375, 4.02978515625, 4.2105712890625, 4.391357421875, 4.5721435546875, 4.7529296875, 4.9337158203125, 5.114501953125, 5.2952880859375, 5.47607421875, 5.6568603515625, 5.837646484375, 6.0184326171875, 6.19921875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 9.0, 5.0, 6.0, 4.0, 7.0, 16.0, 9.0, 13.0, 12.0, 21.0, 14.0, 28.0, 27.0, 43.0, 33.0, 32.0, 59.0, 63.0, 104.0, 193.0, 1455.0, 299.0, 142.0, 77.0, 37.0, 37.0, 36.0, 38.0, 30.0, 19.0, 29.0, 30.0, 19.0, 16.0, 22.0, 12.0, 18.0, 7.0, 3.0, 6.0, 2.0, 6.0, 2.0, 4.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.578125, -18.02734375, -17.4765625, -16.92578125, -16.375, -15.82421875, -15.2734375, -14.72265625, -14.171875, -13.62109375, -13.0703125, -12.51953125, -11.96875, -11.41796875, -10.8671875, -10.31640625, -9.765625, -9.21484375, -8.6640625, -8.11328125, -7.5625, -7.01171875, -6.4609375, -5.91015625, -5.359375, -4.80859375, -4.2578125, -3.70703125, -3.15625, -2.60546875, -2.0546875, -1.50390625, -0.953125, -0.40234375, 0.1484375, 0.69921875, 1.25, 1.80078125, 2.3515625, 2.90234375, 3.453125, 4.00390625, 4.5546875, 5.10546875, 5.65625, 6.20703125, 6.7578125, 7.30859375, 7.859375, 8.41015625, 8.9609375, 9.51171875, 10.0625, 10.61328125, 11.1640625, 11.71484375, 12.265625, 12.81640625, 13.3671875, 13.91796875, 14.46875, 15.01953125, 15.5703125, 16.12109375, 16.671875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 8.0, 13.0, 7.0, 13.0, 19.0, 34.0, 29.0, 52.0, 64.0, 61.0, 112.0, 179.0, 256.0, 436.0, 1150.0, 16831.0, 3043409.0, 79592.0, 1999.0, 533.0, 258.0, 190.0, 118.0, 84.0, 47.0, 50.0, 28.0, 32.0, 16.0, 18.0, 10.0, 16.0, 5.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.59375, -40.19091796875, -38.7880859375, -37.38525390625, -35.982421875, -34.57958984375, -33.1767578125, -31.77392578125, -30.37109375, -28.96826171875, -27.5654296875, -26.16259765625, -24.759765625, -23.35693359375, -21.9541015625, -20.55126953125, -19.1484375, -17.74560546875, -16.3427734375, -14.93994140625, -13.537109375, -12.13427734375, -10.7314453125, -9.32861328125, -7.92578125, -6.52294921875, -5.1201171875, -3.71728515625, -2.314453125, -0.91162109375, 0.4912109375, 1.89404296875, 3.296875, 4.69970703125, 6.1025390625, 7.50537109375, 8.908203125, 10.31103515625, 11.7138671875, 13.11669921875, 14.51953125, 15.92236328125, 17.3251953125, 18.72802734375, 20.130859375, 21.53369140625, 22.9365234375, 24.33935546875, 25.7421875, 27.14501953125, 28.5478515625, 29.95068359375, 31.353515625, 32.75634765625, 34.1591796875, 35.56201171875, 36.96484375, 38.36767578125, 39.7705078125, 41.17333984375, 42.576171875, 43.97900390625, 45.3818359375, 46.78466796875, 48.1875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 66.0, 553.0, 368.0, 23.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.55719757080078, -31.037094116210938, -26.516990661621094, -21.996889114379883, -17.47678565979004, -12.956682205200195, -8.436580657958984, -3.9164772033691406, 0.6036262512207031, 5.123729228973389, 9.643832206726074, 14.163934707641602, 18.684038162231445, 23.20414161682129, 27.7242431640625, 32.244346618652344, 36.76445007324219, 41.28455352783203, 45.804656982421875, 50.32476043701172, 54.84486389160156, 59.364967346191406, 63.885066986083984, 68.40516662597656, 72.92527770996094, 77.44538116455078, 81.96548461914062, 86.48558807373047, 91.00569152832031, 95.52579498291016, 100.0458984375, 104.56599426269531, 109.08609008789062, 113.60619354248047, 118.12629699707031, 122.64640045166016, 127.16650390625, 131.6865997314453, 136.2067108154297, 140.726806640625, 145.24691772460938, 149.7670135498047, 154.28712463378906, 158.80722045898438, 163.32733154296875, 167.84742736816406, 172.36753845214844, 176.88763427734375, 181.40774536132812, 185.92784118652344, 190.4479522705078, 194.96804809570312, 199.4881591796875, 204.0082550048828, 208.5283660888672, 213.0484619140625, 217.5685577392578, 222.08865356445312, 226.6087646484375, 231.1288604736328, 235.6489715576172, 240.1690673828125, 244.68917846679688, 249.2092742919922, 253.72938537597656]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 9.0, 8.0, 6.0, 7.0, 11.0, 9.0, 18.0, 17.0, 22.0, 20.0, 33.0, 22.0, 38.0, 33.0, 29.0, 34.0, 41.0, 42.0, 38.0, 37.0, 44.0, 38.0, 39.0, 41.0, 31.0, 45.0, 36.0, 36.0, 27.0, 33.0, 18.0, 17.0, 21.0, 13.0, 11.0, 10.0, 17.0, 16.0, 8.0, 9.0, 4.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-49.78704071044922, -48.39008712768555, -46.993133544921875, -45.59617614746094, -44.199222564697266, -42.802268981933594, -41.40531539916992, -40.00836181640625, -38.61140441894531, -37.21445083618164, -35.81749725341797, -34.42053985595703, -33.02358627319336, -31.626632690429688, -30.229679107666016, -28.832725524902344, -27.435771942138672, -26.038818359375, -24.641862869262695, -23.244909286499023, -21.84795379638672, -20.451000213623047, -19.054046630859375, -17.657093048095703, -16.2601375579834, -14.86318302154541, -13.466228485107422, -12.06927490234375, -10.672320365905762, -9.275365829467773, -7.878412246704102, -6.481457710266113, -5.084506988525391, -3.6875526905059814, -2.2905983924865723, -0.8936443328857422, 0.5033102035522461, 1.9002647399902344, 3.2972183227539062, 4.6941728591918945, 6.091127395629883, 7.488081932067871, 8.88503646850586, 10.281990051269531, 11.67894458770752, 13.075899124145508, 14.47285270690918, 15.869807243347168, 17.266761779785156, 18.663715362548828, 20.060670852661133, 21.457624435424805, 22.85457992553711, 24.25153350830078, 25.648487091064453, 27.045440673828125, 28.44239616394043, 29.8393497467041, 31.236305236816406, 32.63325881958008, 34.03021240234375, 35.42716979980469, 36.824119567871094, 38.22107696533203, 39.6180305480957]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 6.0, 5.0, 6.0, 9.0, 15.0, 14.0, 10.0, 17.0, 18.0, 26.0, 26.0, 27.0, 21.0, 29.0, 33.0, 32.0, 36.0, 40.0, 56.0, 39.0, 33.0, 45.0, 43.0, 41.0, 35.0, 27.0, 34.0, 30.0, 32.0, 34.0, 17.0, 21.0, 16.0, 20.0, 18.0, 15.0, 14.0, 13.0, 15.0, 9.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.0703125, -4.91156005859375, -4.7528076171875, -4.59405517578125, -4.435302734375, -4.27655029296875, -4.1177978515625, -3.95904541015625, -3.80029296875, -3.64154052734375, -3.4827880859375, -3.32403564453125, -3.165283203125, -3.00653076171875, -2.8477783203125, -2.68902587890625, -2.5302734375, -2.37152099609375, -2.2127685546875, -2.05401611328125, -1.895263671875, -1.73651123046875, -1.5777587890625, -1.41900634765625, -1.26025390625, -1.10150146484375, -0.9427490234375, -0.78399658203125, -0.625244140625, -0.46649169921875, -0.3077392578125, -0.14898681640625, 0.009765625, 0.16851806640625, 0.3272705078125, 0.48602294921875, 0.644775390625, 0.80352783203125, 0.9622802734375, 1.12103271484375, 1.27978515625, 1.43853759765625, 1.5972900390625, 1.75604248046875, 1.914794921875, 2.07354736328125, 2.2322998046875, 2.39105224609375, 2.5498046875, 2.70855712890625, 2.8673095703125, 3.02606201171875, 3.184814453125, 3.34356689453125, 3.5023193359375, 3.66107177734375, 3.81982421875, 3.97857666015625, 4.1373291015625, 4.29608154296875, 4.454833984375, 4.61358642578125, 4.7723388671875, 4.93109130859375, 5.08984375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 2.0, 8.0, 8.0, 7.0, 7.0, 9.0, 11.0, 18.0, 19.0, 28.0, 21.0, 29.0, 30.0, 46.0, 51.0, 77.0, 98.0, 132.0, 239.0, 721.0, 5454.0, 382206.0, 3653701.0, 147028.0, 3030.0, 511.0, 197.0, 144.0, 93.0, 71.0, 52.0, 39.0, 29.0, 27.0, 17.0, 22.0, 22.0, 19.0, 16.0, 6.0, 8.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.390625, -23.614013671875, -22.83740234375, -22.060791015625, -21.2841796875, -20.507568359375, -19.73095703125, -18.954345703125, -18.177734375, -17.401123046875, -16.62451171875, -15.847900390625, -15.0712890625, -14.294677734375, -13.51806640625, -12.741455078125, -11.96484375, -11.188232421875, -10.41162109375, -9.635009765625, -8.8583984375, -8.081787109375, -7.30517578125, -6.528564453125, -5.751953125, -4.975341796875, -4.19873046875, -3.422119140625, -2.6455078125, -1.868896484375, -1.09228515625, -0.315673828125, 0.4609375, 1.237548828125, 2.01416015625, 2.790771484375, 3.5673828125, 4.343994140625, 5.12060546875, 5.897216796875, 6.673828125, 7.450439453125, 8.22705078125, 9.003662109375, 9.7802734375, 10.556884765625, 11.33349609375, 12.110107421875, 12.88671875, 13.663330078125, 14.43994140625, 15.216552734375, 15.9931640625, 16.769775390625, 17.54638671875, 18.322998046875, 19.099609375, 19.876220703125, 20.65283203125, 21.429443359375, 22.2060546875, 22.982666015625, 23.75927734375, 24.535888671875, 25.3125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 10.0, 12.0, 21.0, 29.0, 45.0, 51.0, 94.0, 131.0, 229.0, 292.0, 374.0, 543.0, 566.0, 527.0, 393.0, 237.0, 185.0, 108.0, 87.0, 54.0, 25.0, 19.0, 11.0, 8.0, 6.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5234375, -13.0098876953125, -12.496337890625, -11.9827880859375, -11.46923828125, -10.9556884765625, -10.442138671875, -9.9285888671875, -9.4150390625, -8.9014892578125, -8.387939453125, -7.8743896484375, -7.36083984375, -6.8472900390625, -6.333740234375, -5.8201904296875, -5.306640625, -4.7930908203125, -4.279541015625, -3.7659912109375, -3.25244140625, -2.7388916015625, -2.225341796875, -1.7117919921875, -1.1982421875, -0.6846923828125, -0.171142578125, 0.3424072265625, 0.85595703125, 1.3695068359375, 1.883056640625, 2.3966064453125, 2.91015625, 3.4237060546875, 3.937255859375, 4.4508056640625, 4.96435546875, 5.4779052734375, 5.991455078125, 6.5050048828125, 7.0185546875, 7.5321044921875, 8.045654296875, 8.5592041015625, 9.07275390625, 9.5863037109375, 10.099853515625, 10.6134033203125, 11.126953125, 11.6405029296875, 12.154052734375, 12.6676025390625, 13.18115234375, 13.6947021484375, 14.208251953125, 14.7218017578125, 15.2353515625, 15.7489013671875, 16.262451171875, 16.7760009765625, 17.28955078125, 17.8031005859375, 18.316650390625, 18.8302001953125, 19.34375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 6.0, 10.0, 9.0, 15.0, 24.0, 27.0, 44.0, 74.0, 99.0, 123.0, 167.0, 288.0, 473.0, 1099.0, 8213.0, 1092516.0, 3066944.0, 21052.0, 1494.0, 603.0, 302.0, 195.0, 132.0, 98.0, 72.0, 46.0, 38.0, 33.0, 24.0, 18.0, 15.0, 4.0, 8.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-53.78125, -52.37060546875, -50.9599609375, -49.54931640625, -48.138671875, -46.72802734375, -45.3173828125, -43.90673828125, -42.49609375, -41.08544921875, -39.6748046875, -38.26416015625, -36.853515625, -35.44287109375, -34.0322265625, -32.62158203125, -31.2109375, -29.80029296875, -28.3896484375, -26.97900390625, -25.568359375, -24.15771484375, -22.7470703125, -21.33642578125, -19.92578125, -18.51513671875, -17.1044921875, -15.69384765625, -14.283203125, -12.87255859375, -11.4619140625, -10.05126953125, -8.640625, -7.22998046875, -5.8193359375, -4.40869140625, -2.998046875, -1.58740234375, -0.1767578125, 1.23388671875, 2.64453125, 4.05517578125, 5.4658203125, 6.87646484375, 8.287109375, 9.69775390625, 11.1083984375, 12.51904296875, 13.9296875, 15.34033203125, 16.7509765625, 18.16162109375, 19.572265625, 20.98291015625, 22.3935546875, 23.80419921875, 25.21484375, 26.62548828125, 28.0361328125, 29.44677734375, 30.857421875, 32.26806640625, 33.6787109375, 35.08935546875, 36.5]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 7.0, 12.0, 61.0, 117.0, 185.0, 212.0, 174.0, 142.0, 61.0, 25.0, 13.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.015506744384766, -30.507736206054688, -26.99996566772461, -23.49219512939453, -19.984424591064453, -16.476654052734375, -12.968883514404297, -9.461112976074219, -5.953342437744141, -2.4455718994140625, 1.0621986389160156, 4.569969177246094, 8.077739715576172, 11.58551025390625, 15.093280792236328, 18.601051330566406, 22.108821868896484, 25.616592407226562, 29.12436294555664, 32.63213348388672, 36.1399040222168, 39.647674560546875, 43.15544509887695, 46.66321563720703, 50.17098617553711, 53.67875671386719, 57.186527252197266, 60.694297790527344, 64.20207214355469, 67.7098388671875, 71.21760559082031, 74.72537994384766, 78.233154296875, 81.74092102050781, 85.24869537353516, 88.7564697265625, 92.26423645019531, 95.77200317382812, 99.27977752685547, 102.78755187988281, 106.29531860351562, 109.80308532714844, 113.31085968017578, 116.81863403320312, 120.32640075683594, 123.83416748046875, 127.3419418334961, 130.84971618652344, 134.35748291015625, 137.86524963378906, 141.37301635742188, 144.88079833984375, 148.38856506347656, 151.89633178710938, 155.40411376953125, 158.91188049316406, 162.41964721679688, 165.9274139404297, 169.4351806640625, 172.94296264648438, 176.4507293701172, 179.95849609375, 183.46627807617188, 186.9740447998047, 190.4818115234375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 12.0, 4.0, 11.0, 17.0, 12.0, 14.0, 18.0, 14.0, 25.0, 21.0, 25.0, 40.0, 41.0, 42.0, 34.0, 36.0, 37.0, 37.0, 51.0, 47.0, 45.0, 40.0, 43.0, 37.0, 34.0, 37.0, 30.0, 33.0, 22.0, 24.0, 18.0, 20.0, 17.0, 14.0, 13.0, 7.0, 4.0, 6.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.61219787597656, -47.231136322021484, -45.85007858276367, -44.469017028808594, -43.08795928955078, -41.7068977355957, -40.325836181640625, -38.94477844238281, -37.563716888427734, -36.182655334472656, -34.801597595214844, -33.420536041259766, -32.03947448730469, -30.658416748046875, -29.277355194091797, -27.89629554748535, -26.515235900878906, -25.13417625427246, -23.753116607666016, -22.372055053710938, -20.990995407104492, -19.609935760498047, -18.22887420654297, -16.847814559936523, -15.466754913330078, -14.085695266723633, -12.704634666442871, -11.32357406616211, -9.942514419555664, -8.561454772949219, -7.180394172668457, -5.799333572387695, -4.418270111083984, -3.037209987640381, -1.6561498641967773, -0.27508974075317383, 1.1059703826904297, 2.487030506134033, 3.8680906295776367, 5.249151229858398, 6.630210876464844, 8.011270523071289, 9.39233112335205, 10.773391723632812, 12.154451370239258, 13.535511016845703, 14.916571617126465, 16.297632217407227, 17.678691864013672, 19.059751510620117, 20.440811157226562, 21.82187271118164, 23.202932357788086, 24.58399200439453, 25.96505355834961, 27.346113204956055, 28.7271728515625, 30.108232498168945, 31.48929214477539, 32.87035369873047, 34.25141143798828, 35.63247299194336, 37.01353454589844, 38.39459228515625, 39.77565383911133]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 4.0, 12.0, 9.0, 14.0, 15.0, 17.0, 16.0, 21.0, 31.0, 22.0, 28.0, 39.0, 37.0, 36.0, 51.0, 52.0, 40.0, 41.0, 40.0, 33.0, 39.0, 40.0, 27.0, 34.0, 42.0, 37.0, 32.0, 37.0, 20.0, 25.0, 19.0, 14.0, 13.0, 9.0, 10.0, 12.0, 9.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4765625, -5.3017578125, -5.126953125, -4.9521484375, -4.77734375, -4.6025390625, -4.427734375, -4.2529296875, -4.078125, -3.9033203125, -3.728515625, -3.5537109375, -3.37890625, -3.2041015625, -3.029296875, -2.8544921875, -2.6796875, -2.5048828125, -2.330078125, -2.1552734375, -1.98046875, -1.8056640625, -1.630859375, -1.4560546875, -1.28125, -1.1064453125, -0.931640625, -0.7568359375, -0.58203125, -0.4072265625, -0.232421875, -0.0576171875, 0.1171875, 0.2919921875, 0.466796875, 0.6416015625, 0.81640625, 0.9912109375, 1.166015625, 1.3408203125, 1.515625, 1.6904296875, 1.865234375, 2.0400390625, 2.21484375, 2.3896484375, 2.564453125, 2.7392578125, 2.9140625, 3.0888671875, 3.263671875, 3.4384765625, 3.61328125, 3.7880859375, 3.962890625, 4.1376953125, 4.3125, 4.4873046875, 4.662109375, 4.8369140625, 5.01171875, 5.1865234375, 5.361328125, 5.5361328125, 5.7109375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 13.0, 12.0, 16.0, 30.0, 41.0, 62.0, 103.0, 150.0, 239.0, 353.0, 520.0, 829.0, 1275.0, 1922.0, 2940.0, 4581.0, 6945.0, 10746.0, 16954.0, 26934.0, 43751.0, 72649.0, 132922.0, 320795.0, 175105.0, 89431.0, 51614.0, 31727.0, 19833.0, 12687.0, 8211.0, 5316.0, 3384.0, 2253.0, 1464.0, 965.0, 620.0, 387.0, 268.0, 162.0, 120.0, 68.0, 50.0, 32.0, 28.0, 20.0, 16.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.484375, -1.4389495849609375, -1.393524169921875, -1.3480987548828125, -1.30267333984375, -1.2572479248046875, -1.211822509765625, -1.1663970947265625, -1.1209716796875, -1.0755462646484375, -1.030120849609375, -0.9846954345703125, -0.93927001953125, -0.8938446044921875, -0.848419189453125, -0.8029937744140625, -0.757568359375, -0.7121429443359375, -0.666717529296875, -0.6212921142578125, -0.57586669921875, -0.5304412841796875, -0.485015869140625, -0.4395904541015625, -0.3941650390625, -0.3487396240234375, -0.303314208984375, -0.2578887939453125, -0.21246337890625, -0.1670379638671875, -0.121612548828125, -0.0761871337890625, -0.03076171875, 0.0146636962890625, 0.060089111328125, 0.1055145263671875, 0.15093994140625, 0.1963653564453125, 0.241790771484375, 0.2872161865234375, 0.3326416015625, 0.3780670166015625, 0.423492431640625, 0.4689178466796875, 0.51434326171875, 0.5597686767578125, 0.605194091796875, 0.6506195068359375, 0.696044921875, 0.7414703369140625, 0.786895751953125, 0.8323211669921875, 0.87774658203125, 0.9231719970703125, 0.968597412109375, 1.0140228271484375, 1.0594482421875, 1.1048736572265625, 1.150299072265625, 1.1957244873046875, 1.24114990234375, 1.2865753173828125, 1.332000732421875, 1.3774261474609375, 1.4228515625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 6.0, 8.0, 5.0, 19.0, 11.0, 10.0, 13.0, 19.0, 18.0, 21.0, 22.0, 18.0, 27.0, 35.0, 35.0, 38.0, 33.0, 42.0, 32.0, 46.0, 1079.0, 39.0, 46.0, 38.0, 36.0, 32.0, 34.0, 26.0, 31.0, 19.0, 25.0, 25.0, 24.0, 26.0, 8.0, 12.0, 12.0, 11.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0], "bins": [-3.708984375, -3.6009521484375, -3.492919921875, -3.3848876953125, -3.27685546875, -3.1688232421875, -3.060791015625, -2.9527587890625, -2.8447265625, -2.7366943359375, -2.628662109375, -2.5206298828125, -2.41259765625, -2.3045654296875, -2.196533203125, -2.0885009765625, -1.98046875, -1.8724365234375, -1.764404296875, -1.6563720703125, -1.54833984375, -1.4403076171875, -1.332275390625, -1.2242431640625, -1.1162109375, -1.0081787109375, -0.900146484375, -0.7921142578125, -0.68408203125, -0.5760498046875, -0.468017578125, -0.3599853515625, -0.251953125, -0.1439208984375, -0.035888671875, 0.0721435546875, 0.18017578125, 0.2882080078125, 0.396240234375, 0.5042724609375, 0.6123046875, 0.7203369140625, 0.828369140625, 0.9364013671875, 1.04443359375, 1.1524658203125, 1.260498046875, 1.3685302734375, 1.4765625, 1.5845947265625, 1.692626953125, 1.8006591796875, 1.90869140625, 2.0167236328125, 2.124755859375, 2.2327880859375, 2.3408203125, 2.4488525390625, 2.556884765625, 2.6649169921875, 2.77294921875, 2.8809814453125, 2.989013671875, 3.0970458984375, 3.205078125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 12.0, 7.0, 25.0, 30.0, 45.0, 74.0, 94.0, 176.0, 226.0, 343.0, 447.0, 702.0, 980.0, 1484.0, 2134.0, 3016.0, 4322.0, 6391.0, 9403.0, 13607.0, 20383.0, 31024.0, 47410.0, 75119.0, 132750.0, 1371633.0, 145151.0, 79959.0, 50342.0, 32917.0, 21236.0, 14410.0, 9793.0, 6672.0, 4629.0, 3134.0, 2124.0, 1501.0, 1047.0, 738.0, 582.0, 365.0, 248.0, 139.0, 120.0, 63.0, 49.0, 34.0, 17.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0], "bins": [-1.39453125, -1.3529815673828125, -1.311431884765625, -1.2698822021484375, -1.22833251953125, -1.1867828369140625, -1.145233154296875, -1.1036834716796875, -1.0621337890625, -1.0205841064453125, -0.979034423828125, -0.9374847412109375, -0.89593505859375, -0.8543853759765625, -0.812835693359375, -0.7712860107421875, -0.729736328125, -0.6881866455078125, -0.646636962890625, -0.6050872802734375, -0.56353759765625, -0.5219879150390625, -0.480438232421875, -0.4388885498046875, -0.3973388671875, -0.3557891845703125, -0.314239501953125, -0.2726898193359375, -0.23114013671875, -0.1895904541015625, -0.148040771484375, -0.1064910888671875, -0.06494140625, -0.0233917236328125, 0.018157958984375, 0.0597076416015625, 0.10125732421875, 0.1428070068359375, 0.184356689453125, 0.2259063720703125, 0.2674560546875, 0.3090057373046875, 0.350555419921875, 0.3921051025390625, 0.43365478515625, 0.4752044677734375, 0.516754150390625, 0.5583038330078125, 0.599853515625, 0.6414031982421875, 0.682952880859375, 0.7245025634765625, 0.76605224609375, 0.8076019287109375, 0.849151611328125, 0.8907012939453125, 0.9322509765625, 0.9738006591796875, 1.015350341796875, 1.0569000244140625, 1.09844970703125, 1.1399993896484375, 1.181549072265625, 1.2230987548828125, 1.2646484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 9.0, 13.0, 11.0, 11.0, 12.0, 15.0, 20.0, 26.0, 34.0, 45.0, 57.0, 71.0, 97.0, 104.0, 80.0, 89.0, 54.0, 47.0, 28.0, 30.0, 36.0, 22.0, 13.0, 14.0, 11.0, 2.0, 6.0, 4.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002951622009277344, -0.00028659403324127197, -0.00027802586555480957, -0.00026945769786834717, -0.00026088953018188477, -0.00025232136249542236, -0.00024375319480895996, -0.00023518502712249756, -0.00022661685943603516, -0.00021804869174957275, -0.00020948052406311035, -0.00020091235637664795, -0.00019234418869018555, -0.00018377602100372314, -0.00017520785331726074, -0.00016663968563079834, -0.00015807151794433594, -0.00014950335025787354, -0.00014093518257141113, -0.00013236701488494873, -0.00012379884719848633, -0.00011523067951202393, -0.00010666251182556152, -9.809434413909912e-05, -8.952617645263672e-05, -8.095800876617432e-05, -7.238984107971191e-05, -6.382167339324951e-05, -5.525350570678711e-05, -4.668533802032471e-05, -3.8117170333862305e-05, -2.9549002647399902e-05, -2.09808349609375e-05, -1.2412667274475098e-05, -3.844499588012695e-06, 4.723668098449707e-06, 1.329183578491211e-05, 2.1860003471374512e-05, 3.0428171157836914e-05, 3.8996338844299316e-05, 4.756450653076172e-05, 5.613267421722412e-05, 6.470084190368652e-05, 7.326900959014893e-05, 8.183717727661133e-05, 9.040534496307373e-05, 9.897351264953613e-05, 0.00010754168033599854, 0.00011610984802246094, 0.00012467801570892334, 0.00013324618339538574, 0.00014181435108184814, 0.00015038251876831055, 0.00015895068645477295, 0.00016751885414123535, 0.00017608702182769775, 0.00018465518951416016, 0.00019322335720062256, 0.00020179152488708496, 0.00021035969257354736, 0.00021892786026000977, 0.00022749602794647217, 0.00023606419563293457, 0.00024463236331939697, 0.0002532005310058594]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 5.0, 8.0, 9.0, 9.0, 9.0, 5.0, 12.0, 19.0, 38.0, 37.0, 51.0, 94.0, 117.0, 174.0, 352.0, 820.0, 29779.0, 1011593.0, 3985.0, 629.0, 293.0, 155.0, 89.0, 69.0, 45.0, 22.0, 23.0, 18.0, 17.0, 15.0, 11.0, 9.0, 6.0, 6.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.004840850830078125, -0.004681289196014404, -0.004521727561950684, -0.004362165927886963, -0.004202604293823242, -0.0040430426597595215, -0.0038834810256958008, -0.00372391939163208, -0.0035643577575683594, -0.0034047961235046387, -0.003245234489440918, -0.0030856728553771973, -0.0029261112213134766, -0.002766549587249756, -0.002606987953186035, -0.0024474263191223145, -0.0022878646850585938, -0.002128303050994873, -0.0019687414169311523, -0.0018091797828674316, -0.001649618148803711, -0.0014900565147399902, -0.0013304948806762695, -0.0011709332466125488, -0.0010113716125488281, -0.0008518099784851074, -0.0006922483444213867, -0.000532686710357666, -0.0003731250762939453, -0.0002135634422302246, -5.4001808166503906e-05, 0.0001055598258972168, 0.0002651214599609375, 0.0004246830940246582, 0.0005842447280883789, 0.0007438063621520996, 0.0009033679962158203, 0.001062929630279541, 0.0012224912643432617, 0.0013820528984069824, 0.0015416145324707031, 0.0017011761665344238, 0.0018607378005981445, 0.0020202994346618652, 0.002179861068725586, 0.0023394227027893066, 0.0024989843368530273, 0.002658545970916748, 0.0028181076049804688, 0.0029776692390441895, 0.00313723087310791, 0.003296792507171631, 0.0034563541412353516, 0.0036159157752990723, 0.003775477409362793, 0.003935039043426514, 0.004094600677490234, 0.004254162311553955, 0.004413723945617676, 0.0045732855796813965, 0.004732847213745117, 0.004892408847808838, 0.005051970481872559, 0.005211532115936279, 0.00537109375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 57.0, 233.0, 415.0, 250.0, 52.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009420436690561473, -0.0009237512713298202, -0.000905458873603493, -0.0008871664758771658, -0.0008688740781508386, -0.0008505816804245114, -0.0008322892826981843, -0.0008139968849718571, -0.000795704429037869, -0.0007774120313115418, -0.0007591196335852146, -0.0007408272358588874, -0.0007225348381325603, -0.0007042424404062331, -0.0006859500426799059, -0.0006676575867459178, -0.0006493652472272515, -0.0006310728495009243, -0.0006127804517745972, -0.00059448805404827, -0.0005761956563219428, -0.0005579032585956156, -0.0005396108608692884, -0.0005213184049353004, -0.0005030260654166341, -0.0004847336676903069, -0.0004664412699639797, -0.00044814887223765254, -0.00042985647451132536, -0.0004115640767849982, -0.00039327164995484054, -0.00037497925222851336, -0.0003566868253983557, -0.00033839442767202854, -0.00032010202994570136, -0.0003018096322193742, -0.000283517234493047, -0.0002652248367667198, -0.0002469324099365622, -0.000228640012210235, -0.00021034762903582305, -0.00019205523130949587, -0.00017376281903125346, -0.00015547042130492628, -0.0001371780235785991, -0.00011888562585227191, -0.00010059322084998712, -8.230081584770232e-05, -6.400841812137514e-05, -4.5716016757069156e-05, -2.7423615392763168e-05, -9.13121402845718e-06, 9.161187335848808e-06, 2.745358506217599e-05, 4.5745990064460784e-05, 6.403839506674558e-05, 8.233079279307276e-05, 0.00010062319051939994, 0.00011891559552168474, 0.00013720800052396953, 0.0001555003982502967, 0.0001737927959766239, 0.00019208519370295107, 0.00021037760598119348, 0.00022867000370752066]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 9.0, 9.0, 10.0, 6.0, 15.0, 11.0, 10.0, 18.0, 17.0, 16.0, 27.0, 36.0, 24.0, 32.0, 36.0, 36.0, 41.0, 38.0, 31.0, 37.0, 49.0, 35.0, 31.0, 49.0, 56.0, 34.0, 41.0, 25.0, 31.0, 29.0, 21.0, 14.0, 22.0, 17.0, 18.0, 13.0, 17.0, 9.0, 8.0, 6.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010722875595092773, -0.00010335631668567657, -9.948387742042542e-05, -9.561143815517426e-05, -9.17389988899231e-05, -8.786655962467194e-05, -8.399412035942078e-05, -8.012168109416962e-05, -7.624924182891846e-05, -7.23768025636673e-05, -6.850436329841614e-05, -6.463192403316498e-05, -6.075948476791382e-05, -5.688704550266266e-05, -5.30146062374115e-05, -4.914216697216034e-05, -4.526972770690918e-05, -4.139728844165802e-05, -3.752484917640686e-05, -3.36524099111557e-05, -2.977997064590454e-05, -2.590753138065338e-05, -2.203509211540222e-05, -1.8162652850151062e-05, -1.4290213584899902e-05, -1.0417774319648743e-05, -6.545335054397583e-06, -2.6728957891464233e-06, 1.1995434761047363e-06, 5.071982741355896e-06, 8.944422006607056e-06, 1.2816861271858215e-05, 1.6689300537109375e-05, 2.0561739802360535e-05, 2.4434179067611694e-05, 2.8306618332862854e-05, 3.2179057598114014e-05, 3.605149686336517e-05, 3.992393612861633e-05, 4.379637539386749e-05, 4.766881465911865e-05, 5.154125392436981e-05, 5.541369318962097e-05, 5.928613245487213e-05, 6.315857172012329e-05, 6.703101098537445e-05, 7.090345025062561e-05, 7.477588951587677e-05, 7.864832878112793e-05, 8.252076804637909e-05, 8.639320731163025e-05, 9.026564657688141e-05, 9.413808584213257e-05, 9.801052510738373e-05, 0.00010188296437263489, 0.00010575540363788605, 0.00010962784290313721, 0.00011350028216838837, 0.00011737272143363953, 0.00012124516069889069, 0.00012511759996414185, 0.000128990039229393, 0.00013286247849464417, 0.00013673491775989532, 0.00014060735702514648]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 4.0, 12.0, 9.0, 14.0, 15.0, 17.0, 16.0, 21.0, 31.0, 22.0, 28.0, 39.0, 37.0, 36.0, 51.0, 52.0, 40.0, 41.0, 40.0, 33.0, 39.0, 40.0, 27.0, 34.0, 42.0, 37.0, 32.0, 37.0, 20.0, 25.0, 19.0, 14.0, 13.0, 9.0, 10.0, 12.0, 9.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4765625, -5.3017578125, -5.126953125, -4.9521484375, -4.77734375, -4.6025390625, -4.427734375, -4.2529296875, -4.078125, -3.9033203125, -3.728515625, -3.5537109375, -3.37890625, -3.2041015625, -3.029296875, -2.8544921875, -2.6796875, -2.5048828125, -2.330078125, -2.1552734375, -1.98046875, -1.8056640625, -1.630859375, -1.4560546875, -1.28125, -1.1064453125, -0.931640625, -0.7568359375, -0.58203125, -0.4072265625, -0.232421875, -0.0576171875, 0.1171875, 0.2919921875, 0.466796875, 0.6416015625, 0.81640625, 0.9912109375, 1.166015625, 1.3408203125, 1.515625, 1.6904296875, 1.865234375, 2.0400390625, 2.21484375, 2.3896484375, 2.564453125, 2.7392578125, 2.9140625, 3.0888671875, 3.263671875, 3.4384765625, 3.61328125, 3.7880859375, 3.962890625, 4.1376953125, 4.3125, 4.4873046875, 4.662109375, 4.8369140625, 5.01171875, 5.1865234375, 5.361328125, 5.5361328125, 5.7109375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 16.0, 17.0, 33.0, 35.0, 45.0, 78.0, 109.0, 185.0, 237.0, 388.0, 682.0, 1131.0, 1887.0, 3505.0, 6125.0, 11414.0, 20446.0, 38430.0, 75960.0, 162088.0, 298702.0, 216327.0, 102541.0, 49700.0, 25899.0, 14446.0, 7767.0, 4420.0, 2416.0, 1406.0, 794.0, 476.0, 291.0, 185.0, 92.0, 76.0, 56.0, 35.0, 32.0, 21.0, 15.0, 9.0, 10.0, 6.0, 4.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.08203125, -3.9532470703125, -3.824462890625, -3.6956787109375, -3.56689453125, -3.4381103515625, -3.309326171875, -3.1805419921875, -3.0517578125, -2.9229736328125, -2.794189453125, -2.6654052734375, -2.53662109375, -2.4078369140625, -2.279052734375, -2.1502685546875, -2.021484375, -1.8927001953125, -1.763916015625, -1.6351318359375, -1.50634765625, -1.3775634765625, -1.248779296875, -1.1199951171875, -0.9912109375, -0.8624267578125, -0.733642578125, -0.6048583984375, -0.47607421875, -0.3472900390625, -0.218505859375, -0.0897216796875, 0.0390625, 0.1678466796875, 0.296630859375, 0.4254150390625, 0.55419921875, 0.6829833984375, 0.811767578125, 0.9405517578125, 1.0693359375, 1.1981201171875, 1.326904296875, 1.4556884765625, 1.58447265625, 1.7132568359375, 1.842041015625, 1.9708251953125, 2.099609375, 2.2283935546875, 2.357177734375, 2.4859619140625, 2.61474609375, 2.7435302734375, 2.872314453125, 3.0010986328125, 3.1298828125, 3.2586669921875, 3.387451171875, 3.5162353515625, 3.64501953125, 3.7738037109375, 3.902587890625, 4.0313720703125, 4.16015625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 2.0, 7.0, 7.0, 10.0, 7.0, 7.0, 7.0, 10.0, 23.0, 23.0, 23.0, 24.0, 19.0, 32.0, 38.0, 37.0, 37.0, 57.0, 49.0, 87.0, 119.0, 356.0, 1409.0, 155.0, 71.0, 52.0, 44.0, 40.0, 40.0, 29.0, 31.0, 32.0, 31.0, 20.0, 20.0, 20.0, 22.0, 7.0, 17.0, 8.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.39306640625, -17.8017578125, -17.21044921875, -16.619140625, -16.02783203125, -15.4365234375, -14.84521484375, -14.25390625, -13.66259765625, -13.0712890625, -12.47998046875, -11.888671875, -11.29736328125, -10.7060546875, -10.11474609375, -9.5234375, -8.93212890625, -8.3408203125, -7.74951171875, -7.158203125, -6.56689453125, -5.9755859375, -5.38427734375, -4.79296875, -4.20166015625, -3.6103515625, -3.01904296875, -2.427734375, -1.83642578125, -1.2451171875, -0.65380859375, -0.0625, 0.52880859375, 1.1201171875, 1.71142578125, 2.302734375, 2.89404296875, 3.4853515625, 4.07666015625, 4.66796875, 5.25927734375, 5.8505859375, 6.44189453125, 7.033203125, 7.62451171875, 8.2158203125, 8.80712890625, 9.3984375, 9.98974609375, 10.5810546875, 11.17236328125, 11.763671875, 12.35498046875, 12.9462890625, 13.53759765625, 14.12890625, 14.72021484375, 15.3115234375, 15.90283203125, 16.494140625, 17.08544921875, 17.6767578125, 18.26806640625, 18.859375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 8.0, 14.0, 24.0, 27.0, 51.0, 97.0, 151.0, 319.0, 922.0, 39116.0, 3101611.0, 2363.0, 448.0, 212.0, 109.0, 73.0, 40.0, 33.0, 20.0, 17.0, 7.0, 11.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-126.5625, -122.9697265625, -119.376953125, -115.7841796875, -112.19140625, -108.5986328125, -105.005859375, -101.4130859375, -97.8203125, -94.2275390625, -90.634765625, -87.0419921875, -83.44921875, -79.8564453125, -76.263671875, -72.6708984375, -69.078125, -65.4853515625, -61.892578125, -58.2998046875, -54.70703125, -51.1142578125, -47.521484375, -43.9287109375, -40.3359375, -36.7431640625, -33.150390625, -29.5576171875, -25.96484375, -22.3720703125, -18.779296875, -15.1865234375, -11.59375, -8.0009765625, -4.408203125, -0.8154296875, 2.77734375, 6.3701171875, 9.962890625, 13.5556640625, 17.1484375, 20.7412109375, 24.333984375, 27.9267578125, 31.51953125, 35.1123046875, 38.705078125, 42.2978515625, 45.890625, 49.4833984375, 53.076171875, 56.6689453125, 60.26171875, 63.8544921875, 67.447265625, 71.0400390625, 74.6328125, 78.2255859375, 81.818359375, 85.4111328125, 89.00390625, 92.5966796875, 96.189453125, 99.7822265625, 103.375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 816.0, 201.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.60578918457031, -52.339107513427734, -34.072425842285156, -15.805744171142578, 2.4609375, 20.727615356445312, 38.994300842285156, 57.260986328125, 75.52766418457031, 93.79434204101562, 112.06102752685547, 130.3277130126953, 148.59439086914062, 166.86106872558594, 185.12774658203125, 203.39443969726562, 221.66111755371094, 239.92779541015625, 258.1944885253906, 276.4611511230469, 294.72784423828125, 312.9945068359375, 331.2611999511719, 349.52789306640625, 367.7945556640625, 386.0612487792969, 404.3279113769531, 422.5946044921875, 440.86126708984375, 459.1279602050781, 477.3946533203125, 495.66131591796875, 513.927978515625, 532.1946411132812, 550.4613647460938, 568.72802734375, 586.9946899414062, 605.2613525390625, 623.528076171875, 641.7947387695312, 660.0614013671875, 678.3280639648438, 696.5947875976562, 714.8614501953125, 733.1281127929688, 751.394775390625, 769.6614990234375, 787.9281616210938, 806.1948852539062, 824.4615478515625, 842.728271484375, 860.9949340820312, 879.2615966796875, 897.5283203125, 915.7949829101562, 934.0616455078125, 952.328369140625, 970.5950317382812, 988.8617553710938, 1007.12841796875, 1025.3951416015625, 1043.6617431640625, 1061.928466796875, 1080.1951904296875, 1098.4617919921875]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 9.0, 6.0, 7.0, 10.0, 10.0, 14.0, 15.0, 16.0, 14.0, 18.0, 18.0, 22.0, 32.0, 27.0, 32.0, 24.0, 37.0, 36.0, 40.0, 40.0, 39.0, 33.0, 34.0, 53.0, 39.0, 35.0, 27.0, 28.0, 37.0, 25.0, 27.0, 25.0, 27.0, 18.0, 23.0, 16.0, 10.0, 12.0, 11.0, 10.0, 8.0, 10.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-45.475093841552734, -43.94450759887695, -42.413917541503906, -40.883331298828125, -39.352745056152344, -37.8221549987793, -36.291568756103516, -34.76097869873047, -33.23039245605469, -31.699804306030273, -30.169218063354492, -28.638629913330078, -27.108041763305664, -25.57745361328125, -24.04686737060547, -22.516279220581055, -20.985692977905273, -19.45510482788086, -17.924518585205078, -16.393930435180664, -14.86334228515625, -13.332755088806152, -11.802167892456055, -10.27157974243164, -8.740992546081543, -7.210404872894287, -5.679817199707031, -4.149230003356934, -2.6186423301696777, -1.0880546569824219, 0.4425325393676758, 1.9731206893920898, 3.5037078857421875, 5.034295558929443, 6.564883232116699, 8.095470428466797, 9.626058578491211, 11.156645774841309, 12.687232971191406, 14.21782112121582, 15.748408317565918, 17.278995513916016, 18.80958366394043, 20.340171813964844, 21.870758056640625, 23.40134620666504, 24.931934356689453, 26.462520599365234, 27.99310874938965, 29.523696899414062, 31.054283142089844, 32.584869384765625, 34.11545944213867, 35.64604568481445, 37.1766357421875, 38.70722198486328, 40.23780822753906, 41.768394470214844, 43.29898452758789, 44.82957077026367, 46.36015701293945, 47.8907470703125, 49.42133331298828, 50.95191955566406, 52.48250961303711]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 8.0, 7.0, 9.0, 18.0, 16.0, 16.0, 19.0, 17.0, 25.0, 29.0, 37.0, 39.0, 33.0, 37.0, 32.0, 44.0, 41.0, 47.0, 36.0, 49.0, 36.0, 38.0, 33.0, 39.0, 34.0, 24.0, 39.0, 29.0, 26.0, 17.0, 22.0, 15.0, 17.0, 8.0, 10.0, 6.0, 11.0, 10.0, 6.0, 0.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.073486328125, -4.88916015625, -4.704833984375, -4.5205078125, -4.336181640625, -4.15185546875, -3.967529296875, -3.783203125, -3.598876953125, -3.41455078125, -3.230224609375, -3.0458984375, -2.861572265625, -2.67724609375, -2.492919921875, -2.30859375, -2.124267578125, -1.93994140625, -1.755615234375, -1.5712890625, -1.386962890625, -1.20263671875, -1.018310546875, -0.833984375, -0.649658203125, -0.46533203125, -0.281005859375, -0.0966796875, 0.087646484375, 0.27197265625, 0.456298828125, 0.640625, 0.824951171875, 1.00927734375, 1.193603515625, 1.3779296875, 1.562255859375, 1.74658203125, 1.930908203125, 2.115234375, 2.299560546875, 2.48388671875, 2.668212890625, 2.8525390625, 3.036865234375, 3.22119140625, 3.405517578125, 3.58984375, 3.774169921875, 3.95849609375, 4.142822265625, 4.3271484375, 4.511474609375, 4.69580078125, 4.880126953125, 5.064453125, 5.248779296875, 5.43310546875, 5.617431640625, 5.8017578125, 5.986083984375, 6.17041015625, 6.354736328125, 6.5390625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 2.0, 7.0, 2.0, 18.0, 14.0, 21.0, 24.0, 34.0, 44.0, 60.0, 91.0, 102.0, 161.0, 231.0, 406.0, 740.0, 1578.0, 3871.0, 12474.0, 48919.0, 209277.0, 747761.0, 1487298.0, 1154390.0, 399116.0, 94006.0, 22450.0, 6370.0, 2340.0, 943.0, 531.0, 298.0, 208.0, 142.0, 95.0, 61.0, 41.0, 38.0, 36.0, 20.0, 15.0, 13.0, 8.0, 4.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.0703125, -6.84027099609375, -6.6102294921875, -6.38018798828125, -6.150146484375, -5.92010498046875, -5.6900634765625, -5.46002197265625, -5.22998046875, -4.99993896484375, -4.7698974609375, -4.53985595703125, -4.309814453125, -4.07977294921875, -3.8497314453125, -3.61968994140625, -3.3896484375, -3.15960693359375, -2.9295654296875, -2.69952392578125, -2.469482421875, -2.23944091796875, -2.0093994140625, -1.77935791015625, -1.54931640625, -1.31927490234375, -1.0892333984375, -0.85919189453125, -0.629150390625, -0.39910888671875, -0.1690673828125, 0.06097412109375, 0.291015625, 0.52105712890625, 0.7510986328125, 0.98114013671875, 1.211181640625, 1.44122314453125, 1.6712646484375, 1.90130615234375, 2.13134765625, 2.36138916015625, 2.5914306640625, 2.82147216796875, 3.051513671875, 3.28155517578125, 3.5115966796875, 3.74163818359375, 3.9716796875, 4.20172119140625, 4.4317626953125, 4.66180419921875, 4.891845703125, 5.12188720703125, 5.3519287109375, 5.58197021484375, 5.81201171875, 6.04205322265625, 6.2720947265625, 6.50213623046875, 6.732177734375, 6.96221923828125, 7.1922607421875, 7.42230224609375, 7.65234375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 9.0, 16.0, 20.0, 27.0, 24.0, 49.0, 62.0, 79.0, 97.0, 123.0, 175.0, 259.0, 311.0, 374.0, 418.0, 404.0, 318.0, 299.0, 262.0, 193.0, 143.0, 95.0, 93.0, 62.0, 41.0, 29.0, 23.0, 11.0, 6.0, 12.0, 7.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.5625, -14.1688232421875, -13.775146484375, -13.3814697265625, -12.98779296875, -12.5941162109375, -12.200439453125, -11.8067626953125, -11.4130859375, -11.0194091796875, -10.625732421875, -10.2320556640625, -9.83837890625, -9.4447021484375, -9.051025390625, -8.6573486328125, -8.263671875, -7.8699951171875, -7.476318359375, -7.0826416015625, -6.68896484375, -6.2952880859375, -5.901611328125, -5.5079345703125, -5.1142578125, -4.7205810546875, -4.326904296875, -3.9332275390625, -3.53955078125, -3.1458740234375, -2.752197265625, -2.3585205078125, -1.96484375, -1.5711669921875, -1.177490234375, -0.7838134765625, -0.39013671875, 0.0035400390625, 0.397216796875, 0.7908935546875, 1.1845703125, 1.5782470703125, 1.971923828125, 2.3656005859375, 2.75927734375, 3.1529541015625, 3.546630859375, 3.9403076171875, 4.333984375, 4.7276611328125, 5.121337890625, 5.5150146484375, 5.90869140625, 6.3023681640625, 6.696044921875, 7.0897216796875, 7.4833984375, 7.8770751953125, 8.270751953125, 8.6644287109375, 9.05810546875, 9.4517822265625, 9.845458984375, 10.2391357421875, 10.6328125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 7.0, 8.0, 7.0, 9.0, 16.0, 14.0, 20.0, 34.0, 44.0, 50.0, 66.0, 93.0, 185.0, 238.0, 513.0, 1341.0, 16776.0, 2051989.0, 2102931.0, 17273.0, 1345.0, 476.0, 247.0, 161.0, 108.0, 89.0, 56.0, 53.0, 39.0, 26.0, 26.0, 8.0, 15.0, 6.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.875, -33.58349609375, -32.2919921875, -31.00048828125, -29.708984375, -28.41748046875, -27.1259765625, -25.83447265625, -24.54296875, -23.25146484375, -21.9599609375, -20.66845703125, -19.376953125, -18.08544921875, -16.7939453125, -15.50244140625, -14.2109375, -12.91943359375, -11.6279296875, -10.33642578125, -9.044921875, -7.75341796875, -6.4619140625, -5.17041015625, -3.87890625, -2.58740234375, -1.2958984375, -0.00439453125, 1.287109375, 2.57861328125, 3.8701171875, 5.16162109375, 6.453125, 7.74462890625, 9.0361328125, 10.32763671875, 11.619140625, 12.91064453125, 14.2021484375, 15.49365234375, 16.78515625, 18.07666015625, 19.3681640625, 20.65966796875, 21.951171875, 23.24267578125, 24.5341796875, 25.82568359375, 27.1171875, 28.40869140625, 29.7001953125, 30.99169921875, 32.283203125, 33.57470703125, 34.8662109375, 36.15771484375, 37.44921875, 38.74072265625, 40.0322265625, 41.32373046875, 42.615234375, 43.90673828125, 45.1982421875, 46.48974609375, 47.78125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 16.0, 32.0, 78.0, 124.0, 160.0, 191.0, 176.0, 117.0, 58.0, 30.0, 19.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-120.8705062866211, -117.87789916992188, -114.88529205322266, -111.89268493652344, -108.90007019042969, -105.90746307373047, -102.91485595703125, -99.92224884033203, -96.92964172363281, -93.9370346069336, -90.94442749023438, -87.95181274414062, -84.9592056274414, -81.96659851074219, -78.97399139404297, -75.98138427734375, -72.98876953125, -69.99616241455078, -67.00355529785156, -64.01094055175781, -61.01833724975586, -58.025726318359375, -55.033119201660156, -52.04051208496094, -49.04790496826172, -46.0552978515625, -43.062686920166016, -40.0700798034668, -37.07747268676758, -34.084861755371094, -31.092254638671875, -28.099647521972656, -25.107040405273438, -22.114431381225586, -19.121824264526367, -16.129215240478516, -13.13660717010498, -10.143999099731445, -7.151390075683594, -4.158782958984375, -1.1661739349365234, 1.8264343738555908, 4.819042682647705, 7.811651229858398, 10.804259300231934, 13.796867370605469, 16.78947639465332, 19.78208351135254, 22.77469253540039, 25.767301559448242, 28.75990867614746, 31.752517700195312, 34.74512481689453, 37.73773193359375, 40.730342864990234, 43.72294998168945, 46.71556091308594, 49.708168029785156, 52.70077896118164, 55.69338607788086, 58.68599319458008, 61.67860412597656, 64.67121124267578, 67.663818359375, 70.65642547607422]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 5.0, 8.0, 7.0, 5.0, 15.0, 15.0, 21.0, 20.0, 24.0, 24.0, 18.0, 23.0, 44.0, 30.0, 47.0, 39.0, 37.0, 34.0, 29.0, 56.0, 58.0, 38.0, 38.0, 43.0, 32.0, 47.0, 38.0, 41.0, 32.0, 20.0, 22.0, 21.0, 13.0, 9.0, 14.0, 9.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.60210418701172, -41.16630935668945, -39.73051452636719, -38.29472351074219, -36.85892868041992, -35.423133850097656, -33.98733901977539, -32.551544189453125, -31.115751266479492, -29.679956436157227, -28.244163513183594, -26.808368682861328, -25.372573852539062, -23.93678092956543, -22.500986099243164, -21.06519317626953, -19.629398345947266, -18.193603515625, -16.757810592651367, -15.322015762329102, -13.886221885681152, -12.450428009033203, -11.014633178710938, -9.578839302062988, -8.143045425415039, -6.70725154876709, -5.271457195281982, -3.835662841796875, -2.399868965148926, -0.9640750885009766, 0.47171974182128906, 1.9075136184692383, 3.343303680419922, 4.779097557067871, 6.2148919105529785, 7.650686264038086, 9.086480140686035, 10.522274017333984, 11.95806884765625, 13.3938627243042, 14.829656600952148, 16.265451431274414, 17.701244354248047, 19.137039184570312, 20.572834014892578, 22.00862693786621, 23.444421768188477, 24.88021469116211, 26.316009521484375, 27.75180435180664, 29.187597274780273, 30.62339210510254, 32.05918502807617, 33.49497985839844, 34.9307746887207, 36.36656951904297, 37.80236053466797, 39.238155364990234, 40.6739501953125, 42.1097412109375, 43.545536041259766, 44.98133087158203, 46.4171257019043, 47.85292053222656, 49.28871536254883]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 7.0, 10.0, 11.0, 10.0, 17.0, 19.0, 16.0, 30.0, 27.0, 29.0, 46.0, 34.0, 42.0, 37.0, 34.0, 46.0, 41.0, 53.0, 36.0, 46.0, 51.0, 40.0, 30.0, 49.0, 24.0, 36.0, 34.0, 15.0, 23.0, 17.0, 18.0, 7.0, 15.0, 8.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.37109375, -5.17547607421875, -4.9798583984375, -4.78424072265625, -4.588623046875, -4.39300537109375, -4.1973876953125, -4.00177001953125, -3.80615234375, -3.61053466796875, -3.4149169921875, -3.21929931640625, -3.023681640625, -2.82806396484375, -2.6324462890625, -2.43682861328125, -2.2412109375, -2.04559326171875, -1.8499755859375, -1.65435791015625, -1.458740234375, -1.26312255859375, -1.0675048828125, -0.87188720703125, -0.67626953125, -0.48065185546875, -0.2850341796875, -0.08941650390625, 0.106201171875, 0.30181884765625, 0.4974365234375, 0.69305419921875, 0.888671875, 1.08428955078125, 1.2799072265625, 1.47552490234375, 1.671142578125, 1.86676025390625, 2.0623779296875, 2.25799560546875, 2.45361328125, 2.64923095703125, 2.8448486328125, 3.04046630859375, 3.236083984375, 3.43170166015625, 3.6273193359375, 3.82293701171875, 4.0185546875, 4.21417236328125, 4.4097900390625, 4.60540771484375, 4.801025390625, 4.99664306640625, 5.1922607421875, 5.38787841796875, 5.58349609375, 5.77911376953125, 5.9747314453125, 6.17034912109375, 6.365966796875, 6.56158447265625, 6.7572021484375, 6.95281982421875, 7.1484375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 12.0, 12.0, 17.0, 20.0, 39.0, 50.0, 70.0, 119.0, 170.0, 260.0, 411.0, 635.0, 959.0, 1427.0, 2183.0, 3419.0, 5263.0, 8234.0, 13315.0, 21069.0, 34910.0, 58895.0, 103959.0, 234928.0, 286010.0, 111433.0, 62737.0, 36866.0, 22507.0, 13909.0, 8753.0, 5690.0, 3655.0, 2287.0, 1524.0, 1008.0, 634.0, 403.0, 284.0, 159.0, 105.0, 73.0, 41.0, 25.0, 17.0, 17.0, 10.0, 12.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.654296875, -1.602691650390625, -1.55108642578125, -1.499481201171875, -1.4478759765625, -1.396270751953125, -1.34466552734375, -1.293060302734375, -1.241455078125, -1.189849853515625, -1.13824462890625, -1.086639404296875, -1.0350341796875, -0.983428955078125, -0.93182373046875, -0.880218505859375, -0.82861328125, -0.777008056640625, -0.72540283203125, -0.673797607421875, -0.6221923828125, -0.570587158203125, -0.51898193359375, -0.467376708984375, -0.415771484375, -0.364166259765625, -0.31256103515625, -0.260955810546875, -0.2093505859375, -0.157745361328125, -0.10614013671875, -0.054534912109375, -0.0029296875, 0.048675537109375, 0.10028076171875, 0.151885986328125, 0.2034912109375, 0.255096435546875, 0.30670166015625, 0.358306884765625, 0.409912109375, 0.461517333984375, 0.51312255859375, 0.564727783203125, 0.6163330078125, 0.667938232421875, 0.71954345703125, 0.771148681640625, 0.82275390625, 0.874359130859375, 0.92596435546875, 0.977569580078125, 1.0291748046875, 1.080780029296875, 1.13238525390625, 1.183990478515625, 1.235595703125, 1.287200927734375, 1.33880615234375, 1.390411376953125, 1.4420166015625, 1.493621826171875, 1.54522705078125, 1.596832275390625, 1.6484375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 8.0, 8.0, 14.0, 13.0, 11.0, 11.0, 28.0, 24.0, 20.0, 32.0, 42.0, 28.0, 30.0, 33.0, 41.0, 49.0, 47.0, 40.0, 1066.0, 52.0, 37.0, 39.0, 35.0, 31.0, 36.0, 27.0, 23.0, 19.0, 27.0, 23.0, 19.0, 23.0, 14.0, 13.0, 12.0, 5.0, 7.0, 4.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-3.96875, -3.8499755859375, -3.731201171875, -3.6124267578125, -3.49365234375, -3.3748779296875, -3.256103515625, -3.1373291015625, -3.0185546875, -2.8997802734375, -2.781005859375, -2.6622314453125, -2.54345703125, -2.4246826171875, -2.305908203125, -2.1871337890625, -2.068359375, -1.9495849609375, -1.830810546875, -1.7120361328125, -1.59326171875, -1.4744873046875, -1.355712890625, -1.2369384765625, -1.1181640625, -0.9993896484375, -0.880615234375, -0.7618408203125, -0.64306640625, -0.5242919921875, -0.405517578125, -0.2867431640625, -0.16796875, -0.0491943359375, 0.069580078125, 0.1883544921875, 0.30712890625, 0.4259033203125, 0.544677734375, 0.6634521484375, 0.7822265625, 0.9010009765625, 1.019775390625, 1.1385498046875, 1.25732421875, 1.3760986328125, 1.494873046875, 1.6136474609375, 1.732421875, 1.8511962890625, 1.969970703125, 2.0887451171875, 2.20751953125, 2.3262939453125, 2.445068359375, 2.5638427734375, 2.6826171875, 2.8013916015625, 2.920166015625, 3.0389404296875, 3.15771484375, 3.2764892578125, 3.395263671875, 3.5140380859375, 3.6328125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 5.0, 12.0, 9.0, 24.0, 34.0, 43.0, 84.0, 104.0, 182.0, 209.0, 315.0, 442.0, 634.0, 915.0, 1304.0, 2031.0, 2926.0, 4183.0, 6146.0, 9200.0, 13791.0, 20987.0, 31964.0, 49790.0, 79090.0, 142313.0, 1368505.0, 139741.0, 77988.0, 49272.0, 31981.0, 20519.0, 13688.0, 9337.0, 6164.0, 4170.0, 2796.0, 1895.0, 1401.0, 923.0, 622.0, 451.0, 310.0, 208.0, 144.0, 84.0, 63.0, 50.0, 28.0, 20.0, 14.0, 11.0, 4.0, 6.0, 2.0, 1.0, 5.0], "bins": [-1.494140625, -1.44952392578125, -1.4049072265625, -1.36029052734375, -1.315673828125, -1.27105712890625, -1.2264404296875, -1.18182373046875, -1.13720703125, -1.09259033203125, -1.0479736328125, -1.00335693359375, -0.958740234375, -0.91412353515625, -0.8695068359375, -0.82489013671875, -0.7802734375, -0.73565673828125, -0.6910400390625, -0.64642333984375, -0.601806640625, -0.55718994140625, -0.5125732421875, -0.46795654296875, -0.42333984375, -0.37872314453125, -0.3341064453125, -0.28948974609375, -0.244873046875, -0.20025634765625, -0.1556396484375, -0.11102294921875, -0.06640625, -0.02178955078125, 0.0228271484375, 0.06744384765625, 0.112060546875, 0.15667724609375, 0.2012939453125, 0.24591064453125, 0.29052734375, 0.33514404296875, 0.3797607421875, 0.42437744140625, 0.468994140625, 0.51361083984375, 0.5582275390625, 0.60284423828125, 0.6474609375, 0.69207763671875, 0.7366943359375, 0.78131103515625, 0.825927734375, 0.87054443359375, 0.9151611328125, 0.95977783203125, 1.00439453125, 1.04901123046875, 1.0936279296875, 1.13824462890625, 1.182861328125, 1.22747802734375, 1.2720947265625, 1.31671142578125, 1.361328125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 9.0, 8.0, 16.0, 11.0, 12.0, 20.0, 21.0, 22.0, 45.0, 41.0, 56.0, 81.0, 100.0, 94.0, 93.0, 74.0, 59.0, 35.0, 30.0, 20.0, 18.0, 15.0, 16.0, 13.0, 19.0, 5.0, 8.0, 9.0, 13.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002944469451904297, -0.0002850145101547241, -0.00027558207511901855, -0.000266149640083313, -0.0002567172050476074, -0.00024728477001190186, -0.0002378523349761963, -0.00022841989994049072, -0.00021898746490478516, -0.0002095550298690796, -0.00020012259483337402, -0.00019069015979766846, -0.0001812577247619629, -0.00017182528972625732, -0.00016239285469055176, -0.0001529604196548462, -0.00014352798461914062, -0.00013409554958343506, -0.0001246631145477295, -0.00011523067951202393, -0.00010579824447631836, -9.636580944061279e-05, -8.693337440490723e-05, -7.750093936920166e-05, -6.80685043334961e-05, -5.863606929779053e-05, -4.920363426208496e-05, -3.9771199226379395e-05, -3.0338764190673828e-05, -2.0906329154968262e-05, -1.1473894119262695e-05, -2.041459083557129e-06, 7.3909759521484375e-06, 1.6823410987854004e-05, 2.625584602355957e-05, 3.568828105926514e-05, 4.51207160949707e-05, 5.455315113067627e-05, 6.398558616638184e-05, 7.34180212020874e-05, 8.285045623779297e-05, 9.228289127349854e-05, 0.0001017153263092041, 0.00011114776134490967, 0.00012058019638061523, 0.0001300126314163208, 0.00013944506645202637, 0.00014887750148773193, 0.0001583099365234375, 0.00016774237155914307, 0.00017717480659484863, 0.0001866072416305542, 0.00019603967666625977, 0.00020547211170196533, 0.0002149045467376709, 0.00022433698177337646, 0.00023376941680908203, 0.0002432018518447876, 0.00025263428688049316, 0.00026206672191619873, 0.0002714991569519043, 0.00028093159198760986, 0.00029036402702331543, 0.000299796462059021, 0.00030922889709472656]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 2.0, 11.0, 12.0, 15.0, 20.0, 19.0, 21.0, 33.0, 37.0, 45.0, 62.0, 81.0, 163.0, 275.0, 490.0, 1676.0, 634819.0, 408039.0, 1448.0, 490.0, 252.0, 174.0, 105.0, 67.0, 50.0, 34.0, 20.0, 20.0, 18.0, 12.0, 7.0, 7.0, 5.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.006465911865234375, -0.006281018257141113, -0.0060961246490478516, -0.00591123104095459, -0.005726337432861328, -0.005541443824768066, -0.005356550216674805, -0.005171656608581543, -0.004986763000488281, -0.0048018693923950195, -0.004616975784301758, -0.004432082176208496, -0.004247188568115234, -0.004062294960021973, -0.003877401351928711, -0.0036925077438354492, -0.0035076141357421875, -0.0033227205276489258, -0.003137826919555664, -0.0029529333114624023, -0.0027680397033691406, -0.002583146095275879, -0.002398252487182617, -0.0022133588790893555, -0.0020284652709960938, -0.001843571662902832, -0.0016586780548095703, -0.0014737844467163086, -0.0012888908386230469, -0.0011039972305297852, -0.0009191036224365234, -0.0007342100143432617, -0.00054931640625, -0.0003644227981567383, -0.00017952919006347656, 5.364418029785156e-06, 0.00019025802612304688, 0.0003751516342163086, 0.0005600452423095703, 0.000744938850402832, 0.0009298324584960938, 0.0011147260665893555, 0.0012996196746826172, 0.001484513282775879, 0.0016694068908691406, 0.0018543004989624023, 0.002039194107055664, 0.0022240877151489258, 0.0024089813232421875, 0.0025938749313354492, 0.002778768539428711, 0.0029636621475219727, 0.0031485557556152344, 0.003333449363708496, 0.003518342971801758, 0.0037032365798950195, 0.0038881301879882812, 0.004073023796081543, 0.004257917404174805, 0.004442811012268066, 0.004627704620361328, 0.00481259822845459, 0.0049974918365478516, 0.005182385444641113, 0.005367279052734375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 7.0, 80.0, 379.0, 413.0, 120.0, 14.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020806145039387047, -0.0001851484994404018, -0.0001622355484869331, -0.00013932261208537966, -0.00011640966113191098, -9.34967101784423e-05, -7.058377377688885e-05, -4.767082282342017e-05, -2.4757871869951487e-05, -1.8449245544616133e-06, 2.106802276102826e-05, 4.3980966438539326e-05, 6.6893917392008e-05, 8.980686834547669e-05, 0.00011271980474703014, 0.00013563275570049882, 0.0001585457066539675, 0.00018145865760743618, 0.00020437160856090486, 0.0002272845449624583, 0.00025019748136401176, 0.0002731104614213109, 0.0002960233832709491, 0.0003189363342244178, 0.0003418492851778865, 0.00036476223613135517, 0.00038767518708482385, 0.00041058810893446207, 0.0004335010889917612, 0.00045641401084139943, 0.0004793269617948681, 0.0005022399127483368, 0.0005251528928056359, 0.0005480658146552742, 0.0005709787947125733, 0.0005938917165622115, 0.0006168046966195107, 0.0006397176184691489, 0.0006626305403187871, 0.0006855435203760862, 0.0007084565004333854, 0.0007313694222830236, 0.0007542824023403227, 0.000777195324189961, 0.0008001083042472601, 0.0008230212260968983, 0.0008459341479465365, 0.0008688471280038357, 0.0008917600498534739, 0.0009146729717031121, 0.0009375859517604113, 0.0009604988736100495, 0.0009834117954596877, 0.0010063247755169868, 0.001029237755574286, 0.0010521507356315851, 0.0010750635992735624, 0.0010979765793308616, 0.0011208894429728389, 0.001143802423030138, 0.0011667154030874372, 0.0011896283831447363, 0.0012125412467867136, 0.0012354542268440127, 0.0012583672069013119]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 4.0, 1.0, 1.0, 4.0, 8.0, 11.0, 9.0, 12.0, 11.0, 17.0, 15.0, 26.0, 21.0, 20.0, 28.0, 28.0, 24.0, 36.0, 30.0, 36.0, 48.0, 31.0, 45.0, 39.0, 34.0, 37.0, 38.0, 32.0, 47.0, 32.0, 34.0, 35.0, 21.0, 23.0, 18.0, 18.0, 20.0, 20.0, 16.0, 5.0, 14.0, 12.0, 7.0, 12.0, 3.0, 2.0, 10.0, 2.0, 4.0, 2.0, 3.0, 1.0], "bins": [-0.00014102458953857422, -0.00013707950711250305, -0.00013313442468643188, -0.00012918934226036072, -0.00012524425983428955, -0.00012129917740821838, -0.00011735409498214722, -0.00011340901255607605, -0.00010946393013000488, -0.00010551884770393372, -0.00010157376527786255, -9.762868285179138e-05, -9.368360042572021e-05, -8.973851799964905e-05, -8.579343557357788e-05, -8.184835314750671e-05, -7.790327072143555e-05, -7.395818829536438e-05, -7.001310586929321e-05, -6.606802344322205e-05, -6.212294101715088e-05, -5.817785859107971e-05, -5.4232776165008545e-05, -5.028769373893738e-05, -4.634261131286621e-05, -4.2397528886795044e-05, -3.845244646072388e-05, -3.450736403465271e-05, -3.056228160858154e-05, -2.6617199182510376e-05, -2.267211675643921e-05, -1.8727034330368042e-05, -1.4781951904296875e-05, -1.0836869478225708e-05, -6.891787052154541e-06, -2.946704626083374e-06, 9.98377799987793e-07, 4.94346022605896e-06, 8.888542652130127e-06, 1.2833625078201294e-05, 1.677870750427246e-05, 2.0723789930343628e-05, 2.4668872356414795e-05, 2.8613954782485962e-05, 3.255903720855713e-05, 3.6504119634628296e-05, 4.044920206069946e-05, 4.439428448677063e-05, 4.83393669128418e-05, 5.2284449338912964e-05, 5.622953176498413e-05, 6.01746141910553e-05, 6.411969661712646e-05, 6.806477904319763e-05, 7.20098614692688e-05, 7.595494389533997e-05, 7.990002632141113e-05, 8.38451087474823e-05, 8.779019117355347e-05, 9.173527359962463e-05, 9.56803560256958e-05, 9.962543845176697e-05, 0.00010357052087783813, 0.0001075156033039093, 0.00011146068572998047]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 7.0, 10.0, 11.0, 10.0, 17.0, 19.0, 16.0, 30.0, 27.0, 29.0, 46.0, 34.0, 42.0, 37.0, 34.0, 46.0, 41.0, 53.0, 36.0, 46.0, 51.0, 40.0, 30.0, 49.0, 24.0, 36.0, 34.0, 15.0, 23.0, 17.0, 18.0, 7.0, 15.0, 8.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.37109375, -5.17547607421875, -4.9798583984375, -4.78424072265625, -4.588623046875, -4.39300537109375, -4.1973876953125, -4.00177001953125, -3.80615234375, -3.61053466796875, -3.4149169921875, -3.21929931640625, -3.023681640625, -2.82806396484375, -2.6324462890625, -2.43682861328125, -2.2412109375, -2.04559326171875, -1.8499755859375, -1.65435791015625, -1.458740234375, -1.26312255859375, -1.0675048828125, -0.87188720703125, -0.67626953125, -0.48065185546875, -0.2850341796875, -0.08941650390625, 0.106201171875, 0.30181884765625, 0.4974365234375, 0.69305419921875, 0.888671875, 1.08428955078125, 1.2799072265625, 1.47552490234375, 1.671142578125, 1.86676025390625, 2.0623779296875, 2.25799560546875, 2.45361328125, 2.64923095703125, 2.8448486328125, 3.04046630859375, 3.236083984375, 3.43170166015625, 3.6273193359375, 3.82293701171875, 4.0185546875, 4.21417236328125, 4.4097900390625, 4.60540771484375, 4.801025390625, 4.99664306640625, 5.1922607421875, 5.38787841796875, 5.58349609375, 5.77911376953125, 5.9747314453125, 6.17034912109375, 6.365966796875, 6.56158447265625, 6.7572021484375, 6.95281982421875, 7.1484375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 6.0, 9.0, 18.0, 27.0, 32.0, 57.0, 76.0, 121.0, 171.0, 292.0, 453.0, 812.0, 1564.0, 3022.0, 5948.0, 11963.0, 24270.0, 48092.0, 96422.0, 187214.0, 273885.0, 192431.0, 100109.0, 50721.0, 25394.0, 12533.0, 6141.0, 3019.0, 1566.0, 864.0, 481.0, 307.0, 161.0, 113.0, 99.0, 55.0, 43.0, 23.0, 17.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9296875, -4.77813720703125, -4.6265869140625, -4.47503662109375, -4.323486328125, -4.17193603515625, -4.0203857421875, -3.86883544921875, -3.71728515625, -3.56573486328125, -3.4141845703125, -3.26263427734375, -3.111083984375, -2.95953369140625, -2.8079833984375, -2.65643310546875, -2.5048828125, -2.35333251953125, -2.2017822265625, -2.05023193359375, -1.898681640625, -1.74713134765625, -1.5955810546875, -1.44403076171875, -1.29248046875, -1.14093017578125, -0.9893798828125, -0.83782958984375, -0.686279296875, -0.53472900390625, -0.3831787109375, -0.23162841796875, -0.080078125, 0.07147216796875, 0.2230224609375, 0.37457275390625, 0.526123046875, 0.67767333984375, 0.8292236328125, 0.98077392578125, 1.13232421875, 1.28387451171875, 1.4354248046875, 1.58697509765625, 1.738525390625, 1.89007568359375, 2.0416259765625, 2.19317626953125, 2.3447265625, 2.49627685546875, 2.6478271484375, 2.79937744140625, 2.950927734375, 3.10247802734375, 3.2540283203125, 3.40557861328125, 3.55712890625, 3.70867919921875, 3.8602294921875, 4.01177978515625, 4.163330078125, 4.31488037109375, 4.4664306640625, 4.61798095703125, 4.76953125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 7.0, 14.0, 11.0, 18.0, 13.0, 27.0, 17.0, 28.0, 39.0, 45.0, 45.0, 51.0, 59.0, 76.0, 115.0, 282.0, 1443.0, 241.0, 99.0, 53.0, 56.0, 49.0, 36.0, 41.0, 28.0, 25.0, 10.0, 27.0, 16.0, 14.0, 9.0, 9.0, 8.0, 4.0, 6.0, 8.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-26.96875, -26.22802734375, -25.4873046875, -24.74658203125, -24.005859375, -23.26513671875, -22.5244140625, -21.78369140625, -21.04296875, -20.30224609375, -19.5615234375, -18.82080078125, -18.080078125, -17.33935546875, -16.5986328125, -15.85791015625, -15.1171875, -14.37646484375, -13.6357421875, -12.89501953125, -12.154296875, -11.41357421875, -10.6728515625, -9.93212890625, -9.19140625, -8.45068359375, -7.7099609375, -6.96923828125, -6.228515625, -5.48779296875, -4.7470703125, -4.00634765625, -3.265625, -2.52490234375, -1.7841796875, -1.04345703125, -0.302734375, 0.43798828125, 1.1787109375, 1.91943359375, 2.66015625, 3.40087890625, 4.1416015625, 4.88232421875, 5.623046875, 6.36376953125, 7.1044921875, 7.84521484375, 8.5859375, 9.32666015625, 10.0673828125, 10.80810546875, 11.548828125, 12.28955078125, 13.0302734375, 13.77099609375, 14.51171875, 15.25244140625, 15.9931640625, 16.73388671875, 17.474609375, 18.21533203125, 18.9560546875, 19.69677734375, 20.4375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 11.0, 13.0, 25.0, 24.0, 48.0, 50.0, 87.0, 118.0, 193.0, 348.0, 848.0, 16205.0, 3120571.0, 5613.0, 693.0, 308.0, 183.0, 111.0, 82.0, 60.0, 39.0, 26.0, 13.0, 11.0, 4.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.0, -76.1171875, -73.234375, -70.3515625, -67.46875, -64.5859375, -61.703125, -58.8203125, -55.9375, -53.0546875, -50.171875, -47.2890625, -44.40625, -41.5234375, -38.640625, -35.7578125, -32.875, -29.9921875, -27.109375, -24.2265625, -21.34375, -18.4609375, -15.578125, -12.6953125, -9.8125, -6.9296875, -4.046875, -1.1640625, 1.71875, 4.6015625, 7.484375, 10.3671875, 13.25, 16.1328125, 19.015625, 21.8984375, 24.78125, 27.6640625, 30.546875, 33.4296875, 36.3125, 39.1953125, 42.078125, 44.9609375, 47.84375, 50.7265625, 53.609375, 56.4921875, 59.375, 62.2578125, 65.140625, 68.0234375, 70.90625, 73.7890625, 76.671875, 79.5546875, 82.4375, 85.3203125, 88.203125, 91.0859375, 93.96875, 96.8515625, 99.734375, 102.6171875, 105.5]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 26.0, 181.0, 453.0, 296.0, 52.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-186.2519989013672, -182.5824432373047, -178.91290283203125, -175.24334716796875, -171.5738067626953, -167.9042510986328, -164.23471069335938, -160.56515502929688, -156.89559936523438, -153.22604370117188, -149.55650329589844, -145.88694763183594, -142.2174072265625, -138.5478515625, -134.87831115722656, -131.20875549316406, -127.53921508789062, -123.86966705322266, -120.20011901855469, -116.53057098388672, -112.86102294921875, -109.19146728515625, -105.52191925048828, -101.85237121582031, -98.18282318115234, -94.51327514648438, -90.8437271118164, -87.17417907714844, -83.50462341308594, -79.8350830078125, -76.16552734375, -72.49597930908203, -68.8264389038086, -65.15689086914062, -61.487342834472656, -57.81779098510742, -54.14824295043945, -50.478694915771484, -46.80914306640625, -43.13959503173828, -39.47004699707031, -35.800498962402344, -32.130950927734375, -28.46139907836914, -24.791851043701172, -21.122303009033203, -17.4527530670166, -13.783203125, -10.113655090332031, -6.444106101989746, -2.774557113647461, 0.8949918746948242, 4.564540863037109, 8.234088897705078, 11.90363883972168, 15.573188781738281, 19.24273681640625, 22.91228485107422, 26.58183479309082, 30.251384735107422, 33.92093276977539, 37.59048080444336, 41.260032653808594, 44.92958068847656, 48.59912872314453]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 6.0, 9.0, 8.0, 12.0, 16.0, 16.0, 20.0, 16.0, 20.0, 31.0, 19.0, 30.0, 24.0, 32.0, 27.0, 26.0, 32.0, 47.0, 39.0, 35.0, 30.0, 50.0, 33.0, 33.0, 42.0, 35.0, 36.0, 29.0, 40.0, 24.0, 20.0, 19.0, 19.0, 22.0, 14.0, 17.0, 16.0, 8.0, 5.0, 9.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-41.673072814941406, -40.20881271362305, -38.74455261230469, -37.28029251098633, -35.81603240966797, -34.351776123046875, -32.88751220703125, -31.423255920410156, -29.958995819091797, -28.494735717773438, -27.030475616455078, -25.56621551513672, -24.101957321166992, -22.637697219848633, -21.173437118530273, -19.709178924560547, -18.244916915893555, -16.780656814575195, -15.316397666931152, -13.852137565612793, -12.38787841796875, -10.92361831665039, -9.459358215332031, -7.995099067687988, -6.530838966369629, -5.066579341888428, -3.6023194789886475, -2.138059616088867, -0.673799991607666, 0.7904596328735352, 2.2547197341918945, 3.7189788818359375, 5.183238983154297, 6.647498607635498, 8.1117582321167, 9.576018333435059, 11.040277481079102, 12.504537582397461, 13.96879768371582, 15.433056831359863, 16.897315979003906, 18.361576080322266, 19.825836181640625, 21.290096282958984, 22.75435447692871, 24.21861457824707, 25.68287467956543, 27.147132873535156, 28.61139488220215, 30.075654983520508, 31.539915084838867, 33.004173278808594, 34.46843338012695, 35.93269348144531, 37.39695358276367, 38.86121368408203, 40.32547378540039, 41.78973388671875, 43.25399398803711, 44.71825408935547, 46.18251419067383, 47.64677429199219, 49.11103057861328, 50.57529067993164, 52.03955078125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 12.0, 9.0, 12.0, 12.0, 13.0, 12.0, 21.0, 18.0, 27.0, 27.0, 29.0, 35.0, 41.0, 45.0, 35.0, 41.0, 48.0, 46.0, 36.0, 36.0, 36.0, 47.0, 44.0, 42.0, 29.0, 36.0, 28.0, 22.0, 26.0, 27.0, 14.0, 15.0, 11.0, 9.0, 12.0, 11.0, 10.0, 3.0, 7.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.234375, -5.02911376953125, -4.8238525390625, -4.61859130859375, -4.413330078125, -4.20806884765625, -4.0028076171875, -3.79754638671875, -3.59228515625, -3.38702392578125, -3.1817626953125, -2.97650146484375, -2.771240234375, -2.56597900390625, -2.3607177734375, -2.15545654296875, -1.9501953125, -1.74493408203125, -1.5396728515625, -1.33441162109375, -1.129150390625, -0.92388916015625, -0.7186279296875, -0.51336669921875, -0.30810546875, -0.10284423828125, 0.1024169921875, 0.30767822265625, 0.512939453125, 0.71820068359375, 0.9234619140625, 1.12872314453125, 1.333984375, 1.53924560546875, 1.7445068359375, 1.94976806640625, 2.155029296875, 2.36029052734375, 2.5655517578125, 2.77081298828125, 2.97607421875, 3.18133544921875, 3.3865966796875, 3.59185791015625, 3.797119140625, 4.00238037109375, 4.2076416015625, 4.41290283203125, 4.6181640625, 4.82342529296875, 5.0286865234375, 5.23394775390625, 5.439208984375, 5.64447021484375, 5.8497314453125, 6.05499267578125, 6.26025390625, 6.46551513671875, 6.6707763671875, 6.87603759765625, 7.081298828125, 7.28656005859375, 7.4918212890625, 7.69708251953125, 7.90234375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 3.0, 6.0, 4.0, 9.0, 11.0, 9.0, 11.0, 11.0, 19.0, 16.0, 20.0, 25.0, 29.0, 42.0, 62.0, 74.0, 132.0, 211.0, 457.0, 1852.0, 31113.0, 1593559.0, 2497739.0, 65041.0, 2586.0, 522.0, 214.0, 129.0, 86.0, 64.0, 45.0, 25.0, 30.0, 25.0, 16.0, 17.0, 16.0, 6.0, 11.0, 7.0, 10.0, 4.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.15625, -17.432861328125, -16.70947265625, -15.986083984375, -15.2626953125, -14.539306640625, -13.81591796875, -13.092529296875, -12.369140625, -11.645751953125, -10.92236328125, -10.198974609375, -9.4755859375, -8.752197265625, -8.02880859375, -7.305419921875, -6.58203125, -5.858642578125, -5.13525390625, -4.411865234375, -3.6884765625, -2.965087890625, -2.24169921875, -1.518310546875, -0.794921875, -0.071533203125, 0.65185546875, 1.375244140625, 2.0986328125, 2.822021484375, 3.54541015625, 4.268798828125, 4.9921875, 5.715576171875, 6.43896484375, 7.162353515625, 7.8857421875, 8.609130859375, 9.33251953125, 10.055908203125, 10.779296875, 11.502685546875, 12.22607421875, 12.949462890625, 13.6728515625, 14.396240234375, 15.11962890625, 15.843017578125, 16.56640625, 17.289794921875, 18.01318359375, 18.736572265625, 19.4599609375, 20.183349609375, 20.90673828125, 21.630126953125, 22.353515625, 23.076904296875, 23.80029296875, 24.523681640625, 25.2470703125, 25.970458984375, 26.69384765625, 27.417236328125, 28.140625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 13.0, 8.0, 11.0, 17.0, 29.0, 28.0, 64.0, 74.0, 93.0, 116.0, 177.0, 214.0, 268.0, 349.0, 396.0, 450.0, 379.0, 350.0, 264.0, 201.0, 153.0, 101.0, 70.0, 49.0, 49.0, 30.0, 26.0, 17.0, 19.0, 19.0, 6.0, 3.0, 4.0, 5.0, 4.0, 1.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8828125, -11.47802734375, -11.0732421875, -10.66845703125, -10.263671875, -9.85888671875, -9.4541015625, -9.04931640625, -8.64453125, -8.23974609375, -7.8349609375, -7.43017578125, -7.025390625, -6.62060546875, -6.2158203125, -5.81103515625, -5.40625, -5.00146484375, -4.5966796875, -4.19189453125, -3.787109375, -3.38232421875, -2.9775390625, -2.57275390625, -2.16796875, -1.76318359375, -1.3583984375, -0.95361328125, -0.548828125, -0.14404296875, 0.2607421875, 0.66552734375, 1.0703125, 1.47509765625, 1.8798828125, 2.28466796875, 2.689453125, 3.09423828125, 3.4990234375, 3.90380859375, 4.30859375, 4.71337890625, 5.1181640625, 5.52294921875, 5.927734375, 6.33251953125, 6.7373046875, 7.14208984375, 7.546875, 7.95166015625, 8.3564453125, 8.76123046875, 9.166015625, 9.57080078125, 9.9755859375, 10.38037109375, 10.78515625, 11.18994140625, 11.5947265625, 11.99951171875, 12.404296875, 12.80908203125, 13.2138671875, 13.61865234375, 14.0234375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 10.0, 12.0, 18.0, 22.0, 19.0, 26.0, 43.0, 60.0, 75.0, 105.0, 140.0, 226.0, 409.0, 1203.0, 21308.0, 3695242.0, 470263.0, 3517.0, 627.0, 273.0, 216.0, 143.0, 82.0, 75.0, 46.0, 41.0, 21.0, 17.0, 14.0, 9.0, 11.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.128173828125, -28.52197265625, -26.915771484375, -25.3095703125, -23.703369140625, -22.09716796875, -20.490966796875, -18.884765625, -17.278564453125, -15.67236328125, -14.066162109375, -12.4599609375, -10.853759765625, -9.24755859375, -7.641357421875, -6.03515625, -4.428955078125, -2.82275390625, -1.216552734375, 0.3896484375, 1.995849609375, 3.60205078125, 5.208251953125, 6.814453125, 8.420654296875, 10.02685546875, 11.633056640625, 13.2392578125, 14.845458984375, 16.45166015625, 18.057861328125, 19.6640625, 21.270263671875, 22.87646484375, 24.482666015625, 26.0888671875, 27.695068359375, 29.30126953125, 30.907470703125, 32.513671875, 34.119873046875, 35.72607421875, 37.332275390625, 38.9384765625, 40.544677734375, 42.15087890625, 43.757080078125, 45.36328125, 46.969482421875, 48.57568359375, 50.181884765625, 51.7880859375, 53.394287109375, 55.00048828125, 56.606689453125, 58.212890625, 59.819091796875, 61.42529296875, 63.031494140625, 64.6376953125, 66.243896484375, 67.85009765625, 69.456298828125, 71.0625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 20.0, 48.0, 94.0, 151.0, 205.0, 182.0, 170.0, 79.0, 40.0, 11.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.94778442382812, -84.80497741699219, -81.66217803955078, -78.51937103271484, -75.3765640258789, -72.2337646484375, -69.09095764160156, -65.94815063476562, -62.80534744262695, -59.66254425048828, -56.519737243652344, -53.37693405151367, -50.234130859375, -47.09132385253906, -43.94852066040039, -40.80571746826172, -37.66291046142578, -34.52010726928711, -31.377300262451172, -28.2344970703125, -25.091691970825195, -21.94888687133789, -18.80608367919922, -15.663278579711914, -12.52047348022461, -9.377668380737305, -6.234864234924316, -3.092060089111328, 0.05074501037597656, 3.1935501098632812, 6.336353302001953, 9.479158401489258, 12.621955871582031, 15.764760971069336, 18.90756607055664, 22.050369262695312, 25.193174362182617, 28.335979461669922, 31.478782653808594, 34.62158966064453, 37.7643928527832, 40.907196044921875, 44.05000305175781, 47.192806243896484, 50.335609436035156, 53.478416442871094, 56.621219635009766, 59.76402282714844, 62.906829833984375, 66.04963684082031, 69.19243621826172, 72.33524322509766, 75.4780502319336, 78.620849609375, 81.76365661621094, 84.90646362304688, 88.04927062988281, 91.19207763671875, 94.33487701416016, 97.4776840209961, 100.62049102783203, 103.76329040527344, 106.90609741210938, 110.04890441894531, 113.19170379638672]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 12.0, 8.0, 12.0, 12.0, 19.0, 20.0, 15.0, 29.0, 25.0, 22.0, 30.0, 32.0, 28.0, 41.0, 31.0, 35.0, 59.0, 37.0, 37.0, 44.0, 37.0, 38.0, 47.0, 25.0, 35.0, 31.0, 26.0, 27.0, 24.0, 21.0, 26.0, 20.0, 17.0, 14.0, 11.0, 7.0, 11.0, 5.0, 6.0, 8.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.784873962402344, -39.405967712402344, -38.027061462402344, -36.648155212402344, -35.26924514770508, -33.89033889770508, -32.51143264770508, -31.132526397705078, -29.753618240356445, -28.374711990356445, -26.995803833007812, -25.616897583007812, -24.237991333007812, -22.85908317565918, -21.48017692565918, -20.101268768310547, -18.722362518310547, -17.343456268310547, -15.964548110961914, -14.585641860961914, -13.206734657287598, -11.827827453613281, -10.448921203613281, -9.070013999938965, -7.691106796264648, -6.312199592590332, -4.933292865753174, -3.5543861389160156, -2.175478935241699, -0.7965717315673828, 0.5823345184326172, 1.9612417221069336, 3.34014892578125, 4.719056129455566, 6.097962856292725, 7.476869583129883, 8.8557767868042, 10.234683990478516, 11.613590240478516, 12.992497444152832, 14.371404647827148, 15.750311851501465, 17.12921905517578, 18.50812530517578, 19.88703155517578, 21.265939712524414, 22.644845962524414, 24.023754119873047, 25.402660369873047, 26.781566619873047, 28.16047477722168, 29.53938102722168, 30.918289184570312, 32.29719543457031, 33.67610168457031, 35.05500793457031, 36.43391418457031, 37.81282043457031, 39.19172668457031, 40.57063293457031, 41.94954299926758, 43.32844924926758, 44.70735549926758, 46.08626174926758, 47.465171813964844]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 8.0, 14.0, 16.0, 10.0, 13.0, 21.0, 31.0, 32.0, 28.0, 32.0, 47.0, 44.0, 46.0, 47.0, 37.0, 38.0, 52.0, 39.0, 50.0, 39.0, 41.0, 40.0, 43.0, 31.0, 31.0, 35.0, 28.0, 25.0, 19.0, 16.0, 7.0, 7.0, 6.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.640625, -5.420654296875, -5.20068359375, -4.980712890625, -4.7607421875, -4.540771484375, -4.32080078125, -4.100830078125, -3.880859375, -3.660888671875, -3.44091796875, -3.220947265625, -3.0009765625, -2.781005859375, -2.56103515625, -2.341064453125, -2.12109375, -1.901123046875, -1.68115234375, -1.461181640625, -1.2412109375, -1.021240234375, -0.80126953125, -0.581298828125, -0.361328125, -0.141357421875, 0.07861328125, 0.298583984375, 0.5185546875, 0.738525390625, 0.95849609375, 1.178466796875, 1.3984375, 1.618408203125, 1.83837890625, 2.058349609375, 2.2783203125, 2.498291015625, 2.71826171875, 2.938232421875, 3.158203125, 3.378173828125, 3.59814453125, 3.818115234375, 4.0380859375, 4.258056640625, 4.47802734375, 4.697998046875, 4.91796875, 5.137939453125, 5.35791015625, 5.577880859375, 5.7978515625, 6.017822265625, 6.23779296875, 6.457763671875, 6.677734375, 6.897705078125, 7.11767578125, 7.337646484375, 7.5576171875, 7.777587890625, 7.99755859375, 8.217529296875, 8.4375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 0.0, 4.0, 9.0, 11.0, 16.0, 29.0, 39.0, 70.0, 106.0, 150.0, 255.0, 428.0, 693.0, 1119.0, 1922.0, 3367.0, 5754.0, 9861.0, 17458.0, 31435.0, 58223.0, 115589.0, 324772.0, 253414.0, 103910.0, 52941.0, 28669.0, 16248.0, 9008.0, 5268.0, 3072.0, 1781.0, 1113.0, 682.0, 414.0, 245.0, 167.0, 108.0, 67.0, 49.0, 32.0, 17.0, 18.0, 7.0, 5.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.20703125, -2.137908935546875, -2.06878662109375, -1.999664306640625, -1.9305419921875, -1.861419677734375, -1.79229736328125, -1.723175048828125, -1.654052734375, -1.584930419921875, -1.51580810546875, -1.446685791015625, -1.3775634765625, -1.308441162109375, -1.23931884765625, -1.170196533203125, -1.10107421875, -1.031951904296875, -0.96282958984375, -0.893707275390625, -0.8245849609375, -0.755462646484375, -0.68634033203125, -0.617218017578125, -0.548095703125, -0.478973388671875, -0.40985107421875, -0.340728759765625, -0.2716064453125, -0.202484130859375, -0.13336181640625, -0.064239501953125, 0.0048828125, 0.074005126953125, 0.14312744140625, 0.212249755859375, 0.2813720703125, 0.350494384765625, 0.41961669921875, 0.488739013671875, 0.557861328125, 0.626983642578125, 0.69610595703125, 0.765228271484375, 0.8343505859375, 0.903472900390625, 0.97259521484375, 1.041717529296875, 1.11083984375, 1.179962158203125, 1.24908447265625, 1.318206787109375, 1.3873291015625, 1.456451416015625, 1.52557373046875, 1.594696044921875, 1.663818359375, 1.732940673828125, 1.80206298828125, 1.871185302734375, 1.9403076171875, 2.009429931640625, 2.07855224609375, 2.147674560546875, 2.216796875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 2.0, 10.0, 3.0, 10.0, 10.0, 16.0, 11.0, 10.0, 13.0, 26.0, 21.0, 29.0, 22.0, 31.0, 36.0, 43.0, 45.0, 31.0, 45.0, 52.0, 1061.0, 43.0, 46.0, 42.0, 37.0, 28.0, 34.0, 32.0, 36.0, 29.0, 16.0, 27.0, 25.0, 15.0, 21.0, 5.0, 11.0, 11.0, 6.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.748046875, -3.625885009765625, -3.50372314453125, -3.381561279296875, -3.2593994140625, -3.137237548828125, -3.01507568359375, -2.892913818359375, -2.770751953125, -2.648590087890625, -2.52642822265625, -2.404266357421875, -2.2821044921875, -2.159942626953125, -2.03778076171875, -1.915618896484375, -1.79345703125, -1.671295166015625, -1.54913330078125, -1.426971435546875, -1.3048095703125, -1.182647705078125, -1.06048583984375, -0.938323974609375, -0.816162109375, -0.694000244140625, -0.57183837890625, -0.449676513671875, -0.3275146484375, -0.205352783203125, -0.08319091796875, 0.038970947265625, 0.1611328125, 0.283294677734375, 0.40545654296875, 0.527618408203125, 0.6497802734375, 0.771942138671875, 0.89410400390625, 1.016265869140625, 1.138427734375, 1.260589599609375, 1.38275146484375, 1.504913330078125, 1.6270751953125, 1.749237060546875, 1.87139892578125, 1.993560791015625, 2.11572265625, 2.237884521484375, 2.36004638671875, 2.482208251953125, 2.6043701171875, 2.726531982421875, 2.84869384765625, 2.970855712890625, 3.093017578125, 3.215179443359375, 3.33734130859375, 3.459503173828125, 3.5816650390625, 3.703826904296875, 3.82598876953125, 3.948150634765625, 4.0703125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 7.0, 2.0, 9.0, 23.0, 17.0, 27.0, 52.0, 67.0, 102.0, 136.0, 227.0, 315.0, 434.0, 659.0, 926.0, 1356.0, 1894.0, 2679.0, 3978.0, 5845.0, 8358.0, 12639.0, 19207.0, 28863.0, 45508.0, 72329.0, 125248.0, 1363377.0, 162598.0, 85902.0, 53132.0, 34152.0, 21796.0, 14425.0, 9698.0, 6480.0, 4485.0, 3090.0, 2156.0, 1474.0, 1035.0, 744.0, 546.0, 373.0, 241.0, 175.0, 124.0, 83.0, 51.0, 37.0, 24.0, 15.0, 10.0, 3.0, 8.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.408203125, -1.3622894287109375, -1.316375732421875, -1.2704620361328125, -1.22454833984375, -1.1786346435546875, -1.132720947265625, -1.0868072509765625, -1.0408935546875, -0.9949798583984375, -0.949066162109375, -0.9031524658203125, -0.85723876953125, -0.8113250732421875, -0.765411376953125, -0.7194976806640625, -0.673583984375, -0.6276702880859375, -0.581756591796875, -0.5358428955078125, -0.48992919921875, -0.4440155029296875, -0.398101806640625, -0.3521881103515625, -0.3062744140625, -0.2603607177734375, -0.214447021484375, -0.1685333251953125, -0.12261962890625, -0.0767059326171875, -0.030792236328125, 0.0151214599609375, 0.06103515625, 0.1069488525390625, 0.152862548828125, 0.1987762451171875, 0.24468994140625, 0.2906036376953125, 0.336517333984375, 0.3824310302734375, 0.4283447265625, 0.4742584228515625, 0.520172119140625, 0.5660858154296875, 0.61199951171875, 0.6579132080078125, 0.703826904296875, 0.7497406005859375, 0.795654296875, 0.8415679931640625, 0.887481689453125, 0.9333953857421875, 0.97930908203125, 1.0252227783203125, 1.071136474609375, 1.1170501708984375, 1.1629638671875, 1.2088775634765625, 1.254791259765625, 1.3007049560546875, 1.34661865234375, 1.3925323486328125, 1.438446044921875, 1.4843597412109375, 1.5302734375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 7.0, 9.0, 12.0, 10.0, 9.0, 15.0, 21.0, 24.0, 21.0, 43.0, 50.0, 77.0, 78.0, 106.0, 90.0, 94.0, 55.0, 48.0, 34.0, 35.0, 27.0, 22.0, 15.0, 10.0, 13.0, 8.0, 12.0, 11.0, 6.0, 6.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00024127960205078125, -0.00023292377591133118, -0.0002245679497718811, -0.00021621212363243103, -0.00020785629749298096, -0.00019950047135353088, -0.0001911446452140808, -0.00018278881907463074, -0.00017443299293518066, -0.0001660771667957306, -0.00015772134065628052, -0.00014936551451683044, -0.00014100968837738037, -0.0001326538622379303, -0.00012429803609848022, -0.00011594220995903015, -0.00010758638381958008, -9.923055768013e-05, -9.087473154067993e-05, -8.251890540122986e-05, -7.416307926177979e-05, -6.580725312232971e-05, -5.745142698287964e-05, -4.9095600843429565e-05, -4.073977470397949e-05, -3.238394856452942e-05, -2.4028122425079346e-05, -1.5672296285629272e-05, -7.316470146179199e-06, 1.039355993270874e-06, 9.395182132720947e-06, 1.775100827217102e-05, 2.6106834411621094e-05, 3.446266055107117e-05, 4.281848669052124e-05, 5.1174312829971313e-05, 5.953013896942139e-05, 6.788596510887146e-05, 7.624179124832153e-05, 8.45976173877716e-05, 9.295344352722168e-05, 0.00010130926966667175, 0.00010966509580612183, 0.0001180209219455719, 0.00012637674808502197, 0.00013473257422447205, 0.00014308840036392212, 0.0001514442265033722, 0.00015980005264282227, 0.00016815587878227234, 0.0001765117049217224, 0.00018486753106117249, 0.00019322335720062256, 0.00020157918334007263, 0.0002099350094795227, 0.00021829083561897278, 0.00022664666175842285, 0.00023500248789787292, 0.000243358314037323, 0.00025171414017677307, 0.00026006996631622314, 0.0002684257924556732, 0.0002767816185951233, 0.00028513744473457336, 0.00029349327087402344]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 10.0, 12.0, 21.0, 16.0, 21.0, 28.0, 38.0, 71.0, 96.0, 174.0, 367.0, 1013.0, 171868.0, 872390.0, 1399.0, 469.0, 223.0, 93.0, 65.0, 40.0, 25.0, 21.0, 21.0, 17.0, 15.0, 6.0, 4.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.007110595703125, -0.006908059120178223, -0.006705522537231445, -0.006502985954284668, -0.006300449371337891, -0.006097912788391113, -0.005895376205444336, -0.005692839622497559, -0.005490303039550781, -0.005287766456604004, -0.0050852298736572266, -0.004882693290710449, -0.004680156707763672, -0.0044776201248168945, -0.004275083541870117, -0.00407254695892334, -0.0038700103759765625, -0.003667473793029785, -0.003464937210083008, -0.0032624006271362305, -0.003059864044189453, -0.0028573274612426758, -0.0026547908782958984, -0.002452254295349121, -0.0022497177124023438, -0.0020471811294555664, -0.001844644546508789, -0.0016421079635620117, -0.0014395713806152344, -0.001237034797668457, -0.0010344982147216797, -0.0008319616317749023, -0.000629425048828125, -0.00042688846588134766, -0.0002243518829345703, -2.181529998779297e-05, 0.00018072128295898438, 0.0003832578659057617, 0.0005857944488525391, 0.0007883310317993164, 0.0009908676147460938, 0.001193404197692871, 0.0013959407806396484, 0.0015984773635864258, 0.0018010139465332031, 0.0020035505294799805, 0.002206087112426758, 0.002408623695373535, 0.0026111602783203125, 0.00281369686126709, 0.003016233444213867, 0.0032187700271606445, 0.003421306610107422, 0.0036238431930541992, 0.0038263797760009766, 0.004028916358947754, 0.004231452941894531, 0.004433989524841309, 0.004636526107788086, 0.004839062690734863, 0.005041599273681641, 0.005244135856628418, 0.005446672439575195, 0.005649209022521973, 0.00585174560546875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 155.0, 514.0, 307.0, 32.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001896093599498272, -0.00016496184980496764, -0.0001403143396601081, -0.00011566683679120615, -9.10193266463466e-05, -6.637182377744466e-05, -4.172431363258511e-05, -1.7076803487725556e-05, 7.5707066571339965e-06, 3.221821680199355e-05, 5.6865723308874294e-05, 8.151322981575504e-05, 0.00010616073996061459, 0.00013080824282951653, 0.00015545575297437608, 0.00018010326311923563, 0.0002047507732640952, 0.00022939828340895474, 0.0002540457935538143, 0.00027869330369867384, 0.0003033408138435334, 0.0003279882948845625, 0.00035263580502942204, 0.0003772833151742816, 0.00040193082531914115, 0.0004265783354640007, 0.00045122584560886025, 0.0004758733557537198, 0.0005005208658985794, 0.0005251683760434389, 0.0005498158861882985, 0.000574463396333158, 0.0005991109064780176, 0.0006237584166228771, 0.0006484059267677367, 0.0006730534369125962, 0.0006977009470574558, 0.0007223484572023153, 0.0007469959673471749, 0.0007716434774920344, 0.000796290987636894, 0.0008209384977817535, 0.0008455860079266131, 0.0008702335180714726, 0.0008948810282163322, 0.0009195285383611917, 0.0009441760485060513, 0.0009688235586509109, 0.0009934710105881095, 0.0010181184625253081, 0.0010427660308778286, 0.0010674134828150272, 0.0010920610511675477, 0.0011167085031047463, 0.0011413560714572668, 0.0011660035233944654, 0.001190651091746986, 0.0012152985436841846, 0.001239946112036705, 0.0012645935639739037, 0.0012892411323264241, 0.0013138885842636228, 0.0013385361526161432, 0.0013631836045533419, 0.0013878311729058623]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 14.0, 23.0, 14.0, 24.0, 21.0, 24.0, 25.0, 27.0, 27.0, 35.0, 31.0, 25.0, 37.0, 43.0, 45.0, 49.0, 34.0, 37.0, 34.0, 37.0, 27.0, 34.0, 34.0, 32.0, 36.0, 20.0, 20.0, 16.0, 24.0, 23.0, 24.0, 16.0, 10.0, 12.0, 12.0, 5.0, 4.0, 6.0, 2.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.00013256072998046875, -0.00012884102761745453, -0.0001251213252544403, -0.00012140162289142609, -0.00011768192052841187, -0.00011396221816539764, -0.00011024251580238342, -0.0001065228134393692, -0.00010280311107635498, -9.908340871334076e-05, -9.536370635032654e-05, -9.164400398731232e-05, -8.79243016242981e-05, -8.420459926128387e-05, -8.048489689826965e-05, -7.676519453525543e-05, -7.304549217224121e-05, -6.932578980922699e-05, -6.560608744621277e-05, -6.188638508319855e-05, -5.8166682720184326e-05, -5.4446980357170105e-05, -5.0727277994155884e-05, -4.700757563114166e-05, -4.328787326812744e-05, -3.956817090511322e-05, -3.5848468542099e-05, -3.212876617908478e-05, -2.8409063816070557e-05, -2.4689361453056335e-05, -2.0969659090042114e-05, -1.7249956727027893e-05, -1.3530254364013672e-05, -9.81055200099945e-06, -6.0908496379852295e-06, -2.3711472749710083e-06, 1.3485550880432129e-06, 5.068257451057434e-06, 8.787959814071655e-06, 1.2507662177085876e-05, 1.6227364540100098e-05, 1.994706690311432e-05, 2.366676926612854e-05, 2.738647162914276e-05, 3.110617399215698e-05, 3.4825876355171204e-05, 3.8545578718185425e-05, 4.2265281081199646e-05, 4.598498344421387e-05, 4.970468580722809e-05, 5.342438817024231e-05, 5.714409053325653e-05, 6.086379289627075e-05, 6.458349525928497e-05, 6.83031976222992e-05, 7.202289998531342e-05, 7.574260234832764e-05, 7.946230471134186e-05, 8.318200707435608e-05, 8.69017094373703e-05, 9.062141180038452e-05, 9.434111416339874e-05, 9.806081652641296e-05, 0.00010178051888942719, 0.0001055002212524414]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 8.0, 14.0, 16.0, 10.0, 13.0, 21.0, 31.0, 32.0, 28.0, 32.0, 47.0, 44.0, 46.0, 47.0, 37.0, 38.0, 52.0, 39.0, 50.0, 39.0, 41.0, 40.0, 43.0, 31.0, 31.0, 35.0, 28.0, 25.0, 19.0, 16.0, 7.0, 7.0, 6.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.640625, -5.420654296875, -5.20068359375, -4.980712890625, -4.7607421875, -4.540771484375, -4.32080078125, -4.100830078125, -3.880859375, -3.660888671875, -3.44091796875, -3.220947265625, -3.0009765625, -2.781005859375, -2.56103515625, -2.341064453125, -2.12109375, -1.901123046875, -1.68115234375, -1.461181640625, -1.2412109375, -1.021240234375, -0.80126953125, -0.581298828125, -0.361328125, -0.141357421875, 0.07861328125, 0.298583984375, 0.5185546875, 0.738525390625, 0.95849609375, 1.178466796875, 1.3984375, 1.618408203125, 1.83837890625, 2.058349609375, 2.2783203125, 2.498291015625, 2.71826171875, 2.938232421875, 3.158203125, 3.378173828125, 3.59814453125, 3.818115234375, 4.0380859375, 4.258056640625, 4.47802734375, 4.697998046875, 4.91796875, 5.137939453125, 5.35791015625, 5.577880859375, 5.7978515625, 6.017822265625, 6.23779296875, 6.457763671875, 6.677734375, 6.897705078125, 7.11767578125, 7.337646484375, 7.5576171875, 7.777587890625, 7.99755859375, 8.217529296875, 8.4375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 8.0, 9.0, 18.0, 21.0, 32.0, 38.0, 49.0, 69.0, 76.0, 144.0, 192.0, 271.0, 441.0, 715.0, 1306.0, 3101.0, 7696.0, 21755.0, 60946.0, 168880.0, 433247.0, 224653.0, 78659.0, 28431.0, 10100.0, 3720.0, 1577.0, 866.0, 511.0, 308.0, 196.0, 156.0, 95.0, 79.0, 58.0, 36.0, 27.0, 19.0, 15.0, 15.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.671875, -7.42138671875, -7.1708984375, -6.92041015625, -6.669921875, -6.41943359375, -6.1689453125, -5.91845703125, -5.66796875, -5.41748046875, -5.1669921875, -4.91650390625, -4.666015625, -4.41552734375, -4.1650390625, -3.91455078125, -3.6640625, -3.41357421875, -3.1630859375, -2.91259765625, -2.662109375, -2.41162109375, -2.1611328125, -1.91064453125, -1.66015625, -1.40966796875, -1.1591796875, -0.90869140625, -0.658203125, -0.40771484375, -0.1572265625, 0.09326171875, 0.34375, 0.59423828125, 0.8447265625, 1.09521484375, 1.345703125, 1.59619140625, 1.8466796875, 2.09716796875, 2.34765625, 2.59814453125, 2.8486328125, 3.09912109375, 3.349609375, 3.60009765625, 3.8505859375, 4.10107421875, 4.3515625, 4.60205078125, 4.8525390625, 5.10302734375, 5.353515625, 5.60400390625, 5.8544921875, 6.10498046875, 6.35546875, 6.60595703125, 6.8564453125, 7.10693359375, 7.357421875, 7.60791015625, 7.8583984375, 8.10888671875, 8.359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 8.0, 12.0, 16.0, 6.0, 17.0, 21.0, 35.0, 29.0, 42.0, 32.0, 58.0, 46.0, 66.0, 100.0, 218.0, 1511.0, 262.0, 111.0, 79.0, 44.0, 39.0, 42.0, 47.0, 32.0, 31.0, 22.0, 29.0, 24.0, 11.0, 13.0, 10.0, 8.0, 3.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.5771484375, -18.810546875, -18.0439453125, -17.27734375, -16.5107421875, -15.744140625, -14.9775390625, -14.2109375, -13.4443359375, -12.677734375, -11.9111328125, -11.14453125, -10.3779296875, -9.611328125, -8.8447265625, -8.078125, -7.3115234375, -6.544921875, -5.7783203125, -5.01171875, -4.2451171875, -3.478515625, -2.7119140625, -1.9453125, -1.1787109375, -0.412109375, 0.3544921875, 1.12109375, 1.8876953125, 2.654296875, 3.4208984375, 4.1875, 4.9541015625, 5.720703125, 6.4873046875, 7.25390625, 8.0205078125, 8.787109375, 9.5537109375, 10.3203125, 11.0869140625, 11.853515625, 12.6201171875, 13.38671875, 14.1533203125, 14.919921875, 15.6865234375, 16.453125, 17.2197265625, 17.986328125, 18.7529296875, 19.51953125, 20.2861328125, 21.052734375, 21.8193359375, 22.5859375, 23.3525390625, 24.119140625, 24.8857421875, 25.65234375, 26.4189453125, 27.185546875, 27.9521484375, 28.71875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 7.0, 10.0, 8.0, 5.0, 7.0, 10.0, 6.0, 16.0, 18.0, 26.0, 24.0, 27.0, 56.0, 57.0, 57.0, 90.0, 115.0, 149.0, 217.0, 431.0, 871.0, 5157.0, 2892196.0, 242426.0, 2078.0, 592.0, 280.0, 213.0, 119.0, 97.0, 69.0, 55.0, 47.0, 34.0, 22.0, 24.0, 18.0, 17.0, 18.0, 8.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-66.6875, -64.7158203125, -62.744140625, -60.7724609375, -58.80078125, -56.8291015625, -54.857421875, -52.8857421875, -50.9140625, -48.9423828125, -46.970703125, -44.9990234375, -43.02734375, -41.0556640625, -39.083984375, -37.1123046875, -35.140625, -33.1689453125, -31.197265625, -29.2255859375, -27.25390625, -25.2822265625, -23.310546875, -21.3388671875, -19.3671875, -17.3955078125, -15.423828125, -13.4521484375, -11.48046875, -9.5087890625, -7.537109375, -5.5654296875, -3.59375, -1.6220703125, 0.349609375, 2.3212890625, 4.29296875, 6.2646484375, 8.236328125, 10.2080078125, 12.1796875, 14.1513671875, 16.123046875, 18.0947265625, 20.06640625, 22.0380859375, 24.009765625, 25.9814453125, 27.953125, 29.9248046875, 31.896484375, 33.8681640625, 35.83984375, 37.8115234375, 39.783203125, 41.7548828125, 43.7265625, 45.6982421875, 47.669921875, 49.6416015625, 51.61328125, 53.5849609375, 55.556640625, 57.5283203125, 59.5]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [2.0, 2.0, 9.0, 247.0, 676.0, 78.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.267841339111328, -23.244535446166992, -16.221229553222656, -9.197925567626953, -2.174619674682617, 4.848686218261719, 11.871990203857422, 18.89529800415039, 25.918601989746094, 32.9419059753418, 39.965213775634766, 46.98851776123047, 54.01182556152344, 61.03512954711914, 68.05843353271484, 75.08174133300781, 82.10504150390625, 89.12834930419922, 96.15164947509766, 103.17495727539062, 110.1982650756836, 117.22157287597656, 124.244873046875, 131.2681884765625, 138.29148864746094, 145.31478881835938, 152.33810424804688, 159.3614044189453, 166.38470458984375, 173.40802001953125, 180.4313201904297, 187.45462036132812, 194.47792053222656, 201.501220703125, 208.5245361328125, 215.54783630371094, 222.57113647460938, 229.59445190429688, 236.6177520751953, 243.64105224609375, 250.66436767578125, 257.68768310546875, 264.7109680175781, 271.7342834472656, 278.7575988769531, 285.7808837890625, 292.80419921875, 299.8275146484375, 306.8507995605469, 313.8741149902344, 320.89739990234375, 327.92071533203125, 334.94403076171875, 341.9673156738281, 348.9906311035156, 356.0139465332031, 363.0372619628906, 370.0605773925781, 377.0838623046875, 384.107177734375, 391.1304931640625, 398.1537780761719, 405.1770935058594, 412.2004089355469, 419.22369384765625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 4.0, 8.0, 8.0, 6.0, 10.0, 14.0, 17.0, 17.0, 27.0, 20.0, 19.0, 30.0, 28.0, 37.0, 37.0, 35.0, 47.0, 42.0, 50.0, 51.0, 51.0, 39.0, 37.0, 39.0, 44.0, 33.0, 39.0, 28.0, 22.0, 26.0, 22.0, 18.0, 12.0, 10.0, 11.0, 10.0, 11.0, 3.0, 6.0, 3.0, 9.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-65.57060241699219, -63.566627502441406, -61.56265640258789, -59.55868148803711, -57.554710388183594, -55.55073547363281, -53.54676055908203, -51.54278564453125, -49.538814544677734, -47.53483963012695, -45.53086853027344, -43.526893615722656, -41.522918701171875, -39.51894760131836, -37.51497268676758, -35.51100158691406, -33.50702667236328, -31.503053665161133, -29.499080657958984, -27.495105743408203, -25.491132736206055, -23.487159729003906, -21.483184814453125, -19.479211807250977, -17.475238800048828, -15.47126579284668, -13.467291831970215, -11.46331787109375, -9.459344863891602, -7.455371856689453, -5.451397895812988, -3.4474239349365234, -1.4434432983398438, 0.5605301856994629, 2.5645036697387695, 4.568477153778076, 6.572450637817383, 8.576423645019531, 10.580397605895996, 12.584371566772461, 14.58834457397461, 16.592317581176758, 18.596290588378906, 20.600265502929688, 22.604238510131836, 24.608211517333984, 26.612186431884766, 28.616159439086914, 30.620132446289062, 32.624107360839844, 34.62807846069336, 36.63205337524414, 38.636024475097656, 40.63999938964844, 42.64397430419922, 44.64794921875, 46.651920318603516, 48.6558952331543, 50.65986633300781, 52.663841247558594, 54.667816162109375, 56.67178726196289, 58.67576217651367, 60.67973327636719, 62.68370819091797]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 11.0, 16.0, 13.0, 16.0, 16.0, 20.0, 24.0, 27.0, 28.0, 32.0, 42.0, 38.0, 34.0, 27.0, 59.0, 36.0, 37.0, 41.0, 42.0, 53.0, 51.0, 36.0, 42.0, 36.0, 37.0, 33.0, 31.0, 26.0, 16.0, 15.0, 13.0, 12.0, 7.0, 9.0, 7.0, 3.0, 2.0, 8.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3984375, -6.15380859375, -5.9091796875, -5.66455078125, -5.419921875, -5.17529296875, -4.9306640625, -4.68603515625, -4.44140625, -4.19677734375, -3.9521484375, -3.70751953125, -3.462890625, -3.21826171875, -2.9736328125, -2.72900390625, -2.484375, -2.23974609375, -1.9951171875, -1.75048828125, -1.505859375, -1.26123046875, -1.0166015625, -0.77197265625, -0.52734375, -0.28271484375, -0.0380859375, 0.20654296875, 0.451171875, 0.69580078125, 0.9404296875, 1.18505859375, 1.4296875, 1.67431640625, 1.9189453125, 2.16357421875, 2.408203125, 2.65283203125, 2.8974609375, 3.14208984375, 3.38671875, 3.63134765625, 3.8759765625, 4.12060546875, 4.365234375, 4.60986328125, 4.8544921875, 5.09912109375, 5.34375, 5.58837890625, 5.8330078125, 6.07763671875, 6.322265625, 6.56689453125, 6.8115234375, 7.05615234375, 7.30078125, 7.54541015625, 7.7900390625, 8.03466796875, 8.279296875, 8.52392578125, 8.7685546875, 9.01318359375, 9.2578125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 10.0, 15.0, 15.0, 13.0, 29.0, 27.0, 25.0, 23.0, 32.0, 51.0, 56.0, 104.0, 305.0, 1072.0, 9780.0, 867925.0, 3212908.0, 98056.0, 2767.0, 549.0, 172.0, 74.0, 46.0, 34.0, 35.0, 32.0, 20.0, 19.0, 10.0, 23.0, 7.0, 10.0, 4.0, 5.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.598388671875, -20.74365234375, -19.888916015625, -19.0341796875, -18.179443359375, -17.32470703125, -16.469970703125, -15.615234375, -14.760498046875, -13.90576171875, -13.051025390625, -12.1962890625, -11.341552734375, -10.48681640625, -9.632080078125, -8.77734375, -7.922607421875, -7.06787109375, -6.213134765625, -5.3583984375, -4.503662109375, -3.64892578125, -2.794189453125, -1.939453125, -1.084716796875, -0.22998046875, 0.624755859375, 1.4794921875, 2.334228515625, 3.18896484375, 4.043701171875, 4.8984375, 5.753173828125, 6.60791015625, 7.462646484375, 8.3173828125, 9.172119140625, 10.02685546875, 10.881591796875, 11.736328125, 12.591064453125, 13.44580078125, 14.300537109375, 15.1552734375, 16.010009765625, 16.86474609375, 17.719482421875, 18.57421875, 19.428955078125, 20.28369140625, 21.138427734375, 21.9931640625, 22.847900390625, 23.70263671875, 24.557373046875, 25.412109375, 26.266845703125, 27.12158203125, 27.976318359375, 28.8310546875, 29.685791015625, 30.54052734375, 31.395263671875, 32.25]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 8.0, 15.0, 17.0, 33.0, 46.0, 41.0, 83.0, 129.0, 175.0, 246.0, 349.0, 400.0, 477.0, 477.0, 437.0, 301.0, 250.0, 175.0, 127.0, 75.0, 60.0, 52.0, 30.0, 18.0, 9.0, 16.0, 9.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7578125, -14.2474365234375, -13.737060546875, -13.2266845703125, -12.71630859375, -12.2059326171875, -11.695556640625, -11.1851806640625, -10.6748046875, -10.1644287109375, -9.654052734375, -9.1436767578125, -8.63330078125, -8.1229248046875, -7.612548828125, -7.1021728515625, -6.591796875, -6.0814208984375, -5.571044921875, -5.0606689453125, -4.55029296875, -4.0399169921875, -3.529541015625, -3.0191650390625, -2.5087890625, -1.9984130859375, -1.488037109375, -0.9776611328125, -0.46728515625, 0.0430908203125, 0.553466796875, 1.0638427734375, 1.57421875, 2.0845947265625, 2.594970703125, 3.1053466796875, 3.61572265625, 4.1260986328125, 4.636474609375, 5.1468505859375, 5.6572265625, 6.1676025390625, 6.677978515625, 7.1883544921875, 7.69873046875, 8.2091064453125, 8.719482421875, 9.2298583984375, 9.740234375, 10.2506103515625, 10.760986328125, 11.2713623046875, 11.78173828125, 12.2921142578125, 12.802490234375, 13.3128662109375, 13.8232421875, 14.3336181640625, 14.843994140625, 15.3543701171875, 15.86474609375, 16.3751220703125, 16.885498046875, 17.3958740234375, 17.90625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 10.0, 5.0, 14.0, 10.0, 16.0, 22.0, 44.0, 40.0, 60.0, 73.0, 110.0, 158.0, 197.0, 273.0, 411.0, 841.0, 9139.0, 2937801.0, 1238325.0, 4706.0, 711.0, 381.0, 244.0, 194.0, 134.0, 90.0, 99.0, 67.0, 38.0, 21.0, 18.0, 17.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.625, -57.9169921875, -56.208984375, -54.5009765625, -52.79296875, -51.0849609375, -49.376953125, -47.6689453125, -45.9609375, -44.2529296875, -42.544921875, -40.8369140625, -39.12890625, -37.4208984375, -35.712890625, -34.0048828125, -32.296875, -30.5888671875, -28.880859375, -27.1728515625, -25.46484375, -23.7568359375, -22.048828125, -20.3408203125, -18.6328125, -16.9248046875, -15.216796875, -13.5087890625, -11.80078125, -10.0927734375, -8.384765625, -6.6767578125, -4.96875, -3.2607421875, -1.552734375, 0.1552734375, 1.86328125, 3.5712890625, 5.279296875, 6.9873046875, 8.6953125, 10.4033203125, 12.111328125, 13.8193359375, 15.52734375, 17.2353515625, 18.943359375, 20.6513671875, 22.359375, 24.0673828125, 25.775390625, 27.4833984375, 29.19140625, 30.8994140625, 32.607421875, 34.3154296875, 36.0234375, 37.7314453125, 39.439453125, 41.1474609375, 42.85546875, 44.5634765625, 46.271484375, 47.9794921875, 49.6875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 16.0, 82.0, 212.0, 327.0, 251.0, 88.0, 28.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.50189208984375, -133.45700073242188, -128.412109375, -123.3672103881836, -118.32231140136719, -113.27742004394531, -108.23252868652344, -103.18763732910156, -98.14273834228516, -93.09784698486328, -88.05294799804688, -83.008056640625, -77.96316528320312, -72.91826629638672, -67.87337493896484, -62.8284797668457, -57.78358459472656, -52.73868942260742, -47.69379425048828, -42.648902893066406, -37.604007720947266, -32.559112548828125, -27.514219284057617, -22.46932601928711, -17.42443084716797, -12.379536628723145, -7.33464241027832, -2.289748191833496, 2.755146026611328, 7.800041198730469, 12.844934463500977, 17.889827728271484, 22.934738159179688, 27.979633331298828, 33.02452850341797, 38.069419860839844, 43.114315032958984, 48.159210205078125, 53.2041015625, 58.24899673461914, 63.29389190673828, 68.33878326416016, 73.38368225097656, 78.42857360839844, 83.47346496582031, 88.51836395263672, 93.5632553100586, 98.608154296875, 103.65304565429688, 108.69793701171875, 113.74283599853516, 118.78772735595703, 123.83262634277344, 128.8775177001953, 133.9224090576172, 138.96730041503906, 144.01220703125, 149.05709838867188, 154.10198974609375, 159.1468963623047, 164.19178771972656, 169.23667907714844, 174.2815704345703, 179.3264617919922, 184.37135314941406]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 4.0, 10.0, 9.0, 13.0, 13.0, 11.0, 18.0, 20.0, 23.0, 31.0, 31.0, 31.0, 41.0, 39.0, 43.0, 36.0, 32.0, 34.0, 34.0, 51.0, 44.0, 46.0, 34.0, 31.0, 41.0, 36.0, 34.0, 30.0, 24.0, 32.0, 19.0, 18.0, 8.0, 10.0, 14.0, 8.0, 9.0, 11.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.45903396606445, -40.982994079589844, -39.506954193115234, -38.030914306640625, -36.554874420166016, -35.078834533691406, -33.6027946472168, -32.12675476074219, -30.650714874267578, -29.17467498779297, -27.69863510131836, -26.22259521484375, -24.74655532836914, -23.27051544189453, -21.794475555419922, -20.318435668945312, -18.842395782470703, -17.366355895996094, -15.890316009521484, -14.414276123046875, -12.938236236572266, -11.462196350097656, -9.986156463623047, -8.510116577148438, -7.034076690673828, -5.558036804199219, -4.081996917724609, -2.60595703125, -1.1299171447753906, 0.34612274169921875, 1.8221626281738281, 3.2982025146484375, 4.774238586425781, 6.250278472900391, 7.726318359375, 9.20235824584961, 10.678398132324219, 12.154438018798828, 13.630477905273438, 15.106517791748047, 16.582557678222656, 18.058597564697266, 19.534637451171875, 21.010677337646484, 22.486717224121094, 23.962757110595703, 25.438796997070312, 26.914836883544922, 28.39087677001953, 29.86691665649414, 31.34295654296875, 32.81899642944336, 34.29503631591797, 35.77107620239258, 37.24711608886719, 38.7231559753418, 40.199195861816406, 41.675235748291016, 43.151275634765625, 44.627315521240234, 46.103355407714844, 47.57939529418945, 49.05543518066406, 50.53147506713867, 52.00751495361328]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 8.0, 9.0, 15.0, 18.0, 18.0, 22.0, 24.0, 28.0, 34.0, 37.0, 32.0, 48.0, 49.0, 47.0, 44.0, 38.0, 49.0, 47.0, 50.0, 46.0, 48.0, 46.0, 44.0, 36.0, 46.0, 19.0, 23.0, 11.0, 15.0, 9.0, 5.0, 10.0, 8.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.63348388671875, -6.3802490234375, -6.12701416015625, -5.873779296875, -5.62054443359375, -5.3673095703125, -5.11407470703125, -4.86083984375, -4.60760498046875, -4.3543701171875, -4.10113525390625, -3.847900390625, -3.59466552734375, -3.3414306640625, -3.08819580078125, -2.8349609375, -2.58172607421875, -2.3284912109375, -2.07525634765625, -1.822021484375, -1.56878662109375, -1.3155517578125, -1.06231689453125, -0.80908203125, -0.55584716796875, -0.3026123046875, -0.04937744140625, 0.203857421875, 0.45709228515625, 0.7103271484375, 0.96356201171875, 1.216796875, 1.47003173828125, 1.7232666015625, 1.97650146484375, 2.229736328125, 2.48297119140625, 2.7362060546875, 2.98944091796875, 3.24267578125, 3.49591064453125, 3.7491455078125, 4.00238037109375, 4.255615234375, 4.50885009765625, 4.7620849609375, 5.01531982421875, 5.2685546875, 5.52178955078125, 5.7750244140625, 6.02825927734375, 6.281494140625, 6.53472900390625, 6.7879638671875, 7.04119873046875, 7.29443359375, 7.54766845703125, 7.8009033203125, 8.05413818359375, 8.307373046875, 8.56060791015625, 8.8138427734375, 9.06707763671875, 9.3203125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 10.0, 20.0, 21.0, 34.0, 36.0, 59.0, 109.0, 151.0, 268.0, 462.0, 719.0, 1268.0, 2042.0, 3432.0, 5627.0, 9790.0, 17474.0, 31014.0, 56774.0, 110017.0, 269530.0, 293614.0, 113678.0, 58391.0, 31644.0, 17602.0, 10249.0, 5819.0, 3477.0, 2033.0, 1183.0, 775.0, 439.0, 301.0, 177.0, 109.0, 67.0, 42.0, 33.0, 18.0, 12.0, 11.0, 3.0, 7.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.43359375, -2.359893798828125, -2.28619384765625, -2.212493896484375, -2.1387939453125, -2.065093994140625, -1.99139404296875, -1.917694091796875, -1.843994140625, -1.770294189453125, -1.69659423828125, -1.622894287109375, -1.5491943359375, -1.475494384765625, -1.40179443359375, -1.328094482421875, -1.25439453125, -1.180694580078125, -1.10699462890625, -1.033294677734375, -0.9595947265625, -0.885894775390625, -0.81219482421875, -0.738494873046875, -0.664794921875, -0.591094970703125, -0.51739501953125, -0.443695068359375, -0.3699951171875, -0.296295166015625, -0.22259521484375, -0.148895263671875, -0.0751953125, -0.001495361328125, 0.07220458984375, 0.145904541015625, 0.2196044921875, 0.293304443359375, 0.36700439453125, 0.440704345703125, 0.514404296875, 0.588104248046875, 0.66180419921875, 0.735504150390625, 0.8092041015625, 0.882904052734375, 0.95660400390625, 1.030303955078125, 1.10400390625, 1.177703857421875, 1.25140380859375, 1.325103759765625, 1.3988037109375, 1.472503662109375, 1.54620361328125, 1.619903564453125, 1.693603515625, 1.767303466796875, 1.84100341796875, 1.914703369140625, 1.9884033203125, 2.062103271484375, 2.13580322265625, 2.209503173828125, 2.283203125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 4.0, 7.0, 6.0, 9.0, 6.0, 11.0, 11.0, 12.0, 12.0, 19.0, 30.0, 21.0, 27.0, 29.0, 39.0, 28.0, 41.0, 34.0, 38.0, 48.0, 41.0, 1069.0, 38.0, 51.0, 58.0, 34.0, 36.0, 25.0, 36.0, 38.0, 26.0, 34.0, 29.0, 17.0, 14.0, 10.0, 11.0, 7.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.3984375, -5.252838134765625, -5.10723876953125, -4.961639404296875, -4.8160400390625, -4.670440673828125, -4.52484130859375, -4.379241943359375, -4.233642578125, -4.088043212890625, -3.94244384765625, -3.796844482421875, -3.6512451171875, -3.505645751953125, -3.36004638671875, -3.214447021484375, -3.06884765625, -2.923248291015625, -2.77764892578125, -2.632049560546875, -2.4864501953125, -2.340850830078125, -2.19525146484375, -2.049652099609375, -1.904052734375, -1.758453369140625, -1.61285400390625, -1.467254638671875, -1.3216552734375, -1.176055908203125, -1.03045654296875, -0.884857177734375, -0.7392578125, -0.593658447265625, -0.44805908203125, -0.302459716796875, -0.1568603515625, -0.011260986328125, 0.13433837890625, 0.279937744140625, 0.425537109375, 0.571136474609375, 0.71673583984375, 0.862335205078125, 1.0079345703125, 1.153533935546875, 1.29913330078125, 1.444732666015625, 1.59033203125, 1.735931396484375, 1.88153076171875, 2.027130126953125, 2.1727294921875, 2.318328857421875, 2.46392822265625, 2.609527587890625, 2.755126953125, 2.900726318359375, 3.04632568359375, 3.191925048828125, 3.3375244140625, 3.483123779296875, 3.62872314453125, 3.774322509765625, 3.919921875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 8.0, 6.0, 11.0, 21.0, 30.0, 55.0, 70.0, 108.0, 169.0, 300.0, 487.0, 678.0, 1091.0, 1710.0, 2648.0, 4064.0, 6510.0, 10539.0, 17391.0, 27787.0, 46845.0, 79047.0, 147418.0, 1393688.0, 151940.0, 81515.0, 48024.0, 28516.0, 17450.0, 10832.0, 6533.0, 4100.0, 2623.0, 1718.0, 1140.0, 746.0, 447.0, 298.0, 210.0, 136.0, 86.0, 38.0, 33.0, 29.0, 12.0, 17.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.0234375, -1.96307373046875, -1.9027099609375, -1.84234619140625, -1.781982421875, -1.72161865234375, -1.6612548828125, -1.60089111328125, -1.54052734375, -1.48016357421875, -1.4197998046875, -1.35943603515625, -1.299072265625, -1.23870849609375, -1.1783447265625, -1.11798095703125, -1.0576171875, -0.99725341796875, -0.9368896484375, -0.87652587890625, -0.816162109375, -0.75579833984375, -0.6954345703125, -0.63507080078125, -0.57470703125, -0.51434326171875, -0.4539794921875, -0.39361572265625, -0.333251953125, -0.27288818359375, -0.2125244140625, -0.15216064453125, -0.091796875, -0.03143310546875, 0.0289306640625, 0.08929443359375, 0.149658203125, 0.21002197265625, 0.2703857421875, 0.33074951171875, 0.39111328125, 0.45147705078125, 0.5118408203125, 0.57220458984375, 0.632568359375, 0.69293212890625, 0.7532958984375, 0.81365966796875, 0.8740234375, 0.93438720703125, 0.9947509765625, 1.05511474609375, 1.115478515625, 1.17584228515625, 1.2362060546875, 1.29656982421875, 1.35693359375, 1.41729736328125, 1.4776611328125, 1.53802490234375, 1.598388671875, 1.65875244140625, 1.7191162109375, 1.77947998046875, 1.83984375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 6.0, 7.0, 6.0, 5.0, 6.0, 13.0, 7.0, 9.0, 11.0, 11.0, 10.0, 23.0, 21.0, 30.0, 37.0, 32.0, 43.0, 59.0, 63.0, 71.0, 66.0, 63.0, 45.0, 54.0, 36.0, 54.0, 26.0, 28.0, 29.0, 18.0, 19.0, 17.0, 14.0, 16.0, 7.0, 4.0, 7.0, 3.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0002315044403076172, -0.0002239122986793518, -0.00021632015705108643, -0.00020872801542282104, -0.00020113587379455566, -0.00019354373216629028, -0.0001859515905380249, -0.00017835944890975952, -0.00017076730728149414, -0.00016317516565322876, -0.00015558302402496338, -0.000147990882396698, -0.00014039874076843262, -0.00013280659914016724, -0.00012521445751190186, -0.00011762231588363647, -0.0001100301742553711, -0.00010243803262710571, -9.484589099884033e-05, -8.725374937057495e-05, -7.966160774230957e-05, -7.206946611404419e-05, -6.447732448577881e-05, -5.688518285751343e-05, -4.929304122924805e-05, -4.1700899600982666e-05, -3.4108757972717285e-05, -2.6516616344451904e-05, -1.8924474716186523e-05, -1.1332333087921143e-05, -3.7401914596557617e-06, 3.851950168609619e-06, 1.1444091796875e-05, 1.903623342514038e-05, 2.6628375053405762e-05, 3.422051668167114e-05, 4.1812658309936523e-05, 4.9404799938201904e-05, 5.6996941566467285e-05, 6.458908319473267e-05, 7.218122482299805e-05, 7.977336645126343e-05, 8.736550807952881e-05, 9.495764970779419e-05, 0.00010254979133605957, 0.00011014193296432495, 0.00011773407459259033, 0.0001253262162208557, 0.0001329183578491211, 0.00014051049947738647, 0.00014810264110565186, 0.00015569478273391724, 0.00016328692436218262, 0.000170879065990448, 0.00017847120761871338, 0.00018606334924697876, 0.00019365549087524414, 0.00020124763250350952, 0.0002088397741317749, 0.00021643191576004028, 0.00022402405738830566, 0.00023161619901657104, 0.00023920834064483643, 0.0002468004822731018, 0.0002543926239013672]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 4.0, 7.0, 10.0, 9.0, 16.0, 17.0, 20.0, 30.0, 41.0, 57.0, 63.0, 117.0, 138.0, 291.0, 600.0, 2561.0, 917550.0, 124617.0, 1196.0, 504.0, 229.0, 131.0, 68.0, 51.0, 48.0, 25.0, 24.0, 19.0, 13.0, 17.0, 15.0, 8.0, 13.0, 2.0, 3.0, 10.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.005825042724609375, -0.0056528449058532715, -0.005480647087097168, -0.0053084492683410645, -0.005136251449584961, -0.004964053630828857, -0.004791855812072754, -0.00461965799331665, -0.004447460174560547, -0.004275262355804443, -0.00410306453704834, -0.003930866718292236, -0.003758668899536133, -0.0035864710807800293, -0.0034142732620239258, -0.0032420754432678223, -0.0030698776245117188, -0.0028976798057556152, -0.0027254819869995117, -0.002553284168243408, -0.0023810863494873047, -0.002208888530731201, -0.0020366907119750977, -0.0018644928932189941, -0.0016922950744628906, -0.0015200972557067871, -0.0013478994369506836, -0.00117570161819458, -0.0010035037994384766, -0.000831305980682373, -0.0006591081619262695, -0.000486910343170166, -0.0003147125244140625, -0.00014251470565795898, 2.968311309814453e-05, 0.00020188093185424805, 0.00037407875061035156, 0.0005462765693664551, 0.0007184743881225586, 0.0008906722068786621, 0.0010628700256347656, 0.0012350678443908691, 0.0014072656631469727, 0.0015794634819030762, 0.0017516613006591797, 0.0019238591194152832, 0.0020960569381713867, 0.0022682547569274902, 0.0024404525756835938, 0.0026126503944396973, 0.0027848482131958008, 0.0029570460319519043, 0.003129243850708008, 0.0033014416694641113, 0.003473639488220215, 0.0036458373069763184, 0.003818035125732422, 0.003990232944488525, 0.004162430763244629, 0.004334628582000732, 0.004506826400756836, 0.0046790242195129395, 0.004851222038269043, 0.0050234198570251465, 0.00519561767578125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 8.0, 72.0, 301.0, 412.0, 175.0, 43.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002528906334191561, -0.00023235274420585483, -0.0002118148549925536, -0.00019127698033116758, -0.0001707390765659511, -0.0001502012019045651, -0.00012966331269126385, -0.00010912542347796261, -8.858753426466137e-05, -6.804964505136013e-05, -4.7511759476037696e-05, -2.6973873900715262e-05, -6.43598468741402e-06, 1.4101904525887221e-05, 3.463978646323085e-05, 5.517767567653209e-05, 7.571556488983333e-05, 9.625345410313457e-05, 0.00011679134331643581, 0.00013732921797782183, 0.0001578671217430383, 0.0001784049964044243, 0.00019894288561772555, 0.0002194807748310268, 0.00024001866404432803, 0.0002605565532576293, 0.0002810944279190153, 0.00030163233168423176, 0.00032217020634561777, 0.00034270811011083424, 0.00036324598477222025, 0.0003837838885374367, 0.00040432176319882274, 0.00042485963786020875, 0.0004453975416254252, 0.00046593541628681123, 0.0004864733200520277, 0.0005070111947134137, 0.0005275490693747997, 0.0005480869440361857, 0.0005686248769052327, 0.0005891627515666187, 0.0006097006262280047, 0.0006302385590970516, 0.0006507764337584376, 0.0006713143084198236, 0.0006918521830812097, 0.0007123900577425957, 0.0007329279324039817, 0.0007534658070653677, 0.0007740036817267537, 0.0007945416145958006, 0.0008150794892571867, 0.0008356173639185727, 0.0008561552385799587, 0.0008766931714490056, 0.0008972310461103916, 0.0009177689207717776, 0.0009383067954331636, 0.0009588447283022106, 0.0009793825447559357, 0.0009999205358326435, 0.0010204584104940295, 0.0010409962851554155, 0.0010615341598168015]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 6.0, 7.0, 9.0, 11.0, 13.0, 17.0, 22.0, 27.0, 35.0, 34.0, 35.0, 38.0, 31.0, 35.0, 43.0, 50.0, 51.0, 42.0, 32.0, 43.0, 53.0, 41.0, 35.0, 42.0, 34.0, 30.0, 36.0, 19.0, 13.0, 23.0, 22.0, 9.0, 6.0, 13.0, 8.0, 5.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.00015360116958618164, -0.00014895573258399963, -0.00014431029558181763, -0.00013966485857963562, -0.0001350194215774536, -0.0001303739845752716, -0.0001257285475730896, -0.00012108311057090759, -0.00011643767356872559, -0.00011179223656654358, -0.00010714679956436157, -0.00010250136256217957, -9.785592555999756e-05, -9.321048855781555e-05, -8.856505155563354e-05, -8.391961455345154e-05, -7.927417755126953e-05, -7.462874054908752e-05, -6.998330354690552e-05, -6.533786654472351e-05, -6.0692429542541504e-05, -5.60469925403595e-05, -5.140155553817749e-05, -4.6756118535995483e-05, -4.2110681533813477e-05, -3.746524453163147e-05, -3.281980752944946e-05, -2.8174370527267456e-05, -2.352893352508545e-05, -1.8883496522903442e-05, -1.4238059520721436e-05, -9.592622518539429e-06, -4.947185516357422e-06, -3.0174851417541504e-07, 4.343688488006592e-06, 8.989125490188599e-06, 1.3634562492370605e-05, 1.8279999494552612e-05, 2.292543649673462e-05, 2.7570873498916626e-05, 3.221631050109863e-05, 3.686174750328064e-05, 4.1507184505462646e-05, 4.615262150764465e-05, 5.079805850982666e-05, 5.544349551200867e-05, 6.0088932514190674e-05, 6.473436951637268e-05, 6.937980651855469e-05, 7.40252435207367e-05, 7.86706805229187e-05, 8.331611752510071e-05, 8.796155452728271e-05, 9.260699152946472e-05, 9.725242853164673e-05, 0.00010189786553382874, 0.00010654330253601074, 0.00011118873953819275, 0.00011583417654037476, 0.00012047961354255676, 0.00012512505054473877, 0.00012977048754692078, 0.00013441592454910278, 0.0001390613615512848, 0.0001437067985534668]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 8.0, 9.0, 15.0, 18.0, 18.0, 22.0, 24.0, 28.0, 34.0, 37.0, 32.0, 48.0, 49.0, 47.0, 44.0, 38.0, 49.0, 47.0, 50.0, 46.0, 48.0, 46.0, 44.0, 36.0, 46.0, 19.0, 23.0, 11.0, 15.0, 9.0, 5.0, 10.0, 8.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.63348388671875, -6.3802490234375, -6.12701416015625, -5.873779296875, -5.62054443359375, -5.3673095703125, -5.11407470703125, -4.86083984375, -4.60760498046875, -4.3543701171875, -4.10113525390625, -3.847900390625, -3.59466552734375, -3.3414306640625, -3.08819580078125, -2.8349609375, -2.58172607421875, -2.3284912109375, -2.07525634765625, -1.822021484375, -1.56878662109375, -1.3155517578125, -1.06231689453125, -0.80908203125, -0.55584716796875, -0.3026123046875, -0.04937744140625, 0.203857421875, 0.45709228515625, 0.7103271484375, 0.96356201171875, 1.216796875, 1.47003173828125, 1.7232666015625, 1.97650146484375, 2.229736328125, 2.48297119140625, 2.7362060546875, 2.98944091796875, 3.24267578125, 3.49591064453125, 3.7491455078125, 4.00238037109375, 4.255615234375, 4.50885009765625, 4.7620849609375, 5.01531982421875, 5.2685546875, 5.52178955078125, 5.7750244140625, 6.02825927734375, 6.281494140625, 6.53472900390625, 6.7879638671875, 7.04119873046875, 7.29443359375, 7.54766845703125, 7.8009033203125, 8.05413818359375, 8.307373046875, 8.56060791015625, 8.8138427734375, 9.06707763671875, 9.3203125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 22.0, 30.0, 39.0, 67.0, 101.0, 124.0, 219.0, 260.0, 471.0, 722.0, 1266.0, 2471.0, 4941.0, 10602.0, 24928.0, 62987.0, 158112.0, 336914.0, 261209.0, 107492.0, 42472.0, 17372.0, 7566.0, 3566.0, 1842.0, 1018.0, 597.0, 362.0, 257.0, 150.0, 99.0, 73.0, 49.0, 34.0, 23.0, 15.0, 17.0, 12.0, 5.0, 5.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.90234375, -5.69732666015625, -5.4923095703125, -5.28729248046875, -5.082275390625, -4.87725830078125, -4.6722412109375, -4.46722412109375, -4.26220703125, -4.05718994140625, -3.8521728515625, -3.64715576171875, -3.442138671875, -3.23712158203125, -3.0321044921875, -2.82708740234375, -2.6220703125, -2.41705322265625, -2.2120361328125, -2.00701904296875, -1.802001953125, -1.59698486328125, -1.3919677734375, -1.18695068359375, -0.98193359375, -0.77691650390625, -0.5718994140625, -0.36688232421875, -0.161865234375, 0.04315185546875, 0.2481689453125, 0.45318603515625, 0.658203125, 0.86322021484375, 1.0682373046875, 1.27325439453125, 1.478271484375, 1.68328857421875, 1.8883056640625, 2.09332275390625, 2.29833984375, 2.50335693359375, 2.7083740234375, 2.91339111328125, 3.118408203125, 3.32342529296875, 3.5284423828125, 3.73345947265625, 3.9384765625, 4.14349365234375, 4.3485107421875, 4.55352783203125, 4.758544921875, 4.96356201171875, 5.1685791015625, 5.37359619140625, 5.57861328125, 5.78363037109375, 5.9886474609375, 6.19366455078125, 6.398681640625, 6.60369873046875, 6.8087158203125, 7.01373291015625, 7.21875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 10.0, 4.0, 16.0, 8.0, 14.0, 31.0, 18.0, 24.0, 28.0, 22.0, 30.0, 31.0, 46.0, 40.0, 66.0, 88.0, 191.0, 1486.0, 327.0, 115.0, 69.0, 66.0, 36.0, 37.0, 39.0, 36.0, 25.0, 27.0, 16.0, 21.0, 11.0, 13.0, 13.0, 12.0, 12.0, 4.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.609375, -24.8505859375, -24.091796875, -23.3330078125, -22.57421875, -21.8154296875, -21.056640625, -20.2978515625, -19.5390625, -18.7802734375, -18.021484375, -17.2626953125, -16.50390625, -15.7451171875, -14.986328125, -14.2275390625, -13.46875, -12.7099609375, -11.951171875, -11.1923828125, -10.43359375, -9.6748046875, -8.916015625, -8.1572265625, -7.3984375, -6.6396484375, -5.880859375, -5.1220703125, -4.36328125, -3.6044921875, -2.845703125, -2.0869140625, -1.328125, -0.5693359375, 0.189453125, 0.9482421875, 1.70703125, 2.4658203125, 3.224609375, 3.9833984375, 4.7421875, 5.5009765625, 6.259765625, 7.0185546875, 7.77734375, 8.5361328125, 9.294921875, 10.0537109375, 10.8125, 11.5712890625, 12.330078125, 13.0888671875, 13.84765625, 14.6064453125, 15.365234375, 16.1240234375, 16.8828125, 17.6416015625, 18.400390625, 19.1591796875, 19.91796875, 20.6767578125, 21.435546875, 22.1943359375, 22.953125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 7.0, 11.0, 10.0, 13.0, 12.0, 12.0, 20.0, 39.0, 64.0, 70.0, 148.0, 206.0, 396.0, 1031.0, 225852.0, 2915266.0, 1393.0, 470.0, 218.0, 161.0, 95.0, 60.0, 35.0, 34.0, 15.0, 11.0, 11.0, 12.0, 7.0, 6.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.875, -117.22265625, -113.5703125, -109.91796875, -106.265625, -102.61328125, -98.9609375, -95.30859375, -91.65625, -88.00390625, -84.3515625, -80.69921875, -77.046875, -73.39453125, -69.7421875, -66.08984375, -62.4375, -58.78515625, -55.1328125, -51.48046875, -47.828125, -44.17578125, -40.5234375, -36.87109375, -33.21875, -29.56640625, -25.9140625, -22.26171875, -18.609375, -14.95703125, -11.3046875, -7.65234375, -4.0, -0.34765625, 3.3046875, 6.95703125, 10.609375, 14.26171875, 17.9140625, 21.56640625, 25.21875, 28.87109375, 32.5234375, 36.17578125, 39.828125, 43.48046875, 47.1328125, 50.78515625, 54.4375, 58.08984375, 61.7421875, 65.39453125, 69.046875, 72.69921875, 76.3515625, 80.00390625, 83.65625, 87.30859375, 90.9609375, 94.61328125, 98.265625, 101.91796875, 105.5703125, 109.22265625, 112.875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 13.0, 18.0, 25.0, 64.0, 112.0, 167.0, 144.0, 165.0, 128.0, 83.0, 51.0, 19.0, 10.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-45.60902404785156, -44.368011474609375, -43.12699508666992, -41.885982513427734, -40.64496612548828, -39.403953552246094, -38.16293716430664, -36.92192459106445, -35.680908203125, -34.43989562988281, -33.19887924194336, -31.95786476135254, -30.71685028076172, -29.47583770751953, -28.23482322692871, -26.99380874633789, -25.752796173095703, -24.511781692504883, -23.270767211914062, -22.029752731323242, -20.788738250732422, -19.547725677490234, -18.306711196899414, -17.065696716308594, -15.824682235717773, -14.583667755126953, -13.342653274536133, -12.101639747619629, -10.860625267028809, -9.619610786437988, -8.378597259521484, -7.137582778930664, -5.896568298339844, -4.655553817749023, -3.4145398139953613, -2.17352557182312, -0.9325113296508789, 0.3085031509399414, 1.5495171546936035, 2.7905311584472656, 4.031545639038086, 5.272560119628906, 6.513574123382568, 7.7545881271362305, 8.99560260772705, 10.236617088317871, 11.477630615234375, 12.718645095825195, 13.959659576416016, 15.200674057006836, 16.441688537597656, 17.682703018188477, 18.923717498779297, 20.164730072021484, 21.405744552612305, 22.646759033203125, 23.887773513793945, 25.128787994384766, 26.369802474975586, 27.610816955566406, 28.851829528808594, 30.092845916748047, 31.333858489990234, 32.57487487792969, 33.815887451171875]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 7.0, 11.0, 10.0, 10.0, 16.0, 21.0, 19.0, 17.0, 32.0, 30.0, 39.0, 27.0, 35.0, 34.0, 31.0, 40.0, 42.0, 44.0, 44.0, 51.0, 44.0, 38.0, 40.0, 34.0, 25.0, 37.0, 29.0, 31.0, 24.0, 15.0, 14.0, 20.0, 12.0, 9.0, 12.0, 10.0, 6.0, 8.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-61.82469177246094, -60.10287094116211, -58.38105010986328, -56.65922927856445, -54.937408447265625, -53.2155876159668, -51.49376678466797, -49.77194595336914, -48.05012512207031, -46.328304290771484, -44.606483459472656, -42.88466262817383, -41.162841796875, -39.44102096557617, -37.719200134277344, -35.997379302978516, -34.27555847167969, -32.55373764038086, -30.83191680908203, -29.110095977783203, -27.388275146484375, -25.666454315185547, -23.94463348388672, -22.22281265258789, -20.500991821289062, -18.779170989990234, -17.057350158691406, -15.335529327392578, -13.61370849609375, -11.891887664794922, -10.170066833496094, -8.448246002197266, -6.7264251708984375, -5.004604339599609, -3.2827835083007812, -1.5609626770019531, 0.160858154296875, 1.8826789855957031, 3.6044998168945312, 5.326320648193359, 7.0481414794921875, 8.769962310791016, 10.491783142089844, 12.213603973388672, 13.9354248046875, 15.657245635986328, 17.379066467285156, 19.100887298583984, 20.822708129882812, 22.54452896118164, 24.26634979248047, 25.988170623779297, 27.709991455078125, 29.431812286376953, 31.15363311767578, 32.87545394897461, 34.59727478027344, 36.319095611572266, 38.040916442871094, 39.76273727416992, 41.48455810546875, 43.20637893676758, 44.928199768066406, 46.650020599365234, 48.37184143066406]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 6.0, 8.0, 7.0, 14.0, 19.0, 14.0, 21.0, 25.0, 33.0, 28.0, 31.0, 36.0, 35.0, 37.0, 48.0, 59.0, 50.0, 43.0, 51.0, 48.0, 53.0, 31.0, 49.0, 55.0, 27.0, 29.0, 33.0, 18.0, 27.0, 17.0, 9.0, 10.0, 6.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.96875, -6.6956787109375, -6.422607421875, -6.1495361328125, -5.87646484375, -5.6033935546875, -5.330322265625, -5.0572509765625, -4.7841796875, -4.5111083984375, -4.238037109375, -3.9649658203125, -3.69189453125, -3.4188232421875, -3.145751953125, -2.8726806640625, -2.599609375, -2.3265380859375, -2.053466796875, -1.7803955078125, -1.50732421875, -1.2342529296875, -0.961181640625, -0.6881103515625, -0.4150390625, -0.1419677734375, 0.131103515625, 0.4041748046875, 0.67724609375, 0.9503173828125, 1.223388671875, 1.4964599609375, 1.76953125, 2.0426025390625, 2.315673828125, 2.5887451171875, 2.86181640625, 3.1348876953125, 3.407958984375, 3.6810302734375, 3.9541015625, 4.2271728515625, 4.500244140625, 4.7733154296875, 5.04638671875, 5.3194580078125, 5.592529296875, 5.8656005859375, 6.138671875, 6.4117431640625, 6.684814453125, 6.9578857421875, 7.23095703125, 7.5040283203125, 7.777099609375, 8.0501708984375, 8.3232421875, 8.5963134765625, 8.869384765625, 9.1424560546875, 9.41552734375, 9.6885986328125, 9.961669921875, 10.2347412109375, 10.5078125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 8.0, 9.0, 9.0, 15.0, 25.0, 22.0, 31.0, 30.0, 49.0, 66.0, 111.0, 181.0, 345.0, 1046.0, 6755.0, 202262.0, 2745769.0, 1198917.0, 35121.0, 2272.0, 530.0, 264.0, 126.0, 80.0, 47.0, 40.0, 36.0, 31.0, 16.0, 17.0, 12.0, 5.0, 7.0, 6.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.828125, -17.162109375, -16.49609375, -15.830078125, -15.1640625, -14.498046875, -13.83203125, -13.166015625, -12.5, -11.833984375, -11.16796875, -10.501953125, -9.8359375, -9.169921875, -8.50390625, -7.837890625, -7.171875, -6.505859375, -5.83984375, -5.173828125, -4.5078125, -3.841796875, -3.17578125, -2.509765625, -1.84375, -1.177734375, -0.51171875, 0.154296875, 0.8203125, 1.486328125, 2.15234375, 2.818359375, 3.484375, 4.150390625, 4.81640625, 5.482421875, 6.1484375, 6.814453125, 7.48046875, 8.146484375, 8.8125, 9.478515625, 10.14453125, 10.810546875, 11.4765625, 12.142578125, 12.80859375, 13.474609375, 14.140625, 14.806640625, 15.47265625, 16.138671875, 16.8046875, 17.470703125, 18.13671875, 18.802734375, 19.46875, 20.134765625, 20.80078125, 21.466796875, 22.1328125, 22.798828125, 23.46484375, 24.130859375, 24.796875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 2.0, 6.0, 8.0, 8.0, 18.0, 22.0, 32.0, 29.0, 48.0, 85.0, 110.0, 160.0, 179.0, 235.0, 303.0, 386.0, 425.0, 426.0, 370.0, 309.0, 235.0, 195.0, 133.0, 94.0, 70.0, 46.0, 31.0, 26.0, 26.0, 16.0, 11.0, 5.0, 3.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.8828125, -15.4410400390625, -14.999267578125, -14.5574951171875, -14.11572265625, -13.6739501953125, -13.232177734375, -12.7904052734375, -12.3486328125, -11.9068603515625, -11.465087890625, -11.0233154296875, -10.58154296875, -10.1397705078125, -9.697998046875, -9.2562255859375, -8.814453125, -8.3726806640625, -7.930908203125, -7.4891357421875, -7.04736328125, -6.6055908203125, -6.163818359375, -5.7220458984375, -5.2802734375, -4.8385009765625, -4.396728515625, -3.9549560546875, -3.51318359375, -3.0714111328125, -2.629638671875, -2.1878662109375, -1.74609375, -1.3043212890625, -0.862548828125, -0.4207763671875, 0.02099609375, 0.4627685546875, 0.904541015625, 1.3463134765625, 1.7880859375, 2.2298583984375, 2.671630859375, 3.1134033203125, 3.55517578125, 3.9969482421875, 4.438720703125, 4.8804931640625, 5.322265625, 5.7640380859375, 6.205810546875, 6.6475830078125, 7.08935546875, 7.5311279296875, 7.972900390625, 8.4146728515625, 8.8564453125, 9.2982177734375, 9.739990234375, 10.1817626953125, 10.62353515625, 11.0653076171875, 11.507080078125, 11.9488525390625, 12.390625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 5.0, 10.0, 7.0, 5.0, 11.0, 15.0, 27.0, 34.0, 38.0, 45.0, 58.0, 87.0, 118.0, 136.0, 187.0, 270.0, 403.0, 616.0, 2841.0, 330581.0, 3812032.0, 43660.0, 1251.0, 521.0, 307.0, 257.0, 194.0, 129.0, 109.0, 87.0, 43.0, 52.0, 30.0, 27.0, 26.0, 17.0, 12.0, 10.0, 3.0, 6.0, 11.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.625, -41.1201171875, -39.615234375, -38.1103515625, -36.60546875, -35.1005859375, -33.595703125, -32.0908203125, -30.5859375, -29.0810546875, -27.576171875, -26.0712890625, -24.56640625, -23.0615234375, -21.556640625, -20.0517578125, -18.546875, -17.0419921875, -15.537109375, -14.0322265625, -12.52734375, -11.0224609375, -9.517578125, -8.0126953125, -6.5078125, -5.0029296875, -3.498046875, -1.9931640625, -0.48828125, 1.0166015625, 2.521484375, 4.0263671875, 5.53125, 7.0361328125, 8.541015625, 10.0458984375, 11.55078125, 13.0556640625, 14.560546875, 16.0654296875, 17.5703125, 19.0751953125, 20.580078125, 22.0849609375, 23.58984375, 25.0947265625, 26.599609375, 28.1044921875, 29.609375, 31.1142578125, 32.619140625, 34.1240234375, 35.62890625, 37.1337890625, 38.638671875, 40.1435546875, 41.6484375, 43.1533203125, 44.658203125, 46.1630859375, 47.66796875, 49.1728515625, 50.677734375, 52.1826171875, 53.6875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 10.0, 10.0, 34.0, 42.0, 50.0, 69.0, 128.0, 113.0, 114.0, 131.0, 113.0, 76.0, 50.0, 24.0, 25.0, 13.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.03345489501953, -64.05902099609375, -62.0845947265625, -60.110164642333984, -58.13573455810547, -56.16130065917969, -54.18687438964844, -52.212440490722656, -50.23801040649414, -48.263580322265625, -46.28915023803711, -44.314720153808594, -42.34029006958008, -40.36585998535156, -38.39142608642578, -36.416996002197266, -34.44256591796875, -32.468135833740234, -30.49370574951172, -28.519275665283203, -26.544843673706055, -24.57041358947754, -22.595983505249023, -20.621551513671875, -18.647125244140625, -16.67269515991211, -14.698264122009277, -12.723834037780762, -10.74940299987793, -8.774972915649414, -6.800542831420898, -4.826111793518066, -2.8516807556152344, -0.8772503137588501, 1.0971801280975342, 3.071610450744629, 5.046041011810303, 7.020471572875977, 8.994901657104492, 10.969332695007324, 12.94376277923584, 14.918192863464355, 16.892623901367188, 18.867053985595703, 20.84148406982422, 22.815914154052734, 24.79034423828125, 26.7647762298584, 28.739206314086914, 30.71363639831543, 32.68806838989258, 34.662498474121094, 36.63692855834961, 38.611358642578125, 40.58578872680664, 42.560218811035156, 44.53464889526367, 46.50907897949219, 48.4835090637207, 50.45793914794922, 52.432369232177734, 54.40679931640625, 56.38123321533203, 58.35566329956055, 60.33009338378906]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 8.0, 5.0, 9.0, 9.0, 8.0, 10.0, 9.0, 8.0, 7.0, 13.0, 12.0, 20.0, 18.0, 20.0, 21.0, 31.0, 36.0, 33.0, 28.0, 25.0, 38.0, 31.0, 34.0, 46.0, 39.0, 42.0, 38.0, 29.0, 25.0, 16.0, 25.0, 27.0, 35.0, 41.0, 30.0, 19.0, 22.0, 19.0, 22.0, 22.0, 9.0, 14.0, 10.0, 9.0, 7.0, 6.0, 7.0, 7.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-39.33945846557617, -38.082916259765625, -36.826377868652344, -35.56983947753906, -34.313297271728516, -33.05675506591797, -31.800216674804688, -30.543676376342773, -29.28713607788086, -28.030595779418945, -26.77405548095703, -25.517515182495117, -24.260974884033203, -23.00443458557129, -21.747894287109375, -20.49135398864746, -19.234813690185547, -17.978273391723633, -16.72173309326172, -15.465192794799805, -14.20865249633789, -12.952112197875977, -11.695571899414062, -10.439031600952148, -9.182491302490234, -7.92595100402832, -6.669410705566406, -5.412870407104492, -4.156330108642578, -2.899789810180664, -1.64324951171875, -0.38670921325683594, 0.8698272705078125, 2.1263675689697266, 3.3829078674316406, 4.639448165893555, 5.895988464355469, 7.152528762817383, 8.409069061279297, 9.665609359741211, 10.922149658203125, 12.178689956665039, 13.435230255126953, 14.691770553588867, 15.948310852050781, 17.204851150512695, 18.46139144897461, 19.717931747436523, 20.974472045898438, 22.23101234436035, 23.487552642822266, 24.74409294128418, 26.000633239746094, 27.257173538208008, 28.513713836669922, 29.770254135131836, 31.02679443359375, 32.28333282470703, 33.53987503051758, 34.796417236328125, 36.052955627441406, 37.30949401855469, 38.566036224365234, 39.82257843017578, 41.07911682128906]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 11.0, 6.0, 5.0, 11.0, 15.0, 21.0, 21.0, 20.0, 26.0, 27.0, 39.0, 41.0, 41.0, 43.0, 54.0, 44.0, 59.0, 47.0, 50.0, 39.0, 44.0, 47.0, 45.0, 44.0, 33.0, 31.0, 20.0, 24.0, 20.0, 19.0, 10.0, 9.0, 7.0, 8.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6328125, -6.37109375, -6.109375, -5.84765625, -5.5859375, -5.32421875, -5.0625, -4.80078125, -4.5390625, -4.27734375, -4.015625, -3.75390625, -3.4921875, -3.23046875, -2.96875, -2.70703125, -2.4453125, -2.18359375, -1.921875, -1.66015625, -1.3984375, -1.13671875, -0.875, -0.61328125, -0.3515625, -0.08984375, 0.171875, 0.43359375, 0.6953125, 0.95703125, 1.21875, 1.48046875, 1.7421875, 2.00390625, 2.265625, 2.52734375, 2.7890625, 3.05078125, 3.3125, 3.57421875, 3.8359375, 4.09765625, 4.359375, 4.62109375, 4.8828125, 5.14453125, 5.40625, 5.66796875, 5.9296875, 6.19140625, 6.453125, 6.71484375, 6.9765625, 7.23828125, 7.5, 7.76171875, 8.0234375, 8.28515625, 8.546875, 8.80859375, 9.0703125, 9.33203125, 9.59375, 9.85546875, 10.1171875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 9.0, 18.0, 36.0, 41.0, 92.0, 95.0, 161.0, 267.0, 443.0, 813.0, 1446.0, 2558.0, 4630.0, 8583.0, 16124.0, 31410.0, 65409.0, 148380.0, 426796.0, 185173.0, 78306.0, 37014.0, 18702.0, 9948.0, 5301.0, 2928.0, 1647.0, 871.0, 503.0, 325.0, 172.0, 130.0, 78.0, 49.0, 34.0, 23.0, 14.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.697265625, -2.609161376953125, -2.52105712890625, -2.432952880859375, -2.3448486328125, -2.256744384765625, -2.16864013671875, -2.080535888671875, -1.992431640625, -1.904327392578125, -1.81622314453125, -1.728118896484375, -1.6400146484375, -1.551910400390625, -1.46380615234375, -1.375701904296875, -1.28759765625, -1.199493408203125, -1.11138916015625, -1.023284912109375, -0.9351806640625, -0.847076416015625, -0.75897216796875, -0.670867919921875, -0.582763671875, -0.494659423828125, -0.40655517578125, -0.318450927734375, -0.2303466796875, -0.142242431640625, -0.05413818359375, 0.033966064453125, 0.1220703125, 0.210174560546875, 0.29827880859375, 0.386383056640625, 0.4744873046875, 0.562591552734375, 0.65069580078125, 0.738800048828125, 0.826904296875, 0.915008544921875, 1.00311279296875, 1.091217041015625, 1.1793212890625, 1.267425537109375, 1.35552978515625, 1.443634033203125, 1.53173828125, 1.619842529296875, 1.70794677734375, 1.796051025390625, 1.8841552734375, 1.972259521484375, 2.06036376953125, 2.148468017578125, 2.236572265625, 2.324676513671875, 2.41278076171875, 2.500885009765625, 2.5889892578125, 2.677093505859375, 2.76519775390625, 2.853302001953125, 2.94140625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 7.0, 11.0, 13.0, 15.0, 12.0, 20.0, 24.0, 22.0, 27.0, 24.0, 25.0, 26.0, 37.0, 40.0, 39.0, 38.0, 41.0, 34.0, 1079.0, 42.0, 46.0, 34.0, 42.0, 46.0, 31.0, 32.0, 26.0, 33.0, 19.0, 26.0, 18.0, 16.0, 9.0, 8.0, 12.0, 8.0, 15.0, 9.0, 2.0, 1.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.966796875, -3.826629638671875, -3.68646240234375, -3.546295166015625, -3.4061279296875, -3.265960693359375, -3.12579345703125, -2.985626220703125, -2.845458984375, -2.705291748046875, -2.56512451171875, -2.424957275390625, -2.2847900390625, -2.144622802734375, -2.00445556640625, -1.864288330078125, -1.72412109375, -1.583953857421875, -1.44378662109375, -1.303619384765625, -1.1634521484375, -1.023284912109375, -0.88311767578125, -0.742950439453125, -0.602783203125, -0.462615966796875, -0.32244873046875, -0.182281494140625, -0.0421142578125, 0.098052978515625, 0.23822021484375, 0.378387451171875, 0.5185546875, 0.658721923828125, 0.79888916015625, 0.939056396484375, 1.0792236328125, 1.219390869140625, 1.35955810546875, 1.499725341796875, 1.639892578125, 1.780059814453125, 1.92022705078125, 2.060394287109375, 2.2005615234375, 2.340728759765625, 2.48089599609375, 2.621063232421875, 2.76123046875, 2.901397705078125, 3.04156494140625, 3.181732177734375, 3.3218994140625, 3.462066650390625, 3.60223388671875, 3.742401123046875, 3.882568359375, 4.022735595703125, 4.16290283203125, 4.303070068359375, 4.4432373046875, 4.583404541015625, 4.72357177734375, 4.863739013671875, 5.00390625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 9.0, 7.0, 16.0, 25.0, 27.0, 59.0, 80.0, 157.0, 222.0, 416.0, 600.0, 905.0, 1527.0, 2180.0, 3336.0, 5120.0, 7737.0, 11976.0, 18751.0, 29540.0, 47611.0, 77303.0, 138774.0, 1379584.0, 151318.0, 82488.0, 50188.0, 31015.0, 19831.0, 12803.0, 8215.0, 5198.0, 3495.0, 2446.0, 1484.0, 1051.0, 609.0, 384.0, 262.0, 128.0, 89.0, 77.0, 37.0, 12.0, 18.0, 12.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.708984375, -1.6530609130859375, -1.597137451171875, -1.5412139892578125, -1.48529052734375, -1.4293670654296875, -1.373443603515625, -1.3175201416015625, -1.2615966796875, -1.2056732177734375, -1.149749755859375, -1.0938262939453125, -1.03790283203125, -0.9819793701171875, -0.926055908203125, -0.8701324462890625, -0.814208984375, -0.7582855224609375, -0.702362060546875, -0.6464385986328125, -0.59051513671875, -0.5345916748046875, -0.478668212890625, -0.4227447509765625, -0.3668212890625, -0.3108978271484375, -0.254974365234375, -0.1990509033203125, -0.14312744140625, -0.0872039794921875, -0.031280517578125, 0.0246429443359375, 0.08056640625, 0.1364898681640625, 0.192413330078125, 0.2483367919921875, 0.30426025390625, 0.3601837158203125, 0.416107177734375, 0.4720306396484375, 0.5279541015625, 0.5838775634765625, 0.639801025390625, 0.6957244873046875, 0.75164794921875, 0.8075714111328125, 0.863494873046875, 0.9194183349609375, 0.975341796875, 1.0312652587890625, 1.087188720703125, 1.1431121826171875, 1.19903564453125, 1.2549591064453125, 1.310882568359375, 1.3668060302734375, 1.4227294921875, 1.4786529541015625, 1.534576416015625, 1.5904998779296875, 1.64642333984375, 1.7023468017578125, 1.758270263671875, 1.8141937255859375, 1.8701171875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 15.0, 14.0, 18.0, 19.0, 31.0, 43.0, 48.0, 67.0, 81.0, 68.0, 82.0, 88.0, 72.0, 64.0, 45.0, 54.0, 38.0, 22.0, 24.0, 13.0, 16.0, 18.0, 11.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029158592224121094, -0.0002821795642375946, -0.00027277320623397827, -0.00026336684823036194, -0.0002539604902267456, -0.00024455413222312927, -0.00023514777421951294, -0.0002257414162158966, -0.00021633505821228027, -0.00020692870020866394, -0.0001975223422050476, -0.00018811598420143127, -0.00017870962619781494, -0.0001693032681941986, -0.00015989691019058228, -0.00015049055218696594, -0.0001410841941833496, -0.00013167783617973328, -0.00012227147817611694, -0.00011286512017250061, -0.00010345876216888428, -9.405240416526794e-05, -8.464604616165161e-05, -7.523968815803528e-05, -6.583333015441895e-05, -5.642697215080261e-05, -4.702061414718628e-05, -3.7614256143569946e-05, -2.8207898139953613e-05, -1.880154013633728e-05, -9.395182132720947e-06, 1.1175870895385742e-08, 9.417533874511719e-06, 1.8823891878128052e-05, 2.8230249881744385e-05, 3.763660788536072e-05, 4.704296588897705e-05, 5.6449323892593384e-05, 6.585568189620972e-05, 7.526203989982605e-05, 8.466839790344238e-05, 9.407475590705872e-05, 0.00010348111391067505, 0.00011288747191429138, 0.00012229382991790771, 0.00013170018792152405, 0.00014110654592514038, 0.00015051290392875671, 0.00015991926193237305, 0.00016932561993598938, 0.0001787319779396057, 0.00018813833594322205, 0.00019754469394683838, 0.0002069510519504547, 0.00021635740995407104, 0.00022576376795768738, 0.0002351701259613037, 0.00024457648396492004, 0.0002539828419685364, 0.0002633891999721527, 0.00027279555797576904, 0.0002822019159793854, 0.0002916082739830017, 0.00030101463198661804, 0.0003104209899902344]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 6.0, 4.0, 8.0, 11.0, 14.0, 13.0, 23.0, 35.0, 30.0, 31.0, 70.0, 124.0, 163.0, 340.0, 1171.0, 827658.0, 217117.0, 867.0, 324.0, 165.0, 111.0, 74.0, 43.0, 46.0, 21.0, 17.0, 13.0, 13.0, 9.0, 9.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.006740570068359375, -0.006535768508911133, -0.006330966949462891, -0.0061261653900146484, -0.005921363830566406, -0.005716562271118164, -0.005511760711669922, -0.00530695915222168, -0.0051021575927734375, -0.004897356033325195, -0.004692554473876953, -0.004487752914428711, -0.004282951354980469, -0.0040781497955322266, -0.0038733482360839844, -0.003668546676635742, -0.0034637451171875, -0.003258943557739258, -0.0030541419982910156, -0.0028493404388427734, -0.0026445388793945312, -0.002439737319946289, -0.002234935760498047, -0.0020301342010498047, -0.0018253326416015625, -0.0016205310821533203, -0.0014157295227050781, -0.001210927963256836, -0.0010061264038085938, -0.0008013248443603516, -0.0005965232849121094, -0.0003917217254638672, -0.000186920166015625, 1.7881393432617188e-05, 0.00022268295288085938, 0.00042748451232910156, 0.0006322860717773438, 0.0008370876312255859, 0.0010418891906738281, 0.0012466907501220703, 0.0014514923095703125, 0.0016562938690185547, 0.0018610954284667969, 0.002065896987915039, 0.0022706985473632812, 0.0024755001068115234, 0.0026803016662597656, 0.002885103225708008, 0.00308990478515625, 0.003294706344604492, 0.0034995079040527344, 0.0037043094635009766, 0.003909111022949219, 0.004113912582397461, 0.004318714141845703, 0.004523515701293945, 0.0047283172607421875, 0.00493311882019043, 0.005137920379638672, 0.005342721939086914, 0.005547523498535156, 0.0057523250579833984, 0.005957126617431641, 0.006161928176879883, 0.006366729736328125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 6.0, 17.0, 23.0, 45.0, 86.0, 100.0, 129.0, 145.0, 139.0, 114.0, 94.0, 35.0, 33.0, 17.0, 10.0, 3.0, 5.0, 3.0, 1.0], "bins": [-0.000325835746480152, -0.00031961838249117136, -0.0003134010185021907, -0.00030718365451321006, -0.0003009662905242294, -0.00029474892653524876, -0.0002885315625462681, -0.00028231419855728745, -0.00027609680546447635, -0.0002698794414754957, -0.00026366207748651505, -0.0002574447134975344, -0.00025122734950855374, -0.0002450099855195731, -0.0002387926069786772, -0.00023257524298969656, -0.00022635789355263114, -0.0002201405295636505, -0.00021392316557466984, -0.0002077058015856892, -0.00020148843759670854, -0.00019527107360772789, -0.000189053695066832, -0.00018283633107785136, -0.0001766189670888707, -0.00017040160309989005, -0.0001641842391109094, -0.00015796687512192875, -0.00015174949658103287, -0.00014553213259205222, -0.00013931476860307157, -0.00013309740461409092, -0.00012688004062511027, -0.00012066267663612962, -0.00011444531264714897, -0.0001082279413822107, -0.00010201057739323005, -9.57932134042494e-05, -8.957584213931113e-05, -8.335847815033048e-05, -7.714110688539222e-05, -7.092374289641157e-05, -6.47063716314733e-05, -5.848900764249265e-05, -5.2271643653512e-05, -4.605427966453135e-05, -3.983691203757189e-05, -3.3619544410612434e-05, -2.7402180421631783e-05, -2.118481461366173e-05, -1.4967448805691674e-05, -8.75008299772162e-06, -2.5327171897515655e-06, 3.6846467992290854e-06, 9.902014426188543e-06, 1.6119382053148e-05, 2.2336746042128652e-05, 2.8554111850098707e-05, 3.477147765806876e-05, 4.098884528502822e-05, 4.720620927400887e-05, 5.342357326298952e-05, 5.964094088994898e-05, 6.585830851690844e-05, 7.207567250588909e-05]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 6.0, 7.0, 3.0, 12.0, 18.0, 17.0, 30.0, 29.0, 30.0, 36.0, 38.0, 44.0, 54.0, 49.0, 52.0, 52.0, 46.0, 36.0, 44.0, 46.0, 50.0, 42.0, 35.0, 36.0, 36.0, 25.0, 36.0, 24.0, 17.0, 10.0, 9.0, 11.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001621246337890625, -0.00015720073133707047, -0.00015227682888507843, -0.0001473529264330864, -0.00014242902398109436, -0.00013750512152910233, -0.0001325812190771103, -0.00012765731662511826, -0.00012273341417312622, -0.00011780951172113419, -0.00011288560926914215, -0.00010796170681715012, -0.00010303780436515808, -9.811390191316605e-05, -9.318999946117401e-05, -8.826609700918198e-05, -8.334219455718994e-05, -7.84182921051979e-05, -7.349438965320587e-05, -6.857048720121384e-05, -6.36465847492218e-05, -5.872268229722977e-05, -5.379877984523773e-05, -4.88748773932457e-05, -4.395097494125366e-05, -3.902707248926163e-05, -3.410317003726959e-05, -2.9179267585277557e-05, -2.4255365133285522e-05, -1.9331462681293488e-05, -1.4407560229301453e-05, -9.483657777309418e-06, -4.559755325317383e-06, 3.641471266746521e-07, 5.288049578666687e-06, 1.0211952030658722e-05, 1.5135854482650757e-05, 2.0059756934642792e-05, 2.4983659386634827e-05, 2.990756183862686e-05, 3.4831464290618896e-05, 3.975536674261093e-05, 4.4679269194602966e-05, 4.9603171646595e-05, 5.4527074098587036e-05, 5.945097655057907e-05, 6.43748790025711e-05, 6.929878145456314e-05, 7.422268390655518e-05, 7.914658635854721e-05, 8.407048881053925e-05, 8.899439126253128e-05, 9.391829371452332e-05, 9.884219616651535e-05, 0.00010376609861850739, 0.00010869000107049942, 0.00011361390352249146, 0.00011853780597448349, 0.00012346170842647552, 0.00012838561087846756, 0.0001333095133304596, 0.00013823341578245163, 0.00014315731823444366, 0.0001480812206864357, 0.00015300512313842773]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 11.0, 6.0, 5.0, 11.0, 15.0, 21.0, 21.0, 20.0, 26.0, 27.0, 39.0, 41.0, 41.0, 43.0, 54.0, 44.0, 59.0, 47.0, 50.0, 39.0, 44.0, 47.0, 45.0, 44.0, 33.0, 31.0, 20.0, 24.0, 20.0, 19.0, 10.0, 9.0, 7.0, 8.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6328125, -6.37109375, -6.109375, -5.84765625, -5.5859375, -5.32421875, -5.0625, -4.80078125, -4.5390625, -4.27734375, -4.015625, -3.75390625, -3.4921875, -3.23046875, -2.96875, -2.70703125, -2.4453125, -2.18359375, -1.921875, -1.66015625, -1.3984375, -1.13671875, -0.875, -0.61328125, -0.3515625, -0.08984375, 0.171875, 0.43359375, 0.6953125, 0.95703125, 1.21875, 1.48046875, 1.7421875, 2.00390625, 2.265625, 2.52734375, 2.7890625, 3.05078125, 3.3125, 3.57421875, 3.8359375, 4.09765625, 4.359375, 4.62109375, 4.8828125, 5.14453125, 5.40625, 5.66796875, 5.9296875, 6.19140625, 6.453125, 6.71484375, 6.9765625, 7.23828125, 7.5, 7.76171875, 8.0234375, 8.28515625, 8.546875, 8.80859375, 9.0703125, 9.33203125, 9.59375, 9.85546875, 10.1171875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 9.0, 14.0, 17.0, 22.0, 31.0, 42.0, 71.0, 86.0, 137.0, 261.0, 464.0, 1087.0, 2792.0, 8487.0, 28329.0, 102235.0, 371733.0, 383004.0, 106724.0, 29038.0, 8677.0, 2903.0, 1118.0, 512.0, 285.0, 152.0, 116.0, 84.0, 41.0, 23.0, 18.0, 18.0, 12.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.9215087890625, -8.624267578125, -8.3270263671875, -8.02978515625, -7.7325439453125, -7.435302734375, -7.1380615234375, -6.8408203125, -6.5435791015625, -6.246337890625, -5.9490966796875, -5.65185546875, -5.3546142578125, -5.057373046875, -4.7601318359375, -4.462890625, -4.1656494140625, -3.868408203125, -3.5711669921875, -3.27392578125, -2.9766845703125, -2.679443359375, -2.3822021484375, -2.0849609375, -1.7877197265625, -1.490478515625, -1.1932373046875, -0.89599609375, -0.5987548828125, -0.301513671875, -0.0042724609375, 0.29296875, 0.5902099609375, 0.887451171875, 1.1846923828125, 1.48193359375, 1.7791748046875, 2.076416015625, 2.3736572265625, 2.6708984375, 2.9681396484375, 3.265380859375, 3.5626220703125, 3.85986328125, 4.1571044921875, 4.454345703125, 4.7515869140625, 5.048828125, 5.3460693359375, 5.643310546875, 5.9405517578125, 6.23779296875, 6.5350341796875, 6.832275390625, 7.1295166015625, 7.4267578125, 7.7239990234375, 8.021240234375, 8.3184814453125, 8.61572265625, 8.9129638671875, 9.210205078125, 9.5074462890625, 9.8046875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 7.0, 5.0, 7.0, 8.0, 14.0, 18.0, 12.0, 19.0, 23.0, 19.0, 26.0, 36.0, 36.0, 40.0, 41.0, 52.0, 47.0, 70.0, 167.0, 1398.0, 376.0, 128.0, 67.0, 53.0, 42.0, 45.0, 37.0, 42.0, 23.0, 33.0, 20.0, 14.0, 27.0, 20.0, 18.0, 17.0, 11.0, 5.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.0, -20.274658203125, -19.54931640625, -18.823974609375, -18.0986328125, -17.373291015625, -16.64794921875, -15.922607421875, -15.197265625, -14.471923828125, -13.74658203125, -13.021240234375, -12.2958984375, -11.570556640625, -10.84521484375, -10.119873046875, -9.39453125, -8.669189453125, -7.94384765625, -7.218505859375, -6.4931640625, -5.767822265625, -5.04248046875, -4.317138671875, -3.591796875, -2.866455078125, -2.14111328125, -1.415771484375, -0.6904296875, 0.034912109375, 0.76025390625, 1.485595703125, 2.2109375, 2.936279296875, 3.66162109375, 4.386962890625, 5.1123046875, 5.837646484375, 6.56298828125, 7.288330078125, 8.013671875, 8.739013671875, 9.46435546875, 10.189697265625, 10.9150390625, 11.640380859375, 12.36572265625, 13.091064453125, 13.81640625, 14.541748046875, 15.26708984375, 15.992431640625, 16.7177734375, 17.443115234375, 18.16845703125, 18.893798828125, 19.619140625, 20.344482421875, 21.06982421875, 21.795166015625, 22.5205078125, 23.245849609375, 23.97119140625, 24.696533203125, 25.421875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 8.0, 11.0, 9.0, 16.0, 30.0, 26.0, 54.0, 75.0, 128.0, 172.0, 361.0, 1083.0, 48175.0, 3092435.0, 2039.0, 471.0, 219.0, 131.0, 85.0, 57.0, 40.0, 26.0, 19.0, 10.0, 7.0, 6.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.5, -143.18359375, -138.8671875, -134.55078125, -130.234375, -125.91796875, -121.6015625, -117.28515625, -112.96875, -108.65234375, -104.3359375, -100.01953125, -95.703125, -91.38671875, -87.0703125, -82.75390625, -78.4375, -74.12109375, -69.8046875, -65.48828125, -61.171875, -56.85546875, -52.5390625, -48.22265625, -43.90625, -39.58984375, -35.2734375, -30.95703125, -26.640625, -22.32421875, -18.0078125, -13.69140625, -9.375, -5.05859375, -0.7421875, 3.57421875, 7.890625, 12.20703125, 16.5234375, 20.83984375, 25.15625, 29.47265625, 33.7890625, 38.10546875, 42.421875, 46.73828125, 51.0546875, 55.37109375, 59.6875, 64.00390625, 68.3203125, 72.63671875, 76.953125, 81.26953125, 85.5859375, 89.90234375, 94.21875, 98.53515625, 102.8515625, 107.16796875, 111.484375, 115.80078125, 120.1171875, 124.43359375, 128.75]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 26.0, 99.0, 246.0, 376.0, 201.0, 56.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-121.8890609741211, -119.25873565673828, -116.62841033935547, -113.99809265136719, -111.36776733398438, -108.73744201660156, -106.10711669921875, -103.47679138183594, -100.84647369384766, -98.21614837646484, -95.58582305908203, -92.95550537109375, -90.32518005371094, -87.69485473632812, -85.06452941894531, -82.4342041015625, -79.80387878417969, -77.17355346679688, -74.54322814941406, -71.91291046142578, -69.28258514404297, -66.65225982666016, -64.02193450927734, -61.3916130065918, -58.76129150390625, -56.13096618652344, -53.50064468383789, -50.87031936645508, -48.23999786376953, -45.60967254638672, -42.979347229003906, -40.34902572631836, -37.71870803833008, -35.088382720947266, -32.45806121826172, -29.827735900878906, -27.19741439819336, -24.567089080810547, -21.936765670776367, -19.306442260742188, -16.676118850708008, -14.045795440673828, -11.415472030639648, -8.785147666931152, -6.154824256896973, -3.524500846862793, -0.8941764831542969, 1.7361469268798828, 4.3664703369140625, 6.996793746948242, 9.627117156982422, 12.257441520690918, 14.887764930725098, 17.518089294433594, 20.148412704467773, 22.778736114501953, 25.409059524536133, 28.039382934570312, 30.669706344604492, 33.30002975463867, 35.930355072021484, 38.56067657470703, 41.191001892089844, 43.821327209472656, 46.4516487121582]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 10.0, 7.0, 12.0, 16.0, 24.0, 24.0, 15.0, 34.0, 31.0, 31.0, 30.0, 43.0, 39.0, 46.0, 38.0, 44.0, 41.0, 41.0, 54.0, 43.0, 44.0, 42.0, 39.0, 29.0, 25.0, 29.0, 25.0, 24.0, 20.0, 12.0, 17.0, 19.0, 10.0, 6.0, 11.0, 7.0, 4.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.51719284057617, -48.575565338134766, -46.63393783569336, -44.69231033325195, -42.75068283081055, -40.80905532836914, -38.867431640625, -36.925804138183594, -34.98417663574219, -33.04254913330078, -31.100921630859375, -29.15929412841797, -27.217666625976562, -25.276039123535156, -23.334413528442383, -21.392786026000977, -19.451156616210938, -17.50952911376953, -15.567901611328125, -13.626275062561035, -11.684647560119629, -9.743020057678223, -7.801393508911133, -5.859766006469727, -3.9181385040283203, -1.9765112400054932, -0.034883975982666016, 1.906743049621582, 3.8483705520629883, 5.7899980545043945, 7.731624603271484, 9.67325210571289, 11.614875793457031, 13.556503295898438, 15.498130798339844, 17.43975830078125, 19.381385803222656, 21.323013305664062, 23.264638900756836, 25.206266403198242, 27.14789390563965, 29.089521408081055, 31.03114891052246, 32.972774505615234, 34.91440200805664, 36.85602951049805, 38.79765701293945, 40.73928451538086, 42.680912017822266, 44.62253952026367, 46.56416702270508, 48.505794525146484, 50.44742202758789, 52.3890495300293, 54.33067321777344, 56.272300720214844, 58.21392822265625, 60.155555725097656, 62.09718322753906, 64.03881072998047, 65.98043823242188, 67.92206573486328, 69.86369323730469, 71.8053207397461, 73.7469482421875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 11.0, 13.0, 14.0, 13.0, 19.0, 17.0, 30.0, 38.0, 32.0, 37.0, 29.0, 42.0, 54.0, 52.0, 47.0, 46.0, 55.0, 50.0, 50.0, 44.0, 41.0, 42.0, 39.0, 26.0, 36.0, 24.0, 17.0, 17.0, 12.0, 11.0, 11.0, 6.0, 3.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4609375, -7.1712646484375, -6.881591796875, -6.5919189453125, -6.30224609375, -6.0125732421875, -5.722900390625, -5.4332275390625, -5.1435546875, -4.8538818359375, -4.564208984375, -4.2745361328125, -3.98486328125, -3.6951904296875, -3.405517578125, -3.1158447265625, -2.826171875, -2.5364990234375, -2.246826171875, -1.9571533203125, -1.66748046875, -1.3778076171875, -1.088134765625, -0.7984619140625, -0.5087890625, -0.2191162109375, 0.070556640625, 0.3602294921875, 0.64990234375, 0.9395751953125, 1.229248046875, 1.5189208984375, 1.80859375, 2.0982666015625, 2.387939453125, 2.6776123046875, 2.96728515625, 3.2569580078125, 3.546630859375, 3.8363037109375, 4.1259765625, 4.4156494140625, 4.705322265625, 4.9949951171875, 5.28466796875, 5.5743408203125, 5.864013671875, 6.1536865234375, 6.443359375, 6.7330322265625, 7.022705078125, 7.3123779296875, 7.60205078125, 7.8917236328125, 8.181396484375, 8.4710693359375, 8.7607421875, 9.0504150390625, 9.340087890625, 9.6297607421875, 9.91943359375, 10.2091064453125, 10.498779296875, 10.7884521484375, 11.078125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 11.0, 8.0, 8.0, 23.0, 20.0, 14.0, 21.0, 41.0, 54.0, 54.0, 60.0, 71.0, 109.0, 149.0, 248.0, 562.0, 2204.0, 27710.0, 835945.0, 2926504.0, 385733.0, 12053.0, 1418.0, 455.0, 200.0, 143.0, 91.0, 87.0, 47.0, 59.0, 39.0, 31.0, 19.0, 22.0, 13.0, 17.0, 17.0, 5.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.4375, -16.7763671875, -16.115234375, -15.4541015625, -14.79296875, -14.1318359375, -13.470703125, -12.8095703125, -12.1484375, -11.4873046875, -10.826171875, -10.1650390625, -9.50390625, -8.8427734375, -8.181640625, -7.5205078125, -6.859375, -6.1982421875, -5.537109375, -4.8759765625, -4.21484375, -3.5537109375, -2.892578125, -2.2314453125, -1.5703125, -0.9091796875, -0.248046875, 0.4130859375, 1.07421875, 1.7353515625, 2.396484375, 3.0576171875, 3.71875, 4.3798828125, 5.041015625, 5.7021484375, 6.36328125, 7.0244140625, 7.685546875, 8.3466796875, 9.0078125, 9.6689453125, 10.330078125, 10.9912109375, 11.65234375, 12.3134765625, 12.974609375, 13.6357421875, 14.296875, 14.9580078125, 15.619140625, 16.2802734375, 16.94140625, 17.6025390625, 18.263671875, 18.9248046875, 19.5859375, 20.2470703125, 20.908203125, 21.5693359375, 22.23046875, 22.8916015625, 23.552734375, 24.2138671875, 24.875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 7.0, 10.0, 12.0, 19.0, 24.0, 22.0, 39.0, 67.0, 79.0, 128.0, 174.0, 232.0, 295.0, 396.0, 425.0, 463.0, 448.0, 314.0, 268.0, 177.0, 138.0, 89.0, 52.0, 56.0, 41.0, 25.0, 18.0, 16.0, 12.0, 7.0, 4.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9765625, -12.5001220703125, -12.023681640625, -11.5472412109375, -11.07080078125, -10.5943603515625, -10.117919921875, -9.6414794921875, -9.1650390625, -8.6885986328125, -8.212158203125, -7.7357177734375, -7.25927734375, -6.7828369140625, -6.306396484375, -5.8299560546875, -5.353515625, -4.8770751953125, -4.400634765625, -3.9241943359375, -3.44775390625, -2.9713134765625, -2.494873046875, -2.0184326171875, -1.5419921875, -1.0655517578125, -0.589111328125, -0.1126708984375, 0.36376953125, 0.8402099609375, 1.316650390625, 1.7930908203125, 2.26953125, 2.7459716796875, 3.222412109375, 3.6988525390625, 4.17529296875, 4.6517333984375, 5.128173828125, 5.6046142578125, 6.0810546875, 6.5574951171875, 7.033935546875, 7.5103759765625, 7.98681640625, 8.4632568359375, 8.939697265625, 9.4161376953125, 9.892578125, 10.3690185546875, 10.845458984375, 11.3218994140625, 11.79833984375, 12.2747802734375, 12.751220703125, 13.2276611328125, 13.7041015625, 14.1805419921875, 14.656982421875, 15.1334228515625, 15.60986328125, 16.0863037109375, 16.562744140625, 17.0391845703125, 17.515625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 4.0, 5.0, 3.0, 10.0, 13.0, 12.0, 28.0, 28.0, 62.0, 67.0, 65.0, 118.0, 190.0, 228.0, 339.0, 498.0, 2396.0, 2007353.0, 2178535.0, 2552.0, 522.0, 348.0, 249.0, 200.0, 145.0, 104.0, 67.0, 38.0, 29.0, 21.0, 17.0, 15.0, 13.0, 1.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-82.0, -79.7841796875, -77.568359375, -75.3525390625, -73.13671875, -70.9208984375, -68.705078125, -66.4892578125, -64.2734375, -62.0576171875, -59.841796875, -57.6259765625, -55.41015625, -53.1943359375, -50.978515625, -48.7626953125, -46.546875, -44.3310546875, -42.115234375, -39.8994140625, -37.68359375, -35.4677734375, -33.251953125, -31.0361328125, -28.8203125, -26.6044921875, -24.388671875, -22.1728515625, -19.95703125, -17.7412109375, -15.525390625, -13.3095703125, -11.09375, -8.8779296875, -6.662109375, -4.4462890625, -2.23046875, -0.0146484375, 2.201171875, 4.4169921875, 6.6328125, 8.8486328125, 11.064453125, 13.2802734375, 15.49609375, 17.7119140625, 19.927734375, 22.1435546875, 24.359375, 26.5751953125, 28.791015625, 31.0068359375, 33.22265625, 35.4384765625, 37.654296875, 39.8701171875, 42.0859375, 44.3017578125, 46.517578125, 48.7333984375, 50.94921875, 53.1650390625, 55.380859375, 57.5966796875, 59.8125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 34.0, 326.0, 496.0, 142.0, 17.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.7945556640625, -62.24710464477539, -53.69965362548828, -45.15220260620117, -36.60475158691406, -28.057300567626953, -19.509849548339844, -10.962398529052734, -2.414947509765625, 6.132503509521484, 14.679954528808594, 23.227405548095703, 31.774856567382812, 40.32230758666992, 48.86975860595703, 57.41720962524414, 65.96466064453125, 74.51211547851562, 83.05956268310547, 91.60700988769531, 100.15446472167969, 108.70191955566406, 117.2493667602539, 125.79681396484375, 134.34426879882812, 142.8917236328125, 151.43917846679688, 159.9866180419922, 168.53407287597656, 177.08152770996094, 185.62896728515625, 194.17642211914062, 202.723876953125, 211.27133178710938, 219.81878662109375, 228.36622619628906, 236.91368103027344, 245.4611358642578, 254.00857543945312, 262.5560302734375, 271.1034851074219, 279.65093994140625, 288.1983947753906, 296.745849609375, 305.29327392578125, 313.8407287597656, 322.38818359375, 330.9356384277344, 339.48309326171875, 348.0305480957031, 356.5780029296875, 365.1254577636719, 373.67291259765625, 382.2203369140625, 390.7677917480469, 399.31524658203125, 407.8627014160156, 416.41015625, 424.9576110839844, 433.50506591796875, 442.052490234375, 450.5999450683594, 459.14739990234375, 467.6948547363281, 476.2423095703125]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 2.0, 9.0, 1.0, 9.0, 6.0, 13.0, 11.0, 11.0, 12.0, 12.0, 26.0, 22.0, 20.0, 40.0, 33.0, 31.0, 30.0, 32.0, 35.0, 42.0, 45.0, 35.0, 34.0, 37.0, 32.0, 51.0, 33.0, 39.0, 33.0, 32.0, 36.0, 24.0, 20.0, 18.0, 20.0, 15.0, 18.0, 18.0, 14.0, 9.0, 11.0, 6.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.30508041381836, -36.9688720703125, -35.63266372680664, -34.29645538330078, -32.96025085449219, -31.624040603637695, -30.28783416748047, -28.95162582397461, -27.61541748046875, -26.27920913696289, -24.94300079345703, -23.606794357299805, -22.270586013793945, -20.934377670288086, -19.59817123413086, -18.261962890625, -16.92575454711914, -15.589546203613281, -14.253338813781738, -12.917131423950195, -11.580923080444336, -10.244714736938477, -8.908507347106934, -7.572299957275391, -6.236091613769531, -4.89988374710083, -3.563675880432129, -2.2274680137634277, -0.8912601470947266, 0.4449477195739746, 1.7811555862426758, 3.1173629760742188, 4.4535675048828125, 5.789775371551514, 7.125983238220215, 8.462190628051758, 9.798398971557617, 11.134607315063477, 12.47081470489502, 13.807022094726562, 15.143230438232422, 16.47943878173828, 17.81564712524414, 19.151853561401367, 20.488061904907227, 21.824270248413086, 23.160476684570312, 24.496685028076172, 25.83289337158203, 27.16910171508789, 28.50531005859375, 29.841516494750977, 31.177724838256836, 32.51393127441406, 33.85013961791992, 35.18634796142578, 36.52255630493164, 37.8587646484375, 39.19497299194336, 40.53118133544922, 41.86738586425781, 43.20359420776367, 44.53980255126953, 45.87601089477539, 47.21221923828125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 9.0, 12.0, 20.0, 17.0, 16.0, 33.0, 31.0, 35.0, 30.0, 41.0, 51.0, 51.0, 28.0, 42.0, 47.0, 54.0, 41.0, 43.0, 45.0, 35.0, 40.0, 42.0, 27.0, 32.0, 26.0, 26.0, 20.0, 15.0, 17.0, 11.0, 12.0, 16.0, 4.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0703125, -6.8115234375, -6.552734375, -6.2939453125, -6.03515625, -5.7763671875, -5.517578125, -5.2587890625, -5.0, -4.7412109375, -4.482421875, -4.2236328125, -3.96484375, -3.7060546875, -3.447265625, -3.1884765625, -2.9296875, -2.6708984375, -2.412109375, -2.1533203125, -1.89453125, -1.6357421875, -1.376953125, -1.1181640625, -0.859375, -0.6005859375, -0.341796875, -0.0830078125, 0.17578125, 0.4345703125, 0.693359375, 0.9521484375, 1.2109375, 1.4697265625, 1.728515625, 1.9873046875, 2.24609375, 2.5048828125, 2.763671875, 3.0224609375, 3.28125, 3.5400390625, 3.798828125, 4.0576171875, 4.31640625, 4.5751953125, 4.833984375, 5.0927734375, 5.3515625, 5.6103515625, 5.869140625, 6.1279296875, 6.38671875, 6.6455078125, 6.904296875, 7.1630859375, 7.421875, 7.6806640625, 7.939453125, 8.1982421875, 8.45703125, 8.7158203125, 8.974609375, 9.2333984375, 9.4921875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 9.0, 12.0, 20.0, 33.0, 46.0, 83.0, 124.0, 174.0, 291.0, 476.0, 711.0, 1146.0, 1832.0, 2817.0, 4608.0, 7293.0, 11638.0, 19549.0, 32879.0, 58761.0, 108008.0, 244662.0, 290472.0, 113757.0, 61402.0, 34623.0, 20430.0, 12227.0, 7529.0, 4830.0, 2977.0, 1879.0, 1203.0, 743.0, 476.0, 285.0, 194.0, 117.0, 87.0, 52.0, 36.0, 18.0, 18.0, 12.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.2265625, -2.157073974609375, -2.08758544921875, -2.018096923828125, -1.9486083984375, -1.879119873046875, -1.80963134765625, -1.740142822265625, -1.670654296875, -1.601165771484375, -1.53167724609375, -1.462188720703125, -1.3927001953125, -1.323211669921875, -1.25372314453125, -1.184234619140625, -1.11474609375, -1.045257568359375, -0.97576904296875, -0.906280517578125, -0.8367919921875, -0.767303466796875, -0.69781494140625, -0.628326416015625, -0.558837890625, -0.489349365234375, -0.41986083984375, -0.350372314453125, -0.2808837890625, -0.211395263671875, -0.14190673828125, -0.072418212890625, -0.0029296875, 0.066558837890625, 0.13604736328125, 0.205535888671875, 0.2750244140625, 0.344512939453125, 0.41400146484375, 0.483489990234375, 0.552978515625, 0.622467041015625, 0.69195556640625, 0.761444091796875, 0.8309326171875, 0.900421142578125, 0.96990966796875, 1.039398193359375, 1.10888671875, 1.178375244140625, 1.24786376953125, 1.317352294921875, 1.3868408203125, 1.456329345703125, 1.52581787109375, 1.595306396484375, 1.664794921875, 1.734283447265625, 1.80377197265625, 1.873260498046875, 1.9427490234375, 2.012237548828125, 2.08172607421875, 2.151214599609375, 2.220703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 2.0, 9.0, 11.0, 13.0, 5.0, 12.0, 21.0, 18.0, 22.0, 15.0, 30.0, 35.0, 34.0, 36.0, 38.0, 41.0, 45.0, 33.0, 37.0, 1061.0, 47.0, 57.0, 36.0, 34.0, 35.0, 37.0, 26.0, 27.0, 20.0, 28.0, 21.0, 21.0, 22.0, 17.0, 12.0, 13.0, 13.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.9609375, -4.8148193359375, -4.668701171875, -4.5225830078125, -4.37646484375, -4.2303466796875, -4.084228515625, -3.9381103515625, -3.7919921875, -3.6458740234375, -3.499755859375, -3.3536376953125, -3.20751953125, -3.0614013671875, -2.915283203125, -2.7691650390625, -2.623046875, -2.4769287109375, -2.330810546875, -2.1846923828125, -2.03857421875, -1.8924560546875, -1.746337890625, -1.6002197265625, -1.4541015625, -1.3079833984375, -1.161865234375, -1.0157470703125, -0.86962890625, -0.7235107421875, -0.577392578125, -0.4312744140625, -0.28515625, -0.1390380859375, 0.007080078125, 0.1531982421875, 0.29931640625, 0.4454345703125, 0.591552734375, 0.7376708984375, 0.8837890625, 1.0299072265625, 1.176025390625, 1.3221435546875, 1.46826171875, 1.6143798828125, 1.760498046875, 1.9066162109375, 2.052734375, 2.1988525390625, 2.344970703125, 2.4910888671875, 2.63720703125, 2.7833251953125, 2.929443359375, 3.0755615234375, 3.2216796875, 3.3677978515625, 3.513916015625, 3.6600341796875, 3.80615234375, 3.9522705078125, 4.098388671875, 4.2445068359375, 4.390625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 9.0, 22.0, 19.0, 36.0, 57.0, 77.0, 138.0, 180.0, 288.0, 399.0, 613.0, 877.0, 1297.0, 1948.0, 2870.0, 4179.0, 6090.0, 9145.0, 13547.0, 20694.0, 32115.0, 49912.0, 79936.0, 141515.0, 1363189.0, 142566.0, 79845.0, 50286.0, 32228.0, 21033.0, 13778.0, 9074.0, 6162.0, 4256.0, 2791.0, 1905.0, 1307.0, 914.0, 591.0, 444.0, 267.0, 184.0, 103.0, 93.0, 50.0, 39.0, 20.0, 14.0, 16.0, 5.0, 5.0, 6.0, 0.0, 0.0, 3.0], "bins": [-1.8583984375, -1.8029327392578125, -1.747467041015625, -1.6920013427734375, -1.63653564453125, -1.5810699462890625, -1.525604248046875, -1.4701385498046875, -1.4146728515625, -1.3592071533203125, -1.303741455078125, -1.2482757568359375, -1.19281005859375, -1.1373443603515625, -1.081878662109375, -1.0264129638671875, -0.970947265625, -0.9154815673828125, -0.860015869140625, -0.8045501708984375, -0.74908447265625, -0.6936187744140625, -0.638153076171875, -0.5826873779296875, -0.5272216796875, -0.4717559814453125, -0.416290283203125, -0.3608245849609375, -0.30535888671875, -0.2498931884765625, -0.194427490234375, -0.1389617919921875, -0.08349609375, -0.0280303955078125, 0.027435302734375, 0.0829010009765625, 0.13836669921875, 0.1938323974609375, 0.249298095703125, 0.3047637939453125, 0.3602294921875, 0.4156951904296875, 0.471160888671875, 0.5266265869140625, 0.58209228515625, 0.6375579833984375, 0.693023681640625, 0.7484893798828125, 0.803955078125, 0.8594207763671875, 0.914886474609375, 0.9703521728515625, 1.02581787109375, 1.0812835693359375, 1.136749267578125, 1.1922149658203125, 1.2476806640625, 1.3031463623046875, 1.358612060546875, 1.4140777587890625, 1.46954345703125, 1.5250091552734375, 1.580474853515625, 1.6359405517578125, 1.69140625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 7.0, 4.0, 5.0, 6.0, 4.0, 5.0, 11.0, 21.0, 14.0, 26.0, 24.0, 30.0, 44.0, 52.0, 59.0, 82.0, 102.0, 127.0, 79.0, 64.0, 46.0, 27.0, 29.0, 26.0, 21.0, 20.0, 11.0, 10.0, 9.0, 7.0, 8.0, 8.0, 4.0, 4.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002951622009277344, -0.00028489530086517334, -0.0002746284008026123, -0.00026436150074005127, -0.00025409460067749023, -0.0002438277006149292, -0.00023356080055236816, -0.00022329390048980713, -0.0002130270004272461, -0.00020276010036468506, -0.00019249320030212402, -0.000182226300239563, -0.00017195940017700195, -0.00016169250011444092, -0.00015142560005187988, -0.00014115869998931885, -0.0001308917999267578, -0.00012062489986419678, -0.00011035799980163574, -0.00010009109973907471, -8.982419967651367e-05, -7.955729961395264e-05, -6.92903995513916e-05, -5.9023499488830566e-05, -4.875659942626953e-05, -3.8489699363708496e-05, -2.822279930114746e-05, -1.7955899238586426e-05, -7.68899917602539e-06, 2.5779008865356445e-06, 1.284480094909668e-05, 2.3111701011657715e-05, 3.337860107421875e-05, 4.3645501136779785e-05, 5.391240119934082e-05, 6.417930126190186e-05, 7.444620132446289e-05, 8.471310138702393e-05, 9.498000144958496e-05, 0.000105246901512146, 0.00011551380157470703, 0.00012578070163726807, 0.0001360476016998291, 0.00014631450176239014, 0.00015658140182495117, 0.0001668483018875122, 0.00017711520195007324, 0.00018738210201263428, 0.0001976490020751953, 0.00020791590213775635, 0.00021818280220031738, 0.00022844970226287842, 0.00023871660232543945, 0.0002489835023880005, 0.0002592504024505615, 0.00026951730251312256, 0.0002797842025756836, 0.00029005110263824463, 0.00030031800270080566, 0.0003105849027633667, 0.00032085180282592773, 0.00033111870288848877, 0.0003413856029510498, 0.00035165250301361084, 0.0003619194030761719]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 7.0, 7.0, 10.0, 8.0, 21.0, 20.0, 28.0, 33.0, 43.0, 59.0, 69.0, 161.0, 350.0, 955.0, 578551.0, 466556.0, 892.0, 312.0, 148.0, 81.0, 55.0, 41.0, 34.0, 17.0, 25.0, 13.0, 11.0, 8.0, 8.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00826263427734375, -0.008026480674743652, -0.007790327072143555, -0.007554173469543457, -0.007318019866943359, -0.007081866264343262, -0.006845712661743164, -0.006609559059143066, -0.006373405456542969, -0.006137251853942871, -0.0059010982513427734, -0.005664944648742676, -0.005428791046142578, -0.0051926374435424805, -0.004956483840942383, -0.004720330238342285, -0.0044841766357421875, -0.00424802303314209, -0.004011869430541992, -0.0037757158279418945, -0.003539562225341797, -0.0033034086227416992, -0.0030672550201416016, -0.002831101417541504, -0.0025949478149414062, -0.0023587942123413086, -0.002122640609741211, -0.0018864870071411133, -0.0016503334045410156, -0.001414179801940918, -0.0011780261993408203, -0.0009418725967407227, -0.000705718994140625, -0.00046956539154052734, -0.0002334117889404297, 2.7418136596679688e-06, 0.00023889541625976562, 0.0004750490188598633, 0.0007112026214599609, 0.0009473562240600586, 0.0011835098266601562, 0.001419663429260254, 0.0016558170318603516, 0.0018919706344604492, 0.002128124237060547, 0.0023642778396606445, 0.002600431442260742, 0.00283658504486084, 0.0030727386474609375, 0.003308892250061035, 0.003545045852661133, 0.0037811994552612305, 0.004017353057861328, 0.004253506660461426, 0.0044896602630615234, 0.004725813865661621, 0.004961967468261719, 0.005198121070861816, 0.005434274673461914, 0.005670428276062012, 0.005906581878662109, 0.006142735481262207, 0.006378889083862305, 0.006615042686462402, 0.0068511962890625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 28.0, 147.0, 270.0, 285.0, 193.0, 58.0, 18.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.0007903288933448493, -0.0007762444438412786, -0.0007621600525453687, -0.0007480756030417979, -0.0007339911535382271, -0.0007199067622423172, -0.0007058223127387464, -0.0006917378632351756, -0.0006776534719392657, -0.0006635690224356949, -0.000649484631139785, -0.0006354001816362143, -0.0006213157321326435, -0.0006072313408367336, -0.0005931468913331628, -0.000579062441829592, -0.0005649779923260212, -0.0005508935428224504, -0.0005368091515265405, -0.0005227247020229697, -0.0005086402525193989, -0.000494555861223489, -0.00048047141171991825, -0.00046638696221634746, -0.0004523025709204376, -0.00043821815052069724, -0.00042413370101712644, -0.0004100492806173861, -0.00039596486021764576, -0.00038188041071407497, -0.00036779599031433463, -0.00035371154081076384, -0.0003396271204110235, -0.00032554270001128316, -0.00031145825050771236, -0.000297373830107972, -0.0002832894097082317, -0.0002692049602046609, -0.00025512053980492055, -0.000241036104853265, -0.00022695166990160942, -0.00021286723494995385, -0.00019878281455021352, -0.00018469837959855795, -0.00017061394464690238, -0.00015652950969524682, -0.00014244508929550648, -0.0001283606543438509, -0.00011427622666815296, -0.000100191798992455, -8.610736404079944e-05, -7.202293636510149e-05, -5.793850505142473e-05, -4.385407373774797e-05, -2.9769646062050015e-05, -1.5685211110394448e-05, -1.6007834346964955e-06, 1.2483646969485562e-05, 2.656807737366762e-05, 4.0652506868354976e-05, 5.4736938182031736e-05, 6.88213694957085e-05, 8.290579717140645e-05, 9.699023212306201e-05, 0.00011107465979875997]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 4.0, 8.0, 6.0, 14.0, 10.0, 7.0, 13.0, 14.0, 13.0, 23.0, 26.0, 33.0, 38.0, 26.0, 26.0, 27.0, 35.0, 50.0, 36.0, 49.0, 45.0, 40.0, 37.0, 39.0, 45.0, 46.0, 34.0, 40.0, 34.0, 19.0, 32.0, 22.0, 14.0, 9.0, 20.0, 19.0, 8.0, 9.0, 8.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00013846158981323242, -0.0001339958980679512, -0.00012953020632266998, -0.00012506451457738876, -0.00012059882283210754, -0.00011613313108682632, -0.0001116674393415451, -0.00010720174759626389, -0.00010273605585098267, -9.827036410570145e-05, -9.380467236042023e-05, -8.933898061513901e-05, -8.487328886985779e-05, -8.040759712457657e-05, -7.594190537929535e-05, -7.147621363401413e-05, -6.701052188873291e-05, -6.254483014345169e-05, -5.807913839817047e-05, -5.361344665288925e-05, -4.914775490760803e-05, -4.468206316232681e-05, -4.021637141704559e-05, -3.5750679671764374e-05, -3.1284987926483154e-05, -2.6819296181201935e-05, -2.2353604435920715e-05, -1.7887912690639496e-05, -1.3422220945358276e-05, -8.956529200077057e-06, -4.490837454795837e-06, -2.514570951461792e-08, 4.4405460357666016e-06, 8.906237781047821e-06, 1.337192952632904e-05, 1.783762127161026e-05, 2.230331301689148e-05, 2.67690047621727e-05, 3.123469650745392e-05, 3.570038825273514e-05, 4.016607999801636e-05, 4.463177174329758e-05, 4.9097463488578796e-05, 5.3563155233860016e-05, 5.8028846979141235e-05, 6.249453872442245e-05, 6.696023046970367e-05, 7.14259222149849e-05, 7.589161396026611e-05, 8.035730570554733e-05, 8.482299745082855e-05, 8.928868919610977e-05, 9.375438094139099e-05, 9.822007268667221e-05, 0.00010268576443195343, 0.00010715145617723465, 0.00011161714792251587, 0.00011608283966779709, 0.00012054853141307831, 0.00012501422315835953, 0.00012947991490364075, 0.00013394560664892197, 0.00013841129839420319, 0.0001428769901394844, 0.00014734268188476562]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 9.0, 12.0, 20.0, 17.0, 16.0, 33.0, 31.0, 35.0, 30.0, 41.0, 51.0, 51.0, 28.0, 42.0, 47.0, 54.0, 41.0, 43.0, 45.0, 35.0, 40.0, 42.0, 27.0, 32.0, 26.0, 26.0, 20.0, 15.0, 17.0, 11.0, 12.0, 16.0, 4.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0703125, -6.8115234375, -6.552734375, -6.2939453125, -6.03515625, -5.7763671875, -5.517578125, -5.2587890625, -5.0, -4.7412109375, -4.482421875, -4.2236328125, -3.96484375, -3.7060546875, -3.447265625, -3.1884765625, -2.9296875, -2.6708984375, -2.412109375, -2.1533203125, -1.89453125, -1.6357421875, -1.376953125, -1.1181640625, -0.859375, -0.6005859375, -0.341796875, -0.0830078125, 0.17578125, 0.4345703125, 0.693359375, 0.9521484375, 1.2109375, 1.4697265625, 1.728515625, 1.9873046875, 2.24609375, 2.5048828125, 2.763671875, 3.0224609375, 3.28125, 3.5400390625, 3.798828125, 4.0576171875, 4.31640625, 4.5751953125, 4.833984375, 5.0927734375, 5.3515625, 5.6103515625, 5.869140625, 6.1279296875, 6.38671875, 6.6455078125, 6.904296875, 7.1630859375, 7.421875, 7.6806640625, 7.939453125, 8.1982421875, 8.45703125, 8.7158203125, 8.974609375, 9.2333984375, 9.4921875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 10.0, 10.0, 11.0, 16.0, 12.0, 31.0, 53.0, 75.0, 120.0, 163.0, 314.0, 613.0, 1456.0, 3007.0, 6642.0, 14506.0, 33811.0, 85046.0, 224446.0, 362643.0, 190775.0, 72246.0, 28897.0, 12684.0, 5690.0, 2683.0, 1286.0, 567.0, 307.0, 130.0, 108.0, 57.0, 29.0, 29.0, 23.0, 15.0, 10.0, 12.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.88671875, -6.6602783203125, -6.433837890625, -6.2073974609375, -5.98095703125, -5.7545166015625, -5.528076171875, -5.3016357421875, -5.0751953125, -4.8487548828125, -4.622314453125, -4.3958740234375, -4.16943359375, -3.9429931640625, -3.716552734375, -3.4901123046875, -3.263671875, -3.0372314453125, -2.810791015625, -2.5843505859375, -2.35791015625, -2.1314697265625, -1.905029296875, -1.6785888671875, -1.4521484375, -1.2257080078125, -0.999267578125, -0.7728271484375, -0.54638671875, -0.3199462890625, -0.093505859375, 0.1329345703125, 0.359375, 0.5858154296875, 0.812255859375, 1.0386962890625, 1.26513671875, 1.4915771484375, 1.718017578125, 1.9444580078125, 2.1708984375, 2.3973388671875, 2.623779296875, 2.8502197265625, 3.07666015625, 3.3031005859375, 3.529541015625, 3.7559814453125, 3.982421875, 4.2088623046875, 4.435302734375, 4.6617431640625, 4.88818359375, 5.1146240234375, 5.341064453125, 5.5675048828125, 5.7939453125, 6.0203857421875, 6.246826171875, 6.4732666015625, 6.69970703125, 6.9261474609375, 7.152587890625, 7.3790283203125, 7.60546875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 9.0, 6.0, 6.0, 11.0, 12.0, 8.0, 12.0, 11.0, 10.0, 28.0, 23.0, 16.0, 32.0, 32.0, 42.0, 48.0, 57.0, 63.0, 133.0, 336.0, 1436.0, 222.0, 102.0, 57.0, 35.0, 49.0, 37.0, 34.0, 27.0, 20.0, 12.0, 21.0, 15.0, 19.0, 17.0, 12.0, 9.0, 5.0, 7.0, 7.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.8125, -28.942626953125, -28.07275390625, -27.202880859375, -26.3330078125, -25.463134765625, -24.59326171875, -23.723388671875, -22.853515625, -21.983642578125, -21.11376953125, -20.243896484375, -19.3740234375, -18.504150390625, -17.63427734375, -16.764404296875, -15.89453125, -15.024658203125, -14.15478515625, -13.284912109375, -12.4150390625, -11.545166015625, -10.67529296875, -9.805419921875, -8.935546875, -8.065673828125, -7.19580078125, -6.325927734375, -5.4560546875, -4.586181640625, -3.71630859375, -2.846435546875, -1.9765625, -1.106689453125, -0.23681640625, 0.633056640625, 1.5029296875, 2.372802734375, 3.24267578125, 4.112548828125, 4.982421875, 5.852294921875, 6.72216796875, 7.592041015625, 8.4619140625, 9.331787109375, 10.20166015625, 11.071533203125, 11.94140625, 12.811279296875, 13.68115234375, 14.551025390625, 15.4208984375, 16.290771484375, 17.16064453125, 18.030517578125, 18.900390625, 19.770263671875, 20.64013671875, 21.510009765625, 22.3798828125, 23.249755859375, 24.11962890625, 24.989501953125, 25.859375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 4.0, 4.0, 4.0, 6.0, 10.0, 21.0, 23.0, 22.0, 31.0, 51.0, 52.0, 72.0, 109.0, 180.0, 303.0, 489.0, 1850.0, 2866165.0, 273962.0, 1106.0, 455.0, 269.0, 157.0, 97.0, 71.0, 47.0, 28.0, 28.0, 36.0, 20.0, 13.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-99.125, -96.0166015625, -92.908203125, -89.7998046875, -86.69140625, -83.5830078125, -80.474609375, -77.3662109375, -74.2578125, -71.1494140625, -68.041015625, -64.9326171875, -61.82421875, -58.7158203125, -55.607421875, -52.4990234375, -49.390625, -46.2822265625, -43.173828125, -40.0654296875, -36.95703125, -33.8486328125, -30.740234375, -27.6318359375, -24.5234375, -21.4150390625, -18.306640625, -15.1982421875, -12.08984375, -8.9814453125, -5.873046875, -2.7646484375, 0.34375, 3.4521484375, 6.560546875, 9.6689453125, 12.77734375, 15.8857421875, 18.994140625, 22.1025390625, 25.2109375, 28.3193359375, 31.427734375, 34.5361328125, 37.64453125, 40.7529296875, 43.861328125, 46.9697265625, 50.078125, 53.1865234375, 56.294921875, 59.4033203125, 62.51171875, 65.6201171875, 68.728515625, 71.8369140625, 74.9453125, 78.0537109375, 81.162109375, 84.2705078125, 87.37890625, 90.4873046875, 93.595703125, 96.7041015625, 99.8125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [2.0, 33.0, 378.0, 542.0, 56.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.687761306762695, -11.46932601928711, -6.250889778137207, -1.0324535369873047, 4.185981750488281, 9.404417037963867, 14.622854232788086, 19.84128761291504, 25.059724807739258, 30.278160095214844, 35.49659729003906, 40.71503448486328, 45.933467864990234, 51.15190124511719, 56.370338439941406, 61.588775634765625, 66.80721282958984, 72.02565002441406, 77.24408721923828, 82.4625244140625, 87.68095397949219, 92.8993911743164, 98.11782836914062, 103.33625793457031, 108.55469512939453, 113.77313232421875, 118.99156951904297, 124.21000671386719, 129.42843627929688, 134.64688110351562, 139.8653106689453, 145.083740234375, 150.3021697998047, 155.52059936523438, 160.73904418945312, 165.9574737548828, 171.17591857910156, 176.39434814453125, 181.61279296875, 186.8312225341797, 192.04965209960938, 197.26808166503906, 202.4865264892578, 207.7049560546875, 212.92340087890625, 218.14183044433594, 223.36026000976562, 228.57870483398438, 233.79714965820312, 239.0155792236328, 244.23402404785156, 249.45245361328125, 254.6708984375, 259.88934326171875, 265.1077575683594, 270.3262023925781, 275.54461669921875, 280.7630615234375, 285.9814758300781, 291.1999206542969, 296.4183654785156, 301.63677978515625, 306.855224609375, 312.07366943359375, 317.2921142578125]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 5.0, 6.0, 13.0, 21.0, 12.0, 14.0, 16.0, 16.0, 20.0, 20.0, 15.0, 25.0, 20.0, 40.0, 22.0, 34.0, 34.0, 37.0, 39.0, 33.0, 34.0, 34.0, 33.0, 24.0, 35.0, 32.0, 35.0, 38.0, 35.0, 21.0, 28.0, 33.0, 22.0, 24.0, 21.0, 14.0, 12.0, 21.0, 2.0, 8.0, 13.0, 5.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-58.020729064941406, -56.284339904785156, -54.547950744628906, -52.81156539916992, -51.07517623901367, -49.33878707885742, -47.60239791870117, -45.86601257324219, -44.12962341308594, -42.39323425292969, -40.65684509277344, -38.92045974731445, -37.1840705871582, -35.44768142700195, -33.7112922668457, -31.974905014038086, -30.238515853881836, -28.502126693725586, -26.76573944091797, -25.02935028076172, -23.2929630279541, -21.55657386779785, -19.820186614990234, -18.083797454833984, -16.347408294677734, -14.6110200881958, -12.874631881713867, -11.138242721557617, -9.40185546875, -7.66546630859375, -5.929078102111816, -4.192689895629883, -2.4563026428222656, -0.7199143171310425, 1.0164740085601807, 2.7528624534606934, 4.489250659942627, 6.225639343261719, 7.962027549743652, 9.698415756225586, 11.43480396270752, 13.171192169189453, 14.907580375671387, 16.64396858215332, 18.38035774230957, 20.116744995117188, 21.853134155273438, 23.589523315429688, 25.325910568237305, 27.062299728393555, 28.798686981201172, 30.535076141357422, 32.27146530151367, 34.007850646972656, 35.744239807128906, 37.480628967285156, 39.217018127441406, 40.953407287597656, 42.689796447753906, 44.42618179321289, 46.16257095336914, 47.89896011352539, 49.63534927368164, 51.371734619140625, 53.108123779296875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 10.0, 7.0, 10.0, 14.0, 14.0, 26.0, 17.0, 27.0, 32.0, 30.0, 39.0, 35.0, 35.0, 37.0, 47.0, 51.0, 49.0, 46.0, 44.0, 42.0, 48.0, 34.0, 35.0, 35.0, 32.0, 20.0, 25.0, 28.0, 13.0, 23.0, 17.0, 13.0, 12.0, 12.0, 8.0, 7.0, 7.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.24609375, -6.97015380859375, -6.6942138671875, -6.41827392578125, -6.142333984375, -5.86639404296875, -5.5904541015625, -5.31451416015625, -5.03857421875, -4.76263427734375, -4.4866943359375, -4.21075439453125, -3.934814453125, -3.65887451171875, -3.3829345703125, -3.10699462890625, -2.8310546875, -2.55511474609375, -2.2791748046875, -2.00323486328125, -1.727294921875, -1.45135498046875, -1.1754150390625, -0.89947509765625, -0.62353515625, -0.34759521484375, -0.0716552734375, 0.20428466796875, 0.480224609375, 0.75616455078125, 1.0321044921875, 1.30804443359375, 1.583984375, 1.85992431640625, 2.1358642578125, 2.41180419921875, 2.687744140625, 2.96368408203125, 3.2396240234375, 3.51556396484375, 3.79150390625, 4.06744384765625, 4.3433837890625, 4.61932373046875, 4.895263671875, 5.17120361328125, 5.4471435546875, 5.72308349609375, 5.9990234375, 6.27496337890625, 6.5509033203125, 6.82684326171875, 7.102783203125, 7.37872314453125, 7.6546630859375, 7.93060302734375, 8.20654296875, 8.48248291015625, 8.7584228515625, 9.03436279296875, 9.310302734375, 9.58624267578125, 9.8621826171875, 10.13812255859375, 10.4140625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 8.0, 9.0, 8.0, 13.0, 17.0, 16.0, 26.0, 28.0, 50.0, 47.0, 57.0, 97.0, 148.0, 222.0, 524.0, 1281.0, 10427.0, 672672.0, 3296405.0, 205650.0, 4635.0, 888.0, 378.0, 187.0, 120.0, 83.0, 59.0, 44.0, 29.0, 31.0, 28.0, 25.0, 15.0, 12.0, 11.0, 6.0, 7.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.8125, -22.942138671875, -22.07177734375, -21.201416015625, -20.3310546875, -19.460693359375, -18.59033203125, -17.719970703125, -16.849609375, -15.979248046875, -15.10888671875, -14.238525390625, -13.3681640625, -12.497802734375, -11.62744140625, -10.757080078125, -9.88671875, -9.016357421875, -8.14599609375, -7.275634765625, -6.4052734375, -5.534912109375, -4.66455078125, -3.794189453125, -2.923828125, -2.053466796875, -1.18310546875, -0.312744140625, 0.5576171875, 1.427978515625, 2.29833984375, 3.168701171875, 4.0390625, 4.909423828125, 5.77978515625, 6.650146484375, 7.5205078125, 8.390869140625, 9.26123046875, 10.131591796875, 11.001953125, 11.872314453125, 12.74267578125, 13.613037109375, 14.4833984375, 15.353759765625, 16.22412109375, 17.094482421875, 17.96484375, 18.835205078125, 19.70556640625, 20.575927734375, 21.4462890625, 22.316650390625, 23.18701171875, 24.057373046875, 24.927734375, 25.798095703125, 26.66845703125, 27.538818359375, 28.4091796875, 29.279541015625, 30.14990234375, 31.020263671875, 31.890625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 6.0, 9.0, 9.0, 19.0, 26.0, 29.0, 52.0, 54.0, 92.0, 106.0, 124.0, 198.0, 253.0, 302.0, 373.0, 436.0, 413.0, 345.0, 314.0, 225.0, 184.0, 117.0, 105.0, 62.0, 60.0, 41.0, 27.0, 29.0, 19.0, 6.0, 8.0, 3.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.453125, -15.9805908203125, -15.508056640625, -15.0355224609375, -14.56298828125, -14.0904541015625, -13.617919921875, -13.1453857421875, -12.6728515625, -12.2003173828125, -11.727783203125, -11.2552490234375, -10.78271484375, -10.3101806640625, -9.837646484375, -9.3651123046875, -8.892578125, -8.4200439453125, -7.947509765625, -7.4749755859375, -7.00244140625, -6.5299072265625, -6.057373046875, -5.5848388671875, -5.1123046875, -4.6397705078125, -4.167236328125, -3.6947021484375, -3.22216796875, -2.7496337890625, -2.277099609375, -1.8045654296875, -1.33203125, -0.8594970703125, -0.386962890625, 0.0855712890625, 0.55810546875, 1.0306396484375, 1.503173828125, 1.9757080078125, 2.4482421875, 2.9207763671875, 3.393310546875, 3.8658447265625, 4.33837890625, 4.8109130859375, 5.283447265625, 5.7559814453125, 6.228515625, 6.7010498046875, 7.173583984375, 7.6461181640625, 8.11865234375, 8.5911865234375, 9.063720703125, 9.5362548828125, 10.0087890625, 10.4813232421875, 10.953857421875, 11.4263916015625, 11.89892578125, 12.3714599609375, 12.843994140625, 13.3165283203125, 13.7890625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 5.0, 11.0, 14.0, 24.0, 34.0, 46.0, 50.0, 75.0, 102.0, 133.0, 176.0, 240.0, 306.0, 497.0, 1339.0, 182954.0, 3988883.0, 17106.0, 736.0, 388.0, 294.0, 201.0, 189.0, 122.0, 92.0, 74.0, 41.0, 35.0, 36.0, 23.0, 10.0, 11.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.3125, -60.1875, -58.0625, -55.9375, -53.8125, -51.6875, -49.5625, -47.4375, -45.3125, -43.1875, -41.0625, -38.9375, -36.8125, -34.6875, -32.5625, -30.4375, -28.3125, -26.1875, -24.0625, -21.9375, -19.8125, -17.6875, -15.5625, -13.4375, -11.3125, -9.1875, -7.0625, -4.9375, -2.8125, -0.6875, 1.4375, 3.5625, 5.6875, 7.8125, 9.9375, 12.0625, 14.1875, 16.3125, 18.4375, 20.5625, 22.6875, 24.8125, 26.9375, 29.0625, 31.1875, 33.3125, 35.4375, 37.5625, 39.6875, 41.8125, 43.9375, 46.0625, 48.1875, 50.3125, 52.4375, 54.5625, 56.6875, 58.8125, 60.9375, 63.0625, 65.1875, 67.3125, 69.4375, 71.5625, 73.6875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 6.0, 30.0, 219.0, 409.0, 278.0, 65.0, 10.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.27892303466797, -43.66758728027344, -37.05625534057617, -30.444921493530273, -23.833587646484375, -17.222251892089844, -10.610919952392578, -3.9995880126953125, 2.6117477416992188, 9.223081588745117, 15.834415435791016, 22.445749282836914, 29.057083129882812, 35.668418884277344, 42.27975082397461, 48.891082763671875, 55.502418518066406, 62.11375427246094, 68.72508239746094, 75.33641815185547, 81.94775390625, 88.55908966064453, 95.17042541503906, 101.78175354003906, 108.3930892944336, 115.00442504882812, 121.61575317382812, 128.2270965576172, 134.8384246826172, 141.44976806640625, 148.06109619140625, 154.67242431640625, 161.28375244140625, 167.89508056640625, 174.5064239501953, 181.1177520751953, 187.72909545898438, 194.34042358398438, 200.95175170898438, 207.56307983398438, 214.17442321777344, 220.78575134277344, 227.3970947265625, 234.0084228515625, 240.6197509765625, 247.23109436035156, 253.84242248535156, 260.4537658691406, 267.0650939941406, 273.6764221191406, 280.2877502441406, 286.89910888671875, 293.51043701171875, 300.12176513671875, 306.73309326171875, 313.34442138671875, 319.95574951171875, 326.56707763671875, 333.17840576171875, 339.7897644042969, 346.4010925292969, 353.0124206542969, 359.6237487792969, 366.2350769042969, 372.846435546875]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 5.0, 13.0, 13.0, 17.0, 10.0, 22.0, 17.0, 22.0, 22.0, 34.0, 31.0, 45.0, 30.0, 36.0, 44.0, 37.0, 44.0, 28.0, 44.0, 44.0, 42.0, 42.0, 44.0, 35.0, 37.0, 24.0, 28.0, 27.0, 20.0, 25.0, 14.0, 18.0, 14.0, 13.0, 9.0, 9.0, 7.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-58.853214263916016, -57.18791580200195, -55.522613525390625, -53.85731506347656, -52.1920166015625, -50.52671813964844, -48.861419677734375, -47.19611740112305, -45.530818939208984, -43.86552047729492, -42.200218200683594, -40.53491973876953, -38.86962127685547, -37.204322814941406, -35.539024353027344, -33.873722076416016, -32.20842361450195, -30.54312515258789, -28.877824783325195, -27.2125244140625, -25.547225952148438, -23.881927490234375, -22.21662712097168, -20.551326751708984, -18.886028289794922, -17.22072982788086, -15.555429458618164, -13.890130043029785, -12.224830627441406, -10.559531211853027, -8.894231796264648, -7.2289323806762695, -5.563632965087891, -3.8983335494995117, -2.233034133911133, -0.5677347183227539, 1.097564697265625, 2.762864112854004, 4.428163528442383, 6.093462944030762, 7.758762359619141, 9.42406177520752, 11.089361190795898, 12.754660606384277, 14.419960021972656, 16.08525848388672, 17.750558853149414, 19.41585922241211, 21.081157684326172, 22.746456146240234, 24.41175651550293, 26.077056884765625, 27.742355346679688, 29.40765380859375, 31.072954177856445, 32.73825454711914, 34.4035530090332, 36.068851470947266, 37.734153747558594, 39.399452209472656, 41.06475067138672, 42.73004913330078, 44.395347595214844, 46.06064987182617, 47.725948333740234]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 3.0, 9.0, 6.0, 18.0, 12.0, 12.0, 20.0, 13.0, 17.0, 27.0, 23.0, 24.0, 28.0, 26.0, 36.0, 39.0, 54.0, 42.0, 49.0, 46.0, 50.0, 47.0, 31.0, 41.0, 43.0, 38.0, 32.0, 22.0, 31.0, 25.0, 24.0, 18.0, 21.0, 14.0, 13.0, 14.0, 12.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6328125, -8.376953125, -8.12109375, -7.865234375, -7.609375, -7.353515625, -7.09765625, -6.841796875, -6.5859375, -6.330078125, -6.07421875, -5.818359375, -5.5625, -5.306640625, -5.05078125, -4.794921875, -4.5390625, -4.283203125, -4.02734375, -3.771484375, -3.515625, -3.259765625, -3.00390625, -2.748046875, -2.4921875, -2.236328125, -1.98046875, -1.724609375, -1.46875, -1.212890625, -0.95703125, -0.701171875, -0.4453125, -0.189453125, 0.06640625, 0.322265625, 0.578125, 0.833984375, 1.08984375, 1.345703125, 1.6015625, 1.857421875, 2.11328125, 2.369140625, 2.625, 2.880859375, 3.13671875, 3.392578125, 3.6484375, 3.904296875, 4.16015625, 4.416015625, 4.671875, 4.927734375, 5.18359375, 5.439453125, 5.6953125, 5.951171875, 6.20703125, 6.462890625, 6.71875, 6.974609375, 7.23046875, 7.486328125, 7.7421875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 10.0, 22.0, 13.0, 23.0, 46.0, 65.0, 95.0, 103.0, 175.0, 304.0, 434.0, 610.0, 975.0, 1468.0, 2169.0, 3108.0, 4674.0, 7130.0, 10945.0, 16800.0, 25779.0, 41423.0, 70339.0, 130814.0, 328492.0, 176284.0, 87428.0, 50014.0, 31119.0, 19760.0, 12953.0, 8374.0, 5520.0, 3654.0, 2527.0, 1641.0, 1079.0, 737.0, 470.0, 298.0, 213.0, 174.0, 98.0, 42.0, 49.0, 37.0, 24.0, 16.0, 9.0, 4.0, 10.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-2.12890625, -2.06378173828125, -1.9986572265625, -1.93353271484375, -1.868408203125, -1.80328369140625, -1.7381591796875, -1.67303466796875, -1.60791015625, -1.54278564453125, -1.4776611328125, -1.41253662109375, -1.347412109375, -1.28228759765625, -1.2171630859375, -1.15203857421875, -1.0869140625, -1.02178955078125, -0.9566650390625, -0.89154052734375, -0.826416015625, -0.76129150390625, -0.6961669921875, -0.63104248046875, -0.56591796875, -0.50079345703125, -0.4356689453125, -0.37054443359375, -0.305419921875, -0.24029541015625, -0.1751708984375, -0.11004638671875, -0.044921875, 0.02020263671875, 0.0853271484375, 0.15045166015625, 0.215576171875, 0.28070068359375, 0.3458251953125, 0.41094970703125, 0.47607421875, 0.54119873046875, 0.6063232421875, 0.67144775390625, 0.736572265625, 0.80169677734375, 0.8668212890625, 0.93194580078125, 0.9970703125, 1.06219482421875, 1.1273193359375, 1.19244384765625, 1.257568359375, 1.32269287109375, 1.3878173828125, 1.45294189453125, 1.51806640625, 1.58319091796875, 1.6483154296875, 1.71343994140625, 1.778564453125, 1.84368896484375, 1.9088134765625, 1.97393798828125, 2.0390625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 6.0, 6.0, 6.0, 12.0, 9.0, 12.0, 12.0, 15.0, 24.0, 20.0, 14.0, 24.0, 30.0, 29.0, 38.0, 34.0, 37.0, 36.0, 37.0, 42.0, 34.0, 1067.0, 40.0, 47.0, 29.0, 38.0, 32.0, 32.0, 40.0, 31.0, 21.0, 20.0, 19.0, 20.0, 11.0, 17.0, 15.0, 15.0, 8.0, 5.0, 10.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5078125, -4.35845947265625, -4.2091064453125, -4.05975341796875, -3.910400390625, -3.76104736328125, -3.6116943359375, -3.46234130859375, -3.31298828125, -3.16363525390625, -3.0142822265625, -2.86492919921875, -2.715576171875, -2.56622314453125, -2.4168701171875, -2.26751708984375, -2.1181640625, -1.96881103515625, -1.8194580078125, -1.67010498046875, -1.520751953125, -1.37139892578125, -1.2220458984375, -1.07269287109375, -0.92333984375, -0.77398681640625, -0.6246337890625, -0.47528076171875, -0.325927734375, -0.17657470703125, -0.0272216796875, 0.12213134765625, 0.271484375, 0.42083740234375, 0.5701904296875, 0.71954345703125, 0.868896484375, 1.01824951171875, 1.1676025390625, 1.31695556640625, 1.46630859375, 1.61566162109375, 1.7650146484375, 1.91436767578125, 2.063720703125, 2.21307373046875, 2.3624267578125, 2.51177978515625, 2.6611328125, 2.81048583984375, 2.9598388671875, 3.10919189453125, 3.258544921875, 3.40789794921875, 3.5572509765625, 3.70660400390625, 3.85595703125, 4.00531005859375, 4.1546630859375, 4.30401611328125, 4.453369140625, 4.60272216796875, 4.7520751953125, 4.90142822265625, 5.05078125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 5.0, 14.0, 17.0, 26.0, 34.0, 42.0, 95.0, 100.0, 176.0, 268.0, 389.0, 541.0, 882.0, 1242.0, 1803.0, 2411.0, 3605.0, 4877.0, 7259.0, 10698.0, 15387.0, 23323.0, 35366.0, 53950.0, 85671.0, 156645.0, 1346551.0, 126897.0, 74703.0, 47164.0, 31590.0, 20670.0, 13824.0, 9307.0, 6550.0, 4594.0, 3195.0, 2284.0, 1533.0, 1097.0, 743.0, 534.0, 359.0, 235.0, 164.0, 131.0, 63.0, 43.0, 32.0, 18.0, 13.0, 5.0, 3.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.712890625, -1.656463623046875, -1.60003662109375, -1.543609619140625, -1.4871826171875, -1.430755615234375, -1.37432861328125, -1.317901611328125, -1.261474609375, -1.205047607421875, -1.14862060546875, -1.092193603515625, -1.0357666015625, -0.979339599609375, -0.92291259765625, -0.866485595703125, -0.81005859375, -0.753631591796875, -0.69720458984375, -0.640777587890625, -0.5843505859375, -0.527923583984375, -0.47149658203125, -0.415069580078125, -0.358642578125, -0.302215576171875, -0.24578857421875, -0.189361572265625, -0.1329345703125, -0.076507568359375, -0.02008056640625, 0.036346435546875, 0.0927734375, 0.149200439453125, 0.20562744140625, 0.262054443359375, 0.3184814453125, 0.374908447265625, 0.43133544921875, 0.487762451171875, 0.544189453125, 0.600616455078125, 0.65704345703125, 0.713470458984375, 0.7698974609375, 0.826324462890625, 0.88275146484375, 0.939178466796875, 0.99560546875, 1.052032470703125, 1.10845947265625, 1.164886474609375, 1.2213134765625, 1.277740478515625, 1.33416748046875, 1.390594482421875, 1.447021484375, 1.503448486328125, 1.55987548828125, 1.616302490234375, 1.6727294921875, 1.729156494140625, 1.78558349609375, 1.842010498046875, 1.8984375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 9.0, 10.0, 8.0, 7.0, 12.0, 13.0, 10.0, 21.0, 16.0, 18.0, 26.0, 33.0, 32.0, 41.0, 33.0, 67.0, 57.0, 70.0, 67.0, 56.0, 62.0, 59.0, 48.0, 33.0, 34.0, 23.0, 17.0, 20.0, 19.0, 10.0, 11.0, 11.0, 5.0, 4.0, 3.0, 6.0, 1.0, 7.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0002617835998535156, -0.0002538226544857025, -0.0002458617091178894, -0.0002379007637500763, -0.00022993981838226318, -0.00022197887301445007, -0.00021401792764663696, -0.00020605698227882385, -0.00019809603691101074, -0.00019013509154319763, -0.00018217414617538452, -0.0001742132008075714, -0.0001662522554397583, -0.0001582913100719452, -0.00015033036470413208, -0.00014236941933631897, -0.00013440847396850586, -0.00012644752860069275, -0.00011848658323287964, -0.00011052563786506653, -0.00010256469249725342, -9.460374712944031e-05, -8.66428017616272e-05, -7.868185639381409e-05, -7.072091102600098e-05, -6.275996565818787e-05, -5.4799020290374756e-05, -4.6838074922561646e-05, -3.8877129554748535e-05, -3.0916184186935425e-05, -2.2955238819122314e-05, -1.4994293451309204e-05, -7.033348083496094e-06, 9.275972843170166e-07, 8.888542652130127e-06, 1.6849488019943237e-05, 2.4810433387756348e-05, 3.277137875556946e-05, 4.073232412338257e-05, 4.869326949119568e-05, 5.665421485900879e-05, 6.46151602268219e-05, 7.257610559463501e-05, 8.053705096244812e-05, 8.849799633026123e-05, 9.645894169807434e-05, 0.00010441988706588745, 0.00011238083243370056, 0.00012034177780151367, 0.00012830272316932678, 0.0001362636685371399, 0.000144224613904953, 0.0001521855592727661, 0.00016014650464057922, 0.00016810745000839233, 0.00017606839537620544, 0.00018402934074401855, 0.00019199028611183167, 0.00019995123147964478, 0.00020791217684745789, 0.000215873122215271, 0.0002238340675830841, 0.00023179501295089722, 0.00023975595831871033, 0.00024771690368652344]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 9.0, 2.0, 5.0, 7.0, 6.0, 11.0, 13.0, 21.0, 18.0, 20.0, 26.0, 24.0, 49.0, 45.0, 79.0, 140.0, 203.0, 325.0, 1040.0, 155805.0, 887717.0, 1816.0, 447.0, 218.0, 120.0, 92.0, 53.0, 36.0, 34.0, 38.0, 20.0, 31.0, 14.0, 14.0, 18.0, 11.0, 7.0, 5.0, 2.0, 6.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.005886077880859375, -0.0057029128074646, -0.005519747734069824, -0.005336582660675049, -0.0051534175872802734, -0.004970252513885498, -0.004787087440490723, -0.004603922367095947, -0.004420757293701172, -0.0042375922203063965, -0.004054427146911621, -0.0038712620735168457, -0.0036880970001220703, -0.003504931926727295, -0.0033217668533325195, -0.003138601779937744, -0.0029554367065429688, -0.0027722716331481934, -0.002589106559753418, -0.0024059414863586426, -0.002222776412963867, -0.002039611339569092, -0.0018564462661743164, -0.001673281192779541, -0.0014901161193847656, -0.0013069510459899902, -0.0011237859725952148, -0.0009406208992004395, -0.0007574558258056641, -0.0005742907524108887, -0.0003911256790161133, -0.0002079606056213379, -2.47955322265625e-05, 0.0001583695411682129, 0.0003415346145629883, 0.0005246996879577637, 0.0007078647613525391, 0.0008910298347473145, 0.0010741949081420898, 0.0012573599815368652, 0.0014405250549316406, 0.001623690128326416, 0.0018068552017211914, 0.001990020275115967, 0.002173185348510742, 0.0023563504219055176, 0.002539515495300293, 0.0027226805686950684, 0.0029058456420898438, 0.003089010715484619, 0.0032721757888793945, 0.00345534086227417, 0.0036385059356689453, 0.0038216710090637207, 0.004004836082458496, 0.0041880011558532715, 0.004371166229248047, 0.004554331302642822, 0.004737496376037598, 0.004920661449432373, 0.0051038265228271484, 0.005286991596221924, 0.005470156669616699, 0.005653321743011475, 0.00583648681640625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 11.0, 20.0, 38.0, 103.0, 158.0, 212.0, 213.0, 142.0, 62.0, 25.0, 18.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000443780270870775, -0.0004340611631050706, -0.00042434208444319665, -0.00041462297667749226, -0.00040490386891178787, -0.00039518479024991393, -0.00038546568248420954, -0.00037574657471850514, -0.00036602746695280075, -0.00035630835918709636, -0.0003465892805252224, -0.00033687017275951803, -0.00032715106499381363, -0.0003174319863319397, -0.0003077128785662353, -0.0002979937708005309, -0.000288274692138657, -0.0002785555843729526, -0.00026883650571107864, -0.00025911739794537425, -0.00024939829017966986, -0.0002396791969658807, -0.00022996010375209153, -0.00022024099598638713, -0.00021052190277259797, -0.0002008028095588088, -0.0001910837017931044, -0.00018136460857931525, -0.00017164551536552608, -0.0001619264075998217, -0.00015220731438603252, -0.00014248822117224336, -0.0001327690843027085, -0.00012304999108891934, -0.00011333088332321495, -0.00010361179010942578, -9.3892689619679e-05, -8.417358912993222e-05, -7.445449591614306e-05, -6.473539542639628e-05, -5.50162949366495e-05, -4.529719444690272e-05, -3.557809759513475e-05, -2.5858998924377374e-05, -1.613990025362e-05, -6.4207997638732195e-06, 3.2982970878947526e-06, 1.3017393939662725e-05, 2.2736494429409504e-05, 3.245559491915628e-05, 4.2174691770924255e-05, 5.189378862269223e-05, 6.1612889112439e-05, 7.133198960218579e-05, 8.105108281597495e-05, 9.077018330572173e-05, 0.00010048928379546851, 0.00011020838428521529, 0.00011992748477496207, 0.00012964657798875123, 0.0001393656712025404, 0.0001490847789682448, 0.00015880387218203396, 0.00016852296539582312, 0.00017824207316152751]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 11.0, 11.0, 9.0, 17.0, 13.0, 14.0, 18.0, 22.0, 26.0, 29.0, 30.0, 24.0, 36.0, 36.0, 46.0, 41.0, 42.0, 45.0, 48.0, 41.0, 46.0, 35.0, 40.0, 35.0, 32.0, 24.0, 38.0, 24.0, 23.0, 25.0, 14.0, 15.0, 18.0, 9.0, 9.0, 8.0, 11.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012576580047607422, -0.00012152735143899918, -0.00011728890240192413, -0.00011305045336484909, -0.00010881200432777405, -0.000104573555290699, -0.00010033510625362396, -9.609665721654892e-05, -9.185820817947388e-05, -8.761975914239883e-05, -8.338131010532379e-05, -7.914286106824875e-05, -7.49044120311737e-05, -7.066596299409866e-05, -6.642751395702362e-05, -6.218906491994858e-05, -5.7950615882873535e-05, -5.371216684579849e-05, -4.947371780872345e-05, -4.523526877164841e-05, -4.0996819734573364e-05, -3.675837069749832e-05, -3.251992166042328e-05, -2.8281472623348236e-05, -2.4043023586273193e-05, -1.980457454919815e-05, -1.5566125512123108e-05, -1.1327676475048065e-05, -7.0892274379730225e-06, -2.8507784008979797e-06, 1.387670636177063e-06, 5.626119673252106e-06, 9.864568710327148e-06, 1.4103017747402191e-05, 1.8341466784477234e-05, 2.2579915821552277e-05, 2.681836485862732e-05, 3.105681389570236e-05, 3.5295262932777405e-05, 3.953371196985245e-05, 4.377216100692749e-05, 4.801061004400253e-05, 5.2249059081077576e-05, 5.648750811815262e-05, 6.072595715522766e-05, 6.49644061923027e-05, 6.920285522937775e-05, 7.344130426645279e-05, 7.767975330352783e-05, 8.191820234060287e-05, 8.615665137767792e-05, 9.039510041475296e-05, 9.4633549451828e-05, 9.887199848890305e-05, 0.00010311044752597809, 0.00010734889656305313, 0.00011158734560012817, 0.00011582579463720322, 0.00012006424367427826, 0.0001243026927113533, 0.00012854114174842834, 0.0001327795907855034, 0.00013701803982257843, 0.00014125648885965347, 0.00014549493789672852]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 3.0, 9.0, 6.0, 18.0, 12.0, 12.0, 20.0, 13.0, 17.0, 27.0, 23.0, 24.0, 28.0, 26.0, 36.0, 39.0, 54.0, 42.0, 49.0, 46.0, 50.0, 47.0, 31.0, 41.0, 43.0, 38.0, 32.0, 22.0, 31.0, 25.0, 24.0, 18.0, 21.0, 14.0, 13.0, 14.0, 12.0, 11.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6328125, -8.376953125, -8.12109375, -7.865234375, -7.609375, -7.353515625, -7.09765625, -6.841796875, -6.5859375, -6.330078125, -6.07421875, -5.818359375, -5.5625, -5.306640625, -5.05078125, -4.794921875, -4.5390625, -4.283203125, -4.02734375, -3.771484375, -3.515625, -3.259765625, -3.00390625, -2.748046875, -2.4921875, -2.236328125, -1.98046875, -1.724609375, -1.46875, -1.212890625, -0.95703125, -0.701171875, -0.4453125, -0.189453125, 0.06640625, 0.322265625, 0.578125, 0.833984375, 1.08984375, 1.345703125, 1.6015625, 1.857421875, 2.11328125, 2.369140625, 2.625, 2.880859375, 3.13671875, 3.392578125, 3.6484375, 3.904296875, 4.16015625, 4.416015625, 4.671875, 4.927734375, 5.18359375, 5.439453125, 5.6953125, 5.951171875, 6.20703125, 6.462890625, 6.71875, 6.974609375, 7.23046875, 7.486328125, 7.7421875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 7.0, 13.0, 11.0, 21.0, 19.0, 38.0, 38.0, 57.0, 67.0, 106.0, 172.0, 197.0, 404.0, 813.0, 2233.0, 5866.0, 17103.0, 47507.0, 130648.0, 333272.0, 315866.0, 123152.0, 45475.0, 15837.0, 5647.0, 2008.0, 810.0, 386.0, 203.0, 137.0, 113.0, 90.0, 55.0, 46.0, 33.0, 22.0, 27.0, 12.0, 11.0, 9.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6640625, -8.39306640625, -8.1220703125, -7.85107421875, -7.580078125, -7.30908203125, -7.0380859375, -6.76708984375, -6.49609375, -6.22509765625, -5.9541015625, -5.68310546875, -5.412109375, -5.14111328125, -4.8701171875, -4.59912109375, -4.328125, -4.05712890625, -3.7861328125, -3.51513671875, -3.244140625, -2.97314453125, -2.7021484375, -2.43115234375, -2.16015625, -1.88916015625, -1.6181640625, -1.34716796875, -1.076171875, -0.80517578125, -0.5341796875, -0.26318359375, 0.0078125, 0.27880859375, 0.5498046875, 0.82080078125, 1.091796875, 1.36279296875, 1.6337890625, 1.90478515625, 2.17578125, 2.44677734375, 2.7177734375, 2.98876953125, 3.259765625, 3.53076171875, 3.8017578125, 4.07275390625, 4.34375, 4.61474609375, 4.8857421875, 5.15673828125, 5.427734375, 5.69873046875, 5.9697265625, 6.24072265625, 6.51171875, 6.78271484375, 7.0537109375, 7.32470703125, 7.595703125, 7.86669921875, 8.1376953125, 8.40869140625, 8.6796875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 3.0, 8.0, 5.0, 8.0, 16.0, 17.0, 13.0, 17.0, 21.0, 22.0, 19.0, 39.0, 23.0, 33.0, 38.0, 28.0, 50.0, 64.0, 142.0, 1455.0, 466.0, 122.0, 74.0, 40.0, 34.0, 39.0, 39.0, 32.0, 25.0, 29.0, 18.0, 24.0, 17.0, 15.0, 12.0, 11.0, 10.0, 6.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-32.21875, -31.347412109375, -30.47607421875, -29.604736328125, -28.7333984375, -27.862060546875, -26.99072265625, -26.119384765625, -25.248046875, -24.376708984375, -23.50537109375, -22.634033203125, -21.7626953125, -20.891357421875, -20.02001953125, -19.148681640625, -18.27734375, -17.406005859375, -16.53466796875, -15.663330078125, -14.7919921875, -13.920654296875, -13.04931640625, -12.177978515625, -11.306640625, -10.435302734375, -9.56396484375, -8.692626953125, -7.8212890625, -6.949951171875, -6.07861328125, -5.207275390625, -4.3359375, -3.464599609375, -2.59326171875, -1.721923828125, -0.8505859375, 0.020751953125, 0.89208984375, 1.763427734375, 2.634765625, 3.506103515625, 4.37744140625, 5.248779296875, 6.1201171875, 6.991455078125, 7.86279296875, 8.734130859375, 9.60546875, 10.476806640625, 11.34814453125, 12.219482421875, 13.0908203125, 13.962158203125, 14.83349609375, 15.704833984375, 16.576171875, 17.447509765625, 18.31884765625, 19.190185546875, 20.0615234375, 20.932861328125, 21.80419921875, 22.675537109375, 23.546875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 10.0, 9.0, 14.0, 16.0, 6.0, 22.0, 31.0, 65.0, 66.0, 91.0, 162.0, 234.0, 583.0, 2169.0, 2998024.0, 141671.0, 1363.0, 468.0, 240.0, 114.0, 91.0, 59.0, 48.0, 36.0, 27.0, 15.0, 10.0, 11.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-145.125, -141.1884765625, -137.251953125, -133.3154296875, -129.37890625, -125.4423828125, -121.505859375, -117.5693359375, -113.6328125, -109.6962890625, -105.759765625, -101.8232421875, -97.88671875, -93.9501953125, -90.013671875, -86.0771484375, -82.140625, -78.2041015625, -74.267578125, -70.3310546875, -66.39453125, -62.4580078125, -58.521484375, -54.5849609375, -50.6484375, -46.7119140625, -42.775390625, -38.8388671875, -34.90234375, -30.9658203125, -27.029296875, -23.0927734375, -19.15625, -15.2197265625, -11.283203125, -7.3466796875, -3.41015625, 0.5263671875, 4.462890625, 8.3994140625, 12.3359375, 16.2724609375, 20.208984375, 24.1455078125, 28.08203125, 32.0185546875, 35.955078125, 39.8916015625, 43.828125, 47.7646484375, 51.701171875, 55.6376953125, 59.57421875, 63.5107421875, 67.447265625, 71.3837890625, 75.3203125, 79.2568359375, 83.193359375, 87.1298828125, 91.06640625, 95.0029296875, 98.939453125, 102.8759765625, 106.8125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 9.0, 47.0, 308.0, 509.0, 130.0, 13.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-235.23777770996094, -230.8983917236328, -226.55899047851562, -222.2196044921875, -217.88021850585938, -213.54083251953125, -209.20143127441406, -204.86204528808594, -200.52264404296875, -196.18325805664062, -191.84385681152344, -187.5044708251953, -183.1650848388672, -178.82568359375, -174.48629760742188, -170.14691162109375, -165.80752563476562, -161.4681396484375, -157.1287384033203, -152.7893524169922, -148.44996643066406, -144.11056518554688, -139.77117919921875, -135.43179321289062, -131.0924072265625, -126.75301361083984, -122.41362762451172, -118.07423400878906, -113.73484802246094, -109.39545440673828, -105.05606079101562, -100.7166748046875, -96.37728881835938, -92.03789520263672, -87.6985092163086, -83.35911560058594, -79.01972961425781, -74.68033599853516, -70.3409423828125, -66.00155639648438, -61.66216278076172, -57.32277297973633, -52.98338317871094, -48.64398956298828, -44.30459976196289, -39.9652099609375, -35.625816345214844, -31.286426544189453, -26.947036743164062, -22.607646942138672, -18.26825523376465, -13.928864479064941, -9.589473724365234, -5.250083923339844, -0.9106922149658203, 3.428699493408203, 7.768089294433594, 12.1074800491333, 16.446870803833008, 20.78626251220703, 25.125652313232422, 29.465042114257812, 33.80443572998047, 38.14382553100586, 42.48321533203125]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 7.0, 12.0, 10.0, 16.0, 14.0, 15.0, 20.0, 27.0, 26.0, 25.0, 28.0, 27.0, 37.0, 33.0, 23.0, 45.0, 42.0, 34.0, 40.0, 50.0, 48.0, 42.0, 35.0, 41.0, 39.0, 28.0, 36.0, 20.0, 20.0, 23.0, 16.0, 16.0, 19.0, 17.0, 10.0, 17.0, 8.0, 15.0, 4.0, 2.0, 7.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.32453536987305, -59.222618103027344, -57.120697021484375, -55.01877975463867, -52.91686248779297, -50.81494140625, -48.7130241394043, -46.611106872558594, -44.509185791015625, -42.40726852416992, -40.30534744262695, -38.20343017578125, -36.10150909423828, -33.99959182739258, -31.897674560546875, -29.79575538635254, -27.693836212158203, -25.591917037963867, -23.48999786376953, -21.388080596923828, -19.286161422729492, -17.184242248535156, -15.082324028015137, -12.980405807495117, -10.878486633300781, -8.776567459106445, -6.674649238586426, -4.572730541229248, -2.4708118438720703, -0.3688926696777344, 1.7330255508422852, 3.8349437713623047, 5.936859130859375, 8.038778305053711, 10.14069652557373, 12.24261474609375, 14.344533920288086, 16.446453094482422, 18.548370361328125, 20.65028953552246, 22.752208709716797, 24.854127883911133, 26.95604705810547, 29.057964324951172, 31.159883499145508, 33.261802673339844, 35.36371994018555, 37.46563720703125, 39.56755828857422, 41.66947555541992, 43.77139663696289, 45.873313903808594, 47.97523498535156, 50.077152252197266, 52.17906951904297, 54.28099060058594, 56.38290786743164, 58.484825134277344, 60.58674621582031, 62.688663482666016, 64.79058074951172, 66.89250183105469, 68.99442291259766, 71.0963363647461, 73.19825744628906]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 3.0, 6.0, 9.0, 16.0, 10.0, 16.0, 15.0, 11.0, 21.0, 18.0, 27.0, 28.0, 22.0, 36.0, 40.0, 35.0, 45.0, 46.0, 41.0, 47.0, 48.0, 36.0, 40.0, 41.0, 46.0, 34.0, 41.0, 33.0, 21.0, 28.0, 19.0, 26.0, 15.0, 12.0, 20.0, 15.0, 11.0, 11.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.3486328125, -9.056640625, -8.7646484375, -8.47265625, -8.1806640625, -7.888671875, -7.5966796875, -7.3046875, -7.0126953125, -6.720703125, -6.4287109375, -6.13671875, -5.8447265625, -5.552734375, -5.2607421875, -4.96875, -4.6767578125, -4.384765625, -4.0927734375, -3.80078125, -3.5087890625, -3.216796875, -2.9248046875, -2.6328125, -2.3408203125, -2.048828125, -1.7568359375, -1.46484375, -1.1728515625, -0.880859375, -0.5888671875, -0.296875, -0.0048828125, 0.287109375, 0.5791015625, 0.87109375, 1.1630859375, 1.455078125, 1.7470703125, 2.0390625, 2.3310546875, 2.623046875, 2.9150390625, 3.20703125, 3.4990234375, 3.791015625, 4.0830078125, 4.375, 4.6669921875, 4.958984375, 5.2509765625, 5.54296875, 5.8349609375, 6.126953125, 6.4189453125, 6.7109375, 7.0029296875, 7.294921875, 7.5869140625, 7.87890625, 8.1708984375, 8.462890625, 8.7548828125, 9.046875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 0.0, 3.0, 5.0, 11.0, 9.0, 11.0, 16.0, 26.0, 25.0, 21.0, 33.0, 44.0, 60.0, 75.0, 97.0, 114.0, 148.0, 252.0, 647.0, 4448.0, 255851.0, 3531028.0, 394034.0, 5617.0, 716.0, 279.0, 150.0, 115.0, 96.0, 67.0, 62.0, 48.0, 40.0, 21.0, 20.0, 25.0, 25.0, 12.0, 6.0, 8.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.53125, -32.560546875, -31.58984375, -30.619140625, -29.6484375, -28.677734375, -27.70703125, -26.736328125, -25.765625, -24.794921875, -23.82421875, -22.853515625, -21.8828125, -20.912109375, -19.94140625, -18.970703125, -18.0, -17.029296875, -16.05859375, -15.087890625, -14.1171875, -13.146484375, -12.17578125, -11.205078125, -10.234375, -9.263671875, -8.29296875, -7.322265625, -6.3515625, -5.380859375, -4.41015625, -3.439453125, -2.46875, -1.498046875, -0.52734375, 0.443359375, 1.4140625, 2.384765625, 3.35546875, 4.326171875, 5.296875, 6.267578125, 7.23828125, 8.208984375, 9.1796875, 10.150390625, 11.12109375, 12.091796875, 13.0625, 14.033203125, 15.00390625, 15.974609375, 16.9453125, 17.916015625, 18.88671875, 19.857421875, 20.828125, 21.798828125, 22.76953125, 23.740234375, 24.7109375, 25.681640625, 26.65234375, 27.623046875, 28.59375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 8.0, 8.0, 9.0, 13.0, 16.0, 28.0, 25.0, 45.0, 57.0, 85.0, 119.0, 173.0, 244.0, 299.0, 410.0, 487.0, 458.0, 412.0, 318.0, 234.0, 182.0, 108.0, 67.0, 68.0, 50.0, 44.0, 34.0, 28.0, 13.0, 8.0, 5.0, 7.0, 7.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.046875, -13.526611328125, -13.00634765625, -12.486083984375, -11.9658203125, -11.445556640625, -10.92529296875, -10.405029296875, -9.884765625, -9.364501953125, -8.84423828125, -8.323974609375, -7.8037109375, -7.283447265625, -6.76318359375, -6.242919921875, -5.72265625, -5.202392578125, -4.68212890625, -4.161865234375, -3.6416015625, -3.121337890625, -2.60107421875, -2.080810546875, -1.560546875, -1.040283203125, -0.52001953125, 0.000244140625, 0.5205078125, 1.040771484375, 1.56103515625, 2.081298828125, 2.6015625, 3.121826171875, 3.64208984375, 4.162353515625, 4.6826171875, 5.202880859375, 5.72314453125, 6.243408203125, 6.763671875, 7.283935546875, 7.80419921875, 8.324462890625, 8.8447265625, 9.364990234375, 9.88525390625, 10.405517578125, 10.92578125, 11.446044921875, 11.96630859375, 12.486572265625, 13.0068359375, 13.527099609375, 14.04736328125, 14.567626953125, 15.087890625, 15.608154296875, 16.12841796875, 16.648681640625, 17.1689453125, 17.689208984375, 18.20947265625, 18.729736328125, 19.25]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 7.0, 6.0, 2.0, 11.0, 22.0, 26.0, 33.0, 47.0, 61.0, 82.0, 98.0, 148.0, 230.0, 344.0, 465.0, 1778.0, 542513.0, 3642333.0, 4304.0, 590.0, 362.0, 259.0, 179.0, 105.0, 89.0, 55.0, 34.0, 32.0, 22.0, 11.0, 11.0, 11.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.0625, -100.2880859375, -97.513671875, -94.7392578125, -91.96484375, -89.1904296875, -86.416015625, -83.6416015625, -80.8671875, -78.0927734375, -75.318359375, -72.5439453125, -69.76953125, -66.9951171875, -64.220703125, -61.4462890625, -58.671875, -55.8974609375, -53.123046875, -50.3486328125, -47.57421875, -44.7998046875, -42.025390625, -39.2509765625, -36.4765625, -33.7021484375, -30.927734375, -28.1533203125, -25.37890625, -22.6044921875, -19.830078125, -17.0556640625, -14.28125, -11.5068359375, -8.732421875, -5.9580078125, -3.18359375, -0.4091796875, 2.365234375, 5.1396484375, 7.9140625, 10.6884765625, 13.462890625, 16.2373046875, 19.01171875, 21.7861328125, 24.560546875, 27.3349609375, 30.109375, 32.8837890625, 35.658203125, 38.4326171875, 41.20703125, 43.9814453125, 46.755859375, 49.5302734375, 52.3046875, 55.0791015625, 57.853515625, 60.6279296875, 63.40234375, 66.1767578125, 68.951171875, 71.7255859375, 74.5]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 45.0, 154.0, 278.0, 307.0, 165.0, 46.0, 14.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.33499908447266, -89.36363983154297, -84.39227294921875, -79.42091369628906, -74.44955444335938, -69.47818756103516, -64.50682830810547, -59.535465240478516, -54.56410217285156, -49.59273910522461, -44.621376037597656, -39.65001678466797, -34.678653717041016, -29.707290649414062, -24.735929489135742, -19.764568328857422, -14.793205261230469, -9.821843147277832, -4.850481033325195, 0.1208810806274414, 5.092243194580078, 10.063606262207031, 15.034967422485352, 20.006328582763672, 24.977691650390625, 29.949054718017578, 34.92041778564453, 39.89177703857422, 44.86314010620117, 49.834503173828125, 54.80586242675781, 59.777225494384766, 64.74858093261719, 69.71994018554688, 74.6913070678711, 79.66266632080078, 84.634033203125, 89.60539245605469, 94.57675170898438, 99.54811096191406, 104.51947784423828, 109.49083709716797, 114.46220397949219, 119.43356323242188, 124.40492248535156, 129.37628173828125, 134.34765625, 139.3190155029297, 144.29037475585938, 149.26173400878906, 154.23309326171875, 159.2044677734375, 164.1758270263672, 169.14718627929688, 174.11854553222656, 179.08990478515625, 184.061279296875, 189.0326385498047, 194.00399780273438, 198.97537231445312, 203.9467315673828, 208.9180908203125, 213.8894500732422, 218.86080932617188, 223.83216857910156]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 9.0, 7.0, 5.0, 7.0, 6.0, 20.0, 11.0, 10.0, 17.0, 14.0, 18.0, 24.0, 17.0, 22.0, 18.0, 32.0, 25.0, 25.0, 29.0, 34.0, 40.0, 48.0, 41.0, 45.0, 34.0, 29.0, 35.0, 34.0, 34.0, 30.0, 32.0, 28.0, 29.0, 17.0, 21.0, 14.0, 23.0, 13.0, 18.0, 14.0, 16.0, 12.0, 6.0, 6.0, 6.0, 3.0, 4.0, 5.0, 4.0, 1.0, 4.0, 3.0, 3.0, 2.0], "bins": [-45.16847610473633, -43.82695007324219, -42.48542785644531, -41.14390182495117, -39.8023796081543, -38.460853576660156, -37.11933135986328, -35.77780532836914, -34.436279296875, -33.09475326538086, -31.753231048583984, -30.411705017089844, -29.070180892944336, -27.728656768798828, -26.38713264465332, -25.045608520507812, -23.704084396362305, -22.362560272216797, -21.02103614807129, -19.67951202392578, -18.33798599243164, -16.996461868286133, -15.654937744140625, -14.3134126663208, -12.971888542175293, -11.630364418029785, -10.288839340209961, -8.947315216064453, -7.605790615081787, -6.264266014099121, -4.922741889953613, -3.581216812133789, -2.2396926879882812, -0.8981682062149048, 0.4433562755584717, 1.7848806381225586, 3.1264052391052246, 4.467929840087891, 5.809453964233398, 7.150979042053223, 8.49250316619873, 9.834027290344238, 11.175552368164062, 12.51707649230957, 13.858600616455078, 15.200125694274902, 16.541648864746094, 17.883174896240234, 19.224699020385742, 20.56622314453125, 21.907747268676758, 23.249271392822266, 24.590797424316406, 25.932321548461914, 27.273845672607422, 28.615371704101562, 29.956893920898438, 31.298418045043945, 32.63994216918945, 33.981468200683594, 35.32299041748047, 36.66451644897461, 38.00604248046875, 39.347564697265625, 40.689090728759766]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 13.0, 6.0, 12.0, 17.0, 20.0, 17.0, 21.0, 27.0, 28.0, 19.0, 42.0, 33.0, 31.0, 35.0, 42.0, 45.0, 41.0, 52.0, 38.0, 47.0, 51.0, 32.0, 36.0, 42.0, 29.0, 33.0, 33.0, 18.0, 26.0, 17.0, 11.0, 9.0, 15.0, 12.0, 7.0, 7.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.203125, -8.9273681640625, -8.651611328125, -8.3758544921875, -8.10009765625, -7.8243408203125, -7.548583984375, -7.2728271484375, -6.9970703125, -6.7213134765625, -6.445556640625, -6.1697998046875, -5.89404296875, -5.6182861328125, -5.342529296875, -5.0667724609375, -4.791015625, -4.5152587890625, -4.239501953125, -3.9637451171875, -3.68798828125, -3.4122314453125, -3.136474609375, -2.8607177734375, -2.5849609375, -2.3092041015625, -2.033447265625, -1.7576904296875, -1.48193359375, -1.2061767578125, -0.930419921875, -0.6546630859375, -0.37890625, -0.1031494140625, 0.172607421875, 0.4483642578125, 0.72412109375, 0.9998779296875, 1.275634765625, 1.5513916015625, 1.8271484375, 2.1029052734375, 2.378662109375, 2.6544189453125, 2.93017578125, 3.2059326171875, 3.481689453125, 3.7574462890625, 4.033203125, 4.3089599609375, 4.584716796875, 4.8604736328125, 5.13623046875, 5.4119873046875, 5.687744140625, 5.9635009765625, 6.2392578125, 6.5150146484375, 6.790771484375, 7.0665283203125, 7.34228515625, 7.6180419921875, 7.893798828125, 8.1695556640625, 8.4453125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 15.0, 16.0, 22.0, 37.0, 49.0, 70.0, 128.0, 145.0, 245.0, 330.0, 510.0, 723.0, 1091.0, 1557.0, 2382.0, 3438.0, 5187.0, 7657.0, 11778.0, 17894.0, 27499.0, 43489.0, 72509.0, 135539.0, 325022.0, 165931.0, 85064.0, 49517.0, 31126.0, 20120.0, 12962.0, 8688.0, 5902.0, 3754.0, 2645.0, 1752.0, 1142.0, 862.0, 537.0, 388.0, 256.0, 180.0, 120.0, 82.0, 70.0, 37.0, 30.0, 17.0, 15.0, 10.0, 9.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.041015625, -1.974395751953125, -1.90777587890625, -1.841156005859375, -1.7745361328125, -1.707916259765625, -1.64129638671875, -1.574676513671875, -1.508056640625, -1.441436767578125, -1.37481689453125, -1.308197021484375, -1.2415771484375, -1.174957275390625, -1.10833740234375, -1.041717529296875, -0.97509765625, -0.908477783203125, -0.84185791015625, -0.775238037109375, -0.7086181640625, -0.641998291015625, -0.57537841796875, -0.508758544921875, -0.442138671875, -0.375518798828125, -0.30889892578125, -0.242279052734375, -0.1756591796875, -0.109039306640625, -0.04241943359375, 0.024200439453125, 0.0908203125, 0.157440185546875, 0.22406005859375, 0.290679931640625, 0.3572998046875, 0.423919677734375, 0.49053955078125, 0.557159423828125, 0.623779296875, 0.690399169921875, 0.75701904296875, 0.823638916015625, 0.8902587890625, 0.956878662109375, 1.02349853515625, 1.090118408203125, 1.15673828125, 1.223358154296875, 1.28997802734375, 1.356597900390625, 1.4232177734375, 1.489837646484375, 1.55645751953125, 1.623077392578125, 1.689697265625, 1.756317138671875, 1.82293701171875, 1.889556884765625, 1.9561767578125, 2.022796630859375, 2.08941650390625, 2.156036376953125, 2.22265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 2.0, 4.0, 6.0, 5.0, 9.0, 7.0, 9.0, 6.0, 8.0, 9.0, 16.0, 12.0, 21.0, 30.0, 31.0, 32.0, 31.0, 38.0, 31.0, 35.0, 41.0, 39.0, 39.0, 39.0, 1068.0, 33.0, 47.0, 37.0, 33.0, 34.0, 36.0, 28.0, 21.0, 30.0, 28.0, 25.0, 17.0, 16.0, 18.0, 11.0, 6.0, 10.0, 6.0, 6.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.90234375, -4.7349853515625, -4.567626953125, -4.4002685546875, -4.23291015625, -4.0655517578125, -3.898193359375, -3.7308349609375, -3.5634765625, -3.3961181640625, -3.228759765625, -3.0614013671875, -2.89404296875, -2.7266845703125, -2.559326171875, -2.3919677734375, -2.224609375, -2.0572509765625, -1.889892578125, -1.7225341796875, -1.55517578125, -1.3878173828125, -1.220458984375, -1.0531005859375, -0.8857421875, -0.7183837890625, -0.551025390625, -0.3836669921875, -0.21630859375, -0.0489501953125, 0.118408203125, 0.2857666015625, 0.453125, 0.6204833984375, 0.787841796875, 0.9552001953125, 1.12255859375, 1.2899169921875, 1.457275390625, 1.6246337890625, 1.7919921875, 1.9593505859375, 2.126708984375, 2.2940673828125, 2.46142578125, 2.6287841796875, 2.796142578125, 2.9635009765625, 3.130859375, 3.2982177734375, 3.465576171875, 3.6329345703125, 3.80029296875, 3.9676513671875, 4.135009765625, 4.3023681640625, 4.4697265625, 4.6370849609375, 4.804443359375, 4.9718017578125, 5.13916015625, 5.3065185546875, 5.473876953125, 5.6412353515625, 5.80859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 1.0, 5.0, 6.0, 15.0, 15.0, 36.0, 37.0, 59.0, 88.0, 135.0, 189.0, 337.0, 470.0, 700.0, 1061.0, 1492.0, 2084.0, 2997.0, 4307.0, 6451.0, 9896.0, 15150.0, 22629.0, 35182.0, 55573.0, 89561.0, 164710.0, 1352521.0, 124257.0, 73260.0, 46521.0, 29375.0, 19224.0, 12845.0, 8353.0, 5539.0, 3643.0, 2613.0, 1862.0, 1232.0, 882.0, 630.0, 421.0, 253.0, 175.0, 130.0, 85.0, 41.0, 42.0, 18.0, 11.0, 6.0, 7.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.966796875, -1.901885986328125, -1.83697509765625, -1.772064208984375, -1.7071533203125, -1.642242431640625, -1.57733154296875, -1.512420654296875, -1.447509765625, -1.382598876953125, -1.31768798828125, -1.252777099609375, -1.1878662109375, -1.122955322265625, -1.05804443359375, -0.993133544921875, -0.92822265625, -0.863311767578125, -0.79840087890625, -0.733489990234375, -0.6685791015625, -0.603668212890625, -0.53875732421875, -0.473846435546875, -0.408935546875, -0.344024658203125, -0.27911376953125, -0.214202880859375, -0.1492919921875, -0.084381103515625, -0.01947021484375, 0.045440673828125, 0.1103515625, 0.175262451171875, 0.24017333984375, 0.305084228515625, 0.3699951171875, 0.434906005859375, 0.49981689453125, 0.564727783203125, 0.629638671875, 0.694549560546875, 0.75946044921875, 0.824371337890625, 0.8892822265625, 0.954193115234375, 1.01910400390625, 1.084014892578125, 1.14892578125, 1.213836669921875, 1.27874755859375, 1.343658447265625, 1.4085693359375, 1.473480224609375, 1.53839111328125, 1.603302001953125, 1.668212890625, 1.733123779296875, 1.79803466796875, 1.862945556640625, 1.9278564453125, 1.992767333984375, 2.05767822265625, 2.122589111328125, 2.1875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 9.0, 4.0, 8.0, 13.0, 9.0, 16.0, 25.0, 30.0, 43.0, 46.0, 69.0, 78.0, 106.0, 123.0, 88.0, 72.0, 52.0, 44.0, 39.0, 33.0, 16.0, 9.0, 15.0, 10.0, 7.0, 5.0, 3.0, 11.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00041675567626953125, -0.00040387362241744995, -0.00039099156856536865, -0.00037810951471328735, -0.00036522746086120605, -0.00035234540700912476, -0.00033946335315704346, -0.00032658129930496216, -0.00031369924545288086, -0.00030081719160079956, -0.00028793513774871826, -0.00027505308389663696, -0.00026217103004455566, -0.00024928897619247437, -0.00023640692234039307, -0.00022352486848831177, -0.00021064281463623047, -0.00019776076078414917, -0.00018487870693206787, -0.00017199665307998657, -0.00015911459922790527, -0.00014623254537582397, -0.00013335049152374268, -0.00012046843767166138, -0.00010758638381958008, -9.470432996749878e-05, -8.182227611541748e-05, -6.894022226333618e-05, -5.605816841125488e-05, -4.3176114559173584e-05, -3.0294060707092285e-05, -1.7412006855010986e-05, -4.5299530029296875e-06, 8.352100849151611e-06, 2.123415470123291e-05, 3.411620855331421e-05, 4.699826240539551e-05, 5.988031625747681e-05, 7.27623701095581e-05, 8.56444239616394e-05, 9.85264778137207e-05, 0.000111408531665802, 0.0001242905855178833, 0.0001371726393699646, 0.0001500546932220459, 0.0001629367470741272, 0.0001758188009262085, 0.0001887008547782898, 0.0002015829086303711, 0.0002144649624824524, 0.0002273470163345337, 0.000240229070186615, 0.0002531111240386963, 0.0002659931778907776, 0.0002788752317428589, 0.0002917572855949402, 0.0003046393394470215, 0.0003175213932991028, 0.0003304034471511841, 0.0003432855010032654, 0.0003561675548553467, 0.000369049608707428, 0.0003819316625595093, 0.0003948137164115906, 0.0004076957702636719]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 0.0, 2.0, 7.0, 9.0, 6.0, 15.0, 12.0, 22.0, 16.0, 33.0, 45.0, 72.0, 126.0, 210.0, 456.0, 2383.0, 1038302.0, 5658.0, 553.0, 215.0, 141.0, 78.0, 44.0, 37.0, 26.0, 25.0, 17.0, 8.0, 10.0, 13.0, 2.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0091705322265625, -0.008880138397216797, -0.008589744567871094, -0.00829935073852539, -0.008008956909179688, -0.007718563079833984, -0.007428169250488281, -0.007137775421142578, -0.006847381591796875, -0.006556987762451172, -0.006266593933105469, -0.005976200103759766, -0.0056858062744140625, -0.005395412445068359, -0.005105018615722656, -0.004814624786376953, -0.00452423095703125, -0.004233837127685547, -0.003943443298339844, -0.0036530494689941406, -0.0033626556396484375, -0.0030722618103027344, -0.0027818679809570312, -0.002491474151611328, -0.002201080322265625, -0.0019106864929199219, -0.0016202926635742188, -0.0013298988342285156, -0.0010395050048828125, -0.0007491111755371094, -0.00045871734619140625, -0.00016832351684570312, 0.0001220703125, 0.0004124641418457031, 0.0007028579711914062, 0.0009932518005371094, 0.0012836456298828125, 0.0015740394592285156, 0.0018644332885742188, 0.002154827117919922, 0.002445220947265625, 0.002735614776611328, 0.0030260086059570312, 0.0033164024353027344, 0.0036067962646484375, 0.0038971900939941406, 0.004187583923339844, 0.004477977752685547, 0.00476837158203125, 0.005058765411376953, 0.005349159240722656, 0.005639553070068359, 0.0059299468994140625, 0.006220340728759766, 0.006510734558105469, 0.006801128387451172, 0.007091522216796875, 0.007381916046142578, 0.007672309875488281, 0.007962703704833984, 0.008253097534179688, 0.00854349136352539, 0.008833885192871094, 0.009124279022216797, 0.0094146728515625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 26.0, 125.0, 320.0, 349.0, 147.0, 37.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000897666672244668, -0.0008789906860329211, -0.0008603146998211741, -0.0008416387718170881, -0.0008229627856053412, -0.0008042867993935943, -0.0007856108713895082, -0.0007669348851777613, -0.0007482588989660144, -0.0007295829127542675, -0.0007109069265425205, -0.0006922309985384345, -0.0006735550123266876, -0.0006548790261149406, -0.0006362030981108546, -0.0006175271118991077, -0.0005988511256873608, -0.0005801751394756138, -0.0005614991532638669, -0.0005428232252597809, -0.000524147239048034, -0.000505471252836287, -0.00048679529572837055, -0.0004681193386204541, -0.00044944335240870714, -0.0004307673661969602, -0.00041209140908904374, -0.00039341545198112726, -0.00037473946576938033, -0.0003560634795576334, -0.0003373875224497169, -0.00031871156534180045, -0.0003000355209223926, -0.0002813595347106457, -0.0002626835776027292, -0.0002440076059428975, -0.0002253316342830658, -0.0002066556626232341, -0.0001879796909634024, -0.0001693037193035707, -0.00015062774764373899, -0.00013195177598390728, -0.00011327580432407558, -9.459983266424388e-05, -7.592386100441217e-05, -5.724788934458047e-05, -3.857191768474877e-05, -1.9895946024917066e-05, -1.2199743650853634e-06, 1.745599729474634e-05, 3.613196895457804e-05, 5.4807940614409745e-05, 7.348391227424145e-05, 9.215988393407315e-05, 0.00011083585559390485, 0.00012951182725373656, 0.00014818779891356826, 0.00016686377057339996, 0.00018553974223323166, 0.00020421571389306337, 0.00022289168555289507, 0.00024156765721272677, 0.0002602436288725585, 0.00027891958598047495, 0.0002975955721922219]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 5.0, 2.0, 3.0, 5.0, 9.0, 8.0, 10.0, 13.0, 15.0, 13.0, 14.0, 21.0, 19.0, 15.0, 21.0, 23.0, 28.0, 27.0, 24.0, 30.0, 44.0, 31.0, 32.0, 32.0, 30.0, 34.0, 38.0, 46.0, 38.0, 23.0, 39.0, 28.0, 34.0, 43.0, 28.0, 16.0, 17.0, 17.0, 20.0, 25.0, 18.0, 7.0, 10.0, 6.0, 10.0, 11.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00015294551849365234, -0.00014839600771665573, -0.00014384649693965912, -0.0001392969861626625, -0.0001347474753856659, -0.00013019796460866928, -0.00012564845383167267, -0.00012109894305467606, -0.00011654943227767944, -0.00011199992150068283, -0.00010745041072368622, -0.0001029008999466896, -9.835138916969299e-05, -9.380187839269638e-05, -8.925236761569977e-05, -8.470285683870316e-05, -8.015334606170654e-05, -7.560383528470993e-05, -7.105432450771332e-05, -6.65048137307167e-05, -6.195530295372009e-05, -5.740579217672348e-05, -5.285628139972687e-05, -4.8306770622730255e-05, -4.375725984573364e-05, -3.920774906873703e-05, -3.465823829174042e-05, -3.0108727514743805e-05, -2.5559216737747192e-05, -2.100970596075058e-05, -1.6460195183753967e-05, -1.1910684406757355e-05, -7.361173629760742e-06, -2.8116628527641296e-06, 1.737847924232483e-06, 6.2873587012290955e-06, 1.0836869478225708e-05, 1.538638025522232e-05, 1.9935891032218933e-05, 2.4485401809215546e-05, 2.9034912586212158e-05, 3.358442336320877e-05, 3.813393414020538e-05, 4.2683444917201996e-05, 4.723295569419861e-05, 5.178246647119522e-05, 5.6331977248191833e-05, 6.0881488025188446e-05, 6.543099880218506e-05, 6.998050957918167e-05, 7.453002035617828e-05, 7.90795311331749e-05, 8.362904191017151e-05, 8.817855268716812e-05, 9.272806346416473e-05, 9.727757424116135e-05, 0.00010182708501815796, 0.00010637659579515457, 0.00011092610657215118, 0.0001154756173491478, 0.00012002512812614441, 0.00012457463890314102, 0.00012912414968013763, 0.00013367366045713425, 0.00013822317123413086]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 13.0, 6.0, 12.0, 17.0, 20.0, 17.0, 21.0, 27.0, 28.0, 19.0, 42.0, 33.0, 31.0, 35.0, 42.0, 45.0, 41.0, 52.0, 38.0, 47.0, 51.0, 32.0, 36.0, 42.0, 29.0, 33.0, 33.0, 18.0, 26.0, 17.0, 11.0, 9.0, 15.0, 12.0, 7.0, 7.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.203125, -8.9273681640625, -8.651611328125, -8.3758544921875, -8.10009765625, -7.8243408203125, -7.548583984375, -7.2728271484375, -6.9970703125, -6.7213134765625, -6.445556640625, -6.1697998046875, -5.89404296875, -5.6182861328125, -5.342529296875, -5.0667724609375, -4.791015625, -4.5152587890625, -4.239501953125, -3.9637451171875, -3.68798828125, -3.4122314453125, -3.136474609375, -2.8607177734375, -2.5849609375, -2.3092041015625, -2.033447265625, -1.7576904296875, -1.48193359375, -1.2061767578125, -0.930419921875, -0.6546630859375, -0.37890625, -0.1031494140625, 0.172607421875, 0.4483642578125, 0.72412109375, 0.9998779296875, 1.275634765625, 1.5513916015625, 1.8271484375, 2.1029052734375, 2.378662109375, 2.6544189453125, 2.93017578125, 3.2059326171875, 3.481689453125, 3.7574462890625, 4.033203125, 4.3089599609375, 4.584716796875, 4.8604736328125, 5.13623046875, 5.4119873046875, 5.687744140625, 5.9635009765625, 6.2392578125, 6.5150146484375, 6.790771484375, 7.0665283203125, 7.34228515625, 7.6180419921875, 7.893798828125, 8.1695556640625, 8.4453125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 10.0, 9.0, 13.0, 16.0, 23.0, 23.0, 33.0, 45.0, 60.0, 74.0, 99.0, 141.0, 232.0, 339.0, 621.0, 1629.0, 7866.0, 56367.0, 427468.0, 477968.0, 63042.0, 8787.0, 1747.0, 703.0, 392.0, 226.0, 146.0, 99.0, 70.0, 68.0, 59.0, 28.0, 35.0, 21.0, 17.0, 11.0, 9.0, 14.0, 8.0, 3.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.125, -16.59033203125, -16.0556640625, -15.52099609375, -14.986328125, -14.45166015625, -13.9169921875, -13.38232421875, -12.84765625, -12.31298828125, -11.7783203125, -11.24365234375, -10.708984375, -10.17431640625, -9.6396484375, -9.10498046875, -8.5703125, -8.03564453125, -7.5009765625, -6.96630859375, -6.431640625, -5.89697265625, -5.3623046875, -4.82763671875, -4.29296875, -3.75830078125, -3.2236328125, -2.68896484375, -2.154296875, -1.61962890625, -1.0849609375, -0.55029296875, -0.015625, 0.51904296875, 1.0537109375, 1.58837890625, 2.123046875, 2.65771484375, 3.1923828125, 3.72705078125, 4.26171875, 4.79638671875, 5.3310546875, 5.86572265625, 6.400390625, 6.93505859375, 7.4697265625, 8.00439453125, 8.5390625, 9.07373046875, 9.6083984375, 10.14306640625, 10.677734375, 11.21240234375, 11.7470703125, 12.28173828125, 12.81640625, 13.35107421875, 13.8857421875, 14.42041015625, 14.955078125, 15.48974609375, 16.0244140625, 16.55908203125, 17.09375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 2.0, 10.0, 7.0, 8.0, 15.0, 22.0, 19.0, 14.0, 25.0, 33.0, 43.0, 40.0, 43.0, 46.0, 73.0, 141.0, 303.0, 1500.0, 163.0, 100.0, 68.0, 51.0, 47.0, 50.0, 43.0, 35.0, 24.0, 22.0, 23.0, 15.0, 17.0, 10.0, 10.0, 8.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.828125, -30.778076171875, -29.72802734375, -28.677978515625, -27.6279296875, -26.577880859375, -25.52783203125, -24.477783203125, -23.427734375, -22.377685546875, -21.32763671875, -20.277587890625, -19.2275390625, -18.177490234375, -17.12744140625, -16.077392578125, -15.02734375, -13.977294921875, -12.92724609375, -11.877197265625, -10.8271484375, -9.777099609375, -8.72705078125, -7.677001953125, -6.626953125, -5.576904296875, -4.52685546875, -3.476806640625, -2.4267578125, -1.376708984375, -0.32666015625, 0.723388671875, 1.7734375, 2.823486328125, 3.87353515625, 4.923583984375, 5.9736328125, 7.023681640625, 8.07373046875, 9.123779296875, 10.173828125, 11.223876953125, 12.27392578125, 13.323974609375, 14.3740234375, 15.424072265625, 16.47412109375, 17.524169921875, 18.57421875, 19.624267578125, 20.67431640625, 21.724365234375, 22.7744140625, 23.824462890625, 24.87451171875, 25.924560546875, 26.974609375, 28.024658203125, 29.07470703125, 30.124755859375, 31.1748046875, 32.224853515625, 33.27490234375, 34.324951171875, 35.375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 5.0, 10.0, 17.0, 14.0, 20.0, 27.0, 37.0, 39.0, 57.0, 54.0, 87.0, 122.0, 148.0, 263.0, 533.0, 1556.0, 69779.0, 3066245.0, 4782.0, 809.0, 359.0, 171.0, 144.0, 109.0, 70.0, 47.0, 36.0, 36.0, 37.0, 17.0, 17.0, 15.0, 9.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.5625, -96.271484375, -92.98046875, -89.689453125, -86.3984375, -83.107421875, -79.81640625, -76.525390625, -73.234375, -69.943359375, -66.65234375, -63.361328125, -60.0703125, -56.779296875, -53.48828125, -50.197265625, -46.90625, -43.615234375, -40.32421875, -37.033203125, -33.7421875, -30.451171875, -27.16015625, -23.869140625, -20.578125, -17.287109375, -13.99609375, -10.705078125, -7.4140625, -4.123046875, -0.83203125, 2.458984375, 5.75, 9.041015625, 12.33203125, 15.623046875, 18.9140625, 22.205078125, 25.49609375, 28.787109375, 32.078125, 35.369140625, 38.66015625, 41.951171875, 45.2421875, 48.533203125, 51.82421875, 55.115234375, 58.40625, 61.697265625, 64.98828125, 68.279296875, 71.5703125, 74.861328125, 78.15234375, 81.443359375, 84.734375, 88.025390625, 91.31640625, 94.607421875, 97.8984375, 101.189453125, 104.48046875, 107.771484375, 111.0625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 35.0, 231.0, 449.0, 254.0, 37.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-207.31723022460938, -203.58607482910156, -199.8549346923828, -196.123779296875, -192.39263916015625, -188.66148376464844, -184.93032836914062, -181.19918823242188, -177.46803283691406, -173.73687744140625, -170.0057373046875, -166.2745819091797, -162.54344177246094, -158.81228637695312, -155.08114624023438, -151.34999084472656, -147.61883544921875, -143.88768005371094, -140.1565399169922, -136.42538452148438, -132.69424438476562, -128.9630889892578, -125.23194122314453, -121.50079345703125, -117.7696533203125, -114.03850555419922, -110.30735778808594, -106.57620239257812, -102.84505462646484, -99.11390686035156, -95.38275909423828, -91.651611328125, -87.92046356201172, -84.18931579589844, -80.45816802978516, -76.72702026367188, -72.99586486816406, -69.26471710205078, -65.5335693359375, -61.80242156982422, -58.07126998901367, -54.34012222290039, -50.608970642089844, -46.87782287597656, -43.14667510986328, -39.415523529052734, -35.68437576293945, -31.95322608947754, -28.222076416015625, -24.49092674255371, -20.759777069091797, -17.028629302978516, -13.297479629516602, -9.566329956054688, -5.835182189941406, -2.104032516479492, 1.6271171569824219, 5.358266353607178, 9.089415550231934, 12.820564270019531, 16.551713943481445, 20.28286361694336, 24.01401138305664, 27.745161056518555, 31.47631072998047]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 10.0, 9.0, 7.0, 9.0, 9.0, 14.0, 15.0, 22.0, 13.0, 15.0, 26.0, 28.0, 29.0, 30.0, 50.0, 38.0, 38.0, 30.0, 45.0, 39.0, 43.0, 44.0, 35.0, 47.0, 41.0, 34.0, 33.0, 21.0, 22.0, 20.0, 27.0, 23.0, 13.0, 16.0, 16.0, 18.0, 13.0, 8.0, 11.0, 3.0, 10.0, 5.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-70.11868286132812, -67.88211059570312, -65.64554595947266, -63.408973693847656, -61.172401428222656, -58.93583297729492, -56.69926452636719, -54.46269226074219, -52.22612380981445, -49.98955535888672, -47.75298309326172, -45.516414642333984, -43.27984619140625, -41.04327392578125, -38.806705474853516, -36.57013702392578, -34.33356475830078, -32.09699630737305, -29.860424041748047, -27.623855590820312, -25.387285232543945, -23.150714874267578, -20.914146423339844, -18.677576065063477, -16.44100570678711, -14.204435348510742, -11.967865943908691, -9.73129653930664, -7.494726181030273, -5.258155822753906, -3.0215864181518555, -0.7850170135498047, 1.4515533447265625, 3.6881232261657715, 5.9246931076049805, 8.161262512207031, 10.397832870483398, 12.634403228759766, 14.870972633361816, 17.107542037963867, 19.344112396240234, 21.5806827545166, 23.81725311279297, 26.053821563720703, 28.29039192199707, 30.526962280273438, 32.76353073120117, 35.000099182128906, 37.236671447753906, 39.47323989868164, 41.70981216430664, 43.946380615234375, 46.182952880859375, 48.41952133178711, 50.656089782714844, 52.892662048339844, 55.12923049926758, 57.36579895019531, 59.60237121582031, 61.83893966674805, 64.07550811767578, 66.31208038330078, 68.54865264892578, 70.78521728515625, 73.02178955078125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 9.0, 2.0, 12.0, 5.0, 14.0, 16.0, 15.0, 20.0, 28.0, 29.0, 34.0, 31.0, 34.0, 24.0, 44.0, 38.0, 46.0, 43.0, 45.0, 49.0, 43.0, 45.0, 36.0, 45.0, 37.0, 26.0, 44.0, 31.0, 17.0, 22.0, 27.0, 16.0, 15.0, 11.0, 10.0, 8.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.3828125, -11.056884765625, -10.73095703125, -10.405029296875, -10.0791015625, -9.753173828125, -9.42724609375, -9.101318359375, -8.775390625, -8.449462890625, -8.12353515625, -7.797607421875, -7.4716796875, -7.145751953125, -6.81982421875, -6.493896484375, -6.16796875, -5.842041015625, -5.51611328125, -5.190185546875, -4.8642578125, -4.538330078125, -4.21240234375, -3.886474609375, -3.560546875, -3.234619140625, -2.90869140625, -2.582763671875, -2.2568359375, -1.930908203125, -1.60498046875, -1.279052734375, -0.953125, -0.627197265625, -0.30126953125, 0.024658203125, 0.3505859375, 0.676513671875, 1.00244140625, 1.328369140625, 1.654296875, 1.980224609375, 2.30615234375, 2.632080078125, 2.9580078125, 3.283935546875, 3.60986328125, 3.935791015625, 4.26171875, 4.587646484375, 4.91357421875, 5.239501953125, 5.5654296875, 5.891357421875, 6.21728515625, 6.543212890625, 6.869140625, 7.195068359375, 7.52099609375, 7.846923828125, 8.1728515625, 8.498779296875, 8.82470703125, 9.150634765625, 9.4765625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 6.0, 0.0, 3.0, 5.0, 5.0, 5.0, 8.0, 12.0, 18.0, 16.0, 39.0, 41.0, 34.0, 49.0, 81.0, 136.0, 194.0, 322.0, 671.0, 1701.0, 5869.0, 31521.0, 216888.0, 1028034.0, 1820825.0, 878763.0, 174801.0, 26345.0, 4984.0, 1477.0, 565.0, 278.0, 180.0, 109.0, 70.0, 42.0, 45.0, 30.0, 26.0, 21.0, 12.0, 14.0, 9.0, 6.0, 9.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.5234375, -14.089111328125, -13.65478515625, -13.220458984375, -12.7861328125, -12.351806640625, -11.91748046875, -11.483154296875, -11.048828125, -10.614501953125, -10.18017578125, -9.745849609375, -9.3115234375, -8.877197265625, -8.44287109375, -8.008544921875, -7.57421875, -7.139892578125, -6.70556640625, -6.271240234375, -5.8369140625, -5.402587890625, -4.96826171875, -4.533935546875, -4.099609375, -3.665283203125, -3.23095703125, -2.796630859375, -2.3623046875, -1.927978515625, -1.49365234375, -1.059326171875, -0.625, -0.190673828125, 0.24365234375, 0.677978515625, 1.1123046875, 1.546630859375, 1.98095703125, 2.415283203125, 2.849609375, 3.283935546875, 3.71826171875, 4.152587890625, 4.5869140625, 5.021240234375, 5.45556640625, 5.889892578125, 6.32421875, 6.758544921875, 7.19287109375, 7.627197265625, 8.0615234375, 8.495849609375, 8.93017578125, 9.364501953125, 9.798828125, 10.233154296875, 10.66748046875, 11.101806640625, 11.5361328125, 11.970458984375, 12.40478515625, 12.839111328125, 13.2734375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 4.0, 5.0, 10.0, 13.0, 20.0, 15.0, 40.0, 50.0, 54.0, 74.0, 83.0, 111.0, 150.0, 192.0, 237.0, 294.0, 332.0, 357.0, 371.0, 320.0, 270.0, 230.0, 175.0, 132.0, 104.0, 93.0, 69.0, 49.0, 59.0, 32.0, 25.0, 29.0, 16.0, 11.0, 13.0, 3.0, 7.0, 6.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.5577392578125, -15.099853515625, -14.6419677734375, -14.18408203125, -13.7261962890625, -13.268310546875, -12.8104248046875, -12.3525390625, -11.8946533203125, -11.436767578125, -10.9788818359375, -10.52099609375, -10.0631103515625, -9.605224609375, -9.1473388671875, -8.689453125, -8.2315673828125, -7.773681640625, -7.3157958984375, -6.85791015625, -6.4000244140625, -5.942138671875, -5.4842529296875, -5.0263671875, -4.5684814453125, -4.110595703125, -3.6527099609375, -3.19482421875, -2.7369384765625, -2.279052734375, -1.8211669921875, -1.36328125, -0.9053955078125, -0.447509765625, 0.0103759765625, 0.46826171875, 0.9261474609375, 1.384033203125, 1.8419189453125, 2.2998046875, 2.7576904296875, 3.215576171875, 3.6734619140625, 4.13134765625, 4.5892333984375, 5.047119140625, 5.5050048828125, 5.962890625, 6.4207763671875, 6.878662109375, 7.3365478515625, 7.79443359375, 8.2523193359375, 8.710205078125, 9.1680908203125, 9.6259765625, 10.0838623046875, 10.541748046875, 10.9996337890625, 11.45751953125, 11.9154052734375, 12.373291015625, 12.8311767578125, 13.2890625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 4.0, 5.0, 13.0, 9.0, 21.0, 17.0, 40.0, 44.0, 56.0, 82.0, 128.0, 160.0, 187.0, 248.0, 341.0, 578.0, 1151.0, 3107.0, 50424.0, 3649117.0, 477430.0, 7242.0, 1500.0, 746.0, 478.0, 298.0, 219.0, 179.0, 130.0, 89.0, 77.0, 36.0, 28.0, 29.0, 14.0, 17.0, 7.0, 8.0, 8.0, 4.0, 5.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.78125, -46.11767578125, -44.4541015625, -42.79052734375, -41.126953125, -39.46337890625, -37.7998046875, -36.13623046875, -34.47265625, -32.80908203125, -31.1455078125, -29.48193359375, -27.818359375, -26.15478515625, -24.4912109375, -22.82763671875, -21.1640625, -19.50048828125, -17.8369140625, -16.17333984375, -14.509765625, -12.84619140625, -11.1826171875, -9.51904296875, -7.85546875, -6.19189453125, -4.5283203125, -2.86474609375, -1.201171875, 0.46240234375, 2.1259765625, 3.78955078125, 5.453125, 7.11669921875, 8.7802734375, 10.44384765625, 12.107421875, 13.77099609375, 15.4345703125, 17.09814453125, 18.76171875, 20.42529296875, 22.0888671875, 23.75244140625, 25.416015625, 27.07958984375, 28.7431640625, 30.40673828125, 32.0703125, 33.73388671875, 35.3974609375, 37.06103515625, 38.724609375, 40.38818359375, 42.0517578125, 43.71533203125, 45.37890625, 47.04248046875, 48.7060546875, 50.36962890625, 52.033203125, 53.69677734375, 55.3603515625, 57.02392578125, 58.6875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 10.0, 100.0, 357.0, 383.0, 142.0, 17.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-419.21783447265625, -411.4634094238281, -403.708984375, -395.9545593261719, -388.20013427734375, -380.4457092285156, -372.6912841796875, -364.9368591308594, -357.18243408203125, -349.4280090332031, -341.673583984375, -333.9191589355469, -326.16473388671875, -318.4103088378906, -310.6558837890625, -302.9014587402344, -295.14703369140625, -287.3926086425781, -279.63818359375, -271.8837585449219, -264.12933349609375, -256.3749084472656, -248.6204833984375, -240.86605834960938, -233.1116180419922, -225.35719299316406, -217.60276794433594, -209.8483428955078, -202.0939178466797, -194.33949279785156, -186.58506774902344, -178.8306427001953, -171.07623291015625, -163.32180786132812, -155.5673828125, -147.81295776367188, -140.05853271484375, -132.30410766601562, -124.5496826171875, -116.79525756835938, -109.04081726074219, -101.28639221191406, -93.53196716308594, -85.77754211425781, -78.02311706542969, -70.26869201660156, -62.51426315307617, -54.75983810424805, -47.00541687011719, -39.25099182128906, -31.496566772460938, -23.74213981628418, -15.987714767456055, -8.233287811279297, -0.4788627624511719, 7.275562286376953, 15.029987335205078, 22.784412384033203, 30.538837432861328, 38.29326629638672, 46.047691345214844, 53.80211639404297, 61.556541442871094, 69.31096649169922, 77.06539154052734]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 12.0, 6.0, 17.0, 14.0, 14.0, 14.0, 15.0, 16.0, 26.0, 33.0, 24.0, 32.0, 27.0, 43.0, 43.0, 33.0, 49.0, 34.0, 54.0, 40.0, 43.0, 40.0, 54.0, 38.0, 35.0, 41.0, 33.0, 25.0, 24.0, 29.0, 21.0, 10.0, 15.0, 13.0, 10.0, 5.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.907901763916016, -60.98272705078125, -59.05754852294922, -57.13237380981445, -55.20719909667969, -53.282020568847656, -51.35684585571289, -49.431671142578125, -47.506492614746094, -45.58131790161133, -43.6561393737793, -41.73096466064453, -39.805789947509766, -37.880615234375, -35.95543670654297, -34.0302619934082, -32.10508728027344, -30.17991065979004, -28.254735946655273, -26.329559326171875, -24.40438461303711, -22.47920799255371, -20.554031372070312, -18.628856658935547, -16.70368003845215, -14.778504371643066, -12.853328704833984, -10.928152084350586, -9.002976417541504, -7.077800750732422, -5.152624130249023, -3.2274484634399414, -1.302276611328125, 0.6228992938995361, 2.5480751991271973, 4.4732513427734375, 6.3984270095825195, 8.323602676391602, 10.248779296875, 12.173954963684082, 14.099130630493164, 16.024307250976562, 17.949481964111328, 19.874658584594727, 21.799835205078125, 23.72500991821289, 25.65018653869629, 27.575363159179688, 29.500537872314453, 31.42571449279785, 33.35089111328125, 35.276065826416016, 37.20124053955078, 39.12641906738281, 41.05159378051758, 42.976768493652344, 44.901947021484375, 46.82712173461914, 48.75230026245117, 50.67747497558594, 52.6026496887207, 54.52782440185547, 56.4530029296875, 58.378177642822266, 60.30335235595703]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 2.0, 7.0, 6.0, 3.0, 6.0, 8.0, 10.0, 14.0, 13.0, 20.0, 19.0, 16.0, 21.0, 30.0, 39.0, 25.0, 26.0, 36.0, 34.0, 52.0, 36.0, 36.0, 41.0, 48.0, 41.0, 48.0, 38.0, 40.0, 32.0, 34.0, 28.0, 24.0, 16.0, 31.0, 21.0, 10.0, 19.0, 10.0, 10.0, 9.0, 8.0, 11.0, 5.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.2578125, -8.9742431640625, -8.690673828125, -8.4071044921875, -8.12353515625, -7.8399658203125, -7.556396484375, -7.2728271484375, -6.9892578125, -6.7056884765625, -6.422119140625, -6.1385498046875, -5.85498046875, -5.5714111328125, -5.287841796875, -5.0042724609375, -4.720703125, -4.4371337890625, -4.153564453125, -3.8699951171875, -3.58642578125, -3.3028564453125, -3.019287109375, -2.7357177734375, -2.4521484375, -2.1685791015625, -1.885009765625, -1.6014404296875, -1.31787109375, -1.0343017578125, -0.750732421875, -0.4671630859375, -0.18359375, 0.0999755859375, 0.383544921875, 0.6671142578125, 0.95068359375, 1.2342529296875, 1.517822265625, 1.8013916015625, 2.0849609375, 2.3685302734375, 2.652099609375, 2.9356689453125, 3.21923828125, 3.5028076171875, 3.786376953125, 4.0699462890625, 4.353515625, 4.6370849609375, 4.920654296875, 5.2042236328125, 5.48779296875, 5.7713623046875, 6.054931640625, 6.3385009765625, 6.6220703125, 6.9056396484375, 7.189208984375, 7.4727783203125, 7.75634765625, 8.0399169921875, 8.323486328125, 8.6070556640625, 8.890625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 13.0, 19.0, 34.0, 54.0, 77.0, 110.0, 148.0, 236.0, 371.0, 533.0, 790.0, 1111.0, 1735.0, 2508.0, 3662.0, 5402.0, 8181.0, 12209.0, 18688.0, 28710.0, 45889.0, 79457.0, 160741.0, 350838.0, 136995.0, 70458.0, 41575.0, 26564.0, 17070.0, 11171.0, 7553.0, 5098.0, 3394.0, 2283.0, 1547.0, 1093.0, 747.0, 465.0, 360.0, 215.0, 153.0, 109.0, 54.0, 42.0, 32.0, 23.0, 11.0, 9.0, 6.0, 7.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.40625, -2.329620361328125, -2.25299072265625, -2.176361083984375, -2.0997314453125, -2.023101806640625, -1.94647216796875, -1.869842529296875, -1.793212890625, -1.716583251953125, -1.63995361328125, -1.563323974609375, -1.4866943359375, -1.410064697265625, -1.33343505859375, -1.256805419921875, -1.18017578125, -1.103546142578125, -1.02691650390625, -0.950286865234375, -0.8736572265625, -0.797027587890625, -0.72039794921875, -0.643768310546875, -0.567138671875, -0.490509033203125, -0.41387939453125, -0.337249755859375, -0.2606201171875, -0.183990478515625, -0.10736083984375, -0.030731201171875, 0.0458984375, 0.122528076171875, 0.19915771484375, 0.275787353515625, 0.3524169921875, 0.429046630859375, 0.50567626953125, 0.582305908203125, 0.658935546875, 0.735565185546875, 0.81219482421875, 0.888824462890625, 0.9654541015625, 1.042083740234375, 1.11871337890625, 1.195343017578125, 1.27197265625, 1.348602294921875, 1.42523193359375, 1.501861572265625, 1.5784912109375, 1.655120849609375, 1.73175048828125, 1.808380126953125, 1.885009765625, 1.961639404296875, 2.03826904296875, 2.114898681640625, 2.1915283203125, 2.268157958984375, 2.34478759765625, 2.421417236328125, 2.498046875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 8.0, 6.0, 12.0, 9.0, 8.0, 12.0, 12.0, 17.0, 22.0, 23.0, 33.0, 28.0, 37.0, 42.0, 38.0, 29.0, 48.0, 36.0, 38.0, 1063.0, 45.0, 37.0, 51.0, 39.0, 36.0, 37.0, 41.0, 27.0, 30.0, 26.0, 28.0, 20.0, 18.0, 17.0, 14.0, 7.0, 7.0, 13.0, 3.0, 8.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-7.5859375, -7.38568115234375, -7.1854248046875, -6.98516845703125, -6.784912109375, -6.58465576171875, -6.3843994140625, -6.18414306640625, -5.98388671875, -5.78363037109375, -5.5833740234375, -5.38311767578125, -5.182861328125, -4.98260498046875, -4.7823486328125, -4.58209228515625, -4.3818359375, -4.18157958984375, -3.9813232421875, -3.78106689453125, -3.580810546875, -3.38055419921875, -3.1802978515625, -2.98004150390625, -2.77978515625, -2.57952880859375, -2.3792724609375, -2.17901611328125, -1.978759765625, -1.77850341796875, -1.5782470703125, -1.37799072265625, -1.177734375, -0.97747802734375, -0.7772216796875, -0.57696533203125, -0.376708984375, -0.17645263671875, 0.0238037109375, 0.22406005859375, 0.42431640625, 0.62457275390625, 0.8248291015625, 1.02508544921875, 1.225341796875, 1.42559814453125, 1.6258544921875, 1.82611083984375, 2.0263671875, 2.22662353515625, 2.4268798828125, 2.62713623046875, 2.827392578125, 3.02764892578125, 3.2279052734375, 3.42816162109375, 3.62841796875, 3.82867431640625, 4.0289306640625, 4.22918701171875, 4.429443359375, 4.62969970703125, 4.8299560546875, 5.03021240234375, 5.23046875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 8.0, 18.0, 25.0, 38.0, 36.0, 87.0, 117.0, 209.0, 386.0, 495.0, 983.0, 1523.0, 2383.0, 3779.0, 5832.0, 9562.0, 16053.0, 26136.0, 44414.0, 75719.0, 135693.0, 1380862.0, 170961.0, 89910.0, 52639.0, 30931.0, 18614.0, 11266.0, 6899.0, 4169.0, 2770.0, 1767.0, 1056.0, 715.0, 418.0, 235.0, 150.0, 107.0, 51.0, 40.0, 16.0, 22.0, 6.0, 16.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.85546875, -2.7706298828125, -2.685791015625, -2.6009521484375, -2.51611328125, -2.4312744140625, -2.346435546875, -2.2615966796875, -2.1767578125, -2.0919189453125, -2.007080078125, -1.9222412109375, -1.83740234375, -1.7525634765625, -1.667724609375, -1.5828857421875, -1.498046875, -1.4132080078125, -1.328369140625, -1.2435302734375, -1.15869140625, -1.0738525390625, -0.989013671875, -0.9041748046875, -0.8193359375, -0.7344970703125, -0.649658203125, -0.5648193359375, -0.47998046875, -0.3951416015625, -0.310302734375, -0.2254638671875, -0.140625, -0.0557861328125, 0.029052734375, 0.1138916015625, 0.19873046875, 0.2835693359375, 0.368408203125, 0.4532470703125, 0.5380859375, 0.6229248046875, 0.707763671875, 0.7926025390625, 0.87744140625, 0.9622802734375, 1.047119140625, 1.1319580078125, 1.216796875, 1.3016357421875, 1.386474609375, 1.4713134765625, 1.55615234375, 1.6409912109375, 1.725830078125, 1.8106689453125, 1.8955078125, 1.9803466796875, 2.065185546875, 2.1500244140625, 2.23486328125, 2.3197021484375, 2.404541015625, 2.4893798828125, 2.57421875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 0.0, 3.0, 5.0, 3.0, 5.0, 3.0, 5.0, 10.0, 13.0, 11.0, 13.0, 19.0, 23.0, 34.0, 30.0, 42.0, 51.0, 78.0, 92.0, 104.0, 109.0, 68.0, 56.0, 52.0, 31.0, 42.0, 17.0, 26.0, 12.0, 8.0, 13.0, 4.0, 5.0, 2.0, 1.0, 5.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005817413330078125, -0.0005673989653587341, -0.0005530565977096558, -0.0005387142300605774, -0.000524371862411499, -0.0005100294947624207, -0.0004956871271133423, -0.0004813447594642639, -0.00046700239181518555, -0.0004526600241661072, -0.0004383176565170288, -0.00042397528886795044, -0.00040963292121887207, -0.0003952905535697937, -0.00038094818592071533, -0.00036660581827163696, -0.0003522634506225586, -0.0003379210829734802, -0.00032357871532440186, -0.0003092363476753235, -0.0002948939800262451, -0.00028055161237716675, -0.0002662092447280884, -0.00025186687707901, -0.00023752450942993164, -0.00022318214178085327, -0.0002088397741317749, -0.00019449740648269653, -0.00018015503883361816, -0.0001658126711845398, -0.00015147030353546143, -0.00013712793588638306, -0.0001227855682373047, -0.00010844320058822632, -9.410083293914795e-05, -7.975846529006958e-05, -6.541609764099121e-05, -5.107372999191284e-05, -3.673136234283447e-05, -2.2388994693756104e-05, -8.046627044677734e-06, 6.295740604400635e-06, 2.0638108253479004e-05, 3.498047590255737e-05, 4.932284355163574e-05, 6.366521120071411e-05, 7.800757884979248e-05, 9.234994649887085e-05, 0.00010669231414794922, 0.00012103468179702759, 0.00013537704944610596, 0.00014971941709518433, 0.0001640617847442627, 0.00017840415239334106, 0.00019274652004241943, 0.0002070888876914978, 0.00022143125534057617, 0.00023577362298965454, 0.0002501159906387329, 0.0002644583582878113, 0.00027880072593688965, 0.000293143093585968, 0.0003074854612350464, 0.00032182782888412476, 0.0003361701965332031]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 6.0, 2.0, 7.0, 10.0, 15.0, 13.0, 9.0, 24.0, 39.0, 50.0, 69.0, 81.0, 139.0, 232.0, 555.0, 3203.0, 1037788.0, 4923.0, 636.0, 242.0, 137.0, 95.0, 59.0, 52.0, 40.0, 19.0, 19.0, 10.0, 19.0, 11.0, 9.0, 12.0, 6.0, 4.0, 10.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0069580078125, -0.006662487983703613, -0.0063669681549072266, -0.00607144832611084, -0.005775928497314453, -0.005480408668518066, -0.00518488883972168, -0.004889369010925293, -0.004593849182128906, -0.0042983293533325195, -0.004002809524536133, -0.003707289695739746, -0.0034117698669433594, -0.0031162500381469727, -0.002820730209350586, -0.0025252103805541992, -0.0022296905517578125, -0.0019341707229614258, -0.001638650894165039, -0.0013431310653686523, -0.0010476112365722656, -0.0007520914077758789, -0.0004565715789794922, -0.00016105175018310547, 0.00013446807861328125, 0.00042998790740966797, 0.0007255077362060547, 0.0010210275650024414, 0.0013165473937988281, 0.0016120672225952148, 0.0019075870513916016, 0.0022031068801879883, 0.002498626708984375, 0.0027941465377807617, 0.0030896663665771484, 0.003385186195373535, 0.003680706024169922, 0.003976225852966309, 0.004271745681762695, 0.004567265510559082, 0.004862785339355469, 0.0051583051681518555, 0.005453824996948242, 0.005749344825744629, 0.006044864654541016, 0.006340384483337402, 0.006635904312133789, 0.006931424140930176, 0.0072269439697265625, 0.007522463798522949, 0.007817983627319336, 0.008113503456115723, 0.00840902328491211, 0.008704543113708496, 0.009000062942504883, 0.00929558277130127, 0.009591102600097656, 0.009886622428894043, 0.01018214225769043, 0.010477662086486816, 0.010773181915283203, 0.01106870174407959, 0.011364221572875977, 0.011659741401672363, 0.01195526123046875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 20.0, 131.0, 415.0, 345.0, 83.0, 16.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0013385488418862224, -0.001314577297307551, -0.0012906056363135576, -0.0012666340917348862, -0.0012426624307408929, -0.0012186908861622214, -0.0011947192251682281, -0.0011707476805895567, -0.0011467761360108852, -0.0011228045914322138, -0.0010988329304382205, -0.001074861385859549, -0.0010508897248655558, -0.0010269181802868843, -0.0010029466357082129, -0.0009789749747142196, -0.0009550033137202263, -0.0009310317109338939, -0.0009070601081475616, -0.0008830885635688901, -0.0008591169607825577, -0.0008351453579962254, -0.000811173755209893, -0.0007872021524235606, -0.0007632306078448892, -0.0007392590050585568, -0.0007152874022722244, -0.000691315857693553, -0.0006673442549072206, -0.0006433726521208882, -0.0006194010493345559, -0.0005954294465482235, -0.0005714578437618911, -0.0005474862409755588, -0.0005235146381892264, -0.000499543035402894, -0.0004755714617203921, -0.0004515998880378902, -0.0004276282852515578, -0.00040365668246522546, -0.00037968510878272355, -0.0003557135059963912, -0.00033174193231388927, -0.0003077703295275569, -0.00028379872674122453, -0.00025982712395489216, -0.00023585555027239025, -0.00021188394748605788, -0.00018791235925164074, -0.0001639407710172236, -0.00013996916823089123, -0.00011599757999647409, -9.202598448609933e-05, -6.805438897572458e-05, -4.408280074130744e-05, -2.011119795497507e-05, 3.860390279442072e-06, 2.7831983970827423e-05, 5.1803577662212774e-05, 7.577516953460872e-05, 9.974676504498348e-05, 0.00012371836055535823, 0.00014768994878977537, 0.00017166155157610774, 0.00019563313981052488]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 14.0, 3.0, 11.0, 9.0, 7.0, 10.0, 19.0, 12.0, 14.0, 23.0, 23.0, 34.0, 36.0, 42.0, 31.0, 32.0, 45.0, 43.0, 47.0, 43.0, 42.0, 40.0, 44.0, 38.0, 39.0, 25.0, 38.0, 25.0, 28.0, 32.0, 24.0, 22.0, 17.0, 21.0, 14.0, 14.0, 10.0, 6.0, 3.0, 7.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017088651657104492, -0.000164874829351902, -0.0001588631421327591, -0.00015285145491361618, -0.00014683976769447327, -0.00014082808047533035, -0.00013481639325618744, -0.00012880470603704453, -0.0001227930188179016, -0.0001167813315987587, -0.00011076964437961578, -0.00010475795716047287, -9.874626994132996e-05, -9.273458272218704e-05, -8.672289550304413e-05, -8.071120828390121e-05, -7.46995210647583e-05, -6.868783384561539e-05, -6.267614662647247e-05, -5.666445940732956e-05, -5.0652772188186646e-05, -4.464108496904373e-05, -3.862939774990082e-05, -3.2617710530757904e-05, -2.660602331161499e-05, -2.0594336092472076e-05, -1.4582648873329163e-05, -8.570961654186249e-06, -2.559274435043335e-06, 3.452412784099579e-06, 9.464100003242493e-06, 1.5475787222385406e-05, 2.148747444152832e-05, 2.7499161660671234e-05, 3.351084887981415e-05, 3.952253609895706e-05, 4.5534223318099976e-05, 5.154591053724289e-05, 5.75575977563858e-05, 6.356928497552872e-05, 6.958097219467163e-05, 7.559265941381454e-05, 8.160434663295746e-05, 8.761603385210037e-05, 9.362772107124329e-05, 9.96394082903862e-05, 0.00010565109550952911, 0.00011166278272867203, 0.00011767446994781494, 0.00012368615716695786, 0.00012969784438610077, 0.00013570953160524368, 0.0001417212188243866, 0.0001477329060435295, 0.00015374459326267242, 0.00015975628048181534, 0.00016576796770095825, 0.00017177965492010117, 0.00017779134213924408, 0.000183803029358387, 0.0001898147165775299, 0.00019582640379667282, 0.00020183809101581573, 0.00020784977823495865, 0.00021386146545410156]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 2.0, 7.0, 6.0, 3.0, 6.0, 8.0, 10.0, 14.0, 13.0, 20.0, 19.0, 16.0, 21.0, 30.0, 39.0, 25.0, 26.0, 36.0, 34.0, 51.0, 37.0, 36.0, 41.0, 48.0, 41.0, 48.0, 38.0, 40.0, 32.0, 34.0, 28.0, 24.0, 16.0, 31.0, 21.0, 10.0, 19.0, 10.0, 10.0, 9.0, 8.0, 11.0, 5.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.2578125, -8.9742431640625, -8.690673828125, -8.4071044921875, -8.12353515625, -7.8399658203125, -7.556396484375, -7.2728271484375, -6.9892578125, -6.7056884765625, -6.422119140625, -6.1385498046875, -5.85498046875, -5.5714111328125, -5.287841796875, -5.0042724609375, -4.720703125, -4.4371337890625, -4.153564453125, -3.8699951171875, -3.58642578125, -3.3028564453125, -3.019287109375, -2.7357177734375, -2.4521484375, -2.1685791015625, -1.885009765625, -1.6014404296875, -1.31787109375, -1.0343017578125, -0.750732421875, -0.4671630859375, -0.18359375, 0.0999755859375, 0.383544921875, 0.6671142578125, 0.95068359375, 1.2342529296875, 1.517822265625, 1.8013916015625, 2.0849609375, 2.3685302734375, 2.652099609375, 2.9356689453125, 3.21923828125, 3.5028076171875, 3.786376953125, 4.0699462890625, 4.353515625, 4.6370849609375, 4.920654296875, 5.2042236328125, 5.48779296875, 5.7713623046875, 6.054931640625, 6.3385009765625, 6.6220703125, 6.9056396484375, 7.189208984375, 7.4727783203125, 7.75634765625, 8.0399169921875, 8.323486328125, 8.6070556640625, 8.890625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 6.0, 6.0, 5.0, 11.0, 8.0, 14.0, 21.0, 22.0, 29.0, 38.0, 71.0, 110.0, 173.0, 305.0, 606.0, 1342.0, 3000.0, 6792.0, 16251.0, 39755.0, 108605.0, 278324.0, 338920.0, 158355.0, 56665.0, 22259.0, 9273.0, 3959.0, 1782.0, 806.0, 413.0, 208.0, 128.0, 73.0, 55.0, 34.0, 31.0, 21.0, 14.0, 7.0, 11.0, 9.0, 10.0, 6.0, 6.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6640625, -9.36376953125, -9.0634765625, -8.76318359375, -8.462890625, -8.16259765625, -7.8623046875, -7.56201171875, -7.26171875, -6.96142578125, -6.6611328125, -6.36083984375, -6.060546875, -5.76025390625, -5.4599609375, -5.15966796875, -4.859375, -4.55908203125, -4.2587890625, -3.95849609375, -3.658203125, -3.35791015625, -3.0576171875, -2.75732421875, -2.45703125, -2.15673828125, -1.8564453125, -1.55615234375, -1.255859375, -0.95556640625, -0.6552734375, -0.35498046875, -0.0546875, 0.24560546875, 0.5458984375, 0.84619140625, 1.146484375, 1.44677734375, 1.7470703125, 2.04736328125, 2.34765625, 2.64794921875, 2.9482421875, 3.24853515625, 3.548828125, 3.84912109375, 4.1494140625, 4.44970703125, 4.75, 5.05029296875, 5.3505859375, 5.65087890625, 5.951171875, 6.25146484375, 6.5517578125, 6.85205078125, 7.15234375, 7.45263671875, 7.7529296875, 8.05322265625, 8.353515625, 8.65380859375, 8.9541015625, 9.25439453125, 9.5546875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 6.0, 8.0, 13.0, 13.0, 11.0, 14.0, 20.0, 33.0, 22.0, 32.0, 34.0, 41.0, 51.0, 42.0, 56.0, 79.0, 195.0, 1464.0, 344.0, 126.0, 64.0, 47.0, 44.0, 42.0, 34.0, 36.0, 27.0, 22.0, 18.0, 17.0, 15.0, 14.0, 8.0, 17.0, 9.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.625, -25.59423828125, -24.5634765625, -23.53271484375, -22.501953125, -21.47119140625, -20.4404296875, -19.40966796875, -18.37890625, -17.34814453125, -16.3173828125, -15.28662109375, -14.255859375, -13.22509765625, -12.1943359375, -11.16357421875, -10.1328125, -9.10205078125, -8.0712890625, -7.04052734375, -6.009765625, -4.97900390625, -3.9482421875, -2.91748046875, -1.88671875, -0.85595703125, 0.1748046875, 1.20556640625, 2.236328125, 3.26708984375, 4.2978515625, 5.32861328125, 6.359375, 7.39013671875, 8.4208984375, 9.45166015625, 10.482421875, 11.51318359375, 12.5439453125, 13.57470703125, 14.60546875, 15.63623046875, 16.6669921875, 17.69775390625, 18.728515625, 19.75927734375, 20.7900390625, 21.82080078125, 22.8515625, 23.88232421875, 24.9130859375, 25.94384765625, 26.974609375, 28.00537109375, 29.0361328125, 30.06689453125, 31.09765625, 32.12841796875, 33.1591796875, 34.18994140625, 35.220703125, 36.25146484375, 37.2822265625, 38.31298828125, 39.34375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 4.0, 1.0, 11.0, 13.0, 13.0, 20.0, 37.0, 47.0, 61.0, 77.0, 100.0, 189.0, 306.0, 570.0, 1493.0, 46130.0, 3076402.0, 17629.0, 1170.0, 529.0, 273.0, 198.0, 130.0, 66.0, 49.0, 44.0, 28.0, 22.0, 21.0, 10.0, 9.0, 11.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.125, -69.6728515625, -67.220703125, -64.7685546875, -62.31640625, -59.8642578125, -57.412109375, -54.9599609375, -52.5078125, -50.0556640625, -47.603515625, -45.1513671875, -42.69921875, -40.2470703125, -37.794921875, -35.3427734375, -32.890625, -30.4384765625, -27.986328125, -25.5341796875, -23.08203125, -20.6298828125, -18.177734375, -15.7255859375, -13.2734375, -10.8212890625, -8.369140625, -5.9169921875, -3.46484375, -1.0126953125, 1.439453125, 3.8916015625, 6.34375, 8.7958984375, 11.248046875, 13.7001953125, 16.15234375, 18.6044921875, 21.056640625, 23.5087890625, 25.9609375, 28.4130859375, 30.865234375, 33.3173828125, 35.76953125, 38.2216796875, 40.673828125, 43.1259765625, 45.578125, 48.0302734375, 50.482421875, 52.9345703125, 55.38671875, 57.8388671875, 60.291015625, 62.7431640625, 65.1953125, 67.6474609375, 70.099609375, 72.5517578125, 75.00390625, 77.4560546875, 79.908203125, 82.3603515625, 84.8125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 167.0, 541.0, 272.0, 31.0, 1.0, 0.0, 1.0], "bins": [-321.1007385253906, -315.61968994140625, -310.1386413574219, -304.6575927734375, -299.1765441894531, -293.69549560546875, -288.21441650390625, -282.7333679199219, -277.2523193359375, -271.7712707519531, -266.29022216796875, -260.8091735839844, -255.32810974121094, -249.84706115722656, -244.3660125732422, -238.8849639892578, -233.40391540527344, -227.92286682128906, -222.4418182373047, -216.96075439453125, -211.47970581054688, -205.9986572265625, -200.51760864257812, -195.03656005859375, -189.55551147460938, -184.074462890625, -178.59341430664062, -173.11236572265625, -167.6313018798828, -162.15025329589844, -156.66920471191406, -151.1881561279297, -145.7071075439453, -140.22605895996094, -134.74501037597656, -129.26394653320312, -123.78289794921875, -118.30184936523438, -112.82080078125, -107.33975219726562, -101.85868835449219, -96.37763977050781, -90.8965835571289, -85.41553497314453, -79.93447875976562, -74.45343017578125, -68.97238159179688, -63.491329193115234, -58.010276794433594, -52.52922439575195, -47.04817199707031, -41.56712341308594, -36.0860710144043, -30.605018615722656, -25.12397003173828, -19.64291763305664, -14.161867141723633, -8.680815696716309, -3.1997642517089844, 2.2812862396240234, 7.762338638305664, 13.243391036987305, 18.72443962097168, 24.20549201965332, 29.68654441833496]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 4.0, 8.0, 10.0, 13.0, 10.0, 17.0, 20.0, 20.0, 17.0, 22.0, 29.0, 26.0, 32.0, 34.0, 46.0, 40.0, 36.0, 49.0, 50.0, 42.0, 46.0, 38.0, 40.0, 46.0, 31.0, 33.0, 37.0, 32.0, 29.0, 31.0, 16.0, 21.0, 12.0, 13.0, 7.0, 15.0, 7.0, 6.0, 7.0, 1.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.52777099609375, -76.05451965332031, -73.5812759399414, -71.10802459716797, -68.63477325439453, -66.16152954101562, -63.68827819824219, -61.21502685546875, -58.74177932739258, -56.268531799316406, -53.79528045654297, -51.3220329284668, -48.848785400390625, -46.37553405761719, -43.902286529541016, -41.429039001464844, -38.955787658691406, -36.482540130615234, -34.0092887878418, -31.536041259765625, -29.06279182434082, -26.589542388916016, -24.116294860839844, -21.64304542541504, -19.169795989990234, -16.69654655456543, -14.223298072814941, -11.750049591064453, -9.276800155639648, -6.803550720214844, -4.3303022384643555, -1.8570537567138672, 0.6162033081054688, 3.0894522666931152, 5.562701225280762, 8.03594970703125, 10.509199142456055, 12.98244857788086, 15.455697059631348, 17.928945541381836, 20.40219497680664, 22.875444412231445, 25.34869384765625, 27.821941375732422, 30.295190811157227, 32.76844024658203, 35.2416877746582, 37.714935302734375, 40.18818664550781, 42.661434173583984, 45.13468551635742, 47.607933044433594, 50.08118438720703, 52.5544319152832, 55.027679443359375, 57.50093078613281, 59.974178314208984, 62.447425842285156, 64.9206771850586, 67.39392852783203, 69.86717224121094, 72.34042358398438, 74.81367492675781, 77.28691864013672, 79.76016998291016]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 6.0, 1.0, 10.0, 5.0, 8.0, 8.0, 9.0, 9.0, 22.0, 29.0, 25.0, 27.0, 37.0, 28.0, 30.0, 41.0, 33.0, 35.0, 38.0, 53.0, 47.0, 50.0, 55.0, 49.0, 29.0, 51.0, 26.0, 34.0, 39.0, 26.0, 20.0, 16.0, 22.0, 21.0, 11.0, 12.0, 9.0, 4.0, 10.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.7734375, -11.4420166015625, -11.110595703125, -10.7791748046875, -10.44775390625, -10.1163330078125, -9.784912109375, -9.4534912109375, -9.1220703125, -8.7906494140625, -8.459228515625, -8.1278076171875, -7.79638671875, -7.4649658203125, -7.133544921875, -6.8021240234375, -6.470703125, -6.1392822265625, -5.807861328125, -5.4764404296875, -5.14501953125, -4.8135986328125, -4.482177734375, -4.1507568359375, -3.8193359375, -3.4879150390625, -3.156494140625, -2.8250732421875, -2.49365234375, -2.1622314453125, -1.830810546875, -1.4993896484375, -1.16796875, -0.8365478515625, -0.505126953125, -0.1737060546875, 0.15771484375, 0.4891357421875, 0.820556640625, 1.1519775390625, 1.4833984375, 1.8148193359375, 2.146240234375, 2.4776611328125, 2.80908203125, 3.1405029296875, 3.471923828125, 3.8033447265625, 4.134765625, 4.4661865234375, 4.797607421875, 5.1290283203125, 5.46044921875, 5.7918701171875, 6.123291015625, 6.4547119140625, 6.7861328125, 7.1175537109375, 7.448974609375, 7.7803955078125, 8.11181640625, 8.4432373046875, 8.774658203125, 9.1060791015625, 9.4375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 4.0, 11.0, 9.0, 11.0, 17.0, 23.0, 19.0, 32.0, 43.0, 48.0, 53.0, 77.0, 107.0, 184.0, 491.0, 2618.0, 112151.0, 3353088.0, 715365.0, 8364.0, 775.0, 246.0, 126.0, 86.0, 75.0, 47.0, 38.0, 22.0, 32.0, 14.0, 17.0, 20.0, 17.0, 12.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.90625, -38.788330078125, -37.67041015625, -36.552490234375, -35.4345703125, -34.316650390625, -33.19873046875, -32.080810546875, -30.962890625, -29.844970703125, -28.72705078125, -27.609130859375, -26.4912109375, -25.373291015625, -24.25537109375, -23.137451171875, -22.01953125, -20.901611328125, -19.78369140625, -18.665771484375, -17.5478515625, -16.429931640625, -15.31201171875, -14.194091796875, -13.076171875, -11.958251953125, -10.84033203125, -9.722412109375, -8.6044921875, -7.486572265625, -6.36865234375, -5.250732421875, -4.1328125, -3.014892578125, -1.89697265625, -0.779052734375, 0.3388671875, 1.456787109375, 2.57470703125, 3.692626953125, 4.810546875, 5.928466796875, 7.04638671875, 8.164306640625, 9.2822265625, 10.400146484375, 11.51806640625, 12.635986328125, 13.75390625, 14.871826171875, 15.98974609375, 17.107666015625, 18.2255859375, 19.343505859375, 20.46142578125, 21.579345703125, 22.697265625, 23.815185546875, 24.93310546875, 26.051025390625, 27.1689453125, 28.286865234375, 29.40478515625, 30.522705078125, 31.640625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 10.0, 14.0, 19.0, 34.0, 33.0, 39.0, 56.0, 60.0, 103.0, 150.0, 185.0, 251.0, 336.0, 398.0, 445.0, 426.0, 374.0, 306.0, 226.0, 168.0, 96.0, 83.0, 67.0, 42.0, 33.0, 30.0, 21.0, 19.0, 14.0, 5.0, 5.0, 4.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.328125, -13.81298828125, -13.2978515625, -12.78271484375, -12.267578125, -11.75244140625, -11.2373046875, -10.72216796875, -10.20703125, -9.69189453125, -9.1767578125, -8.66162109375, -8.146484375, -7.63134765625, -7.1162109375, -6.60107421875, -6.0859375, -5.57080078125, -5.0556640625, -4.54052734375, -4.025390625, -3.51025390625, -2.9951171875, -2.47998046875, -1.96484375, -1.44970703125, -0.9345703125, -0.41943359375, 0.095703125, 0.61083984375, 1.1259765625, 1.64111328125, 2.15625, 2.67138671875, 3.1865234375, 3.70166015625, 4.216796875, 4.73193359375, 5.2470703125, 5.76220703125, 6.27734375, 6.79248046875, 7.3076171875, 7.82275390625, 8.337890625, 8.85302734375, 9.3681640625, 9.88330078125, 10.3984375, 10.91357421875, 11.4287109375, 11.94384765625, 12.458984375, 12.97412109375, 13.4892578125, 14.00439453125, 14.51953125, 15.03466796875, 15.5498046875, 16.06494140625, 16.580078125, 17.09521484375, 17.6103515625, 18.12548828125, 18.640625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 10.0, 11.0, 18.0, 29.0, 30.0, 45.0, 59.0, 81.0, 100.0, 130.0, 168.0, 245.0, 380.0, 791.0, 3288.0, 92024.0, 3821248.0, 267360.0, 5696.0, 1016.0, 452.0, 306.0, 200.0, 144.0, 115.0, 73.0, 75.0, 49.0, 43.0, 27.0, 21.0, 11.0, 14.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-65.625, -63.83251953125, -62.0400390625, -60.24755859375, -58.455078125, -56.66259765625, -54.8701171875, -53.07763671875, -51.28515625, -49.49267578125, -47.7001953125, -45.90771484375, -44.115234375, -42.32275390625, -40.5302734375, -38.73779296875, -36.9453125, -35.15283203125, -33.3603515625, -31.56787109375, -29.775390625, -27.98291015625, -26.1904296875, -24.39794921875, -22.60546875, -20.81298828125, -19.0205078125, -17.22802734375, -15.435546875, -13.64306640625, -11.8505859375, -10.05810546875, -8.265625, -6.47314453125, -4.6806640625, -2.88818359375, -1.095703125, 0.69677734375, 2.4892578125, 4.28173828125, 6.07421875, 7.86669921875, 9.6591796875, 11.45166015625, 13.244140625, 15.03662109375, 16.8291015625, 18.62158203125, 20.4140625, 22.20654296875, 23.9990234375, 25.79150390625, 27.583984375, 29.37646484375, 31.1689453125, 32.96142578125, 34.75390625, 36.54638671875, 38.3388671875, 40.13134765625, 41.923828125, 43.71630859375, 45.5087890625, 47.30126953125, 49.09375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 15.0, 398.0, 559.0, 43.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.58255004882812, -184.50808715820312, -170.43362426757812, -156.35914611816406, -142.28468322753906, -128.21022033691406, -114.13574981689453, -100.061279296875, -85.98681640625, -71.912353515625, -57.83788299560547, -43.7634162902832, -29.688949584960938, -15.614486694335938, -1.5400161743164062, 12.534454345703125, 26.608917236328125, 40.68338394165039, 54.757850646972656, 68.83232116699219, 82.90678405761719, 96.98124694824219, 111.05571746826172, 125.13018798828125, 139.20465087890625, 153.27911376953125, 167.35357666015625, 181.4280548095703, 195.5025177001953, 209.5769805908203, 223.65145874023438, 237.72592163085938, 251.8004150390625, 265.8748779296875, 279.9493408203125, 294.0238037109375, 308.0982666015625, 322.1727294921875, 336.2472229003906, 350.3216857910156, 364.3961486816406, 378.4706115722656, 392.5450744628906, 406.6195373535156, 420.69403076171875, 434.76849365234375, 448.84295654296875, 462.91741943359375, 476.99188232421875, 491.06634521484375, 505.14080810546875, 519.2152709960938, 533.2897338867188, 547.3641967773438, 561.4386596679688, 575.51318359375, 589.587646484375, 603.662109375, 617.736572265625, 631.81103515625, 645.885498046875, 659.9599609375, 674.034423828125, 688.10888671875, 702.183349609375]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 13.0, 8.0, 8.0, 12.0, 17.0, 4.0, 31.0, 20.0, 29.0, 32.0, 26.0, 34.0, 23.0, 49.0, 40.0, 40.0, 38.0, 37.0, 42.0, 31.0, 38.0, 40.0, 42.0, 36.0, 38.0, 29.0, 28.0, 23.0, 29.0, 14.0, 20.0, 19.0, 22.0, 14.0, 10.0, 12.0, 8.0, 7.0, 4.0, 3.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-61.49842834472656, -59.76128005981445, -58.024131774902344, -56.28697967529297, -54.54983139038086, -52.81268310546875, -51.075531005859375, -49.338382720947266, -47.601234436035156, -45.86408615112305, -44.12693786621094, -42.38978576660156, -40.65263748168945, -38.915489196777344, -37.17833709716797, -35.44118881225586, -33.70404052734375, -31.96689224243164, -30.2297420501709, -28.492591857910156, -26.755443572998047, -25.018295288085938, -23.281145095825195, -21.543994903564453, -19.806846618652344, -18.069698333740234, -16.332548141479492, -14.595398902893066, -12.85824966430664, -11.121100425720215, -9.383951187133789, -7.646801948547363, -5.9096527099609375, -4.172503471374512, -2.435354232788086, -0.6982049942016602, 1.0389442443847656, 2.7760934829711914, 4.513242721557617, 6.250391960144043, 7.987541198730469, 9.724690437316895, 11.46183967590332, 13.198988914489746, 14.936138153076172, 16.67328643798828, 18.410436630249023, 20.147586822509766, 21.884735107421875, 23.621883392333984, 25.359033584594727, 27.09618377685547, 28.833332061767578, 30.570480346679688, 32.30763244628906, 34.04478073120117, 35.78192901611328, 37.51907730102539, 39.2562255859375, 40.993377685546875, 42.730525970458984, 44.467674255371094, 46.20482635498047, 47.94197463989258, 49.67912292480469]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 8.0, 4.0, 13.0, 9.0, 7.0, 10.0, 13.0, 14.0, 8.0, 23.0, 22.0, 22.0, 21.0, 34.0, 27.0, 27.0, 47.0, 38.0, 43.0, 47.0, 44.0, 48.0, 38.0, 47.0, 37.0, 30.0, 35.0, 41.0, 19.0, 16.0, 19.0, 17.0, 27.0, 21.0, 20.0, 21.0, 13.0, 17.0, 11.0, 10.0, 7.0, 2.0, 5.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.7421875, -9.4517822265625, -9.161376953125, -8.8709716796875, -8.58056640625, -8.2901611328125, -7.999755859375, -7.7093505859375, -7.4189453125, -7.1285400390625, -6.838134765625, -6.5477294921875, -6.25732421875, -5.9669189453125, -5.676513671875, -5.3861083984375, -5.095703125, -4.8052978515625, -4.514892578125, -4.2244873046875, -3.93408203125, -3.6436767578125, -3.353271484375, -3.0628662109375, -2.7724609375, -2.4820556640625, -2.191650390625, -1.9012451171875, -1.61083984375, -1.3204345703125, -1.030029296875, -0.7396240234375, -0.44921875, -0.1588134765625, 0.131591796875, 0.4219970703125, 0.71240234375, 1.0028076171875, 1.293212890625, 1.5836181640625, 1.8740234375, 2.1644287109375, 2.454833984375, 2.7452392578125, 3.03564453125, 3.3260498046875, 3.616455078125, 3.9068603515625, 4.197265625, 4.4876708984375, 4.778076171875, 5.0684814453125, 5.35888671875, 5.6492919921875, 5.939697265625, 6.2301025390625, 6.5205078125, 6.8109130859375, 7.101318359375, 7.3917236328125, 7.68212890625, 7.9725341796875, 8.262939453125, 8.5533447265625, 8.84375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 12.0, 20.0, 24.0, 41.0, 53.0, 81.0, 122.0, 159.0, 261.0, 385.0, 546.0, 801.0, 1178.0, 1772.0, 2585.0, 3792.0, 5564.0, 8008.0, 11931.0, 18008.0, 28078.0, 44066.0, 75438.0, 148394.0, 341698.0, 150534.0, 76026.0, 45186.0, 27730.0, 18419.0, 12296.0, 8197.0, 5484.0, 3672.0, 2539.0, 1719.0, 1179.0, 844.0, 525.0, 367.0, 265.0, 175.0, 118.0, 93.0, 52.0, 42.0, 24.0, 19.0, 14.0, 5.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.478515625, -2.39727783203125, -2.3160400390625, -2.23480224609375, -2.153564453125, -2.07232666015625, -1.9910888671875, -1.90985107421875, -1.82861328125, -1.74737548828125, -1.6661376953125, -1.58489990234375, -1.503662109375, -1.42242431640625, -1.3411865234375, -1.25994873046875, -1.1787109375, -1.09747314453125, -1.0162353515625, -0.93499755859375, -0.853759765625, -0.77252197265625, -0.6912841796875, -0.61004638671875, -0.52880859375, -0.44757080078125, -0.3663330078125, -0.28509521484375, -0.203857421875, -0.12261962890625, -0.0413818359375, 0.03985595703125, 0.12109375, 0.20233154296875, 0.2835693359375, 0.36480712890625, 0.446044921875, 0.52728271484375, 0.6085205078125, 0.68975830078125, 0.77099609375, 0.85223388671875, 0.9334716796875, 1.01470947265625, 1.095947265625, 1.17718505859375, 1.2584228515625, 1.33966064453125, 1.4208984375, 1.50213623046875, 1.5833740234375, 1.66461181640625, 1.745849609375, 1.82708740234375, 1.9083251953125, 1.98956298828125, 2.07080078125, 2.15203857421875, 2.2332763671875, 2.31451416015625, 2.395751953125, 2.47698974609375, 2.5582275390625, 2.63946533203125, 2.720703125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 6.0, 9.0, 13.0, 15.0, 19.0, 20.0, 19.0, 17.0, 21.0, 23.0, 34.0, 32.0, 33.0, 44.0, 40.0, 42.0, 37.0, 1065.0, 42.0, 35.0, 38.0, 36.0, 39.0, 35.0, 33.0, 29.0, 36.0, 19.0, 29.0, 15.0, 19.0, 21.0, 12.0, 25.0, 9.0, 12.0, 4.0, 6.0, 5.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.35546875, -6.1617431640625, -5.968017578125, -5.7742919921875, -5.58056640625, -5.3868408203125, -5.193115234375, -4.9993896484375, -4.8056640625, -4.6119384765625, -4.418212890625, -4.2244873046875, -4.03076171875, -3.8370361328125, -3.643310546875, -3.4495849609375, -3.255859375, -3.0621337890625, -2.868408203125, -2.6746826171875, -2.48095703125, -2.2872314453125, -2.093505859375, -1.8997802734375, -1.7060546875, -1.5123291015625, -1.318603515625, -1.1248779296875, -0.93115234375, -0.7374267578125, -0.543701171875, -0.3499755859375, -0.15625, 0.0374755859375, 0.231201171875, 0.4249267578125, 0.61865234375, 0.8123779296875, 1.006103515625, 1.1998291015625, 1.3935546875, 1.5872802734375, 1.781005859375, 1.9747314453125, 2.16845703125, 2.3621826171875, 2.555908203125, 2.7496337890625, 2.943359375, 3.1370849609375, 3.330810546875, 3.5245361328125, 3.71826171875, 3.9119873046875, 4.105712890625, 4.2994384765625, 4.4931640625, 4.6868896484375, 4.880615234375, 5.0743408203125, 5.26806640625, 5.4617919921875, 5.655517578125, 5.8492431640625, 6.04296875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 23.0, 20.0, 35.0, 51.0, 80.0, 134.0, 159.0, 254.0, 396.0, 484.0, 717.0, 1024.0, 1357.0, 2008.0, 3065.0, 4274.0, 6316.0, 9050.0, 12939.0, 19476.0, 29911.0, 45072.0, 71422.0, 120017.0, 1340146.0, 168201.0, 91295.0, 56948.0, 36805.0, 24396.0, 15891.0, 10674.0, 7471.0, 5394.0, 3577.0, 2390.0, 1715.0, 1129.0, 834.0, 588.0, 419.0, 317.0, 210.0, 128.0, 105.0, 73.0, 56.0, 23.0, 19.0, 14.0, 8.0, 10.0, 1.0, 2.0, 3.0, 1.0], "bins": [-2.384765625, -2.31195068359375, -2.2391357421875, -2.16632080078125, -2.093505859375, -2.02069091796875, -1.9478759765625, -1.87506103515625, -1.80224609375, -1.72943115234375, -1.6566162109375, -1.58380126953125, -1.510986328125, -1.43817138671875, -1.3653564453125, -1.29254150390625, -1.2197265625, -1.14691162109375, -1.0740966796875, -1.00128173828125, -0.928466796875, -0.85565185546875, -0.7828369140625, -0.71002197265625, -0.63720703125, -0.56439208984375, -0.4915771484375, -0.41876220703125, -0.345947265625, -0.27313232421875, -0.2003173828125, -0.12750244140625, -0.0546875, 0.01812744140625, 0.0909423828125, 0.16375732421875, 0.236572265625, 0.30938720703125, 0.3822021484375, 0.45501708984375, 0.52783203125, 0.60064697265625, 0.6734619140625, 0.74627685546875, 0.819091796875, 0.89190673828125, 0.9647216796875, 1.03753662109375, 1.1103515625, 1.18316650390625, 1.2559814453125, 1.32879638671875, 1.401611328125, 1.47442626953125, 1.5472412109375, 1.62005615234375, 1.69287109375, 1.76568603515625, 1.8385009765625, 1.91131591796875, 1.984130859375, 2.05694580078125, 2.1297607421875, 2.20257568359375, 2.275390625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 10.0, 6.0, 24.0, 16.0, 41.0, 49.0, 66.0, 104.0, 112.0, 109.0, 110.0, 100.0, 64.0, 59.0, 34.0, 38.0, 16.0, 12.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0010042190551757812, -0.000978916883468628, -0.0009536147117614746, -0.0009283125400543213, -0.000903010368347168, -0.0008777081966400146, -0.0008524060249328613, -0.000827103853225708, -0.0008018016815185547, -0.0007764995098114014, -0.000751197338104248, -0.0007258951663970947, -0.0007005929946899414, -0.0006752908229827881, -0.0006499886512756348, -0.0006246864795684814, -0.0005993843078613281, -0.0005740821361541748, -0.0005487799644470215, -0.0005234777927398682, -0.0004981756210327148, -0.0004728734493255615, -0.0004475712776184082, -0.0004222691059112549, -0.00039696693420410156, -0.00037166476249694824, -0.0003463625907897949, -0.0003210604190826416, -0.0002957582473754883, -0.00027045607566833496, -0.00024515390396118164, -0.00021985173225402832, -0.000194549560546875, -0.00016924738883972168, -0.00014394521713256836, -0.00011864304542541504, -9.334087371826172e-05, -6.80387020111084e-05, -4.273653030395508e-05, -1.7434358596801758e-05, 7.867813110351562e-06, 3.316998481750488e-05, 5.84721565246582e-05, 8.377432823181152e-05, 0.00010907649993896484, 0.00013437867164611816, 0.00015968084335327148, 0.0001849830150604248, 0.00021028518676757812, 0.00023558735847473145, 0.00026088953018188477, 0.0002861917018890381, 0.0003114938735961914, 0.0003367960453033447, 0.00036209821701049805, 0.00038740038871765137, 0.0004127025604248047, 0.000438004732131958, 0.00046330690383911133, 0.0004886090755462646, 0.000513911247253418, 0.0005392134189605713, 0.0005645155906677246, 0.0005898177623748779, 0.0006151199340820312]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 9.0, 15.0, 19.0, 32.0, 40.0, 56.0, 85.0, 130.0, 242.0, 584.0, 9026.0, 1036101.0, 1316.0, 369.0, 179.0, 109.0, 74.0, 48.0, 35.0, 21.0, 15.0, 9.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01166534423828125, -0.01118457317352295, -0.010703802108764648, -0.010223031044006348, -0.009742259979248047, -0.009261488914489746, -0.008780717849731445, -0.008299946784973145, -0.007819175720214844, -0.007338404655456543, -0.006857633590698242, -0.006376862525939941, -0.005896091461181641, -0.00541532039642334, -0.004934549331665039, -0.004453778266906738, -0.0039730072021484375, -0.0034922361373901367, -0.003011465072631836, -0.002530694007873535, -0.0020499229431152344, -0.0015691518783569336, -0.0010883808135986328, -0.000607609748840332, -0.00012683868408203125, 0.00035393238067626953, 0.0008347034454345703, 0.001315474510192871, 0.0017962455749511719, 0.0022770166397094727, 0.0027577877044677734, 0.0032385587692260742, 0.003719329833984375, 0.004200100898742676, 0.0046808719635009766, 0.005161643028259277, 0.005642414093017578, 0.006123185157775879, 0.00660395622253418, 0.0070847272872924805, 0.007565498352050781, 0.008046269416809082, 0.008527040481567383, 0.009007811546325684, 0.009488582611083984, 0.009969353675842285, 0.010450124740600586, 0.010930895805358887, 0.011411666870117188, 0.011892437934875488, 0.012373208999633789, 0.01285398006439209, 0.01333475112915039, 0.013815522193908691, 0.014296293258666992, 0.014777064323425293, 0.015257835388183594, 0.015738606452941895, 0.016219377517700195, 0.016700148582458496, 0.017180919647216797, 0.017661690711975098, 0.0181424617767334, 0.0186232328414917, 0.01910400390625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 33.0, 163.0, 449.0, 296.0, 67.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044992691255174577, -0.00042295450111851096, -0.0003959821187891066, -0.0003690097073558718, -0.000342037295922637, -0.0003150648844894022, -0.00028809247305616736, -0.000261120090726763, -0.0002341476792935282, -0.0002071752678602934, -0.0001802028709789738, -0.00015323047409765422, -0.0001262580626644194, -9.92856512311846e-05, -7.231325434986502e-05, -4.534085746854544e-05, -1.8368446035310626e-05, 8.60395812196657e-06, 3.557636227924377e-05, 6.254876643652096e-05, 8.952117059379816e-05, 0.00011649358202703297, 0.00014346597890835255, 0.00017043837578967214, 0.00019741078722290695, 0.00022438319865614176, 0.0002513555809855461, 0.0002783279924187809, 0.00030530040385201573, 0.00033227281528525054, 0.00035924522671848536, 0.0003862176090478897, 0.00041318999137729406, 0.0004401624028105289, 0.0004671348142437637, 0.000494107196573168, 0.0005210796371102333, 0.0005480520194396377, 0.000575024401769042, 0.0006019967840984464, 0.0006289692246355116, 0.000655941606964916, 0.0006829140475019813, 0.0007098864298313856, 0.00073685881216079, 0.0007638312526978552, 0.0007908036350272596, 0.0008177760755643249, 0.0008447484578937292, 0.0008717208402231336, 0.0008986932807601988, 0.0009256656630896032, 0.0009526381036266685, 0.0009796104859560728, 0.0010065828682854772, 0.0010335552506148815, 0.0010605277493596077, 0.001087500131689012, 0.0011144725140184164, 0.0011414450127631426, 0.001168417395092547, 0.0011953897774219513, 0.0012223621597513556, 0.00124933454208076, 0.0012763069244101644]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 11.0, 5.0, 6.0, 11.0, 23.0, 16.0, 14.0, 12.0, 28.0, 19.0, 21.0, 33.0, 32.0, 34.0, 39.0, 36.0, 33.0, 40.0, 47.0, 53.0, 35.0, 29.0, 28.0, 38.0, 33.0, 39.0, 36.0, 39.0, 32.0, 20.0, 18.0, 22.0, 17.0, 20.0, 11.0, 9.0, 7.0, 8.0, 9.0, 9.0, 7.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00025707483291625977, -0.00024903565645217896, -0.00024099647998809814, -0.00023295730352401733, -0.00022491812705993652, -0.0002168789505958557, -0.0002088397741317749, -0.0002008005976676941, -0.00019276142120361328, -0.00018472224473953247, -0.00017668306827545166, -0.00016864389181137085, -0.00016060471534729004, -0.00015256553888320923, -0.00014452636241912842, -0.0001364871859550476, -0.0001284480094909668, -0.00012040883302688599, -0.00011236965656280518, -0.00010433048009872437, -9.629130363464355e-05, -8.825212717056274e-05, -8.021295070648193e-05, -7.217377424240112e-05, -6.413459777832031e-05, -5.60954213142395e-05, -4.805624485015869e-05, -4.001706838607788e-05, -3.197789192199707e-05, -2.393871545791626e-05, -1.589953899383545e-05, -7.860362529754639e-06, 1.7881393432617188e-07, 8.217990398406982e-06, 1.6257166862487793e-05, 2.4296343326568604e-05, 3.2335519790649414e-05, 4.0374696254730225e-05, 4.8413872718811035e-05, 5.6453049182891846e-05, 6.449222564697266e-05, 7.253140211105347e-05, 8.057057857513428e-05, 8.860975503921509e-05, 9.66489315032959e-05, 0.00010468810796737671, 0.00011272728443145752, 0.00012076646089553833, 0.00012880563735961914, 0.00013684481382369995, 0.00014488399028778076, 0.00015292316675186157, 0.00016096234321594238, 0.0001690015196800232, 0.000177040696144104, 0.00018507987260818481, 0.00019311904907226562, 0.00020115822553634644, 0.00020919740200042725, 0.00021723657846450806, 0.00022527575492858887, 0.00023331493139266968, 0.0002413541078567505, 0.0002493932843208313, 0.0002574324607849121]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 8.0, 4.0, 13.0, 9.0, 7.0, 10.0, 13.0, 14.0, 8.0, 23.0, 22.0, 22.0, 21.0, 34.0, 27.0, 27.0, 47.0, 38.0, 43.0, 47.0, 44.0, 48.0, 38.0, 47.0, 37.0, 30.0, 35.0, 41.0, 19.0, 16.0, 19.0, 17.0, 27.0, 21.0, 20.0, 21.0, 13.0, 17.0, 11.0, 10.0, 7.0, 2.0, 5.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.7421875, -9.4517822265625, -9.161376953125, -8.8709716796875, -8.58056640625, -8.2901611328125, -7.999755859375, -7.7093505859375, -7.4189453125, -7.1285400390625, -6.838134765625, -6.5477294921875, -6.25732421875, -5.9669189453125, -5.676513671875, -5.3861083984375, -5.095703125, -4.8052978515625, -4.514892578125, -4.2244873046875, -3.93408203125, -3.6436767578125, -3.353271484375, -3.0628662109375, -2.7724609375, -2.4820556640625, -2.191650390625, -1.9012451171875, -1.61083984375, -1.3204345703125, -1.030029296875, -0.7396240234375, -0.44921875, -0.1588134765625, 0.131591796875, 0.4219970703125, 0.71240234375, 1.0028076171875, 1.293212890625, 1.5836181640625, 1.8740234375, 2.1644287109375, 2.454833984375, 2.7452392578125, 3.03564453125, 3.3260498046875, 3.616455078125, 3.9068603515625, 4.197265625, 4.4876708984375, 4.778076171875, 5.0684814453125, 5.35888671875, 5.6492919921875, 5.939697265625, 6.2301025390625, 6.5205078125, 6.8109130859375, 7.101318359375, 7.3917236328125, 7.68212890625, 7.9725341796875, 8.262939453125, 8.5533447265625, 8.84375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 6.0, 6.0, 13.0, 14.0, 15.0, 12.0, 23.0, 32.0, 42.0, 39.0, 68.0, 90.0, 99.0, 135.0, 204.0, 303.0, 485.0, 1050.0, 2598.0, 7571.0, 23710.0, 89822.0, 376541.0, 406898.0, 99376.0, 25910.0, 7937.0, 2688.0, 1116.0, 540.0, 335.0, 230.0, 138.0, 96.0, 91.0, 65.0, 55.0, 40.0, 21.0, 29.0, 23.0, 13.0, 18.0, 7.0, 10.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0], "bins": [-15.21875, -14.758056640625, -14.29736328125, -13.836669921875, -13.3759765625, -12.915283203125, -12.45458984375, -11.993896484375, -11.533203125, -11.072509765625, -10.61181640625, -10.151123046875, -9.6904296875, -9.229736328125, -8.76904296875, -8.308349609375, -7.84765625, -7.386962890625, -6.92626953125, -6.465576171875, -6.0048828125, -5.544189453125, -5.08349609375, -4.622802734375, -4.162109375, -3.701416015625, -3.24072265625, -2.780029296875, -2.3193359375, -1.858642578125, -1.39794921875, -0.937255859375, -0.4765625, -0.015869140625, 0.44482421875, 0.905517578125, 1.3662109375, 1.826904296875, 2.28759765625, 2.748291015625, 3.208984375, 3.669677734375, 4.13037109375, 4.591064453125, 5.0517578125, 5.512451171875, 5.97314453125, 6.433837890625, 6.89453125, 7.355224609375, 7.81591796875, 8.276611328125, 8.7373046875, 9.197998046875, 9.65869140625, 10.119384765625, 10.580078125, 11.040771484375, 11.50146484375, 11.962158203125, 12.4228515625, 12.883544921875, 13.34423828125, 13.804931640625, 14.265625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 4.0, 8.0, 10.0, 13.0, 13.0, 15.0, 17.0, 33.0, 21.0, 17.0, 25.0, 28.0, 33.0, 41.0, 36.0, 44.0, 66.0, 77.0, 175.0, 1348.0, 331.0, 137.0, 85.0, 49.0, 46.0, 42.0, 31.0, 34.0, 34.0, 29.0, 26.0, 23.0, 26.0, 19.0, 14.0, 13.0, 14.0, 7.0, 6.0, 9.0, 4.0, 7.0, 7.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-28.40625, -27.51806640625, -26.6298828125, -25.74169921875, -24.853515625, -23.96533203125, -23.0771484375, -22.18896484375, -21.30078125, -20.41259765625, -19.5244140625, -18.63623046875, -17.748046875, -16.85986328125, -15.9716796875, -15.08349609375, -14.1953125, -13.30712890625, -12.4189453125, -11.53076171875, -10.642578125, -9.75439453125, -8.8662109375, -7.97802734375, -7.08984375, -6.20166015625, -5.3134765625, -4.42529296875, -3.537109375, -2.64892578125, -1.7607421875, -0.87255859375, 0.015625, 0.90380859375, 1.7919921875, 2.68017578125, 3.568359375, 4.45654296875, 5.3447265625, 6.23291015625, 7.12109375, 8.00927734375, 8.8974609375, 9.78564453125, 10.673828125, 11.56201171875, 12.4501953125, 13.33837890625, 14.2265625, 15.11474609375, 16.0029296875, 16.89111328125, 17.779296875, 18.66748046875, 19.5556640625, 20.44384765625, 21.33203125, 22.22021484375, 23.1083984375, 23.99658203125, 24.884765625, 25.77294921875, 26.6611328125, 27.54931640625, 28.4375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 7.0, 6.0, 14.0, 14.0, 14.0, 26.0, 36.0, 46.0, 55.0, 79.0, 109.0, 151.0, 260.0, 462.0, 1296.0, 14504.0, 3081339.0, 44107.0, 1700.0, 586.0, 270.0, 187.0, 101.0, 83.0, 60.0, 46.0, 39.0, 19.0, 18.0, 12.0, 15.0, 9.0, 8.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.3125, -74.29296875, -71.2734375, -68.25390625, -65.234375, -62.21484375, -59.1953125, -56.17578125, -53.15625, -50.13671875, -47.1171875, -44.09765625, -41.078125, -38.05859375, -35.0390625, -32.01953125, -29.0, -25.98046875, -22.9609375, -19.94140625, -16.921875, -13.90234375, -10.8828125, -7.86328125, -4.84375, -1.82421875, 1.1953125, 4.21484375, 7.234375, 10.25390625, 13.2734375, 16.29296875, 19.3125, 22.33203125, 25.3515625, 28.37109375, 31.390625, 34.41015625, 37.4296875, 40.44921875, 43.46875, 46.48828125, 49.5078125, 52.52734375, 55.546875, 58.56640625, 61.5859375, 64.60546875, 67.625, 70.64453125, 73.6640625, 76.68359375, 79.703125, 82.72265625, 85.7421875, 88.76171875, 91.78125, 94.80078125, 97.8203125, 100.83984375, 103.859375, 106.87890625, 109.8984375, 112.91796875, 115.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 217.0, 754.0, 43.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-515.4291381835938, -504.5255432128906, -493.6219787597656, -482.7183837890625, -471.8148193359375, -460.9112243652344, -450.00762939453125, -439.10406494140625, -428.20050048828125, -417.2969055175781, -406.3933410644531, -395.48974609375, -384.586181640625, -373.6825866699219, -362.77899169921875, -351.87542724609375, -340.9718322753906, -330.0682373046875, -319.1646728515625, -308.2610778808594, -297.3575134277344, -286.45391845703125, -275.55035400390625, -264.6467590332031, -253.74317932128906, -242.839599609375, -231.93601989746094, -221.03244018554688, -210.12884521484375, -199.22528076171875, -188.32168579101562, -177.41810607910156, -166.51454162597656, -155.6109619140625, -144.70738220214844, -133.80380249023438, -122.90021514892578, -111.99663543701172, -101.09304809570312, -90.18946838378906, -79.285888671875, -68.38230895996094, -57.47872543334961, -46.57514190673828, -35.67156219482422, -24.767982482910156, -13.864395141601562, -2.9608154296875, 7.9427642822265625, 18.846345901489258, 29.749927520751953, 40.65351104736328, 51.557090759277344, 62.460670471191406, 73.3642578125, 84.26783752441406, 95.17141723632812, 106.07499694824219, 116.97857666015625, 127.88216400146484, 138.78573608398438, 149.6893310546875, 160.59291076660156, 171.49649047851562, 182.4000701904297]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 6.0, 6.0, 10.0, 11.0, 16.0, 18.0, 21.0, 22.0, 18.0, 17.0, 20.0, 33.0, 30.0, 28.0, 34.0, 38.0, 44.0, 29.0, 51.0, 48.0, 36.0, 36.0, 48.0, 35.0, 33.0, 44.0, 32.0, 21.0, 32.0, 21.0, 15.0, 26.0, 25.0, 18.0, 12.0, 8.0, 12.0, 9.0, 5.0, 1.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.20426177978516, -73.78888702392578, -71.3735122680664, -68.95813751220703, -66.54277038574219, -64.12739562988281, -61.71202087402344, -59.29664611816406, -56.88127136230469, -54.46589660644531, -52.05052185058594, -49.63515090942383, -47.21977615356445, -44.80440139770508, -42.38903045654297, -39.973655700683594, -37.55828094482422, -35.142906188964844, -32.72753143310547, -30.31216049194336, -27.896785736083984, -25.48141098022461, -23.066038131713867, -20.650665283203125, -18.23529052734375, -15.819916725158691, -13.404542922973633, -10.989169120788574, -8.573795318603516, -6.158421516418457, -3.7430477142333984, -1.3276748657226562, 1.0876998901367188, 3.5030736923217773, 5.918447494506836, 8.333821296691895, 10.749195098876953, 13.164568901062012, 15.57994270324707, 17.995315551757812, 20.410690307617188, 22.826065063476562, 25.241437911987305, 27.656810760498047, 30.072185516357422, 32.4875602722168, 34.902931213378906, 37.31830596923828, 39.733680725097656, 42.14905548095703, 44.564430236816406, 46.979801177978516, 49.39517593383789, 51.810550689697266, 54.225921630859375, 56.64129638671875, 59.056671142578125, 61.4720458984375, 63.887420654296875, 66.30279541015625, 68.71817016601562, 71.13353729248047, 73.54891204833984, 75.96428680419922, 78.3796615600586]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 6.0, 3.0, 6.0, 5.0, 7.0, 8.0, 11.0, 5.0, 11.0, 13.0, 15.0, 19.0, 15.0, 12.0, 25.0, 35.0, 31.0, 31.0, 37.0, 23.0, 38.0, 36.0, 30.0, 31.0, 39.0, 39.0, 46.0, 42.0, 34.0, 36.0, 36.0, 38.0, 22.0, 29.0, 29.0, 15.0, 19.0, 26.0, 17.0, 11.0, 16.0, 12.0, 14.0, 9.0, 9.0, 3.0, 2.0, 2.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.659912109375, -8.35107421875, -8.042236328125, -7.7333984375, -7.424560546875, -7.11572265625, -6.806884765625, -6.498046875, -6.189208984375, -5.88037109375, -5.571533203125, -5.2626953125, -4.953857421875, -4.64501953125, -4.336181640625, -4.02734375, -3.718505859375, -3.40966796875, -3.100830078125, -2.7919921875, -2.483154296875, -2.17431640625, -1.865478515625, -1.556640625, -1.247802734375, -0.93896484375, -0.630126953125, -0.3212890625, -0.012451171875, 0.29638671875, 0.605224609375, 0.9140625, 1.222900390625, 1.53173828125, 1.840576171875, 2.1494140625, 2.458251953125, 2.76708984375, 3.075927734375, 3.384765625, 3.693603515625, 4.00244140625, 4.311279296875, 4.6201171875, 4.928955078125, 5.23779296875, 5.546630859375, 5.85546875, 6.164306640625, 6.47314453125, 6.781982421875, 7.0908203125, 7.399658203125, 7.70849609375, 8.017333984375, 8.326171875, 8.635009765625, 8.94384765625, 9.252685546875, 9.5615234375, 9.870361328125, 10.17919921875, 10.488037109375, 10.796875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 8.0, 7.0, 10.0, 10.0, 11.0, 15.0, 27.0, 21.0, 25.0, 23.0, 35.0, 63.0, 78.0, 96.0, 137.0, 290.0, 692.0, 2555.0, 21105.0, 399661.0, 2688757.0, 1017703.0, 56080.0, 4806.0, 1005.0, 375.0, 196.0, 109.0, 72.0, 44.0, 39.0, 35.0, 29.0, 21.0, 21.0, 17.0, 12.0, 20.0, 10.0, 10.0, 7.0, 10.0, 5.0, 0.0, 10.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.234375, -22.451416015625, -21.66845703125, -20.885498046875, -20.1025390625, -19.319580078125, -18.53662109375, -17.753662109375, -16.970703125, -16.187744140625, -15.40478515625, -14.621826171875, -13.8388671875, -13.055908203125, -12.27294921875, -11.489990234375, -10.70703125, -9.924072265625, -9.14111328125, -8.358154296875, -7.5751953125, -6.792236328125, -6.00927734375, -5.226318359375, -4.443359375, -3.660400390625, -2.87744140625, -2.094482421875, -1.3115234375, -0.528564453125, 0.25439453125, 1.037353515625, 1.8203125, 2.603271484375, 3.38623046875, 4.169189453125, 4.9521484375, 5.735107421875, 6.51806640625, 7.301025390625, 8.083984375, 8.866943359375, 9.64990234375, 10.432861328125, 11.2158203125, 11.998779296875, 12.78173828125, 13.564697265625, 14.34765625, 15.130615234375, 15.91357421875, 16.696533203125, 17.4794921875, 18.262451171875, 19.04541015625, 19.828369140625, 20.611328125, 21.394287109375, 22.17724609375, 22.960205078125, 23.7431640625, 24.526123046875, 25.30908203125, 26.092041015625, 26.875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 8.0, 10.0, 8.0, 13.0, 18.0, 23.0, 29.0, 44.0, 47.0, 68.0, 110.0, 156.0, 210.0, 274.0, 403.0, 448.0, 477.0, 441.0, 362.0, 274.0, 180.0, 141.0, 114.0, 67.0, 33.0, 38.0, 19.0, 18.0, 12.0, 9.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.578125, -19.008056640625, -18.43798828125, -17.867919921875, -17.2978515625, -16.727783203125, -16.15771484375, -15.587646484375, -15.017578125, -14.447509765625, -13.87744140625, -13.307373046875, -12.7373046875, -12.167236328125, -11.59716796875, -11.027099609375, -10.45703125, -9.886962890625, -9.31689453125, -8.746826171875, -8.1767578125, -7.606689453125, -7.03662109375, -6.466552734375, -5.896484375, -5.326416015625, -4.75634765625, -4.186279296875, -3.6162109375, -3.046142578125, -2.47607421875, -1.906005859375, -1.3359375, -0.765869140625, -0.19580078125, 0.374267578125, 0.9443359375, 1.514404296875, 2.08447265625, 2.654541015625, 3.224609375, 3.794677734375, 4.36474609375, 4.934814453125, 5.5048828125, 6.074951171875, 6.64501953125, 7.215087890625, 7.78515625, 8.355224609375, 8.92529296875, 9.495361328125, 10.0654296875, 10.635498046875, 11.20556640625, 11.775634765625, 12.345703125, 12.915771484375, 13.48583984375, 14.055908203125, 14.6259765625, 15.196044921875, 15.76611328125, 16.336181640625, 16.90625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 13.0, 8.0, 22.0, 35.0, 35.0, 60.0, 71.0, 86.0, 108.0, 161.0, 222.0, 368.0, 651.0, 1588.0, 6711.0, 77282.0, 2559530.0, 1495373.0, 44327.0, 4651.0, 1229.0, 560.0, 335.0, 211.0, 168.0, 103.0, 96.0, 63.0, 48.0, 43.0, 37.0, 26.0, 9.0, 7.0, 12.0, 11.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.6875, -36.3837890625, -35.080078125, -33.7763671875, -32.47265625, -31.1689453125, -29.865234375, -28.5615234375, -27.2578125, -25.9541015625, -24.650390625, -23.3466796875, -22.04296875, -20.7392578125, -19.435546875, -18.1318359375, -16.828125, -15.5244140625, -14.220703125, -12.9169921875, -11.61328125, -10.3095703125, -9.005859375, -7.7021484375, -6.3984375, -5.0947265625, -3.791015625, -2.4873046875, -1.18359375, 0.1201171875, 1.423828125, 2.7275390625, 4.03125, 5.3349609375, 6.638671875, 7.9423828125, 9.24609375, 10.5498046875, 11.853515625, 13.1572265625, 14.4609375, 15.7646484375, 17.068359375, 18.3720703125, 19.67578125, 20.9794921875, 22.283203125, 23.5869140625, 24.890625, 26.1943359375, 27.498046875, 28.8017578125, 30.10546875, 31.4091796875, 32.712890625, 34.0166015625, 35.3203125, 36.6240234375, 37.927734375, 39.2314453125, 40.53515625, 41.8388671875, 43.142578125, 44.4462890625, 45.75]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 11.0, 161.0, 591.0, 237.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.8463134765625, -177.69480895996094, -165.54330444335938, -153.39181518554688, -141.24029541015625, -129.08880615234375, -116.93730163574219, -104.78579711914062, -92.63429260253906, -80.4827880859375, -68.33128356933594, -56.179786682128906, -44.028282165527344, -31.87677764892578, -19.72528076171875, -7.5737762451171875, 4.577728271484375, 16.729230880737305, 28.880733489990234, 41.03223419189453, 53.183738708496094, 65.33524322509766, 77.48674011230469, 89.63824462890625, 101.78974914550781, 113.94125366210938, 126.09275817871094, 138.2442626953125, 150.395751953125, 162.54727172851562, 174.69876098632812, 186.8502655029297, 199.00177001953125, 211.1532745361328, 223.30477905273438, 235.45626831054688, 247.6077880859375, 259.75927734375, 271.9107666015625, 284.0622863769531, 296.21380615234375, 308.36529541015625, 320.5168151855469, 332.6683044433594, 344.81982421875, 356.9713134765625, 369.122802734375, 381.2743225097656, 393.4258117675781, 405.5773010253906, 417.72882080078125, 429.88031005859375, 442.0318298339844, 454.1833190917969, 466.3348388671875, 478.486328125, 490.6378173828125, 502.789306640625, 514.9407958984375, 527.0923461914062, 539.2438354492188, 551.3953247070312, 563.5468139648438, 575.6983642578125, 587.849853515625]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 8.0, 9.0, 18.0, 8.0, 18.0, 10.0, 25.0, 28.0, 22.0, 17.0, 33.0, 39.0, 26.0, 35.0, 45.0, 35.0, 43.0, 41.0, 52.0, 45.0, 35.0, 45.0, 33.0, 31.0, 33.0, 23.0, 27.0, 28.0, 24.0, 25.0, 19.0, 24.0, 19.0, 6.0, 10.0, 9.0, 7.0, 9.0, 2.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-66.0582275390625, -64.1529541015625, -62.24768829345703, -60.3424186706543, -58.43714904785156, -56.53187942504883, -54.626609802246094, -52.721336364746094, -50.816070556640625, -48.91080093383789, -47.005531311035156, -45.10026168823242, -43.19499206542969, -41.28972244262695, -39.38445281982422, -37.47917938232422, -35.573909759521484, -33.66864013671875, -31.763370513916016, -29.85810089111328, -27.952831268310547, -26.047561645507812, -24.142290115356445, -22.23702049255371, -20.331750869750977, -18.426481246948242, -16.521211624145508, -14.615941047668457, -12.710671424865723, -10.805401802062988, -8.900131225585938, -6.994861602783203, -5.089595794677734, -3.184325933456421, -1.2790560722351074, 0.6262140274047852, 2.5314836502075195, 4.436753273010254, 6.342023849487305, 8.247293472290039, 10.152563095092773, 12.057832717895508, 13.963102340698242, 15.868372917175293, 17.773643493652344, 19.678913116455078, 21.584182739257812, 23.489452362060547, 25.39472198486328, 27.299991607666016, 29.20526123046875, 31.110530853271484, 33.01580047607422, 34.92107009887695, 36.82633972167969, 38.73161315917969, 40.636878967285156, 42.54214859008789, 44.447418212890625, 46.35268783569336, 48.257957458496094, 50.16322708129883, 52.06849670410156, 53.97377014160156, 55.8790397644043]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 7.0, 1.0, 5.0, 11.0, 6.0, 7.0, 11.0, 11.0, 16.0, 20.0, 17.0, 17.0, 19.0, 24.0, 25.0, 22.0, 33.0, 30.0, 31.0, 35.0, 41.0, 39.0, 34.0, 32.0, 38.0, 37.0, 29.0, 53.0, 25.0, 25.0, 31.0, 39.0, 28.0, 18.0, 21.0, 20.0, 20.0, 18.0, 13.0, 13.0, 13.0, 9.0, 11.0, 6.0, 4.0, 4.0, 10.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-8.8125, -8.5201416015625, -8.227783203125, -7.9354248046875, -7.64306640625, -7.3507080078125, -7.058349609375, -6.7659912109375, -6.4736328125, -6.1812744140625, -5.888916015625, -5.5965576171875, -5.30419921875, -5.0118408203125, -4.719482421875, -4.4271240234375, -4.134765625, -3.8424072265625, -3.550048828125, -3.2576904296875, -2.96533203125, -2.6729736328125, -2.380615234375, -2.0882568359375, -1.7958984375, -1.5035400390625, -1.211181640625, -0.9188232421875, -0.62646484375, -0.3341064453125, -0.041748046875, 0.2506103515625, 0.54296875, 0.8353271484375, 1.127685546875, 1.4200439453125, 1.71240234375, 2.0047607421875, 2.297119140625, 2.5894775390625, 2.8818359375, 3.1741943359375, 3.466552734375, 3.7589111328125, 4.05126953125, 4.3436279296875, 4.635986328125, 4.9283447265625, 5.220703125, 5.5130615234375, 5.805419921875, 6.0977783203125, 6.39013671875, 6.6824951171875, 6.974853515625, 7.2672119140625, 7.5595703125, 7.8519287109375, 8.144287109375, 8.4366455078125, 8.72900390625, 9.0213623046875, 9.313720703125, 9.6060791015625, 9.8984375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 0.0, 12.0, 10.0, 20.0, 47.0, 51.0, 61.0, 96.0, 113.0, 197.0, 283.0, 362.0, 527.0, 696.0, 919.0, 1392.0, 1771.0, 2357.0, 3209.0, 4532.0, 6028.0, 8022.0, 11299.0, 15827.0, 22373.0, 32714.0, 49536.0, 79752.0, 145300.0, 291712.0, 136195.0, 75889.0, 47683.0, 31735.0, 21818.0, 15291.0, 10764.0, 8038.0, 5821.0, 4109.0, 3219.0, 2353.0, 1735.0, 1261.0, 972.0, 697.0, 504.0, 342.0, 261.0, 216.0, 132.0, 113.0, 69.0, 39.0, 25.0, 17.0, 22.0, 13.0, 6.0, 8.0], "bins": [-2.3359375, -2.26611328125, -2.1962890625, -2.12646484375, -2.056640625, -1.98681640625, -1.9169921875, -1.84716796875, -1.77734375, -1.70751953125, -1.6376953125, -1.56787109375, -1.498046875, -1.42822265625, -1.3583984375, -1.28857421875, -1.21875, -1.14892578125, -1.0791015625, -1.00927734375, -0.939453125, -0.86962890625, -0.7998046875, -0.72998046875, -0.66015625, -0.59033203125, -0.5205078125, -0.45068359375, -0.380859375, -0.31103515625, -0.2412109375, -0.17138671875, -0.1015625, -0.03173828125, 0.0380859375, 0.10791015625, 0.177734375, 0.24755859375, 0.3173828125, 0.38720703125, 0.45703125, 0.52685546875, 0.5966796875, 0.66650390625, 0.736328125, 0.80615234375, 0.8759765625, 0.94580078125, 1.015625, 1.08544921875, 1.1552734375, 1.22509765625, 1.294921875, 1.36474609375, 1.4345703125, 1.50439453125, 1.57421875, 1.64404296875, 1.7138671875, 1.78369140625, 1.853515625, 1.92333984375, 1.9931640625, 2.06298828125, 2.1328125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 5.0, 12.0, 12.0, 8.0, 12.0, 9.0, 20.0, 10.0, 21.0, 22.0, 24.0, 25.0, 31.0, 26.0, 46.0, 40.0, 45.0, 39.0, 54.0, 1053.0, 31.0, 36.0, 48.0, 39.0, 31.0, 42.0, 34.0, 32.0, 26.0, 25.0, 20.0, 22.0, 18.0, 13.0, 19.0, 11.0, 9.0, 11.0, 7.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-7.12890625, -6.91802978515625, -6.7071533203125, -6.49627685546875, -6.285400390625, -6.07452392578125, -5.8636474609375, -5.65277099609375, -5.44189453125, -5.23101806640625, -5.0201416015625, -4.80926513671875, -4.598388671875, -4.38751220703125, -4.1766357421875, -3.96575927734375, -3.7548828125, -3.54400634765625, -3.3331298828125, -3.12225341796875, -2.911376953125, -2.70050048828125, -2.4896240234375, -2.27874755859375, -2.06787109375, -1.85699462890625, -1.6461181640625, -1.43524169921875, -1.224365234375, -1.01348876953125, -0.8026123046875, -0.59173583984375, -0.380859375, -0.16998291015625, 0.0408935546875, 0.25177001953125, 0.462646484375, 0.67352294921875, 0.8843994140625, 1.09527587890625, 1.30615234375, 1.51702880859375, 1.7279052734375, 1.93878173828125, 2.149658203125, 2.36053466796875, 2.5714111328125, 2.78228759765625, 2.9931640625, 3.20404052734375, 3.4149169921875, 3.62579345703125, 3.836669921875, 4.04754638671875, 4.2584228515625, 4.46929931640625, 4.68017578125, 4.89105224609375, 5.1019287109375, 5.31280517578125, 5.523681640625, 5.73455810546875, 5.9454345703125, 6.15631103515625, 6.3671875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 12.0, 6.0, 9.0, 13.0, 30.0, 32.0, 54.0, 77.0, 114.0, 212.0, 208.0, 348.0, 503.0, 714.0, 1029.0, 1507.0, 2157.0, 3129.0, 4466.0, 6195.0, 9138.0, 13569.0, 20225.0, 30660.0, 47669.0, 76137.0, 134545.0, 1348040.0, 156008.0, 85106.0, 52370.0, 33727.0, 22047.0, 14712.0, 9972.0, 6812.0, 4647.0, 3339.0, 2304.0, 1669.0, 1127.0, 760.0, 507.0, 399.0, 258.0, 186.0, 118.0, 93.0, 52.0, 49.0, 28.0, 23.0, 12.0, 5.0, 9.0, 3.0, 1.0, 6.0], "bins": [-2.677734375, -2.598052978515625, -2.51837158203125, -2.438690185546875, -2.3590087890625, -2.279327392578125, -2.19964599609375, -2.119964599609375, -2.040283203125, -1.960601806640625, -1.88092041015625, -1.801239013671875, -1.7215576171875, -1.641876220703125, -1.56219482421875, -1.482513427734375, -1.40283203125, -1.323150634765625, -1.24346923828125, -1.163787841796875, -1.0841064453125, -1.004425048828125, -0.92474365234375, -0.845062255859375, -0.765380859375, -0.685699462890625, -0.60601806640625, -0.526336669921875, -0.4466552734375, -0.366973876953125, -0.28729248046875, -0.207611083984375, -0.1279296875, -0.048248291015625, 0.03143310546875, 0.111114501953125, 0.1907958984375, 0.270477294921875, 0.35015869140625, 0.429840087890625, 0.509521484375, 0.589202880859375, 0.66888427734375, 0.748565673828125, 0.8282470703125, 0.907928466796875, 0.98760986328125, 1.067291259765625, 1.14697265625, 1.226654052734375, 1.30633544921875, 1.386016845703125, 1.4656982421875, 1.545379638671875, 1.62506103515625, 1.704742431640625, 1.784423828125, 1.864105224609375, 1.94378662109375, 2.023468017578125, 2.1031494140625, 2.182830810546875, 2.26251220703125, 2.342193603515625, 2.421875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 7.0, 13.0, 15.0, 27.0, 26.0, 23.0, 38.0, 45.0, 57.0, 71.0, 85.0, 78.0, 103.0, 69.0, 63.0, 49.0, 47.0, 37.0, 31.0, 35.0, 19.0, 10.0, 18.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005221366882324219, -0.0005052313208580017, -0.0004883259534835815, -0.0004714205861091614, -0.0004545152187347412, -0.00043760985136032104, -0.0004207044839859009, -0.0004037991166114807, -0.00038689374923706055, -0.0003699883818626404, -0.0003530830144882202, -0.00033617764711380005, -0.0003192722797393799, -0.0003023669123649597, -0.00028546154499053955, -0.0002685561776161194, -0.0002516508102416992, -0.00023474544286727905, -0.0002178400754928589, -0.00020093470811843872, -0.00018402934074401855, -0.0001671239733695984, -0.00015021860599517822, -0.00013331323862075806, -0.00011640787124633789, -9.950250387191772e-05, -8.259713649749756e-05, -6.569176912307739e-05, -4.8786401748657227e-05, -3.188103437423706e-05, -1.4975666999816895e-05, 1.9297003746032715e-06, 1.8835067749023438e-05, 3.5740435123443604e-05, 5.264580249786377e-05, 6.955116987228394e-05, 8.64565372467041e-05, 0.00010336190462112427, 0.00012026727199554443, 0.0001371726393699646, 0.00015407800674438477, 0.00017098337411880493, 0.0001878887414932251, 0.00020479410886764526, 0.00022169947624206543, 0.0002386048436164856, 0.00025551021099090576, 0.00027241557836532593, 0.0002893209457397461, 0.00030622631311416626, 0.0003231316804885864, 0.0003400370478630066, 0.00035694241523742676, 0.0003738477826118469, 0.0003907531499862671, 0.00040765851736068726, 0.0004245638847351074, 0.0004414692521095276, 0.00045837461948394775, 0.0004752799868583679, 0.0004921853542327881, 0.0005090907216072083, 0.0005259960889816284, 0.0005429014563560486, 0.0005598068237304688]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 9.0, 6.0, 6.0, 10.0, 19.0, 27.0, 36.0, 54.0, 65.0, 102.0, 140.0, 208.0, 429.0, 1018.0, 309499.0, 734604.0, 1123.0, 499.0, 219.0, 140.0, 90.0, 68.0, 45.0, 36.0, 35.0, 17.0, 12.0, 10.0, 12.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01123046875, -0.010890603065490723, -0.010550737380981445, -0.010210871696472168, -0.00987100601196289, -0.009531140327453613, -0.009191274642944336, -0.008851408958435059, -0.008511543273925781, -0.008171677589416504, -0.007831811904907227, -0.007491946220397949, -0.007152080535888672, -0.0068122148513793945, -0.006472349166870117, -0.00613248348236084, -0.0057926177978515625, -0.005452752113342285, -0.005112886428833008, -0.0047730207443237305, -0.004433155059814453, -0.004093289375305176, -0.0037534236907958984, -0.003413558006286621, -0.0030736923217773438, -0.0027338266372680664, -0.002393960952758789, -0.0020540952682495117, -0.0017142295837402344, -0.001374363899230957, -0.0010344982147216797, -0.0006946325302124023, -0.000354766845703125, -1.4901161193847656e-05, 0.0003249645233154297, 0.000664830207824707, 0.0010046958923339844, 0.0013445615768432617, 0.001684427261352539, 0.0020242929458618164, 0.0023641586303710938, 0.002704024314880371, 0.0030438899993896484, 0.0033837556838989258, 0.003723621368408203, 0.0040634870529174805, 0.004403352737426758, 0.004743218421936035, 0.0050830841064453125, 0.00542294979095459, 0.005762815475463867, 0.0061026811599731445, 0.006442546844482422, 0.006782412528991699, 0.0071222782135009766, 0.007462143898010254, 0.007802009582519531, 0.008141875267028809, 0.008481740951538086, 0.008821606636047363, 0.00916147232055664, 0.009501338005065918, 0.009841203689575195, 0.010181069374084473, 0.01052093505859375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 57.0, 625.0, 318.0, 13.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002935346565209329, -0.00024281709920614958, -0.00019209952733945101, -0.00014138195547275245, -9.066439815796912e-05, -3.994684084318578e-05, 1.0770745575428009e-05, 6.148830289021134e-05, 0.00011220586020499468, 0.000162923417519778, 0.00021364098938647658, 0.00026435856125317514, 0.0003150761185679585, 0.0003657936758827418, 0.0004165112623013556, 0.00046722881961613894, 0.0005179463769309223, 0.0005686639342457056, 0.0006193814915604889, 0.0006700990488752723, 0.0007208166643977165, 0.0007715341635048389, 0.0008222517790272832, 0.0008729693363420665, 0.0009236868936568499, 0.0009744044509716332, 0.0010251220082864165, 0.0010758396238088608, 0.0011265571229159832, 0.0011772747384384274, 0.0012279923539608717, 0.0012787098530679941, 0.0013294273521751165, 0.0013801449676975608, 0.0014308624668046832, 0.0014815800823271275, 0.0015322975814342499, 0.0015830151969566941, 0.0016337328124791384, 0.0016844503115862608, 0.0017351678106933832, 0.0017858854262158275, 0.0018366029253229499, 0.0018873205408453941, 0.0019380380399525166, 0.001988755539059639, 0.002039473270997405, 0.0020901907701045275, 0.0021409085020422935, 0.002191626001149416, 0.002242343733087182, 0.0022930612321943045, 0.002343778731301427, 0.0023944962304085493, 0.0024452139623463154, 0.002495931461453438, 0.0025466489605605602, 0.0025973664596676826, 0.0026480841916054487, 0.002698801690712571, 0.0027495191898196936, 0.002800236688926816, 0.002850954420864582, 0.0029016719199717045, 0.002952389419078827]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 7.0, 5.0, 5.0, 15.0, 17.0, 12.0, 17.0, 12.0, 19.0, 17.0, 24.0, 27.0, 34.0, 35.0, 27.0, 35.0, 48.0, 55.0, 45.0, 40.0, 44.0, 52.0, 33.0, 39.0, 35.0, 31.0, 41.0, 33.0, 29.0, 37.0, 19.0, 22.0, 11.0, 13.0, 10.0, 11.0, 10.0, 4.0, 10.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019627809524536133, -0.00018920749425888062, -0.0001821368932723999, -0.0001750662922859192, -0.00016799569129943848, -0.00016092509031295776, -0.00015385448932647705, -0.00014678388833999634, -0.00013971328735351562, -0.0001326426863670349, -0.0001255720853805542, -0.00011850148439407349, -0.00011143088340759277, -0.00010436028242111206, -9.728968143463135e-05, -9.021908044815063e-05, -8.314847946166992e-05, -7.607787847518921e-05, -6.90072774887085e-05, -6.193667650222778e-05, -5.486607551574707e-05, -4.779547452926636e-05, -4.0724873542785645e-05, -3.365427255630493e-05, -2.658367156982422e-05, -1.9513070583343506e-05, -1.2442469596862793e-05, -5.37186861038208e-06, 1.6987323760986328e-06, 8.769333362579346e-06, 1.583993434906006e-05, 2.291053533554077e-05, 2.9981136322021484e-05, 3.70517373085022e-05, 4.412233829498291e-05, 5.119293928146362e-05, 5.8263540267944336e-05, 6.533414125442505e-05, 7.240474224090576e-05, 7.947534322738647e-05, 8.654594421386719e-05, 9.36165452003479e-05, 0.00010068714618682861, 0.00010775774717330933, 0.00011482834815979004, 0.00012189894914627075, 0.00012896955013275146, 0.00013604015111923218, 0.0001431107521057129, 0.0001501813530921936, 0.00015725195407867432, 0.00016432255506515503, 0.00017139315605163574, 0.00017846375703811646, 0.00018553435802459717, 0.00019260495901107788, 0.0001996755599975586, 0.0002067461609840393, 0.00021381676197052002, 0.00022088736295700073, 0.00022795796394348145, 0.00023502856492996216, 0.00024209916591644287, 0.0002491697669029236, 0.0002562403678894043]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 7.0, 1.0, 5.0, 11.0, 6.0, 7.0, 11.0, 11.0, 16.0, 20.0, 17.0, 17.0, 19.0, 24.0, 25.0, 22.0, 33.0, 30.0, 31.0, 35.0, 41.0, 40.0, 33.0, 32.0, 38.0, 37.0, 29.0, 53.0, 25.0, 25.0, 31.0, 39.0, 28.0, 18.0, 21.0, 20.0, 20.0, 18.0, 13.0, 13.0, 13.0, 9.0, 11.0, 6.0, 4.0, 4.0, 10.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-8.8125, -8.5201416015625, -8.227783203125, -7.9354248046875, -7.64306640625, -7.3507080078125, -7.058349609375, -6.7659912109375, -6.4736328125, -6.1812744140625, -5.888916015625, -5.5965576171875, -5.30419921875, -5.0118408203125, -4.719482421875, -4.4271240234375, -4.134765625, -3.8424072265625, -3.550048828125, -3.2576904296875, -2.96533203125, -2.6729736328125, -2.380615234375, -2.0882568359375, -1.7958984375, -1.5035400390625, -1.211181640625, -0.9188232421875, -0.62646484375, -0.3341064453125, -0.041748046875, 0.2506103515625, 0.54296875, 0.8353271484375, 1.127685546875, 1.4200439453125, 1.71240234375, 2.0047607421875, 2.297119140625, 2.5894775390625, 2.8818359375, 3.1741943359375, 3.466552734375, 3.7589111328125, 4.05126953125, 4.3436279296875, 4.635986328125, 4.9283447265625, 5.220703125, 5.5130615234375, 5.805419921875, 6.0977783203125, 6.39013671875, 6.6824951171875, 6.974853515625, 7.2672119140625, 7.5595703125, 7.8519287109375, 8.144287109375, 8.4366455078125, 8.72900390625, 9.0213623046875, 9.313720703125, 9.6060791015625, 9.8984375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 9.0, 17.0, 14.0, 26.0, 37.0, 33.0, 54.0, 65.0, 86.0, 98.0, 154.0, 175.0, 225.0, 274.0, 374.0, 534.0, 849.0, 1952.0, 6248.0, 27755.0, 177321.0, 711946.0, 94118.0, 17602.0, 4425.0, 1441.0, 700.0, 462.0, 376.0, 249.0, 187.0, 156.0, 139.0, 100.0, 79.0, 58.0, 43.0, 28.0, 21.0, 23.0, 16.0, 13.0, 15.0, 12.0, 13.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-22.65625, -21.909912109375, -21.16357421875, -20.417236328125, -19.6708984375, -18.924560546875, -18.17822265625, -17.431884765625, -16.685546875, -15.939208984375, -15.19287109375, -14.446533203125, -13.7001953125, -12.953857421875, -12.20751953125, -11.461181640625, -10.71484375, -9.968505859375, -9.22216796875, -8.475830078125, -7.7294921875, -6.983154296875, -6.23681640625, -5.490478515625, -4.744140625, -3.997802734375, -3.25146484375, -2.505126953125, -1.7587890625, -1.012451171875, -0.26611328125, 0.480224609375, 1.2265625, 1.972900390625, 2.71923828125, 3.465576171875, 4.2119140625, 4.958251953125, 5.70458984375, 6.450927734375, 7.197265625, 7.943603515625, 8.68994140625, 9.436279296875, 10.1826171875, 10.928955078125, 11.67529296875, 12.421630859375, 13.16796875, 13.914306640625, 14.66064453125, 15.406982421875, 16.1533203125, 16.899658203125, 17.64599609375, 18.392333984375, 19.138671875, 19.885009765625, 20.63134765625, 21.377685546875, 22.1240234375, 22.870361328125, 23.61669921875, 24.363037109375, 25.109375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 13.0, 19.0, 15.0, 26.0, 20.0, 23.0, 31.0, 29.0, 44.0, 38.0, 44.0, 59.0, 94.0, 211.0, 1536.0, 299.0, 115.0, 65.0, 51.0, 44.0, 41.0, 37.0, 30.0, 25.0, 29.0, 25.0, 9.0, 15.0, 10.0, 6.0, 8.0, 6.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.90625, -38.68359375, -37.4609375, -36.23828125, -35.015625, -33.79296875, -32.5703125, -31.34765625, -30.125, -28.90234375, -27.6796875, -26.45703125, -25.234375, -24.01171875, -22.7890625, -21.56640625, -20.34375, -19.12109375, -17.8984375, -16.67578125, -15.453125, -14.23046875, -13.0078125, -11.78515625, -10.5625, -9.33984375, -8.1171875, -6.89453125, -5.671875, -4.44921875, -3.2265625, -2.00390625, -0.78125, 0.44140625, 1.6640625, 2.88671875, 4.109375, 5.33203125, 6.5546875, 7.77734375, 9.0, 10.22265625, 11.4453125, 12.66796875, 13.890625, 15.11328125, 16.3359375, 17.55859375, 18.78125, 20.00390625, 21.2265625, 22.44921875, 23.671875, 24.89453125, 26.1171875, 27.33984375, 28.5625, 29.78515625, 31.0078125, 32.23046875, 33.453125, 34.67578125, 35.8984375, 37.12109375, 38.34375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 8.0, 8.0, 12.0, 13.0, 16.0, 16.0, 34.0, 29.0, 50.0, 42.0, 73.0, 109.0, 143.0, 244.0, 642.0, 1797.0, 23692.0, 3080446.0, 34757.0, 2010.0, 642.0, 282.0, 172.0, 107.0, 68.0, 50.0, 45.0, 39.0, 39.0, 28.0, 16.0, 17.0, 7.0, 11.0, 6.0, 5.0, 4.0, 2.0, 9.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.6875, -97.390625, -94.09375, -90.796875, -87.5, -84.203125, -80.90625, -77.609375, -74.3125, -71.015625, -67.71875, -64.421875, -61.125, -57.828125, -54.53125, -51.234375, -47.9375, -44.640625, -41.34375, -38.046875, -34.75, -31.453125, -28.15625, -24.859375, -21.5625, -18.265625, -14.96875, -11.671875, -8.375, -5.078125, -1.78125, 1.515625, 4.8125, 8.109375, 11.40625, 14.703125, 18.0, 21.296875, 24.59375, 27.890625, 31.1875, 34.484375, 37.78125, 41.078125, 44.375, 47.671875, 50.96875, 54.265625, 57.5625, 60.859375, 64.15625, 67.453125, 70.75, 74.046875, 77.34375, 80.640625, 83.9375, 87.234375, 90.53125, 93.828125, 97.125, 100.421875, 103.71875, 107.015625, 110.3125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [3.0, 11.0, 96.0, 549.0, 319.0, 38.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.00372886657715, -19.84703826904297, -12.690346717834473, -5.533655166625977, 1.6230354309082031, 8.779726028442383, 15.936418533325195, 23.093107223510742, 30.249799728393555, 37.406490325927734, 44.56318283081055, 51.719871520996094, 58.876564025878906, 66.03325653076172, 73.18994903564453, 80.34663391113281, 87.50332641601562, 94.66001892089844, 101.81671142578125, 108.97340393066406, 116.13008880615234, 123.28678131103516, 130.4434814453125, 137.60015869140625, 144.75685119628906, 151.91354370117188, 159.0702362060547, 166.2269287109375, 173.3836212158203, 180.54031372070312, 187.69699096679688, 194.8536834716797, 202.01039123535156, 209.16708374023438, 216.3237762451172, 223.48046875, 230.6371612548828, 237.79385375976562, 244.95053100585938, 252.1072235107422, 259.263916015625, 266.42059326171875, 273.5773010253906, 280.7339782714844, 287.89068603515625, 295.04736328125, 302.2040710449219, 309.3607482910156, 316.5174560546875, 323.67413330078125, 330.8308410644531, 337.9875183105469, 345.14422607421875, 352.3009033203125, 359.4576110839844, 366.6142883300781, 373.7709655761719, 380.9276428222656, 388.0843505859375, 395.24102783203125, 402.3977355957031, 409.5544128417969, 416.71112060546875, 423.8677978515625, 431.0245056152344]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 9.0, 4.0, 6.0, 9.0, 13.0, 10.0, 15.0, 17.0, 14.0, 15.0, 22.0, 20.0, 15.0, 35.0, 29.0, 34.0, 41.0, 35.0, 38.0, 31.0, 31.0, 34.0, 34.0, 37.0, 36.0, 35.0, 42.0, 45.0, 28.0, 37.0, 33.0, 24.0, 24.0, 26.0, 20.0, 26.0, 17.0, 7.0, 14.0, 7.0, 5.0, 7.0, 9.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-84.48446655273438, -81.71961975097656, -78.95477294921875, -76.18992614746094, -73.42507934570312, -70.66023254394531, -67.8953857421875, -65.13054656982422, -62.365699768066406, -59.600852966308594, -56.83600616455078, -54.07115936279297, -51.30631637573242, -48.54146957397461, -45.7766227722168, -43.01177978515625, -40.24692916870117, -37.48208236694336, -34.71723556518555, -31.952390670776367, -29.187545776367188, -26.422698974609375, -23.657852172851562, -20.893007278442383, -18.12816047668457, -15.363314628601074, -12.598468780517578, -9.833621978759766, -7.0687761306762695, -4.303930282592773, -1.539083480834961, 1.2257614135742188, 3.9906082153320312, 6.755454063415527, 9.520299911499023, 12.285146713256836, 15.049992561340332, 17.814838409423828, 20.57968521118164, 23.34453010559082, 26.109376907348633, 28.874223709106445, 31.639068603515625, 34.40391540527344, 37.16876220703125, 39.93360900878906, 42.698455810546875, 45.46329879760742, 48.228145599365234, 50.99299240112305, 53.75783920288086, 56.522682189941406, 59.28752899169922, 62.05237579345703, 64.81722259521484, 67.58206939697266, 70.34691619873047, 73.11176300048828, 75.8766098022461, 78.6414566040039, 81.40630340576172, 84.171142578125, 86.93598937988281, 89.70083618164062, 92.46568298339844]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 4.0, 4.0, 6.0, 6.0, 11.0, 15.0, 9.0, 14.0, 12.0, 23.0, 22.0, 18.0, 30.0, 21.0, 36.0, 31.0, 33.0, 41.0, 41.0, 39.0, 31.0, 35.0, 43.0, 33.0, 44.0, 39.0, 33.0, 43.0, 26.0, 32.0, 32.0, 24.0, 23.0, 20.0, 15.0, 14.0, 15.0, 10.0, 9.0, 8.0, 12.0, 9.0, 4.0, 5.0, 2.0, 5.0, 1.0, 2.0, 8.0, 1.0, 2.0, 3.0, 2.0], "bins": [-11.2578125, -10.9180908203125, -10.578369140625, -10.2386474609375, -9.89892578125, -9.5592041015625, -9.219482421875, -8.8797607421875, -8.5400390625, -8.2003173828125, -7.860595703125, -7.5208740234375, -7.18115234375, -6.8414306640625, -6.501708984375, -6.1619873046875, -5.822265625, -5.4825439453125, -5.142822265625, -4.8031005859375, -4.46337890625, -4.1236572265625, -3.783935546875, -3.4442138671875, -3.1044921875, -2.7647705078125, -2.425048828125, -2.0853271484375, -1.74560546875, -1.4058837890625, -1.066162109375, -0.7264404296875, -0.38671875, -0.0469970703125, 0.292724609375, 0.6324462890625, 0.97216796875, 1.3118896484375, 1.651611328125, 1.9913330078125, 2.3310546875, 2.6707763671875, 3.010498046875, 3.3502197265625, 3.68994140625, 4.0296630859375, 4.369384765625, 4.7091064453125, 5.048828125, 5.3885498046875, 5.728271484375, 6.0679931640625, 6.40771484375, 6.7474365234375, 7.087158203125, 7.4268798828125, 7.7666015625, 8.1063232421875, 8.446044921875, 8.7857666015625, 9.12548828125, 9.4652099609375, 9.804931640625, 10.1446533203125, 10.484375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 11.0, 8.0, 28.0, 22.0, 24.0, 29.0, 28.0, 41.0, 48.0, 77.0, 94.0, 132.0, 176.0, 240.0, 350.0, 655.0, 1593.0, 6382.0, 50228.0, 568827.0, 2378133.0, 1067285.0, 104566.0, 10579.0, 2300.0, 867.0, 419.0, 293.0, 196.0, 133.0, 109.0, 92.0, 57.0, 40.0, 51.0, 26.0, 27.0, 24.0, 17.0, 13.0, 12.0, 8.0, 7.0, 10.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-22.109375, -21.410888671875, -20.71240234375, -20.013916015625, -19.3154296875, -18.616943359375, -17.91845703125, -17.219970703125, -16.521484375, -15.822998046875, -15.12451171875, -14.426025390625, -13.7275390625, -13.029052734375, -12.33056640625, -11.632080078125, -10.93359375, -10.235107421875, -9.53662109375, -8.838134765625, -8.1396484375, -7.441162109375, -6.74267578125, -6.044189453125, -5.345703125, -4.647216796875, -3.94873046875, -3.250244140625, -2.5517578125, -1.853271484375, -1.15478515625, -0.456298828125, 0.2421875, 0.940673828125, 1.63916015625, 2.337646484375, 3.0361328125, 3.734619140625, 4.43310546875, 5.131591796875, 5.830078125, 6.528564453125, 7.22705078125, 7.925537109375, 8.6240234375, 9.322509765625, 10.02099609375, 10.719482421875, 11.41796875, 12.116455078125, 12.81494140625, 13.513427734375, 14.2119140625, 14.910400390625, 15.60888671875, 16.307373046875, 17.005859375, 17.704345703125, 18.40283203125, 19.101318359375, 19.7998046875, 20.498291015625, 21.19677734375, 21.895263671875, 22.59375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 4.0, 18.0, 21.0, 30.0, 47.0, 94.0, 124.0, 207.0, 314.0, 457.0, 607.0, 629.0, 489.0, 356.0, 222.0, 145.0, 87.0, 81.0, 36.0, 33.0, 16.0, 11.0, 9.0, 11.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.890625, -29.0859375, -28.28125, -27.4765625, -26.671875, -25.8671875, -25.0625, -24.2578125, -23.453125, -22.6484375, -21.84375, -21.0390625, -20.234375, -19.4296875, -18.625, -17.8203125, -17.015625, -16.2109375, -15.40625, -14.6015625, -13.796875, -12.9921875, -12.1875, -11.3828125, -10.578125, -9.7734375, -8.96875, -8.1640625, -7.359375, -6.5546875, -5.75, -4.9453125, -4.140625, -3.3359375, -2.53125, -1.7265625, -0.921875, -0.1171875, 0.6875, 1.4921875, 2.296875, 3.1015625, 3.90625, 4.7109375, 5.515625, 6.3203125, 7.125, 7.9296875, 8.734375, 9.5390625, 10.34375, 11.1484375, 11.953125, 12.7578125, 13.5625, 14.3671875, 15.171875, 15.9765625, 16.78125, 17.5859375, 18.390625, 19.1953125, 20.0, 20.8046875, 21.609375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 4.0, 13.0, 11.0, 30.0, 62.0, 78.0, 140.0, 265.0, 494.0, 998.0, 3170.0, 34075.0, 3406075.0, 733502.0, 11772.0, 1981.0, 738.0, 380.0, 207.0, 118.0, 58.0, 39.0, 29.0, 10.0, 8.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.5625, -62.3974609375, -60.232421875, -58.0673828125, -55.90234375, -53.7373046875, -51.572265625, -49.4072265625, -47.2421875, -45.0771484375, -42.912109375, -40.7470703125, -38.58203125, -36.4169921875, -34.251953125, -32.0869140625, -29.921875, -27.7568359375, -25.591796875, -23.4267578125, -21.26171875, -19.0966796875, -16.931640625, -14.7666015625, -12.6015625, -10.4365234375, -8.271484375, -6.1064453125, -3.94140625, -1.7763671875, 0.388671875, 2.5537109375, 4.71875, 6.8837890625, 9.048828125, 11.2138671875, 13.37890625, 15.5439453125, 17.708984375, 19.8740234375, 22.0390625, 24.2041015625, 26.369140625, 28.5341796875, 30.69921875, 32.8642578125, 35.029296875, 37.1943359375, 39.359375, 41.5244140625, 43.689453125, 45.8544921875, 48.01953125, 50.1845703125, 52.349609375, 54.5146484375, 56.6796875, 58.8447265625, 61.009765625, 63.1748046875, 65.33984375, 67.5048828125, 69.669921875, 71.8349609375, 74.0]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 7.0, 405.0, 594.0, 10.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.93930053710938, -111.90988159179688, -89.88045501708984, -67.85102844238281, -45.82160949707031, -23.792190551757812, -1.76275634765625, 20.26666259765625, 42.29608154296875, 64.32550048828125, 86.35492706298828, 108.38435363769531, 130.4137725830078, 152.4431915283203, 174.47262573242188, 196.50204467773438, 218.53146362304688, 240.56088256835938, 262.5903015136719, 284.6197509765625, 306.649169921875, 328.6785888671875, 350.7080078125, 372.7374267578125, 394.766845703125, 416.7962646484375, 438.82568359375, 460.8551025390625, 482.884521484375, 504.9139404296875, 526.943359375, 548.9727783203125, 571.002197265625, 593.0316162109375, 615.06103515625, 637.0904541015625, 659.119873046875, 681.1492919921875, 703.1787109375, 725.2081298828125, 747.237548828125, 769.2669677734375, 791.29638671875, 813.3258056640625, 835.355224609375, 857.3846435546875, 879.4140625, 901.4434814453125, 923.4729614257812, 945.5023803710938, 967.5317993164062, 989.5612182617188, 1011.5906372070312, 1033.6201171875, 1055.6495361328125, 1077.678955078125, 1099.7083740234375, 1121.73779296875, 1143.7672119140625, 1165.796630859375, 1187.8260498046875, 1209.85546875, 1231.8848876953125, 1253.914306640625, 1275.9437255859375]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 10.0, 5.0, 8.0, 18.0, 13.0, 9.0, 14.0, 26.0, 11.0, 18.0, 19.0, 37.0, 29.0, 31.0, 37.0, 34.0, 45.0, 33.0, 42.0, 45.0, 44.0, 49.0, 42.0, 41.0, 33.0, 36.0, 30.0, 28.0, 27.0, 17.0, 24.0, 16.0, 16.0, 17.0, 18.0, 18.0, 4.0, 13.0, 9.0, 5.0, 12.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-62.558265686035156, -60.59885025024414, -58.63943862915039, -56.680023193359375, -54.720611572265625, -52.76119613647461, -50.801780700683594, -48.842369079589844, -46.88295364379883, -44.92353820800781, -42.96412658691406, -41.00471115112305, -39.0452995300293, -37.08588409423828, -35.12647247314453, -33.167057037353516, -31.207643508911133, -29.24822998046875, -27.288816452026367, -25.329402923583984, -23.36998748779297, -21.410573959350586, -19.451160430908203, -17.491744995117188, -15.532332420349121, -13.572918891906738, -11.613504409790039, -9.654090881347656, -7.694676876068115, -5.735262870788574, -3.7758493423461914, -1.8164348602294922, 0.14297866821289062, 2.1023926734924316, 4.061806678771973, 6.0212202072143555, 7.9806342124938965, 9.940048217773438, 11.89946174621582, 13.85887622833252, 15.818289756774902, 17.7777042388916, 19.737117767333984, 21.696531295776367, 23.65594482421875, 25.615360260009766, 27.574771881103516, 29.53418731689453, 31.493600845336914, 33.4530143737793, 35.41242980957031, 37.37184143066406, 39.33125686645508, 41.290672302246094, 43.250083923339844, 45.20949935913086, 47.16891098022461, 49.128326416015625, 51.087738037109375, 53.04715347290039, 55.00656509399414, 56.965980529785156, 58.925392150878906, 60.88480758666992, 62.84422302246094]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 11.0, 7.0, 12.0, 13.0, 17.0, 16.0, 22.0, 23.0, 20.0, 29.0, 33.0, 28.0, 36.0, 39.0, 46.0, 48.0, 51.0, 52.0, 47.0, 47.0, 40.0, 41.0, 44.0, 45.0, 32.0, 33.0, 21.0, 28.0, 17.0, 16.0, 19.0, 10.0, 8.0, 11.0, 13.0, 8.0, 6.0, 1.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.78125, -12.3668212890625, -11.952392578125, -11.5379638671875, -11.12353515625, -10.7091064453125, -10.294677734375, -9.8802490234375, -9.4658203125, -9.0513916015625, -8.636962890625, -8.2225341796875, -7.80810546875, -7.3936767578125, -6.979248046875, -6.5648193359375, -6.150390625, -5.7359619140625, -5.321533203125, -4.9071044921875, -4.49267578125, -4.0782470703125, -3.663818359375, -3.2493896484375, -2.8349609375, -2.4205322265625, -2.006103515625, -1.5916748046875, -1.17724609375, -0.7628173828125, -0.348388671875, 0.0660400390625, 0.48046875, 0.8948974609375, 1.309326171875, 1.7237548828125, 2.13818359375, 2.5526123046875, 2.967041015625, 3.3814697265625, 3.7958984375, 4.2103271484375, 4.624755859375, 5.0391845703125, 5.45361328125, 5.8680419921875, 6.282470703125, 6.6968994140625, 7.111328125, 7.5257568359375, 7.940185546875, 8.3546142578125, 8.76904296875, 9.1834716796875, 9.597900390625, 10.0123291015625, 10.4267578125, 10.8411865234375, 11.255615234375, 11.6700439453125, 12.08447265625, 12.4989013671875, 12.913330078125, 13.3277587890625, 13.7421875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 3.0, 17.0, 17.0, 16.0, 26.0, 41.0, 62.0, 93.0, 126.0, 203.0, 286.0, 434.0, 550.0, 840.0, 1350.0, 2028.0, 3126.0, 4773.0, 7308.0, 11410.0, 17389.0, 27456.0, 45015.0, 77806.0, 150911.0, 361029.0, 142529.0, 74629.0, 43757.0, 26756.0, 16886.0, 10973.0, 7024.0, 4633.0, 3077.0, 1998.0, 1308.0, 823.0, 588.0, 360.0, 271.0, 194.0, 146.0, 87.0, 53.0, 47.0, 29.0, 22.0, 13.0, 7.0, 6.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.333984375, -3.22802734375, -3.1220703125, -3.01611328125, -2.91015625, -2.80419921875, -2.6982421875, -2.59228515625, -2.486328125, -2.38037109375, -2.2744140625, -2.16845703125, -2.0625, -1.95654296875, -1.8505859375, -1.74462890625, -1.638671875, -1.53271484375, -1.4267578125, -1.32080078125, -1.21484375, -1.10888671875, -1.0029296875, -0.89697265625, -0.791015625, -0.68505859375, -0.5791015625, -0.47314453125, -0.3671875, -0.26123046875, -0.1552734375, -0.04931640625, 0.056640625, 0.16259765625, 0.2685546875, 0.37451171875, 0.48046875, 0.58642578125, 0.6923828125, 0.79833984375, 0.904296875, 1.01025390625, 1.1162109375, 1.22216796875, 1.328125, 1.43408203125, 1.5400390625, 1.64599609375, 1.751953125, 1.85791015625, 1.9638671875, 2.06982421875, 2.17578125, 2.28173828125, 2.3876953125, 2.49365234375, 2.599609375, 2.70556640625, 2.8115234375, 2.91748046875, 3.0234375, 3.12939453125, 3.2353515625, 3.34130859375, 3.447265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 5.0, 3.0, 5.0, 6.0, 10.0, 5.0, 11.0, 7.0, 19.0, 20.0, 13.0, 18.0, 22.0, 33.0, 23.0, 27.0, 37.0, 28.0, 32.0, 34.0, 37.0, 44.0, 45.0, 1064.0, 49.0, 36.0, 44.0, 41.0, 39.0, 33.0, 33.0, 33.0, 25.0, 22.0, 24.0, 16.0, 13.0, 22.0, 8.0, 12.0, 7.0, 7.0, 4.0, 5.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.27734375, -7.03668212890625, -6.7960205078125, -6.55535888671875, -6.314697265625, -6.07403564453125, -5.8333740234375, -5.59271240234375, -5.35205078125, -5.11138916015625, -4.8707275390625, -4.63006591796875, -4.389404296875, -4.14874267578125, -3.9080810546875, -3.66741943359375, -3.4267578125, -3.18609619140625, -2.9454345703125, -2.70477294921875, -2.464111328125, -2.22344970703125, -1.9827880859375, -1.74212646484375, -1.50146484375, -1.26080322265625, -1.0201416015625, -0.77947998046875, -0.538818359375, -0.29815673828125, -0.0574951171875, 0.18316650390625, 0.423828125, 0.66448974609375, 0.9051513671875, 1.14581298828125, 1.386474609375, 1.62713623046875, 1.8677978515625, 2.10845947265625, 2.34912109375, 2.58978271484375, 2.8304443359375, 3.07110595703125, 3.311767578125, 3.55242919921875, 3.7930908203125, 4.03375244140625, 4.2744140625, 4.51507568359375, 4.7557373046875, 4.99639892578125, 5.237060546875, 5.47772216796875, 5.7183837890625, 5.95904541015625, 6.19970703125, 6.44036865234375, 6.6810302734375, 6.92169189453125, 7.162353515625, 7.40301513671875, 7.6436767578125, 7.88433837890625, 8.125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 12.0, 14.0, 21.0, 38.0, 62.0, 83.0, 110.0, 193.0, 285.0, 454.0, 663.0, 1006.0, 1366.0, 2046.0, 2948.0, 4324.0, 6662.0, 9589.0, 14474.0, 21984.0, 34060.0, 52673.0, 84523.0, 153866.0, 1363543.0, 129226.0, 75077.0, 47468.0, 30415.0, 19638.0, 13083.0, 8774.0, 5817.0, 4110.0, 2619.0, 1865.0, 1338.0, 883.0, 567.0, 416.0, 290.0, 164.0, 145.0, 87.0, 52.0, 32.0, 23.0, 23.0, 9.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.76171875, -2.670806884765625, -2.57989501953125, -2.488983154296875, -2.3980712890625, -2.307159423828125, -2.21624755859375, -2.125335693359375, -2.034423828125, -1.943511962890625, -1.85260009765625, -1.761688232421875, -1.6707763671875, -1.579864501953125, -1.48895263671875, -1.398040771484375, -1.30712890625, -1.216217041015625, -1.12530517578125, -1.034393310546875, -0.9434814453125, -0.852569580078125, -0.76165771484375, -0.670745849609375, -0.579833984375, -0.488922119140625, -0.39801025390625, -0.307098388671875, -0.2161865234375, -0.125274658203125, -0.03436279296875, 0.056549072265625, 0.1474609375, 0.238372802734375, 0.32928466796875, 0.420196533203125, 0.5111083984375, 0.602020263671875, 0.69293212890625, 0.783843994140625, 0.874755859375, 0.965667724609375, 1.05657958984375, 1.147491455078125, 1.2384033203125, 1.329315185546875, 1.42022705078125, 1.511138916015625, 1.60205078125, 1.692962646484375, 1.78387451171875, 1.874786376953125, 1.9656982421875, 2.056610107421875, 2.14752197265625, 2.238433837890625, 2.329345703125, 2.420257568359375, 2.51116943359375, 2.602081298828125, 2.6929931640625, 2.783905029296875, 2.87481689453125, 2.965728759765625, 3.056640625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 6.0, 6.0, 5.0, 4.0, 11.0, 11.0, 20.0, 15.0, 18.0, 28.0, 28.0, 21.0, 28.0, 31.0, 40.0, 53.0, 52.0, 36.0, 57.0, 56.0, 53.0, 61.0, 53.0, 34.0, 35.0, 38.0, 28.0, 26.0, 17.0, 20.0, 10.0, 24.0, 14.0, 9.0, 10.0, 7.0, 4.0, 5.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00044727325439453125, -0.0004339739680290222, -0.0004206746816635132, -0.00040737539529800415, -0.0003940761089324951, -0.0003807768225669861, -0.00036747753620147705, -0.000354178249835968, -0.000340878963470459, -0.00032757967710494995, -0.0003142803907394409, -0.0003009811043739319, -0.00028768181800842285, -0.0002743825316429138, -0.0002610832452774048, -0.00024778395891189575, -0.00023448467254638672, -0.00022118538618087769, -0.00020788609981536865, -0.00019458681344985962, -0.00018128752708435059, -0.00016798824071884155, -0.00015468895435333252, -0.00014138966798782349, -0.00012809038162231445, -0.00011479109525680542, -0.00010149180889129639, -8.819252252578735e-05, -7.489323616027832e-05, -6.159394979476929e-05, -4.8294663429260254e-05, -3.499537706375122e-05, -2.1696090698242188e-05, -8.396804332733154e-06, 4.902482032775879e-06, 1.8201768398284912e-05, 3.1501054763793945e-05, 4.480034112930298e-05, 5.809962749481201e-05, 7.139891386032104e-05, 8.469820022583008e-05, 9.799748659133911e-05, 0.00011129677295684814, 0.00012459605932235718, 0.0001378953456878662, 0.00015119463205337524, 0.00016449391841888428, 0.0001777932047843933, 0.00019109249114990234, 0.00020439177751541138, 0.0002176910638809204, 0.00023099035024642944, 0.0002442896366119385, 0.0002575889229774475, 0.00027088820934295654, 0.0002841874957084656, 0.0002974867820739746, 0.00031078606843948364, 0.0003240853548049927, 0.0003373846411705017, 0.00035068392753601074, 0.0003639832139015198, 0.0003772825002670288, 0.00039058178663253784, 0.0004038810729980469]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 12.0, 11.0, 11.0, 11.0, 15.0, 16.0, 26.0, 35.0, 33.0, 37.0, 52.0, 56.0, 101.0, 113.0, 161.0, 253.0, 364.0, 669.0, 3091.0, 876117.0, 164126.0, 1386.0, 556.0, 320.0, 233.0, 159.0, 120.0, 89.0, 64.0, 47.0, 44.0, 45.0, 27.0, 25.0, 23.0, 13.0, 11.0, 15.0, 13.0, 12.0, 9.0, 8.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.007381439208984375, -0.007142126560211182, -0.006902813911437988, -0.006663501262664795, -0.0064241886138916016, -0.006184875965118408, -0.005945563316345215, -0.0057062506675720215, -0.005466938018798828, -0.005227625370025635, -0.004988312721252441, -0.004749000072479248, -0.004509687423706055, -0.004270374774932861, -0.004031062126159668, -0.0037917494773864746, -0.0035524368286132812, -0.003313124179840088, -0.0030738115310668945, -0.002834498882293701, -0.002595186233520508, -0.0023558735847473145, -0.002116560935974121, -0.0018772482872009277, -0.0016379356384277344, -0.001398622989654541, -0.0011593103408813477, -0.0009199976921081543, -0.0006806850433349609, -0.0004413723945617676, -0.00020205974578857422, 3.725290298461914e-05, 0.0002765655517578125, 0.0005158782005310059, 0.0007551908493041992, 0.0009945034980773926, 0.001233816146850586, 0.0014731287956237793, 0.0017124414443969727, 0.001951754093170166, 0.0021910667419433594, 0.0024303793907165527, 0.002669692039489746, 0.0029090046882629395, 0.003148317337036133, 0.003387629985809326, 0.0036269426345825195, 0.003866255283355713, 0.004105567932128906, 0.0043448805809021, 0.004584193229675293, 0.004823505878448486, 0.00506281852722168, 0.005302131175994873, 0.005541443824768066, 0.00578075647354126, 0.006020069122314453, 0.0062593817710876465, 0.00649869441986084, 0.006738007068634033, 0.0069773197174072266, 0.00721663236618042, 0.007455945014953613, 0.007695257663726807, 0.0079345703125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 130.0, 524.0, 309.0, 43.0, 2.0, 0.0, 1.0], "bins": [-0.0024589516688138247, -0.00241710152477026, -0.002375251380726695, -0.0023334012366831303, -0.002291551325470209, -0.0022497011814266443, -0.0022078510373830795, -0.0021660008933395147, -0.00212415074929595, -0.002082300605252385, -0.0020404504612088203, -0.0019986003171652555, -0.0019567501731216908, -0.0019149001454934478, -0.0018730501178652048, -0.00183119997382164, -0.0017893498297780752, -0.0017474996857345104, -0.0017056495416909456, -0.0016637995140627027, -0.0016219493700191379, -0.001580099225975573, -0.00153824919834733, -0.0014963990543037653, -0.0014545489102602005, -0.0014126987662166357, -0.001370848622173071, -0.001328998594544828, -0.0012871484505012631, -0.0012452983064576983, -0.0012034482788294554, -0.0011615981347858906, -0.0011197479907423258, -0.001077897846698761, -0.0010360477026551962, -0.0009941976750269532, -0.0009523475309833884, -0.0009104973869398236, -0.0008686473011039197, -0.0008267972152680159, -0.0007849470712244511, -0.0007430969271808863, -0.0007012468413449824, -0.0006593967555090785, -0.0006175466114655137, -0.0005756964674219489, -0.000533846381586045, -0.0004919962957501411, -0.00045014615170657635, -0.000408296036766842, -0.00036644592182710767, -0.00032459580688737333, -0.000282745691947639, -0.00024089557700790465, -0.0001990454620681703, -0.00015719534712843597, -0.0001153452176367864, -7.349510269705206e-05, -3.164498775731772e-05, 1.0205127182416618e-05, 5.205524212215096e-05, 9.39053570618853e-05, 0.00013575547200161964, 0.00017760558694135398, 0.00021945570188108832]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 3.0, 10.0, 9.0, 8.0, 10.0, 18.0, 9.0, 24.0, 27.0, 31.0, 37.0, 35.0, 31.0, 35.0, 41.0, 58.0, 60.0, 46.0, 66.0, 36.0, 49.0, 40.0, 32.0, 28.0, 45.0, 33.0, 35.0, 27.0, 18.0, 19.0, 17.0, 15.0, 10.0, 7.0, 10.0, 1.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002516508102416992, -0.00024271663278341293, -0.00023378245532512665, -0.00022484827786684036, -0.00021591410040855408, -0.0002069799229502678, -0.0001980457454919815, -0.00018911156803369522, -0.00018017739057540894, -0.00017124321311712265, -0.00016230903565883636, -0.00015337485820055008, -0.0001444406807422638, -0.0001355065032839775, -0.00012657232582569122, -0.00011763814836740494, -0.00010870397090911865, -9.976979345083237e-05, -9.083561599254608e-05, -8.19014385342598e-05, -7.296726107597351e-05, -6.403308361768723e-05, -5.509890615940094e-05, -4.6164728701114655e-05, -3.723055124282837e-05, -2.8296373784542084e-05, -1.93621963262558e-05, -1.0428018867969513e-05, -1.4938414096832275e-06, 7.440336048603058e-06, 1.6374513506889343e-05, 2.530869096517563e-05, 3.4242868423461914e-05, 4.31770458817482e-05, 5.2111223340034485e-05, 6.104540079832077e-05, 6.997957825660706e-05, 7.891375571489334e-05, 8.784793317317963e-05, 9.678211063146591e-05, 0.0001057162880897522, 0.00011465046554803848, 0.00012358464300632477, 0.00013251882046461105, 0.00014145299792289734, 0.00015038717538118362, 0.0001593213528394699, 0.0001682555302977562, 0.00017718970775604248, 0.00018612388521432877, 0.00019505806267261505, 0.00020399224013090134, 0.00021292641758918762, 0.0002218605950474739, 0.0002307947725057602, 0.00023972894996404648, 0.00024866312742233276, 0.00025759730488061905, 0.00026653148233890533, 0.0002754656597971916, 0.0002843998372554779, 0.0002933340147137642, 0.0003022681921720505, 0.00031120236963033676, 0.00032013654708862305]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 11.0, 7.0, 12.0, 13.0, 17.0, 16.0, 22.0, 23.0, 20.0, 29.0, 33.0, 28.0, 37.0, 38.0, 48.0, 47.0, 50.0, 52.0, 48.0, 46.0, 40.0, 42.0, 43.0, 45.0, 32.0, 33.0, 21.0, 28.0, 18.0, 15.0, 19.0, 10.0, 8.0, 11.0, 13.0, 8.0, 6.0, 1.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.7734375, -12.359130859375, -11.94482421875, -11.530517578125, -11.1162109375, -10.701904296875, -10.28759765625, -9.873291015625, -9.458984375, -9.044677734375, -8.63037109375, -8.216064453125, -7.8017578125, -7.387451171875, -6.97314453125, -6.558837890625, -6.14453125, -5.730224609375, -5.31591796875, -4.901611328125, -4.4873046875, -4.072998046875, -3.65869140625, -3.244384765625, -2.830078125, -2.415771484375, -2.00146484375, -1.587158203125, -1.1728515625, -0.758544921875, -0.34423828125, 0.070068359375, 0.484375, 0.898681640625, 1.31298828125, 1.727294921875, 2.1416015625, 2.555908203125, 2.97021484375, 3.384521484375, 3.798828125, 4.213134765625, 4.62744140625, 5.041748046875, 5.4560546875, 5.870361328125, 6.28466796875, 6.698974609375, 7.11328125, 7.527587890625, 7.94189453125, 8.356201171875, 8.7705078125, 9.184814453125, 9.59912109375, 10.013427734375, 10.427734375, 10.842041015625, 11.25634765625, 11.670654296875, 12.0849609375, 12.499267578125, 12.91357421875, 13.327880859375, 13.7421875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 6.0, 9.0, 12.0, 19.0, 24.0, 44.0, 38.0, 56.0, 75.0, 109.0, 161.0, 237.0, 316.0, 609.0, 1043.0, 1973.0, 4321.0, 10256.0, 27286.0, 77914.0, 232954.0, 413396.0, 179522.0, 60687.0, 21553.0, 8237.0, 3540.0, 1684.0, 957.0, 496.0, 310.0, 192.0, 143.0, 81.0, 67.0, 64.0, 46.0, 29.0, 24.0, 15.0, 15.0, 12.0, 7.0, 1.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.4765625, -14.9671630859375, -14.457763671875, -13.9483642578125, -13.43896484375, -12.9295654296875, -12.420166015625, -11.9107666015625, -11.4013671875, -10.8919677734375, -10.382568359375, -9.8731689453125, -9.36376953125, -8.8543701171875, -8.344970703125, -7.8355712890625, -7.326171875, -6.8167724609375, -6.307373046875, -5.7979736328125, -5.28857421875, -4.7791748046875, -4.269775390625, -3.7603759765625, -3.2509765625, -2.7415771484375, -2.232177734375, -1.7227783203125, -1.21337890625, -0.7039794921875, -0.194580078125, 0.3148193359375, 0.82421875, 1.3336181640625, 1.843017578125, 2.3524169921875, 2.86181640625, 3.3712158203125, 3.880615234375, 4.3900146484375, 4.8994140625, 5.4088134765625, 5.918212890625, 6.4276123046875, 6.93701171875, 7.4464111328125, 7.955810546875, 8.4652099609375, 8.974609375, 9.4840087890625, 9.993408203125, 10.5028076171875, 11.01220703125, 11.5216064453125, 12.031005859375, 12.5404052734375, 13.0498046875, 13.5592041015625, 14.068603515625, 14.5780029296875, 15.08740234375, 15.5968017578125, 16.106201171875, 16.6156005859375, 17.125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 5.0, 8.0, 6.0, 6.0, 6.0, 3.0, 9.0, 9.0, 21.0, 10.0, 14.0, 19.0, 20.0, 33.0, 29.0, 31.0, 30.0, 47.0, 58.0, 69.0, 126.0, 207.0, 1502.0, 226.0, 121.0, 60.0, 52.0, 36.0, 38.0, 35.0, 32.0, 18.0, 21.0, 22.0, 17.0, 13.0, 20.0, 14.0, 11.0, 11.0, 9.0, 6.0, 3.0, 2.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-35.3125, -34.19287109375, -33.0732421875, -31.95361328125, -30.833984375, -29.71435546875, -28.5947265625, -27.47509765625, -26.35546875, -25.23583984375, -24.1162109375, -22.99658203125, -21.876953125, -20.75732421875, -19.6376953125, -18.51806640625, -17.3984375, -16.27880859375, -15.1591796875, -14.03955078125, -12.919921875, -11.80029296875, -10.6806640625, -9.56103515625, -8.44140625, -7.32177734375, -6.2021484375, -5.08251953125, -3.962890625, -2.84326171875, -1.7236328125, -0.60400390625, 0.515625, 1.63525390625, 2.7548828125, 3.87451171875, 4.994140625, 6.11376953125, 7.2333984375, 8.35302734375, 9.47265625, 10.59228515625, 11.7119140625, 12.83154296875, 13.951171875, 15.07080078125, 16.1904296875, 17.31005859375, 18.4296875, 19.54931640625, 20.6689453125, 21.78857421875, 22.908203125, 24.02783203125, 25.1474609375, 26.26708984375, 27.38671875, 28.50634765625, 29.6259765625, 30.74560546875, 31.865234375, 32.98486328125, 34.1044921875, 35.22412109375, 36.34375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 11.0, 8.0, 5.0, 8.0, 14.0, 19.0, 27.0, 37.0, 47.0, 83.0, 142.0, 226.0, 413.0, 706.0, 2330.0, 115273.0, 2988693.0, 34695.0, 1438.0, 565.0, 341.0, 216.0, 120.0, 91.0, 54.0, 24.0, 31.0, 17.0, 15.0, 10.0, 6.0, 6.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-82.4375, -79.5322265625, -76.626953125, -73.7216796875, -70.81640625, -67.9111328125, -65.005859375, -62.1005859375, -59.1953125, -56.2900390625, -53.384765625, -50.4794921875, -47.57421875, -44.6689453125, -41.763671875, -38.8583984375, -35.953125, -33.0478515625, -30.142578125, -27.2373046875, -24.33203125, -21.4267578125, -18.521484375, -15.6162109375, -12.7109375, -9.8056640625, -6.900390625, -3.9951171875, -1.08984375, 1.8154296875, 4.720703125, 7.6259765625, 10.53125, 13.4365234375, 16.341796875, 19.2470703125, 22.15234375, 25.0576171875, 27.962890625, 30.8681640625, 33.7734375, 36.6787109375, 39.583984375, 42.4892578125, 45.39453125, 48.2998046875, 51.205078125, 54.1103515625, 57.015625, 59.9208984375, 62.826171875, 65.7314453125, 68.63671875, 71.5419921875, 74.447265625, 77.3525390625, 80.2578125, 83.1630859375, 86.068359375, 88.9736328125, 91.87890625, 94.7841796875, 97.689453125, 100.5947265625, 103.5]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.0, 436.0, 430.0, 66.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-364.7219543457031, -356.0268859863281, -347.331787109375, -338.63671875, -329.9416198730469, -321.2465515136719, -312.55145263671875, -303.85638427734375, -295.1612854003906, -286.4662170410156, -277.7711181640625, -269.0760498046875, -260.3809509277344, -251.6858673095703, -242.99078369140625, -234.29571533203125, -225.6006317138672, -216.90554809570312, -208.21046447753906, -199.515380859375, -190.82029724121094, -182.12521362304688, -173.43014526367188, -164.73504638671875, -156.03997802734375, -147.3448944091797, -138.64981079101562, -129.95472717285156, -121.2596435546875, -112.56455993652344, -103.8694839477539, -95.17440032958984, -86.47929382324219, -77.78421020507812, -69.08912658691406, -60.394046783447266, -51.6989631652832, -43.00387954711914, -34.308799743652344, -25.61371612548828, -16.91863250732422, -8.223549842834473, 0.47153282165527344, 9.166614532470703, 17.861698150634766, 26.556781768798828, 35.251861572265625, 43.94694519042969, 52.64202880859375, 61.33711242675781, 70.03219604492188, 78.72727966308594, 87.42236328125, 96.11744689941406, 104.8125228881836, 113.50760650634766, 122.20269012451172, 130.89776611328125, 139.5928497314453, 148.28793334960938, 156.98301696777344, 165.6781005859375, 174.37318420410156, 183.06826782226562, 191.7633514404297]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 5.0, 7.0, 9.0, 6.0, 7.0, 11.0, 7.0, 8.0, 23.0, 12.0, 19.0, 22.0, 16.0, 29.0, 23.0, 34.0, 43.0, 40.0, 31.0, 39.0, 33.0, 33.0, 44.0, 40.0, 46.0, 38.0, 37.0, 29.0, 28.0, 30.0, 26.0, 33.0, 27.0, 21.0, 22.0, 20.0, 13.0, 12.0, 17.0, 12.0, 17.0, 4.0, 3.0, 9.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-72.80058288574219, -70.37996673583984, -67.95935821533203, -65.53874206542969, -63.11812973022461, -60.69751739501953, -58.27690124511719, -55.85628890991211, -53.43567657470703, -51.01506423950195, -48.594451904296875, -46.17383575439453, -43.75322341918945, -41.332611083984375, -38.91199493408203, -36.49138259887695, -34.070770263671875, -31.650157928466797, -29.229543685913086, -26.808929443359375, -24.388317108154297, -21.96770477294922, -19.547090530395508, -17.126476287841797, -14.705863952636719, -12.285250663757324, -9.86463737487793, -7.444024085998535, -5.023410797119141, -2.602797508239746, -0.18218421936035156, 2.2384300231933594, 4.659049987792969, 7.079663276672363, 9.500276565551758, 11.920889854431152, 14.341503143310547, 16.762115478515625, 19.182729721069336, 21.603343963623047, 24.023956298828125, 26.444568634033203, 28.865182876586914, 31.285797119140625, 33.7064094543457, 36.12702178955078, 38.547637939453125, 40.9682502746582, 43.38886260986328, 45.80947494506836, 48.23008728027344, 50.65070343017578, 53.07131576538086, 55.49192810058594, 57.91254425048828, 60.33315658569336, 62.75376892089844, 65.17438507080078, 67.5949935913086, 70.01560974121094, 72.43621826171875, 74.8568344116211, 77.27745056152344, 79.69805908203125, 82.1186752319336]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 8.0, 6.0, 7.0, 8.0, 12.0, 21.0, 12.0, 18.0, 16.0, 15.0, 25.0, 26.0, 32.0, 29.0, 52.0, 40.0, 45.0, 51.0, 38.0, 42.0, 44.0, 54.0, 43.0, 48.0, 53.0, 36.0, 32.0, 30.0, 36.0, 30.0, 14.0, 13.0, 16.0, 14.0, 10.0, 4.0, 8.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0234375, -13.5802001953125, -13.136962890625, -12.6937255859375, -12.25048828125, -11.8072509765625, -11.364013671875, -10.9207763671875, -10.4775390625, -10.0343017578125, -9.591064453125, -9.1478271484375, -8.70458984375, -8.2613525390625, -7.818115234375, -7.3748779296875, -6.931640625, -6.4884033203125, -6.045166015625, -5.6019287109375, -5.15869140625, -4.7154541015625, -4.272216796875, -3.8289794921875, -3.3857421875, -2.9425048828125, -2.499267578125, -2.0560302734375, -1.61279296875, -1.1695556640625, -0.726318359375, -0.2830810546875, 0.16015625, 0.6033935546875, 1.046630859375, 1.4898681640625, 1.93310546875, 2.3763427734375, 2.819580078125, 3.2628173828125, 3.7060546875, 4.1492919921875, 4.592529296875, 5.0357666015625, 5.47900390625, 5.9222412109375, 6.365478515625, 6.8087158203125, 7.251953125, 7.6951904296875, 8.138427734375, 8.5816650390625, 9.02490234375, 9.4681396484375, 9.911376953125, 10.3546142578125, 10.7978515625, 11.2410888671875, 11.684326171875, 12.1275634765625, 12.57080078125, 13.0140380859375, 13.457275390625, 13.9005126953125, 14.34375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 6.0, 10.0, 9.0, 19.0, 21.0, 21.0, 29.0, 37.0, 45.0, 77.0, 102.0, 161.0, 264.0, 445.0, 806.0, 1894.0, 5555.0, 23622.0, 134130.0, 712461.0, 1826554.0, 1156836.0, 271376.0, 45235.0, 9115.0, 2740.0, 1127.0, 595.0, 314.0, 201.0, 111.0, 96.0, 57.0, 35.0, 44.0, 25.0, 20.0, 12.0, 14.0, 8.0, 15.0, 3.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-17.328125, -16.798095703125, -16.26806640625, -15.738037109375, -15.2080078125, -14.677978515625, -14.14794921875, -13.617919921875, -13.087890625, -12.557861328125, -12.02783203125, -11.497802734375, -10.9677734375, -10.437744140625, -9.90771484375, -9.377685546875, -8.84765625, -8.317626953125, -7.78759765625, -7.257568359375, -6.7275390625, -6.197509765625, -5.66748046875, -5.137451171875, -4.607421875, -4.077392578125, -3.54736328125, -3.017333984375, -2.4873046875, -1.957275390625, -1.42724609375, -0.897216796875, -0.3671875, 0.162841796875, 0.69287109375, 1.222900390625, 1.7529296875, 2.282958984375, 2.81298828125, 3.343017578125, 3.873046875, 4.403076171875, 4.93310546875, 5.463134765625, 5.9931640625, 6.523193359375, 7.05322265625, 7.583251953125, 8.11328125, 8.643310546875, 9.17333984375, 9.703369140625, 10.2333984375, 10.763427734375, 11.29345703125, 11.823486328125, 12.353515625, 12.883544921875, 13.41357421875, 13.943603515625, 14.4736328125, 15.003662109375, 15.53369140625, 16.063720703125, 16.59375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 1.0, 2.0, 10.0, 5.0, 9.0, 9.0, 19.0, 27.0, 29.0, 35.0, 56.0, 79.0, 107.0, 165.0, 205.0, 282.0, 415.0, 452.0, 478.0, 439.0, 351.0, 260.0, 199.0, 117.0, 74.0, 62.0, 49.0, 32.0, 37.0, 25.0, 7.0, 12.0, 11.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.765625, -17.1787109375, -16.591796875, -16.0048828125, -15.41796875, -14.8310546875, -14.244140625, -13.6572265625, -13.0703125, -12.4833984375, -11.896484375, -11.3095703125, -10.72265625, -10.1357421875, -9.548828125, -8.9619140625, -8.375, -7.7880859375, -7.201171875, -6.6142578125, -6.02734375, -5.4404296875, -4.853515625, -4.2666015625, -3.6796875, -3.0927734375, -2.505859375, -1.9189453125, -1.33203125, -0.7451171875, -0.158203125, 0.4287109375, 1.015625, 1.6025390625, 2.189453125, 2.7763671875, 3.36328125, 3.9501953125, 4.537109375, 5.1240234375, 5.7109375, 6.2978515625, 6.884765625, 7.4716796875, 8.05859375, 8.6455078125, 9.232421875, 9.8193359375, 10.40625, 10.9931640625, 11.580078125, 12.1669921875, 12.75390625, 13.3408203125, 13.927734375, 14.5146484375, 15.1015625, 15.6884765625, 16.275390625, 16.8623046875, 17.44921875, 18.0361328125, 18.623046875, 19.2099609375, 19.796875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 11.0, 9.0, 14.0, 14.0, 22.0, 33.0, 46.0, 72.0, 93.0, 172.0, 284.0, 496.0, 1062.0, 2749.0, 8864.0, 37198.0, 240681.0, 2298373.0, 1429062.0, 140039.0, 24588.0, 6297.0, 2115.0, 874.0, 429.0, 230.0, 163.0, 91.0, 61.0, 39.0, 23.0, 19.0, 12.0, 19.0, 7.0, 0.0, 10.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-30.984375, -30.12060546875, -29.2568359375, -28.39306640625, -27.529296875, -26.66552734375, -25.8017578125, -24.93798828125, -24.07421875, -23.21044921875, -22.3466796875, -21.48291015625, -20.619140625, -19.75537109375, -18.8916015625, -18.02783203125, -17.1640625, -16.30029296875, -15.4365234375, -14.57275390625, -13.708984375, -12.84521484375, -11.9814453125, -11.11767578125, -10.25390625, -9.39013671875, -8.5263671875, -7.66259765625, -6.798828125, -5.93505859375, -5.0712890625, -4.20751953125, -3.34375, -2.47998046875, -1.6162109375, -0.75244140625, 0.111328125, 0.97509765625, 1.8388671875, 2.70263671875, 3.56640625, 4.43017578125, 5.2939453125, 6.15771484375, 7.021484375, 7.88525390625, 8.7490234375, 9.61279296875, 10.4765625, 11.34033203125, 12.2041015625, 13.06787109375, 13.931640625, 14.79541015625, 15.6591796875, 16.52294921875, 17.38671875, 18.25048828125, 19.1142578125, 19.97802734375, 20.841796875, 21.70556640625, 22.5693359375, 23.43310546875, 24.296875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 11.0, 178.0, 538.0, 259.0, 26.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.17774200439453, -114.42102813720703, -103.66431427001953, -92.90760040283203, -82.15088653564453, -71.39417266845703, -60.63745880126953, -49.88074493408203, -39.12403106689453, -28.36731719970703, -17.61060333251953, -6.853889465332031, 3.9028244018554688, 14.659538269042969, 25.41625213623047, 36.17296600341797, 46.92967987060547, 57.68639373779297, 68.44310760498047, 79.19982147216797, 89.95653533935547, 100.71324920654297, 111.46996307373047, 122.22667694091797, 132.9833984375, 143.7401123046875, 154.496826171875, 165.2535400390625, 176.01025390625, 186.7669677734375, 197.523681640625, 208.2803955078125, 219.037109375, 229.7938232421875, 240.550537109375, 251.3072509765625, 262.06396484375, 272.8206787109375, 283.577392578125, 294.3341064453125, 305.0908203125, 315.8475341796875, 326.604248046875, 337.3609619140625, 348.11767578125, 358.8743896484375, 369.631103515625, 380.3878173828125, 391.14453125, 401.9012451171875, 412.657958984375, 423.4146728515625, 434.17138671875, 444.9281005859375, 455.684814453125, 466.4415283203125, 477.1982421875, 487.9549560546875, 498.711669921875, 509.4683837890625, 520.22509765625, 530.9818115234375, 541.738525390625, 552.4952392578125, 563.251953125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 9.0, 8.0, 14.0, 7.0, 12.0, 18.0, 24.0, 22.0, 29.0, 24.0, 21.0, 25.0, 40.0, 55.0, 43.0, 42.0, 31.0, 42.0, 43.0, 47.0, 36.0, 33.0, 44.0, 34.0, 42.0, 35.0, 31.0, 27.0, 20.0, 20.0, 27.0, 18.0, 14.0, 14.0, 10.0, 5.0, 7.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.1490364074707, -54.22444152832031, -52.299842834472656, -50.375247955322266, -48.45064926147461, -46.52605438232422, -44.60145568847656, -42.67686080932617, -40.75226593017578, -38.82767105102539, -36.903072357177734, -34.978477478027344, -33.05387878417969, -31.129283905029297, -29.204687118530273, -27.28009033203125, -25.355491638183594, -23.43089485168457, -21.506298065185547, -19.581703186035156, -17.6571044921875, -15.732508659362793, -13.807912826538086, -11.883316040039062, -9.958719253540039, -8.034122467041016, -6.10952615737915, -4.184929847717285, -2.2603330612182617, -0.3357362747192383, 1.5888595581054688, 3.513456344604492, 5.43804931640625, 7.362646102905273, 9.287242889404297, 11.211838722229004, 13.136435508728027, 15.06103229522705, 16.985628128051758, 18.91022491455078, 20.834821701049805, 22.759418487548828, 24.68401527404785, 26.608612060546875, 28.533206939697266, 30.457805633544922, 32.38240051269531, 34.30699920654297, 36.23159408569336, 38.15618896484375, 40.080787658691406, 42.0053825378418, 43.92998123168945, 45.854576110839844, 47.7791748046875, 49.70376968383789, 51.62836456298828, 53.55295944213867, 55.47755813598633, 57.40215301513672, 59.326751708984375, 61.251346588134766, 63.175941467285156, 65.10054016113281, 67.02513885498047]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 7.0, 7.0, 9.0, 12.0, 12.0, 10.0, 19.0, 9.0, 15.0, 17.0, 25.0, 17.0, 21.0, 30.0, 27.0, 28.0, 39.0, 37.0, 44.0, 47.0, 42.0, 35.0, 40.0, 36.0, 51.0, 28.0, 33.0, 29.0, 42.0, 28.0, 27.0, 24.0, 19.0, 20.0, 27.0, 12.0, 16.0, 9.0, 14.0, 8.0, 6.0, 5.0, 6.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-12.0546875, -11.6754150390625, -11.296142578125, -10.9168701171875, -10.53759765625, -10.1583251953125, -9.779052734375, -9.3997802734375, -9.0205078125, -8.6412353515625, -8.261962890625, -7.8826904296875, -7.50341796875, -7.1241455078125, -6.744873046875, -6.3656005859375, -5.986328125, -5.6070556640625, -5.227783203125, -4.8485107421875, -4.46923828125, -4.0899658203125, -3.710693359375, -3.3314208984375, -2.9521484375, -2.5728759765625, -2.193603515625, -1.8143310546875, -1.43505859375, -1.0557861328125, -0.676513671875, -0.2972412109375, 0.08203125, 0.4613037109375, 0.840576171875, 1.2198486328125, 1.59912109375, 1.9783935546875, 2.357666015625, 2.7369384765625, 3.1162109375, 3.4954833984375, 3.874755859375, 4.2540283203125, 4.63330078125, 5.0125732421875, 5.391845703125, 5.7711181640625, 6.150390625, 6.5296630859375, 6.908935546875, 7.2882080078125, 7.66748046875, 8.0467529296875, 8.426025390625, 8.8052978515625, 9.1845703125, 9.5638427734375, 9.943115234375, 10.3223876953125, 10.70166015625, 11.0809326171875, 11.460205078125, 11.8394775390625, 12.21875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 14.0, 8.0, 7.0, 22.0, 28.0, 53.0, 68.0, 84.0, 161.0, 195.0, 303.0, 424.0, 603.0, 932.0, 1279.0, 1892.0, 2617.0, 3949.0, 5604.0, 8073.0, 11732.0, 17144.0, 26184.0, 40700.0, 66046.0, 121540.0, 302263.0, 190521.0, 91385.0, 53194.0, 33039.0, 21622.0, 14361.0, 9994.0, 6831.0, 4878.0, 3337.0, 2342.0, 1641.0, 1108.0, 741.0, 536.0, 335.0, 257.0, 149.0, 117.0, 82.0, 59.0, 32.0, 28.0, 19.0, 11.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-3.1015625, -3.00396728515625, -2.9063720703125, -2.80877685546875, -2.711181640625, -2.61358642578125, -2.5159912109375, -2.41839599609375, -2.32080078125, -2.22320556640625, -2.1256103515625, -2.02801513671875, -1.930419921875, -1.83282470703125, -1.7352294921875, -1.63763427734375, -1.5400390625, -1.44244384765625, -1.3448486328125, -1.24725341796875, -1.149658203125, -1.05206298828125, -0.9544677734375, -0.85687255859375, -0.75927734375, -0.66168212890625, -0.5640869140625, -0.46649169921875, -0.368896484375, -0.27130126953125, -0.1737060546875, -0.07611083984375, 0.021484375, 0.11907958984375, 0.2166748046875, 0.31427001953125, 0.411865234375, 0.50946044921875, 0.6070556640625, 0.70465087890625, 0.80224609375, 0.89984130859375, 0.9974365234375, 1.09503173828125, 1.192626953125, 1.29022216796875, 1.3878173828125, 1.48541259765625, 1.5830078125, 1.68060302734375, 1.7781982421875, 1.87579345703125, 1.973388671875, 2.07098388671875, 2.1685791015625, 2.26617431640625, 2.36376953125, 2.46136474609375, 2.5589599609375, 2.65655517578125, 2.754150390625, 2.85174560546875, 2.9493408203125, 3.04693603515625, 3.14453125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 5.0, 6.0, 4.0, 3.0, 10.0, 6.0, 8.0, 8.0, 12.0, 11.0, 19.0, 25.0, 16.0, 23.0, 18.0, 23.0, 32.0, 25.0, 41.0, 45.0, 46.0, 37.0, 36.0, 38.0, 36.0, 1054.0, 37.0, 35.0, 30.0, 29.0, 24.0, 31.0, 41.0, 40.0, 20.0, 24.0, 21.0, 12.0, 8.0, 19.0, 9.0, 6.0, 9.0, 12.0, 11.0, 6.0, 6.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.5703125, -7.334228515625, -7.09814453125, -6.862060546875, -6.6259765625, -6.389892578125, -6.15380859375, -5.917724609375, -5.681640625, -5.445556640625, -5.20947265625, -4.973388671875, -4.7373046875, -4.501220703125, -4.26513671875, -4.029052734375, -3.79296875, -3.556884765625, -3.32080078125, -3.084716796875, -2.8486328125, -2.612548828125, -2.37646484375, -2.140380859375, -1.904296875, -1.668212890625, -1.43212890625, -1.196044921875, -0.9599609375, -0.723876953125, -0.48779296875, -0.251708984375, -0.015625, 0.220458984375, 0.45654296875, 0.692626953125, 0.9287109375, 1.164794921875, 1.40087890625, 1.636962890625, 1.873046875, 2.109130859375, 2.34521484375, 2.581298828125, 2.8173828125, 3.053466796875, 3.28955078125, 3.525634765625, 3.76171875, 3.997802734375, 4.23388671875, 4.469970703125, 4.7060546875, 4.942138671875, 5.17822265625, 5.414306640625, 5.650390625, 5.886474609375, 6.12255859375, 6.358642578125, 6.5947265625, 6.830810546875, 7.06689453125, 7.302978515625, 7.5390625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 25.0, 26.0, 34.0, 56.0, 98.0, 138.0, 190.0, 283.0, 430.0, 590.0, 802.0, 1160.0, 1581.0, 2190.0, 2981.0, 4206.0, 6033.0, 8782.0, 12422.0, 18132.0, 27330.0, 40683.0, 62950.0, 100419.0, 191653.0, 1299109.0, 108980.0, 68348.0, 43975.0, 29235.0, 19490.0, 13370.0, 8925.0, 6501.0, 4590.0, 3304.0, 2318.0, 1661.0, 1190.0, 888.0, 622.0, 441.0, 314.0, 221.0, 153.0, 96.0, 87.0, 34.0, 20.0, 27.0, 10.0, 10.0, 6.0, 2.0, 1.0, 2.0, 1.0], "bins": [-2.8515625, -2.7626953125, -2.673828125, -2.5849609375, -2.49609375, -2.4072265625, -2.318359375, -2.2294921875, -2.140625, -2.0517578125, -1.962890625, -1.8740234375, -1.78515625, -1.6962890625, -1.607421875, -1.5185546875, -1.4296875, -1.3408203125, -1.251953125, -1.1630859375, -1.07421875, -0.9853515625, -0.896484375, -0.8076171875, -0.71875, -0.6298828125, -0.541015625, -0.4521484375, -0.36328125, -0.2744140625, -0.185546875, -0.0966796875, -0.0078125, 0.0810546875, 0.169921875, 0.2587890625, 0.34765625, 0.4365234375, 0.525390625, 0.6142578125, 0.703125, 0.7919921875, 0.880859375, 0.9697265625, 1.05859375, 1.1474609375, 1.236328125, 1.3251953125, 1.4140625, 1.5029296875, 1.591796875, 1.6806640625, 1.76953125, 1.8583984375, 1.947265625, 2.0361328125, 2.125, 2.2138671875, 2.302734375, 2.3916015625, 2.48046875, 2.5693359375, 2.658203125, 2.7470703125, 2.8359375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 10.0, 13.0, 13.0, 19.0, 20.0, 30.0, 58.0, 68.0, 117.0, 152.0, 119.0, 111.0, 65.0, 54.0, 45.0, 20.0, 23.0, 8.0, 11.0, 6.0, 10.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009703636169433594, -0.0009442195296287537, -0.000918075442314148, -0.0008919313549995422, -0.0008657872676849365, -0.0008396431803703308, -0.0008134990930557251, -0.0007873550057411194, -0.0007612109184265137, -0.000735066831111908, -0.0007089227437973022, -0.0006827786564826965, -0.0006566345691680908, -0.0006304904818534851, -0.0006043463945388794, -0.0005782023072242737, -0.000552058219909668, -0.0005259141325950623, -0.0004997700452804565, -0.00047362595796585083, -0.0004474818706512451, -0.0004213377833366394, -0.0003951936960220337, -0.000369049608707428, -0.00034290552139282227, -0.00031676143407821655, -0.00029061734676361084, -0.0002644732594490051, -0.00023832917213439941, -0.0002121850848197937, -0.000186040997505188, -0.00015989691019058228, -0.00013375282287597656, -0.00010760873556137085, -8.146464824676514e-05, -5.5320560932159424e-05, -2.917647361755371e-05, -3.032386302947998e-06, 2.3111701011657715e-05, 4.925578832626343e-05, 7.539987564086914e-05, 0.00010154396295547485, 0.00012768805027008057, 0.00015383213758468628, 0.000179976224899292, 0.0002061203122138977, 0.00023226439952850342, 0.00025840848684310913, 0.00028455257415771484, 0.00031069666147232056, 0.00033684074878692627, 0.000362984836101532, 0.0003891289234161377, 0.0004152730107307434, 0.0004414170980453491, 0.00046756118535995483, 0.0004937052726745605, 0.0005198493599891663, 0.000545993447303772, 0.0005721375346183777, 0.0005982816219329834, 0.0006244257092475891, 0.0006505697965621948, 0.0006767138838768005, 0.0007028579711914062]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 7.0, 3.0, 6.0, 4.0, 18.0, 15.0, 21.0, 20.0, 30.0, 34.0, 81.0, 144.0, 214.0, 418.0, 1402.0, 1031262.0, 13427.0, 681.0, 328.0, 171.0, 81.0, 51.0, 42.0, 30.0, 21.0, 16.0, 15.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01374053955078125, -0.01322638988494873, -0.012712240219116211, -0.012198090553283691, -0.011683940887451172, -0.011169791221618652, -0.010655641555786133, -0.010141491889953613, -0.009627342224121094, -0.009113192558288574, -0.008599042892456055, -0.008084893226623535, -0.007570743560791016, -0.007056593894958496, -0.0065424442291259766, -0.006028294563293457, -0.0055141448974609375, -0.004999995231628418, -0.0044858455657958984, -0.003971695899963379, -0.0034575462341308594, -0.00294339656829834, -0.0024292469024658203, -0.0019150972366333008, -0.0014009475708007812, -0.0008867979049682617, -0.0003726482391357422, 0.00014150142669677734, 0.0006556510925292969, 0.0011698007583618164, 0.001683950424194336, 0.0021981000900268555, 0.002712249755859375, 0.0032263994216918945, 0.003740549087524414, 0.004254698753356934, 0.004768848419189453, 0.005282998085021973, 0.005797147750854492, 0.006311297416687012, 0.006825447082519531, 0.007339596748352051, 0.00785374641418457, 0.00836789608001709, 0.00888204574584961, 0.009396195411682129, 0.009910345077514648, 0.010424494743347168, 0.010938644409179688, 0.011452794075012207, 0.011966943740844727, 0.012481093406677246, 0.012995243072509766, 0.013509392738342285, 0.014023542404174805, 0.014537692070007324, 0.015051841735839844, 0.015565991401672363, 0.016080141067504883, 0.016594290733337402, 0.017108440399169922, 0.01762259006500244, 0.01813673973083496, 0.01865088939666748, 0.0191650390625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 16.0, 50.0, 140.0, 303.0, 298.0, 161.0, 36.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008547219913452864, -0.0008295704610645771, -0.0008044189889915287, -0.0007792674587108195, -0.0007541159866377711, -0.0007289644563570619, -0.0007038129260763526, -0.0006786614540033042, -0.0006535099819302559, -0.0006283584516495466, -0.0006032069795764983, -0.000578055449295789, -0.0005529039772227407, -0.0005277524469420314, -0.0005026009166613221, -0.00047744944458827376, -0.0004522979143075645, -0.0004271464131306857, -0.0004019949119538069, -0.0003768433816730976, -0.00035169190960004926, -0.00032654037931934, -0.0003013888781424612, -0.00027623737696558237, -0.00025108587578870356, -0.00022593437461182475, -0.00020078287343494594, -0.0001756313577061519, -0.0001504798565292731, -0.00012532835535239428, -0.00010017683962360024, -7.502533844672143e-05, -4.9873837269842625e-05, -2.4722332454985008e-05, 4.291723598726094e-07, 2.5580680812709033e-05, 5.0732181989587843e-05, 7.588368316646665e-05, 0.00010103519889526069, 0.0001261867000721395, 0.0001513382012490183, 0.00017648970242589712, 0.00020164120360277593, 0.00022679271933156997, 0.000251944235060364, 0.00027709570713341236, 0.00030224723741412163, 0.00032739873859100044, 0.00035255023976787925, 0.00037770174094475806, 0.00040285324212163687, 0.00042800477240234613, 0.0004531562444753945, 0.00047830777475610375, 0.0005034592468291521, 0.0005286107771098614, 0.0005537623073905706, 0.0005789138376712799, 0.0006040653097443283, 0.0006292168400250375, 0.0006543683120980859, 0.0006795198423787951, 0.0007046713726595044, 0.0007298228447325528, 0.0007549743168056011]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 8.0, 5.0, 4.0, 12.0, 14.0, 19.0, 15.0, 16.0, 27.0, 24.0, 31.0, 32.0, 35.0, 45.0, 40.0, 29.0, 47.0, 29.0, 29.0, 52.0, 57.0, 37.0, 46.0, 33.0, 41.0, 40.0, 26.0, 36.0, 26.0, 32.0, 17.0, 25.0, 11.0, 12.0, 13.0, 12.0, 8.0, 5.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003191232681274414, -0.00030984170734882355, -0.0003005601465702057, -0.00029127858579158783, -0.00028199702501296997, -0.0002727154642343521, -0.00026343390345573425, -0.0002541523426771164, -0.00024487078189849854, -0.00023558922111988068, -0.00022630766034126282, -0.00021702609956264496, -0.0002077445387840271, -0.00019846297800540924, -0.00018918141722679138, -0.00017989985644817352, -0.00017061829566955566, -0.0001613367348909378, -0.00015205517411231995, -0.0001427736133337021, -0.00013349205255508423, -0.00012421049177646637, -0.00011492893099784851, -0.00010564737021923065, -9.636580944061279e-05, -8.708424866199493e-05, -7.780268788337708e-05, -6.852112710475922e-05, -5.923956632614136e-05, -4.99580055475235e-05, -4.067644476890564e-05, -3.139488399028778e-05, -2.2113323211669922e-05, -1.2831762433052063e-05, -3.550201654434204e-06, 5.731359124183655e-06, 1.5012919902801514e-05, 2.4294480681419373e-05, 3.357604146003723e-05, 4.285760223865509e-05, 5.213916301727295e-05, 6.142072379589081e-05, 7.070228457450867e-05, 7.998384535312653e-05, 8.926540613174438e-05, 9.854696691036224e-05, 0.0001078285276889801, 0.00011711008846759796, 0.00012639164924621582, 0.00013567321002483368, 0.00014495477080345154, 0.0001542363315820694, 0.00016351789236068726, 0.00017279945313930511, 0.00018208101391792297, 0.00019136257469654083, 0.0002006441354751587, 0.00020992569625377655, 0.0002192072570323944, 0.00022848881781101227, 0.00023777037858963013, 0.000247051939368248, 0.00025633350014686584, 0.0002656150609254837, 0.00027489662170410156]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 7.0, 7.0, 9.0, 12.0, 12.0, 10.0, 19.0, 9.0, 15.0, 17.0, 25.0, 17.0, 21.0, 30.0, 27.0, 28.0, 39.0, 37.0, 44.0, 47.0, 42.0, 35.0, 40.0, 36.0, 51.0, 28.0, 33.0, 29.0, 42.0, 28.0, 27.0, 24.0, 19.0, 20.0, 27.0, 12.0, 16.0, 9.0, 14.0, 8.0, 6.0, 5.0, 6.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-12.0546875, -11.6754150390625, -11.296142578125, -10.9168701171875, -10.53759765625, -10.1583251953125, -9.779052734375, -9.3997802734375, -9.0205078125, -8.6412353515625, -8.261962890625, -7.8826904296875, -7.50341796875, -7.1241455078125, -6.744873046875, -6.3656005859375, -5.986328125, -5.6070556640625, -5.227783203125, -4.8485107421875, -4.46923828125, -4.0899658203125, -3.710693359375, -3.3314208984375, -2.9521484375, -2.5728759765625, -2.193603515625, -1.8143310546875, -1.43505859375, -1.0557861328125, -0.676513671875, -0.2972412109375, 0.08203125, 0.4613037109375, 0.840576171875, 1.2198486328125, 1.59912109375, 1.9783935546875, 2.357666015625, 2.7369384765625, 3.1162109375, 3.4954833984375, 3.874755859375, 4.2540283203125, 4.63330078125, 5.0125732421875, 5.391845703125, 5.7711181640625, 6.150390625, 6.5296630859375, 6.908935546875, 7.2882080078125, 7.66748046875, 8.0467529296875, 8.426025390625, 8.8052978515625, 9.1845703125, 9.5638427734375, 9.943115234375, 10.3223876953125, 10.70166015625, 11.0809326171875, 11.460205078125, 11.8394775390625, 12.21875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 12.0, 22.0, 16.0, 21.0, 34.0, 40.0, 64.0, 72.0, 105.0, 148.0, 192.0, 237.0, 358.0, 525.0, 800.0, 1353.0, 2511.0, 5719.0, 15060.0, 44479.0, 127636.0, 303592.0, 322192.0, 143678.0, 49390.0, 16851.0, 6259.0, 2911.0, 1534.0, 865.0, 518.0, 335.0, 274.0, 184.0, 118.0, 109.0, 89.0, 54.0, 51.0, 34.0, 31.0, 18.0, 12.0, 13.0, 10.0, 3.0, 9.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.640625, -16.13720703125, -15.6337890625, -15.13037109375, -14.626953125, -14.12353515625, -13.6201171875, -13.11669921875, -12.61328125, -12.10986328125, -11.6064453125, -11.10302734375, -10.599609375, -10.09619140625, -9.5927734375, -9.08935546875, -8.5859375, -8.08251953125, -7.5791015625, -7.07568359375, -6.572265625, -6.06884765625, -5.5654296875, -5.06201171875, -4.55859375, -4.05517578125, -3.5517578125, -3.04833984375, -2.544921875, -2.04150390625, -1.5380859375, -1.03466796875, -0.53125, -0.02783203125, 0.4755859375, 0.97900390625, 1.482421875, 1.98583984375, 2.4892578125, 2.99267578125, 3.49609375, 3.99951171875, 4.5029296875, 5.00634765625, 5.509765625, 6.01318359375, 6.5166015625, 7.02001953125, 7.5234375, 8.02685546875, 8.5302734375, 9.03369140625, 9.537109375, 10.04052734375, 10.5439453125, 11.04736328125, 11.55078125, 12.05419921875, 12.5576171875, 13.06103515625, 13.564453125, 14.06787109375, 14.5712890625, 15.07470703125, 15.578125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 15.0, 18.0, 20.0, 26.0, 25.0, 31.0, 33.0, 32.0, 61.0, 68.0, 78.0, 128.0, 307.0, 1432.0, 249.0, 131.0, 61.0, 35.0, 51.0, 40.0, 31.0, 35.0, 22.0, 20.0, 19.0, 11.0, 12.0, 9.0, 7.0, 12.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.875, -37.6357421875, -36.396484375, -35.1572265625, -33.91796875, -32.6787109375, -31.439453125, -30.2001953125, -28.9609375, -27.7216796875, -26.482421875, -25.2431640625, -24.00390625, -22.7646484375, -21.525390625, -20.2861328125, -19.046875, -17.8076171875, -16.568359375, -15.3291015625, -14.08984375, -12.8505859375, -11.611328125, -10.3720703125, -9.1328125, -7.8935546875, -6.654296875, -5.4150390625, -4.17578125, -2.9365234375, -1.697265625, -0.4580078125, 0.78125, 2.0205078125, 3.259765625, 4.4990234375, 5.73828125, 6.9775390625, 8.216796875, 9.4560546875, 10.6953125, 11.9345703125, 13.173828125, 14.4130859375, 15.65234375, 16.8916015625, 18.130859375, 19.3701171875, 20.609375, 21.8486328125, 23.087890625, 24.3271484375, 25.56640625, 26.8056640625, 28.044921875, 29.2841796875, 30.5234375, 31.7626953125, 33.001953125, 34.2412109375, 35.48046875, 36.7197265625, 37.958984375, 39.1982421875, 40.4375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 5.0, 7.0, 7.0, 9.0, 14.0, 16.0, 26.0, 24.0, 44.0, 71.0, 84.0, 124.0, 191.0, 330.0, 587.0, 1186.0, 12733.0, 2792290.0, 332074.0, 3729.0, 859.0, 451.0, 274.0, 179.0, 109.0, 77.0, 51.0, 43.0, 28.0, 13.0, 18.0, 9.0, 15.0, 3.0, 4.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-92.9375, -90.10546875, -87.2734375, -84.44140625, -81.609375, -78.77734375, -75.9453125, -73.11328125, -70.28125, -67.44921875, -64.6171875, -61.78515625, -58.953125, -56.12109375, -53.2890625, -50.45703125, -47.625, -44.79296875, -41.9609375, -39.12890625, -36.296875, -33.46484375, -30.6328125, -27.80078125, -24.96875, -22.13671875, -19.3046875, -16.47265625, -13.640625, -10.80859375, -7.9765625, -5.14453125, -2.3125, 0.51953125, 3.3515625, 6.18359375, 9.015625, 11.84765625, 14.6796875, 17.51171875, 20.34375, 23.17578125, 26.0078125, 28.83984375, 31.671875, 34.50390625, 37.3359375, 40.16796875, 43.0, 45.83203125, 48.6640625, 51.49609375, 54.328125, 57.16015625, 59.9921875, 62.82421875, 65.65625, 68.48828125, 71.3203125, 74.15234375, 76.984375, 79.81640625, 82.6484375, 85.48046875, 88.3125]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 12.0, 57.0, 163.0, 326.0, 281.0, 108.0, 45.0, 15.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.46192169189453, -36.72151184082031, -31.98110008239746, -27.24068832397461, -22.50027847290039, -17.759868621826172, -13.01945686340332, -8.279045104980469, -3.53863525390625, 1.2017755508422852, 5.94218635559082, 10.682597160339355, 15.42300796508789, 20.16341781616211, 24.90382957458496, 29.644241333007812, 34.38465118408203, 39.12506103515625, 43.86547088623047, 48.60588455200195, 53.34629440307617, 58.08670425415039, 62.827117919921875, 67.5675277709961, 72.30793762207031, 77.04834747314453, 81.78875732421875, 86.52916717529297, 91.26957702636719, 96.00999450683594, 100.75040435791016, 105.49081420898438, 110.23123168945312, 114.97164154052734, 119.71205139160156, 124.45246124267578, 129.19287109375, 133.93328857421875, 138.67369079589844, 143.4141082763672, 148.15451049804688, 152.89492797851562, 157.6353302001953, 162.37574768066406, 167.11614990234375, 171.8565673828125, 176.5969696044922, 181.33738708496094, 186.0778045654297, 190.81822204589844, 195.55862426757812, 200.29904174804688, 205.03944396972656, 209.7798614501953, 214.520263671875, 219.26068115234375, 224.0010986328125, 228.74151611328125, 233.48191833496094, 238.2223358154297, 242.96273803710938, 247.70315551757812, 252.4435577392578, 257.1839599609375, 261.92437744140625]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 6.0, 8.0, 4.0, 8.0, 10.0, 6.0, 17.0, 14.0, 18.0, 20.0, 21.0, 30.0, 34.0, 33.0, 34.0, 45.0, 36.0, 41.0, 45.0, 50.0, 37.0, 39.0, 35.0, 42.0, 51.0, 30.0, 36.0, 27.0, 30.0, 29.0, 28.0, 13.0, 25.0, 19.0, 12.0, 14.0, 13.0, 10.0, 8.0, 4.0, 2.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-76.55532836914062, -74.0134506225586, -71.47157287597656, -68.92969512939453, -66.3878173828125, -63.84593963623047, -61.30406188964844, -58.762184143066406, -56.220306396484375, -53.678428649902344, -51.13655090332031, -48.59467315673828, -46.05279541015625, -43.51091766357422, -40.96903991699219, -38.427162170410156, -35.885284423828125, -33.343406677246094, -30.801528930664062, -28.25965118408203, -25.7177734375, -23.17589569091797, -20.634017944335938, -18.092140197753906, -15.550262451171875, -13.008384704589844, -10.466506958007812, -7.924629211425781, -5.38275146484375, -2.8408737182617188, -0.2989959716796875, 2.2428817749023438, 4.784751892089844, 7.326629638671875, 9.868507385253906, 12.410385131835938, 14.952262878417969, 17.494140625, 20.03601837158203, 22.577896118164062, 25.119773864746094, 27.661651611328125, 30.203529357910156, 32.74540710449219, 35.28728485107422, 37.82916259765625, 40.37104034423828, 42.91291809082031, 45.454795837402344, 47.996673583984375, 50.538551330566406, 53.08042907714844, 55.62230682373047, 58.1641845703125, 60.70606231689453, 63.24794006347656, 65.7898178100586, 68.33169555664062, 70.87357330322266, 73.41545104980469, 75.95732879638672, 78.49920654296875, 81.04108428955078, 83.58296203613281, 86.12483978271484]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 8.0, 11.0, 5.0, 11.0, 7.0, 12.0, 7.0, 16.0, 16.0, 28.0, 22.0, 23.0, 37.0, 24.0, 25.0, 32.0, 36.0, 47.0, 33.0, 44.0, 39.0, 45.0, 43.0, 26.0, 47.0, 28.0, 44.0, 33.0, 34.0, 38.0, 25.0, 24.0, 19.0, 20.0, 15.0, 22.0, 9.0, 8.0, 8.0, 7.0, 7.0, 5.0, 10.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-13.8359375, -13.4339599609375, -13.031982421875, -12.6300048828125, -12.22802734375, -11.8260498046875, -11.424072265625, -11.0220947265625, -10.6201171875, -10.2181396484375, -9.816162109375, -9.4141845703125, -9.01220703125, -8.6102294921875, -8.208251953125, -7.8062744140625, -7.404296875, -7.0023193359375, -6.600341796875, -6.1983642578125, -5.79638671875, -5.3944091796875, -4.992431640625, -4.5904541015625, -4.1884765625, -3.7864990234375, -3.384521484375, -2.9825439453125, -2.58056640625, -2.1785888671875, -1.776611328125, -1.3746337890625, -0.97265625, -0.5706787109375, -0.168701171875, 0.2332763671875, 0.63525390625, 1.0372314453125, 1.439208984375, 1.8411865234375, 2.2431640625, 2.6451416015625, 3.047119140625, 3.4490966796875, 3.85107421875, 4.2530517578125, 4.655029296875, 5.0570068359375, 5.458984375, 5.8609619140625, 6.262939453125, 6.6649169921875, 7.06689453125, 7.4688720703125, 7.870849609375, 8.2728271484375, 8.6748046875, 9.0767822265625, 9.478759765625, 9.8807373046875, 10.28271484375, 10.6846923828125, 11.086669921875, 11.4886474609375, 11.890625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 8.0, 0.0, 6.0, 8.0, 13.0, 10.0, 21.0, 12.0, 22.0, 22.0, 26.0, 45.0, 52.0, 56.0, 74.0, 118.0, 157.0, 196.0, 247.0, 319.0, 439.0, 1371.0, 2875796.0, 1312474.0, 1083.0, 350.0, 272.0, 252.0, 178.0, 139.0, 106.0, 81.0, 64.0, 44.0, 40.0, 34.0, 26.0, 25.0, 22.0, 13.0, 9.0, 10.0, 12.0, 6.0, 5.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-147.25, -142.78125, -138.3125, -133.84375, -129.375, -124.90625, -120.4375, -115.96875, -111.5, -107.03125, -102.5625, -98.09375, -93.625, -89.15625, -84.6875, -80.21875, -75.75, -71.28125, -66.8125, -62.34375, -57.875, -53.40625, -48.9375, -44.46875, -40.0, -35.53125, -31.0625, -26.59375, -22.125, -17.65625, -13.1875, -8.71875, -4.25, 0.21875, 4.6875, 9.15625, 13.625, 18.09375, 22.5625, 27.03125, 31.5, 35.96875, 40.4375, 44.90625, 49.375, 53.84375, 58.3125, 62.78125, 67.25, 71.71875, 76.1875, 80.65625, 85.125, 89.59375, 94.0625, 98.53125, 103.0, 107.46875, 111.9375, 116.40625, 120.875, 125.34375, 129.8125, 134.28125, 138.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 9.0, 9.0, 8.0, 15.0, 25.0, 27.0, 51.0, 47.0, 63.0, 80.0, 98.0, 151.0, 220.0, 272.0, 361.0, 479.0, 490.0, 409.0, 316.0, 265.0, 171.0, 120.0, 90.0, 78.0, 44.0, 32.0, 29.0, 24.0, 16.0, 10.0, 11.0, 6.0, 11.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.359375, -18.776123046875, -18.19287109375, -17.609619140625, -17.0263671875, -16.443115234375, -15.85986328125, -15.276611328125, -14.693359375, -14.110107421875, -13.52685546875, -12.943603515625, -12.3603515625, -11.777099609375, -11.19384765625, -10.610595703125, -10.02734375, -9.444091796875, -8.86083984375, -8.277587890625, -7.6943359375, -7.111083984375, -6.52783203125, -5.944580078125, -5.361328125, -4.778076171875, -4.19482421875, -3.611572265625, -3.0283203125, -2.445068359375, -1.86181640625, -1.278564453125, -0.6953125, -0.112060546875, 0.47119140625, 1.054443359375, 1.6376953125, 2.220947265625, 2.80419921875, 3.387451171875, 3.970703125, 4.553955078125, 5.13720703125, 5.720458984375, 6.3037109375, 6.886962890625, 7.47021484375, 8.053466796875, 8.63671875, 9.219970703125, 9.80322265625, 10.386474609375, 10.9697265625, 11.552978515625, 12.13623046875, 12.719482421875, 13.302734375, 13.885986328125, 14.46923828125, 15.052490234375, 15.6357421875, 16.218994140625, 16.80224609375, 17.385498046875, 17.96875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 6.0, 12.0, 17.0, 13.0, 20.0, 31.0, 24.0, 33.0, 35.0, 70.0, 103.0, 221.0, 676.0, 10775.0, 3691016.0, 487374.0, 2930.0, 433.0, 155.0, 85.0, 55.0, 39.0, 30.0, 22.0, 28.0, 12.0, 19.0, 10.0, 11.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.6875, -78.525390625, -75.36328125, -72.201171875, -69.0390625, -65.876953125, -62.71484375, -59.552734375, -56.390625, -53.228515625, -50.06640625, -46.904296875, -43.7421875, -40.580078125, -37.41796875, -34.255859375, -31.09375, -27.931640625, -24.76953125, -21.607421875, -18.4453125, -15.283203125, -12.12109375, -8.958984375, -5.796875, -2.634765625, 0.52734375, 3.689453125, 6.8515625, 10.013671875, 13.17578125, 16.337890625, 19.5, 22.662109375, 25.82421875, 28.986328125, 32.1484375, 35.310546875, 38.47265625, 41.634765625, 44.796875, 47.958984375, 51.12109375, 54.283203125, 57.4453125, 60.607421875, 63.76953125, 66.931640625, 70.09375, 73.255859375, 76.41796875, 79.580078125, 82.7421875, 85.904296875, 89.06640625, 92.228515625, 95.390625, 98.552734375, 101.71484375, 104.876953125, 108.0390625, 111.201171875, 114.36328125, 117.525390625, 120.6875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 77.0, 556.0, 353.0, 26.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-484.9032897949219, -472.0851745605469, -459.26708984375, -446.448974609375, -433.6308898925781, -420.8127746582031, -407.99468994140625, -395.17657470703125, -382.35845947265625, -369.54034423828125, -356.7222595214844, -343.9041442871094, -331.0860595703125, -318.2679443359375, -305.4498291015625, -292.6317443847656, -279.81365966796875, -266.99554443359375, -254.17745971679688, -241.35934448242188, -228.541259765625, -215.72314453125, -202.90504455566406, -190.08694458007812, -177.2688446044922, -164.45074462890625, -151.6326446533203, -138.81454467773438, -125.9964370727539, -113.17833709716797, -100.3602294921875, -87.54212951660156, -74.72406005859375, -61.90596008300781, -49.08785629272461, -36.269752502441406, -23.45165252685547, -10.633552551269531, 2.1845550537109375, 15.002655029296875, 27.820755004882812, 40.63885498046875, 53.45695877075195, 66.27506256103516, 79.0931625366211, 91.91126251220703, 104.7293701171875, 117.54747009277344, 130.36557006835938, 143.1836700439453, 156.00177001953125, 168.81988525390625, 181.63796997070312, 194.45608520507812, 207.27418518066406, 220.09228515625, 232.91038513183594, 245.72848510742188, 258.5466003417969, 271.36468505859375, 284.18280029296875, 297.0008850097656, 309.8190002441406, 322.6370849609375, 335.4552001953125]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 7.0, 2.0, 3.0, 13.0, 8.0, 20.0, 8.0, 21.0, 18.0, 21.0, 22.0, 22.0, 22.0, 30.0, 27.0, 26.0, 31.0, 42.0, 30.0, 29.0, 48.0, 47.0, 44.0, 40.0, 42.0, 31.0, 39.0, 22.0, 23.0, 32.0, 36.0, 32.0, 31.0, 21.0, 20.0, 20.0, 10.0, 10.0, 16.0, 10.0, 4.0, 9.0, 3.0, 4.0, 7.0, 2.0, 2.0, 2.0], "bins": [-78.47827911376953, -76.45101928710938, -74.42375183105469, -72.39649200439453, -70.36923217773438, -68.34196472167969, -66.31470489501953, -64.28744506835938, -62.26017761230469, -60.232913970947266, -58.20565414428711, -56.17839050292969, -54.151126861572266, -52.123863220214844, -50.09660339355469, -48.069339752197266, -46.04207992553711, -44.01481628417969, -41.98755645751953, -39.96029281616211, -37.93302917480469, -35.90576934814453, -33.87850570678711, -31.851242065429688, -29.8239803314209, -27.79671859741211, -25.769454956054688, -23.7421932220459, -21.71493148803711, -19.687667846679688, -17.6604061126709, -15.633143424987793, -13.605884552001953, -11.578621864318848, -9.551359176635742, -7.524097442626953, -5.496834754943848, -3.469572067260742, -1.4423103332519531, 0.5849523544311523, 2.612215042114258, 4.639477729797363, 6.6667399406433105, 8.694002151489258, 10.721264839172363, 12.748527526855469, 14.775789260864258, 16.803050994873047, 18.83031463623047, 20.857576370239258, 22.88484001159668, 24.91210174560547, 26.93936538696289, 28.96662712097168, 30.99388885498047, 33.02115249633789, 35.04841613769531, 37.075679779052734, 39.10293960571289, 41.13020324707031, 43.157466888427734, 45.184730529785156, 47.21199035644531, 49.239253997802734, 51.26651382446289]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 6.0, 11.0, 11.0, 8.0, 6.0, 13.0, 14.0, 15.0, 22.0, 21.0, 28.0, 30.0, 23.0, 29.0, 32.0, 28.0, 30.0, 29.0, 36.0, 38.0, 35.0, 39.0, 33.0, 30.0, 38.0, 40.0, 34.0, 32.0, 32.0, 28.0, 31.0, 19.0, 29.0, 20.0, 19.0, 11.0, 20.0, 13.0, 11.0, 8.0, 6.0, 8.0, 9.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.328125, -10.9697265625, -10.611328125, -10.2529296875, -9.89453125, -9.5361328125, -9.177734375, -8.8193359375, -8.4609375, -8.1025390625, -7.744140625, -7.3857421875, -7.02734375, -6.6689453125, -6.310546875, -5.9521484375, -5.59375, -5.2353515625, -4.876953125, -4.5185546875, -4.16015625, -3.8017578125, -3.443359375, -3.0849609375, -2.7265625, -2.3681640625, -2.009765625, -1.6513671875, -1.29296875, -0.9345703125, -0.576171875, -0.2177734375, 0.140625, 0.4990234375, 0.857421875, 1.2158203125, 1.57421875, 1.9326171875, 2.291015625, 2.6494140625, 3.0078125, 3.3662109375, 3.724609375, 4.0830078125, 4.44140625, 4.7998046875, 5.158203125, 5.5166015625, 5.875, 6.2333984375, 6.591796875, 6.9501953125, 7.30859375, 7.6669921875, 8.025390625, 8.3837890625, 8.7421875, 9.1005859375, 9.458984375, 9.8173828125, 10.17578125, 10.5341796875, 10.892578125, 11.2509765625, 11.609375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 14.0, 16.0, 24.0, 31.0, 39.0, 70.0, 117.0, 162.0, 263.0, 339.0, 554.0, 874.0, 1307.0, 1902.0, 2951.0, 4615.0, 6991.0, 11045.0, 17585.0, 28657.0, 47469.0, 83801.0, 169735.0, 344956.0, 140732.0, 72727.0, 41933.0, 25550.0, 15763.0, 9914.0, 6339.0, 4193.0, 2652.0, 1768.0, 1184.0, 770.0, 485.0, 336.0, 231.0, 151.0, 106.0, 56.0, 51.0, 31.0, 21.0, 11.0, 10.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.716796875, -3.602020263671875, -3.48724365234375, -3.372467041015625, -3.2576904296875, -3.142913818359375, -3.02813720703125, -2.913360595703125, -2.798583984375, -2.683807373046875, -2.56903076171875, -2.454254150390625, -2.3394775390625, -2.224700927734375, -2.10992431640625, -1.995147705078125, -1.88037109375, -1.765594482421875, -1.65081787109375, -1.536041259765625, -1.4212646484375, -1.306488037109375, -1.19171142578125, -1.076934814453125, -0.962158203125, -0.847381591796875, -0.73260498046875, -0.617828369140625, -0.5030517578125, -0.388275146484375, -0.27349853515625, -0.158721923828125, -0.0439453125, 0.070831298828125, 0.18560791015625, 0.300384521484375, 0.4151611328125, 0.529937744140625, 0.64471435546875, 0.759490966796875, 0.874267578125, 0.989044189453125, 1.10382080078125, 1.218597412109375, 1.3333740234375, 1.448150634765625, 1.56292724609375, 1.677703857421875, 1.79248046875, 1.907257080078125, 2.02203369140625, 2.136810302734375, 2.2515869140625, 2.366363525390625, 2.48114013671875, 2.595916748046875, 2.710693359375, 2.825469970703125, 2.94024658203125, 3.055023193359375, 3.1697998046875, 3.284576416015625, 3.39935302734375, 3.514129638671875, 3.62890625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 2.0, 6.0, 10.0, 12.0, 13.0, 10.0, 13.0, 21.0, 13.0, 22.0, 28.0, 29.0, 37.0, 33.0, 37.0, 43.0, 42.0, 37.0, 53.0, 1080.0, 35.0, 46.0, 40.0, 42.0, 29.0, 40.0, 26.0, 29.0, 33.0, 22.0, 12.0, 17.0, 21.0, 18.0, 21.0, 12.0, 9.0, 10.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.98046875, -7.71441650390625, -7.4483642578125, -7.18231201171875, -6.916259765625, -6.65020751953125, -6.3841552734375, -6.11810302734375, -5.85205078125, -5.58599853515625, -5.3199462890625, -5.05389404296875, -4.787841796875, -4.52178955078125, -4.2557373046875, -3.98968505859375, -3.7236328125, -3.45758056640625, -3.1915283203125, -2.92547607421875, -2.659423828125, -2.39337158203125, -2.1273193359375, -1.86126708984375, -1.59521484375, -1.32916259765625, -1.0631103515625, -0.79705810546875, -0.531005859375, -0.26495361328125, 0.0010986328125, 0.26715087890625, 0.533203125, 0.79925537109375, 1.0653076171875, 1.33135986328125, 1.597412109375, 1.86346435546875, 2.1295166015625, 2.39556884765625, 2.66162109375, 2.92767333984375, 3.1937255859375, 3.45977783203125, 3.725830078125, 3.99188232421875, 4.2579345703125, 4.52398681640625, 4.7900390625, 5.05609130859375, 5.3221435546875, 5.58819580078125, 5.854248046875, 6.12030029296875, 6.3863525390625, 6.65240478515625, 6.91845703125, 7.18450927734375, 7.4505615234375, 7.71661376953125, 7.982666015625, 8.24871826171875, 8.5147705078125, 8.78082275390625, 9.046875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 13.0, 22.0, 27.0, 28.0, 53.0, 67.0, 97.0, 162.0, 264.0, 342.0, 499.0, 829.0, 1226.0, 1789.0, 2683.0, 4076.0, 5908.0, 8746.0, 13354.0, 20787.0, 32095.0, 51054.0, 83677.0, 156857.0, 1377491.0, 130653.0, 74260.0, 45649.0, 29304.0, 18727.0, 11957.0, 7897.0, 5548.0, 3594.0, 2512.0, 1599.0, 1041.0, 712.0, 537.0, 333.0, 182.0, 149.0, 121.0, 81.0, 42.0, 34.0, 16.0, 13.0, 8.0, 8.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.080078125, -2.97869873046875, -2.8773193359375, -2.77593994140625, -2.674560546875, -2.57318115234375, -2.4718017578125, -2.37042236328125, -2.26904296875, -2.16766357421875, -2.0662841796875, -1.96490478515625, -1.863525390625, -1.76214599609375, -1.6607666015625, -1.55938720703125, -1.4580078125, -1.35662841796875, -1.2552490234375, -1.15386962890625, -1.052490234375, -0.95111083984375, -0.8497314453125, -0.74835205078125, -0.64697265625, -0.54559326171875, -0.4442138671875, -0.34283447265625, -0.241455078125, -0.14007568359375, -0.0386962890625, 0.06268310546875, 0.1640625, 0.26544189453125, 0.3668212890625, 0.46820068359375, 0.569580078125, 0.67095947265625, 0.7723388671875, 0.87371826171875, 0.97509765625, 1.07647705078125, 1.1778564453125, 1.27923583984375, 1.380615234375, 1.48199462890625, 1.5833740234375, 1.68475341796875, 1.7861328125, 1.88751220703125, 1.9888916015625, 2.09027099609375, 2.191650390625, 2.29302978515625, 2.3944091796875, 2.49578857421875, 2.59716796875, 2.69854736328125, 2.7999267578125, 2.90130615234375, 3.002685546875, 3.10406494140625, 3.2054443359375, 3.30682373046875, 3.408203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 11.0, 6.0, 9.0, 10.0, 7.0, 16.0, 12.0, 13.0, 17.0, 25.0, 35.0, 32.0, 32.0, 50.0, 47.0, 78.0, 73.0, 73.0, 63.0, 67.0, 67.0, 36.0, 53.0, 32.0, 21.0, 15.0, 21.0, 14.0, 8.0, 13.0, 13.0, 3.0, 7.0, 5.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0005106925964355469, -0.0004961714148521423, -0.0004816502332687378, -0.00046712905168533325, -0.0004526078701019287, -0.00043808668851852417, -0.00042356550693511963, -0.0004090443253517151, -0.00039452314376831055, -0.000380001962184906, -0.00036548078060150146, -0.0003509595990180969, -0.0003364384174346924, -0.00032191723585128784, -0.0003073960542678833, -0.00029287487268447876, -0.0002783536911010742, -0.0002638325095176697, -0.00024931132793426514, -0.0002347901463508606, -0.00022026896476745605, -0.00020574778318405151, -0.00019122660160064697, -0.00017670542001724243, -0.0001621842384338379, -0.00014766305685043335, -0.0001331418752670288, -0.00011862069368362427, -0.00010409951210021973, -8.957833051681519e-05, -7.505714893341064e-05, -6.0535967350006104e-05, -4.601478576660156e-05, -3.149360418319702e-05, -1.697242259979248e-05, -2.4512410163879395e-06, 1.2069940567016602e-05, 2.6591122150421143e-05, 4.1112303733825684e-05, 5.5633485317230225e-05, 7.015466690063477e-05, 8.46758484840393e-05, 9.919703006744385e-05, 0.00011371821165084839, 0.00012823939323425293, 0.00014276057481765747, 0.000157281756401062, 0.00017180293798446655, 0.0001863241195678711, 0.00020084530115127563, 0.00021536648273468018, 0.00022988766431808472, 0.00024440884590148926, 0.0002589300274848938, 0.00027345120906829834, 0.0002879723906517029, 0.0003024935722351074, 0.00031701475381851196, 0.0003315359354019165, 0.00034605711698532104, 0.0003605782985687256, 0.0003750994801521301, 0.00038962066173553467, 0.0004041418433189392, 0.00041866302490234375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 9.0, 10.0, 17.0, 17.0, 17.0, 33.0, 32.0, 49.0, 77.0, 110.0, 145.0, 219.0, 343.0, 601.0, 1453.0, 214910.0, 826468.0, 2148.0, 654.0, 374.0, 243.0, 153.0, 117.0, 67.0, 46.0, 51.0, 28.0, 27.0, 21.0, 21.0, 17.0, 13.0, 12.0, 14.0, 7.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00809478759765625, -0.007816672325134277, -0.007538557052612305, -0.007260441780090332, -0.006982326507568359, -0.006704211235046387, -0.006426095962524414, -0.006147980690002441, -0.005869865417480469, -0.005591750144958496, -0.0053136348724365234, -0.005035519599914551, -0.004757404327392578, -0.0044792890548706055, -0.004201173782348633, -0.00392305850982666, -0.0036449432373046875, -0.003366827964782715, -0.003088712692260742, -0.0028105974197387695, -0.002532482147216797, -0.0022543668746948242, -0.0019762516021728516, -0.001698136329650879, -0.0014200210571289062, -0.0011419057846069336, -0.0008637905120849609, -0.0005856752395629883, -0.0003075599670410156, -2.944469451904297e-05, 0.0002486705780029297, 0.0005267858505249023, 0.000804901123046875, 0.0010830163955688477, 0.0013611316680908203, 0.001639246940612793, 0.0019173622131347656, 0.0021954774856567383, 0.002473592758178711, 0.0027517080307006836, 0.0030298233032226562, 0.003307938575744629, 0.0035860538482666016, 0.0038641691207885742, 0.004142284393310547, 0.0044203996658325195, 0.004698514938354492, 0.004976630210876465, 0.0052547454833984375, 0.00553286075592041, 0.005810976028442383, 0.0060890913009643555, 0.006367206573486328, 0.006645321846008301, 0.0069234371185302734, 0.007201552391052246, 0.007479667663574219, 0.007757782936096191, 0.008035898208618164, 0.008314013481140137, 0.00859212875366211, 0.008870244026184082, 0.009148359298706055, 0.009426474571228027, 0.00970458984375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 22.0, 391.0, 540.0, 56.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022824176121503115, -0.002228217665106058, -0.0021740177180618048, -0.0021198177710175514, -0.0020656175911426544, -0.002011417644098401, -0.0019572176970541477, -0.0019030177500098944, -0.001848817802965641, -0.0017946178559213877, -0.0017404177924618125, -0.0016862178454175591, -0.0016320178983733058, -0.0015778178349137306, -0.0015236178878694773, -0.001469417940825224, -0.0014152178773656487, -0.0013610179303213954, -0.0013068178668618202, -0.0012526179198175669, -0.0011984179727733135, -0.0011442180257290602, -0.001090017962269485, -0.0010358180152252316, -0.0009816179517656565, -0.0009274179465137422, -0.0008732179994694889, -0.0008190179942175746, -0.0007648180471733212, -0.000710618041921407, -0.0006564180366694927, -0.0006022180896252394, -0.0005480180261656642, -0.0004938180209137499, -0.0004396180738694966, -0.0003854180686175823, -0.0003312180924694985, -0.0002770181163214147, -0.00022281811106950045, -0.00016861813492141664, -0.00011441815877333283, -6.0218175349291414e-05, -6.018191925249994e-06, 4.818179877474904e-05, 0.00010238177492283285, 0.00015658175107091665, 0.00021078175632283092, 0.0002649817324709147, 0.00031918170861899853, 0.00037338168476708233, 0.00042758166091516614, 0.0004817816661670804, 0.0005359816132113338, 0.000590181618463248, 0.0006443816237151623, 0.0006985815707594156, 0.0007527815760113299, 0.0008069815812632442, 0.0008611815283074975, 0.0009153815335594118, 0.000969581538811326, 0.0010237814858555794, 0.0010779814328998327, 0.001132181496359408, 0.0011863814434036613]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 4.0, 2.0, 3.0, 6.0, 9.0, 2.0, 9.0, 8.0, 11.0, 11.0, 12.0, 20.0, 19.0, 13.0, 25.0, 30.0, 26.0, 30.0, 35.0, 25.0, 29.0, 33.0, 39.0, 41.0, 38.0, 44.0, 44.0, 39.0, 36.0, 28.0, 38.0, 27.0, 41.0, 26.0, 27.0, 19.0, 24.0, 21.0, 13.0, 21.0, 11.0, 10.0, 3.0, 9.0, 11.0, 10.0, 7.0, 12.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019061565399169922, -0.00018392875790596008, -0.00017724186182022095, -0.0001705549657344818, -0.00016386806964874268, -0.00015718117356300354, -0.0001504942774772644, -0.00014380738139152527, -0.00013712048530578613, -0.000130433589220047, -0.00012374669313430786, -0.00011705979704856873, -0.00011037290096282959, -0.00010368600487709045, -9.699910879135132e-05, -9.031221270561218e-05, -8.362531661987305e-05, -7.693842053413391e-05, -7.025152444839478e-05, -6.356462836265564e-05, -5.6877732276916504e-05, -5.019083619117737e-05, -4.350394010543823e-05, -3.68170440196991e-05, -3.013014793395996e-05, -2.3443251848220825e-05, -1.675635576248169e-05, -1.0069459676742554e-05, -3.382563591003418e-06, 3.3043324947357178e-06, 9.991228580474854e-06, 1.667812466621399e-05, 2.3365020751953125e-05, 3.005191683769226e-05, 3.6738812923431396e-05, 4.342570900917053e-05, 5.011260509490967e-05, 5.6799501180648804e-05, 6.348639726638794e-05, 7.017329335212708e-05, 7.686018943786621e-05, 8.354708552360535e-05, 9.023398160934448e-05, 9.692087769508362e-05, 0.00010360777378082275, 0.00011029466986656189, 0.00011698156595230103, 0.00012366846203804016, 0.0001303553581237793, 0.00013704225420951843, 0.00014372915029525757, 0.0001504160463809967, 0.00015710294246673584, 0.00016378983855247498, 0.0001704767346382141, 0.00017716363072395325, 0.00018385052680969238, 0.00019053742289543152, 0.00019722431898117065, 0.0002039112150669098, 0.00021059811115264893, 0.00021728500723838806, 0.0002239719033241272, 0.00023065879940986633, 0.00023734569549560547]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 6.0, 11.0, 11.0, 8.0, 6.0, 13.0, 14.0, 15.0, 22.0, 21.0, 28.0, 30.0, 23.0, 29.0, 32.0, 28.0, 30.0, 29.0, 36.0, 38.0, 36.0, 38.0, 33.0, 30.0, 38.0, 40.0, 34.0, 32.0, 32.0, 28.0, 31.0, 19.0, 29.0, 20.0, 19.0, 11.0, 20.0, 13.0, 11.0, 8.0, 6.0, 8.0, 9.0, 4.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.328125, -10.9697265625, -10.611328125, -10.2529296875, -9.89453125, -9.5361328125, -9.177734375, -8.8193359375, -8.4609375, -8.1025390625, -7.744140625, -7.3857421875, -7.02734375, -6.6689453125, -6.310546875, -5.9521484375, -5.59375, -5.2353515625, -4.876953125, -4.5185546875, -4.16015625, -3.8017578125, -3.443359375, -3.0849609375, -2.7265625, -2.3681640625, -2.009765625, -1.6513671875, -1.29296875, -0.9345703125, -0.576171875, -0.2177734375, 0.140625, 0.4990234375, 0.857421875, 1.2158203125, 1.57421875, 1.9326171875, 2.291015625, 2.6494140625, 3.0078125, 3.3662109375, 3.724609375, 4.0830078125, 4.44140625, 4.7998046875, 5.158203125, 5.5166015625, 5.875, 6.2333984375, 6.591796875, 6.9501953125, 7.30859375, 7.6669921875, 8.025390625, 8.3837890625, 8.7421875, 9.1005859375, 9.458984375, 9.8173828125, 10.17578125, 10.5341796875, 10.892578125, 11.2509765625, 11.609375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 8.0, 5.0, 6.0, 6.0, 6.0, 16.0, 24.0, 30.0, 40.0, 57.0, 52.0, 65.0, 83.0, 120.0, 167.0, 197.0, 259.0, 312.0, 405.0, 546.0, 688.0, 949.0, 1379.0, 2331.0, 5334.0, 20094.0, 96969.0, 394622.0, 393268.0, 97130.0, 20237.0, 5393.0, 2310.0, 1332.0, 992.0, 718.0, 507.0, 420.0, 336.0, 248.0, 217.0, 172.0, 106.0, 82.0, 64.0, 57.0, 51.0, 37.0, 38.0, 24.0, 9.0, 10.0, 7.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0], "bins": [-21.953125, -21.26708984375, -20.5810546875, -19.89501953125, -19.208984375, -18.52294921875, -17.8369140625, -17.15087890625, -16.46484375, -15.77880859375, -15.0927734375, -14.40673828125, -13.720703125, -13.03466796875, -12.3486328125, -11.66259765625, -10.9765625, -10.29052734375, -9.6044921875, -8.91845703125, -8.232421875, -7.54638671875, -6.8603515625, -6.17431640625, -5.48828125, -4.80224609375, -4.1162109375, -3.43017578125, -2.744140625, -2.05810546875, -1.3720703125, -0.68603515625, 0.0, 0.68603515625, 1.3720703125, 2.05810546875, 2.744140625, 3.43017578125, 4.1162109375, 4.80224609375, 5.48828125, 6.17431640625, 6.8603515625, 7.54638671875, 8.232421875, 8.91845703125, 9.6044921875, 10.29052734375, 10.9765625, 11.66259765625, 12.3486328125, 13.03466796875, 13.720703125, 14.40673828125, 15.0927734375, 15.77880859375, 16.46484375, 17.15087890625, 17.8369140625, 18.52294921875, 19.208984375, 19.89501953125, 20.5810546875, 21.26708984375, 21.953125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 8.0, 6.0, 4.0, 7.0, 18.0, 11.0, 16.0, 16.0, 19.0, 26.0, 28.0, 38.0, 52.0, 32.0, 48.0, 63.0, 88.0, 182.0, 1421.0, 364.0, 143.0, 82.0, 58.0, 55.0, 60.0, 26.0, 35.0, 26.0, 22.0, 24.0, 25.0, 9.0, 9.0, 8.0, 3.0, 7.0, 3.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.5, -39.370361328125, -38.24072265625, -37.111083984375, -35.9814453125, -34.851806640625, -33.72216796875, -32.592529296875, -31.462890625, -30.333251953125, -29.20361328125, -28.073974609375, -26.9443359375, -25.814697265625, -24.68505859375, -23.555419921875, -22.42578125, -21.296142578125, -20.16650390625, -19.036865234375, -17.9072265625, -16.777587890625, -15.64794921875, -14.518310546875, -13.388671875, -12.259033203125, -11.12939453125, -9.999755859375, -8.8701171875, -7.740478515625, -6.61083984375, -5.481201171875, -4.3515625, -3.221923828125, -2.09228515625, -0.962646484375, 0.1669921875, 1.296630859375, 2.42626953125, 3.555908203125, 4.685546875, 5.815185546875, 6.94482421875, 8.074462890625, 9.2041015625, 10.333740234375, 11.46337890625, 12.593017578125, 13.72265625, 14.852294921875, 15.98193359375, 17.111572265625, 18.2412109375, 19.370849609375, 20.50048828125, 21.630126953125, 22.759765625, 23.889404296875, 25.01904296875, 26.148681640625, 27.2783203125, 28.407958984375, 29.53759765625, 30.667236328125, 31.796875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 10.0, 10.0, 8.0, 16.0, 13.0, 15.0, 19.0, 28.0, 36.0, 38.0, 61.0, 92.0, 131.0, 201.0, 309.0, 498.0, 1009.0, 3408.0, 3119106.0, 17467.0, 1477.0, 630.0, 341.0, 204.0, 160.0, 101.0, 77.0, 49.0, 49.0, 22.0, 25.0, 16.0, 13.0, 9.0, 11.0, 10.0, 10.0, 6.0, 6.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-161.25, -156.314453125, -151.37890625, -146.443359375, -141.5078125, -136.572265625, -131.63671875, -126.701171875, -121.765625, -116.830078125, -111.89453125, -106.958984375, -102.0234375, -97.087890625, -92.15234375, -87.216796875, -82.28125, -77.345703125, -72.41015625, -67.474609375, -62.5390625, -57.603515625, -52.66796875, -47.732421875, -42.796875, -37.861328125, -32.92578125, -27.990234375, -23.0546875, -18.119140625, -13.18359375, -8.248046875, -3.3125, 1.623046875, 6.55859375, 11.494140625, 16.4296875, 21.365234375, 26.30078125, 31.236328125, 36.171875, 41.107421875, 46.04296875, 50.978515625, 55.9140625, 60.849609375, 65.78515625, 70.720703125, 75.65625, 80.591796875, 85.52734375, 90.462890625, 95.3984375, 100.333984375, 105.26953125, 110.205078125, 115.140625, 120.076171875, 125.01171875, 129.947265625, 134.8828125, 139.818359375, 144.75390625, 149.689453125, 154.625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 13.0, 45.0, 126.0, 244.0, 291.0, 196.0, 53.0, 32.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-183.0416259765625, -178.5869598388672, -174.1322784423828, -169.6776123046875, -165.2229461669922, -160.7682647705078, -156.3135986328125, -151.8589324951172, -147.4042510986328, -142.9495849609375, -138.49490356445312, -134.0402374267578, -129.5855712890625, -125.13088989257812, -120.67622375488281, -116.22154998779297, -111.76688385009766, -107.31221008300781, -102.8575439453125, -98.40287017822266, -93.94819641113281, -89.4935302734375, -85.03885650634766, -80.58418273925781, -76.1295166015625, -71.67484283447266, -67.22017669677734, -62.7655029296875, -58.310829162597656, -53.85615921020508, -49.4014892578125, -44.946815490722656, -40.492149353027344, -36.037479400634766, -31.582805633544922, -27.128135681152344, -22.673463821411133, -18.218791961669922, -13.764122009277344, -9.309450149536133, -4.854778289794922, -0.40010690689086914, 4.054564476013184, 8.509235382080078, 12.963907241821289, 17.4185791015625, 21.873249053955078, 26.32792091369629, 30.7825927734375, 35.23726272583008, 39.69193649291992, 44.1466064453125, 48.601280212402344, 53.05595016479492, 57.5106201171875, 61.965293884277344, 66.41996765136719, 70.87464141845703, 75.32930755615234, 79.78398132324219, 84.23865509033203, 88.69332885742188, 93.14799499511719, 97.60266876220703, 102.05733489990234]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 6.0, 10.0, 15.0, 11.0, 22.0, 11.0, 15.0, 23.0, 33.0, 28.0, 34.0, 29.0, 38.0, 48.0, 30.0, 39.0, 48.0, 43.0, 39.0, 48.0, 40.0, 39.0, 40.0, 30.0, 31.0, 39.0, 28.0, 22.0, 19.0, 21.0, 11.0, 14.0, 9.0, 15.0, 7.0, 11.0, 10.0, 5.0, 9.0, 4.0, 4.0, 3.0, 0.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-83.04354858398438, -80.30003356933594, -77.5565185546875, -74.8130111694336, -72.06949615478516, -69.32598114013672, -66.58247375488281, -63.838958740234375, -61.09544372558594, -58.3519287109375, -55.60841751098633, -52.864906311035156, -50.12139129638672, -47.37787628173828, -44.63436508178711, -41.89085388183594, -39.1473388671875, -36.40382385253906, -33.66031265258789, -30.916799545288086, -28.17328643798828, -25.429773330688477, -22.686260223388672, -19.942747116088867, -17.199234008789062, -14.455720901489258, -11.712207794189453, -8.968694686889648, -6.225181579589844, -3.481668472290039, -0.7381553649902344, 2.0053577423095703, 4.748870849609375, 7.49238395690918, 10.235897064208984, 12.979410171508789, 15.722923278808594, 18.4664363861084, 21.209949493408203, 23.953462600708008, 26.696975708007812, 29.440488815307617, 32.18400192260742, 34.927513122558594, 37.67102813720703, 40.41454315185547, 43.15805435180664, 45.90156555175781, 48.64508056640625, 51.38859558105469, 54.13210678100586, 56.87561798095703, 59.61913299560547, 62.362648010253906, 65.10615539550781, 67.84967041015625, 70.59318542480469, 73.33670043945312, 76.08021545410156, 78.82372283935547, 81.5672378540039, 84.31075286865234, 87.05426025390625, 89.79777526855469, 92.54129028320312]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 10.0, 8.0, 8.0, 11.0, 15.0, 20.0, 20.0, 20.0, 19.0, 32.0, 25.0, 32.0, 22.0, 23.0, 24.0, 39.0, 35.0, 34.0, 37.0, 38.0, 35.0, 44.0, 32.0, 33.0, 34.0, 28.0, 30.0, 25.0, 30.0, 19.0, 24.0, 29.0, 21.0, 19.0, 13.0, 12.0, 13.0, 7.0, 8.0, 9.0, 3.0, 9.0, 8.0, 13.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.7890625, -10.452392578125, -10.11572265625, -9.779052734375, -9.4423828125, -9.105712890625, -8.76904296875, -8.432373046875, -8.095703125, -7.759033203125, -7.42236328125, -7.085693359375, -6.7490234375, -6.412353515625, -6.07568359375, -5.739013671875, -5.40234375, -5.065673828125, -4.72900390625, -4.392333984375, -4.0556640625, -3.718994140625, -3.38232421875, -3.045654296875, -2.708984375, -2.372314453125, -2.03564453125, -1.698974609375, -1.3623046875, -1.025634765625, -0.68896484375, -0.352294921875, -0.015625, 0.321044921875, 0.65771484375, 0.994384765625, 1.3310546875, 1.667724609375, 2.00439453125, 2.341064453125, 2.677734375, 3.014404296875, 3.35107421875, 3.687744140625, 4.0244140625, 4.361083984375, 4.69775390625, 5.034423828125, 5.37109375, 5.707763671875, 6.04443359375, 6.381103515625, 6.7177734375, 7.054443359375, 7.39111328125, 7.727783203125, 8.064453125, 8.401123046875, 8.73779296875, 9.074462890625, 9.4111328125, 9.747802734375, 10.08447265625, 10.421142578125, 10.7578125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 10.0, 11.0, 22.0, 23.0, 39.0, 62.0, 102.0, 167.0, 299.0, 563.0, 1242.0, 3545.0, 15234.0, 180481.0, 2101764.0, 1741333.0, 131735.0, 12494.0, 2868.0, 1117.0, 518.0, 263.0, 146.0, 88.0, 58.0, 35.0, 20.0, 20.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.71875, -30.725830078125, -29.73291015625, -28.739990234375, -27.7470703125, -26.754150390625, -25.76123046875, -24.768310546875, -23.775390625, -22.782470703125, -21.78955078125, -20.796630859375, -19.8037109375, -18.810791015625, -17.81787109375, -16.824951171875, -15.83203125, -14.839111328125, -13.84619140625, -12.853271484375, -11.8603515625, -10.867431640625, -9.87451171875, -8.881591796875, -7.888671875, -6.895751953125, -5.90283203125, -4.909912109375, -3.9169921875, -2.924072265625, -1.93115234375, -0.938232421875, 0.0546875, 1.047607421875, 2.04052734375, 3.033447265625, 4.0263671875, 5.019287109375, 6.01220703125, 7.005126953125, 7.998046875, 8.990966796875, 9.98388671875, 10.976806640625, 11.9697265625, 12.962646484375, 13.95556640625, 14.948486328125, 15.94140625, 16.934326171875, 17.92724609375, 18.920166015625, 19.9130859375, 20.906005859375, 21.89892578125, 22.891845703125, 23.884765625, 24.877685546875, 25.87060546875, 26.863525390625, 27.8564453125, 28.849365234375, 29.84228515625, 30.835205078125, 31.828125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 10.0, 6.0, 10.0, 13.0, 17.0, 22.0, 27.0, 43.0, 41.0, 72.0, 83.0, 110.0, 118.0, 183.0, 195.0, 260.0, 323.0, 380.0, 446.0, 368.0, 284.0, 237.0, 163.0, 127.0, 125.0, 85.0, 65.0, 48.0, 39.0, 44.0, 27.0, 22.0, 18.0, 11.0, 13.0, 14.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.495361328125, -15.91259765625, -15.329833984375, -14.7470703125, -14.164306640625, -13.58154296875, -12.998779296875, -12.416015625, -11.833251953125, -11.25048828125, -10.667724609375, -10.0849609375, -9.502197265625, -8.91943359375, -8.336669921875, -7.75390625, -7.171142578125, -6.58837890625, -6.005615234375, -5.4228515625, -4.840087890625, -4.25732421875, -3.674560546875, -3.091796875, -2.509033203125, -1.92626953125, -1.343505859375, -0.7607421875, -0.177978515625, 0.40478515625, 0.987548828125, 1.5703125, 2.153076171875, 2.73583984375, 3.318603515625, 3.9013671875, 4.484130859375, 5.06689453125, 5.649658203125, 6.232421875, 6.815185546875, 7.39794921875, 7.980712890625, 8.5634765625, 9.146240234375, 9.72900390625, 10.311767578125, 10.89453125, 11.477294921875, 12.06005859375, 12.642822265625, 13.2255859375, 13.808349609375, 14.39111328125, 14.973876953125, 15.556640625, 16.139404296875, 16.72216796875, 17.304931640625, 17.8876953125, 18.470458984375, 19.05322265625, 19.635986328125, 20.21875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 10.0, 9.0, 15.0, 38.0, 66.0, 75.0, 166.0, 309.0, 586.0, 1221.0, 2891.0, 14435.0, 460884.0, 3577866.0, 124204.0, 7354.0, 2184.0, 979.0, 453.0, 228.0, 124.0, 86.0, 41.0, 20.0, 14.0, 14.0, 5.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.375, -58.71337890625, -57.0517578125, -55.39013671875, -53.728515625, -52.06689453125, -50.4052734375, -48.74365234375, -47.08203125, -45.42041015625, -43.7587890625, -42.09716796875, -40.435546875, -38.77392578125, -37.1123046875, -35.45068359375, -33.7890625, -32.12744140625, -30.4658203125, -28.80419921875, -27.142578125, -25.48095703125, -23.8193359375, -22.15771484375, -20.49609375, -18.83447265625, -17.1728515625, -15.51123046875, -13.849609375, -12.18798828125, -10.5263671875, -8.86474609375, -7.203125, -5.54150390625, -3.8798828125, -2.21826171875, -0.556640625, 1.10498046875, 2.7666015625, 4.42822265625, 6.08984375, 7.75146484375, 9.4130859375, 11.07470703125, 12.736328125, 14.39794921875, 16.0595703125, 17.72119140625, 19.3828125, 21.04443359375, 22.7060546875, 24.36767578125, 26.029296875, 27.69091796875, 29.3525390625, 31.01416015625, 32.67578125, 34.33740234375, 35.9990234375, 37.66064453125, 39.322265625, 40.98388671875, 42.6455078125, 44.30712890625, 45.96875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 13.0, 105.0, 508.0, 322.0, 58.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.77920532226562, -183.43270874023438, -171.08621215820312, -158.73971557617188, -146.39321899414062, -134.04672241210938, -121.70024108886719, -109.35374450683594, -97.00724792480469, -84.66075134277344, -72.31425476074219, -59.96776580810547, -47.62126922607422, -35.27477264404297, -22.92828369140625, -10.581787109375, 1.76470947265625, 14.111204147338867, 26.457698822021484, 38.80419158935547, 51.15068817138672, 63.49718475341797, 75.84367370605469, 88.19017028808594, 100.53666687011719, 112.88316345214844, 125.22966003417969, 137.57614135742188, 149.92263793945312, 162.26913452148438, 174.61563110351562, 186.96212768554688, 199.30865478515625, 211.6551513671875, 224.00164794921875, 236.34814453125, 248.69464111328125, 261.0411376953125, 273.38763427734375, 285.734130859375, 298.08062744140625, 310.4271240234375, 322.77362060546875, 335.1201171875, 347.46661376953125, 359.8131103515625, 372.15960693359375, 384.506103515625, 396.8525695800781, 409.1990661621094, 421.5455627441406, 433.8920593261719, 446.2385559082031, 458.5850524902344, 470.9315185546875, 483.27801513671875, 495.62451171875, 507.97100830078125, 520.3175048828125, 532.6640014648438, 545.010498046875, 557.3569946289062, 569.7034912109375, 582.0499877929688, 594.396484375]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 4.0, 7.0, 6.0, 6.0, 7.0, 5.0, 11.0, 11.0, 10.0, 16.0, 16.0, 17.0, 17.0, 23.0, 28.0, 33.0, 28.0, 27.0, 54.0, 35.0, 36.0, 28.0, 45.0, 39.0, 40.0, 28.0, 26.0, 33.0, 48.0, 36.0, 28.0, 18.0, 28.0, 22.0, 28.0, 18.0, 20.0, 19.0, 16.0, 19.0, 10.0, 12.0, 9.0, 6.0, 9.0, 7.0, 6.0, 6.0, 0.0, 3.0, 2.0, 4.0, 3.0], "bins": [-84.19775390625, -81.83589172363281, -79.47402954101562, -77.11216735839844, -74.75030517578125, -72.38844299316406, -70.02658081054688, -67.66472625732422, -65.30286407470703, -62.941001892089844, -60.579139709472656, -58.21727752685547, -55.85541915893555, -53.49355697631836, -51.13169479370117, -48.76983642578125, -46.4079704284668, -44.04610824584961, -41.68424606323242, -39.3223876953125, -36.96052551269531, -34.598663330078125, -32.23680114746094, -29.874940872192383, -27.513078689575195, -25.151216506958008, -22.789356231689453, -20.427494049072266, -18.065631866455078, -15.703771591186523, -13.341909408569336, -10.980049133300781, -8.618186950683594, -6.256325721740723, -3.8944640159606934, -1.532602310180664, 0.829258918762207, 3.191120147705078, 5.552982330322266, 7.91484260559082, 10.276704788208008, 12.638566017150879, 15.00042724609375, 17.362289428710938, 19.724151611328125, 22.08601188659668, 24.447874069213867, 26.809734344482422, 29.17159652709961, 31.533458709716797, 33.895320892333984, 36.257179260253906, 38.619041442871094, 40.98090362548828, 43.34276580810547, 45.704627990722656, 48.066490173339844, 50.42835235595703, 52.79021453857422, 55.152076721191406, 57.51393508911133, 59.875797271728516, 62.2376594543457, 64.59951782226562, 66.96138000488281]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 6.0, 4.0, 9.0, 10.0, 15.0, 19.0, 18.0, 17.0, 24.0, 27.0, 31.0, 22.0, 40.0, 43.0, 44.0, 47.0, 55.0, 43.0, 55.0, 53.0, 40.0, 40.0, 53.0, 39.0, 33.0, 39.0, 33.0, 30.0, 21.0, 22.0, 18.0, 10.0, 11.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6875, -9.3426513671875, -8.997802734375, -8.6529541015625, -8.30810546875, -7.9632568359375, -7.618408203125, -7.2735595703125, -6.9287109375, -6.5838623046875, -6.239013671875, -5.8941650390625, -5.54931640625, -5.2044677734375, -4.859619140625, -4.5147705078125, -4.169921875, -3.8250732421875, -3.480224609375, -3.1353759765625, -2.79052734375, -2.4456787109375, -2.100830078125, -1.7559814453125, -1.4111328125, -1.0662841796875, -0.721435546875, -0.3765869140625, -0.03173828125, 0.3131103515625, 0.657958984375, 1.0028076171875, 1.34765625, 1.6925048828125, 2.037353515625, 2.3822021484375, 2.72705078125, 3.0718994140625, 3.416748046875, 3.7615966796875, 4.1064453125, 4.4512939453125, 4.796142578125, 5.1409912109375, 5.48583984375, 5.8306884765625, 6.175537109375, 6.5203857421875, 6.865234375, 7.2100830078125, 7.554931640625, 7.8997802734375, 8.24462890625, 8.5894775390625, 8.934326171875, 9.2791748046875, 9.6240234375, 9.9688720703125, 10.313720703125, 10.6585693359375, 11.00341796875, 11.3482666015625, 11.693115234375, 12.0379638671875, 12.3828125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 11.0, 7.0, 13.0, 40.0, 36.0, 58.0, 98.0, 143.0, 200.0, 329.0, 492.0, 843.0, 1432.0, 2307.0, 3965.0, 6899.0, 11931.0, 21226.0, 37914.0, 71019.0, 148408.0, 392547.0, 172599.0, 79198.0, 41886.0, 23386.0, 13126.0, 7491.0, 4418.0, 2532.0, 1548.0, 918.0, 564.0, 323.0, 200.0, 168.0, 84.0, 78.0, 36.0, 27.0, 13.0, 13.0, 7.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.939453125, -2.83660888671875, -2.7337646484375, -2.63092041015625, -2.528076171875, -2.42523193359375, -2.3223876953125, -2.21954345703125, -2.11669921875, -2.01385498046875, -1.9110107421875, -1.80816650390625, -1.705322265625, -1.60247802734375, -1.4996337890625, -1.39678955078125, -1.2939453125, -1.19110107421875, -1.0882568359375, -0.98541259765625, -0.882568359375, -0.77972412109375, -0.6768798828125, -0.57403564453125, -0.47119140625, -0.36834716796875, -0.2655029296875, -0.16265869140625, -0.059814453125, 0.04302978515625, 0.1458740234375, 0.24871826171875, 0.3515625, 0.45440673828125, 0.5572509765625, 0.66009521484375, 0.762939453125, 0.86578369140625, 0.9686279296875, 1.07147216796875, 1.17431640625, 1.27716064453125, 1.3800048828125, 1.48284912109375, 1.585693359375, 1.68853759765625, 1.7913818359375, 1.89422607421875, 1.9970703125, 2.09991455078125, 2.2027587890625, 2.30560302734375, 2.408447265625, 2.51129150390625, 2.6141357421875, 2.71697998046875, 2.81982421875, 2.92266845703125, 3.0255126953125, 3.12835693359375, 3.231201171875, 3.33404541015625, 3.4368896484375, 3.53973388671875, 3.642578125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 1.0, 3.0, 10.0, 12.0, 13.0, 15.0, 17.0, 17.0, 26.0, 19.0, 29.0, 27.0, 25.0, 46.0, 43.0, 32.0, 40.0, 33.0, 40.0, 1055.0, 44.0, 38.0, 31.0, 39.0, 51.0, 36.0, 35.0, 26.0, 34.0, 23.0, 26.0, 29.0, 23.0, 16.0, 13.0, 11.0, 8.0, 5.0, 9.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.484375, -6.29254150390625, -6.1007080078125, -5.90887451171875, -5.717041015625, -5.52520751953125, -5.3333740234375, -5.14154052734375, -4.94970703125, -4.75787353515625, -4.5660400390625, -4.37420654296875, -4.182373046875, -3.99053955078125, -3.7987060546875, -3.60687255859375, -3.4150390625, -3.22320556640625, -3.0313720703125, -2.83953857421875, -2.647705078125, -2.45587158203125, -2.2640380859375, -2.07220458984375, -1.88037109375, -1.68853759765625, -1.4967041015625, -1.30487060546875, -1.113037109375, -0.92120361328125, -0.7293701171875, -0.53753662109375, -0.345703125, -0.15386962890625, 0.0379638671875, 0.22979736328125, 0.421630859375, 0.61346435546875, 0.8052978515625, 0.99713134765625, 1.18896484375, 1.38079833984375, 1.5726318359375, 1.76446533203125, 1.956298828125, 2.14813232421875, 2.3399658203125, 2.53179931640625, 2.7236328125, 2.91546630859375, 3.1072998046875, 3.29913330078125, 3.490966796875, 3.68280029296875, 3.8746337890625, 4.06646728515625, 4.25830078125, 4.45013427734375, 4.6419677734375, 4.83380126953125, 5.025634765625, 5.21746826171875, 5.4093017578125, 5.60113525390625, 5.79296875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 10.0, 15.0, 23.0, 29.0, 49.0, 71.0, 115.0, 163.0, 236.0, 342.0, 531.0, 801.0, 1169.0, 1681.0, 2477.0, 3773.0, 5829.0, 8648.0, 12786.0, 19801.0, 30794.0, 49210.0, 77923.0, 129132.0, 1344212.0, 158202.0, 90254.0, 56674.0, 35842.0, 22323.0, 14748.0, 9822.0, 6441.0, 4235.0, 2842.0, 1990.0, 1259.0, 878.0, 607.0, 390.0, 282.0, 189.0, 98.0, 91.0, 48.0, 28.0, 32.0, 15.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0], "bins": [-2.4453125, -2.372650146484375, -2.29998779296875, -2.227325439453125, -2.1546630859375, -2.082000732421875, -2.00933837890625, -1.936676025390625, -1.864013671875, -1.791351318359375, -1.71868896484375, -1.646026611328125, -1.5733642578125, -1.500701904296875, -1.42803955078125, -1.355377197265625, -1.28271484375, -1.210052490234375, -1.13739013671875, -1.064727783203125, -0.9920654296875, -0.919403076171875, -0.84674072265625, -0.774078369140625, -0.701416015625, -0.628753662109375, -0.55609130859375, -0.483428955078125, -0.4107666015625, -0.338104248046875, -0.26544189453125, -0.192779541015625, -0.1201171875, -0.047454833984375, 0.02520751953125, 0.097869873046875, 0.1705322265625, 0.243194580078125, 0.31585693359375, 0.388519287109375, 0.461181640625, 0.533843994140625, 0.60650634765625, 0.679168701171875, 0.7518310546875, 0.824493408203125, 0.89715576171875, 0.969818115234375, 1.04248046875, 1.115142822265625, 1.18780517578125, 1.260467529296875, 1.3331298828125, 1.405792236328125, 1.47845458984375, 1.551116943359375, 1.623779296875, 1.696441650390625, 1.76910400390625, 1.841766357421875, 1.9144287109375, 1.987091064453125, 2.05975341796875, 2.132415771484375, 2.205078125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 5.0, 5.0, 12.0, 14.0, 12.0, 24.0, 37.0, 40.0, 49.0, 62.0, 93.0, 83.0, 79.0, 82.0, 71.0, 55.0, 58.0, 40.0, 31.0, 19.0, 18.0, 14.0, 14.0, 12.0, 9.0, 10.0, 4.0, 6.0, 4.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003509521484375, -0.0003390386700630188, -0.0003271251916885376, -0.0003152117133140564, -0.0003032982349395752, -0.000291384756565094, -0.0002794712781906128, -0.0002675577998161316, -0.0002556443214416504, -0.0002437308430671692, -0.000231817364692688, -0.0002199038863182068, -0.00020799040794372559, -0.00019607692956924438, -0.00018416345119476318, -0.00017224997282028198, -0.00016033649444580078, -0.00014842301607131958, -0.00013650953769683838, -0.00012459605932235718, -0.00011268258094787598, -0.00010076910257339478, -8.885562419891357e-05, -7.694214582443237e-05, -6.502866744995117e-05, -5.311518907546997e-05, -4.120171070098877e-05, -2.928823232650757e-05, -1.7374753952026367e-05, -5.461275577545166e-06, 6.452202796936035e-06, 1.8365681171417236e-05, 3.0279159545898438e-05, 4.219263792037964e-05, 5.410611629486084e-05, 6.601959466934204e-05, 7.793307304382324e-05, 8.984655141830444e-05, 0.00010176002979278564, 0.00011367350816726685, 0.00012558698654174805, 0.00013750046491622925, 0.00014941394329071045, 0.00016132742166519165, 0.00017324090003967285, 0.00018515437841415405, 0.00019706785678863525, 0.00020898133516311646, 0.00022089481353759766, 0.00023280829191207886, 0.00024472177028656006, 0.00025663524866104126, 0.00026854872703552246, 0.00028046220541000366, 0.00029237568378448486, 0.00030428916215896606, 0.00031620264053344727, 0.00032811611890792847, 0.00034002959728240967, 0.00035194307565689087, 0.00036385655403137207, 0.00037577003240585327, 0.00038768351078033447, 0.0003995969891548157, 0.0004115104675292969]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 12.0, 7.0, 6.0, 12.0, 19.0, 12.0, 24.0, 35.0, 34.0, 44.0, 47.0, 67.0, 110.0, 179.0, 300.0, 435.0, 952.0, 16965.0, 1016227.0, 10887.0, 909.0, 419.0, 236.0, 182.0, 124.0, 87.0, 51.0, 35.0, 24.0, 15.0, 16.0, 19.0, 11.0, 8.0, 2.0, 3.0, 4.0, 7.0, 6.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00719451904296875, -0.006979525089263916, -0.006764531135559082, -0.006549537181854248, -0.006334543228149414, -0.00611954927444458, -0.005904555320739746, -0.005689561367034912, -0.005474567413330078, -0.005259573459625244, -0.00504457950592041, -0.004829585552215576, -0.004614591598510742, -0.004399597644805908, -0.004184603691101074, -0.00396960973739624, -0.0037546157836914062, -0.0035396218299865723, -0.0033246278762817383, -0.0031096339225769043, -0.0028946399688720703, -0.0026796460151672363, -0.0024646520614624023, -0.0022496581077575684, -0.0020346641540527344, -0.0018196702003479004, -0.0016046762466430664, -0.0013896822929382324, -0.0011746883392333984, -0.0009596943855285645, -0.0007447004318237305, -0.0005297064781188965, -0.0003147125244140625, -9.971857070922852e-05, 0.00011527538299560547, 0.00033026933670043945, 0.0005452632904052734, 0.0007602572441101074, 0.0009752511978149414, 0.0011902451515197754, 0.0014052391052246094, 0.0016202330589294434, 0.0018352270126342773, 0.0020502209663391113, 0.0022652149200439453, 0.0024802088737487793, 0.0026952028274536133, 0.0029101967811584473, 0.0031251907348632812, 0.0033401846885681152, 0.0035551786422729492, 0.003770172595977783, 0.003985166549682617, 0.004200160503387451, 0.004415154457092285, 0.004630148410797119, 0.004845142364501953, 0.005060136318206787, 0.005275130271911621, 0.005490124225616455, 0.005705118179321289, 0.005920112133026123, 0.006135106086730957, 0.006350100040435791, 0.006565093994140625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 68.0, 617.0, 311.0, 17.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023424976971000433, -0.002295452170073986, -0.002248406410217285, -0.002201360883191228, -0.002154315123334527, -0.0021072695963084698, -0.002060223836451769, -0.0020131783094257116, -0.0019661325495690107, -0.0019190869061276317, -0.0018720412626862526, -0.0018249956192448735, -0.0017779499758034945, -0.0017309044487774372, -0.0016838586889207363, -0.001636813161894679, -0.0015897676348686218, -0.0015427219914272428, -0.0014956763479858637, -0.0014486307045444846, -0.0014015850611031055, -0.0013545395340770483, -0.0013074937742203474, -0.0012604482471942902, -0.0012134024873375893, -0.0011663568438962102, -0.0011193112004548311, -0.001072265557013452, -0.001025219913572073, -0.0009781743865460157, -0.0009311286848969758, -0.0008840830996632576, -0.0008370374562218785, -0.0007899918127804995, -0.0007429461693391204, -0.0006959005258977413, -0.0006488549406640232, -0.0006018092972226441, -0.000554763653781265, -0.0005077180685475469, -0.00046067239600233734, -0.00041362675256095827, -0.00036658113822340965, -0.0003195354947820306, -0.0002724898513406515, -0.0002254442370031029, -0.00017839859356172383, -0.00013135297922417521, -8.430733578279614e-05, -3.7261703255353495e-05, 9.783929272089154e-06, 5.682956543751061e-05, 0.00010387519432697445, 0.0001509208232164383, 0.00019796646665781736, 0.000245012080995366, 0.00029205772443674505, 0.0003391033678781241, 0.00038614898221567273, 0.0004331946256570518, 0.00048024026909843087, 0.000527285854332149, 0.0005743314977735281, 0.0006213771412149072, 0.0006684227846562862]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 4.0, 7.0, 9.0, 15.0, 14.0, 18.0, 24.0, 18.0, 21.0, 27.0, 23.0, 24.0, 32.0, 33.0, 41.0, 35.0, 54.0, 44.0, 46.0, 55.0, 45.0, 36.0, 34.0, 31.0, 30.0, 35.0, 39.0, 21.0, 22.0, 23.0, 24.0, 15.0, 18.0, 13.0, 10.0, 14.0, 9.0, 8.0, 4.0, 0.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0001773834228515625, -0.00017187371850013733, -0.00016636401414871216, -0.000160854309797287, -0.00015534460544586182, -0.00014983490109443665, -0.00014432519674301147, -0.0001388154923915863, -0.00013330578804016113, -0.00012779608368873596, -0.0001222863793373108, -0.00011677667498588562, -0.00011126697063446045, -0.00010575726628303528, -0.00010024756193161011, -9.473785758018494e-05, -8.922815322875977e-05, -8.37184488773346e-05, -7.820874452590942e-05, -7.269904017448425e-05, -6.718933582305908e-05, -6.167963147163391e-05, -5.616992712020874e-05, -5.066022276878357e-05, -4.51505184173584e-05, -3.964081406593323e-05, -3.413110971450806e-05, -2.8621405363082886e-05, -2.3111701011657715e-05, -1.7601996660232544e-05, -1.2092292308807373e-05, -6.582587957382202e-06, -1.0728836059570312e-06, 4.43682074546814e-06, 9.94652509689331e-06, 1.545622944831848e-05, 2.0965933799743652e-05, 2.6475638151168823e-05, 3.1985342502593994e-05, 3.7495046854019165e-05, 4.3004751205444336e-05, 4.851445555686951e-05, 5.402415990829468e-05, 5.953386425971985e-05, 6.504356861114502e-05, 7.055327296257019e-05, 7.606297731399536e-05, 8.157268166542053e-05, 8.70823860168457e-05, 9.259209036827087e-05, 9.810179471969604e-05, 0.00010361149907112122, 0.00010912120342254639, 0.00011463090777397156, 0.00012014061212539673, 0.0001256503164768219, 0.00013116002082824707, 0.00013666972517967224, 0.0001421794295310974, 0.00014768913388252258, 0.00015319883823394775, 0.00015870854258537292, 0.0001642182469367981, 0.00016972795128822327, 0.00017523765563964844]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 6.0, 4.0, 9.0, 10.0, 15.0, 19.0, 18.0, 17.0, 24.0, 27.0, 31.0, 22.0, 40.0, 43.0, 44.0, 47.0, 55.0, 43.0, 55.0, 53.0, 40.0, 40.0, 53.0, 39.0, 33.0, 39.0, 33.0, 30.0, 21.0, 22.0, 18.0, 10.0, 11.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6875, -9.3426513671875, -8.997802734375, -8.6529541015625, -8.30810546875, -7.9632568359375, -7.618408203125, -7.2735595703125, -6.9287109375, -6.5838623046875, -6.239013671875, -5.8941650390625, -5.54931640625, -5.2044677734375, -4.859619140625, -4.5147705078125, -4.169921875, -3.8250732421875, -3.480224609375, -3.1353759765625, -2.79052734375, -2.4456787109375, -2.100830078125, -1.7559814453125, -1.4111328125, -1.0662841796875, -0.721435546875, -0.3765869140625, -0.03173828125, 0.3131103515625, 0.657958984375, 1.0028076171875, 1.34765625, 1.6925048828125, 2.037353515625, 2.3822021484375, 2.72705078125, 3.0718994140625, 3.416748046875, 3.7615966796875, 4.1064453125, 4.4512939453125, 4.796142578125, 5.1409912109375, 5.48583984375, 5.8306884765625, 6.175537109375, 6.5203857421875, 6.865234375, 7.2100830078125, 7.554931640625, 7.8997802734375, 8.24462890625, 8.5894775390625, 8.934326171875, 9.2791748046875, 9.6240234375, 9.9688720703125, 10.313720703125, 10.6585693359375, 11.00341796875, 11.3482666015625, 11.693115234375, 12.0379638671875, 12.3828125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 10.0, 9.0, 10.0, 28.0, 47.0, 61.0, 68.0, 105.0, 145.0, 196.0, 270.0, 372.0, 537.0, 717.0, 1018.0, 1484.0, 2250.0, 3770.0, 9547.0, 66880.0, 622291.0, 294413.0, 28865.0, 6110.0, 2940.0, 1972.0, 1271.0, 914.0, 619.0, 470.0, 329.0, 243.0, 155.0, 121.0, 97.0, 62.0, 54.0, 33.0, 27.0, 18.0, 10.0, 10.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.84375, -26.968505859375, -26.09326171875, -25.218017578125, -24.3427734375, -23.467529296875, -22.59228515625, -21.717041015625, -20.841796875, -19.966552734375, -19.09130859375, -18.216064453125, -17.3408203125, -16.465576171875, -15.59033203125, -14.715087890625, -13.83984375, -12.964599609375, -12.08935546875, -11.214111328125, -10.3388671875, -9.463623046875, -8.58837890625, -7.713134765625, -6.837890625, -5.962646484375, -5.08740234375, -4.212158203125, -3.3369140625, -2.461669921875, -1.58642578125, -0.711181640625, 0.1640625, 1.039306640625, 1.91455078125, 2.789794921875, 3.6650390625, 4.540283203125, 5.41552734375, 6.290771484375, 7.166015625, 8.041259765625, 8.91650390625, 9.791748046875, 10.6669921875, 11.542236328125, 12.41748046875, 13.292724609375, 14.16796875, 15.043212890625, 15.91845703125, 16.793701171875, 17.6689453125, 18.544189453125, 19.41943359375, 20.294677734375, 21.169921875, 22.045166015625, 22.92041015625, 23.795654296875, 24.6708984375, 25.546142578125, 26.42138671875, 27.296630859375, 28.171875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 7.0, 7.0, 18.0, 12.0, 11.0, 13.0, 14.0, 13.0, 32.0, 24.0, 32.0, 40.0, 36.0, 41.0, 64.0, 78.0, 127.0, 202.0, 1398.0, 238.0, 139.0, 109.0, 67.0, 51.0, 36.0, 31.0, 27.0, 31.0, 20.0, 14.0, 14.0, 15.0, 9.0, 8.0, 9.0, 9.0, 12.0, 11.0, 5.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.96875, -21.25, -20.53125, -19.8125, -19.09375, -18.375, -17.65625, -16.9375, -16.21875, -15.5, -14.78125, -14.0625, -13.34375, -12.625, -11.90625, -11.1875, -10.46875, -9.75, -9.03125, -8.3125, -7.59375, -6.875, -6.15625, -5.4375, -4.71875, -4.0, -3.28125, -2.5625, -1.84375, -1.125, -0.40625, 0.3125, 1.03125, 1.75, 2.46875, 3.1875, 3.90625, 4.625, 5.34375, 6.0625, 6.78125, 7.5, 8.21875, 8.9375, 9.65625, 10.375, 11.09375, 11.8125, 12.53125, 13.25, 13.96875, 14.6875, 15.40625, 16.125, 16.84375, 17.5625, 18.28125, 19.0, 19.71875, 20.4375, 21.15625, 21.875, 22.59375, 23.3125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 8.0, 7.0, 10.0, 18.0, 20.0, 18.0, 26.0, 27.0, 48.0, 51.0, 82.0, 92.0, 126.0, 201.0, 314.0, 598.0, 1172.0, 2594.0, 40897.0, 3087255.0, 7966.0, 1870.0, 875.0, 460.0, 260.0, 186.0, 139.0, 83.0, 70.0, 38.0, 28.0, 38.0, 21.0, 11.0, 7.0, 11.0, 13.0, 12.0, 11.0, 7.0, 5.0, 6.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0], "bins": [-102.0625, -99.1728515625, -96.283203125, -93.3935546875, -90.50390625, -87.6142578125, -84.724609375, -81.8349609375, -78.9453125, -76.0556640625, -73.166015625, -70.2763671875, -67.38671875, -64.4970703125, -61.607421875, -58.7177734375, -55.828125, -52.9384765625, -50.048828125, -47.1591796875, -44.26953125, -41.3798828125, -38.490234375, -35.6005859375, -32.7109375, -29.8212890625, -26.931640625, -24.0419921875, -21.15234375, -18.2626953125, -15.373046875, -12.4833984375, -9.59375, -6.7041015625, -3.814453125, -0.9248046875, 1.96484375, 4.8544921875, 7.744140625, 10.6337890625, 13.5234375, 16.4130859375, 19.302734375, 22.1923828125, 25.08203125, 27.9716796875, 30.861328125, 33.7509765625, 36.640625, 39.5302734375, 42.419921875, 45.3095703125, 48.19921875, 51.0888671875, 53.978515625, 56.8681640625, 59.7578125, 62.6474609375, 65.537109375, 68.4267578125, 71.31640625, 74.2060546875, 77.095703125, 79.9853515625, 82.875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 30.0, 116.0, 209.0, 334.0, 201.0, 88.0, 18.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-296.62420654296875, -290.95709228515625, -285.2899475097656, -279.6228332519531, -273.9557189941406, -268.28857421875, -262.6214599609375, -256.954345703125, -251.28721618652344, -245.62008666992188, -239.95297241210938, -234.2858428955078, -228.61871337890625, -222.95159912109375, -217.2844696044922, -211.61734008789062, -205.95022583007812, -200.28309631347656, -194.61598205566406, -188.9488525390625, -183.28173828125, -177.61460876464844, -171.94747924804688, -166.28036499023438, -160.6132354736328, -154.94610595703125, -149.27899169921875, -143.6118621826172, -137.94473266601562, -132.27761840820312, -126.61048889160156, -120.94336700439453, -115.27623748779297, -109.60911560058594, -103.94198608398438, -98.27486419677734, -92.60774230957031, -86.94062042236328, -81.27349853515625, -75.60636901855469, -69.93924713134766, -64.27212524414062, -58.60499954223633, -52.93787384033203, -47.270751953125, -41.60363006591797, -35.93650436401367, -30.269378662109375, -24.602256774902344, -18.93513298034668, -13.268009185791016, -7.600885391235352, -1.9337615966796875, 3.7333621978759766, 9.40048599243164, 15.067611694335938, 20.73473358154297, 26.401857376098633, 32.0689811706543, 37.736106872558594, 43.403228759765625, 49.070350646972656, 54.73747634887695, 60.40460205078125, 66.07172393798828]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 9.0, 5.0, 9.0, 7.0, 7.0, 16.0, 12.0, 18.0, 19.0, 26.0, 17.0, 21.0, 32.0, 22.0, 32.0, 34.0, 40.0, 49.0, 32.0, 34.0, 29.0, 41.0, 45.0, 38.0, 44.0, 33.0, 49.0, 39.0, 35.0, 23.0, 31.0, 23.0, 17.0, 16.0, 19.0, 10.0, 9.0, 9.0, 13.0, 5.0, 4.0, 4.0, 5.0, 11.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-67.85401153564453, -65.82284545898438, -63.791683197021484, -61.76051712036133, -59.72935104370117, -57.69818878173828, -55.667022705078125, -53.63585662841797, -51.60469055175781, -49.573524475097656, -47.542362213134766, -45.51119613647461, -43.48003005981445, -41.44886779785156, -39.417701721191406, -37.38653564453125, -35.35537338256836, -33.3242073059082, -31.29304313659668, -29.261878967285156, -27.230712890625, -25.199548721313477, -23.168384552001953, -21.137218475341797, -19.106054306030273, -17.07489013671875, -15.043724060058594, -13.01255989074707, -10.98139476776123, -8.95022964477539, -6.919065475463867, -4.887900352478027, -2.856739044189453, -0.8255741596221924, 1.2055907249450684, 3.23675537109375, 5.26792049407959, 7.29908561706543, 9.330249786376953, 11.361414909362793, 13.392580032348633, 15.423745155334473, 17.454910278320312, 19.486074447631836, 21.51723861694336, 23.548404693603516, 25.57956886291504, 27.610733032226562, 29.64189910888672, 31.673063278198242, 33.704227447509766, 35.73539352416992, 37.76655960083008, 39.79772186279297, 41.828887939453125, 43.86005401611328, 45.89122009277344, 47.922386169433594, 49.953548431396484, 51.98471450805664, 54.0158805847168, 56.04704284667969, 58.078208923339844, 60.109375, 62.14053726196289]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 16.0, 10.0, 11.0, 14.0, 23.0, 16.0, 19.0, 26.0, 37.0, 37.0, 42.0, 42.0, 36.0, 62.0, 51.0, 55.0, 61.0, 54.0, 46.0, 46.0, 40.0, 29.0, 29.0, 35.0, 44.0, 14.0, 15.0, 11.0, 16.0, 11.0, 8.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9296875, -10.568115234375, -10.20654296875, -9.844970703125, -9.4833984375, -9.121826171875, -8.76025390625, -8.398681640625, -8.037109375, -7.675537109375, -7.31396484375, -6.952392578125, -6.5908203125, -6.229248046875, -5.86767578125, -5.506103515625, -5.14453125, -4.782958984375, -4.42138671875, -4.059814453125, -3.6982421875, -3.336669921875, -2.97509765625, -2.613525390625, -2.251953125, -1.890380859375, -1.52880859375, -1.167236328125, -0.8056640625, -0.444091796875, -0.08251953125, 0.279052734375, 0.640625, 1.002197265625, 1.36376953125, 1.725341796875, 2.0869140625, 2.448486328125, 2.81005859375, 3.171630859375, 3.533203125, 3.894775390625, 4.25634765625, 4.617919921875, 4.9794921875, 5.341064453125, 5.70263671875, 6.064208984375, 6.42578125, 6.787353515625, 7.14892578125, 7.510498046875, 7.8720703125, 8.233642578125, 8.59521484375, 8.956787109375, 9.318359375, 9.679931640625, 10.04150390625, 10.403076171875, 10.7646484375, 11.126220703125, 11.48779296875, 11.849365234375, 12.2109375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 3.0, 3.0, 8.0, 6.0, 6.0, 10.0, 14.0, 25.0, 16.0, 32.0, 34.0, 43.0, 48.0, 67.0, 91.0, 110.0, 194.0, 318.0, 528.0, 1145.0, 2575.0, 7029.0, 26271.0, 207154.0, 1806448.0, 1873369.0, 228518.0, 27607.0, 7395.0, 2518.0, 1115.0, 524.0, 339.0, 197.0, 120.0, 79.0, 71.0, 41.0, 37.0, 35.0, 27.0, 15.0, 20.0, 17.0, 15.0, 13.0, 6.0, 7.0, 4.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0], "bins": [-23.390625, -22.68212890625, -21.9736328125, -21.26513671875, -20.556640625, -19.84814453125, -19.1396484375, -18.43115234375, -17.72265625, -17.01416015625, -16.3056640625, -15.59716796875, -14.888671875, -14.18017578125, -13.4716796875, -12.76318359375, -12.0546875, -11.34619140625, -10.6376953125, -9.92919921875, -9.220703125, -8.51220703125, -7.8037109375, -7.09521484375, -6.38671875, -5.67822265625, -4.9697265625, -4.26123046875, -3.552734375, -2.84423828125, -2.1357421875, -1.42724609375, -0.71875, -0.01025390625, 0.6982421875, 1.40673828125, 2.115234375, 2.82373046875, 3.5322265625, 4.24072265625, 4.94921875, 5.65771484375, 6.3662109375, 7.07470703125, 7.783203125, 8.49169921875, 9.2001953125, 9.90869140625, 10.6171875, 11.32568359375, 12.0341796875, 12.74267578125, 13.451171875, 14.15966796875, 14.8681640625, 15.57666015625, 16.28515625, 16.99365234375, 17.7021484375, 18.41064453125, 19.119140625, 19.82763671875, 20.5361328125, 21.24462890625, 21.953125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 3.0, 7.0, 15.0, 14.0, 22.0, 16.0, 48.0, 48.0, 88.0, 91.0, 160.0, 211.0, 236.0, 357.0, 458.0, 509.0, 443.0, 372.0, 279.0, 202.0, 128.0, 105.0, 81.0, 43.0, 34.0, 24.0, 17.0, 14.0, 6.0, 9.0, 2.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0390625, -14.4530029296875, -13.866943359375, -13.2808837890625, -12.69482421875, -12.1087646484375, -11.522705078125, -10.9366455078125, -10.3505859375, -9.7645263671875, -9.178466796875, -8.5924072265625, -8.00634765625, -7.4202880859375, -6.834228515625, -6.2481689453125, -5.662109375, -5.0760498046875, -4.489990234375, -3.9039306640625, -3.31787109375, -2.7318115234375, -2.145751953125, -1.5596923828125, -0.9736328125, -0.3875732421875, 0.198486328125, 0.7845458984375, 1.37060546875, 1.9566650390625, 2.542724609375, 3.1287841796875, 3.71484375, 4.3009033203125, 4.886962890625, 5.4730224609375, 6.05908203125, 6.6451416015625, 7.231201171875, 7.8172607421875, 8.4033203125, 8.9893798828125, 9.575439453125, 10.1614990234375, 10.74755859375, 11.3336181640625, 11.919677734375, 12.5057373046875, 13.091796875, 13.6778564453125, 14.263916015625, 14.8499755859375, 15.43603515625, 16.0220947265625, 16.608154296875, 17.1942138671875, 17.7802734375, 18.3663330078125, 18.952392578125, 19.5384521484375, 20.12451171875, 20.7105712890625, 21.296630859375, 21.8826904296875, 22.46875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 4.0, 10.0, 8.0, 20.0, 18.0, 27.0, 55.0, 93.0, 169.0, 304.0, 639.0, 1573.0, 5300.0, 63567.0, 3869898.0, 240345.0, 8159.0, 2190.0, 845.0, 450.0, 234.0, 146.0, 72.0, 42.0, 33.0, 27.0, 15.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.03125, -52.37548828125, -50.7197265625, -49.06396484375, -47.408203125, -45.75244140625, -44.0966796875, -42.44091796875, -40.78515625, -39.12939453125, -37.4736328125, -35.81787109375, -34.162109375, -32.50634765625, -30.8505859375, -29.19482421875, -27.5390625, -25.88330078125, -24.2275390625, -22.57177734375, -20.916015625, -19.26025390625, -17.6044921875, -15.94873046875, -14.29296875, -12.63720703125, -10.9814453125, -9.32568359375, -7.669921875, -6.01416015625, -4.3583984375, -2.70263671875, -1.046875, 0.60888671875, 2.2646484375, 3.92041015625, 5.576171875, 7.23193359375, 8.8876953125, 10.54345703125, 12.19921875, 13.85498046875, 15.5107421875, 17.16650390625, 18.822265625, 20.47802734375, 22.1337890625, 23.78955078125, 25.4453125, 27.10107421875, 28.7568359375, 30.41259765625, 32.068359375, 33.72412109375, 35.3798828125, 37.03564453125, 38.69140625, 40.34716796875, 42.0029296875, 43.65869140625, 45.314453125, 46.97021484375, 48.6259765625, 50.28173828125, 51.9375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 76.0, 660.0, 261.0, 14.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-433.57232666015625, -417.31134033203125, -401.05035400390625, -384.78936767578125, -368.52838134765625, -352.26739501953125, -336.00640869140625, -319.74542236328125, -303.48443603515625, -287.22344970703125, -270.96246337890625, -254.70147705078125, -238.44049072265625, -222.17950439453125, -205.9185333251953, -189.6575469970703, -173.39657592773438, -157.13558959960938, -140.87460327148438, -124.6136245727539, -108.3526382446289, -92.0916519165039, -75.83067321777344, -59.56968688964844, -43.30870056152344, -27.04771614074707, -10.786731719970703, 5.474250793457031, 21.73523712158203, 37.99622344970703, 54.2572021484375, 70.5181884765625, 86.7791748046875, 103.0401611328125, 119.3011474609375, 135.5621337890625, 151.8231201171875, 168.0841064453125, 184.34507751464844, 200.60606384277344, 216.86705017089844, 233.12803649902344, 249.38902282714844, 265.6499938964844, 281.9109802246094, 298.1719665527344, 314.4329528808594, 330.6939392089844, 346.9549255371094, 363.2159118652344, 379.4768981933594, 395.7378845214844, 411.9988708496094, 428.2598571777344, 444.52081298828125, 460.78179931640625, 477.04278564453125, 493.30377197265625, 509.56475830078125, 525.8257446289062, 542.0867309570312, 558.3477172851562, 574.6087036132812, 590.8696899414062, 607.1306762695312]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 7.0, 8.0, 4.0, 8.0, 9.0, 8.0, 21.0, 10.0, 21.0, 18.0, 26.0, 20.0, 30.0, 25.0, 24.0, 32.0, 40.0, 39.0, 38.0, 36.0, 44.0, 40.0, 34.0, 48.0, 23.0, 46.0, 38.0, 37.0, 38.0, 25.0, 27.0, 25.0, 21.0, 18.0, 9.0, 25.0, 9.0, 18.0, 11.0, 6.0, 6.0, 9.0, 4.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.023075103759766, -57.93684005737305, -55.85060119628906, -53.764366149902344, -51.678131103515625, -49.59189224243164, -47.50565719604492, -45.41941833496094, -43.33318328857422, -41.2469482421875, -39.160709381103516, -37.0744743347168, -34.98823547363281, -32.902000427246094, -30.815765380859375, -28.729528427124023, -26.643291473388672, -24.55705451965332, -22.47081756591797, -20.38458251953125, -18.2983455657959, -16.212108612060547, -14.125872611999512, -12.039636611938477, -9.953399658203125, -7.867163181304932, -5.780926704406738, -3.694690227508545, -1.6084537506103516, 0.477783203125, 2.564019203186035, 4.65025520324707, 6.7364959716796875, 8.822732925415039, 10.908968925476074, 12.99520492553711, 15.081441879272461, 17.167678833007812, 19.25391387939453, 21.340150833129883, 23.426387786865234, 25.512624740600586, 27.598861694335938, 29.685096740722656, 31.771333694458008, 33.85757064819336, 35.94380569458008, 38.03004455566406, 40.11627960205078, 42.2025146484375, 44.288753509521484, 46.3749885559082, 48.46122741699219, 50.547462463378906, 52.633697509765625, 54.719932556152344, 56.80617141723633, 58.89240646362305, 60.97864532470703, 63.06488037109375, 65.15111541748047, 67.23735046386719, 69.32359313964844, 71.40982818603516, 73.49606323242188]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 10.0, 14.0, 16.0, 14.0, 15.0, 20.0, 16.0, 15.0, 33.0, 25.0, 25.0, 33.0, 41.0, 45.0, 39.0, 51.0, 46.0, 57.0, 51.0, 38.0, 37.0, 37.0, 37.0, 36.0, 32.0, 30.0, 31.0, 22.0, 20.0, 19.0, 19.0, 16.0, 11.0, 11.0, 15.0, 1.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.6796875, -8.421630859375, -8.16357421875, -7.905517578125, -7.6474609375, -7.389404296875, -7.13134765625, -6.873291015625, -6.615234375, -6.357177734375, -6.09912109375, -5.841064453125, -5.5830078125, -5.324951171875, -5.06689453125, -4.808837890625, -4.55078125, -4.292724609375, -4.03466796875, -3.776611328125, -3.5185546875, -3.260498046875, -3.00244140625, -2.744384765625, -2.486328125, -2.228271484375, -1.97021484375, -1.712158203125, -1.4541015625, -1.196044921875, -0.93798828125, -0.679931640625, -0.421875, -0.163818359375, 0.09423828125, 0.352294921875, 0.6103515625, 0.868408203125, 1.12646484375, 1.384521484375, 1.642578125, 1.900634765625, 2.15869140625, 2.416748046875, 2.6748046875, 2.932861328125, 3.19091796875, 3.448974609375, 3.70703125, 3.965087890625, 4.22314453125, 4.481201171875, 4.7392578125, 4.997314453125, 5.25537109375, 5.513427734375, 5.771484375, 6.029541015625, 6.28759765625, 6.545654296875, 6.8037109375, 7.061767578125, 7.31982421875, 7.577880859375, 7.8359375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 5.0, 7.0, 7.0, 17.0, 24.0, 30.0, 33.0, 57.0, 69.0, 84.0, 136.0, 202.0, 223.0, 425.0, 558.0, 833.0, 1220.0, 1667.0, 2525.0, 3450.0, 5262.0, 7654.0, 11475.0, 16573.0, 25169.0, 38025.0, 59343.0, 98651.0, 213844.0, 269535.0, 106269.0, 62966.0, 40117.0, 26681.0, 17718.0, 11975.0, 7988.0, 5543.0, 3686.0, 2605.0, 1841.0, 1277.0, 827.0, 606.0, 387.0, 269.0, 206.0, 114.0, 112.0, 77.0, 55.0, 56.0, 22.0, 30.0, 10.0, 16.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.8779296875, -1.819366455078125, -1.76080322265625, -1.702239990234375, -1.6436767578125, -1.585113525390625, -1.52655029296875, -1.467987060546875, -1.409423828125, -1.350860595703125, -1.29229736328125, -1.233734130859375, -1.1751708984375, -1.116607666015625, -1.05804443359375, -0.999481201171875, -0.94091796875, -0.882354736328125, -0.82379150390625, -0.765228271484375, -0.7066650390625, -0.648101806640625, -0.58953857421875, -0.530975341796875, -0.472412109375, -0.413848876953125, -0.35528564453125, -0.296722412109375, -0.2381591796875, -0.179595947265625, -0.12103271484375, -0.062469482421875, -0.00390625, 0.054656982421875, 0.11322021484375, 0.171783447265625, 0.2303466796875, 0.288909912109375, 0.34747314453125, 0.406036376953125, 0.464599609375, 0.523162841796875, 0.58172607421875, 0.640289306640625, 0.6988525390625, 0.757415771484375, 0.81597900390625, 0.874542236328125, 0.93310546875, 0.991668701171875, 1.05023193359375, 1.108795166015625, 1.1673583984375, 1.225921630859375, 1.28448486328125, 1.343048095703125, 1.401611328125, 1.460174560546875, 1.51873779296875, 1.577301025390625, 1.6358642578125, 1.694427490234375, 1.75299072265625, 1.811553955078125, 1.8701171875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 6.0, 6.0, 7.0, 11.0, 17.0, 13.0, 10.0, 22.0, 13.0, 31.0, 23.0, 19.0, 33.0, 30.0, 44.0, 37.0, 48.0, 45.0, 47.0, 1067.0, 46.0, 34.0, 38.0, 40.0, 42.0, 39.0, 26.0, 26.0, 26.0, 30.0, 25.0, 29.0, 24.0, 14.0, 14.0, 7.0, 10.0, 5.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.52850341796875, -5.3656005859375, -5.20269775390625, -5.039794921875, -4.87689208984375, -4.7139892578125, -4.55108642578125, -4.38818359375, -4.22528076171875, -4.0623779296875, -3.89947509765625, -3.736572265625, -3.57366943359375, -3.4107666015625, -3.24786376953125, -3.0849609375, -2.92205810546875, -2.7591552734375, -2.59625244140625, -2.433349609375, -2.27044677734375, -2.1075439453125, -1.94464111328125, -1.78173828125, -1.61883544921875, -1.4559326171875, -1.29302978515625, -1.130126953125, -0.96722412109375, -0.8043212890625, -0.64141845703125, -0.478515625, -0.31561279296875, -0.1527099609375, 0.01019287109375, 0.173095703125, 0.33599853515625, 0.4989013671875, 0.66180419921875, 0.82470703125, 0.98760986328125, 1.1505126953125, 1.31341552734375, 1.476318359375, 1.63922119140625, 1.8021240234375, 1.96502685546875, 2.1279296875, 2.29083251953125, 2.4537353515625, 2.61663818359375, 2.779541015625, 2.94244384765625, 3.1053466796875, 3.26824951171875, 3.43115234375, 3.59405517578125, 3.7569580078125, 3.91986083984375, 4.082763671875, 4.24566650390625, 4.4085693359375, 4.57147216796875, 4.734375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 0.0, 10.0, 11.0, 22.0, 23.0, 45.0, 80.0, 103.0, 151.0, 267.0, 407.0, 594.0, 958.0, 1395.0, 2142.0, 3200.0, 5093.0, 7639.0, 11688.0, 18367.0, 28456.0, 45866.0, 74656.0, 133784.0, 1371828.0, 161529.0, 85791.0, 52472.0, 32530.0, 20128.0, 13156.0, 8612.0, 5500.0, 3632.0, 2320.0, 1627.0, 1026.0, 728.0, 461.0, 287.0, 204.0, 119.0, 84.0, 47.0, 37.0, 16.0, 22.0, 11.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.142578125, -2.0788726806640625, -2.015167236328125, -1.9514617919921875, -1.88775634765625, -1.8240509033203125, -1.760345458984375, -1.6966400146484375, -1.6329345703125, -1.5692291259765625, -1.505523681640625, -1.4418182373046875, -1.37811279296875, -1.3144073486328125, -1.250701904296875, -1.1869964599609375, -1.123291015625, -1.0595855712890625, -0.995880126953125, -0.9321746826171875, -0.86846923828125, -0.8047637939453125, -0.741058349609375, -0.6773529052734375, -0.6136474609375, -0.5499420166015625, -0.486236572265625, -0.4225311279296875, -0.35882568359375, -0.2951202392578125, -0.231414794921875, -0.1677093505859375, -0.10400390625, -0.0402984619140625, 0.023406982421875, 0.0871124267578125, 0.15081787109375, 0.2145233154296875, 0.278228759765625, 0.3419342041015625, 0.4056396484375, 0.4693450927734375, 0.533050537109375, 0.5967559814453125, 0.66046142578125, 0.7241668701171875, 0.787872314453125, 0.8515777587890625, 0.915283203125, 0.9789886474609375, 1.042694091796875, 1.1063995361328125, 1.17010498046875, 1.2338104248046875, 1.297515869140625, 1.3612213134765625, 1.4249267578125, 1.4886322021484375, 1.552337646484375, 1.6160430908203125, 1.67974853515625, 1.7434539794921875, 1.807159423828125, 1.8708648681640625, 1.9345703125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 11.0, 10.0, 9.0, 10.0, 10.0, 19.0, 16.0, 19.0, 35.0, 19.0, 31.0, 48.0, 47.0, 66.0, 51.0, 71.0, 64.0, 71.0, 50.0, 42.0, 51.0, 39.0, 30.0, 22.0, 22.0, 27.0, 20.0, 16.0, 8.0, 10.0, 6.0, 9.0, 9.0, 4.0, 2.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003330707550048828, -0.0003230385482311249, -0.00031300634145736694, -0.000302974134683609, -0.0002929419279098511, -0.00028290972113609314, -0.0002728775143623352, -0.00026284530758857727, -0.00025281310081481934, -0.0002427808940410614, -0.00023274868726730347, -0.00022271648049354553, -0.0002126842737197876, -0.00020265206694602966, -0.00019261986017227173, -0.0001825876533985138, -0.00017255544662475586, -0.00016252323985099792, -0.00015249103307724, -0.00014245882630348206, -0.00013242661952972412, -0.0001223944127559662, -0.00011236220598220825, -0.00010232999920845032, -9.229779243469238e-05, -8.226558566093445e-05, -7.223337888717651e-05, -6.220117211341858e-05, -5.2168965339660645e-05, -4.213675856590271e-05, -3.2104551792144775e-05, -2.207234501838684e-05, -1.2040138244628906e-05, -2.0079314708709717e-06, 8.024275302886963e-06, 1.8056482076644897e-05, 2.8088688850402832e-05, 3.8120895624160767e-05, 4.81531023979187e-05, 5.8185309171676636e-05, 6.821751594543457e-05, 7.82497227191925e-05, 8.828192949295044e-05, 9.831413626670837e-05, 0.00010834634304046631, 0.00011837854981422424, 0.00012841075658798218, 0.0001384429633617401, 0.00014847517013549805, 0.00015850737690925598, 0.00016853958368301392, 0.00017857179045677185, 0.00018860399723052979, 0.00019863620400428772, 0.00020866841077804565, 0.0002187006175518036, 0.00022873282432556152, 0.00023876503109931946, 0.0002487972378730774, 0.00025882944464683533, 0.00026886165142059326, 0.0002788938581943512, 0.00028892606496810913, 0.00029895827174186707, 0.000308990478515625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 12.0, 14.0, 14.0, 26.0, 19.0, 21.0, 38.0, 36.0, 63.0, 64.0, 90.0, 125.0, 176.0, 288.0, 388.0, 625.0, 1409.0, 116673.0, 923404.0, 2642.0, 830.0, 466.0, 328.0, 177.0, 134.0, 115.0, 78.0, 57.0, 53.0, 32.0, 32.0, 21.0, 20.0, 13.0, 4.0, 8.0, 12.0, 4.0, 9.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004985809326171875, -0.00480884313583374, -0.0046318769454956055, -0.004454910755157471, -0.004277944564819336, -0.004100978374481201, -0.003924012184143066, -0.0037470459938049316, -0.003570079803466797, -0.003393113613128662, -0.0032161474227905273, -0.0030391812324523926, -0.002862215042114258, -0.002685248851776123, -0.0025082826614379883, -0.0023313164710998535, -0.0021543502807617188, -0.001977384090423584, -0.0018004179000854492, -0.0016234517097473145, -0.0014464855194091797, -0.001269519329071045, -0.0010925531387329102, -0.0009155869483947754, -0.0007386207580566406, -0.0005616545677185059, -0.0003846883773803711, -0.00020772218704223633, -3.075599670410156e-05, 0.0001462101936340332, 0.00032317638397216797, 0.0005001425743103027, 0.0006771087646484375, 0.0008540749549865723, 0.001031041145324707, 0.0012080073356628418, 0.0013849735260009766, 0.0015619397163391113, 0.001738905906677246, 0.0019158720970153809, 0.0020928382873535156, 0.0022698044776916504, 0.002446770668029785, 0.00262373685836792, 0.0028007030487060547, 0.0029776692390441895, 0.0031546354293823242, 0.003331601619720459, 0.0035085678100585938, 0.0036855340003967285, 0.0038625001907348633, 0.004039466381072998, 0.004216432571411133, 0.004393398761749268, 0.004570364952087402, 0.004747331142425537, 0.004924297332763672, 0.005101263523101807, 0.005278229713439941, 0.005455195903778076, 0.005632162094116211, 0.005809128284454346, 0.0059860944747924805, 0.006163060665130615, 0.00634002685546875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 14.0, 11.0, 126.0, 277.0, 289.0, 208.0, 64.0, 17.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004347774083726108, -0.0004204344004392624, -0.00040609139250591397, -0.00039174838457256556, -0.0003774054057430476, -0.0003630623978096992, -0.00034871938987635076, -0.00033437638194300234, -0.0003200334031134844, -0.00030569039518013597, -0.00029134738724678755, -0.00027700437931343913, -0.00026266140048392117, -0.00024831839255057275, -0.00023397538461722434, -0.00021963237668387592, -0.0002052893687505275, -0.00019094636081717908, -0.0001766033674357459, -0.00016226035950239748, -0.0001479173661209643, -0.00013357435818761587, -0.00011923135025426745, -0.00010488834959687665, -9.054534893948585e-05, -7.620234828209504e-05, -6.185934762470424e-05, -4.7516339691355824e-05, -3.317333903396502e-05, -1.8830338376574218e-05, -4.487330443225801e-06, 9.855670214165002e-06, 2.4198670871555805e-05, 3.854167152894661e-05, 5.288467582431622e-05, 6.722768011968583e-05, 8.157068077707663e-05, 9.591368143446743e-05, 0.00011025668936781585, 0.00012459969730116427, 0.00013894269068259746, 0.00015328569861594588, 0.00016762869199737906, 0.00018197169993072748, 0.0001963147078640759, 0.0002106577012455091, 0.0002250007091788575, 0.0002393437025602907, 0.0002536867104936391, 0.00026802971842698753, 0.00028237272636033595, 0.0002967157051898539, 0.0003110587131232023, 0.00032540172105655074, 0.00033974472898989916, 0.0003540877369232476, 0.000368430744856596, 0.0003827737527899444, 0.00039711676072329283, 0.00041145976865664124, 0.0004258027474861592, 0.0004401457554195076, 0.00045448876335285604, 0.00046883177128620446, 0.0004831747501157224]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 6.0, 7.0, 13.0, 9.0, 11.0, 16.0, 21.0, 22.0, 15.0, 30.0, 22.0, 27.0, 33.0, 44.0, 44.0, 34.0, 40.0, 39.0, 37.0, 42.0, 39.0, 45.0, 48.0, 33.0, 31.0, 29.0, 49.0, 25.0, 21.0, 23.0, 25.0, 18.0, 16.0, 16.0, 12.0, 12.0, 11.0, 5.0, 7.0, 5.0, 4.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001729130744934082, -0.00016749370843172073, -0.00016207434237003326, -0.0001566549763083458, -0.00015123561024665833, -0.00014581624418497086, -0.00014039687812328339, -0.00013497751206159592, -0.00012955814599990845, -0.00012413877993822098, -0.00011871941387653351, -0.00011330004781484604, -0.00010788068175315857, -0.0001024613156914711, -9.704194962978363e-05, -9.162258356809616e-05, -8.620321750640869e-05, -8.078385144472122e-05, -7.536448538303375e-05, -6.994511932134628e-05, -6.452575325965881e-05, -5.9106387197971344e-05, -5.3687021136283875e-05, -4.8267655074596405e-05, -4.2848289012908936e-05, -3.7428922951221466e-05, -3.2009556889533997e-05, -2.6590190827846527e-05, -2.1170824766159058e-05, -1.5751458704471588e-05, -1.0332092642784119e-05, -4.912726581096649e-06, 5.066394805908203e-07, 5.92600554227829e-06, 1.134537160396576e-05, 1.676473766565323e-05, 2.2184103727340698e-05, 2.7603469789028168e-05, 3.302283585071564e-05, 3.844220191240311e-05, 4.3861567974090576e-05, 4.9280934035778046e-05, 5.4700300097465515e-05, 6.0119666159152985e-05, 6.553903222084045e-05, 7.095839828252792e-05, 7.637776434421539e-05, 8.179713040590286e-05, 8.721649646759033e-05, 9.26358625292778e-05, 9.805522859096527e-05, 0.00010347459465265274, 0.00010889396071434021, 0.00011431332677602768, 0.00011973269283771515, 0.00012515205889940262, 0.0001305714249610901, 0.00013599079102277756, 0.00014141015708446503, 0.0001468295231461525, 0.00015224888920783997, 0.00015766825526952744, 0.0001630876213312149, 0.00016850698739290237, 0.00017392635345458984]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 10.0, 14.0, 16.0, 14.0, 15.0, 20.0, 16.0, 15.0, 33.0, 25.0, 25.0, 33.0, 41.0, 45.0, 39.0, 51.0, 46.0, 57.0, 51.0, 38.0, 37.0, 37.0, 37.0, 36.0, 32.0, 30.0, 31.0, 22.0, 20.0, 19.0, 19.0, 16.0, 11.0, 11.0, 15.0, 1.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.6796875, -8.421630859375, -8.16357421875, -7.905517578125, -7.6474609375, -7.389404296875, -7.13134765625, -6.873291015625, -6.615234375, -6.357177734375, -6.09912109375, -5.841064453125, -5.5830078125, -5.324951171875, -5.06689453125, -4.808837890625, -4.55078125, -4.292724609375, -4.03466796875, -3.776611328125, -3.5185546875, -3.260498046875, -3.00244140625, -2.744384765625, -2.486328125, -2.228271484375, -1.97021484375, -1.712158203125, -1.4541015625, -1.196044921875, -0.93798828125, -0.679931640625, -0.421875, -0.163818359375, 0.09423828125, 0.352294921875, 0.6103515625, 0.868408203125, 1.12646484375, 1.384521484375, 1.642578125, 1.900634765625, 2.15869140625, 2.416748046875, 2.6748046875, 2.932861328125, 3.19091796875, 3.448974609375, 3.70703125, 3.965087890625, 4.22314453125, 4.481201171875, 4.7392578125, 4.997314453125, 5.25537109375, 5.513427734375, 5.771484375, 6.029541015625, 6.28759765625, 6.545654296875, 6.8037109375, 7.061767578125, 7.31982421875, 7.577880859375, 7.8359375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 9.0, 3.0, 18.0, 23.0, 49.0, 39.0, 55.0, 79.0, 124.0, 135.0, 201.0, 314.0, 454.0, 682.0, 1129.0, 2037.0, 4318.0, 12114.0, 50005.0, 338058.0, 528544.0, 81070.0, 17195.0, 5640.0, 2490.0, 1284.0, 783.0, 513.0, 299.0, 235.0, 185.0, 109.0, 91.0, 70.0, 50.0, 32.0, 32.0, 19.0, 12.0, 11.0, 9.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.140625, -15.653564453125, -15.16650390625, -14.679443359375, -14.1923828125, -13.705322265625, -13.21826171875, -12.731201171875, -12.244140625, -11.757080078125, -11.27001953125, -10.782958984375, -10.2958984375, -9.808837890625, -9.32177734375, -8.834716796875, -8.34765625, -7.860595703125, -7.37353515625, -6.886474609375, -6.3994140625, -5.912353515625, -5.42529296875, -4.938232421875, -4.451171875, -3.964111328125, -3.47705078125, -2.989990234375, -2.5029296875, -2.015869140625, -1.52880859375, -1.041748046875, -0.5546875, -0.067626953125, 0.41943359375, 0.906494140625, 1.3935546875, 1.880615234375, 2.36767578125, 2.854736328125, 3.341796875, 3.828857421875, 4.31591796875, 4.802978515625, 5.2900390625, 5.777099609375, 6.26416015625, 6.751220703125, 7.23828125, 7.725341796875, 8.21240234375, 8.699462890625, 9.1865234375, 9.673583984375, 10.16064453125, 10.647705078125, 11.134765625, 11.621826171875, 12.10888671875, 12.595947265625, 13.0830078125, 13.570068359375, 14.05712890625, 14.544189453125, 15.03125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 6.0, 12.0, 10.0, 16.0, 15.0, 21.0, 17.0, 34.0, 29.0, 41.0, 49.0, 56.0, 82.0, 173.0, 1488.0, 404.0, 172.0, 87.0, 69.0, 35.0, 45.0, 38.0, 26.0, 21.0, 19.0, 11.0, 8.0, 15.0, 8.0, 7.0, 4.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.328125, -23.515380859375, -22.70263671875, -21.889892578125, -21.0771484375, -20.264404296875, -19.45166015625, -18.638916015625, -17.826171875, -17.013427734375, -16.20068359375, -15.387939453125, -14.5751953125, -13.762451171875, -12.94970703125, -12.136962890625, -11.32421875, -10.511474609375, -9.69873046875, -8.885986328125, -8.0732421875, -7.260498046875, -6.44775390625, -5.635009765625, -4.822265625, -4.009521484375, -3.19677734375, -2.384033203125, -1.5712890625, -0.758544921875, 0.05419921875, 0.866943359375, 1.6796875, 2.492431640625, 3.30517578125, 4.117919921875, 4.9306640625, 5.743408203125, 6.55615234375, 7.368896484375, 8.181640625, 8.994384765625, 9.80712890625, 10.619873046875, 11.4326171875, 12.245361328125, 13.05810546875, 13.870849609375, 14.68359375, 15.496337890625, 16.30908203125, 17.121826171875, 17.9345703125, 18.747314453125, 19.56005859375, 20.372802734375, 21.185546875, 21.998291015625, 22.81103515625, 23.623779296875, 24.4365234375, 25.249267578125, 26.06201171875, 26.874755859375, 27.6875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 10.0, 17.0, 16.0, 20.0, 28.0, 47.0, 50.0, 94.0, 107.0, 193.0, 259.0, 557.0, 1458.0, 8677.0, 3101117.0, 29461.0, 1951.0, 667.0, 326.0, 204.0, 134.0, 75.0, 55.0, 46.0, 22.0, 24.0, 26.0, 20.0, 7.0, 9.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-54.09375, -52.32763671875, -50.5615234375, -48.79541015625, -47.029296875, -45.26318359375, -43.4970703125, -41.73095703125, -39.96484375, -38.19873046875, -36.4326171875, -34.66650390625, -32.900390625, -31.13427734375, -29.3681640625, -27.60205078125, -25.8359375, -24.06982421875, -22.3037109375, -20.53759765625, -18.771484375, -17.00537109375, -15.2392578125, -13.47314453125, -11.70703125, -9.94091796875, -8.1748046875, -6.40869140625, -4.642578125, -2.87646484375, -1.1103515625, 0.65576171875, 2.421875, 4.18798828125, 5.9541015625, 7.72021484375, 9.486328125, 11.25244140625, 13.0185546875, 14.78466796875, 16.55078125, 18.31689453125, 20.0830078125, 21.84912109375, 23.615234375, 25.38134765625, 27.1474609375, 28.91357421875, 30.6796875, 32.44580078125, 34.2119140625, 35.97802734375, 37.744140625, 39.51025390625, 41.2763671875, 43.04248046875, 44.80859375, 46.57470703125, 48.3408203125, 50.10693359375, 51.873046875, 53.63916015625, 55.4052734375, 57.17138671875, 58.9375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [19.0, 51.0, 248.0, 450.0, 182.0, 49.0, 11.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.610172271728516, -8.819649696350098, -5.02912712097168, -1.2386045455932617, 2.5519180297851562, 6.342441558837891, 10.132963180541992, 13.923484802246094, 17.714008331298828, 21.504531860351562, 25.295053482055664, 29.085575103759766, 32.8760986328125, 36.666622161865234, 40.45714569091797, 44.24766540527344, 48.03818893432617, 51.828712463378906, 55.619232177734375, 59.40975570678711, 63.200279235839844, 66.99079895019531, 70.78132629394531, 74.57184600830078, 78.36236572265625, 82.15288543701172, 85.94341278076172, 89.73393249511719, 93.52445983886719, 97.31497955322266, 101.10549926757812, 104.89602661132812, 108.68655395507812, 112.4770736694336, 116.2676010131836, 120.05812072753906, 123.84864807128906, 127.63916778564453, 131.4296875, 135.22021484375, 139.0107421875, 142.80126953125, 146.59178161621094, 150.38230895996094, 154.17283630371094, 157.96334838867188, 161.75387573242188, 165.54440307617188, 169.3349151611328, 173.1254425048828, 176.91595458984375, 180.70648193359375, 184.49700927734375, 188.28753662109375, 192.0780487060547, 195.8685760498047, 199.65908813476562, 203.44961547851562, 207.24012756347656, 211.03065490722656, 214.82118225097656, 218.6116943359375, 222.4022216796875, 226.1927490234375, 229.9832763671875]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 8.0, 4.0, 5.0, 7.0, 7.0, 11.0, 11.0, 16.0, 19.0, 35.0, 26.0, 42.0, 36.0, 38.0, 40.0, 48.0, 40.0, 37.0, 57.0, 52.0, 35.0, 42.0, 26.0, 30.0, 43.0, 34.0, 30.0, 31.0, 30.0, 25.0, 21.0, 27.0, 11.0, 11.0, 13.0, 15.0, 6.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-53.00392532348633, -51.40496826171875, -49.80601119995117, -48.207054138183594, -46.608097076416016, -45.00914001464844, -43.41018295288086, -41.81122589111328, -40.2122688293457, -38.613311767578125, -37.01435470581055, -35.41539764404297, -33.81644058227539, -32.21748352050781, -30.618526458740234, -29.019569396972656, -27.420610427856445, -25.821653366088867, -24.22269630432129, -22.62373924255371, -21.024782180786133, -19.425825119018555, -17.826866149902344, -16.227909088134766, -14.628952980041504, -13.029995918273926, -11.431038856506348, -9.832080841064453, -8.233123779296875, -6.634167194366455, -5.035209655761719, -3.4362525939941406, -1.8372955322265625, -0.23833835124969482, 1.3606188297271729, 2.95957612991333, 4.558533191680908, 6.157490253448486, 7.756447792053223, 9.3554048538208, 10.954361915588379, 12.553318977355957, 14.152276039123535, 15.75123405456543, 17.350191116333008, 18.949148178100586, 20.548105239868164, 22.147062301635742, 23.74601936340332, 25.3449764251709, 26.943933486938477, 28.542890548706055, 30.141847610473633, 31.74080467224121, 33.33976364135742, 34.938720703125, 36.53767776489258, 38.136634826660156, 39.735591888427734, 41.33454895019531, 42.93350601196289, 44.53246307373047, 46.13142013549805, 47.730377197265625, 49.3293342590332]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 8.0, 8.0, 13.0, 15.0, 15.0, 22.0, 23.0, 24.0, 25.0, 43.0, 39.0, 37.0, 40.0, 45.0, 45.0, 49.0, 45.0, 43.0, 46.0, 47.0, 55.0, 26.0, 35.0, 30.0, 32.0, 26.0, 31.0, 13.0, 24.0, 14.0, 12.0, 15.0, 7.0, 5.0, 6.0, 6.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-11.1484375, -10.8441162109375, -10.539794921875, -10.2354736328125, -9.93115234375, -9.6268310546875, -9.322509765625, -9.0181884765625, -8.7138671875, -8.4095458984375, -8.105224609375, -7.8009033203125, -7.49658203125, -7.1922607421875, -6.887939453125, -6.5836181640625, -6.279296875, -5.9749755859375, -5.670654296875, -5.3663330078125, -5.06201171875, -4.7576904296875, -4.453369140625, -4.1490478515625, -3.8447265625, -3.5404052734375, -3.236083984375, -2.9317626953125, -2.62744140625, -2.3231201171875, -2.018798828125, -1.7144775390625, -1.41015625, -1.1058349609375, -0.801513671875, -0.4971923828125, -0.19287109375, 0.1114501953125, 0.415771484375, 0.7200927734375, 1.0244140625, 1.3287353515625, 1.633056640625, 1.9373779296875, 2.24169921875, 2.5460205078125, 2.850341796875, 3.1546630859375, 3.458984375, 3.7633056640625, 4.067626953125, 4.3719482421875, 4.67626953125, 4.9805908203125, 5.284912109375, 5.5892333984375, 5.8935546875, 6.1978759765625, 6.502197265625, 6.8065185546875, 7.11083984375, 7.4151611328125, 7.719482421875, 8.0238037109375, 8.328125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 10.0, 9.0, 9.0, 11.0, 12.0, 23.0, 21.0, 40.0, 45.0, 60.0, 99.0, 110.0, 160.0, 209.0, 310.0, 549.0, 781.0, 1335.0, 3538.0, 38922.0, 2809211.0, 1315662.0, 17073.0, 2695.0, 1203.0, 645.0, 392.0, 306.0, 214.0, 174.0, 119.0, 83.0, 72.0, 52.0, 25.0, 28.0, 14.0, 13.0, 9.0, 12.0, 7.0, 9.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0], "bins": [-56.0, -54.4814453125, -52.962890625, -51.4443359375, -49.92578125, -48.4072265625, -46.888671875, -45.3701171875, -43.8515625, -42.3330078125, -40.814453125, -39.2958984375, -37.77734375, -36.2587890625, -34.740234375, -33.2216796875, -31.703125, -30.1845703125, -28.666015625, -27.1474609375, -25.62890625, -24.1103515625, -22.591796875, -21.0732421875, -19.5546875, -18.0361328125, -16.517578125, -14.9990234375, -13.48046875, -11.9619140625, -10.443359375, -8.9248046875, -7.40625, -5.8876953125, -4.369140625, -2.8505859375, -1.33203125, 0.1865234375, 1.705078125, 3.2236328125, 4.7421875, 6.2607421875, 7.779296875, 9.2978515625, 10.81640625, 12.3349609375, 13.853515625, 15.3720703125, 16.890625, 18.4091796875, 19.927734375, 21.4462890625, 22.96484375, 24.4833984375, 26.001953125, 27.5205078125, 29.0390625, 30.5576171875, 32.076171875, 33.5947265625, 35.11328125, 36.6318359375, 38.150390625, 39.6689453125, 41.1875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 10.0, 11.0, 9.0, 30.0, 48.0, 52.0, 109.0, 200.0, 291.0, 470.0, 622.0, 689.0, 545.0, 384.0, 229.0, 135.0, 80.0, 54.0, 30.0, 15.0, 13.0, 14.0, 5.0, 3.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.390625, -20.70751953125, -20.0244140625, -19.34130859375, -18.658203125, -17.97509765625, -17.2919921875, -16.60888671875, -15.92578125, -15.24267578125, -14.5595703125, -13.87646484375, -13.193359375, -12.51025390625, -11.8271484375, -11.14404296875, -10.4609375, -9.77783203125, -9.0947265625, -8.41162109375, -7.728515625, -7.04541015625, -6.3623046875, -5.67919921875, -4.99609375, -4.31298828125, -3.6298828125, -2.94677734375, -2.263671875, -1.58056640625, -0.8974609375, -0.21435546875, 0.46875, 1.15185546875, 1.8349609375, 2.51806640625, 3.201171875, 3.88427734375, 4.5673828125, 5.25048828125, 5.93359375, 6.61669921875, 7.2998046875, 7.98291015625, 8.666015625, 9.34912109375, 10.0322265625, 10.71533203125, 11.3984375, 12.08154296875, 12.7646484375, 13.44775390625, 14.130859375, 14.81396484375, 15.4970703125, 16.18017578125, 16.86328125, 17.54638671875, 18.2294921875, 18.91259765625, 19.595703125, 20.27880859375, 20.9619140625, 21.64501953125, 22.328125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 8.0, 21.0, 30.0, 50.0, 95.0, 177.0, 343.0, 584.0, 1207.0, 2747.0, 7677.0, 36324.0, 373870.0, 3025278.0, 673280.0, 56186.0, 10137.0, 3282.0, 1388.0, 711.0, 360.0, 217.0, 127.0, 52.0, 46.0, 20.0, 7.0, 8.0, 6.0, 6.0, 7.0, 0.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.328125, -20.6533203125, -19.978515625, -19.3037109375, -18.62890625, -17.9541015625, -17.279296875, -16.6044921875, -15.9296875, -15.2548828125, -14.580078125, -13.9052734375, -13.23046875, -12.5556640625, -11.880859375, -11.2060546875, -10.53125, -9.8564453125, -9.181640625, -8.5068359375, -7.83203125, -7.1572265625, -6.482421875, -5.8076171875, -5.1328125, -4.4580078125, -3.783203125, -3.1083984375, -2.43359375, -1.7587890625, -1.083984375, -0.4091796875, 0.265625, 0.9404296875, 1.615234375, 2.2900390625, 2.96484375, 3.6396484375, 4.314453125, 4.9892578125, 5.6640625, 6.3388671875, 7.013671875, 7.6884765625, 8.36328125, 9.0380859375, 9.712890625, 10.3876953125, 11.0625, 11.7373046875, 12.412109375, 13.0869140625, 13.76171875, 14.4365234375, 15.111328125, 15.7861328125, 16.4609375, 17.1357421875, 17.810546875, 18.4853515625, 19.16015625, 19.8349609375, 20.509765625, 21.1845703125, 21.859375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 7.0, 14.0, 20.0, 27.0, 34.0, 54.0, 52.0, 82.0, 83.0, 107.0, 106.0, 90.0, 84.0, 61.0, 50.0, 45.0, 25.0, 20.0, 18.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.49153900146484, -72.17437744140625, -68.85720825195312, -65.54004669189453, -62.22288513183594, -58.905723571777344, -55.588558197021484, -52.271392822265625, -48.95423126220703, -45.63706970214844, -42.31990432739258, -39.00273895263672, -35.685577392578125, -32.36841583251953, -29.051250457763672, -25.734086990356445, -22.41692352294922, -19.099760055541992, -15.782596588134766, -12.465433120727539, -9.148269653320312, -5.831106185913086, -2.5139427185058594, 0.8032207489013672, 4.120384216308594, 7.43754768371582, 10.754711151123047, 14.071874618530273, 17.3890380859375, 20.706201553344727, 24.023365020751953, 27.34052848815918, 30.657684326171875, 33.97484588623047, 37.29201126098633, 40.60917663574219, 43.92633819580078, 47.243499755859375, 50.560665130615234, 53.877830505371094, 57.19499206542969, 60.51215362548828, 63.82931900024414, 67.146484375, 70.4636459350586, 73.78080749511719, 77.09797668457031, 80.4151382446289, 83.7322998046875, 87.0494613647461, 90.36662292480469, 93.68379211425781, 97.0009536743164, 100.318115234375, 103.63528442382812, 106.95244598388672, 110.26960754394531, 113.5867691040039, 116.9039306640625, 120.22109985351562, 123.53826141357422, 126.85542297363281, 130.17259216308594, 133.48974609375, 136.80691528320312]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 10.0, 6.0, 12.0, 14.0, 9.0, 15.0, 12.0, 28.0, 31.0, 27.0, 39.0, 32.0, 43.0, 35.0, 47.0, 37.0, 46.0, 37.0, 37.0, 40.0, 51.0, 31.0, 34.0, 32.0, 45.0, 29.0, 28.0, 23.0, 23.0, 15.0, 21.0, 18.0, 13.0, 15.0, 8.0, 7.0, 6.0, 5.0, 4.0, 5.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.383052825927734, -48.646949768066406, -46.91084671020508, -45.17474365234375, -43.43864059448242, -41.702537536621094, -39.966434478759766, -38.23033142089844, -36.49422836303711, -34.75812530517578, -33.02202224731445, -31.285919189453125, -29.549816131591797, -27.81371307373047, -26.07761001586914, -24.341506958007812, -22.605403900146484, -20.869300842285156, -19.133197784423828, -17.3970947265625, -15.660991668701172, -13.924888610839844, -12.188785552978516, -10.452682495117188, -8.71657943725586, -6.980476379394531, -5.244373321533203, -3.508270263671875, -1.7721672058105469, -0.03606414794921875, 1.7000389099121094, 3.4361419677734375, 5.172245025634766, 6.908348083496094, 8.644451141357422, 10.38055419921875, 12.116657257080078, 13.852760314941406, 15.588863372802734, 17.324966430664062, 19.06106948852539, 20.79717254638672, 22.533275604248047, 24.269378662109375, 26.005481719970703, 27.74158477783203, 29.47768783569336, 31.213790893554688, 32.949893951416016, 34.685997009277344, 36.42210006713867, 38.158203125, 39.89430618286133, 41.630409240722656, 43.366512298583984, 45.10261535644531, 46.83871841430664, 48.57482147216797, 50.3109245300293, 52.047027587890625, 53.78313064575195, 55.51923370361328, 57.25533676147461, 58.99143981933594, 60.727542877197266]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 12.0, 8.0, 13.0, 8.0, 11.0, 15.0, 16.0, 20.0, 23.0, 25.0, 33.0, 27.0, 48.0, 42.0, 39.0, 39.0, 51.0, 36.0, 52.0, 44.0, 44.0, 34.0, 40.0, 40.0, 34.0, 33.0, 27.0, 33.0, 16.0, 23.0, 15.0, 12.0, 16.0, 16.0, 12.0, 5.0, 7.0, 4.0, 6.0, 2.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.25, -82.2626953125, -79.275390625, -76.2880859375, -73.30078125, -70.3134765625, -67.326171875, -64.3388671875, -61.3515625, -58.3642578125, -55.376953125, -52.3896484375, -49.40234375, -46.4150390625, -43.427734375, -40.4404296875, -37.453125, -34.4658203125, -31.478515625, -28.4912109375, -25.50390625, -22.5166015625, -19.529296875, -16.5419921875, -13.5546875, -10.5673828125, -7.580078125, -4.5927734375, -1.60546875, 1.3818359375, 4.369140625, 7.3564453125, 10.34375, 13.3310546875, 16.318359375, 19.3056640625, 22.29296875, 25.2802734375, 28.267578125, 31.2548828125, 34.2421875, 37.2294921875, 40.216796875, 43.2041015625, 46.19140625, 49.1787109375, 52.166015625, 55.1533203125, 58.140625, 61.1279296875, 64.115234375, 67.1025390625, 70.08984375, 73.0771484375, 76.064453125, 79.0517578125, 82.0390625, 85.0263671875, 88.013671875, 91.0009765625, 93.98828125, 96.9755859375, 99.962890625, 102.9501953125, 105.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 5.0, 13.0, 20.0, 24.0, 48.0, 61.0, 91.0, 143.0, 208.0, 320.0, 468.0, 729.0, 1085.0, 1642.0, 2387.0, 3579.0, 5340.0, 8105.0, 11998.0, 18757.0, 30027.0, 50637.0, 91290.0, 202936.0, 333031.0, 120670.0, 62986.0, 36718.0, 22436.0, 14465.0, 9400.0, 6236.0, 4198.0, 2844.0, 1884.0, 1215.0, 887.0, 565.0, 381.0, 225.0, 171.0, 130.0, 70.0, 44.0, 30.0, 20.0, 17.0, 10.0, 2.0, 4.0, 0.0, 3.0, 2.0], "bins": [-27.265625, -26.490966796875, -25.71630859375, -24.941650390625, -24.1669921875, -23.392333984375, -22.61767578125, -21.843017578125, -21.068359375, -20.293701171875, -19.51904296875, -18.744384765625, -17.9697265625, -17.195068359375, -16.42041015625, -15.645751953125, -14.87109375, -14.096435546875, -13.32177734375, -12.547119140625, -11.7724609375, -10.997802734375, -10.22314453125, -9.448486328125, -8.673828125, -7.899169921875, -7.12451171875, -6.349853515625, -5.5751953125, -4.800537109375, -4.02587890625, -3.251220703125, -2.4765625, -1.701904296875, -0.92724609375, -0.152587890625, 0.6220703125, 1.396728515625, 2.17138671875, 2.946044921875, 3.720703125, 4.495361328125, 5.27001953125, 6.044677734375, 6.8193359375, 7.593994140625, 8.36865234375, 9.143310546875, 9.91796875, 10.692626953125, 11.46728515625, 12.241943359375, 13.0166015625, 13.791259765625, 14.56591796875, 15.340576171875, 16.115234375, 16.889892578125, 17.66455078125, 18.439208984375, 19.2138671875, 19.988525390625, 20.76318359375, 21.537841796875, 22.3125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 7.0, 10.0, 11.0, 6.0, 16.0, 21.0, 15.0, 31.0, 21.0, 26.0, 39.0, 30.0, 33.0, 40.0, 37.0, 30.0, 41.0, 43.0, 1058.0, 39.0, 45.0, 34.0, 34.0, 29.0, 32.0, 29.0, 28.0, 30.0, 33.0, 28.0, 16.0, 18.0, 17.0, 17.0, 13.0, 11.0, 9.0, 5.0, 8.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-55.96875, -54.208984375, -52.44921875, -50.689453125, -48.9296875, -47.169921875, -45.41015625, -43.650390625, -41.890625, -40.130859375, -38.37109375, -36.611328125, -34.8515625, -33.091796875, -31.33203125, -29.572265625, -27.8125, -26.052734375, -24.29296875, -22.533203125, -20.7734375, -19.013671875, -17.25390625, -15.494140625, -13.734375, -11.974609375, -10.21484375, -8.455078125, -6.6953125, -4.935546875, -3.17578125, -1.416015625, 0.34375, 2.103515625, 3.86328125, 5.623046875, 7.3828125, 9.142578125, 10.90234375, 12.662109375, 14.421875, 16.181640625, 17.94140625, 19.701171875, 21.4609375, 23.220703125, 24.98046875, 26.740234375, 28.5, 30.259765625, 32.01953125, 33.779296875, 35.5390625, 37.298828125, 39.05859375, 40.818359375, 42.578125, 44.337890625, 46.09765625, 47.857421875, 49.6171875, 51.376953125, 53.13671875, 54.896484375, 56.65625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 10.0, 16.0, 29.0, 35.0, 52.0, 79.0, 131.0, 185.0, 265.0, 368.0, 526.0, 754.0, 1059.0, 1383.0, 2019.0, 2919.0, 4389.0, 6152.0, 9088.0, 13508.0, 20205.0, 30740.0, 46916.0, 72180.0, 116561.0, 1333126.0, 170839.0, 89928.0, 58345.0, 37971.0, 25294.0, 16498.0, 11098.0, 7474.0, 5258.0, 3465.0, 2492.0, 1711.0, 1201.0, 819.0, 606.0, 458.0, 317.0, 212.0, 156.0, 89.0, 76.0, 51.0, 29.0, 20.0, 7.0, 13.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-21.0, -20.338623046875, -19.67724609375, -19.015869140625, -18.3544921875, -17.693115234375, -17.03173828125, -16.370361328125, -15.708984375, -15.047607421875, -14.38623046875, -13.724853515625, -13.0634765625, -12.402099609375, -11.74072265625, -11.079345703125, -10.41796875, -9.756591796875, -9.09521484375, -8.433837890625, -7.7724609375, -7.111083984375, -6.44970703125, -5.788330078125, -5.126953125, -4.465576171875, -3.80419921875, -3.142822265625, -2.4814453125, -1.820068359375, -1.15869140625, -0.497314453125, 0.1640625, 0.825439453125, 1.48681640625, 2.148193359375, 2.8095703125, 3.470947265625, 4.13232421875, 4.793701171875, 5.455078125, 6.116455078125, 6.77783203125, 7.439208984375, 8.1005859375, 8.761962890625, 9.42333984375, 10.084716796875, 10.74609375, 11.407470703125, 12.06884765625, 12.730224609375, 13.3916015625, 14.052978515625, 14.71435546875, 15.375732421875, 16.037109375, 16.698486328125, 17.35986328125, 18.021240234375, 18.6826171875, 19.343994140625, 20.00537109375, 20.666748046875, 21.328125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 9.0, 9.0, 5.0, 15.0, 22.0, 28.0, 32.0, 32.0, 44.0, 52.0, 50.0, 52.0, 68.0, 96.0, 65.0, 64.0, 71.0, 46.0, 41.0, 30.0, 24.0, 23.0, 16.0, 12.0, 17.0, 5.0, 8.0, 6.0, 6.0, 6.0, 6.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0042724609375, -0.004152268171310425, -0.00403207540512085, -0.003911882638931274, -0.0037916898727416992, -0.003671497106552124, -0.003551304340362549, -0.0034311115741729736, -0.0033109188079833984, -0.0031907260417938232, -0.003070533275604248, -0.002950340509414673, -0.0028301477432250977, -0.0027099549770355225, -0.0025897622108459473, -0.002469569444656372, -0.002349376678466797, -0.0022291839122772217, -0.0021089911460876465, -0.0019887983798980713, -0.001868605613708496, -0.001748412847518921, -0.0016282200813293457, -0.0015080273151397705, -0.0013878345489501953, -0.0012676417827606201, -0.001147449016571045, -0.0010272562503814697, -0.0009070634841918945, -0.0007868707180023193, -0.0006666779518127441, -0.0005464851856231689, -0.00042629241943359375, -0.00030609965324401855, -0.00018590688705444336, -6.571412086486816e-05, 5.447864532470703e-05, 0.00017467141151428223, 0.0002948641777038574, 0.0004150569438934326, 0.0005352497100830078, 0.000655442476272583, 0.0007756352424621582, 0.0008958280086517334, 0.0010160207748413086, 0.0011362135410308838, 0.001256406307220459, 0.0013765990734100342, 0.0014967918395996094, 0.0016169846057891846, 0.0017371773719787598, 0.001857370138168335, 0.00197756290435791, 0.0020977556705474854, 0.0022179484367370605, 0.0023381412029266357, 0.002458333969116211, 0.002578526735305786, 0.0026987195014953613, 0.0028189122676849365, 0.0029391050338745117, 0.003059297800064087, 0.003179490566253662, 0.0032996833324432373, 0.0034198760986328125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 3.0, 7.0, 15.0, 18.0, 26.0, 30.0, 42.0, 63.0, 81.0, 119.0, 197.0, 324.0, 482.0, 952.0, 1904.0, 4202.0, 10197.0, 28772.0, 88503.0, 307866.0, 414357.0, 126333.0, 39433.0, 13861.0, 5553.0, 2417.0, 1159.0, 637.0, 361.0, 180.0, 146.0, 93.0, 74.0, 44.0, 26.0, 26.0, 14.0, 9.0, 4.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0205078125, -0.01980423927307129, -0.019100666046142578, -0.018397092819213867, -0.017693519592285156, -0.016989946365356445, -0.016286373138427734, -0.015582799911499023, -0.014879226684570312, -0.014175653457641602, -0.01347208023071289, -0.01276850700378418, -0.012064933776855469, -0.011361360549926758, -0.010657787322998047, -0.009954214096069336, -0.009250640869140625, -0.008547067642211914, -0.007843494415283203, -0.007139921188354492, -0.006436347961425781, -0.00573277473449707, -0.005029201507568359, -0.0043256282806396484, -0.0036220550537109375, -0.0029184818267822266, -0.0022149085998535156, -0.0015113353729248047, -0.0008077621459960938, -0.00010418891906738281, 0.0005993843078613281, 0.001302957534790039, 0.00200653076171875, 0.002710103988647461, 0.003413677215576172, 0.004117250442504883, 0.004820823669433594, 0.005524396896362305, 0.006227970123291016, 0.0069315433502197266, 0.0076351165771484375, 0.008338689804077148, 0.00904226303100586, 0.00974583625793457, 0.010449409484863281, 0.011152982711791992, 0.011856555938720703, 0.012560129165649414, 0.013263702392578125, 0.013967275619506836, 0.014670848846435547, 0.015374422073364258, 0.01607799530029297, 0.01678156852722168, 0.01748514175415039, 0.0181887149810791, 0.018892288208007812, 0.019595861434936523, 0.020299434661865234, 0.021003007888793945, 0.021706581115722656, 0.022410154342651367, 0.023113727569580078, 0.02381730079650879, 0.0245208740234375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 11.0, 12.0, 22.0, 34.0, 42.0, 90.0, 119.0, 143.0, 137.0, 125.0, 86.0, 78.0, 44.0, 34.0, 10.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.008746042847633362, -0.008561247028410435, -0.008376451209187508, -0.00819165538996458, -0.008006859570741653, -0.007822063751518726, -0.007637267932295799, -0.007452472113072872, -0.007267676293849945, -0.007082880474627018, -0.006898084655404091, -0.006713288836181164, -0.006528493016958237, -0.00634369719773531, -0.0061589013785123825, -0.005974105559289455, -0.005789309740066528, -0.005604513920843601, -0.005419718101620674, -0.005234922282397747, -0.00505012646317482, -0.004865330643951893, -0.004680534824728966, -0.004495739005506039, -0.004310943186283112, -0.0041261473670601845, -0.003941351547837257, -0.0037565557286143303, -0.003571759909391403, -0.003386964090168476, -0.003202168270945549, -0.003017372451722622, -0.0028325768653303385, -0.0026477810461074114, -0.0024629852268844843, -0.002278189407661557, -0.00209339358843863, -0.001908597769215703, -0.001723801949992776, -0.0015390061307698488, -0.0013542103115469217, -0.0011694144923239946, -0.0009846186731010675, -0.0007998228538781404, -0.0006150270346552134, -0.00043023121543228626, -0.00024543539620935917, -6.0639576986432076e-05, 0.00012415624223649502, 0.0003089520614594221, 0.0004937478806823492, 0.0006785436999052763, 0.0008633395191282034, 0.0010481353383511305, 0.0012329311575740576, 0.0014177269767969847, 0.0016025227960199118, 0.0017873186152428389, 0.001972114434465766, 0.002156910253688693, 0.00234170607291162, 0.0025265018921345472, 0.0027112977113574743, 0.0028960935305804014, 0.0030808893498033285]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 12.0, 9.0, 9.0, 6.0, 18.0, 16.0, 14.0, 17.0, 23.0, 26.0, 32.0, 37.0, 31.0, 33.0, 33.0, 36.0, 44.0, 31.0, 34.0, 36.0, 38.0, 37.0, 40.0, 38.0, 32.0, 34.0, 36.0, 26.0, 18.0, 24.0, 23.0, 25.0, 18.0, 14.0, 12.0, 17.0, 11.0, 11.0, 4.0, 11.0, 10.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0015822052955627441, -0.0015275003388524055, -0.001472795382142067, -0.0014180904254317284, -0.0013633854687213898, -0.0013086805120110512, -0.0012539755553007126, -0.001199270598590374, -0.0011445656418800354, -0.0010898606851696968, -0.0010351557284593582, -0.0009804507717490196, -0.000925745815038681, -0.0008710408583283424, -0.0008163359016180038, -0.0007616309449076653, -0.0007069259881973267, -0.0006522210314869881, -0.0005975160747766495, -0.0005428111180663109, -0.0004881061613559723, -0.0004334012046456337, -0.0003786962479352951, -0.0003239912912249565, -0.0002692863345146179, -0.00021458137780427933, -0.00015987642109394073, -0.00010517146438360214, -5.046650767326355e-05, 4.238449037075043e-06, 5.8943405747413635e-05, 0.00011364836245775223, 0.00016835331916809082, 0.0002230582758784294, 0.000277763232588768, 0.0003324681892991066, 0.0003871731460094452, 0.0004418781027197838, 0.0004965830594301224, 0.000551288016140461, 0.0006059929728507996, 0.0006606979295611382, 0.0007154028862714767, 0.0007701078429818153, 0.0008248127996921539, 0.0008795177564024925, 0.0009342227131128311, 0.0009889276698231697, 0.0010436326265335083, 0.001098337583243847, 0.0011530425399541855, 0.001207747496664524, 0.0012624524533748627, 0.0013171574100852013, 0.0013718623667955399, 0.0014265673235058784, 0.001481272280216217, 0.0015359772369265556, 0.0015906821936368942, 0.0016453871503472328, 0.0017000921070575714, 0.00175479706376791, 0.0018095020204782486, 0.0018642069771885872, 0.0019189119338989258]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 12.0, 8.0, 13.0, 8.0, 11.0, 15.0, 17.0, 20.0, 22.0, 25.0, 33.0, 27.0, 49.0, 41.0, 39.0, 39.0, 51.0, 36.0, 52.0, 44.0, 44.0, 34.0, 40.0, 40.0, 34.0, 33.0, 27.0, 32.0, 16.0, 24.0, 15.0, 12.0, 16.0, 16.0, 12.0, 5.0, 7.0, 4.0, 6.0, 2.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.1875, -82.2021484375, -79.216796875, -76.2314453125, -73.24609375, -70.2607421875, -67.275390625, -64.2900390625, -61.3046875, -58.3193359375, -55.333984375, -52.3486328125, -49.36328125, -46.3779296875, -43.392578125, -40.4072265625, -37.421875, -34.4365234375, -31.451171875, -28.4658203125, -25.48046875, -22.4951171875, -19.509765625, -16.5244140625, -13.5390625, -10.5537109375, -7.568359375, -4.5830078125, -1.59765625, 1.3876953125, 4.373046875, 7.3583984375, 10.34375, 13.3291015625, 16.314453125, 19.2998046875, 22.28515625, 25.2705078125, 28.255859375, 31.2412109375, 34.2265625, 37.2119140625, 40.197265625, 43.1826171875, 46.16796875, 49.1533203125, 52.138671875, 55.1240234375, 58.109375, 61.0947265625, 64.080078125, 67.0654296875, 70.05078125, 73.0361328125, 76.021484375, 79.0068359375, 81.9921875, 84.9775390625, 87.962890625, 90.9482421875, 93.93359375, 96.9189453125, 99.904296875, 102.8896484375, 105.875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 11.0, 11.0, 13.0, 26.0, 32.0, 39.0, 63.0, 77.0, 131.0, 161.0, 320.0, 487.0, 887.0, 1627.0, 3473.0, 8766.0, 29500.0, 127620.0, 479288.0, 301839.0, 66037.0, 16768.0, 5755.0, 2561.0, 1233.0, 684.0, 408.0, 228.0, 140.0, 108.0, 87.0, 39.0, 37.0, 27.0, 21.0, 10.0, 7.0, 6.0, 9.0, 6.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.796875, -18.186279296875, -17.57568359375, -16.965087890625, -16.3544921875, -15.743896484375, -15.13330078125, -14.522705078125, -13.912109375, -13.301513671875, -12.69091796875, -12.080322265625, -11.4697265625, -10.859130859375, -10.24853515625, -9.637939453125, -9.02734375, -8.416748046875, -7.80615234375, -7.195556640625, -6.5849609375, -5.974365234375, -5.36376953125, -4.753173828125, -4.142578125, -3.531982421875, -2.92138671875, -2.310791015625, -1.7001953125, -1.089599609375, -0.47900390625, 0.131591796875, 0.7421875, 1.352783203125, 1.96337890625, 2.573974609375, 3.1845703125, 3.795166015625, 4.40576171875, 5.016357421875, 5.626953125, 6.237548828125, 6.84814453125, 7.458740234375, 8.0693359375, 8.679931640625, 9.29052734375, 9.901123046875, 10.51171875, 11.122314453125, 11.73291015625, 12.343505859375, 12.9541015625, 13.564697265625, 14.17529296875, 14.785888671875, 15.396484375, 16.007080078125, 16.61767578125, 17.228271484375, 17.8388671875, 18.449462890625, 19.06005859375, 19.670654296875, 20.28125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 3.0, 8.0, 8.0, 12.0, 8.0, 16.0, 19.0, 22.0, 30.0, 30.0, 37.0, 45.0, 48.0, 47.0, 62.0, 50.0, 69.0, 2082.0, 45.0, 39.0, 44.0, 47.0, 38.0, 30.0, 35.0, 31.0, 24.0, 27.0, 19.0, 10.0, 16.0, 12.0, 4.0, 7.0, 11.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-156.625, -151.9375, -147.25, -142.5625, -137.875, -133.1875, -128.5, -123.8125, -119.125, -114.4375, -109.75, -105.0625, -100.375, -95.6875, -91.0, -86.3125, -81.625, -76.9375, -72.25, -67.5625, -62.875, -58.1875, -53.5, -48.8125, -44.125, -39.4375, -34.75, -30.0625, -25.375, -20.6875, -16.0, -11.3125, -6.625, -1.9375, 2.75, 7.4375, 12.125, 16.8125, 21.5, 26.1875, 30.875, 35.5625, 40.25, 44.9375, 49.625, 54.3125, 59.0, 63.6875, 68.375, 73.0625, 77.75, 82.4375, 87.125, 91.8125, 96.5, 101.1875, 105.875, 110.5625, 115.25, 119.9375, 124.625, 129.3125, 134.0, 138.6875, 143.375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 9.0, 5.0, 7.0, 9.0, 6.0, 9.0, 11.0, 17.0, 27.0, 37.0, 36.0, 56.0, 81.0, 131.0, 166.0, 262.0, 363.0, 579.0, 910.0, 1821.0, 5193.0, 24970.0, 228391.0, 2743818.0, 116558.0, 14604.0, 3704.0, 1468.0, 831.0, 483.0, 355.0, 241.0, 146.0, 109.0, 76.0, 48.0, 42.0, 21.0, 24.0, 18.0, 17.0, 7.0, 6.0, 8.0, 8.0, 8.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-28.484375, -27.63037109375, -26.7763671875, -25.92236328125, -25.068359375, -24.21435546875, -23.3603515625, -22.50634765625, -21.65234375, -20.79833984375, -19.9443359375, -19.09033203125, -18.236328125, -17.38232421875, -16.5283203125, -15.67431640625, -14.8203125, -13.96630859375, -13.1123046875, -12.25830078125, -11.404296875, -10.55029296875, -9.6962890625, -8.84228515625, -7.98828125, -7.13427734375, -6.2802734375, -5.42626953125, -4.572265625, -3.71826171875, -2.8642578125, -2.01025390625, -1.15625, -0.30224609375, 0.5517578125, 1.40576171875, 2.259765625, 3.11376953125, 3.9677734375, 4.82177734375, 5.67578125, 6.52978515625, 7.3837890625, 8.23779296875, 9.091796875, 9.94580078125, 10.7998046875, 11.65380859375, 12.5078125, 13.36181640625, 14.2158203125, 15.06982421875, 15.923828125, 16.77783203125, 17.6318359375, 18.48583984375, 19.33984375, 20.19384765625, 21.0478515625, 21.90185546875, 22.755859375, 23.60986328125, 24.4638671875, 25.31787109375, 26.171875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 29.0, 83.0, 180.0, 259.0, 217.0, 121.0, 37.0, 26.0, 14.0, 7.0, 1.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-159.02296447753906, -145.42848205566406, -131.83401489257812, -118.23953247070312, -104.64506530761719, -91.05058288574219, -77.45610809326172, -63.86163330078125, -50.26715850830078, -36.67268371582031, -23.07820701599121, -9.48373031616211, 4.110744476318359, 17.705223083496094, 31.299697875976562, 44.89417266845703, 58.4886474609375, 72.08312225341797, 85.67759704589844, 99.27207946777344, 112.86654663085938, 126.46102905273438, 140.05551147460938, 153.6499786376953, 167.24444580078125, 180.83892822265625, 194.4333953857422, 208.0278778076172, 221.62234497070312, 235.21682739257812, 248.81130981445312, 262.40576171875, 276.0002746582031, 289.5947570800781, 303.1892395019531, 316.78369140625, 330.378173828125, 343.97265625, 357.567138671875, 371.16162109375, 384.7560729980469, 398.3505554199219, 411.9450378417969, 425.53948974609375, 439.13397216796875, 452.72845458984375, 466.32293701171875, 479.91741943359375, 493.51190185546875, 507.10638427734375, 520.7008666992188, 534.2953491210938, 547.8898315429688, 561.4842529296875, 575.0787353515625, 588.6732177734375, 602.2677001953125, 615.8621826171875, 629.4566650390625, 643.0511474609375, 656.6456298828125, 670.2401123046875, 683.8345336914062, 697.4290161132812, 711.0234985351562]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 6.0, 5.0, 13.0, 9.0, 20.0, 19.0, 25.0, 22.0, 30.0, 36.0, 32.0, 28.0, 34.0, 50.0, 51.0, 55.0, 48.0, 60.0, 51.0, 38.0, 40.0, 47.0, 39.0, 35.0, 32.0, 29.0, 25.0, 23.0, 26.0, 20.0, 8.0, 13.0, 13.0, 6.0, 5.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-203.40155029296875, -197.100830078125, -190.80010986328125, -184.4993896484375, -178.1986541748047, -171.89793395996094, -165.5972137451172, -159.29649353027344, -152.99575805664062, -146.69503784179688, -140.39431762695312, -134.09359741210938, -127.79286193847656, -121.49214172363281, -115.19142150878906, -108.89070129394531, -102.58998107910156, -96.28926086425781, -89.98853302001953, -83.68781280517578, -77.3870849609375, -71.08636474609375, -64.78564453125, -58.484920501708984, -52.18419647216797, -45.88347244262695, -39.58274841308594, -33.28202819824219, -26.981304168701172, -20.680580139160156, -14.379859924316406, -8.07913589477539, -1.7784271240234375, 4.522295951843262, 10.823019027709961, 17.123741149902344, 23.42446517944336, 29.725189208984375, 36.025909423828125, 42.32663345336914, 48.627357482910156, 54.92808151245117, 61.22880554199219, 67.52952575683594, 73.83024597167969, 80.13097381591797, 86.43169403076172, 92.732421875, 99.03314208984375, 105.3338623046875, 111.63459014892578, 117.93531036376953, 124.23603820800781, 130.53675842285156, 136.8374786376953, 143.13819885253906, 149.43893432617188, 155.73965454101562, 162.04037475585938, 168.34109497070312, 174.64183044433594, 180.9425506591797, 187.24327087402344, 193.5439910888672, 199.84471130371094]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 9.0, 18.0, 17.0, 36.0, 46.0, 75.0, 116.0, 148.0, 236.0, 379.0, 525.0, 764.0, 1112.0, 1549.0, 2414.0, 3534.0, 5849.0, 1017226.0, 4817.0, 3088.0, 2148.0, 1416.0, 1010.0, 609.0, 438.0, 294.0, 220.0, 146.0, 92.0, 58.0, 63.0, 36.0, 21.0, 16.0, 7.0, 8.0, 5.0, 2.0, 0.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.07732009887695, -33.693241119384766, -32.30916213989258, -30.925085067749023, -29.54100799560547, -28.15692901611328, -26.772850036621094, -25.388771057128906, -24.00469398498535, -22.620615005493164, -21.23653793334961, -19.852458953857422, -18.468379974365234, -17.08430290222168, -15.700223922729492, -14.316145896911621, -12.93206787109375, -11.547989845275879, -10.163911819458008, -8.77983283996582, -7.395754814147949, -6.011676788330078, -4.627597808837891, -3.2435197830200195, -1.8594417572021484, -0.47536349296569824, 0.908714771270752, 2.2927932739257812, 3.6768712997436523, 5.060949325561523, 6.445028305053711, 7.829106330871582, 9.213188171386719, 10.59726619720459, 11.981344223022461, 13.365423202514648, 14.74950122833252, 16.13357925415039, 17.517658233642578, 18.901737213134766, 20.28581428527832, 21.669893264770508, 23.053970336914062, 24.43804931640625, 25.822128295898438, 27.206205368041992, 28.59028434753418, 29.974361419677734, 31.358440399169922, 32.74251937866211, 34.1265983581543, 35.51067352294922, 36.894752502441406, 38.278831481933594, 39.66291046142578, 41.04698944091797, 42.431068420410156, 43.815147399902344, 45.19922637939453, 46.58330535888672, 47.96738052368164, 49.35145950317383, 50.735538482666016, 52.1196174621582, 53.503692626953125]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 13.0, 32.0, 70.0, 94.0, 168.0, 34792.0, 51429804.0, 197.0, 55.0, 33.0, 29.0, 38.0, 27.0, 26.0, 19.0, 8.0, 9.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8377.4619140625, -8042.63916015625, -7707.81640625, -7372.99365234375, -7038.1708984375, -6703.34765625, -6368.52490234375, -6033.7021484375, -5698.87939453125, -5364.056640625, -5029.23388671875, -4694.4111328125, -4359.587890625, -4024.765380859375, -3689.9423828125, -3355.11962890625, -3020.296875, -2685.47412109375, -2350.6513671875, -2015.828369140625, -1681.005615234375, -1346.182861328125, -1011.3599853515625, -676.537109375, -341.71435546875, -6.89154052734375, 327.9312744140625, 662.7540893554688, 997.576904296875, 1332.399658203125, 1667.2225341796875, 2002.04541015625, 2336.8671875, 2671.68994140625, 3006.5126953125, 3341.335693359375, 3676.158447265625, 4010.981201171875, 4345.80419921875, 4680.626953125, 5015.44970703125, 5350.2724609375, 5685.09521484375, 6019.91796875, 6354.7412109375, 6689.5634765625, 7024.38671875, 7359.20947265625, 7694.0322265625, 8028.85498046875, 8363.677734375, 8698.5009765625, 9033.3232421875, 9368.146484375, 9702.96875, 10037.7919921875, 10372.615234375, 10707.4384765625, 11042.2607421875, 11377.083984375, 11711.90625, 12046.7294921875, 12381.5517578125, 12716.375, 13051.197265625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 5.0, 4.0, 11.0, 13.0, 25.0, 37.0, 63.0, 93.0, 124.0, 199.0, 235.0, 366.0, 603.0, 819.0, 1173.0, 1640.0, 2453.0, 3507.0, 5422.0, 7626.0, 11444.0, 16883.0, 25605.0, 37473.0, 58535.0, 88931.0, 142680.0, 243272.0, 587873.0, 3854257.0, 560189.0, 236408.0, 141051.0, 89528.0, 58309.0, 37847.0, 24960.0, 16963.0, 11161.0, 7599.0, 4988.0, 3421.0, 2355.0, 1586.0, 1229.0, 723.0, 545.0, 369.0, 275.0, 192.0, 121.0, 80.0, 64.0, 35.0, 28.0, 24.0, 5.0, 12.0, 5.0, 6.0], "bins": [-10.4921875, -10.1788330078125, -9.865478515625, -9.5521240234375, -9.23876953125, -8.9254150390625, -8.612060546875, -8.2987060546875, -7.9853515625, -7.6719970703125, -7.358642578125, -7.0452880859375, -6.73193359375, -6.4185791015625, -6.105224609375, -5.7918701171875, -5.478515625, -5.1651611328125, -4.851806640625, -4.5384521484375, -4.22509765625, -3.9117431640625, -3.598388671875, -3.2850341796875, -2.9716796875, -2.6583251953125, -2.344970703125, -2.0316162109375, -1.71826171875, -1.4049072265625, -1.091552734375, -0.7781982421875, -0.46484375, -0.1514892578125, 0.161865234375, 0.4752197265625, 0.78857421875, 1.1019287109375, 1.415283203125, 1.7286376953125, 2.0419921875, 2.3553466796875, 2.668701171875, 2.9820556640625, 3.29541015625, 3.6087646484375, 3.922119140625, 4.2354736328125, 4.548828125, 4.8621826171875, 5.175537109375, 5.4888916015625, 5.80224609375, 6.1156005859375, 6.428955078125, 6.7423095703125, 7.0556640625, 7.3690185546875, 7.682373046875, 7.9957275390625, 8.30908203125, 8.6224365234375, 8.935791015625, 9.2491455078125, 9.5625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 12.0, 13.0, 9.0, 10.0, 18.0, 12.0, 10.0, 24.0, 27.0, 18.0, 21.0, 25.0, 25.0, 27.0, 35.0, 46.0, 52.0, 101.0, 209.0, 598.0, 173.0, 110.0, 56.0, 32.0, 29.0, 38.0, 28.0, 35.0, 41.0, 27.0, 28.0, 20.0, 17.0, 20.0, 8.0, 7.0, 14.0, 8.0, 10.0, 2.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.265625, -17.6669921875, -17.068359375, -16.4697265625, -15.87109375, -15.2724609375, -14.673828125, -14.0751953125, -13.4765625, -12.8779296875, -12.279296875, -11.6806640625, -11.08203125, -10.4833984375, -9.884765625, -9.2861328125, -8.6875, -8.0888671875, -7.490234375, -6.8916015625, -6.29296875, -5.6943359375, -5.095703125, -4.4970703125, -3.8984375, -3.2998046875, -2.701171875, -2.1025390625, -1.50390625, -0.9052734375, -0.306640625, 0.2919921875, 0.890625, 1.4892578125, 2.087890625, 2.6865234375, 3.28515625, 3.8837890625, 4.482421875, 5.0810546875, 5.6796875, 6.2783203125, 6.876953125, 7.4755859375, 8.07421875, 8.6728515625, 9.271484375, 9.8701171875, 10.46875, 11.0673828125, 11.666015625, 12.2646484375, 12.86328125, 13.4619140625, 14.060546875, 14.6591796875, 15.2578125, 15.8564453125, 16.455078125, 17.0537109375, 17.65234375, 18.2509765625, 18.849609375, 19.4482421875, 20.046875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 6.0, 3.0, 15.0, 12.0, 15.0, 21.0, 47.0, 53.0, 93.0, 149.0, 197.0, 286.0, 445.0, 615.0, 974.0, 1484.0, 2355.0, 3606.0, 5354.0, 8402.0, 12873.0, 19991.0, 31225.0, 50276.0, 83745.0, 144959.0, 282325.0, 869526.0, 3814000.0, 463680.0, 203623.0, 112426.0, 65549.0, 40191.0, 25679.0, 16676.0, 10613.0, 6868.0, 4533.0, 2945.0, 1902.0, 1256.0, 793.0, 576.0, 325.0, 236.0, 167.0, 152.0, 57.0, 38.0, 37.0, 22.0, 15.0, 17.0, 7.0, 1.0, 8.0, 0.0, 0.0, 6.0], "bins": [-11.3984375, -11.0452880859375, -10.692138671875, -10.3389892578125, -9.98583984375, -9.6326904296875, -9.279541015625, -8.9263916015625, -8.5732421875, -8.2200927734375, -7.866943359375, -7.5137939453125, -7.16064453125, -6.8074951171875, -6.454345703125, -6.1011962890625, -5.748046875, -5.3948974609375, -5.041748046875, -4.6885986328125, -4.33544921875, -3.9822998046875, -3.629150390625, -3.2760009765625, -2.9228515625, -2.5697021484375, -2.216552734375, -1.8634033203125, -1.51025390625, -1.1571044921875, -0.803955078125, -0.4508056640625, -0.09765625, 0.2554931640625, 0.608642578125, 0.9617919921875, 1.31494140625, 1.6680908203125, 2.021240234375, 2.3743896484375, 2.7275390625, 3.0806884765625, 3.433837890625, 3.7869873046875, 4.14013671875, 4.4932861328125, 4.846435546875, 5.1995849609375, 5.552734375, 5.9058837890625, 6.259033203125, 6.6121826171875, 6.96533203125, 7.3184814453125, 7.671630859375, 8.0247802734375, 8.3779296875, 8.7310791015625, 9.084228515625, 9.4373779296875, 9.79052734375, 10.1436767578125, 10.496826171875, 10.8499755859375, 11.203125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 10.0, 9.0, 7.0, 8.0, 12.0, 6.0, 22.0, 11.0, 18.0, 14.0, 23.0, 18.0, 25.0, 30.0, 41.0, 31.0, 41.0, 71.0, 88.0, 162.0, 418.0, 356.0, 130.0, 67.0, 49.0, 54.0, 39.0, 37.0, 27.0, 18.0, 34.0, 24.0, 23.0, 23.0, 10.0, 11.0, 16.0, 10.0, 8.0, 8.0, 6.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.6875, -15.2254638671875, -14.763427734375, -14.3013916015625, -13.83935546875, -13.3773193359375, -12.915283203125, -12.4532470703125, -11.9912109375, -11.5291748046875, -11.067138671875, -10.6051025390625, -10.14306640625, -9.6810302734375, -9.218994140625, -8.7569580078125, -8.294921875, -7.8328857421875, -7.370849609375, -6.9088134765625, -6.44677734375, -5.9847412109375, -5.522705078125, -5.0606689453125, -4.5986328125, -4.1365966796875, -3.674560546875, -3.2125244140625, -2.75048828125, -2.2884521484375, -1.826416015625, -1.3643798828125, -0.90234375, -0.4403076171875, 0.021728515625, 0.4837646484375, 0.94580078125, 1.4078369140625, 1.869873046875, 2.3319091796875, 2.7939453125, 3.2559814453125, 3.718017578125, 4.1800537109375, 4.64208984375, 5.1041259765625, 5.566162109375, 6.0281982421875, 6.490234375, 6.9522705078125, 7.414306640625, 7.8763427734375, 8.33837890625, 8.8004150390625, 9.262451171875, 9.7244873046875, 10.1865234375, 10.6485595703125, 11.110595703125, 11.5726318359375, 12.03466796875, 12.4967041015625, 12.958740234375, 13.4207763671875, 13.8828125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 8.0, 6.0, 3.0, 24.0, 12.0, 8.0, 25.0, 13.0, 34.0, 55.0, 62.0, 85.0, 81.0, 90.0, 206.0, 266.0, 317.0, 410.0, 441.0, 669.0, 1008.0, 1212.0, 1849.0, 3122.0, 5180.0, 10196.0, 20968.0, 56548.0, 487228.0, 5591005.0, 61677.0, 22469.0, 10323.0, 5459.0, 3325.0, 2020.0, 1369.0, 894.0, 718.0, 484.0, 382.0, 246.0, 158.0, 177.0, 152.0, 110.0, 70.0, 44.0, 23.0, 62.0, 48.0, 41.0, 26.0, 14.0, 15.0, 0.0, 6.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-29.9375, -28.97265625, -28.0078125, -27.04296875, -26.078125, -25.11328125, -24.1484375, -23.18359375, -22.21875, -21.25390625, -20.2890625, -19.32421875, -18.359375, -17.39453125, -16.4296875, -15.46484375, -14.5, -13.53515625, -12.5703125, -11.60546875, -10.640625, -9.67578125, -8.7109375, -7.74609375, -6.78125, -5.81640625, -4.8515625, -3.88671875, -2.921875, -1.95703125, -0.9921875, -0.02734375, 0.9375, 1.90234375, 2.8671875, 3.83203125, 4.796875, 5.76171875, 6.7265625, 7.69140625, 8.65625, 9.62109375, 10.5859375, 11.55078125, 12.515625, 13.48046875, 14.4453125, 15.41015625, 16.375, 17.33984375, 18.3046875, 19.26953125, 20.234375, 21.19921875, 22.1640625, 23.12890625, 24.09375, 25.05859375, 26.0234375, 26.98828125, 27.953125, 28.91796875, 29.8828125, 30.84765625, 31.8125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 1.0, 5.0, 5.0, 6.0, 11.0, 9.0, 4.0, 7.0, 17.0, 15.0, 22.0, 21.0, 23.0, 29.0, 24.0, 37.0, 42.0, 52.0, 62.0, 106.0, 161.0, 300.0, 396.0, 151.0, 64.0, 60.0, 59.0, 35.0, 33.0, 31.0, 30.0, 37.0, 26.0, 16.0, 16.0, 23.0, 18.0, 13.0, 16.0, 6.0, 4.0, 5.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3359375, -10.0030517578125, -9.670166015625, -9.3372802734375, -9.00439453125, -8.6715087890625, -8.338623046875, -8.0057373046875, -7.6728515625, -7.3399658203125, -7.007080078125, -6.6741943359375, -6.34130859375, -6.0084228515625, -5.675537109375, -5.3426513671875, -5.009765625, -4.6768798828125, -4.343994140625, -4.0111083984375, -3.67822265625, -3.3453369140625, -3.012451171875, -2.6795654296875, -2.3466796875, -2.0137939453125, -1.680908203125, -1.3480224609375, -1.01513671875, -0.6822509765625, -0.349365234375, -0.0164794921875, 0.31640625, 0.6492919921875, 0.982177734375, 1.3150634765625, 1.64794921875, 1.9808349609375, 2.313720703125, 2.6466064453125, 2.9794921875, 3.3123779296875, 3.645263671875, 3.9781494140625, 4.31103515625, 4.6439208984375, 4.976806640625, 5.3096923828125, 5.642578125, 5.9754638671875, 6.308349609375, 6.6412353515625, 6.97412109375, 7.3070068359375, 7.639892578125, 7.9727783203125, 8.3056640625, 8.6385498046875, 8.971435546875, 9.3043212890625, 9.63720703125, 9.9700927734375, 10.302978515625, 10.6358642578125, 10.96875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 0.0, 3.0, 17.0, 22.0, 87.0, 226.0, 459.0, 111.0, 44.0, 17.0, 11.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-113.41607666015625, -111.28523254394531, -109.15438842773438, -107.02354431152344, -104.8927001953125, -102.76184844970703, -100.6310043334961, -98.50016021728516, -96.36931610107422, -94.23847198486328, -92.10762786865234, -89.9767837524414, -87.84593200683594, -85.715087890625, -83.58424377441406, -81.45339965820312, -79.32255554199219, -77.19171142578125, -75.06086730957031, -72.93002319335938, -70.79917907714844, -68.66832733154297, -66.53748321533203, -64.4066390991211, -62.275794982910156, -60.14495086669922, -58.01410675048828, -55.88325881958008, -53.75241470336914, -51.6215705871582, -49.49072265625, -47.35987854003906, -45.229042053222656, -43.09819793701172, -40.96735382080078, -38.83650588989258, -36.70566177368164, -34.5748176574707, -32.4439697265625, -30.313125610351562, -28.182281494140625, -26.051437377929688, -23.920591354370117, -21.789745330810547, -19.65890121459961, -17.528057098388672, -15.397211074829102, -13.266366004943848, -11.135520935058594, -9.00467586517334, -6.873830795288086, -4.742985725402832, -2.612140655517578, -0.4812955856323242, 1.6495494842529297, 3.7803945541381836, 5.9112396240234375, 8.042084693908691, 10.172929763793945, 12.3037748336792, 14.434619903564453, 16.56546401977539, 18.69631004333496, 20.82715606689453, 22.95800018310547]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 4.0, 7.0, 8.0, 13.0, 10.0, 9.0, 7.0, 18.0, 15.0, 19.0, 20.0, 24.0, 27.0, 40.0, 39.0, 38.0, 41.0, 35.0, 45.0, 48.0, 49.0, 46.0, 42.0, 29.0, 46.0, 48.0, 34.0, 36.0, 37.0, 27.0, 23.0, 19.0, 21.0, 16.0, 15.0, 7.0, 7.0, 14.0, 4.0, 6.0, 1.0, 6.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.135906219482422, -17.60097312927246, -17.0660400390625, -16.53110694885254, -15.996174812316895, -15.461241722106934, -14.926309585571289, -14.391376495361328, -13.856443405151367, -13.321510314941406, -12.786577224731445, -12.2516450881958, -11.71671199798584, -11.181778907775879, -10.646846771240234, -10.111913681030273, -9.576980590820312, -9.042047500610352, -8.50711441040039, -7.972182273864746, -7.437249183654785, -6.902316093444824, -6.3673834800720215, -5.832450866699219, -5.297517776489258, -4.762584686279297, -4.227652072906494, -3.6927192211151123, -3.1577863693237305, -2.6228535175323486, -2.087920665740967, -1.552987813949585, -1.0180530548095703, -0.4831202030181885, 0.05181264877319336, 0.5867455005645752, 1.121678352355957, 1.6566112041473389, 2.1915440559387207, 2.7264769077301025, 3.2614097595214844, 3.796342611312866, 4.331275463104248, 4.866208076477051, 5.401141166687012, 5.936074256896973, 6.471006870269775, 7.005939483642578, 7.540872573852539, 8.0758056640625, 8.610738754272461, 9.145670890808105, 9.680603981018066, 10.215537071228027, 10.750469207763672, 11.285402297973633, 11.820335388183594, 12.355268478393555, 12.890201568603516, 13.42513370513916, 13.960066795349121, 14.494999885559082, 15.029932022094727, 15.564865112304688, 16.09979820251465]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 1.0, 4.0, 3.0, 7.0, 12.0, 14.0, 15.0, 25.0, 36.0, 53.0, 68.0, 124.0, 172.0, 280.0, 440.0, 712.0, 1191.0, 2115.0, 3895.0, 8197.0, 20380.0, 4058996.0, 74234.0, 12005.0, 5033.0, 2470.0, 1368.0, 791.0, 499.0, 359.0, 226.0, 143.0, 104.0, 85.0, 48.0, 39.0, 43.0, 24.0, 16.0, 10.0, 10.0, 12.0, 7.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0311431884765625, -0.02988886833190918, -0.02863454818725586, -0.02738022804260254, -0.02612590789794922, -0.0248715877532959, -0.023617267608642578, -0.022362947463989258, -0.021108627319335938, -0.019854307174682617, -0.018599987030029297, -0.017345666885375977, -0.016091346740722656, -0.014837026596069336, -0.013582706451416016, -0.012328386306762695, -0.011074066162109375, -0.009819746017456055, -0.008565425872802734, -0.007311105728149414, -0.006056785583496094, -0.0048024654388427734, -0.003548145294189453, -0.002293825149536133, -0.0010395050048828125, 0.0002148151397705078, 0.0014691352844238281, 0.0027234554290771484, 0.003977775573730469, 0.005232095718383789, 0.006486415863037109, 0.00774073600769043, 0.00899505615234375, 0.01024937629699707, 0.01150369644165039, 0.012758016586303711, 0.014012336730957031, 0.015266656875610352, 0.016520977020263672, 0.017775297164916992, 0.019029617309570312, 0.020283937454223633, 0.021538257598876953, 0.022792577743530273, 0.024046897888183594, 0.025301218032836914, 0.026555538177490234, 0.027809858322143555, 0.029064178466796875, 0.030318498611450195, 0.031572818756103516, 0.032827138900756836, 0.034081459045410156, 0.03533577919006348, 0.0365900993347168, 0.03784441947937012, 0.03909873962402344, 0.04035305976867676, 0.04160737991333008, 0.0428617000579834, 0.04411602020263672, 0.04537034034729004, 0.04662466049194336, 0.04787898063659668, 0.04913330078125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 1.0, 3.0, 7.0, 7.0, 2.0, 13.0, 7.0, 10.0, 9.0, 19.0, 14.0, 112.0, 662.0, 44.0, 11.0, 14.0, 8.0, 10.0, 5.0, 6.0, 7.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019044876098632812, -0.0018287450075149536, -0.001753002405166626, -0.0016772598028182983, -0.0016015172004699707, -0.001525774598121643, -0.0014500319957733154, -0.0013742893934249878, -0.0012985467910766602, -0.0012228041887283325, -0.0011470615863800049, -0.0010713189840316772, -0.0009955763816833496, -0.000919833779335022, -0.0008440911769866943, -0.0007683485746383667, -0.0006926059722900391, -0.0006168633699417114, -0.0005411207675933838, -0.00046537816524505615, -0.0003896355628967285, -0.0003138929605484009, -0.00023815035820007324, -0.0001624077558517456, -8.666515350341797e-05, -1.0922551155090332e-05, 6.48200511932373e-05, 0.00014056265354156494, 0.00021630525588989258, 0.0002920478582382202, 0.00036779046058654785, 0.0004435330629348755, 0.0005192756652832031, 0.0005950182676315308, 0.0006707608699798584, 0.000746503472328186, 0.0008222460746765137, 0.0008979886770248413, 0.0009737312793731689, 0.0010494738817214966, 0.0011252164840698242, 0.0012009590864181519, 0.0012767016887664795, 0.0013524442911148071, 0.0014281868934631348, 0.0015039294958114624, 0.00157967209815979, 0.0016554147005081177, 0.0017311573028564453, 0.001806899905204773, 0.0018826425075531006, 0.0019583851099014282, 0.002034127712249756, 0.0021098703145980835, 0.002185612916946411, 0.0022613555192947388, 0.0023370981216430664, 0.002412840723991394, 0.0024885833263397217, 0.0025643259286880493, 0.002640068531036377, 0.0027158111333847046, 0.0027915537357330322, 0.00286729633808136, 0.0029430389404296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 5.0, 6.0, 12.0, 18.0, 12.0, 42.0, 51.0, 41.0, 74.0, 113.0, 155.0, 248.0, 365.0, 586.0, 1108.0, 2006.0, 4913.0, 17302.0, 202003.0, 3916176.0, 35511.0, 7264.0, 2856.0, 1328.0, 784.0, 394.0, 266.0, 184.0, 134.0, 83.0, 60.0, 49.0, 30.0, 32.0, 24.0, 9.0, 10.0, 8.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050994873046875, -0.04930591583251953, -0.04761695861816406, -0.045928001403808594, -0.044239044189453125, -0.042550086975097656, -0.04086112976074219, -0.03917217254638672, -0.03748321533203125, -0.03579425811767578, -0.03410530090332031, -0.032416343688964844, -0.030727386474609375, -0.029038429260253906, -0.027349472045898438, -0.02566051483154297, -0.0239715576171875, -0.02228260040283203, -0.020593643188476562, -0.018904685974121094, -0.017215728759765625, -0.015526771545410156, -0.013837814331054688, -0.012148857116699219, -0.01045989990234375, -0.008770942687988281, -0.0070819854736328125, -0.005393028259277344, -0.003704071044921875, -0.0020151138305664062, -0.0003261566162109375, 0.0013628005981445312, 0.0030517578125, 0.004740715026855469, 0.0064296722412109375, 0.008118629455566406, 0.009807586669921875, 0.011496543884277344, 0.013185501098632812, 0.014874458312988281, 0.01656341552734375, 0.01825237274169922, 0.019941329956054688, 0.021630287170410156, 0.023319244384765625, 0.025008201599121094, 0.026697158813476562, 0.02838611602783203, 0.0300750732421875, 0.03176403045654297, 0.03345298767089844, 0.035141944885253906, 0.036830902099609375, 0.038519859313964844, 0.04020881652832031, 0.04189777374267578, 0.04358673095703125, 0.04527568817138672, 0.04696464538574219, 0.048653602600097656, 0.050342559814453125, 0.052031517028808594, 0.05372047424316406, 0.05540943145751953, 0.057098388671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 3.0, 6.0, 6.0, 12.0, 13.0, 13.0, 6.0, 17.0, 10.0, 22.0, 35.0, 31.0, 36.0, 44.0, 54.0, 75.0, 123.0, 365.0, 2483.0, 280.0, 84.0, 64.0, 38.0, 44.0, 31.0, 30.0, 30.0, 24.0, 18.0, 13.0, 13.0, 8.0, 10.0, 11.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004741668701171875, -0.004574477672576904, -0.004407286643981934, -0.004240095615386963, -0.004072904586791992, -0.0039057135581970215, -0.0037385225296020508, -0.00357133150100708, -0.0034041404724121094, -0.0032369494438171387, -0.003069758415222168, -0.0029025673866271973, -0.0027353763580322266, -0.002568185329437256, -0.002400994300842285, -0.0022338032722473145, -0.0020666122436523438, -0.001899421215057373, -0.0017322301864624023, -0.0015650391578674316, -0.001397848129272461, -0.0012306571006774902, -0.0010634660720825195, -0.0008962750434875488, -0.0007290840148925781, -0.0005618929862976074, -0.0003947019577026367, -0.00022751092910766602, -6.031990051269531e-05, 0.00010687112808227539, 0.0002740621566772461, 0.0004412531852722168, 0.0006084442138671875, 0.0007756352424621582, 0.0009428262710571289, 0.0011100172996520996, 0.0012772083282470703, 0.001444399356842041, 0.0016115903854370117, 0.0017787814140319824, 0.0019459724426269531, 0.002113163471221924, 0.0022803544998168945, 0.0024475455284118652, 0.002614736557006836, 0.0027819275856018066, 0.0029491186141967773, 0.003116309642791748, 0.0032835006713867188, 0.0034506916999816895, 0.00361788272857666, 0.003785073757171631, 0.0039522647857666016, 0.004119455814361572, 0.004286646842956543, 0.004453837871551514, 0.004621028900146484, 0.004788219928741455, 0.004955410957336426, 0.0051226019859313965, 0.005289793014526367, 0.005456984043121338, 0.005624175071716309, 0.005791366100311279, 0.00595855712890625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 10.0, 15.0, 12.0, 47.0, 175.0, 570.0, 100.0, 42.0, 15.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.11550533771514893, -0.112838976085186, -0.11017262190580368, -0.10750626027584076, -0.10483989864587784, -0.10217353701591492, -0.09950718283653259, -0.09684082120656967, -0.09417445957660675, -0.09150809794664383, -0.0888417437672615, -0.08617538213729858, -0.08350902050733566, -0.08084265887737274, -0.07817630469799042, -0.0755099430680275, -0.07284358888864517, -0.07017722725868225, -0.06751087307929993, -0.064844511449337, -0.062178149819374084, -0.05951179191470146, -0.05684543401002884, -0.05417907238006592, -0.051512714475393295, -0.04884635657072067, -0.04617999494075775, -0.04351363703608513, -0.040847279131412506, -0.038180917501449585, -0.03551455959677696, -0.03284820169210434, -0.030181847512722015, -0.027515487745404243, -0.02484912797808647, -0.02218277007341385, -0.019516410306096077, -0.016850050538778305, -0.014183692634105682, -0.01151733286678791, -0.008850973099470139, -0.006184613797813654, -0.0035182544961571693, -0.000851895660161972, 0.0018144641071557999, 0.004480823874473572, 0.0071471817791461945, 0.009813541546463966, 0.012479901313781738, 0.01514626108109951, 0.017812620848417282, 0.020478978753089905, 0.023145338520407677, 0.02581169828772545, 0.02847805619239807, 0.031144415959715843, 0.033810775727033615, 0.03647713363170624, 0.03914349526166916, 0.04180985316634178, 0.044476211071014404, 0.047142572700977325, 0.04980893060564995, 0.05247528851032257, 0.05514165014028549]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 11.0, 11.0, 11.0, 14.0, 11.0, 25.0, 28.0, 30.0, 45.0, 50.0, 52.0, 57.0, 50.0, 73.0, 67.0, 61.0, 60.0, 52.0, 52.0, 45.0, 28.0, 41.0, 30.0, 17.0, 14.0, 8.0, 13.0, 7.0, 5.0, 3.0, 6.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.022283852100372314, -0.021612493321299553, -0.02094113454222679, -0.02026977576315403, -0.01959841698408127, -0.018927058205008507, -0.018255699425935745, -0.017584340646862984, -0.016912981867790222, -0.01624162308871746, -0.015570264309644699, -0.014898905530571938, -0.014227546751499176, -0.013556187972426414, -0.012884829193353653, -0.012213470414280891, -0.01154211163520813, -0.010870752856135368, -0.010199394077062607, -0.009528035297989845, -0.008856676518917084, -0.008185317739844322, -0.007513958960771561, -0.006842600181698799, -0.006171241402626038, -0.005499882623553276, -0.0048285238444805145, -0.004157165065407753, -0.0034858062863349915, -0.00281444750726223, -0.0021430887281894684, -0.0014717299491167068, -0.0008003711700439453, -0.00012901239097118378, 0.0005423463881015778, 0.0012137051671743393, 0.0018850639462471008, 0.0025564227253198624, 0.003227781504392624, 0.0038991402834653854, 0.004570499062538147, 0.0052418578416109085, 0.00591321662068367, 0.006584575399756432, 0.007255934178829193, 0.007927292957901955, 0.008598651736974716, 0.009270010516047478, 0.00994136929512024, 0.010612728074193, 0.011284086853265762, 0.011955445632338524, 0.012626804411411285, 0.013298163190484047, 0.013969521969556808, 0.01464088074862957, 0.015312239527702332, 0.015983598306775093, 0.016654957085847855, 0.017326315864920616, 0.017997674643993378, 0.01866903342306614, 0.0193403922021389, 0.020011750981211662, 0.020683109760284424]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 10.0, 22.0, 10.0, 37.0, 33.0, 53.0, 89.0, 101.0, 160.0, 217.0, 362.0, 554.0, 847.0, 1392.0, 2352.0, 4054.0, 7583.0, 16275.0, 59601.0, 904031.0, 26712.0, 10831.0, 5423.0, 2910.0, 1756.0, 1051.0, 691.0, 408.0, 304.0, 183.0, 166.0, 103.0, 58.0, 53.0, 31.0, 18.0, 25.0, 14.0, 6.0, 6.0, 9.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.03564453125, -0.034539222717285156, -0.03343391418457031, -0.03232860565185547, -0.031223297119140625, -0.03011798858642578, -0.029012680053710938, -0.027907371520996094, -0.02680206298828125, -0.025696754455566406, -0.024591445922851562, -0.02348613739013672, -0.022380828857421875, -0.02127552032470703, -0.020170211791992188, -0.019064903259277344, -0.0179595947265625, -0.016854286193847656, -0.015748977661132812, -0.014643669128417969, -0.013538360595703125, -0.012433052062988281, -0.011327743530273438, -0.010222434997558594, -0.00911712646484375, -0.008011817932128906, -0.0069065093994140625, -0.005801200866699219, -0.004695892333984375, -0.0035905838012695312, -0.0024852752685546875, -0.0013799667358398438, -0.000274658203125, 0.0008306503295898438, 0.0019359588623046875, 0.0030412673950195312, 0.004146575927734375, 0.005251884460449219, 0.0063571929931640625, 0.007462501525878906, 0.00856781005859375, 0.009673118591308594, 0.010778427124023438, 0.011883735656738281, 0.012989044189453125, 0.014094352722167969, 0.015199661254882812, 0.016304969787597656, 0.0174102783203125, 0.018515586853027344, 0.019620895385742188, 0.02072620391845703, 0.021831512451171875, 0.02293682098388672, 0.024042129516601562, 0.025147438049316406, 0.02625274658203125, 0.027358055114746094, 0.028463363647460938, 0.02956867218017578, 0.030673980712890625, 0.03177928924560547, 0.03288459777832031, 0.033989906311035156, 0.03509521484375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 4.0, 3.0, 6.0, 0.0, 6.0, 6.0, 6.0, 5.0, 10.0, 9.0, 7.0, 15.0, 18.0, 13.0, 528.0, 267.0, 23.0, 12.0, 9.0, 11.0, 7.0, 7.0, 5.0, 7.0, 5.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018768310546875, -0.0018014013767242432, -0.0017259716987609863, -0.0016505420207977295, -0.0015751123428344727, -0.0014996826648712158, -0.001424252986907959, -0.0013488233089447021, -0.0012733936309814453, -0.0011979639530181885, -0.0011225342750549316, -0.0010471045970916748, -0.000971674919128418, -0.0008962452411651611, -0.0008208155632019043, -0.0007453858852386475, -0.0006699562072753906, -0.0005945265293121338, -0.000519096851348877, -0.0004436671733856201, -0.0003682374954223633, -0.00029280781745910645, -0.0002173781394958496, -0.00014194846153259277, -6.651878356933594e-05, 8.910894393920898e-06, 8.434057235717773e-05, 0.00015977025032043457, 0.0002351999282836914, 0.00031062960624694824, 0.0003860592842102051, 0.0004614889621734619, 0.0005369186401367188, 0.0006123483180999756, 0.0006877779960632324, 0.0007632076740264893, 0.0008386373519897461, 0.0009140670299530029, 0.0009894967079162598, 0.0010649263858795166, 0.0011403560638427734, 0.0012157857418060303, 0.0012912154197692871, 0.001366645097732544, 0.0014420747756958008, 0.0015175044536590576, 0.0015929341316223145, 0.0016683638095855713, 0.0017437934875488281, 0.001819223165512085, 0.0018946528434753418, 0.0019700825214385986, 0.0020455121994018555, 0.0021209418773651123, 0.002196371555328369, 0.002271801233291626, 0.002347230911254883, 0.0024226605892181396, 0.0024980902671813965, 0.0025735199451446533, 0.00264894962310791, 0.002724379301071167, 0.002799808979034424, 0.0028752386569976807, 0.0029506683349609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 10.0, 11.0, 11.0, 22.0, 22.0, 31.0, 54.0, 52.0, 81.0, 106.0, 124.0, 176.0, 253.0, 337.0, 554.0, 819.0, 1219.0, 2172.0, 3998.0, 8719.0, 28503.0, 586766.0, 370958.0, 25511.0, 8122.0, 3856.0, 2170.0, 1294.0, 758.0, 515.0, 388.0, 265.0, 166.0, 123.0, 94.0, 79.0, 58.0, 36.0, 26.0, 18.0, 24.0, 13.0, 9.0, 6.0, 8.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.03948974609375, -0.03829193115234375, -0.0370941162109375, -0.03589630126953125, -0.034698486328125, -0.03350067138671875, -0.0323028564453125, -0.03110504150390625, -0.0299072265625, -0.02870941162109375, -0.0275115966796875, -0.02631378173828125, -0.025115966796875, -0.02391815185546875, -0.0227203369140625, -0.02152252197265625, -0.02032470703125, -0.01912689208984375, -0.0179290771484375, -0.01673126220703125, -0.015533447265625, -0.01433563232421875, -0.0131378173828125, -0.01194000244140625, -0.0107421875, -0.00954437255859375, -0.0083465576171875, -0.00714874267578125, -0.005950927734375, -0.00475311279296875, -0.0035552978515625, -0.00235748291015625, -0.00115966796875, 3.814697265625e-05, 0.0012359619140625, 0.00243377685546875, 0.003631591796875, 0.00482940673828125, 0.0060272216796875, 0.00722503662109375, 0.0084228515625, 0.00962066650390625, 0.0108184814453125, 0.01201629638671875, 0.013214111328125, 0.01441192626953125, 0.0156097412109375, 0.01680755615234375, 0.01800537109375, 0.01920318603515625, 0.0204010009765625, 0.02159881591796875, 0.022796630859375, 0.02399444580078125, 0.0251922607421875, 0.02639007568359375, 0.027587890625, 0.02878570556640625, 0.0299835205078125, 0.03118133544921875, 0.032379150390625, 0.03357696533203125, 0.0347747802734375, 0.03597259521484375, 0.03717041015625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 9.0, 7.0, 7.0, 6.0, 8.0, 4.0, 14.0, 15.0, 13.0, 20.0, 22.0, 15.0, 24.0, 23.0, 37.0, 42.0, 32.0, 34.0, 35.0, 35.0, 41.0, 46.0, 31.0, 36.0, 37.0, 27.0, 35.0, 29.0, 34.0, 29.0, 29.0, 30.0, 23.0, 20.0, 26.0, 15.0, 15.0, 16.0, 12.0, 12.0, 9.0, 12.0, 6.0, 5.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.00794219970703125, -0.00770038366317749, -0.0074585676193237305, -0.007216751575469971, -0.006974935531616211, -0.006733119487762451, -0.006491303443908691, -0.006249487400054932, -0.006007671356201172, -0.005765855312347412, -0.005524039268493652, -0.005282223224639893, -0.005040407180786133, -0.004798591136932373, -0.004556775093078613, -0.0043149590492248535, -0.004073143005371094, -0.003831326961517334, -0.0035895109176635742, -0.0033476948738098145, -0.0031058788299560547, -0.002864062786102295, -0.002622246742248535, -0.0023804306983947754, -0.0021386146545410156, -0.0018967986106872559, -0.001654982566833496, -0.0014131665229797363, -0.0011713504791259766, -0.0009295344352722168, -0.000687718391418457, -0.00044590234756469727, -0.0002040863037109375, 3.7729740142822266e-05, 0.00027954578399658203, 0.0005213618278503418, 0.0007631778717041016, 0.0010049939155578613, 0.001246809959411621, 0.0014886260032653809, 0.0017304420471191406, 0.0019722580909729004, 0.00221407413482666, 0.00245589017868042, 0.0026977062225341797, 0.0029395222663879395, 0.0031813383102416992, 0.003423154354095459, 0.0036649703979492188, 0.0039067864418029785, 0.004148602485656738, 0.004390418529510498, 0.004632234573364258, 0.004874050617218018, 0.005115866661071777, 0.005357682704925537, 0.005599498748779297, 0.005841314792633057, 0.006083130836486816, 0.006324946880340576, 0.006566762924194336, 0.006808578968048096, 0.0070503950119018555, 0.007292211055755615, 0.007534027099609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 9.0, 7.0, 6.0, 12.0, 16.0, 19.0, 34.0, 80.0, 348.0, 3697.0, 1034520.0, 8982.0, 589.0, 108.0, 31.0, 17.0, 18.0, 16.0, 10.0, 6.0, 6.0, 2.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04913330078125, -0.04775428771972656, -0.046375274658203125, -0.04499626159667969, -0.04361724853515625, -0.04223823547363281, -0.040859222412109375, -0.03948020935058594, -0.0381011962890625, -0.03672218322753906, -0.035343170166015625, -0.03396415710449219, -0.03258514404296875, -0.031206130981445312, -0.029827117919921875, -0.028448104858398438, -0.027069091796875, -0.025690078735351562, -0.024311065673828125, -0.022932052612304688, -0.02155303955078125, -0.020174026489257812, -0.018795013427734375, -0.017416000366210938, -0.0160369873046875, -0.014657974243164062, -0.013278961181640625, -0.011899948120117188, -0.01052093505859375, -0.009141921997070312, -0.007762908935546875, -0.0063838958740234375, -0.0050048828125, -0.0036258697509765625, -0.002246856689453125, -0.0008678436279296875, 0.00051116943359375, 0.0018901824951171875, 0.003269195556640625, 0.0046482086181640625, 0.0060272216796875, 0.0074062347412109375, 0.008785247802734375, 0.010164260864257812, 0.01154327392578125, 0.012922286987304688, 0.014301300048828125, 0.015680313110351562, 0.017059326171875, 0.018438339233398438, 0.019817352294921875, 0.021196365356445312, 0.02257537841796875, 0.023954391479492188, 0.025333404541015625, 0.026712417602539062, 0.0280914306640625, 0.029470443725585938, 0.030849456787109375, 0.03222846984863281, 0.03360748291015625, 0.03498649597167969, 0.036365509033203125, 0.03774452209472656, 0.03912353515625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 7.0, 6.0, 2.0, 11.0, 4.0, 14.0, 18.0, 17.0, 44.0, 103.0, 266.0, 285.0, 83.0, 43.0, 21.0, 12.0, 7.0, 7.0, 4.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0022640228271484375, -0.002201065421104431, -0.002138108015060425, -0.0020751506090164185, -0.002012193202972412, -0.0019492357969284058, -0.0018862783908843994, -0.001823320984840393, -0.0017603635787963867, -0.0016974061727523804, -0.001634448766708374, -0.0015714913606643677, -0.0015085339546203613, -0.001445576548576355, -0.0013826191425323486, -0.0013196617364883423, -0.001256704330444336, -0.0011937469244003296, -0.0011307895183563232, -0.001067832112312317, -0.0010048747062683105, -0.0009419173002243042, -0.0008789598941802979, -0.0008160024881362915, -0.0007530450820922852, -0.0006900876760482788, -0.0006271302700042725, -0.0005641728639602661, -0.0005012154579162598, -0.0004382580518722534, -0.00037530064582824707, -0.0003123432397842407, -0.0002493858337402344, -0.00018642842769622803, -0.00012347102165222168, -6.051361560821533e-05, 2.4437904357910156e-06, 6.540119647979736e-05, 0.0001283586025238037, 0.00019131600856781006, 0.0002542734146118164, 0.00031723082065582275, 0.0003801882266998291, 0.00044314563274383545, 0.0005061030387878418, 0.0005690604448318481, 0.0006320178508758545, 0.0006949752569198608, 0.0007579326629638672, 0.0008208900690078735, 0.0008838474750518799, 0.0009468048810958862, 0.0010097622871398926, 0.001072719693183899, 0.0011356770992279053, 0.0011986345052719116, 0.001261591911315918, 0.0013245493173599243, 0.0013875067234039307, 0.001450464129447937, 0.0015134215354919434, 0.0015763789415359497, 0.001639336347579956, 0.0017022937536239624, 0.0017652511596679688]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 7.0, 12.0, 14.0, 13.0, 21.0, 27.0, 38.0, 57.0, 86.0, 147.0, 262.0, 457.0, 1018.0, 2536.0, 12593.0, 987770.0, 36384.0, 4218.0, 1367.0, 607.0, 361.0, 187.0, 125.0, 74.0, 56.0, 42.0, 23.0, 11.0, 6.0, 10.0, 5.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.023193359375, -0.022504806518554688, -0.021816253662109375, -0.021127700805664062, -0.02043914794921875, -0.019750595092773438, -0.019062042236328125, -0.018373489379882812, -0.0176849365234375, -0.016996383666992188, -0.016307830810546875, -0.015619277954101562, -0.01493072509765625, -0.014242172241210938, -0.013553619384765625, -0.012865066528320312, -0.012176513671875, -0.011487960815429688, -0.010799407958984375, -0.010110855102539062, -0.00942230224609375, -0.008733749389648438, -0.008045196533203125, -0.0073566436767578125, -0.0066680908203125, -0.0059795379638671875, -0.005290985107421875, -0.0046024322509765625, -0.00391387939453125, -0.0032253265380859375, -0.002536773681640625, -0.0018482208251953125, -0.00115966796875, -0.0004711151123046875, 0.000217437744140625, 0.0009059906005859375, 0.00159454345703125, 0.0022830963134765625, 0.002971649169921875, 0.0036602020263671875, 0.0043487548828125, 0.0050373077392578125, 0.005725860595703125, 0.0064144134521484375, 0.00710296630859375, 0.0077915191650390625, 0.008480072021484375, 0.009168624877929688, 0.009857177734375, 0.010545730590820312, 0.011234283447265625, 0.011922836303710938, 0.01261138916015625, 0.013299942016601562, 0.013988494873046875, 0.014677047729492188, 0.0153656005859375, 0.016054153442382812, 0.016742706298828125, 0.017431259155273438, 0.01811981201171875, 0.018808364868164062, 0.019496917724609375, 0.020185470581054688, 0.0208740234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 12.0, 7.0, 9.0, 14.0, 12.0, 25.0, 36.0, 64.0, 178.0, 370.0, 99.0, 37.0, 20.0, 20.0, 17.0, 9.0, 17.0, 8.0, 7.0, 6.0, 6.0, 2.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005023956298828125, -0.00487285852432251, -0.0047217607498168945, -0.004570662975311279, -0.004419565200805664, -0.004268467426300049, -0.004117369651794434, -0.003966271877288818, -0.003815174102783203, -0.003664076328277588, -0.0035129785537719727, -0.0033618807792663574, -0.003210783004760742, -0.003059685230255127, -0.0029085874557495117, -0.0027574896812438965, -0.0026063919067382812, -0.002455294132232666, -0.0023041963577270508, -0.0021530985832214355, -0.0020020008087158203, -0.001850903034210205, -0.0016998052597045898, -0.0015487074851989746, -0.0013976097106933594, -0.0012465119361877441, -0.001095414161682129, -0.0009443163871765137, -0.0007932186126708984, -0.0006421208381652832, -0.000491023063659668, -0.00033992528915405273, -0.0001888275146484375, -3.7729740142822266e-05, 0.00011336803436279297, 0.0002644658088684082, 0.00041556358337402344, 0.0005666613578796387, 0.0007177591323852539, 0.0008688569068908691, 0.0010199546813964844, 0.0011710524559020996, 0.0013221502304077148, 0.00147324800491333, 0.0016243457794189453, 0.0017754435539245605, 0.0019265413284301758, 0.002077639102935791, 0.0022287368774414062, 0.0023798346519470215, 0.0025309324264526367, 0.002682030200958252, 0.002833127975463867, 0.0029842257499694824, 0.0031353235244750977, 0.003286421298980713, 0.003437519073486328, 0.0035886168479919434, 0.0037397146224975586, 0.003890812397003174, 0.004041910171508789, 0.004193007946014404, 0.0043441057205200195, 0.004495203495025635, 0.00464630126953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 9.0, 10.0, 15.0, 30.0, 130.0, 636.0, 95.0, 18.0, 9.0, 13.0, 8.0, 2.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26637715101242065, -0.254488468170166, -0.242599755525589, -0.23071107268333435, -0.21882237493991852, -0.20693367719650269, -0.19504499435424805, -0.18315629661083221, -0.17126759886741638, -0.15937890112400055, -0.14749020338058472, -0.13560152053833008, -0.12371282279491425, -0.11182412505149841, -0.09993543475866318, -0.08804674446582794, -0.07615804672241211, -0.06426934897899628, -0.05238065868616104, -0.04049196466803551, -0.028603270649909973, -0.01671457663178444, -0.004825882613658905, 0.007062807679176331, 0.018951505422592163, 0.030840199440717697, 0.04272889345884323, 0.054617587476968765, 0.0665062814950943, 0.07839497923851013, 0.09028366953134537, 0.1021723598241806, 0.11406102776527405, 0.12594972550868988, 0.1378384232521057, 0.14972710609436035, 0.16161580383777618, 0.17350450158119202, 0.18539318442344666, 0.1972818821668625, 0.20917057991027832, 0.22105927765369415, 0.23294797539710999, 0.24483665823936462, 0.25672537088394165, 0.2686140537261963, 0.2805027365684509, 0.29239141941070557, 0.3042801320552826, 0.31616881489753723, 0.32805752754211426, 0.3399462103843689, 0.35183489322662354, 0.36372360587120056, 0.3756122887134552, 0.3875010013580322, 0.39938968420028687, 0.4112783670425415, 0.42316707968711853, 0.43505576252937317, 0.4469444751739502, 0.45883315801620483, 0.4707218408584595, 0.4826105237007141, 0.49449923634529114]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 10.0, 13.0, 9.0, 10.0, 18.0, 29.0, 42.0, 86.0, 136.0, 197.0, 141.0, 111.0, 62.0, 39.0, 16.0, 12.0, 13.0, 9.0, 10.0, 4.0, 5.0, 8.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21385985612869263, -0.2080519199371338, -0.20224396884441376, -0.19643603265285492, -0.19062809646129608, -0.18482014536857605, -0.1790122091770172, -0.17320427298545837, -0.16739633679389954, -0.1615884006023407, -0.15578044950962067, -0.14997251331806183, -0.144164577126503, -0.13835662603378296, -0.13254868984222412, -0.12674075365066528, -0.12093280255794525, -0.11512485891580582, -0.10931692272424698, -0.10350897908210754, -0.0977010428905487, -0.09189309924840927, -0.08608515560626984, -0.080277219414711, -0.07446927577257156, -0.06866133213043213, -0.06285339593887329, -0.057045452296733856, -0.05123751237988472, -0.045429572463035583, -0.03962162882089615, -0.03381368890404701, -0.028005748987197876, -0.02219780907034874, -0.016389867290854454, -0.010581925511360168, -0.004773985594511032, 0.0010339543223381042, 0.006841897964477539, 0.012649837881326675, 0.018457777798175812, 0.024265717715024948, 0.030073659494519234, 0.03588160127401352, 0.041689541190862656, 0.04749748110771179, 0.05330542474985123, 0.05911336466670036, 0.0649213045835495, 0.07072924822568893, 0.07653718441724777, 0.08234512805938721, 0.08815306425094604, 0.09396100789308548, 0.09976895153522491, 0.10557688772678375, 0.11138483136892319, 0.11719277501106262, 0.12300071120262146, 0.1288086473941803, 0.13461659848690033, 0.14042453467845917, 0.1462324857711792, 0.15204042196273804, 0.15784835815429688]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 6.0, 13.0, 14.0, 13.0, 20.0, 30.0, 29.0, 58.0, 140.0, 2663.0, 4164606.0, 25798.0, 618.0, 111.0, 38.0, 30.0, 17.0, 14.0, 16.0, 8.0, 6.0, 5.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5, -3.3526611328125, -3.205322265625, -3.0579833984375, -2.91064453125, -2.7633056640625, -2.615966796875, -2.4686279296875, -2.3212890625, -2.1739501953125, -2.026611328125, -1.8792724609375, -1.73193359375, -1.5845947265625, -1.437255859375, -1.2899169921875, -1.142578125, -0.9952392578125, -0.847900390625, -0.7005615234375, -0.55322265625, -0.4058837890625, -0.258544921875, -0.1112060546875, 0.0361328125, 0.1834716796875, 0.330810546875, 0.4781494140625, 0.62548828125, 0.7728271484375, 0.920166015625, 1.0675048828125, 1.21484375, 1.3621826171875, 1.509521484375, 1.6568603515625, 1.80419921875, 1.9515380859375, 2.098876953125, 2.2462158203125, 2.3935546875, 2.5408935546875, 2.688232421875, 2.8355712890625, 2.98291015625, 3.1302490234375, 3.277587890625, 3.4249267578125, 3.572265625, 3.7196044921875, 3.866943359375, 4.0142822265625, 4.16162109375, 4.3089599609375, 4.456298828125, 4.6036376953125, 4.7509765625, 4.8983154296875, 5.045654296875, 5.1929931640625, 5.34033203125, 5.4876708984375, 5.635009765625, 5.7823486328125, 5.9296875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 1.0, 4.0, 6.0, 7.0, 4.0, 14.0, 7.0, 6.0, 10.0, 19.0, 17.0, 351.0, 430.0, 35.0, 11.0, 11.0, 8.0, 8.0, 9.0, 5.0, 7.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018367767333984375, -0.0017633140087127686, -0.0016898512840270996, -0.0016163885593414307, -0.0015429258346557617, -0.0014694631099700928, -0.0013960003852844238, -0.0013225376605987549, -0.001249074935913086, -0.001175612211227417, -0.001102149486541748, -0.001028686761856079, -0.0009552240371704102, -0.0008817613124847412, -0.0008082985877990723, -0.0007348358631134033, -0.0006613731384277344, -0.0005879104137420654, -0.0005144476890563965, -0.00044098496437072754, -0.0003675222396850586, -0.00029405951499938965, -0.0002205967903137207, -0.00014713406562805176, -7.367134094238281e-05, -2.086162567138672e-07, 7.325410842895508e-05, 0.00014671683311462402, 0.00022017955780029297, 0.0002936422824859619, 0.00036710500717163086, 0.0004405677318572998, 0.0005140304565429688, 0.0005874931812286377, 0.0006609559059143066, 0.0007344186305999756, 0.0008078813552856445, 0.0008813440799713135, 0.0009548068046569824, 0.0010282695293426514, 0.0011017322540283203, 0.0011751949787139893, 0.0012486577033996582, 0.0013221204280853271, 0.001395583152770996, 0.001469045877456665, 0.001542508602142334, 0.001615971326828003, 0.0016894340515136719, 0.0017628967761993408, 0.0018363595008850098, 0.0019098222255706787, 0.0019832849502563477, 0.0020567476749420166, 0.0021302103996276855, 0.0022036731243133545, 0.0022771358489990234, 0.0023505985736846924, 0.0024240612983703613, 0.0024975240230560303, 0.0025709867477416992, 0.002644449472427368, 0.002717912197113037, 0.002791374921798706, 0.002864837646484375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 8.0, 10.0, 17.0, 17.0, 19.0, 29.0, 39.0, 33.0, 44.0, 41.0, 63.0, 73.0, 84.0, 133.0, 140.0, 399.0, 12130.0, 4174005.0, 5859.0, 332.0, 148.0, 120.0, 103.0, 77.0, 66.0, 55.0, 59.0, 36.0, 24.0, 27.0, 22.0, 19.0, 5.0, 11.0, 6.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.603515625, -0.5806732177734375, -0.557830810546875, -0.5349884033203125, -0.51214599609375, -0.4893035888671875, -0.466461181640625, -0.4436187744140625, -0.4207763671875, -0.3979339599609375, -0.375091552734375, -0.3522491455078125, -0.32940673828125, -0.3065643310546875, -0.283721923828125, -0.2608795166015625, -0.238037109375, -0.2151947021484375, -0.192352294921875, -0.1695098876953125, -0.14666748046875, -0.1238250732421875, -0.100982666015625, -0.0781402587890625, -0.0552978515625, -0.0324554443359375, -0.009613037109375, 0.0132293701171875, 0.03607177734375, 0.0589141845703125, 0.081756591796875, 0.1045989990234375, 0.12744140625, 0.1502838134765625, 0.173126220703125, 0.1959686279296875, 0.21881103515625, 0.2416534423828125, 0.264495849609375, 0.2873382568359375, 0.3101806640625, 0.3330230712890625, 0.355865478515625, 0.3787078857421875, 0.40155029296875, 0.4243927001953125, 0.447235107421875, 0.4700775146484375, 0.492919921875, 0.5157623291015625, 0.538604736328125, 0.5614471435546875, 0.58428955078125, 0.6071319580078125, 0.629974365234375, 0.6528167724609375, 0.6756591796875, 0.6985015869140625, 0.721343994140625, 0.7441864013671875, 0.76702880859375, 0.7898712158203125, 0.812713623046875, 0.8355560302734375, 0.8583984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 8.0, 13.0, 13.0, 16.0, 21.0, 35.0, 36.0, 37.0, 41.0, 44.0, 68.0, 70.0, 95.0, 122.0, 131.0, 164.0, 374.0, 1535.0, 292.0, 172.0, 126.0, 125.0, 101.0, 71.0, 70.0, 57.0, 54.0, 36.0, 26.0, 29.0, 21.0, 16.0, 8.0, 11.0, 5.0, 10.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004657745361328125, -0.004481017589569092, -0.004304289817810059, -0.004127562046051025, -0.003950834274291992, -0.003774106502532959, -0.0035973787307739258, -0.0034206509590148926, -0.0032439231872558594, -0.003067195415496826, -0.002890467643737793, -0.0027137398719787598, -0.0025370121002197266, -0.0023602843284606934, -0.00218355655670166, -0.002006828784942627, -0.0018301010131835938, -0.0016533732414245605, -0.0014766454696655273, -0.0012999176979064941, -0.001123189926147461, -0.0009464621543884277, -0.0007697343826293945, -0.0005930066108703613, -0.0004162788391113281, -0.00023955106735229492, -6.282329559326172e-05, 0.00011390447616577148, 0.0002906322479248047, 0.0004673600196838379, 0.0006440877914428711, 0.0008208155632019043, 0.0009975433349609375, 0.0011742711067199707, 0.001350998878479004, 0.0015277266502380371, 0.0017044544219970703, 0.0018811821937561035, 0.0020579099655151367, 0.00223463773727417, 0.002411365509033203, 0.0025880932807922363, 0.0027648210525512695, 0.0029415488243103027, 0.003118276596069336, 0.003295004367828369, 0.0034717321395874023, 0.0036484599113464355, 0.0038251876831054688, 0.004001915454864502, 0.004178643226623535, 0.004355370998382568, 0.0045320987701416016, 0.004708826541900635, 0.004885554313659668, 0.005062282085418701, 0.005239009857177734, 0.005415737628936768, 0.005592465400695801, 0.005769193172454834, 0.005945920944213867, 0.0061226487159729, 0.006299376487731934, 0.006476104259490967, 0.00665283203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 8.0, 14.0, 33.0, 76.0, 298.0, 359.0, 111.0, 37.0, 27.0, 10.0, 10.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.185691237449646, -0.18147197365760803, -0.17725272476673126, -0.1730334609746933, -0.16881419718265533, -0.16459494829177856, -0.1603756844997406, -0.15615642070770264, -0.15193715691566467, -0.1477178931236267, -0.14349864423274994, -0.13927938044071198, -0.135060116648674, -0.13084086775779724, -0.12662160396575928, -0.12240234017372131, -0.11818309128284454, -0.11396383494138718, -0.10974457114934921, -0.10552531480789185, -0.10130605101585388, -0.09708679467439651, -0.09286753833293915, -0.08864827454090118, -0.08442901819944382, -0.08020976185798645, -0.07599049806594849, -0.07177124172449112, -0.06755198538303375, -0.06333272159099579, -0.05911346524953842, -0.054894205182790756, -0.05067494511604309, -0.046455685049295425, -0.04223642498254776, -0.03801716864109039, -0.03379790857434273, -0.029578648507595062, -0.025359390303492546, -0.02114013209939003, -0.016920872032642365, -0.012701612897217274, -0.008482353761792183, -0.004263094626367092, -4.383549094200134e-05, 0.004175424575805664, 0.00839468277990818, 0.012613940984010696, 0.016833201050758362, 0.021052461117506027, 0.025271719321608543, 0.02949097752571106, 0.033710237592458725, 0.03792949765920639, 0.04214875400066376, 0.04636801406741142, 0.05058727413415909, 0.054806534200906754, 0.05902579426765442, 0.06324505060911179, 0.06746430695056915, 0.07168357074260712, 0.07590282708406448, 0.08012208342552185, 0.08434134721755981]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 2.0, 5.0, 9.0, 12.0, 20.0, 17.0, 24.0, 26.0, 37.0, 43.0, 41.0, 36.0, 49.0, 49.0, 47.0, 66.0, 54.0, 57.0, 62.0, 51.0, 47.0, 41.0, 44.0, 30.0, 23.0, 22.0, 21.0, 19.0, 17.0, 7.0, 5.0, 6.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04750263690948486, -0.04616200178861618, -0.0448213666677475, -0.043480727821588516, -0.04214009270071983, -0.04079945757985115, -0.03945881873369217, -0.038118183612823486, -0.0367775484919548, -0.03543691337108612, -0.03409627825021744, -0.032755639404058456, -0.031415004283189774, -0.03007436916232109, -0.02873373217880726, -0.027393095195293427, -0.026052460074424744, -0.02471182495355606, -0.02337118797004223, -0.022030550986528397, -0.020689915865659714, -0.01934928074479103, -0.0180086437612772, -0.016668006777763367, -0.015327371656894684, -0.013986735604703426, -0.012646099552512169, -0.011305463500320911, -0.009964827448129654, -0.008624191395938396, -0.007283555343747139, -0.0059429192915558815, -0.004602283239364624, -0.0032616471871733665, -0.001921011134982109, -0.0005803750827908516, 0.0007602609694004059, 0.0021008970215916634, 0.003441533073782921, 0.004782169125974178, 0.006122805178165436, 0.007463441230356693, 0.00880407728254795, 0.010144713334739208, 0.011485349386930466, 0.012825985439121723, 0.01416662149131298, 0.015507257543504238, 0.016847893595695496, 0.01818852871656418, 0.01952916570007801, 0.020869802683591843, 0.022210437804460526, 0.02355107292532921, 0.02489170990884304, 0.026232346892356873, 0.027572982013225555, 0.02891361713409424, 0.03025425411760807, 0.0315948911011219, 0.032935526221990585, 0.03427616134285927, 0.03561680018901825, 0.03695743530988693, 0.038298070430755615]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 16.0, 19.0, 33.0, 30.0, 33.0, 59.0, 100.0, 142.0, 190.0, 277.0, 423.0, 593.0, 888.0, 1414.0, 2152.0, 3574.0, 6303.0, 11994.0, 28886.0, 892565.0, 61372.0, 16804.0, 8245.0, 4574.0, 2737.0, 1682.0, 1103.0, 731.0, 498.0, 326.0, 256.0, 153.0, 106.0, 79.0, 50.0, 31.0, 28.0, 23.0, 11.0, 16.0, 8.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.047607421875, -0.04615211486816406, -0.044696807861328125, -0.04324150085449219, -0.04178619384765625, -0.04033088684082031, -0.038875579833984375, -0.03742027282714844, -0.0359649658203125, -0.03450965881347656, -0.033054351806640625, -0.03159904479980469, -0.03014373779296875, -0.028688430786132812, -0.027233123779296875, -0.025777816772460938, -0.024322509765625, -0.022867202758789062, -0.021411895751953125, -0.019956588745117188, -0.01850128173828125, -0.017045974731445312, -0.015590667724609375, -0.014135360717773438, -0.0126800537109375, -0.011224746704101562, -0.009769439697265625, -0.008314132690429688, -0.00685882568359375, -0.0054035186767578125, -0.003948211669921875, -0.0024929046630859375, -0.00103759765625, 0.0004177093505859375, 0.001873016357421875, 0.0033283233642578125, 0.00478363037109375, 0.0062389373779296875, 0.007694244384765625, 0.009149551391601562, 0.0106048583984375, 0.012060165405273438, 0.013515472412109375, 0.014970779418945312, 0.01642608642578125, 0.017881393432617188, 0.019336700439453125, 0.020792007446289062, 0.022247314453125, 0.023702621459960938, 0.025157928466796875, 0.026613235473632812, 0.02806854248046875, 0.029523849487304688, 0.030979156494140625, 0.03243446350097656, 0.0338897705078125, 0.03534507751464844, 0.036800384521484375, 0.03825569152832031, 0.03971099853515625, 0.04116630554199219, 0.042621612548828125, 0.04407691955566406, 0.0455322265625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 6.0, 8.0, 13.0, 7.0, 12.0, 13.0, 15.0, 103.0, 606.0, 111.0, 12.0, 11.0, 5.0, 12.0, 7.0, 8.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018367767333984375, -0.001764446496963501, -0.0016921162605285645, -0.001619786024093628, -0.0015474557876586914, -0.0014751255512237549, -0.0014027953147888184, -0.0013304650783538818, -0.0012581348419189453, -0.0011858046054840088, -0.0011134743690490723, -0.0010411441326141357, -0.0009688138961791992, -0.0008964836597442627, -0.0008241534233093262, -0.0007518231868743896, -0.0006794929504394531, -0.0006071627140045166, -0.0005348324775695801, -0.00046250224113464355, -0.00039017200469970703, -0.0003178417682647705, -0.000245511531829834, -0.00017318129539489746, -0.00010085105895996094, -2.8520822525024414e-05, 4.380941390991211e-05, 0.00011613965034484863, 0.00018846988677978516, 0.0002608001232147217, 0.0003331303596496582, 0.0004054605960845947, 0.00047779083251953125, 0.0005501210689544678, 0.0006224513053894043, 0.0006947815418243408, 0.0007671117782592773, 0.0008394420146942139, 0.0009117722511291504, 0.000984102487564087, 0.0010564327239990234, 0.00112876296043396, 0.0012010931968688965, 0.001273423433303833, 0.0013457536697387695, 0.001418083906173706, 0.0014904141426086426, 0.001562744379043579, 0.0016350746154785156, 0.0017074048519134521, 0.0017797350883483887, 0.0018520653247833252, 0.0019243955612182617, 0.0019967257976531982, 0.0020690560340881348, 0.0021413862705230713, 0.002213716506958008, 0.0022860467433929443, 0.002358376979827881, 0.0024307072162628174, 0.002503037452697754, 0.0025753676891326904, 0.002647697925567627, 0.0027200281620025635, 0.0027923583984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 3.0, 5.0, 7.0, 10.0, 6.0, 12.0, 13.0, 15.0, 19.0, 13.0, 19.0, 19.0, 32.0, 34.0, 59.0, 96.0, 488.0, 3904.0, 626243.0, 412766.0, 3834.0, 493.0, 125.0, 63.0, 33.0, 35.0, 30.0, 30.0, 24.0, 17.0, 21.0, 13.0, 9.0, 5.0, 8.0, 9.0, 8.0, 3.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11773681640625, -0.11381053924560547, -0.10988426208496094, -0.1059579849243164, -0.10203170776367188, -0.09810543060302734, -0.09417915344238281, -0.09025287628173828, -0.08632659912109375, -0.08240032196044922, -0.07847404479980469, -0.07454776763916016, -0.07062149047851562, -0.0666952133178711, -0.06276893615722656, -0.05884265899658203, -0.0549163818359375, -0.05099010467529297, -0.04706382751464844, -0.043137550354003906, -0.039211273193359375, -0.035284996032714844, -0.03135871887207031, -0.02743244171142578, -0.02350616455078125, -0.01957988739013672, -0.015653610229492188, -0.011727333068847656, -0.007801055908203125, -0.0038747787475585938, 5.14984130859375e-05, 0.003977775573730469, 0.007904052734375, 0.011830329895019531, 0.015756607055664062, 0.019682884216308594, 0.023609161376953125, 0.027535438537597656, 0.03146171569824219, 0.03538799285888672, 0.03931427001953125, 0.04324054718017578, 0.04716682434082031, 0.051093101501464844, 0.055019378662109375, 0.058945655822753906, 0.06287193298339844, 0.06679821014404297, 0.0707244873046875, 0.07465076446533203, 0.07857704162597656, 0.0825033187866211, 0.08642959594726562, 0.09035587310791016, 0.09428215026855469, 0.09820842742919922, 0.10213470458984375, 0.10606098175048828, 0.10998725891113281, 0.11391353607177734, 0.11783981323242188, 0.1217660903930664, 0.12569236755371094, 0.12961864471435547, 0.133544921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 2.0, 2.0, 8.0, 6.0, 5.0, 4.0, 5.0, 13.0, 11.0, 16.0, 18.0, 20.0, 19.0, 24.0, 20.0, 29.0, 22.0, 31.0, 34.0, 42.0, 36.0, 38.0, 57.0, 43.0, 37.0, 49.0, 37.0, 39.0, 46.0, 21.0, 27.0, 49.0, 29.0, 22.0, 30.0, 24.0, 15.0, 8.0, 11.0, 7.0, 12.0, 4.0, 9.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.005970001220703125, -0.005774199962615967, -0.005578398704528809, -0.00538259744644165, -0.005186796188354492, -0.004990994930267334, -0.004795193672180176, -0.004599392414093018, -0.004403591156005859, -0.004207789897918701, -0.004011988639831543, -0.0038161873817443848, -0.0036203861236572266, -0.0034245848655700684, -0.00322878360748291, -0.003032982349395752, -0.0028371810913085938, -0.0026413798332214355, -0.0024455785751342773, -0.002249777317047119, -0.002053976058959961, -0.0018581748008728027, -0.0016623735427856445, -0.0014665722846984863, -0.0012707710266113281, -0.00107496976852417, -0.0008791685104370117, -0.0006833672523498535, -0.0004875659942626953, -0.0002917647361755371, -9.59634780883789e-05, 9.98377799987793e-05, 0.0002956390380859375, 0.0004914402961730957, 0.0006872415542602539, 0.0008830428123474121, 0.0010788440704345703, 0.0012746453285217285, 0.0014704465866088867, 0.001666247844696045, 0.0018620491027832031, 0.0020578503608703613, 0.0022536516189575195, 0.0024494528770446777, 0.002645254135131836, 0.002841055393218994, 0.0030368566513061523, 0.0032326579093933105, 0.0034284591674804688, 0.003624260425567627, 0.003820061683654785, 0.004015862941741943, 0.0042116641998291016, 0.00440746545791626, 0.004603266716003418, 0.004799067974090576, 0.004994869232177734, 0.005190670490264893, 0.005386471748352051, 0.005582273006439209, 0.005778074264526367, 0.005973875522613525, 0.006169676780700684, 0.006365478038787842, 0.006561279296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 7.0, 8.0, 9.0, 27.0, 30.0, 71.0, 240.0, 3148.0, 1042781.0, 1893.0, 198.0, 73.0, 22.0, 12.0, 11.0, 11.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1365966796875, -0.1334514617919922, -0.13030624389648438, -0.12716102600097656, -0.12401580810546875, -0.12087059020996094, -0.11772537231445312, -0.11458015441894531, -0.1114349365234375, -0.10828971862792969, -0.10514450073242188, -0.10199928283691406, -0.09885406494140625, -0.09570884704589844, -0.09256362915039062, -0.08941841125488281, -0.086273193359375, -0.08312797546386719, -0.07998275756835938, -0.07683753967285156, -0.07369232177734375, -0.07054710388183594, -0.06740188598632812, -0.06425666809082031, -0.0611114501953125, -0.05796623229980469, -0.054821014404296875, -0.05167579650878906, -0.04853057861328125, -0.04538536071777344, -0.042240142822265625, -0.03909492492675781, -0.03594970703125, -0.03280448913574219, -0.029659271240234375, -0.026514053344726562, -0.02336883544921875, -0.020223617553710938, -0.017078399658203125, -0.013933181762695312, -0.0107879638671875, -0.0076427459716796875, -0.004497528076171875, -0.0013523101806640625, 0.00179290771484375, 0.0049381256103515625, 0.008083343505859375, 0.011228561401367188, 0.014373779296875, 0.017518997192382812, 0.020664215087890625, 0.023809432983398438, 0.02695465087890625, 0.030099868774414062, 0.033245086669921875, 0.03639030456542969, 0.0395355224609375, 0.04268074035644531, 0.045825958251953125, 0.04897117614746094, 0.05211639404296875, 0.05526161193847656, 0.058406829833984375, 0.06155204772949219, 0.064697265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 9.0, 13.0, 15.0, 42.0, 556.0, 255.0, 39.0, 24.0, 9.0, 12.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0045928955078125, -0.004362344741821289, -0.004131793975830078, -0.003901243209838867, -0.0036706924438476562, -0.0034401416778564453, -0.0032095909118652344, -0.0029790401458740234, -0.0027484893798828125, -0.0025179386138916016, -0.0022873878479003906, -0.0020568370819091797, -0.0018262863159179688, -0.0015957355499267578, -0.0013651847839355469, -0.001134634017944336, -0.000904083251953125, -0.0006735324859619141, -0.0004429817199707031, -0.0002124309539794922, 1.811981201171875e-05, 0.0002486705780029297, 0.0004792213439941406, 0.0007097721099853516, 0.0009403228759765625, 0.0011708736419677734, 0.0014014244079589844, 0.0016319751739501953, 0.0018625259399414062, 0.002093076705932617, 0.002323627471923828, 0.002554178237915039, 0.00278472900390625, 0.003015279769897461, 0.003245830535888672, 0.003476381301879883, 0.0037069320678710938, 0.003937482833862305, 0.004168033599853516, 0.0043985843658447266, 0.0046291351318359375, 0.0048596858978271484, 0.005090236663818359, 0.00532078742980957, 0.005551338195800781, 0.005781888961791992, 0.006012439727783203, 0.006242990493774414, 0.006473541259765625, 0.006704092025756836, 0.006934642791748047, 0.007165193557739258, 0.007395744323730469, 0.00762629508972168, 0.00785684585571289, 0.008087396621704102, 0.008317947387695312, 0.008548498153686523, 0.008779048919677734, 0.009009599685668945, 0.009240150451660156, 0.009470701217651367, 0.009701251983642578, 0.009931802749633789, 0.010162353515625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 12.0, 17.0, 51.0, 185.0, 2442.0, 1043158.0, 2382.0, 187.0, 63.0, 18.0, 6.0, 7.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09759521484375, -0.09459209442138672, -0.09158897399902344, -0.08858585357666016, -0.08558273315429688, -0.0825796127319336, -0.07957649230957031, -0.07657337188720703, -0.07357025146484375, -0.07056713104248047, -0.06756401062011719, -0.0645608901977539, -0.061557769775390625, -0.058554649353027344, -0.05555152893066406, -0.05254840850830078, -0.0495452880859375, -0.04654216766357422, -0.04353904724121094, -0.040535926818847656, -0.037532806396484375, -0.034529685974121094, -0.03152656555175781, -0.02852344512939453, -0.02552032470703125, -0.02251720428466797, -0.019514083862304688, -0.016510963439941406, -0.013507843017578125, -0.010504722595214844, -0.0075016021728515625, -0.004498481750488281, -0.001495361328125, 0.0015077590942382812, 0.0045108795166015625, 0.007513999938964844, 0.010517120361328125, 0.013520240783691406, 0.016523361206054688, 0.01952648162841797, 0.02252960205078125, 0.02553272247314453, 0.028535842895507812, 0.031538963317871094, 0.034542083740234375, 0.037545204162597656, 0.04054832458496094, 0.04355144500732422, 0.0465545654296875, 0.04955768585205078, 0.05256080627441406, 0.055563926696777344, 0.058567047119140625, 0.061570167541503906, 0.06457328796386719, 0.06757640838623047, 0.07057952880859375, 0.07358264923095703, 0.07658576965332031, 0.0795888900756836, 0.08259201049804688, 0.08559513092041016, 0.08859825134277344, 0.09160137176513672, 0.0946044921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 3.0, 7.0, 4.0, 11.0, 13.0, 16.0, 21.0, 24.0, 42.0, 85.0, 415.0, 156.0, 74.0, 33.0, 32.0, 16.0, 9.0, 10.0, 4.0, 5.0, 6.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.006862640380859375, -0.006653428077697754, -0.006444215774536133, -0.006235003471374512, -0.006025791168212891, -0.0058165788650512695, -0.0056073665618896484, -0.005398154258728027, -0.005188941955566406, -0.004979729652404785, -0.004770517349243164, -0.004561305046081543, -0.004352092742919922, -0.004142880439758301, -0.00393366813659668, -0.0037244558334350586, -0.0035152435302734375, -0.0033060312271118164, -0.0030968189239501953, -0.0028876066207885742, -0.002678394317626953, -0.002469182014465332, -0.002259969711303711, -0.00205075740814209, -0.0018415451049804688, -0.0016323328018188477, -0.0014231204986572266, -0.0012139081954956055, -0.0010046958923339844, -0.0007954835891723633, -0.0005862712860107422, -0.0003770589828491211, -0.0001678466796875, 4.1365623474121094e-05, 0.0002505779266357422, 0.0004597902297973633, 0.0006690025329589844, 0.0008782148361206055, 0.0010874271392822266, 0.0012966394424438477, 0.0015058517456054688, 0.0017150640487670898, 0.001924276351928711, 0.002133488655090332, 0.002342700958251953, 0.0025519132614135742, 0.0027611255645751953, 0.0029703378677368164, 0.0031795501708984375, 0.0033887624740600586, 0.0035979747772216797, 0.0038071870803833008, 0.004016399383544922, 0.004225611686706543, 0.004434823989868164, 0.004644036293029785, 0.004853248596191406, 0.005062460899353027, 0.0052716732025146484, 0.0054808855056762695, 0.005690097808837891, 0.005899310111999512, 0.006108522415161133, 0.006317734718322754, 0.006526947021484375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 8.0, 31.0, 199.0, 618.0, 92.0, 31.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10193368047475815, -0.09288366138935089, -0.08383363485336304, -0.07478360831737518, -0.06573358923196793, -0.05668356642127037, -0.047633543610572815, -0.03858352452516556, -0.029533497989177704, -0.02048347517848015, -0.011433452367782593, -0.0023834295570850372, 0.006666593253612518, 0.015716616064310074, 0.02476663887500763, 0.033816657960414886, 0.04286668449640274, 0.051916707307100296, 0.06096673011779785, 0.0700167566537857, 0.07906677573919296, 0.08811679482460022, 0.09716682136058807, 0.10621684044599533, 0.11526686698198318, 0.12431688606739044, 0.1333669126033783, 0.14241693913936615, 0.151466965675354, 0.16051697731018066, 0.16956700384616852, 0.17861703038215637, 0.18766707181930542, 0.19671709835529327, 0.20576712489128113, 0.2148171365261078, 0.22386716306209564, 0.2329171895980835, 0.24196720123291016, 0.2510172128677368, 0.26006725430488586, 0.2691172659397125, 0.2781673073768616, 0.28721731901168823, 0.2962673306465149, 0.30531737208366394, 0.3143673837184906, 0.32341742515563965, 0.3324674367904663, 0.34151744842529297, 0.350567489862442, 0.3596175014972687, 0.3686675429344177, 0.3777175545692444, 0.38676756620407104, 0.3958175778388977, 0.40486761927604675, 0.4139176309108734, 0.42296767234802246, 0.4320176839828491, 0.4410676956176758, 0.45011773705482483, 0.4591677486896515, 0.46821779012680054, 0.4772678017616272]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 6.0, 9.0, 16.0, 15.0, 28.0, 32.0, 27.0, 39.0, 44.0, 46.0, 56.0, 68.0, 77.0, 77.0, 74.0, 58.0, 55.0, 59.0, 37.0, 36.0, 25.0, 21.0, 14.0, 12.0, 14.0, 4.0, 5.0, 8.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.053205668926239014, -0.05142106115818024, -0.04963645339012146, -0.04785184934735298, -0.046067241579294205, -0.04428263381123543, -0.04249802976846695, -0.04071342200040817, -0.038928814232349396, -0.03714420646429062, -0.03535959869623184, -0.033574994653463364, -0.03179038688540459, -0.03000577911734581, -0.028221173211932182, -0.026436567306518555, -0.024651959538459778, -0.022867351770401, -0.021082745864987373, -0.019298139959573746, -0.01751353219151497, -0.015728924423456192, -0.013944318518042564, -0.012159711681306362, -0.01037510484457016, -0.008590498007833958, -0.006805891171097755, -0.005021284334361553, -0.003236677497625351, -0.0014520706608891487, 0.00033253617584705353, 0.0021171430125832558, 0.003901749849319458, 0.00568635668605566, 0.0074709635227918625, 0.009255570359528065, 0.011040177196264267, 0.01282478403300047, 0.014609390869736671, 0.0163939967751503, 0.018178604543209076, 0.019963212311267853, 0.02174781821668148, 0.023532424122095108, 0.025317031890153885, 0.027101639658212662, 0.02888624556362629, 0.030670851469039917, 0.032455459237098694, 0.03424006700515747, 0.03602467477321625, 0.037809278815984726, 0.0395938865840435, 0.04137849435210228, 0.04316309839487076, 0.044947706162929535, 0.04673231393098831, 0.04851692169904709, 0.050301529467105865, 0.052086133509874344, 0.05387074127793312, 0.0556553490459919, 0.057439953088760376, 0.05922456085681915, 0.06100916862487793]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 0.0, 8.0, 4.0, 8.0, 0.0, 10.0, 12.0, 8.0, 10.0, 10.0, 16.0, 26.0, 16.0, 16.0, 28.0, 24.0, 281.0, 4193482.0, 148.0, 23.0, 22.0, 24.0, 12.0, 14.0, 12.0, 16.0, 10.0, 8.0, 6.0, 0.0, 8.0, 4.0, 4.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.662109375, -2.552642822265625, -2.44317626953125, -2.333709716796875, -2.2242431640625, -2.114776611328125, -2.00531005859375, -1.895843505859375, -1.786376953125, -1.676910400390625, -1.56744384765625, -1.457977294921875, -1.3485107421875, -1.239044189453125, -1.12957763671875, -1.020111083984375, -0.91064453125, -0.801177978515625, -0.69171142578125, -0.582244873046875, -0.4727783203125, -0.363311767578125, -0.25384521484375, -0.144378662109375, -0.034912109375, 0.074554443359375, 0.18402099609375, 0.293487548828125, 0.4029541015625, 0.512420654296875, 0.62188720703125, 0.731353759765625, 0.8408203125, 0.950286865234375, 1.05975341796875, 1.169219970703125, 1.2786865234375, 1.388153076171875, 1.49761962890625, 1.607086181640625, 1.716552734375, 1.826019287109375, 1.93548583984375, 2.044952392578125, 2.1544189453125, 2.263885498046875, 2.37335205078125, 2.482818603515625, 2.59228515625, 2.701751708984375, 2.81121826171875, 2.920684814453125, 3.0301513671875, 3.139617919921875, 3.24908447265625, 3.358551025390625, 3.468017578125, 3.577484130859375, 3.68695068359375, 3.796417236328125, 3.9058837890625, 4.015350341796875, 4.12481689453125, 4.234283447265625, 4.34375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 5.0, 9.0, 5.0, 12.0, 9.0, 13.0, 12.0, 19.0, 113.0, 479.0, 203.0, 28.0, 18.0, 9.0, 7.0, 7.0, 7.0, 8.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018596649169921875, -0.0017921626567840576, -0.0017246603965759277, -0.0016571581363677979, -0.001589655876159668, -0.001522153615951538, -0.0014546513557434082, -0.0013871490955352783, -0.0013196468353271484, -0.0012521445751190186, -0.0011846423149108887, -0.0011171400547027588, -0.001049637794494629, -0.000982135534286499, -0.0009146332740783691, -0.0008471310138702393, -0.0007796287536621094, -0.0007121264934539795, -0.0006446242332458496, -0.0005771219730377197, -0.0005096197128295898, -0.00044211745262145996, -0.0003746151924133301, -0.0003071129322052002, -0.0002396106719970703, -0.00017210841178894043, -0.00010460615158081055, -3.7103891372680664e-05, 3.039836883544922e-05, 9.79006290435791e-05, 0.00016540288925170898, 0.00023290514945983887, 0.00030040740966796875, 0.00036790966987609863, 0.0004354119300842285, 0.0005029141902923584, 0.0005704164505004883, 0.0006379187107086182, 0.000705420970916748, 0.0007729232311248779, 0.0008404254913330078, 0.0009079277515411377, 0.0009754300117492676, 0.0010429322719573975, 0.0011104345321655273, 0.0011779367923736572, 0.0012454390525817871, 0.001312941312789917, 0.0013804435729980469, 0.0014479458332061768, 0.0015154480934143066, 0.0015829503536224365, 0.0016504526138305664, 0.0017179548740386963, 0.0017854571342468262, 0.001852959394454956, 0.001920461654663086, 0.001987963914871216, 0.0020554661750793457, 0.0021229684352874756, 0.0021904706954956055, 0.0022579729557037354, 0.0023254752159118652, 0.002392977476119995, 0.002460479736328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 13.0, 9.0, 12.0, 25.0, 24.0, 39.0, 34.0, 59.0, 76.0, 121.0, 203.0, 407.0, 4191991.0, 559.0, 213.0, 135.0, 78.0, 68.0, 47.0, 26.0, 29.0, 25.0, 17.0, 14.0, 14.0, 4.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58251953125, -0.5628738403320312, -0.5432281494140625, -0.5235824584960938, -0.503936767578125, -0.48429107666015625, -0.4646453857421875, -0.44499969482421875, -0.42535400390625, -0.40570831298828125, -0.3860626220703125, -0.36641693115234375, -0.346771240234375, -0.32712554931640625, -0.3074798583984375, -0.28783416748046875, -0.2681884765625, -0.24854278564453125, -0.2288970947265625, -0.20925140380859375, -0.189605712890625, -0.16996002197265625, -0.1503143310546875, -0.13066864013671875, -0.11102294921875, -0.09137725830078125, -0.0717315673828125, -0.05208587646484375, -0.032440185546875, -0.01279449462890625, 0.0068511962890625, 0.02649688720703125, 0.046142578125, 0.06578826904296875, 0.0854339599609375, 0.10507965087890625, 0.124725341796875, 0.14437103271484375, 0.1640167236328125, 0.18366241455078125, 0.20330810546875, 0.22295379638671875, 0.2425994873046875, 0.26224517822265625, 0.281890869140625, 0.30153656005859375, 0.3211822509765625, 0.34082794189453125, 0.3604736328125, 0.38011932373046875, 0.3997650146484375, 0.41941070556640625, 0.439056396484375, 0.45870208740234375, 0.4783477783203125, 0.49799346923828125, 0.51763916015625, 0.5372848510742188, 0.5569305419921875, 0.5765762329101562, 0.596221923828125, 0.6158676147460938, 0.6355133056640625, 0.6551589965820312, 0.6748046875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 13.0, 18.0, 16.0, 22.0, 36.0, 39.0, 42.0, 89.0, 123.0, 207.0, 432.0, 1612.0, 652.0, 272.0, 144.0, 91.0, 66.0, 44.0, 31.0, 30.0, 22.0, 16.0, 10.0, 6.0, 7.0, 7.0, 7.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0038471221923828125, -0.0037132203578948975, -0.0035793185234069824, -0.0034454166889190674, -0.0033115148544311523, -0.0031776130199432373, -0.0030437111854553223, -0.0029098093509674072, -0.002775907516479492, -0.002642005681991577, -0.002508103847503662, -0.002374202013015747, -0.002240300178527832, -0.002106398344039917, -0.001972496509552002, -0.001838594675064087, -0.0017046928405761719, -0.0015707910060882568, -0.0014368891716003418, -0.0013029873371124268, -0.0011690855026245117, -0.0010351836681365967, -0.0009012818336486816, -0.0007673799991607666, -0.0006334781646728516, -0.0004995763301849365, -0.0003656744956970215, -0.00023177266120910645, -9.78708267211914e-05, 3.603100776672363e-05, 0.00016993284225463867, 0.0003038346767425537, 0.00043773651123046875, 0.0005716383457183838, 0.0007055401802062988, 0.0008394420146942139, 0.0009733438491821289, 0.001107245683670044, 0.001241147518157959, 0.001375049352645874, 0.001508951187133789, 0.001642853021621704, 0.0017767548561096191, 0.0019106566905975342, 0.0020445585250854492, 0.0021784603595733643, 0.0023123621940612793, 0.0024462640285491943, 0.0025801658630371094, 0.0027140676975250244, 0.0028479695320129395, 0.0029818713665008545, 0.0031157732009887695, 0.0032496750354766846, 0.0033835768699645996, 0.0035174787044525146, 0.0036513805389404297, 0.0037852823734283447, 0.00391918420791626, 0.004053086042404175, 0.00418698787689209, 0.004320889711380005, 0.00445479154586792, 0.004588693380355835, 0.00472259521484375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 34.0, 979.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6301983594894409, -0.6192108988761902, -0.6082234978675842, -0.5972360372543335, -0.5862486362457275, -0.5752611756324768, -0.5642737150192261, -0.5532863140106201, -0.5422988533973694, -0.5313113927841187, -0.5203239917755127, -0.509336531162262, -0.4983491003513336, -0.4873616695404053, -0.47637423872947693, -0.4653868079185486, -0.4543994069099426, -0.4434119760990143, -0.43242454528808594, -0.4214370846748352, -0.41044965386390686, -0.3994622230529785, -0.38847479224205017, -0.3774873614311218, -0.3664999008178711, -0.35551247000694275, -0.3445250391960144, -0.33353757858276367, -0.3225501477718353, -0.311562716960907, -0.30057528614997864, -0.2895878553390503, -0.27860039472579956, -0.2676129639148712, -0.25662553310394287, -0.24563808739185333, -0.234650656580925, -0.22366321086883545, -0.2126757800579071, -0.20168834924697876, -0.19070091843605042, -0.17971348762512207, -0.16872604191303253, -0.1577386111021042, -0.14675118029117584, -0.1357637345790863, -0.12477630376815796, -0.11378887295722961, -0.10280143469572067, -0.09181399643421173, -0.08082656562328339, -0.06983912736177444, -0.0588516928255558, -0.04786425828933716, -0.03687682002782822, -0.025889389216899872, -0.01490195095539093, -0.003914515487849712, 0.007072919979691505, 0.018060356378555298, 0.02904779091477394, 0.040035225450992584, 0.051022663712501526, 0.06201009452342987, 0.07299753278493881]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 2.0, 12.0, 15.0, 18.0, 19.0, 39.0, 57.0, 60.0, 59.0, 97.0, 99.0, 98.0, 79.0, 78.0, 56.0, 52.0, 43.0, 27.0, 15.0, 15.0, 3.0, 8.0, 5.0, 5.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02575206756591797, -0.02501755580306053, -0.024283042177557945, -0.02354852855205536, -0.022814016789197922, -0.022079505026340485, -0.021344991400837898, -0.020610477775335312, -0.019875966012477875, -0.019141454249620438, -0.01840694062411785, -0.017672426998615265, -0.016937915235757828, -0.01620340347290039, -0.015468889847397804, -0.014734377153217793, -0.01399986445903778, -0.013265351764857769, -0.012530839070677757, -0.011796326376497746, -0.011061813682317734, -0.010327300988137722, -0.00959278829395771, -0.008858275599777699, -0.008123762905597687, -0.007389250211417675, -0.006654737517237663, -0.0059202248230576515, -0.00518571212887764, -0.004451199434697628, -0.0037166867405176163, -0.0029821740463376045, -0.0022476613521575928, -0.001513148657977581, -0.0007786359637975693, -4.4123269617557526e-05, 0.0006903894245624542, 0.001424902118742466, 0.0021594148129224777, 0.0028939275071024895, 0.0036284402012825012, 0.004362952895462513, 0.005097465589642525, 0.0058319782838225365, 0.006566490978002548, 0.00730100367218256, 0.008035516366362572, 0.008770029060542583, 0.009504541754722595, 0.010239054448902607, 0.010973567143082619, 0.01170807983726263, 0.012442592531442642, 0.013177105225622654, 0.013911617919802666, 0.014646130613982677, 0.01538064330816269, 0.016115155071020126, 0.016849668696522713, 0.0175841823220253, 0.018318694084882736, 0.019053205847740173, 0.01978771947324276, 0.020522233098745346, 0.021256744861602783]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 5.0, 8.0, 17.0, 4.0, 17.0, 23.0, 23.0, 33.0, 31.0, 31.0, 31.0, 46.0, 54.0, 119.0, 1085.0, 72374.0, 968184.0, 5801.0, 297.0, 70.0, 42.0, 41.0, 33.0, 34.0, 25.0, 26.0, 18.0, 15.0, 13.0, 10.0, 8.0, 7.0, 6.0, 10.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.059356689453125, -0.05771923065185547, -0.05608177185058594, -0.054444313049316406, -0.052806854248046875, -0.051169395446777344, -0.04953193664550781, -0.04789447784423828, -0.04625701904296875, -0.04461956024169922, -0.04298210144042969, -0.041344642639160156, -0.039707183837890625, -0.038069725036621094, -0.03643226623535156, -0.03479480743408203, -0.0331573486328125, -0.03151988983154297, -0.029882431030273438, -0.028244972229003906, -0.026607513427734375, -0.024970054626464844, -0.023332595825195312, -0.02169513702392578, -0.02005767822265625, -0.01842021942138672, -0.016782760620117188, -0.015145301818847656, -0.013507843017578125, -0.011870384216308594, -0.010232925415039062, -0.008595466613769531, -0.0069580078125, -0.005320549011230469, -0.0036830902099609375, -0.0020456314086914062, -0.000408172607421875, 0.0012292861938476562, 0.0028667449951171875, 0.004504203796386719, 0.00614166259765625, 0.007779121398925781, 0.009416580200195312, 0.011054039001464844, 0.012691497802734375, 0.014328956604003906, 0.015966415405273438, 0.01760387420654297, 0.0192413330078125, 0.02087879180908203, 0.022516250610351562, 0.024153709411621094, 0.025791168212890625, 0.027428627014160156, 0.029066085815429688, 0.03070354461669922, 0.03234100341796875, 0.03397846221923828, 0.03561592102050781, 0.037253379821777344, 0.038890838623046875, 0.040528297424316406, 0.04216575622558594, 0.04380321502685547, 0.045440673828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 2.0, 5.0, 5.0, 8.0, 16.0, 14.0, 16.0, 31.0, 30.0, 60.0, 80.0, 67.0, 102.0, 95.0, 101.0, 87.0, 73.0, 61.0, 39.0, 47.0, 20.0, 17.0, 8.0, 13.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0027484893798828125, -0.0026895254850387573, -0.002630561590194702, -0.002571597695350647, -0.002512633800506592, -0.0024536699056625366, -0.0023947060108184814, -0.0023357421159744263, -0.002276778221130371, -0.002217814326286316, -0.0021588504314422607, -0.0020998865365982056, -0.0020409226417541504, -0.001981958746910095, -0.00192299485206604, -0.0018640309572219849, -0.0018050670623779297, -0.0017461031675338745, -0.0016871392726898193, -0.0016281753778457642, -0.001569211483001709, -0.0015102475881576538, -0.0014512836933135986, -0.0013923197984695435, -0.0013333559036254883, -0.001274392008781433, -0.001215428113937378, -0.0011564642190933228, -0.0010975003242492676, -0.0010385364294052124, -0.0009795725345611572, -0.000920608639717102, -0.0008616447448730469, -0.0008026808500289917, -0.0007437169551849365, -0.0006847530603408813, -0.0006257891654968262, -0.000566825270652771, -0.0005078613758087158, -0.00044889748096466064, -0.00038993358612060547, -0.0003309696912765503, -0.0002720057964324951, -0.00021304190158843994, -0.00015407800674438477, -9.511411190032959e-05, -3.6150217056274414e-05, 2.2813677787780762e-05, 8.177757263183594e-05, 0.0001407414674758911, 0.0001997053623199463, 0.00025866925716400146, 0.00031763315200805664, 0.0003765970468521118, 0.000435560941696167, 0.0004945248365402222, 0.0005534887313842773, 0.0006124526262283325, 0.0006714165210723877, 0.0007303804159164429, 0.000789344310760498, 0.0008483082056045532, 0.0009072721004486084, 0.0009662359952926636, 0.0010251998901367188]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 10.0, 11.0, 15.0, 18.0, 20.0, 33.0, 35.0, 48.0, 91.0, 125.0, 156.0, 279.0, 469.0, 1181.0, 4984.0, 44445.0, 737244.0, 240128.0, 14980.0, 2481.0, 721.0, 321.0, 215.0, 139.0, 100.0, 72.0, 58.0, 48.0, 32.0, 22.0, 22.0, 11.0, 7.0, 10.0, 7.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026611328125, -0.025823354721069336, -0.025035381317138672, -0.024247407913208008, -0.023459434509277344, -0.02267146110534668, -0.021883487701416016, -0.02109551429748535, -0.020307540893554688, -0.019519567489624023, -0.01873159408569336, -0.017943620681762695, -0.01715564727783203, -0.016367673873901367, -0.015579700469970703, -0.014791727066040039, -0.014003753662109375, -0.013215780258178711, -0.012427806854248047, -0.011639833450317383, -0.010851860046386719, -0.010063886642456055, -0.00927591323852539, -0.008487939834594727, -0.0076999664306640625, -0.0069119930267333984, -0.006124019622802734, -0.00533604621887207, -0.004548072814941406, -0.003760099411010742, -0.002972126007080078, -0.002184152603149414, -0.00139617919921875, -0.0006082057952880859, 0.00017976760864257812, 0.0009677410125732422, 0.0017557144165039062, 0.0025436878204345703, 0.0033316612243652344, 0.0041196346282958984, 0.0049076080322265625, 0.0056955814361572266, 0.006483554840087891, 0.007271528244018555, 0.008059501647949219, 0.008847475051879883, 0.009635448455810547, 0.010423421859741211, 0.011211395263671875, 0.011999368667602539, 0.012787342071533203, 0.013575315475463867, 0.014363288879394531, 0.015151262283325195, 0.01593923568725586, 0.016727209091186523, 0.017515182495117188, 0.01830315589904785, 0.019091129302978516, 0.01987910270690918, 0.020667076110839844, 0.021455049514770508, 0.022243022918701172, 0.023030996322631836, 0.0238189697265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 8.0, 5.0, 11.0, 16.0, 17.0, 18.0, 18.0, 24.0, 32.0, 25.0, 20.0, 24.0, 36.0, 42.0, 47.0, 45.0, 42.0, 40.0, 40.0, 37.0, 46.0, 26.0, 32.0, 42.0, 29.0, 24.0, 34.0, 26.0, 27.0, 18.0, 26.0, 17.0, 17.0, 15.0, 16.0, 7.0, 7.0, 9.0, 11.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.005279541015625, -0.005106568336486816, -0.004933595657348633, -0.004760622978210449, -0.004587650299072266, -0.004414677619934082, -0.0042417049407958984, -0.004068732261657715, -0.0038957595825195312, -0.0037227869033813477, -0.003549814224243164, -0.0033768415451049805, -0.003203868865966797, -0.0030308961868286133, -0.0028579235076904297, -0.002684950828552246, -0.0025119781494140625, -0.002339005470275879, -0.0021660327911376953, -0.0019930601119995117, -0.0018200874328613281, -0.0016471147537231445, -0.001474142074584961, -0.0013011693954467773, -0.0011281967163085938, -0.0009552240371704102, -0.0007822513580322266, -0.000609278678894043, -0.0004363059997558594, -0.0002633333206176758, -9.036064147949219e-05, 8.26120376586914e-05, 0.000255584716796875, 0.0004285573959350586, 0.0006015300750732422, 0.0007745027542114258, 0.0009474754333496094, 0.001120448112487793, 0.0012934207916259766, 0.0014663934707641602, 0.0016393661499023438, 0.0018123388290405273, 0.001985311508178711, 0.0021582841873168945, 0.002331256866455078, 0.0025042295455932617, 0.0026772022247314453, 0.002850174903869629, 0.0030231475830078125, 0.003196120262145996, 0.0033690929412841797, 0.0035420656204223633, 0.003715038299560547, 0.0038880109786987305, 0.004060983657836914, 0.004233956336975098, 0.004406929016113281, 0.004579901695251465, 0.0047528743743896484, 0.004925847053527832, 0.005098819732666016, 0.005271792411804199, 0.005444765090942383, 0.005617737770080566, 0.00579071044921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 5.0, 7.0, 7.0, 7.0, 5.0, 16.0, 13.0, 22.0, 27.0, 31.0, 41.0, 60.0, 110.0, 125.0, 311.0, 791.0, 2971.0, 21981.0, 738288.0, 268003.0, 12307.0, 2146.0, 599.0, 225.0, 137.0, 78.0, 49.0, 41.0, 24.0, 21.0, 19.0, 15.0, 15.0, 11.0, 6.0, 10.0, 5.0, 3.0, 5.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02032470703125, -0.019620895385742188, -0.018917083740234375, -0.018213272094726562, -0.01750946044921875, -0.016805648803710938, -0.016101837158203125, -0.015398025512695312, -0.0146942138671875, -0.013990402221679688, -0.013286590576171875, -0.012582778930664062, -0.01187896728515625, -0.011175155639648438, -0.010471343994140625, -0.009767532348632812, -0.009063720703125, -0.008359909057617188, -0.007656097412109375, -0.0069522857666015625, -0.00624847412109375, -0.0055446624755859375, -0.004840850830078125, -0.0041370391845703125, -0.0034332275390625, -0.0027294158935546875, -0.002025604248046875, -0.0013217926025390625, -0.00061798095703125, 8.58306884765625e-05, 0.000789642333984375, 0.0014934539794921875, 0.002197265625, 0.0029010772705078125, 0.003604888916015625, 0.0043087005615234375, 0.00501251220703125, 0.0057163238525390625, 0.006420135498046875, 0.0071239471435546875, 0.0078277587890625, 0.008531570434570312, 0.009235382080078125, 0.009939193725585938, 0.01064300537109375, 0.011346817016601562, 0.012050628662109375, 0.012754440307617188, 0.013458251953125, 0.014162063598632812, 0.014865875244140625, 0.015569686889648438, 0.01627349853515625, 0.016977310180664062, 0.017681121826171875, 0.018384933471679688, 0.0190887451171875, 0.019792556762695312, 0.020496368408203125, 0.021200180053710938, 0.02190399169921875, 0.022607803344726562, 0.023311614990234375, 0.024015426635742188, 0.02471923828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 7.0, 12.0, 14.0, 25.0, 42.0, 104.0, 334.0, 262.0, 72.0, 42.0, 20.0, 7.0, 10.0, 9.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029087066650390625, -0.00028004124760627747, -0.0002692118287086487, -0.0002583824098110199, -0.0002475529909133911, -0.00023672357201576233, -0.00022589415311813354, -0.00021506473422050476, -0.00020423531532287598, -0.0001934058964252472, -0.0001825764775276184, -0.00017174705862998962, -0.00016091763973236084, -0.00015008822083473206, -0.00013925880193710327, -0.0001284293830394745, -0.0001175999641418457, -0.00010677054524421692, -9.594112634658813e-05, -8.511170744895935e-05, -7.428228855133057e-05, -6.345286965370178e-05, -5.2623450756073e-05, -4.1794031858444214e-05, -3.096461296081543e-05, -2.0135194063186646e-05, -9.305775165557861e-06, 1.5236437320709229e-06, 1.2353062629699707e-05, 2.318248152732849e-05, 3.4011900424957275e-05, 4.484131932258606e-05, 5.5670738220214844e-05, 6.650015711784363e-05, 7.732957601547241e-05, 8.81589949131012e-05, 9.898841381072998e-05, 0.00010981783270835876, 0.00012064725160598755, 0.00013147667050361633, 0.00014230608940124512, 0.0001531355082988739, 0.00016396492719650269, 0.00017479434609413147, 0.00018562376499176025, 0.00019645318388938904, 0.00020728260278701782, 0.0002181120216846466, 0.0002289414405822754, 0.00023977085947990417, 0.00025060027837753296, 0.00026142969727516174, 0.00027225911617279053, 0.0002830885350704193, 0.0002939179539680481, 0.0003047473728656769, 0.00031557679176330566, 0.00032640621066093445, 0.00033723562955856323, 0.000348065048456192, 0.0003588944673538208, 0.0003697238862514496, 0.00038055330514907837, 0.00039138272404670715, 0.00040221214294433594]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 3.0, 7.0, 5.0, 6.0, 13.0, 9.0, 19.0, 33.0, 61.0, 139.0, 461.0, 3878.0, 999612.0, 42622.0, 1247.0, 244.0, 73.0, 38.0, 26.0, 22.0, 12.0, 6.0, 10.0, 4.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0882568359375, -0.08539009094238281, -0.08252334594726562, -0.07965660095214844, -0.07678985595703125, -0.07392311096191406, -0.07105636596679688, -0.06818962097167969, -0.0653228759765625, -0.06245613098144531, -0.059589385986328125, -0.05672264099121094, -0.05385589599609375, -0.05098915100097656, -0.048122406005859375, -0.04525566101074219, -0.042388916015625, -0.03952217102050781, -0.036655426025390625, -0.03378868103027344, -0.03092193603515625, -0.028055191040039062, -0.025188446044921875, -0.022321701049804688, -0.0194549560546875, -0.016588211059570312, -0.013721466064453125, -0.010854721069335938, -0.00798797607421875, -0.0051212310791015625, -0.002254486083984375, 0.0006122589111328125, 0.00347900390625, 0.0063457489013671875, 0.009212493896484375, 0.012079238891601562, 0.01494598388671875, 0.017812728881835938, 0.020679473876953125, 0.023546218872070312, 0.0264129638671875, 0.029279708862304688, 0.032146453857421875, 0.03501319885253906, 0.03787994384765625, 0.04074668884277344, 0.043613433837890625, 0.04648017883300781, 0.049346923828125, 0.05221366882324219, 0.055080413818359375, 0.05794715881347656, 0.06081390380859375, 0.06368064880371094, 0.06654739379882812, 0.06941413879394531, 0.0722808837890625, 0.07514762878417969, 0.07801437377929688, 0.08088111877441406, 0.08374786376953125, 0.08661460876464844, 0.08948135375976562, 0.09234809875488281, 0.09521484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 17.0, 25.0, 62.0, 154.0, 375.0, 205.0, 69.0, 36.0, 14.0, 4.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.031951904296875, -0.03120255470275879, -0.030453205108642578, -0.029703855514526367, -0.028954505920410156, -0.028205156326293945, -0.027455806732177734, -0.026706457138061523, -0.025957107543945312, -0.0252077579498291, -0.02445840835571289, -0.02370905876159668, -0.02295970916748047, -0.022210359573364258, -0.021461009979248047, -0.020711660385131836, -0.019962310791015625, -0.019212961196899414, -0.018463611602783203, -0.017714262008666992, -0.01696491241455078, -0.01621556282043457, -0.01546621322631836, -0.014716863632202148, -0.013967514038085938, -0.013218164443969727, -0.012468814849853516, -0.011719465255737305, -0.010970115661621094, -0.010220766067504883, -0.009471416473388672, -0.008722066879272461, -0.00797271728515625, -0.007223367691040039, -0.006474018096923828, -0.005724668502807617, -0.004975318908691406, -0.004225969314575195, -0.0034766197204589844, -0.0027272701263427734, -0.0019779205322265625, -0.0012285709381103516, -0.0004792213439941406, 0.0002701282501220703, 0.0010194778442382812, 0.0017688274383544922, 0.002518177032470703, 0.003267526626586914, 0.004016876220703125, 0.004766225814819336, 0.005515575408935547, 0.006264925003051758, 0.007014274597167969, 0.00776362419128418, 0.00851297378540039, 0.009262323379516602, 0.010011672973632812, 0.010761022567749023, 0.011510372161865234, 0.012259721755981445, 0.013009071350097656, 0.013758420944213867, 0.014507770538330078, 0.015257120132446289, 0.0160064697265625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 20.0, 848.0, 142.0, 4.0, 1.0, 1.0], "bins": [-1.373142957687378, -1.3501344919204712, -1.3271260261535645, -1.3041174411773682, -1.2811089754104614, -1.2581005096435547, -1.235092043876648, -1.2120834589004517, -1.189074993133545, -1.1660665273666382, -1.1430580615997314, -1.1200494766235352, -1.0970410108566284, -1.0740325450897217, -1.051024079322815, -1.0280154943466187, -1.005007028579712, -0.9819985628128052, -0.9589900374412537, -0.9359815716743469, -0.9129730463027954, -0.8899645805358887, -0.8669560551643372, -0.8439475893974304, -0.8209391236305237, -0.7979306578636169, -0.7749221324920654, -0.7519136667251587, -0.7289051413536072, -0.7058966755867004, -0.6828881502151489, -0.6598796844482422, -0.6368711590766907, -0.6138626933097839, -0.5908541679382324, -0.5678457021713257, -0.5448371767997742, -0.5218287110328674, -0.4988201856613159, -0.4758117198944092, -0.45280319452285767, -0.42979469895362854, -0.4067862033843994, -0.3837777078151703, -0.36076921224594116, -0.33776071667671204, -0.3147522211074829, -0.29174375534057617, -0.26873522996902466, -0.24572673439979553, -0.2227182388305664, -0.19970974326133728, -0.17670124769210815, -0.15369275212287903, -0.1306842714548111, -0.10767577588558197, -0.08466729521751404, -0.06165879964828491, -0.038650307804346085, -0.015641815960407257, 0.007366679608821869, 0.030375175178050995, 0.053383663296699524, 0.07639215886592865, 0.09940065443515778]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 18.0, 23.0, 16.0, 32.0, 49.0, 49.0, 61.0, 63.0, 76.0, 67.0, 82.0, 59.0, 71.0, 81.0, 50.0, 54.0, 37.0, 28.0, 31.0, 16.0, 16.0, 8.0, 2.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039511680603027344, -0.03701457381248474, -0.03451746329665184, -0.03202035278081894, -0.029523245990276337, -0.027026137337088585, -0.024529028683900833, -0.02203192003071308, -0.01953481137752533, -0.017037702724337578, -0.014540594071149826, -0.012043485417962074, -0.009546376764774323, -0.007049268111586571, -0.004552159458398819, -0.002055050805211067, 0.00044205784797668457, 0.0029391665011644363, 0.005436275154352188, 0.00793338380753994, 0.010430492460727692, 0.012927601113915443, 0.015424709767103195, 0.017921818420290947, 0.0204189270734787, 0.02291603572666645, 0.025413144379854202, 0.027910253033041954, 0.030407361686229706, 0.03290446847677231, 0.03540157899260521, 0.03789868950843811, 0.04039579629898071, 0.042892903089523315, 0.045390013605356216, 0.04788712412118912, 0.05038423091173172, 0.05288133770227432, 0.055378448218107224, 0.057875558733940125, 0.06037266552448273, 0.06286977231502533, 0.06536687910556793, 0.06786399334669113, 0.07036110013723373, 0.07285820692777634, 0.07535532116889954, 0.07785242795944214, 0.08034953474998474, 0.08284664154052734, 0.08534374833106995, 0.08784086257219315, 0.09033796936273575, 0.09283507615327835, 0.09533219039440155, 0.09782929718494415, 0.10032640397548676, 0.10282351076602936, 0.10532061755657196, 0.10781773179769516, 0.11031483858823776, 0.11281194537878036, 0.11530905961990356, 0.11780616641044617, 0.12030327320098877]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 14.0, 23.0, 23.0, 49.0, 81.0, 126.0, 250.0, 513.0, 1238.0, 4178256.0, 12843.0, 545.0, 193.0, 71.0, 40.0, 11.0, 6.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.264404296875, -0.25939035415649414, -0.2543764114379883, -0.24936246871948242, -0.24434852600097656, -0.2393345832824707, -0.23432064056396484, -0.22930669784545898, -0.22429275512695312, -0.21927881240844727, -0.2142648696899414, -0.20925092697143555, -0.2042369842529297, -0.19922304153442383, -0.19420909881591797, -0.1891951560974121, -0.18418121337890625, -0.1791672706604004, -0.17415332794189453, -0.16913938522338867, -0.1641254425048828, -0.15911149978637695, -0.1540975570678711, -0.14908361434936523, -0.14406967163085938, -0.13905572891235352, -0.13404178619384766, -0.1290278434753418, -0.12401390075683594, -0.11899995803833008, -0.11398601531982422, -0.10897207260131836, -0.1039581298828125, -0.09894418716430664, -0.09393024444580078, -0.08891630172729492, -0.08390235900878906, -0.0788884162902832, -0.07387447357177734, -0.06886053085327148, -0.06384658813476562, -0.058832645416259766, -0.053818702697753906, -0.04880475997924805, -0.04379081726074219, -0.03877687454223633, -0.03376293182373047, -0.02874898910522461, -0.02373504638671875, -0.01872110366821289, -0.013707160949707031, -0.008693218231201172, -0.0036792755126953125, 0.0013346672058105469, 0.006348609924316406, 0.011362552642822266, 0.016376495361328125, 0.021390438079833984, 0.026404380798339844, 0.0314183235168457, 0.03643226623535156, 0.04144620895385742, 0.04646015167236328, 0.05147409439086914, 0.056488037109375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 4.0, 13.0, 8.0, 21.0, 28.0, 33.0, 50.0, 54.0, 78.0, 88.0, 105.0, 97.0, 99.0, 92.0, 72.0, 53.0, 36.0, 23.0, 15.0, 14.0, 8.0, 6.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.003265380859375, -0.0031944215297698975, -0.003123462200164795, -0.0030525028705596924, -0.00298154354095459, -0.0029105842113494873, -0.0028396248817443848, -0.0027686655521392822, -0.0026977062225341797, -0.002626746892929077, -0.0025557875633239746, -0.002484828233718872, -0.0024138689041137695, -0.002342909574508667, -0.0022719502449035645, -0.002200990915298462, -0.0021300315856933594, -0.002059072256088257, -0.0019881129264831543, -0.0019171535968780518, -0.0018461942672729492, -0.0017752349376678467, -0.0017042756080627441, -0.0016333162784576416, -0.001562356948852539, -0.0014913976192474365, -0.001420438289642334, -0.0013494789600372314, -0.001278519630432129, -0.0012075603008270264, -0.0011366009712219238, -0.0010656416416168213, -0.0009946823120117188, -0.0009237229824066162, -0.0008527636528015137, -0.0007818043231964111, -0.0007108449935913086, -0.0006398856639862061, -0.0005689263343811035, -0.000497967004776001, -0.00042700767517089844, -0.0003560483455657959, -0.00028508901596069336, -0.00021412968635559082, -0.00014317035675048828, -7.221102714538574e-05, -1.2516975402832031e-06, 6.970763206481934e-05, 0.00014066696166992188, 0.00021162629127502441, 0.00028258562088012695, 0.0003535449504852295, 0.00042450428009033203, 0.0004954636096954346, 0.0005664229393005371, 0.0006373822689056396, 0.0007083415985107422, 0.0007793009281158447, 0.0008502602577209473, 0.0009212195873260498, 0.0009921789169311523, 0.0010631382465362549, 0.0011340975761413574, 0.00120505690574646, 0.0012760162353515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 10.0, 13.0, 36.0, 48.0, 98.0, 128.0, 169.0, 252.0, 762.0, 4189696.0, 2360.0, 261.0, 166.0, 111.0, 69.0, 42.0, 35.0, 14.0, 10.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65185546875, -0.6372528076171875, -0.622650146484375, -0.6080474853515625, -0.59344482421875, -0.5788421630859375, -0.564239501953125, -0.5496368408203125, -0.5350341796875, -0.5204315185546875, -0.505828857421875, -0.4912261962890625, -0.47662353515625, -0.4620208740234375, -0.447418212890625, -0.4328155517578125, -0.418212890625, -0.4036102294921875, -0.389007568359375, -0.3744049072265625, -0.35980224609375, -0.3451995849609375, -0.330596923828125, -0.3159942626953125, -0.3013916015625, -0.2867889404296875, -0.272186279296875, -0.2575836181640625, -0.24298095703125, -0.2283782958984375, -0.213775634765625, -0.1991729736328125, -0.1845703125, -0.1699676513671875, -0.155364990234375, -0.1407623291015625, -0.12615966796875, -0.1115570068359375, -0.096954345703125, -0.0823516845703125, -0.0677490234375, -0.0531463623046875, -0.038543701171875, -0.0239410400390625, -0.00933837890625, 0.0052642822265625, 0.019866943359375, 0.0344696044921875, 0.049072265625, 0.0636749267578125, 0.078277587890625, 0.0928802490234375, 0.10748291015625, 0.1220855712890625, 0.136688232421875, 0.1512908935546875, 0.1658935546875, 0.1804962158203125, 0.195098876953125, 0.2097015380859375, 0.22430419921875, 0.2389068603515625, 0.253509521484375, 0.2681121826171875, 0.28271484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 18.0, 306.0, 3605.0, 138.0, 17.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.064453125, -0.06330907344818115, -0.062165021896362305, -0.06102097034454346, -0.05987691879272461, -0.05873286724090576, -0.057588815689086914, -0.056444764137268066, -0.05530071258544922, -0.05415666103363037, -0.05301260948181152, -0.051868557929992676, -0.05072450637817383, -0.04958045482635498, -0.04843640327453613, -0.047292351722717285, -0.04614830017089844, -0.04500424861907959, -0.04386019706726074, -0.042716145515441895, -0.04157209396362305, -0.0404280424118042, -0.03928399085998535, -0.038139939308166504, -0.036995887756347656, -0.03585183620452881, -0.03470778465270996, -0.03356373310089111, -0.032419681549072266, -0.03127562999725342, -0.03013157844543457, -0.028987526893615723, -0.027843475341796875, -0.026699423789978027, -0.02555537223815918, -0.024411320686340332, -0.023267269134521484, -0.022123217582702637, -0.02097916603088379, -0.01983511447906494, -0.018691062927246094, -0.017547011375427246, -0.0164029598236084, -0.01525890827178955, -0.014114856719970703, -0.012970805168151855, -0.011826753616333008, -0.01068270206451416, -0.009538650512695312, -0.008394598960876465, -0.007250547409057617, -0.0061064958572387695, -0.004962444305419922, -0.0038183927536010742, -0.0026743412017822266, -0.001530289649963379, -0.00038623809814453125, 0.0007578134536743164, 0.001901865005493164, 0.0030459165573120117, 0.004189968109130859, 0.005334019660949707, 0.006478071212768555, 0.007622122764587402, 0.00876617431640625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 13.0, 55.0, 277.0, 561.0, 80.0, 10.0, 12.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6964147090911865, -0.6833183765411377, -0.6702221035957336, -0.6571257710456848, -0.644029438495636, -0.6309331059455872, -0.6178368330001831, -0.6047405004501343, -0.5916441679000854, -0.5785478353500366, -0.5654515624046326, -0.5523552298545837, -0.5392588973045349, -0.5261625647544861, -0.513066291809082, -0.4999699592590332, -0.48687365651130676, -0.4737773537635803, -0.4606810212135315, -0.44758471846580505, -0.4344883859157562, -0.4213920831680298, -0.40829575061798096, -0.3951994478702545, -0.3821031451225281, -0.36900684237480164, -0.3559105098247528, -0.34281420707702637, -0.32971787452697754, -0.3166215717792511, -0.30352526903152466, -0.29042893648147583, -0.277332603931427, -0.26423630118370056, -0.25113996863365173, -0.2380436658859253, -0.22494733333587646, -0.21185103058815002, -0.1987547129392624, -0.18565839529037476, -0.17256207764148712, -0.1594657599925995, -0.14636944234371185, -0.13327312469482422, -0.12017681449651718, -0.10708049684762955, -0.09398418664932251, -0.08088786900043488, -0.06779155135154724, -0.05469523370265961, -0.04159891977906227, -0.028502605855464935, -0.015406288206577301, -0.0023099705576896667, 0.01078633964061737, 0.023882657289505005, 0.03697897493839264, 0.05007529258728027, 0.06317161023616791, 0.07626792043447495, 0.08936423808336258, 0.10246055573225021, 0.11555686593055725, 0.12865318357944489, 0.14174950122833252]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 14.0, 20.0, 42.0, 74.0, 104.0, 135.0, 156.0, 157.0, 108.0, 93.0, 40.0, 29.0, 18.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1467735767364502, -0.14198756217956543, -0.13720156252384186, -0.1324155479669571, -0.12762954831123352, -0.12284353375434875, -0.11805751919746399, -0.11327151209115982, -0.10848550498485565, -0.10369949787855148, -0.09891349077224731, -0.09412747621536255, -0.08934146910905838, -0.08455546200275421, -0.07976944744586945, -0.07498344033956528, -0.07019743323326111, -0.06541142612695694, -0.06062541529536247, -0.055839404463768005, -0.05105339735746384, -0.04626739025115967, -0.0414813794195652, -0.036695368587970734, -0.031909361481666565, -0.027123352512717247, -0.02233734354376793, -0.01755133457481861, -0.012765325605869293, -0.007979316636919975, -0.0031933076679706573, 0.0015927031636238098, 0.0063787102699279785, 0.011164719238877296, 0.015950728207826614, 0.020736737176775932, 0.02552274614572525, 0.030308755114674568, 0.035094764083623886, 0.03988077491521835, 0.04466678202152252, 0.04945278912782669, 0.05423879995942116, 0.059024810791015625, 0.0638108178973198, 0.06859682500362396, 0.07338283956050873, 0.0781688466668129, 0.08295485377311707, 0.08774086087942123, 0.0925268679857254, 0.09731288254261017, 0.10209888964891434, 0.1068848967552185, 0.11167091131210327, 0.11645691841840744, 0.12124292552471161, 0.12602894008159637, 0.13081493973731995, 0.1356009542942047, 0.14038696885108948, 0.14517296850681305, 0.14995898306369781, 0.1547449827194214, 0.15953099727630615]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 7.0, 4.0, 5.0, 14.0, 3.0, 12.0, 15.0, 19.0, 20.0, 29.0, 47.0, 65.0, 100.0, 172.0, 253.0, 464.0, 950.0, 2402.0, 9665.0, 64449.0, 826133.0, 123631.0, 14052.0, 3350.0, 1180.0, 581.0, 304.0, 196.0, 111.0, 79.0, 59.0, 38.0, 35.0, 27.0, 12.0, 13.0, 10.0, 11.0, 4.0, 6.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0], "bins": [-0.07342529296875, -0.07117462158203125, -0.0689239501953125, -0.06667327880859375, -0.064422607421875, -0.06217193603515625, -0.0599212646484375, -0.05767059326171875, -0.055419921875, -0.05316925048828125, -0.0509185791015625, -0.04866790771484375, -0.046417236328125, -0.04416656494140625, -0.0419158935546875, -0.03966522216796875, -0.03741455078125, -0.03516387939453125, -0.0329132080078125, -0.03066253662109375, -0.028411865234375, -0.02616119384765625, -0.0239105224609375, -0.02165985107421875, -0.0194091796875, -0.01715850830078125, -0.0149078369140625, -0.01265716552734375, -0.010406494140625, -0.00815582275390625, -0.0059051513671875, -0.00365447998046875, -0.00140380859375, 0.00084686279296875, 0.0030975341796875, 0.00534820556640625, 0.007598876953125, 0.00984954833984375, 0.0121002197265625, 0.01435089111328125, 0.0166015625, 0.01885223388671875, 0.0211029052734375, 0.02335357666015625, 0.025604248046875, 0.02785491943359375, 0.0301055908203125, 0.03235626220703125, 0.03460693359375, 0.03685760498046875, 0.0391082763671875, 0.04135894775390625, 0.043609619140625, 0.04586029052734375, 0.0481109619140625, 0.05036163330078125, 0.0526123046875, 0.05486297607421875, 0.0571136474609375, 0.05936431884765625, 0.061614990234375, 0.06386566162109375, 0.0661163330078125, 0.06836700439453125, 0.07061767578125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 14.0, 34.0, 35.0, 43.0, 76.0, 85.0, 131.0, 118.0, 117.0, 99.0, 75.0, 50.0, 38.0, 24.0, 19.0, 11.0, 6.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00800323486328125, -0.00777745246887207, -0.007551670074462891, -0.007325887680053711, -0.007100105285644531, -0.0068743228912353516, -0.006648540496826172, -0.006422758102416992, -0.0061969757080078125, -0.005971193313598633, -0.005745410919189453, -0.0055196285247802734, -0.005293846130371094, -0.005068063735961914, -0.004842281341552734, -0.004616498947143555, -0.004390716552734375, -0.004164934158325195, -0.003939151763916016, -0.003713369369506836, -0.0034875869750976562, -0.0032618045806884766, -0.003036022186279297, -0.002810239791870117, -0.0025844573974609375, -0.002358675003051758, -0.002132892608642578, -0.0019071102142333984, -0.0016813278198242188, -0.001455545425415039, -0.0012297630310058594, -0.0010039806365966797, -0.0007781982421875, -0.0005524158477783203, -0.0003266334533691406, -0.00010085105895996094, 0.00012493133544921875, 0.00035071372985839844, 0.0005764961242675781, 0.0008022785186767578, 0.0010280609130859375, 0.0012538433074951172, 0.0014796257019042969, 0.0017054080963134766, 0.0019311904907226562, 0.002156972885131836, 0.0023827552795410156, 0.0026085376739501953, 0.002834320068359375, 0.0030601024627685547, 0.0032858848571777344, 0.003511667251586914, 0.0037374496459960938, 0.0039632320404052734, 0.004189014434814453, 0.004414796829223633, 0.0046405792236328125, 0.004866361618041992, 0.005092144012451172, 0.0053179264068603516, 0.005543708801269531, 0.005769491195678711, 0.005995273590087891, 0.00622105598449707, 0.00644683837890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 11.0, 10.0, 14.0, 21.0, 26.0, 37.0, 51.0, 77.0, 152.0, 346.0, 1014.0, 4052.0, 26348.0, 568964.0, 420815.0, 21549.0, 3461.0, 892.0, 318.0, 142.0, 78.0, 49.0, 35.0, 23.0, 19.0, 11.0, 12.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05523681640625, -0.053452491760253906, -0.05166816711425781, -0.04988384246826172, -0.048099517822265625, -0.04631519317626953, -0.04453086853027344, -0.042746543884277344, -0.04096221923828125, -0.039177894592285156, -0.03739356994628906, -0.03560924530029297, -0.033824920654296875, -0.03204059600830078, -0.030256271362304688, -0.028471946716308594, -0.0266876220703125, -0.024903297424316406, -0.023118972778320312, -0.02133464813232422, -0.019550323486328125, -0.01776599884033203, -0.015981674194335938, -0.014197349548339844, -0.01241302490234375, -0.010628700256347656, -0.008844375610351562, -0.007060050964355469, -0.005275726318359375, -0.0034914016723632812, -0.0017070770263671875, 7.724761962890625e-05, 0.001861572265625, 0.0036458969116210938, 0.0054302215576171875, 0.007214546203613281, 0.008998870849609375, 0.010783195495605469, 0.012567520141601562, 0.014351844787597656, 0.01613616943359375, 0.017920494079589844, 0.019704818725585938, 0.02148914337158203, 0.023273468017578125, 0.02505779266357422, 0.026842117309570312, 0.028626441955566406, 0.0304107666015625, 0.032195091247558594, 0.03397941589355469, 0.03576374053955078, 0.037548065185546875, 0.03933238983154297, 0.04111671447753906, 0.042901039123535156, 0.04468536376953125, 0.046469688415527344, 0.04825401306152344, 0.05003833770751953, 0.051822662353515625, 0.05360698699951172, 0.05539131164550781, 0.057175636291503906, 0.0589599609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 7.0, 7.0, 8.0, 6.0, 17.0, 16.0, 26.0, 17.0, 26.0, 40.0, 40.0, 38.0, 62.0, 68.0, 63.0, 62.0, 64.0, 55.0, 57.0, 58.0, 62.0, 39.0, 34.0, 28.0, 26.0, 16.0, 14.0, 12.0, 11.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0184783935546875, -0.0178835391998291, -0.017288684844970703, -0.016693830490112305, -0.016098976135253906, -0.015504121780395508, -0.01490926742553711, -0.014314413070678711, -0.013719558715820312, -0.013124704360961914, -0.012529850006103516, -0.011934995651245117, -0.011340141296386719, -0.01074528694152832, -0.010150432586669922, -0.009555578231811523, -0.008960723876953125, -0.008365869522094727, -0.007771015167236328, -0.00717616081237793, -0.006581306457519531, -0.005986452102661133, -0.005391597747802734, -0.004796743392944336, -0.0042018890380859375, -0.003607034683227539, -0.0030121803283691406, -0.002417325973510742, -0.0018224716186523438, -0.0012276172637939453, -0.0006327629089355469, -3.790855407714844e-05, 0.00055694580078125, 0.0011518001556396484, 0.0017466545104980469, 0.0023415088653564453, 0.0029363632202148438, 0.003531217575073242, 0.004126071929931641, 0.004720926284790039, 0.0053157806396484375, 0.005910634994506836, 0.006505489349365234, 0.007100343704223633, 0.007695198059082031, 0.00829005241394043, 0.008884906768798828, 0.009479761123657227, 0.010074615478515625, 0.010669469833374023, 0.011264324188232422, 0.01185917854309082, 0.012454032897949219, 0.013048887252807617, 0.013643741607666016, 0.014238595962524414, 0.014833450317382812, 0.015428304672241211, 0.01602315902709961, 0.016618013381958008, 0.017212867736816406, 0.017807722091674805, 0.018402576446533203, 0.0189974308013916, 0.01959228515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 9.0, 12.0, 15.0, 11.0, 30.0, 32.0, 47.0, 92.0, 204.0, 406.0, 891.0, 2672.0, 12909.0, 722256.0, 297016.0, 8254.0, 2157.0, 773.0, 343.0, 164.0, 92.0, 54.0, 32.0, 21.0, 10.0, 16.0, 10.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.052459716796875, -0.05095624923706055, -0.049452781677246094, -0.04794931411743164, -0.04644584655761719, -0.044942378997802734, -0.04343891143798828, -0.04193544387817383, -0.040431976318359375, -0.03892850875854492, -0.03742504119873047, -0.035921573638916016, -0.03441810607910156, -0.03291463851928711, -0.031411170959472656, -0.029907703399658203, -0.02840423583984375, -0.026900768280029297, -0.025397300720214844, -0.02389383316040039, -0.022390365600585938, -0.020886898040771484, -0.01938343048095703, -0.017879962921142578, -0.016376495361328125, -0.014873027801513672, -0.013369560241699219, -0.011866092681884766, -0.010362625122070312, -0.00885915756225586, -0.007355690002441406, -0.005852222442626953, -0.0043487548828125, -0.002845287322998047, -0.0013418197631835938, 0.00016164779663085938, 0.0016651153564453125, 0.0031685829162597656, 0.004672050476074219, 0.006175518035888672, 0.007678985595703125, 0.009182453155517578, 0.010685920715332031, 0.012189388275146484, 0.013692855834960938, 0.01519632339477539, 0.016699790954589844, 0.018203258514404297, 0.01970672607421875, 0.021210193634033203, 0.022713661193847656, 0.02421712875366211, 0.025720596313476562, 0.027224063873291016, 0.02872753143310547, 0.030230998992919922, 0.031734466552734375, 0.03323793411254883, 0.03474140167236328, 0.036244869232177734, 0.03774833679199219, 0.03925180435180664, 0.040755271911621094, 0.04225873947143555, 0.04376220703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 2.0, 11.0, 12.0, 10.0, 23.0, 16.0, 32.0, 33.0, 41.0, 51.0, 89.0, 120.0, 153.0, 131.0, 87.0, 49.0, 37.0, 40.0, 17.0, 13.0, 11.0, 11.0, 8.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011807680130004883, -0.00011302437633275986, -0.00010797195136547089, -0.00010291952639818192, -9.786710143089294e-05, -9.281467646360397e-05, -8.7762251496315e-05, -8.270982652902603e-05, -7.765740156173706e-05, -7.260497659444809e-05, -6.755255162715912e-05, -6.250012665987015e-05, -5.744770169258118e-05, -5.2395276725292206e-05, -4.7342851758003235e-05, -4.2290426790714264e-05, -3.723800182342529e-05, -3.218557685613632e-05, -2.713315188884735e-05, -2.208072692155838e-05, -1.702830195426941e-05, -1.1975876986980438e-05, -6.923452019691467e-06, -1.8710270524024963e-06, 3.1813979148864746e-06, 8.233822882175446e-06, 1.3286247849464417e-05, 1.8338672816753387e-05, 2.339109778404236e-05, 2.844352275133133e-05, 3.34959477186203e-05, 3.854837268590927e-05, 4.360079765319824e-05, 4.865322262048721e-05, 5.3705647587776184e-05, 5.8758072555065155e-05, 6.381049752235413e-05, 6.88629224896431e-05, 7.391534745693207e-05, 7.896777242422104e-05, 8.402019739151001e-05, 8.907262235879898e-05, 9.412504732608795e-05, 9.917747229337692e-05, 0.0001042298972606659, 0.00010928232222795486, 0.00011433474719524384, 0.0001193871721625328, 0.00012443959712982178, 0.00012949202209711075, 0.00013454444706439972, 0.0001395968720316887, 0.00014464929699897766, 0.00014970172196626663, 0.0001547541469335556, 0.00015980657190084457, 0.00016485899686813354, 0.00016991142183542252, 0.0001749638468027115, 0.00018001627177000046, 0.00018506869673728943, 0.0001901211217045784, 0.00019517354667186737, 0.00020022597163915634, 0.0002052783966064453]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 3.0, 8.0, 17.0, 23.0, 50.0, 91.0, 217.0, 771.0, 6566.0, 801366.0, 234682.0, 3753.0, 627.0, 192.0, 79.0, 48.0, 25.0, 8.0, 9.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.057861328125, -0.05553627014160156, -0.053211212158203125, -0.05088615417480469, -0.04856109619140625, -0.04623603820800781, -0.043910980224609375, -0.04158592224121094, -0.0392608642578125, -0.03693580627441406, -0.034610748291015625, -0.03228569030761719, -0.02996063232421875, -0.027635574340820312, -0.025310516357421875, -0.022985458374023438, -0.020660400390625, -0.018335342407226562, -0.016010284423828125, -0.013685226440429688, -0.01136016845703125, -0.009035110473632812, -0.006710052490234375, -0.0043849945068359375, -0.0020599365234375, 0.0002651214599609375, 0.002590179443359375, 0.0049152374267578125, 0.00724029541015625, 0.009565353393554688, 0.011890411376953125, 0.014215469360351562, 0.01654052734375, 0.018865585327148438, 0.021190643310546875, 0.023515701293945312, 0.02584075927734375, 0.028165817260742188, 0.030490875244140625, 0.03281593322753906, 0.0351409912109375, 0.03746604919433594, 0.039791107177734375, 0.04211616516113281, 0.04444122314453125, 0.04676628112792969, 0.049091339111328125, 0.05141639709472656, 0.053741455078125, 0.05606651306152344, 0.058391571044921875, 0.06071662902832031, 0.06304168701171875, 0.06536674499511719, 0.06769180297851562, 0.07001686096191406, 0.0723419189453125, 0.07466697692871094, 0.07699203491210938, 0.07931709289550781, 0.08164215087890625, 0.08396720886230469, 0.08629226684570312, 0.08861732482910156, 0.0909423828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 2.0, 6.0, 16.0, 17.0, 32.0, 39.0, 83.0, 137.0, 173.0, 188.0, 132.0, 63.0, 30.0, 28.0, 18.0, 11.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016326904296875, -0.015503883361816406, -0.014680862426757812, -0.013857841491699219, -0.013034820556640625, -0.012211799621582031, -0.011388778686523438, -0.010565757751464844, -0.00974273681640625, -0.008919715881347656, -0.008096694946289062, -0.007273674011230469, -0.006450653076171875, -0.005627632141113281, -0.0048046112060546875, -0.003981590270996094, -0.0031585693359375, -0.0023355484008789062, -0.0015125274658203125, -0.0006895065307617188, 0.000133514404296875, 0.0009565353393554688, 0.0017795562744140625, 0.0026025772094726562, 0.00342559814453125, 0.004248619079589844, 0.0050716400146484375, 0.005894660949707031, 0.006717681884765625, 0.007540702819824219, 0.008363723754882812, 0.009186744689941406, 0.010009765625, 0.010832786560058594, 0.011655807495117188, 0.012478828430175781, 0.013301849365234375, 0.014124870300292969, 0.014947891235351562, 0.015770912170410156, 0.01659393310546875, 0.017416954040527344, 0.018239974975585938, 0.01906299591064453, 0.019886016845703125, 0.02070903778076172, 0.021532058715820312, 0.022355079650878906, 0.0231781005859375, 0.024001121520996094, 0.024824142456054688, 0.02564716339111328, 0.026470184326171875, 0.02729320526123047, 0.028116226196289062, 0.028939247131347656, 0.02976226806640625, 0.030585289001464844, 0.03140830993652344, 0.03223133087158203, 0.033054351806640625, 0.03387737274169922, 0.03470039367675781, 0.035523414611816406, 0.036346435546875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 320.0, 605.0, 59.0, 12.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6035652160644531, -1.5738805532455444, -1.5441958904266357, -1.514511227607727, -1.4848265647888184, -1.4551417827606201, -1.4254571199417114, -1.3957724571228027, -1.366087794303894, -1.3364031314849854, -1.3067184686660767, -1.277033805847168, -1.2473490238189697, -1.217664361000061, -1.1879796981811523, -1.1582950353622437, -1.128610372543335, -1.0989257097244263, -1.0692410469055176, -1.0395563840866089, -1.0098717212677002, -0.9801869988441467, -0.9505022764205933, -0.9208176136016846, -0.8911329507827759, -0.8614482879638672, -0.8317636251449585, -0.802078902721405, -0.7723942399024963, -0.7427095770835876, -0.7130248546600342, -0.6833401918411255, -0.6536555290222168, -0.6239708662033081, -0.5942862033843994, -0.564601480960846, -0.5349168181419373, -0.5052321553230286, -0.4755474627017975, -0.4458627700805664, -0.4161781072616577, -0.386493444442749, -0.35680875182151794, -0.32712405920028687, -0.2974393963813782, -0.2677547335624695, -0.2380700409412384, -0.20838536322116852, -0.17870068550109863, -0.14901600778102875, -0.11933133006095886, -0.08964665234088898, -0.05996197462081909, -0.030277296900749207, -0.0005926191806793213, 0.029092058539390564, 0.05877673625946045, 0.08846141397953033, 0.11814609169960022, 0.1478307694196701, 0.17751544713974, 0.20720012485980988, 0.23688480257987976, 0.26656949520111084, 0.29625415802001953]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 9.0, 6.0, 12.0, 14.0, 35.0, 29.0, 37.0, 44.0, 66.0, 70.0, 64.0, 77.0, 75.0, 78.0, 75.0, 62.0, 59.0, 44.0, 40.0, 27.0, 33.0, 19.0, 11.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15021491050720215, -0.14463640749454498, -0.13905788958072662, -0.13347938656806946, -0.1279008835554123, -0.12232237309217453, -0.11674386262893677, -0.1111653596162796, -0.10558684915304184, -0.10000833868980408, -0.09442983567714691, -0.08885132521390915, -0.08327281475067139, -0.07769431173801422, -0.07211580127477646, -0.0665372908115387, -0.06095878779888153, -0.05538028106093407, -0.0498017743229866, -0.04422326385974884, -0.038644757121801376, -0.03306625038385391, -0.02748773992061615, -0.021909233182668686, -0.016330726444721222, -0.010752218775451183, -0.005173711106181145, 0.0004047974944114685, 0.0059833042323589325, 0.011561810970306396, 0.01714032143354416, 0.022718828171491623, 0.028297334909439087, 0.03387584164738655, 0.039454348385334015, 0.04503285884857178, 0.05061136558651924, 0.056189872324466705, 0.06176838278770447, 0.06734688580036163, 0.0729253962635994, 0.07850390672683716, 0.08408240973949432, 0.08966092020273209, 0.09523943066596985, 0.10081793367862701, 0.10639644414186478, 0.11197495460510254, 0.1175534576177597, 0.12313196808099747, 0.12871047854423523, 0.1342889815568924, 0.13986748456954956, 0.14544600248336792, 0.15102450549602509, 0.15660300850868225, 0.1621815264225006, 0.16776002943515778, 0.17333854734897614, 0.1789170503616333, 0.18449555337429047, 0.19007405638694763, 0.195652574300766, 0.20123107731342316, 0.20680958032608032]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 6.0, 14.0, 12.0, 6.0, 9.0, 13.0, 14.0, 20.0, 19.0, 17.0, 33.0, 43.0, 50.0, 79.0, 103.0, 161.0, 310.0, 498.0, 1084.0, 3094.0, 14618.0, 235106.0, 3880559.0, 49414.0, 6590.0, 1561.0, 510.0, 179.0, 84.0, 30.0, 16.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.1549072265625, -0.1517624855041504, -0.14861774444580078, -0.14547300338745117, -0.14232826232910156, -0.13918352127075195, -0.13603878021240234, -0.13289403915405273, -0.12974929809570312, -0.12660455703735352, -0.1234598159790039, -0.1203150749206543, -0.11717033386230469, -0.11402559280395508, -0.11088085174560547, -0.10773611068725586, -0.10459136962890625, -0.10144662857055664, -0.09830188751220703, -0.09515714645385742, -0.09201240539550781, -0.0888676643371582, -0.0857229232788086, -0.08257818222045898, -0.07943344116210938, -0.07628870010375977, -0.07314395904541016, -0.06999921798706055, -0.06685447692871094, -0.06370973587036133, -0.06056499481201172, -0.05742025375366211, -0.0542755126953125, -0.05113077163696289, -0.04798603057861328, -0.04484128952026367, -0.04169654846191406, -0.03855180740356445, -0.035407066345214844, -0.032262325286865234, -0.029117584228515625, -0.025972843170166016, -0.022828102111816406, -0.019683361053466797, -0.016538619995117188, -0.013393878936767578, -0.010249137878417969, -0.007104396820068359, -0.00395965576171875, -0.0008149147033691406, 0.0023298263549804688, 0.005474567413330078, 0.008619308471679688, 0.011764049530029297, 0.014908790588378906, 0.018053531646728516, 0.021198272705078125, 0.024343013763427734, 0.027487754821777344, 0.030632495880126953, 0.03377723693847656, 0.03692197799682617, 0.04006671905517578, 0.04321146011352539, 0.046356201171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 9.0, 15.0, 22.0, 38.0, 70.0, 60.0, 115.0, 108.0, 118.0, 122.0, 100.0, 66.0, 53.0, 35.0, 27.0, 15.0, 12.0, 7.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0105438232421875, -0.010295510292053223, -0.010047197341918945, -0.009798884391784668, -0.00955057144165039, -0.009302258491516113, -0.009053945541381836, -0.008805632591247559, -0.008557319641113281, -0.008309006690979004, -0.008060693740844727, -0.007812380790710449, -0.007564067840576172, -0.0073157548904418945, -0.007067441940307617, -0.00681912899017334, -0.0065708160400390625, -0.006322503089904785, -0.006074190139770508, -0.0058258771896362305, -0.005577564239501953, -0.005329251289367676, -0.0050809383392333984, -0.004832625389099121, -0.004584312438964844, -0.004335999488830566, -0.004087686538696289, -0.0038393735885620117, -0.0035910606384277344, -0.003342747688293457, -0.0030944347381591797, -0.0028461217880249023, -0.002597808837890625, -0.0023494958877563477, -0.0021011829376220703, -0.001852869987487793, -0.0016045570373535156, -0.0013562440872192383, -0.001107931137084961, -0.0008596181869506836, -0.0006113052368164062, -0.0003629922866821289, -0.00011467933654785156, 0.00013363361358642578, 0.0003819465637207031, 0.0006302595138549805, 0.0008785724639892578, 0.0011268854141235352, 0.0013751983642578125, 0.0016235113143920898, 0.0018718242645263672, 0.0021201372146606445, 0.002368450164794922, 0.0026167631149291992, 0.0028650760650634766, 0.003113389015197754, 0.0033617019653320312, 0.0036100149154663086, 0.003858327865600586, 0.004106640815734863, 0.004354953765869141, 0.004603266716003418, 0.004851579666137695, 0.005099892616271973, 0.00534820556640625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 6.0, 9.0, 26.0, 37.0, 73.0, 164.0, 499.0, 3898.0, 4186095.0, 2940.0, 345.0, 113.0, 46.0, 22.0, 9.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83544921875, -0.8185672760009766, -0.8016853332519531, -0.7848033905029297, -0.7679214477539062, -0.7510395050048828, -0.7341575622558594, -0.7172756195068359, -0.7003936767578125, -0.6835117340087891, -0.6666297912597656, -0.6497478485107422, -0.6328659057617188, -0.6159839630126953, -0.5991020202636719, -0.5822200775146484, -0.565338134765625, -0.5484561920166016, -0.5315742492675781, -0.5146923065185547, -0.49781036376953125, -0.4809284210205078, -0.4640464782714844, -0.44716453552246094, -0.4302825927734375, -0.41340065002441406, -0.3965187072753906, -0.3796367645263672, -0.36275482177734375, -0.3458728790283203, -0.3289909362792969, -0.31210899353027344, -0.29522705078125, -0.27834510803222656, -0.2614631652832031, -0.2445812225341797, -0.22769927978515625, -0.2108173370361328, -0.19393539428710938, -0.17705345153808594, -0.1601715087890625, -0.14328956604003906, -0.12640762329101562, -0.10952568054199219, -0.09264373779296875, -0.07576179504394531, -0.058879852294921875, -0.04199790954589844, -0.025115966796875, -0.008234024047851562, 0.008647918701171875, 0.025529861450195312, 0.04241180419921875, 0.05929374694824219, 0.07617568969726562, 0.09305763244628906, 0.1099395751953125, 0.12682151794433594, 0.14370346069335938, 0.1605854034423828, 0.17746734619140625, 0.1943492889404297, 0.21123123168945312, 0.22811317443847656, 0.2449951171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 10.0, 20.0, 68.0, 365.0, 3204.0, 315.0, 61.0, 18.0, 8.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.07147216796875, -0.07018482685089111, -0.06889748573303223, -0.06761014461517334, -0.06632280349731445, -0.06503546237945557, -0.06374812126159668, -0.06246078014373779, -0.061173439025878906, -0.05988609790802002, -0.05859875679016113, -0.057311415672302246, -0.05602407455444336, -0.05473673343658447, -0.053449392318725586, -0.0521620512008667, -0.05087471008300781, -0.049587368965148926, -0.04830002784729004, -0.04701268672943115, -0.045725345611572266, -0.04443800449371338, -0.04315066337585449, -0.041863322257995605, -0.04057598114013672, -0.03928864002227783, -0.038001298904418945, -0.03671395778656006, -0.03542661666870117, -0.034139275550842285, -0.0328519344329834, -0.03156459331512451, -0.030277252197265625, -0.02898991107940674, -0.02770256996154785, -0.026415228843688965, -0.025127887725830078, -0.02384054660797119, -0.022553205490112305, -0.021265864372253418, -0.01997852325439453, -0.018691182136535645, -0.017403841018676758, -0.01611649990081787, -0.014829158782958984, -0.013541817665100098, -0.012254476547241211, -0.010967135429382324, -0.009679794311523438, -0.00839245319366455, -0.007105112075805664, -0.005817770957946777, -0.004530429840087891, -0.003243088722229004, -0.001955747604370117, -0.0006684064865112305, 0.0006189346313476562, 0.001906275749206543, 0.0031936168670654297, 0.004480957984924316, 0.005768299102783203, 0.00705564022064209, 0.008342981338500977, 0.009630322456359863, 0.01091766357421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 19.0, 23.0, 49.0, 129.0, 340.0, 266.0, 91.0, 29.0, 15.0, 9.0, 8.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.3429376482963562, -0.3360814154148102, -0.32922518253326416, -0.32236894965171814, -0.3155127167701721, -0.3086565136909485, -0.30180028080940247, -0.29494404792785645, -0.2880878150463104, -0.2812315821647644, -0.2743753492832184, -0.26751911640167236, -0.26066291332244873, -0.2538066804409027, -0.2469504475593567, -0.24009421467781067, -0.23323798179626465, -0.22638174891471863, -0.2195255160331726, -0.21266929805278778, -0.20581306517124176, -0.19895683228969574, -0.1921006143093109, -0.1852443814277649, -0.17838814854621887, -0.17153191566467285, -0.16467568278312683, -0.157819464802742, -0.15096323192119598, -0.14410699903964996, -0.13725078105926514, -0.13039454817771912, -0.1235383003950119, -0.11668206751346588, -0.10982584208250046, -0.10296961665153503, -0.09611338376998901, -0.089257150888443, -0.08240092545747757, -0.07554470002651215, -0.06868846714496613, -0.0618322379887104, -0.05497600883245468, -0.04811977967619896, -0.04126355051994324, -0.034407321363687515, -0.027551092207431793, -0.02069486305117607, -0.013838633894920349, -0.006982404738664627, -0.00012617558240890503, 0.006730053573846817, 0.013586282730102539, 0.02044251188635826, 0.027298741042613983, 0.034154970198869705, 0.04101119935512543, 0.04786742851138115, 0.05472365766763687, 0.06157988682389259, 0.06843611598014832, 0.07529234886169434, 0.08214857429265976, 0.08900479972362518, 0.0958610326051712]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 13.0, 10.0, 25.0, 25.0, 32.0, 58.0, 83.0, 82.0, 110.0, 104.0, 126.0, 78.0, 85.0, 55.0, 36.0, 35.0, 18.0, 18.0, 10.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16021275520324707, -0.15531077980995178, -0.1504087895154953, -0.1455068141222, -0.14060482382774353, -0.13570284843444824, -0.13080085813999176, -0.12589888274669647, -0.12099689990282059, -0.1160949170589447, -0.11119293421506882, -0.10629095137119293, -0.10138897597789764, -0.09648698568344116, -0.09158501029014587, -0.08668302744626999, -0.0817810446023941, -0.07687906175851822, -0.07197707891464233, -0.06707509607076645, -0.06217311695218086, -0.05727113410830498, -0.05236915498971939, -0.047467172145843506, -0.04256518930196762, -0.037663206458091736, -0.03276122361421585, -0.027859244495630264, -0.02295726165175438, -0.018055278807878494, -0.013153297826647758, -0.008251316845417023, -0.0033493340015411377, 0.0015526479110121727, 0.006454629823565483, 0.011356611736118793, 0.016258593648672104, 0.02116057649254799, 0.026062557473778725, 0.03096453845500946, 0.035866521298885345, 0.04076850414276123, 0.045670486986637115, 0.0505724661052227, 0.05547444894909859, 0.06037643179297447, 0.06527841091156006, 0.07018039375543594, 0.07508237659931183, 0.07998435944318771, 0.0848863422870636, 0.08978832513093948, 0.09469030797481537, 0.09959228336811066, 0.10449426621198654, 0.10939624905586243, 0.11429823189973831, 0.1192002147436142, 0.12410219758749008, 0.12900418043136597, 0.13390615582466125, 0.13880814611911774, 0.14371012151241302, 0.1486121118068695, 0.1535140872001648]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 6.0, 2.0, 10.0, 14.0, 21.0, 11.0, 30.0, 36.0, 41.0, 86.0, 95.0, 149.0, 233.0, 355.0, 626.0, 1446.0, 4431.0, 19117.0, 130379.0, 752462.0, 114377.0, 17479.0, 4067.0, 1291.0, 666.0, 340.0, 258.0, 163.0, 101.0, 79.0, 58.0, 35.0, 24.0, 25.0, 12.0, 11.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.087158203125, -0.08483219146728516, -0.08250617980957031, -0.08018016815185547, -0.07785415649414062, -0.07552814483642578, -0.07320213317871094, -0.0708761215209961, -0.06855010986328125, -0.0662240982055664, -0.06389808654785156, -0.06157207489013672, -0.059246063232421875, -0.05692005157470703, -0.05459403991699219, -0.052268028259277344, -0.0499420166015625, -0.047616004943847656, -0.04528999328613281, -0.04296398162841797, -0.040637969970703125, -0.03831195831298828, -0.03598594665527344, -0.033659934997558594, -0.03133392333984375, -0.029007911682128906, -0.026681900024414062, -0.02435588836669922, -0.022029876708984375, -0.01970386505126953, -0.017377853393554688, -0.015051841735839844, -0.012725830078125, -0.010399818420410156, -0.008073806762695312, -0.005747795104980469, -0.003421783447265625, -0.0010957717895507812, 0.0012302398681640625, 0.0035562515258789062, 0.00588226318359375, 0.008208274841308594, 0.010534286499023438, 0.012860298156738281, 0.015186309814453125, 0.01751232147216797, 0.019838333129882812, 0.022164344787597656, 0.0244903564453125, 0.026816368103027344, 0.029142379760742188, 0.03146839141845703, 0.033794403076171875, 0.03612041473388672, 0.03844642639160156, 0.040772438049316406, 0.04309844970703125, 0.045424461364746094, 0.04775047302246094, 0.05007648468017578, 0.052402496337890625, 0.05472850799560547, 0.05705451965332031, 0.059380531311035156, 0.06170654296875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 10.0, 12.0, 24.0, 38.0, 44.0, 83.0, 79.0, 106.0, 112.0, 94.0, 108.0, 86.0, 69.0, 51.0, 32.0, 18.0, 9.0, 9.0, 4.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013153076171875, -0.012775421142578125, -0.01239776611328125, -0.012020111083984375, -0.0116424560546875, -0.011264801025390625, -0.01088714599609375, -0.010509490966796875, -0.0101318359375, -0.009754180908203125, -0.00937652587890625, -0.008998870849609375, -0.0086212158203125, -0.008243560791015625, -0.00786590576171875, -0.007488250732421875, -0.007110595703125, -0.006732940673828125, -0.00635528564453125, -0.005977630615234375, -0.0055999755859375, -0.005222320556640625, -0.00484466552734375, -0.004467010498046875, -0.00408935546875, -0.003711700439453125, -0.00333404541015625, -0.002956390380859375, -0.0025787353515625, -0.002201080322265625, -0.00182342529296875, -0.001445770263671875, -0.001068115234375, -0.000690460205078125, -0.00031280517578125, 6.4849853515625e-05, 0.0004425048828125, 0.000820159912109375, 0.00119781494140625, 0.001575469970703125, 0.001953125, 0.002330780029296875, 0.00270843505859375, 0.003086090087890625, 0.0034637451171875, 0.003841400146484375, 0.00421905517578125, 0.004596710205078125, 0.004974365234375, 0.005352020263671875, 0.00572967529296875, 0.006107330322265625, 0.0064849853515625, 0.006862640380859375, 0.00724029541015625, 0.007617950439453125, 0.00799560546875, 0.008373260498046875, 0.00875091552734375, 0.009128570556640625, 0.0095062255859375, 0.009883880615234375, 0.01026153564453125, 0.010639190673828125, 0.011016845703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 11.0, 9.0, 13.0, 20.0, 37.0, 48.0, 96.0, 179.0, 312.0, 634.0, 1609.0, 4259.0, 14562.0, 67359.0, 593688.0, 309783.0, 40539.0, 9934.0, 3107.0, 1188.0, 522.0, 250.0, 148.0, 77.0, 47.0, 39.0, 21.0, 11.0, 9.0, 10.0, 5.0, 5.0, 2.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04681396484375, -0.04524564743041992, -0.043677330017089844, -0.042109012603759766, -0.04054069519042969, -0.03897237777709961, -0.03740406036376953, -0.03583574295043945, -0.034267425537109375, -0.0326991081237793, -0.03113079071044922, -0.02956247329711914, -0.027994155883789062, -0.026425838470458984, -0.024857521057128906, -0.023289203643798828, -0.02172088623046875, -0.020152568817138672, -0.018584251403808594, -0.017015933990478516, -0.015447616577148438, -0.01387929916381836, -0.012310981750488281, -0.010742664337158203, -0.009174346923828125, -0.007606029510498047, -0.006037712097167969, -0.004469394683837891, -0.0029010772705078125, -0.0013327598571777344, 0.00023555755615234375, 0.0018038749694824219, 0.0033721923828125, 0.004940509796142578, 0.006508827209472656, 0.008077144622802734, 0.009645462036132812, 0.01121377944946289, 0.012782096862792969, 0.014350414276123047, 0.015918731689453125, 0.017487049102783203, 0.01905536651611328, 0.02062368392944336, 0.022192001342773438, 0.023760318756103516, 0.025328636169433594, 0.026896953582763672, 0.02846527099609375, 0.030033588409423828, 0.031601905822753906, 0.033170223236083984, 0.03473854064941406, 0.03630685806274414, 0.03787517547607422, 0.0394434928894043, 0.041011810302734375, 0.04258012771606445, 0.04414844512939453, 0.04571676254272461, 0.04728507995605469, 0.048853397369384766, 0.050421714782714844, 0.05199003219604492, 0.053558349609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 10.0, 8.0, 13.0, 12.0, 18.0, 25.0, 31.0, 31.0, 40.0, 48.0, 44.0, 66.0, 51.0, 59.0, 67.0, 83.0, 61.0, 50.0, 44.0, 49.0, 34.0, 28.0, 26.0, 26.0, 17.0, 8.0, 11.0, 7.0, 8.0, 5.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0284423828125, -0.027497291564941406, -0.026552200317382812, -0.02560710906982422, -0.024662017822265625, -0.02371692657470703, -0.022771835327148438, -0.021826744079589844, -0.02088165283203125, -0.019936561584472656, -0.018991470336914062, -0.01804637908935547, -0.017101287841796875, -0.01615619659423828, -0.015211105346679688, -0.014266014099121094, -0.0133209228515625, -0.012375831604003906, -0.011430740356445312, -0.010485649108886719, -0.009540557861328125, -0.008595466613769531, -0.0076503753662109375, -0.006705284118652344, -0.00576019287109375, -0.004815101623535156, -0.0038700103759765625, -0.0029249191284179688, -0.001979827880859375, -0.0010347366333007812, -8.96453857421875e-05, 0.0008554458618164062, 0.001800537109375, 0.0027456283569335938, 0.0036907196044921875, 0.004635810852050781, 0.005580902099609375, 0.006525993347167969, 0.0074710845947265625, 0.008416175842285156, 0.00936126708984375, 0.010306358337402344, 0.011251449584960938, 0.012196540832519531, 0.013141632080078125, 0.014086723327636719, 0.015031814575195312, 0.015976905822753906, 0.0169219970703125, 0.017867088317871094, 0.018812179565429688, 0.01975727081298828, 0.020702362060546875, 0.02164745330810547, 0.022592544555664062, 0.023537635803222656, 0.02448272705078125, 0.025427818298339844, 0.026372909545898438, 0.02731800079345703, 0.028263092041015625, 0.02920818328857422, 0.030153274536132812, 0.031098365783691406, 0.03204345703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 5.0, 6.0, 13.0, 15.0, 16.0, 21.0, 31.0, 30.0, 48.0, 58.0, 74.0, 125.0, 213.0, 510.0, 1619.0, 6545.0, 83742.0, 896115.0, 51644.0, 5318.0, 1338.0, 431.0, 200.0, 117.0, 73.0, 52.0, 46.0, 26.0, 24.0, 18.0, 19.0, 17.0, 8.0, 11.0, 11.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.037078857421875, -0.03603243827819824, -0.034986019134521484, -0.03393959999084473, -0.03289318084716797, -0.03184676170349121, -0.030800342559814453, -0.029753923416137695, -0.028707504272460938, -0.02766108512878418, -0.026614665985107422, -0.025568246841430664, -0.024521827697753906, -0.02347540855407715, -0.02242898941040039, -0.021382570266723633, -0.020336151123046875, -0.019289731979370117, -0.01824331283569336, -0.0171968936920166, -0.016150474548339844, -0.015104055404663086, -0.014057636260986328, -0.01301121711730957, -0.011964797973632812, -0.010918378829956055, -0.009871959686279297, -0.008825540542602539, -0.007779121398925781, -0.0067327022552490234, -0.005686283111572266, -0.004639863967895508, -0.00359344482421875, -0.002547025680541992, -0.0015006065368652344, -0.00045418739318847656, 0.0005922317504882812, 0.001638650894165039, 0.002685070037841797, 0.0037314891815185547, 0.0047779083251953125, 0.00582432746887207, 0.006870746612548828, 0.007917165756225586, 0.008963584899902344, 0.010010004043579102, 0.01105642318725586, 0.012102842330932617, 0.013149261474609375, 0.014195680618286133, 0.01524209976196289, 0.01628851890563965, 0.017334938049316406, 0.018381357192993164, 0.019427776336669922, 0.02047419548034668, 0.021520614624023438, 0.022567033767700195, 0.023613452911376953, 0.02465987205505371, 0.02570629119873047, 0.026752710342407227, 0.027799129486083984, 0.028845548629760742, 0.0298919677734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 10.0, 10.0, 13.0, 28.0, 29.0, 32.0, 55.0, 65.0, 97.0, 99.0, 102.0, 106.0, 100.0, 70.0, 42.0, 51.0, 22.0, 17.0, 17.0, 10.0, 12.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001189112663269043, -0.0001155780628323555, -0.0001122448593378067, -0.0001089116558432579, -0.0001055784523487091, -0.00010224524885416031, -9.891204535961151e-05, -9.557884186506271e-05, -9.224563837051392e-05, -8.891243487596512e-05, -8.557923138141632e-05, -8.224602788686752e-05, -7.891282439231873e-05, -7.557962089776993e-05, -7.224641740322113e-05, -6.891321390867233e-05, -6.558001041412354e-05, -6.224680691957474e-05, -5.891360342502594e-05, -5.558039993047714e-05, -5.2247196435928345e-05, -4.891399294137955e-05, -4.558078944683075e-05, -4.224758595228195e-05, -3.8914382457733154e-05, -3.558117896318436e-05, -3.224797546863556e-05, -2.891477197408676e-05, -2.5581568479537964e-05, -2.2248364984989166e-05, -1.891516149044037e-05, -1.558195799589157e-05, -1.2248754501342773e-05, -8.915551006793976e-06, -5.582347512245178e-06, -2.2491440176963806e-06, 1.084059476852417e-06, 4.417262971401215e-06, 7.750466465950012e-06, 1.108366996049881e-05, 1.4416873455047607e-05, 1.7750076949596405e-05, 2.1083280444145203e-05, 2.4416483938694e-05, 2.7749687433242798e-05, 3.1082890927791595e-05, 3.441609442234039e-05, 3.774929791688919e-05, 4.108250141143799e-05, 4.4415704905986786e-05, 4.7748908400535583e-05, 5.108211189508438e-05, 5.441531538963318e-05, 5.7748518884181976e-05, 6.108172237873077e-05, 6.441492587327957e-05, 6.774812936782837e-05, 7.108133286237717e-05, 7.441453635692596e-05, 7.774773985147476e-05, 8.108094334602356e-05, 8.441414684057236e-05, 8.774735033512115e-05, 9.108055382966995e-05, 9.441375732421875e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 6.0, 9.0, 17.0, 37.0, 84.0, 150.0, 507.0, 2133.0, 21395.0, 809818.0, 205762.0, 7039.0, 1059.0, 292.0, 107.0, 44.0, 25.0, 13.0, 11.0, 11.0, 6.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032257080078125, -0.03105306625366211, -0.02984905242919922, -0.028645038604736328, -0.027441024780273438, -0.026237010955810547, -0.025032997131347656, -0.023828983306884766, -0.022624969482421875, -0.021420955657958984, -0.020216941833496094, -0.019012928009033203, -0.017808914184570312, -0.016604900360107422, -0.015400886535644531, -0.01419687271118164, -0.01299285888671875, -0.01178884506225586, -0.010584831237792969, -0.009380817413330078, -0.008176803588867188, -0.006972789764404297, -0.005768775939941406, -0.004564762115478516, -0.003360748291015625, -0.0021567344665527344, -0.0009527206420898438, 0.0002512931823730469, 0.0014553070068359375, 0.002659320831298828, 0.0038633346557617188, 0.005067348480224609, 0.0062713623046875, 0.007475376129150391, 0.008679389953613281, 0.009883403778076172, 0.011087417602539062, 0.012291431427001953, 0.013495445251464844, 0.014699459075927734, 0.015903472900390625, 0.017107486724853516, 0.018311500549316406, 0.019515514373779297, 0.020719528198242188, 0.021923542022705078, 0.02312755584716797, 0.02433156967163086, 0.02553558349609375, 0.02673959732055664, 0.02794361114501953, 0.029147624969482422, 0.030351638793945312, 0.0315556526184082, 0.032759666442871094, 0.033963680267333984, 0.035167694091796875, 0.036371707916259766, 0.037575721740722656, 0.03877973556518555, 0.03998374938964844, 0.04118776321411133, 0.04239177703857422, 0.04359579086303711, 0.0447998046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 4.0, 12.0, 14.0, 20.0, 43.0, 70.0, 124.0, 155.0, 155.0, 147.0, 100.0, 52.0, 33.0, 15.0, 9.0, 10.0, 3.0, 7.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0177764892578125, -0.017098665237426758, -0.016420841217041016, -0.015743017196655273, -0.015065193176269531, -0.014387369155883789, -0.013709545135498047, -0.013031721115112305, -0.012353897094726562, -0.01167607307434082, -0.010998249053955078, -0.010320425033569336, -0.009642601013183594, -0.008964776992797852, -0.00828695297241211, -0.007609128952026367, -0.006931304931640625, -0.006253480911254883, -0.005575656890869141, -0.0048978328704833984, -0.004220008850097656, -0.003542184829711914, -0.002864360809326172, -0.0021865367889404297, -0.0015087127685546875, -0.0008308887481689453, -0.00015306472778320312, 0.0005247592926025391, 0.0012025833129882812, 0.0018804073333740234, 0.0025582313537597656, 0.003236055374145508, 0.00391387939453125, 0.004591703414916992, 0.005269527435302734, 0.0059473514556884766, 0.006625175476074219, 0.007302999496459961, 0.007980823516845703, 0.008658647537231445, 0.009336471557617188, 0.01001429557800293, 0.010692119598388672, 0.011369943618774414, 0.012047767639160156, 0.012725591659545898, 0.01340341567993164, 0.014081239700317383, 0.014759063720703125, 0.015436887741088867, 0.01611471176147461, 0.01679253578186035, 0.017470359802246094, 0.018148183822631836, 0.018826007843017578, 0.01950383186340332, 0.020181655883789062, 0.020859479904174805, 0.021537303924560547, 0.02221512794494629, 0.02289295196533203, 0.023570775985717773, 0.024248600006103516, 0.024926424026489258, 0.025604248046875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 5.0, 24.0, 56.0, 261.0, 470.0, 146.0, 41.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9824375510215759, -0.9636198878288269, -0.9448022246360779, -0.9259845614433289, -0.9071669578552246, -0.8883492946624756, -0.8695316314697266, -0.8507139682769775, -0.8318963050842285, -0.8130786418914795, -0.7942609786987305, -0.7754433155059814, -0.7566256523132324, -0.7378080487251282, -0.7189903855323792, -0.7001727223396301, -0.6813550591468811, -0.6625373959541321, -0.6437197327613831, -0.624902069568634, -0.6060844659805298, -0.5872668027877808, -0.5684491395950317, -0.5496314764022827, -0.5308138132095337, -0.5119961500167847, -0.49317848682403564, -0.474360853433609, -0.45554319024086, -0.43672552704811096, -0.4179078936576843, -0.3990902304649353, -0.3802725672721863, -0.36145490407943726, -0.34263724088668823, -0.3238196074962616, -0.3050019443035126, -0.28618428111076355, -0.2673666477203369, -0.2485489845275879, -0.22973130643367767, -0.21091365814208984, -0.19209599494934082, -0.1732783317565918, -0.15446068346500397, -0.13564303517341614, -0.11682537198066711, -0.09800772368907928, -0.07919006049633026, -0.060372404754161835, -0.04155474901199341, -0.02273709326982498, -0.003919437527656555, 0.014898218214511871, 0.0337158739566803, 0.05253352224826813, 0.07135118544101715, 0.09016884118318558, 0.108986496925354, 0.12780416011810303, 0.14662180840969086, 0.1654394567012787, 0.1842571198940277, 0.20307476818561554, 0.22189243137836456]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 8.0, 9.0, 15.0, 19.0, 22.0, 24.0, 32.0, 36.0, 49.0, 59.0, 56.0, 55.0, 77.0, 69.0, 56.0, 75.0, 55.0, 46.0, 37.0, 41.0, 39.0, 27.0, 22.0, 14.0, 16.0, 11.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20135772228240967, -0.19570404291152954, -0.19005036354064941, -0.1843966841697693, -0.17874300479888916, -0.17308932542800903, -0.1674356460571289, -0.16178196668624878, -0.15612828731536865, -0.15047460794448853, -0.1448209285736084, -0.13916724920272827, -0.13351356983184814, -0.12785989046096802, -0.12220621109008789, -0.11655253171920776, -0.11089885234832764, -0.10524517297744751, -0.09959149360656738, -0.09393781423568726, -0.08828413486480713, -0.082630455493927, -0.07697677612304688, -0.07132309675216675, -0.06566941738128662, -0.060015738010406494, -0.05436205863952637, -0.04870837926864624, -0.04305469989776611, -0.037401020526885986, -0.03174734115600586, -0.026093661785125732, -0.020439982414245605, -0.014786303043365479, -0.009132623672485352, -0.0034789443016052246, 0.0021747350692749023, 0.00782841444015503, 0.013482093811035156, 0.019135773181915283, 0.02478945255279541, 0.030443131923675537, 0.036096811294555664, 0.04175049066543579, 0.04740417003631592, 0.053057849407196045, 0.05871152877807617, 0.0643652081489563, 0.07001888751983643, 0.07567256689071655, 0.08132624626159668, 0.0869799256324768, 0.09263360500335693, 0.09828728437423706, 0.10394096374511719, 0.10959464311599731, 0.11524832248687744, 0.12090200185775757, 0.1265556812286377, 0.13220936059951782, 0.13786303997039795, 0.14351671934127808, 0.1491703987121582, 0.15482407808303833, 0.16047775745391846]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 1.0, 12.0, 11.0, 12.0, 34.0, 43.0, 71.0, 105.0, 191.0, 363.0, 665.0, 1816.0, 8148.0, 175702.0, 3970799.0, 31349.0, 3541.0, 839.0, 303.0, 133.0, 67.0, 26.0, 15.0, 9.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1671142578125, -0.16333961486816406, -0.15956497192382812, -0.1557903289794922, -0.15201568603515625, -0.1482410430908203, -0.14446640014648438, -0.14069175720214844, -0.1369171142578125, -0.13314247131347656, -0.12936782836914062, -0.1255931854248047, -0.12181854248046875, -0.11804389953613281, -0.11426925659179688, -0.11049461364746094, -0.106719970703125, -0.10294532775878906, -0.09917068481445312, -0.09539604187011719, -0.09162139892578125, -0.08784675598144531, -0.08407211303710938, -0.08029747009277344, -0.0765228271484375, -0.07274818420410156, -0.06897354125976562, -0.06519889831542969, -0.06142425537109375, -0.05764961242675781, -0.053874969482421875, -0.05010032653808594, -0.04632568359375, -0.04255104064941406, -0.038776397705078125, -0.03500175476074219, -0.03122711181640625, -0.027452468872070312, -0.023677825927734375, -0.019903182983398438, -0.0161285400390625, -0.012353897094726562, -0.008579254150390625, -0.0048046112060546875, -0.00102996826171875, 0.0027446746826171875, 0.006519317626953125, 0.010293960571289062, 0.014068603515625, 0.017843246459960938, 0.021617889404296875, 0.025392532348632812, 0.02916717529296875, 0.03294181823730469, 0.036716461181640625, 0.04049110412597656, 0.0442657470703125, 0.04804039001464844, 0.051815032958984375, 0.05558967590332031, 0.05936431884765625, 0.06313896179199219, 0.06691360473632812, 0.07068824768066406, 0.074462890625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 8.0, 11.0, 14.0, 24.0, 35.0, 53.0, 57.0, 79.0, 63.0, 84.0, 90.0, 99.0, 70.0, 72.0, 57.0, 49.0, 46.0, 27.0, 20.0, 14.0, 7.0, 3.0, 6.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0124359130859375, -0.012122154235839844, -0.011808395385742188, -0.011494636535644531, -0.011180877685546875, -0.010867118835449219, -0.010553359985351562, -0.010239601135253906, -0.00992584228515625, -0.009612083435058594, -0.009298324584960938, -0.008984565734863281, -0.008670806884765625, -0.008357048034667969, -0.008043289184570312, -0.007729530334472656, -0.007415771484375, -0.007102012634277344, -0.0067882537841796875, -0.006474494934082031, -0.006160736083984375, -0.005846977233886719, -0.0055332183837890625, -0.005219459533691406, -0.00490570068359375, -0.004591941833496094, -0.0042781829833984375, -0.003964424133300781, -0.003650665283203125, -0.0033369064331054688, -0.0030231475830078125, -0.0027093887329101562, -0.0023956298828125, -0.0020818710327148438, -0.0017681121826171875, -0.0014543533325195312, -0.001140594482421875, -0.0008268356323242188, -0.0005130767822265625, -0.00019931793212890625, 0.00011444091796875, 0.00042819976806640625, 0.0007419586181640625, 0.0010557174682617188, 0.001369476318359375, 0.0016832351684570312, 0.0019969940185546875, 0.0023107528686523438, 0.00262451171875, 0.0029382705688476562, 0.0032520294189453125, 0.0035657882690429688, 0.003879547119140625, 0.004193305969238281, 0.0045070648193359375, 0.004820823669433594, 0.00513458251953125, 0.005448341369628906, 0.0057621002197265625, 0.006075859069824219, 0.006389617919921875, 0.006703376770019531, 0.0070171356201171875, 0.007330894470214844, 0.0076446533203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 13.0, 13.0, 20.0, 32.0, 36.0, 50.0, 74.0, 118.0, 237.0, 694.0, 4162881.0, 29111.0, 427.0, 203.0, 90.0, 60.0, 55.0, 29.0, 26.0, 17.0, 24.0, 25.0, 13.0, 7.0, 9.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264892578125, -0.2515449523925781, -0.23819732666015625, -0.22484970092773438, -0.2115020751953125, -0.19815444946289062, -0.18480682373046875, -0.17145919799804688, -0.158111572265625, -0.14476394653320312, -0.13141632080078125, -0.11806869506835938, -0.1047210693359375, -0.09137344360351562, -0.07802581787109375, -0.06467819213867188, -0.05133056640625, -0.037982940673828125, -0.02463531494140625, -0.011287689208984375, 0.0020599365234375, 0.015407562255859375, 0.02875518798828125, 0.042102813720703125, 0.055450439453125, 0.06879806518554688, 0.08214569091796875, 0.09549331665039062, 0.1088409423828125, 0.12218856811523438, 0.13553619384765625, 0.14888381958007812, 0.1622314453125, 0.17557907104492188, 0.18892669677734375, 0.20227432250976562, 0.2156219482421875, 0.22896957397460938, 0.24231719970703125, 0.2556648254394531, 0.269012451171875, 0.2823600769042969, 0.29570770263671875, 0.3090553283691406, 0.3224029541015625, 0.3357505798339844, 0.34909820556640625, 0.3624458312988281, 0.37579345703125, 0.3891410827636719, 0.40248870849609375, 0.4158363342285156, 0.4291839599609375, 0.4425315856933594, 0.45587921142578125, 0.4692268371582031, 0.482574462890625, 0.4959220886230469, 0.5092697143554688, 0.5226173400878906, 0.5359649658203125, 0.5493125915527344, 0.5626602172851562, 0.5760078430175781, 0.58935546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 13.0, 87.0, 3347.0, 603.0, 33.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04315185546875, -0.04085540771484375, -0.0385589599609375, -0.03626251220703125, -0.033966064453125, -0.03166961669921875, -0.0293731689453125, -0.02707672119140625, -0.0247802734375, -0.02248382568359375, -0.0201873779296875, -0.01789093017578125, -0.015594482421875, -0.01329803466796875, -0.0110015869140625, -0.00870513916015625, -0.00640869140625, -0.00411224365234375, -0.0018157958984375, 0.00048065185546875, 0.002777099609375, 0.00507354736328125, 0.0073699951171875, 0.00966644287109375, 0.011962890625, 0.01425933837890625, 0.0165557861328125, 0.01885223388671875, 0.021148681640625, 0.02344512939453125, 0.0257415771484375, 0.02803802490234375, 0.03033447265625, 0.03263092041015625, 0.0349273681640625, 0.03722381591796875, 0.039520263671875, 0.04181671142578125, 0.0441131591796875, 0.04640960693359375, 0.0487060546875, 0.05100250244140625, 0.0532989501953125, 0.05559539794921875, 0.057891845703125, 0.06018829345703125, 0.0624847412109375, 0.06478118896484375, 0.06707763671875, 0.06937408447265625, 0.0716705322265625, 0.07396697998046875, 0.076263427734375, 0.07855987548828125, 0.0808563232421875, 0.08315277099609375, 0.08544921875, 0.08774566650390625, 0.0900421142578125, 0.09233856201171875, 0.094635009765625, 0.09693145751953125, 0.0992279052734375, 0.10152435302734375, 0.10382080078125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 64.0, 740.0, 184.0, 12.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5950915813446045, -0.5774247050285339, -0.5597577691078186, -0.542090892791748, -0.5244239568710327, -0.5067570805549622, -0.4890902042388916, -0.47142329812049866, -0.4537563920021057, -0.43608948588371277, -0.4184225797653198, -0.40075570344924927, -0.3830887973308563, -0.3654218912124634, -0.3477550148963928, -0.3300881087779999, -0.31242120265960693, -0.294754296541214, -0.27708739042282104, -0.2594205141067505, -0.24175360798835754, -0.2240867018699646, -0.20641981065273285, -0.1887529194355011, -0.17108601331710815, -0.1534191071987152, -0.13575221598148346, -0.11808531731367111, -0.10041841864585876, -0.08275151997804642, -0.06508462131023407, -0.04741772264242172, -0.029750823974609375, -0.012083925306797028, 0.00558297336101532, 0.023249872028827667, 0.040916770696640015, 0.05858366936445236, 0.07625056803226471, 0.09391746670007706, 0.1115843653678894, 0.12925127148628235, 0.1469181627035141, 0.16458505392074585, 0.1822519600391388, 0.19991886615753174, 0.2175857573747635, 0.23525264859199524, 0.2529195547103882, 0.27058646082878113, 0.2882533669471741, 0.30592024326324463, 0.3235871493816376, 0.3412540555000305, 0.3589209318161011, 0.376587837934494, 0.39425474405288696, 0.4119216501712799, 0.42958855628967285, 0.4472554326057434, 0.46492233872413635, 0.4825892448425293, 0.5002561211585999, 0.5179230570793152, 0.5355899333953857]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 15.0, 33.0, 62.0, 86.0, 140.0, 155.0, 150.0, 125.0, 103.0, 59.0, 40.0, 18.0, 8.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.18072974681854248, -0.17625586688518524, -0.171781986951828, -0.16730810701847076, -0.16283422708511353, -0.1583603471517563, -0.15388646721839905, -0.14941257238388062, -0.14493870735168457, -0.14046482741832733, -0.1359909474849701, -0.13151706755161285, -0.12704318761825562, -0.12256930768489838, -0.11809542030096054, -0.1136215403676033, -0.10914765298366547, -0.10467377305030823, -0.10019989311695099, -0.09572601318359375, -0.09125213325023651, -0.08677825331687927, -0.08230436593294144, -0.0778304859995842, -0.07335660606622696, -0.06888272613286972, -0.06440884619951248, -0.059934962540864944, -0.055461082607507706, -0.05098720267415047, -0.04651331901550293, -0.04203943908214569, -0.03756555914878845, -0.03309167921543121, -0.028617797419428825, -0.024143915623426437, -0.0196700356900692, -0.01519615575671196, -0.010722273960709572, -0.006248392164707184, -0.001774512231349945, 0.0026993686333298683, 0.007173249498009682, 0.011647130362689495, 0.01612101122736931, 0.020594891160726547, 0.025068772956728935, 0.029542654752731323, 0.03401653468608856, 0.0384904146194458, 0.04296429455280304, 0.04743817821145058, 0.051912058144807816, 0.056385938078165054, 0.06085982173681259, 0.06533370167016983, 0.06980758160352707, 0.07428146153688431, 0.07875534147024155, 0.08322922140359879, 0.08770310878753662, 0.09217698872089386, 0.0966508686542511, 0.10112474858760834, 0.10559862852096558]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 9.0, 7.0, 8.0, 15.0, 23.0, 25.0, 41.0, 50.0, 81.0, 104.0, 148.0, 240.0, 361.0, 625.0, 1184.0, 2506.0, 6938.0, 21447.0, 83780.0, 471233.0, 366427.0, 65177.0, 17411.0, 5750.0, 2225.0, 1046.0, 573.0, 359.0, 230.0, 136.0, 102.0, 73.0, 62.0, 36.0, 33.0, 33.0, 16.0, 10.0, 10.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.037506103515625, -0.0362091064453125, -0.034912109375, -0.0336151123046875, -0.032318115234375, -0.0310211181640625, -0.02972412109375, -0.0284271240234375, -0.027130126953125, -0.0258331298828125, -0.0245361328125, -0.0232391357421875, -0.021942138671875, -0.0206451416015625, -0.01934814453125, -0.0180511474609375, -0.016754150390625, -0.0154571533203125, -0.01416015625, -0.0128631591796875, -0.011566162109375, -0.0102691650390625, -0.00897216796875, -0.0076751708984375, -0.006378173828125, -0.0050811767578125, -0.0037841796875, -0.0024871826171875, -0.001190185546875, 0.0001068115234375, 0.00140380859375, 0.0027008056640625, 0.003997802734375, 0.0052947998046875, 0.006591796875, 0.0078887939453125, 0.009185791015625, 0.0104827880859375, 0.01177978515625, 0.0130767822265625, 0.014373779296875, 0.0156707763671875, 0.0169677734375, 0.0182647705078125, 0.019561767578125, 0.0208587646484375, 0.02215576171875, 0.0234527587890625, 0.024749755859375, 0.0260467529296875, 0.02734375, 0.0286407470703125, 0.029937744140625, 0.0312347412109375, 0.03253173828125, 0.0338287353515625, 0.035125732421875, 0.0364227294921875, 0.0377197265625, 0.0390167236328125, 0.040313720703125, 0.0416107177734375, 0.04290771484375, 0.0442047119140625, 0.045501708984375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 10.0, 10.0, 15.0, 27.0, 49.0, 40.0, 62.0, 62.0, 74.0, 81.0, 96.0, 97.0, 72.0, 68.0, 53.0, 48.0, 32.0, 37.0, 20.0, 18.0, 11.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01052093505859375, -0.010216593742370605, -0.009912252426147461, -0.009607911109924316, -0.009303569793701172, -0.008999228477478027, -0.008694887161254883, -0.008390545845031738, -0.008086204528808594, -0.007781863212585449, -0.007477521896362305, -0.00717318058013916, -0.006868839263916016, -0.006564497947692871, -0.0062601566314697266, -0.005955815315246582, -0.0056514739990234375, -0.005347132682800293, -0.0050427913665771484, -0.004738450050354004, -0.004434108734130859, -0.004129767417907715, -0.0038254261016845703, -0.0035210847854614258, -0.0032167434692382812, -0.0029124021530151367, -0.002608060836791992, -0.0023037195205688477, -0.001999378204345703, -0.0016950368881225586, -0.001390695571899414, -0.0010863542556762695, -0.000782012939453125, -0.00047767162322998047, -0.00017333030700683594, 0.0001310110092163086, 0.0004353523254394531, 0.0007396936416625977, 0.0010440349578857422, 0.0013483762741088867, 0.0016527175903320312, 0.0019570589065551758, 0.0022614002227783203, 0.002565741539001465, 0.0028700828552246094, 0.003174424171447754, 0.0034787654876708984, 0.003783106803894043, 0.0040874481201171875, 0.004391789436340332, 0.0046961307525634766, 0.005000472068786621, 0.005304813385009766, 0.00560915470123291, 0.005913496017456055, 0.006217837333679199, 0.006522178649902344, 0.006826519966125488, 0.007130861282348633, 0.007435202598571777, 0.007739543914794922, 0.008043885231018066, 0.008348226547241211, 0.008652567863464355, 0.0089569091796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 5.0, 7.0, 9.0, 13.0, 13.0, 36.0, 37.0, 52.0, 94.0, 155.0, 304.0, 593.0, 1192.0, 2813.0, 7534.0, 27747.0, 165569.0, 682992.0, 125254.0, 22746.0, 6643.0, 2434.0, 1030.0, 534.0, 273.0, 153.0, 109.0, 73.0, 44.0, 27.0, 20.0, 18.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0], "bins": [-0.057952880859375, -0.05648326873779297, -0.05501365661621094, -0.053544044494628906, -0.052074432373046875, -0.050604820251464844, -0.04913520812988281, -0.04766559600830078, -0.04619598388671875, -0.04472637176513672, -0.04325675964355469, -0.041787147521972656, -0.040317535400390625, -0.038847923278808594, -0.03737831115722656, -0.03590869903564453, -0.0344390869140625, -0.03296947479248047, -0.03149986267089844, -0.030030250549316406, -0.028560638427734375, -0.027091026306152344, -0.025621414184570312, -0.02415180206298828, -0.02268218994140625, -0.02121257781982422, -0.019742965698242188, -0.018273353576660156, -0.016803741455078125, -0.015334129333496094, -0.013864517211914062, -0.012394905090332031, -0.01092529296875, -0.009455680847167969, -0.007986068725585938, -0.006516456604003906, -0.005046844482421875, -0.0035772323608398438, -0.0021076202392578125, -0.0006380081176757812, 0.00083160400390625, 0.0023012161254882812, 0.0037708282470703125, 0.005240440368652344, 0.006710052490234375, 0.008179664611816406, 0.009649276733398438, 0.011118888854980469, 0.0125885009765625, 0.014058113098144531, 0.015527725219726562, 0.016997337341308594, 0.018466949462890625, 0.019936561584472656, 0.021406173706054688, 0.02287578582763672, 0.02434539794921875, 0.02581501007080078, 0.027284622192382812, 0.028754234313964844, 0.030223846435546875, 0.031693458557128906, 0.03316307067871094, 0.03463268280029297, 0.036102294921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 3.0, 7.0, 7.0, 8.0, 12.0, 20.0, 20.0, 37.0, 34.0, 46.0, 49.0, 54.0, 67.0, 54.0, 69.0, 70.0, 71.0, 66.0, 46.0, 49.0, 31.0, 42.0, 28.0, 22.0, 17.0, 12.0, 19.0, 5.0, 8.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.04034423828125, -0.03930783271789551, -0.038271427154541016, -0.03723502159118652, -0.03619861602783203, -0.03516221046447754, -0.03412580490112305, -0.033089399337768555, -0.03205299377441406, -0.03101658821105957, -0.029980182647705078, -0.028943777084350586, -0.027907371520996094, -0.0268709659576416, -0.02583456039428711, -0.024798154830932617, -0.023761749267578125, -0.022725343704223633, -0.02168893814086914, -0.02065253257751465, -0.019616127014160156, -0.018579721450805664, -0.017543315887451172, -0.01650691032409668, -0.015470504760742188, -0.014434099197387695, -0.013397693634033203, -0.012361288070678711, -0.011324882507324219, -0.010288476943969727, -0.009252071380615234, -0.008215665817260742, -0.00717926025390625, -0.006142854690551758, -0.005106449127197266, -0.0040700435638427734, -0.0030336380004882812, -0.001997232437133789, -0.0009608268737792969, 7.557868957519531e-05, 0.0011119842529296875, 0.0021483898162841797, 0.003184795379638672, 0.004221200942993164, 0.005257606506347656, 0.0062940120697021484, 0.007330417633056641, 0.008366823196411133, 0.009403228759765625, 0.010439634323120117, 0.01147603988647461, 0.012512445449829102, 0.013548851013183594, 0.014585256576538086, 0.015621662139892578, 0.01665806770324707, 0.017694473266601562, 0.018730878829956055, 0.019767284393310547, 0.02080368995666504, 0.02184009552001953, 0.022876501083374023, 0.023912906646728516, 0.024949312210083008, 0.0259857177734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 6.0, 17.0, 13.0, 16.0, 24.0, 26.0, 40.0, 62.0, 83.0, 106.0, 198.0, 415.0, 858.0, 2508.0, 13498.0, 237576.0, 746077.0, 39497.0, 4952.0, 1307.0, 521.0, 265.0, 146.0, 104.0, 64.0, 45.0, 33.0, 29.0, 23.0, 9.0, 11.0, 5.0, 8.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0219573974609375, -0.021150827407836914, -0.020344257354736328, -0.019537687301635742, -0.018731117248535156, -0.01792454719543457, -0.017117977142333984, -0.0163114070892334, -0.015504837036132812, -0.014698266983032227, -0.01389169692993164, -0.013085126876831055, -0.012278556823730469, -0.011471986770629883, -0.010665416717529297, -0.009858846664428711, -0.009052276611328125, -0.008245706558227539, -0.007439136505126953, -0.006632566452026367, -0.005825996398925781, -0.005019426345825195, -0.004212856292724609, -0.0034062862396240234, -0.0025997161865234375, -0.0017931461334228516, -0.0009865760803222656, -0.0001800060272216797, 0.0006265640258789062, 0.0014331340789794922, 0.002239704132080078, 0.003046274185180664, 0.00385284423828125, 0.004659414291381836, 0.005465984344482422, 0.006272554397583008, 0.007079124450683594, 0.00788569450378418, 0.008692264556884766, 0.009498834609985352, 0.010305404663085938, 0.011111974716186523, 0.01191854476928711, 0.012725114822387695, 0.013531684875488281, 0.014338254928588867, 0.015144824981689453, 0.01595139503479004, 0.016757965087890625, 0.01756453514099121, 0.018371105194091797, 0.019177675247192383, 0.01998424530029297, 0.020790815353393555, 0.02159738540649414, 0.022403955459594727, 0.023210525512695312, 0.0240170955657959, 0.024823665618896484, 0.02563023567199707, 0.026436805725097656, 0.027243375778198242, 0.028049945831298828, 0.028856515884399414, 0.0296630859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 12.0, 9.0, 10.0, 22.0, 33.0, 51.0, 74.0, 120.0, 179.0, 173.0, 121.0, 79.0, 60.0, 21.0, 15.0, 11.0, 12.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017535686492919922, -0.00017154216766357422, -0.00016772747039794922, -0.00016391277313232422, -0.00016009807586669922, -0.00015628337860107422, -0.00015246868133544922, -0.00014865398406982422, -0.00014483928680419922, -0.00014102458953857422, -0.00013720989227294922, -0.00013339519500732422, -0.00012958049774169922, -0.00012576580047607422, -0.00012195110321044922, -0.00011813640594482422, -0.00011432170867919922, -0.00011050701141357422, -0.00010669231414794922, -0.00010287761688232422, -9.906291961669922e-05, -9.524822235107422e-05, -9.143352508544922e-05, -8.761882781982422e-05, -8.380413055419922e-05, -7.998943328857422e-05, -7.617473602294922e-05, -7.236003875732422e-05, -6.854534149169922e-05, -6.473064422607422e-05, -6.091594696044922e-05, -5.710124969482422e-05, -5.328655242919922e-05, -4.947185516357422e-05, -4.565715789794922e-05, -4.184246063232422e-05, -3.802776336669922e-05, -3.421306610107422e-05, -3.039836883544922e-05, -2.658367156982422e-05, -2.276897430419922e-05, -1.895427703857422e-05, -1.5139579772949219e-05, -1.1324882507324219e-05, -7.510185241699219e-06, -3.6954879760742188e-06, 1.1920928955078125e-07, 3.933906555175781e-06, 7.748603820800781e-06, 1.1563301086425781e-05, 1.537799835205078e-05, 1.919269561767578e-05, 2.300739288330078e-05, 2.682209014892578e-05, 3.063678741455078e-05, 3.445148468017578e-05, 3.826618194580078e-05, 4.208087921142578e-05, 4.589557647705078e-05, 4.971027374267578e-05, 5.352497100830078e-05, 5.733966827392578e-05, 6.115436553955078e-05, 6.496906280517578e-05, 6.878376007080078e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 13.0, 10.0, 18.0, 41.0, 56.0, 83.0, 147.0, 348.0, 1060.0, 6410.0, 161668.0, 844594.0, 30172.0, 2745.0, 693.0, 208.0, 116.0, 60.0, 44.0, 23.0, 25.0, 10.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.046295166015625, -0.04524970054626465, -0.0442042350769043, -0.043158769607543945, -0.042113304138183594, -0.04106783866882324, -0.04002237319946289, -0.03897690773010254, -0.03793144226074219, -0.036885976791381836, -0.035840511322021484, -0.03479504585266113, -0.03374958038330078, -0.03270411491394043, -0.03165864944458008, -0.030613183975219727, -0.029567718505859375, -0.028522253036499023, -0.027476787567138672, -0.02643132209777832, -0.02538585662841797, -0.024340391159057617, -0.023294925689697266, -0.022249460220336914, -0.021203994750976562, -0.02015852928161621, -0.01911306381225586, -0.018067598342895508, -0.017022132873535156, -0.015976667404174805, -0.014931201934814453, -0.013885736465454102, -0.01284027099609375, -0.011794805526733398, -0.010749340057373047, -0.009703874588012695, -0.008658409118652344, -0.007612943649291992, -0.006567478179931641, -0.005522012710571289, -0.0044765472412109375, -0.003431081771850586, -0.0023856163024902344, -0.0013401508331298828, -0.00029468536376953125, 0.0007507801055908203, 0.0017962455749511719, 0.0028417110443115234, 0.003887176513671875, 0.0049326419830322266, 0.005978107452392578, 0.00702357292175293, 0.008069038391113281, 0.009114503860473633, 0.010159969329833984, 0.011205434799194336, 0.012250900268554688, 0.013296365737915039, 0.01434183120727539, 0.015387296676635742, 0.016432762145996094, 0.017478227615356445, 0.018523693084716797, 0.01956915855407715, 0.0206146240234375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 3.0, 10.0, 14.0, 24.0, 21.0, 48.0, 74.0, 153.0, 170.0, 157.0, 107.0, 83.0, 52.0, 29.0, 14.0, 8.0, 5.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.02655029296875, -0.025900959968566895, -0.02525162696838379, -0.024602293968200684, -0.023952960968017578, -0.023303627967834473, -0.022654294967651367, -0.02200496196746826, -0.021355628967285156, -0.02070629596710205, -0.020056962966918945, -0.01940762996673584, -0.018758296966552734, -0.01810896396636963, -0.017459630966186523, -0.016810297966003418, -0.016160964965820312, -0.015511631965637207, -0.014862298965454102, -0.014212965965270996, -0.01356363296508789, -0.012914299964904785, -0.01226496696472168, -0.011615633964538574, -0.010966300964355469, -0.010316967964172363, -0.009667634963989258, -0.009018301963806152, -0.008368968963623047, -0.007719635963439941, -0.007070302963256836, -0.0064209699630737305, -0.005771636962890625, -0.0051223039627075195, -0.004472970962524414, -0.0038236379623413086, -0.003174304962158203, -0.0025249719619750977, -0.0018756389617919922, -0.0012263059616088867, -0.0005769729614257812, 7.236003875732422e-05, 0.0007216930389404297, 0.0013710260391235352, 0.0020203590393066406, 0.002669692039489746, 0.0033190250396728516, 0.003968358039855957, 0.0046176910400390625, 0.005267024040222168, 0.0059163570404052734, 0.006565690040588379, 0.007215023040771484, 0.00786435604095459, 0.008513689041137695, 0.0091630220413208, 0.009812355041503906, 0.010461688041687012, 0.011111021041870117, 0.011760354042053223, 0.012409687042236328, 0.013059020042419434, 0.013708353042602539, 0.014357686042785645, 0.01500701904296875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 9.0, 17.0, 27.0, 56.0, 131.0, 238.0, 258.0, 134.0, 55.0, 24.0, 20.0, 14.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0], "bins": [-0.5437684655189514, -0.5331311225891113, -0.5224937796592712, -0.5118564367294312, -0.5012190937995911, -0.490581750869751, -0.4799444079399109, -0.4693070650100708, -0.4586697220802307, -0.4480323791503906, -0.43739503622055054, -0.42675769329071045, -0.41612035036087036, -0.4054830074310303, -0.3948456645011902, -0.3842083215713501, -0.37357097864151, -0.3629336357116699, -0.35229629278182983, -0.34165894985198975, -0.33102160692214966, -0.32038426399230957, -0.3097469210624695, -0.2991095781326294, -0.2884722352027893, -0.2778348922729492, -0.26719754934310913, -0.25656020641326904, -0.24592286348342896, -0.23528552055358887, -0.22464817762374878, -0.2140108346939087, -0.20337346196174622, -0.19273611903190613, -0.18209877610206604, -0.17146143317222595, -0.16082409024238586, -0.15018674731254578, -0.1395494043827057, -0.1289120614528656, -0.11827471852302551, -0.10763737559318542, -0.09700003266334534, -0.08636268973350525, -0.07572534680366516, -0.06508800387382507, -0.054450660943984985, -0.0438133180141449, -0.03317597508430481, -0.02253863215446472, -0.011901289224624634, -0.001263946294784546, 0.009373396635055542, 0.02001073956489563, 0.030648082494735718, 0.041285425424575806, 0.051922768354415894, 0.06256011128425598, 0.07319745421409607, 0.08383479714393616, 0.09447214007377625, 0.10510948300361633, 0.11574682593345642, 0.1263841688632965, 0.1370215117931366]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 9.0, 9.0, 17.0, 17.0, 22.0, 20.0, 36.0, 26.0, 24.0, 39.0, 39.0, 43.0, 36.0, 46.0, 52.0, 52.0, 53.0, 63.0, 48.0, 42.0, 34.0, 40.0, 34.0, 34.0, 36.0, 16.0, 17.0, 19.0, 16.0, 13.0, 7.0, 6.0, 10.0, 4.0, 2.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17190831899642944, -0.16710087656974792, -0.1622934341430664, -0.1574859917163849, -0.15267854928970337, -0.14787112176418304, -0.14306367933750153, -0.13825623691082, -0.1334487944841385, -0.12864135205745697, -0.12383390963077545, -0.11902647465467453, -0.11421903222799301, -0.10941158980131149, -0.10460415482521057, -0.09979671239852905, -0.09498926997184753, -0.09018182754516602, -0.0853743851184845, -0.08056695014238358, -0.07575950771570206, -0.07095206528902054, -0.06614463031291962, -0.0613371878862381, -0.05652974545955658, -0.05172230303287506, -0.04691486433148384, -0.04210742563009262, -0.0372999832034111, -0.032492540776729584, -0.027685102075338364, -0.022877663373947144, -0.018070220947265625, -0.013262780383229256, -0.008455339819192886, -0.003647899255156517, 0.0011595413088798523, 0.005966981872916222, 0.010774422436952591, 0.015581861138343811, 0.02038930356502533, 0.0251967441290617, 0.030004184693098068, 0.03481162339448929, 0.03961906582117081, 0.044426508247852325, 0.049233946949243546, 0.054041385650634766, 0.058848828077316284, 0.0636562705039978, 0.06846371293067932, 0.07327114790678024, 0.07807859033346176, 0.08288603276014328, 0.0876934677362442, 0.09250091016292572, 0.09730835258960724, 0.10211579501628876, 0.10692323744297028, 0.1117306724190712, 0.11653811484575272, 0.12134555727243423, 0.12615299224853516, 0.13096043467521667, 0.1357678771018982]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 8.0, 6.0, 8.0, 16.0, 15.0, 20.0, 28.0, 30.0, 40.0, 82.0, 90.0, 122.0, 237.0, 394.0, 625.0, 1252.0, 2817.0, 7784.0, 28793.0, 274637.0, 3705485.0, 141153.0, 20853.0, 5900.0, 2102.0, 846.0, 385.0, 220.0, 121.0, 77.0, 40.0, 39.0, 19.0, 9.0, 7.0, 6.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07012939453125, -0.0682535171508789, -0.06637763977050781, -0.06450176239013672, -0.06262588500976562, -0.06075000762939453, -0.05887413024902344, -0.056998252868652344, -0.05512237548828125, -0.053246498107910156, -0.05137062072753906, -0.04949474334716797, -0.047618865966796875, -0.04574298858642578, -0.04386711120605469, -0.041991233825683594, -0.0401153564453125, -0.038239479064941406, -0.03636360168457031, -0.03448772430419922, -0.032611846923828125, -0.03073596954345703, -0.028860092163085938, -0.026984214782714844, -0.02510833740234375, -0.023232460021972656, -0.021356582641601562, -0.01948070526123047, -0.017604827880859375, -0.01572895050048828, -0.013853073120117188, -0.011977195739746094, -0.010101318359375, -0.008225440979003906, -0.0063495635986328125, -0.004473686218261719, -0.002597808837890625, -0.0007219314575195312, 0.0011539459228515625, 0.0030298233032226562, 0.00490570068359375, 0.006781578063964844, 0.008657455444335938, 0.010533332824707031, 0.012409210205078125, 0.014285087585449219, 0.016160964965820312, 0.018036842346191406, 0.0199127197265625, 0.021788597106933594, 0.023664474487304688, 0.02554035186767578, 0.027416229248046875, 0.02929210662841797, 0.031167984008789062, 0.033043861389160156, 0.03491973876953125, 0.036795616149902344, 0.03867149353027344, 0.04054737091064453, 0.042423248291015625, 0.04429912567138672, 0.04617500305175781, 0.048050880432128906, 0.0499267578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 0.0, 11.0, 11.0, 13.0, 21.0, 37.0, 45.0, 57.0, 70.0, 80.0, 87.0, 94.0, 99.0, 60.0, 66.0, 55.0, 52.0, 38.0, 34.0, 30.0, 20.0, 4.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01041412353515625, -0.010114312171936035, -0.00981450080871582, -0.009514689445495605, -0.00921487808227539, -0.008915066719055176, -0.008615255355834961, -0.008315443992614746, -0.008015632629394531, -0.007715821266174316, -0.0074160099029541016, -0.007116198539733887, -0.006816387176513672, -0.006516575813293457, -0.006216764450073242, -0.005916953086853027, -0.0056171417236328125, -0.005317330360412598, -0.005017518997192383, -0.004717707633972168, -0.004417896270751953, -0.004118084907531738, -0.0038182735443115234, -0.0035184621810913086, -0.0032186508178710938, -0.002918839454650879, -0.002619028091430664, -0.0023192167282104492, -0.0020194053649902344, -0.0017195940017700195, -0.0014197826385498047, -0.0011199712753295898, -0.000820159912109375, -0.0005203485488891602, -0.0002205371856689453, 7.927417755126953e-05, 0.0003790855407714844, 0.0006788969039916992, 0.000978708267211914, 0.001278519630432129, 0.0015783309936523438, 0.0018781423568725586, 0.0021779537200927734, 0.0024777650833129883, 0.002777576446533203, 0.003077387809753418, 0.003377199172973633, 0.0036770105361938477, 0.0039768218994140625, 0.004276633262634277, 0.004576444625854492, 0.004876255989074707, 0.005176067352294922, 0.005475878715515137, 0.0057756900787353516, 0.006075501441955566, 0.006375312805175781, 0.006675124168395996, 0.006974935531616211, 0.007274746894836426, 0.007574558258056641, 0.007874369621276855, 0.00817418098449707, 0.008473992347717285, 0.0087738037109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 10.0, 19.0, 25.0, 32.0, 58.0, 107.0, 178.0, 343.0, 808.0, 2708.0, 12433.0, 775159.0, 3379586.0, 17422.0, 3533.0, 1089.0, 386.0, 164.0, 95.0, 44.0, 31.0, 19.0, 11.0, 5.0, 4.0, 9.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11993408203125, -0.1161947250366211, -0.11245536804199219, -0.10871601104736328, -0.10497665405273438, -0.10123729705810547, -0.09749794006347656, -0.09375858306884766, -0.09001922607421875, -0.08627986907958984, -0.08254051208496094, -0.07880115509033203, -0.07506179809570312, -0.07132244110107422, -0.06758308410644531, -0.0638437271118164, -0.0601043701171875, -0.056365013122558594, -0.05262565612792969, -0.04888629913330078, -0.045146942138671875, -0.04140758514404297, -0.03766822814941406, -0.033928871154785156, -0.03018951416015625, -0.026450157165527344, -0.022710800170898438, -0.01897144317626953, -0.015232086181640625, -0.011492729187011719, -0.0077533721923828125, -0.004014015197753906, -0.000274658203125, 0.0034646987915039062, 0.0072040557861328125, 0.010943412780761719, 0.014682769775390625, 0.01842212677001953, 0.022161483764648438, 0.025900840759277344, 0.02964019775390625, 0.033379554748535156, 0.03711891174316406, 0.04085826873779297, 0.044597625732421875, 0.04833698272705078, 0.05207633972167969, 0.055815696716308594, 0.0595550537109375, 0.0632944107055664, 0.06703376770019531, 0.07077312469482422, 0.07451248168945312, 0.07825183868408203, 0.08199119567871094, 0.08573055267333984, 0.08946990966796875, 0.09320926666259766, 0.09694862365722656, 0.10068798065185547, 0.10442733764648438, 0.10816669464111328, 0.11190605163574219, 0.1156454086303711, 0.119384765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 2.0, 11.0, 12.0, 23.0, 52.0, 150.0, 523.0, 2232.0, 743.0, 173.0, 73.0, 23.0, 12.0, 10.0, 9.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04351806640625, -0.0424959659576416, -0.0414738655090332, -0.040451765060424805, -0.039429664611816406, -0.03840756416320801, -0.03738546371459961, -0.03636336326599121, -0.03534126281738281, -0.034319162368774414, -0.033297061920166016, -0.03227496147155762, -0.03125286102294922, -0.03023076057434082, -0.029208660125732422, -0.028186559677124023, -0.027164459228515625, -0.026142358779907227, -0.025120258331298828, -0.02409815788269043, -0.02307605743408203, -0.022053956985473633, -0.021031856536865234, -0.020009756088256836, -0.018987655639648438, -0.01796555519104004, -0.01694345474243164, -0.015921354293823242, -0.014899253845214844, -0.013877153396606445, -0.012855052947998047, -0.011832952499389648, -0.01081085205078125, -0.009788751602172852, -0.008766651153564453, -0.007744550704956055, -0.006722450256347656, -0.005700349807739258, -0.004678249359130859, -0.003656148910522461, -0.0026340484619140625, -0.001611948013305664, -0.0005898475646972656, 0.0004322528839111328, 0.0014543533325195312, 0.0024764537811279297, 0.003498554229736328, 0.0045206546783447266, 0.005542755126953125, 0.0065648555755615234, 0.007586956024169922, 0.00860905647277832, 0.009631156921386719, 0.010653257369995117, 0.011675357818603516, 0.012697458267211914, 0.013719558715820312, 0.014741659164428711, 0.01576375961303711, 0.016785860061645508, 0.017807960510253906, 0.018830060958862305, 0.019852161407470703, 0.0208742618560791, 0.0218963623046875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 9.0, 29.0, 234.0, 547.0, 159.0, 20.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2559463381767273, -0.24125222861766815, -0.226558119058609, -0.21186402440071106, -0.19716991484165192, -0.18247580528259277, -0.16778171062469482, -0.15308760106563568, -0.13839349150657654, -0.1236993819475174, -0.10900527983903885, -0.0943111777305603, -0.07961706817150116, -0.06492295861244202, -0.05022885650396347, -0.035534754395484924, -0.02084064483642578, -0.006146539002656937, 0.008547566831111908, 0.023241672664880753, 0.0379357784986496, 0.05262988805770874, 0.06732399016618729, 0.08201809227466583, 0.09671220183372498, 0.11140631139278412, 0.12610042095184326, 0.1407945156097412, 0.15548862516880035, 0.1701827347278595, 0.18487682938575745, 0.1995709389448166, 0.21426504850387573, 0.22895915806293488, 0.24365326762199402, 0.25834736227989197, 0.2730414867401123, 0.28773558139801025, 0.3024296760559082, 0.31712377071380615, 0.3318178951740265, 0.34651198983192444, 0.3612061142921448, 0.3759002089500427, 0.3905943036079407, 0.405288428068161, 0.41998252272605896, 0.4346766471862793, 0.44937074184417725, 0.4640648365020752, 0.47875896096229553, 0.4934530556201935, 0.5081471800804138, 0.5228412747383118, 0.5375353693962097, 0.5522294640541077, 0.5669236183166504, 0.5816177129745483, 0.5963118076324463, 0.611005961894989, 0.625700056552887, 0.6403941512107849, 0.6550882458686829, 0.6697823405265808, 0.6844764351844788]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 12.0, 20.0, 22.0, 33.0, 38.0, 49.0, 51.0, 57.0, 79.0, 68.0, 61.0, 79.0, 70.0, 62.0, 37.0, 54.0, 44.0, 39.0, 28.0, 19.0, 10.0, 17.0, 11.0, 3.0, 7.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06843847036361694, -0.06586591899394989, -0.06329336017370224, -0.06072080880403519, -0.058148253709077835, -0.05557569861412048, -0.05300314724445343, -0.05043059214949608, -0.04785803705453873, -0.045285481959581375, -0.04271292686462402, -0.04014037549495697, -0.03756782039999962, -0.03499526530504227, -0.032422713935375214, -0.029850158840417862, -0.02727760374546051, -0.02470504865050316, -0.022132495418190956, -0.019559942185878754, -0.016987387090921402, -0.014414832927286625, -0.011842278763651848, -0.009269725531339645, -0.006697170436382294, -0.004124616272747517, -0.0015520621091127396, 0.0010204920545220375, 0.0035930462181568146, 0.006165600381791592, 0.008738154545426369, 0.011310707777738571, 0.013883262872695923, 0.016455817967653275, 0.019028371199965477, 0.02160092443227768, 0.02417347952723503, 0.026746034622192383, 0.029318587854504585, 0.03189114108681679, 0.03446369618177414, 0.03703625127673149, 0.03960880637168884, 0.042181357741355896, 0.04475391283631325, 0.0473264679312706, 0.04989901930093765, 0.052471574395895004, 0.055044129490852356, 0.05761668458580971, 0.06018923968076706, 0.06276179105043411, 0.06533434987068176, 0.06790690124034882, 0.07047945261001587, 0.07305200397968292, 0.07562456279993057, 0.07819711416959763, 0.08076967298984528, 0.08334222435951233, 0.08591477572917938, 0.08848733454942703, 0.09105988591909409, 0.09363244473934174, 0.09620499610900879]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 11.0, 14.0, 27.0, 37.0, 54.0, 82.0, 104.0, 184.0, 265.0, 448.0, 885.0, 1843.0, 4894.0, 18747.0, 102742.0, 640525.0, 230667.0, 34056.0, 7733.0, 2552.0, 1188.0, 559.0, 314.0, 215.0, 120.0, 93.0, 50.0, 41.0, 32.0, 17.0, 10.0, 10.0, 13.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04364013671875, -0.04211902618408203, -0.04059791564941406, -0.039076805114746094, -0.037555694580078125, -0.036034584045410156, -0.03451347351074219, -0.03299236297607422, -0.03147125244140625, -0.02995014190673828, -0.028429031372070312, -0.026907920837402344, -0.025386810302734375, -0.023865699768066406, -0.022344589233398438, -0.02082347869873047, -0.0193023681640625, -0.01778125762939453, -0.016260147094726562, -0.014739036560058594, -0.013217926025390625, -0.011696815490722656, -0.010175704956054688, -0.008654594421386719, -0.00713348388671875, -0.005612373352050781, -0.0040912628173828125, -0.0025701522827148438, -0.001049041748046875, 0.00047206878662109375, 0.0019931793212890625, 0.0035142898559570312, 0.005035400390625, 0.006556510925292969, 0.008077621459960938, 0.009598731994628906, 0.011119842529296875, 0.012640953063964844, 0.014162063598632812, 0.01568317413330078, 0.01720428466796875, 0.01872539520263672, 0.020246505737304688, 0.021767616271972656, 0.023288726806640625, 0.024809837341308594, 0.026330947875976562, 0.02785205841064453, 0.0293731689453125, 0.03089427947998047, 0.03241539001464844, 0.033936500549316406, 0.035457611083984375, 0.036978721618652344, 0.03849983215332031, 0.04002094268798828, 0.04154205322265625, 0.04306316375732422, 0.04458427429199219, 0.046105384826660156, 0.047626495361328125, 0.049147605895996094, 0.05066871643066406, 0.05218982696533203, 0.0537109375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 10.0, 17.0, 22.0, 26.0, 44.0, 64.0, 82.0, 82.0, 99.0, 106.0, 98.0, 78.0, 65.0, 63.0, 49.0, 34.0, 27.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01024627685546875, -0.009930729866027832, -0.009615182876586914, -0.009299635887145996, -0.008984088897705078, -0.00866854190826416, -0.008352994918823242, -0.008037447929382324, -0.007721900939941406, -0.007406353950500488, -0.00709080696105957, -0.006775259971618652, -0.006459712982177734, -0.006144165992736816, -0.0058286190032958984, -0.0055130720138549805, -0.0051975250244140625, -0.0048819780349731445, -0.0045664310455322266, -0.004250884056091309, -0.003935337066650391, -0.0036197900772094727, -0.0033042430877685547, -0.0029886960983276367, -0.0026731491088867188, -0.0023576021194458008, -0.002042055130004883, -0.0017265081405639648, -0.0014109611511230469, -0.001095414161682129, -0.0007798671722412109, -0.00046432018280029297, -0.000148773193359375, 0.00016677379608154297, 0.00048232078552246094, 0.0007978677749633789, 0.0011134147644042969, 0.0014289617538452148, 0.0017445087432861328, 0.0020600557327270508, 0.0023756027221679688, 0.0026911497116088867, 0.0030066967010498047, 0.0033222436904907227, 0.0036377906799316406, 0.003953337669372559, 0.0042688846588134766, 0.0045844316482543945, 0.0048999786376953125, 0.0052155256271362305, 0.0055310726165771484, 0.005846619606018066, 0.006162166595458984, 0.006477713584899902, 0.00679326057434082, 0.007108807563781738, 0.007424354553222656, 0.007739901542663574, 0.008055448532104492, 0.00837099552154541, 0.008686542510986328, 0.009002089500427246, 0.009317636489868164, 0.009633183479309082, 0.00994873046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 10.0, 11.0, 18.0, 19.0, 31.0, 51.0, 66.0, 122.0, 164.0, 249.0, 379.0, 590.0, 1002.0, 1685.0, 3012.0, 5252.0, 9548.0, 18160.0, 36287.0, 75553.0, 176218.0, 316742.0, 218676.0, 93922.0, 43304.0, 21537.0, 11213.0, 6139.0, 3487.0, 1945.0, 1206.0, 700.0, 445.0, 281.0, 183.0, 96.0, 66.0, 53.0, 37.0, 25.0, 23.0, 10.0, 10.0, 10.0, 3.0, 4.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.014495849609375, -0.014037609100341797, -0.013579368591308594, -0.01312112808227539, -0.012662887573242188, -0.012204647064208984, -0.011746406555175781, -0.011288166046142578, -0.010829925537109375, -0.010371685028076172, -0.009913444519042969, -0.009455204010009766, -0.008996963500976562, -0.00853872299194336, -0.008080482482910156, -0.007622241973876953, -0.00716400146484375, -0.006705760955810547, -0.006247520446777344, -0.005789279937744141, -0.0053310394287109375, -0.004872798919677734, -0.004414558410644531, -0.003956317901611328, -0.003498077392578125, -0.003039836883544922, -0.0025815963745117188, -0.0021233558654785156, -0.0016651153564453125, -0.0012068748474121094, -0.0007486343383789062, -0.0002903938293457031, 0.0001678466796875, 0.0006260871887207031, 0.0010843276977539062, 0.0015425682067871094, 0.0020008087158203125, 0.0024590492248535156, 0.0029172897338867188, 0.003375530242919922, 0.003833770751953125, 0.004292011260986328, 0.004750251770019531, 0.005208492279052734, 0.0056667327880859375, 0.006124973297119141, 0.006583213806152344, 0.007041454315185547, 0.00749969482421875, 0.007957935333251953, 0.008416175842285156, 0.00887441635131836, 0.009332656860351562, 0.009790897369384766, 0.010249137878417969, 0.010707378387451172, 0.011165618896484375, 0.011623859405517578, 0.012082099914550781, 0.012540340423583984, 0.012998580932617188, 0.01345682144165039, 0.013915061950683594, 0.014373302459716797, 0.01483154296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 7.0, 7.0, 11.0, 21.0, 10.0, 13.0, 20.0, 30.0, 28.0, 21.0, 37.0, 26.0, 36.0, 41.0, 48.0, 46.0, 54.0, 42.0, 47.0, 37.0, 31.0, 44.0, 33.0, 39.0, 31.0, 39.0, 27.0, 21.0, 26.0, 23.0, 19.0, 12.0, 13.0, 9.0, 9.0, 7.0, 2.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0189971923828125, -0.018414020538330078, -0.017830848693847656, -0.017247676849365234, -0.016664505004882812, -0.01608133316040039, -0.015498161315917969, -0.014914989471435547, -0.014331817626953125, -0.013748645782470703, -0.013165473937988281, -0.01258230209350586, -0.011999130249023438, -0.011415958404541016, -0.010832786560058594, -0.010249614715576172, -0.00966644287109375, -0.009083271026611328, -0.008500099182128906, -0.007916927337646484, -0.0073337554931640625, -0.006750583648681641, -0.006167411804199219, -0.005584239959716797, -0.005001068115234375, -0.004417896270751953, -0.0038347244262695312, -0.0032515525817871094, -0.0026683807373046875, -0.0020852088928222656, -0.0015020370483398438, -0.0009188652038574219, -0.000335693359375, 0.0002474784851074219, 0.0008306503295898438, 0.0014138221740722656, 0.0019969940185546875, 0.0025801658630371094, 0.0031633377075195312, 0.003746509552001953, 0.004329681396484375, 0.004912853240966797, 0.005496025085449219, 0.006079196929931641, 0.0066623687744140625, 0.007245540618896484, 0.007828712463378906, 0.008411884307861328, 0.00899505615234375, 0.009578227996826172, 0.010161399841308594, 0.010744571685791016, 0.011327743530273438, 0.01191091537475586, 0.012494087219238281, 0.013077259063720703, 0.013660430908203125, 0.014243602752685547, 0.014826774597167969, 0.01540994644165039, 0.015993118286132812, 0.016576290130615234, 0.017159461975097656, 0.017742633819580078, 0.0183258056640625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 12.0, 10.0, 21.0, 20.0, 30.0, 44.0, 52.0, 86.0, 111.0, 175.0, 301.0, 460.0, 912.0, 1988.0, 6060.0, 23481.0, 123450.0, 476880.0, 330899.0, 63385.0, 13233.0, 3681.0, 1386.0, 680.0, 380.0, 229.0, 153.0, 113.0, 71.0, 59.0, 46.0, 27.0, 22.0, 23.0, 16.0, 10.0, 8.0, 5.0, 5.0, 4.0, 6.0, 2.0, 1.0, 3.0], "bins": [-0.01239013671875, -0.012062430381774902, -0.011734724044799805, -0.011407017707824707, -0.01107931137084961, -0.010751605033874512, -0.010423898696899414, -0.010096192359924316, -0.009768486022949219, -0.009440779685974121, -0.009113073348999023, -0.008785367012023926, -0.008457660675048828, -0.00812995433807373, -0.007802248001098633, -0.007474541664123535, -0.0071468353271484375, -0.00681912899017334, -0.006491422653198242, -0.0061637163162231445, -0.005836009979248047, -0.005508303642272949, -0.0051805973052978516, -0.004852890968322754, -0.004525184631347656, -0.004197478294372559, -0.003869771957397461, -0.0035420656204223633, -0.0032143592834472656, -0.002886652946472168, -0.0025589466094970703, -0.0022312402725219727, -0.001903533935546875, -0.0015758275985717773, -0.0012481212615966797, -0.000920414924621582, -0.0005927085876464844, -0.0002650022506713867, 6.270408630371094e-05, 0.0003904104232788086, 0.0007181167602539062, 0.001045823097229004, 0.0013735294342041016, 0.0017012357711791992, 0.002028942108154297, 0.0023566484451293945, 0.002684354782104492, 0.00301206111907959, 0.0033397674560546875, 0.003667473793029785, 0.003995180130004883, 0.0043228864669799805, 0.004650592803955078, 0.004978299140930176, 0.0053060054779052734, 0.005633711814880371, 0.005961418151855469, 0.006289124488830566, 0.006616830825805664, 0.006944537162780762, 0.007272243499755859, 0.007599949836730957, 0.007927656173706055, 0.008255362510681152, 0.00858306884765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 9.0, 5.0, 4.0, 15.0, 22.0, 22.0, 33.0, 55.0, 62.0, 86.0, 86.0, 106.0, 100.0, 90.0, 83.0, 58.0, 54.0, 40.0, 29.0, 17.0, 14.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.56382942199707e-05, -7.303338497877121e-05, -7.042847573757172e-05, -6.782356649637222e-05, -6.521865725517273e-05, -6.261374801397324e-05, -6.000883877277374e-05, -5.740392953157425e-05, -5.4799020290374756e-05, -5.219411104917526e-05, -4.958920180797577e-05, -4.6984292566776276e-05, -4.437938332557678e-05, -4.177447408437729e-05, -3.9169564843177795e-05, -3.65646556019783e-05, -3.395974636077881e-05, -3.1354837119579315e-05, -2.8749927878379822e-05, -2.614501863718033e-05, -2.3540109395980835e-05, -2.093520015478134e-05, -1.8330290913581848e-05, -1.5725381672382355e-05, -1.3120472431182861e-05, -1.0515563189983368e-05, -7.910653948783875e-06, -5.305744707584381e-06, -2.7008354663848877e-06, -9.592622518539429e-08, 2.508983016014099e-06, 5.1138922572135925e-06, 7.718801498413086e-06, 1.032371073961258e-05, 1.2928619980812073e-05, 1.5533529222011566e-05, 1.813843846321106e-05, 2.0743347704410553e-05, 2.3348256945610046e-05, 2.595316618680954e-05, 2.8558075428009033e-05, 3.1162984669208527e-05, 3.376789391040802e-05, 3.6372803151607513e-05, 3.897771239280701e-05, 4.15826216340065e-05, 4.4187530875205994e-05, 4.679244011640549e-05, 4.939734935760498e-05, 5.2002258598804474e-05, 5.460716784000397e-05, 5.721207708120346e-05, 5.9816986322402954e-05, 6.242189556360245e-05, 6.502680480480194e-05, 6.763171404600143e-05, 7.023662328720093e-05, 7.284153252840042e-05, 7.544644176959991e-05, 7.805135101079941e-05, 8.06562602519989e-05, 8.32611694931984e-05, 8.586607873439789e-05, 8.847098797559738e-05, 9.107589721679688e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 2.0, 5.0, 7.0, 15.0, 32.0, 47.0, 61.0, 114.0, 176.0, 322.0, 588.0, 1409.0, 4172.0, 17925.0, 131465.0, 580564.0, 267140.0, 34321.0, 6508.0, 1931.0, 840.0, 407.0, 178.0, 121.0, 78.0, 48.0, 21.0, 22.0, 15.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0158538818359375, -0.015433073043823242, -0.015012264251708984, -0.014591455459594727, -0.014170646667480469, -0.013749837875366211, -0.013329029083251953, -0.012908220291137695, -0.012487411499023438, -0.01206660270690918, -0.011645793914794922, -0.011224985122680664, -0.010804176330566406, -0.010383367538452148, -0.00996255874633789, -0.009541749954223633, -0.009120941162109375, -0.008700132369995117, -0.00827932357788086, -0.007858514785766602, -0.007437705993652344, -0.007016897201538086, -0.006596088409423828, -0.00617527961730957, -0.0057544708251953125, -0.005333662033081055, -0.004912853240966797, -0.004492044448852539, -0.004071235656738281, -0.0036504268646240234, -0.0032296180725097656, -0.002808809280395508, -0.00238800048828125, -0.001967191696166992, -0.0015463829040527344, -0.0011255741119384766, -0.0007047653198242188, -0.00028395652770996094, 0.00013685226440429688, 0.0005576610565185547, 0.0009784698486328125, 0.0013992786407470703, 0.0018200874328613281, 0.002240896224975586, 0.0026617050170898438, 0.0030825138092041016, 0.0035033226013183594, 0.003924131393432617, 0.004344940185546875, 0.004765748977661133, 0.005186557769775391, 0.0056073665618896484, 0.006028175354003906, 0.006448984146118164, 0.006869792938232422, 0.00729060173034668, 0.0077114105224609375, 0.008132219314575195, 0.008553028106689453, 0.008973836898803711, 0.009394645690917969, 0.009815454483032227, 0.010236263275146484, 0.010657072067260742, 0.011077880859375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 11.0, 30.0, 27.0, 59.0, 87.0, 109.0, 143.0, 149.0, 122.0, 96.0, 46.0, 44.0, 22.0, 13.0, 11.0, 9.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0171051025390625, -0.01657271385192871, -0.016040325164794922, -0.015507936477661133, -0.014975547790527344, -0.014443159103393555, -0.013910770416259766, -0.013378381729125977, -0.012845993041992188, -0.012313604354858398, -0.01178121566772461, -0.01124882698059082, -0.010716438293457031, -0.010184049606323242, -0.009651660919189453, -0.009119272232055664, -0.008586883544921875, -0.008054494857788086, -0.007522106170654297, -0.006989717483520508, -0.006457328796386719, -0.00592494010925293, -0.005392551422119141, -0.0048601627349853516, -0.0043277740478515625, -0.0037953853607177734, -0.0032629966735839844, -0.0027306079864501953, -0.0021982192993164062, -0.0016658306121826172, -0.0011334419250488281, -0.0006010532379150391, -6.866455078125e-05, 0.00046372413635253906, 0.0009961128234863281, 0.0015285015106201172, 0.0020608901977539062, 0.0025932788848876953, 0.0031256675720214844, 0.0036580562591552734, 0.0041904449462890625, 0.0047228336334228516, 0.005255222320556641, 0.00578761100769043, 0.006319999694824219, 0.006852388381958008, 0.007384777069091797, 0.007917165756225586, 0.008449554443359375, 0.008981943130493164, 0.009514331817626953, 0.010046720504760742, 0.010579109191894531, 0.01111149787902832, 0.01164388656616211, 0.012176275253295898, 0.012708663940429688, 0.013241052627563477, 0.013773441314697266, 0.014305830001831055, 0.014838218688964844, 0.015370607376098633, 0.015902996063232422, 0.01643538475036621, 0.0169677734375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 3.0, 6.0, 13.0, 20.0, 37.0, 46.0, 59.0, 90.0, 112.0, 142.0, 121.0, 98.0, 75.0, 59.0, 37.0, 22.0, 26.0, 13.0, 5.0, 8.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07135280966758728, -0.06702051311731339, -0.06268821656703949, -0.058355916291475296, -0.0540236197412014, -0.049691323190927505, -0.04535902291536331, -0.041026726365089417, -0.03669442981481552, -0.032362133264541626, -0.02802983485162258, -0.023697536438703537, -0.01936523988842964, -0.015032943338155746, -0.010700644925236702, -0.0063683465123176575, -0.002036049962043762, 0.0022962475195527077, 0.0066285450011491776, 0.010960842482745647, 0.015293139964342117, 0.019625436514616013, 0.023957734927535057, 0.0282900333404541, 0.032622329890728, 0.03695462644100189, 0.04128692299127579, 0.04561922326683998, 0.049951519817113876, 0.05428381636738777, 0.058616116642951965, 0.06294841319322586, 0.06728069484233856, 0.07161299139261246, 0.07594528794288635, 0.08027758449316025, 0.08460988104343414, 0.08894218504428864, 0.09327448159456253, 0.09760677814483643, 0.10193907469511032, 0.10627137124538422, 0.11060366779565811, 0.114935964345932, 0.1192682683467865, 0.1236005574464798, 0.1279328614473343, 0.1322651505470276, 0.13659745454788208, 0.14092975854873657, 0.14526204764842987, 0.14959435164928436, 0.15392664074897766, 0.15825894474983215, 0.16259123384952545, 0.16692353785037994, 0.17125582695007324, 0.17558813095092773, 0.17992042005062103, 0.18425272405147552, 0.18858501315116882, 0.19291731715202332, 0.1972496062517166, 0.2015819102525711, 0.2059142142534256]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 1.0, 4.0, 4.0, 3.0, 7.0, 5.0, 14.0, 12.0, 15.0, 17.0, 15.0, 25.0, 26.0, 32.0, 34.0, 31.0, 34.0, 27.0, 50.0, 45.0, 31.0, 39.0, 43.0, 42.0, 38.0, 36.0, 42.0, 42.0, 34.0, 27.0, 32.0, 19.0, 27.0, 20.0, 17.0, 14.0, 18.0, 13.0, 7.0, 11.0, 17.0, 5.0, 9.0, 5.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.09580373764038086, -0.09271527081727982, -0.08962679654359818, -0.08653832972049713, -0.08344985544681549, -0.08036138862371445, -0.0772729218006134, -0.07418444752693176, -0.07109598070383072, -0.06800751388072968, -0.06491903960704803, -0.06183057278394699, -0.05874210223555565, -0.05565363168716431, -0.05256516486406326, -0.04947669431567192, -0.04638822376728058, -0.043299753218889236, -0.040211282670497894, -0.03712281584739685, -0.03403434529900551, -0.030945874750614166, -0.027857406064867973, -0.02476893737912178, -0.021680466830730438, -0.018591996282339096, -0.015503527596592903, -0.012415057979524136, -0.009326588362455368, -0.0062381187453866005, -0.003149649128317833, -6.118044257164001e-05, 0.003027290105819702, 0.00611575972288847, 0.009204229339957237, 0.012292698957026005, 0.015381168574094772, 0.018469639122486115, 0.021558107808232307, 0.0246465764939785, 0.027735047042369843, 0.030823517590761185, 0.03391198813915253, 0.03700045496225357, 0.04008892551064491, 0.043177396059036255, 0.0462658628821373, 0.04935433343052864, 0.05244280397891998, 0.055531274527311325, 0.05861974507570267, 0.06170821189880371, 0.06479668617248535, 0.0678851529955864, 0.07097361981868744, 0.07406209409236908, 0.07715056091547012, 0.08023902773857117, 0.08332750201225281, 0.08641596883535385, 0.0895044356584549, 0.09259290993213654, 0.09568137675523758, 0.09876984357833862, 0.10185831785202026]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 2.0, 3.0, 4.0, 12.0, 16.0, 25.0, 19.0, 31.0, 48.0, 78.0, 125.0, 185.0, 318.0, 531.0, 1214.0, 2942.0, 8911.0, 41510.0, 1063662.0, 3000141.0, 58037.0, 10746.0, 3158.0, 1250.0, 561.0, 282.0, 180.0, 113.0, 54.0, 42.0, 25.0, 26.0, 8.0, 9.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03570556640625, -0.03455686569213867, -0.033408164978027344, -0.032259464263916016, -0.031110763549804688, -0.02996206283569336, -0.02881336212158203, -0.027664661407470703, -0.026515960693359375, -0.025367259979248047, -0.02421855926513672, -0.02306985855102539, -0.021921157836914062, -0.020772457122802734, -0.019623756408691406, -0.018475055694580078, -0.01732635498046875, -0.016177654266357422, -0.015028953552246094, -0.013880252838134766, -0.012731552124023438, -0.01158285140991211, -0.010434150695800781, -0.009285449981689453, -0.008136749267578125, -0.006988048553466797, -0.005839347839355469, -0.004690647125244141, -0.0035419464111328125, -0.0023932456970214844, -0.0012445449829101562, -9.584426879882812e-05, 0.0010528564453125, 0.002201557159423828, 0.0033502578735351562, 0.004498958587646484, 0.0056476593017578125, 0.006796360015869141, 0.007945060729980469, 0.009093761444091797, 0.010242462158203125, 0.011391162872314453, 0.012539863586425781, 0.01368856430053711, 0.014837265014648438, 0.015985965728759766, 0.017134666442871094, 0.018283367156982422, 0.01943206787109375, 0.020580768585205078, 0.021729469299316406, 0.022878170013427734, 0.024026870727539062, 0.02517557144165039, 0.02632427215576172, 0.027472972869873047, 0.028621673583984375, 0.029770374298095703, 0.03091907501220703, 0.03206777572631836, 0.03321647644042969, 0.034365177154541016, 0.035513877868652344, 0.03666257858276367, 0.037811279296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 18.0, 25.0, 27.0, 34.0, 50.0, 71.0, 69.0, 66.0, 84.0, 96.0, 78.0, 99.0, 67.0, 58.0, 45.0, 26.0, 37.0, 9.0, 10.0, 9.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.009368896484375, -0.009078264236450195, -0.00878763198852539, -0.008496999740600586, -0.008206367492675781, -0.007915735244750977, -0.007625102996826172, -0.007334470748901367, -0.0070438385009765625, -0.006753206253051758, -0.006462574005126953, -0.0061719417572021484, -0.005881309509277344, -0.005590677261352539, -0.005300045013427734, -0.00500941276550293, -0.004718780517578125, -0.00442814826965332, -0.004137516021728516, -0.003846883773803711, -0.0035562515258789062, -0.0032656192779541016, -0.002974987030029297, -0.002684354782104492, -0.0023937225341796875, -0.002103090286254883, -0.0018124580383300781, -0.0015218257904052734, -0.0012311935424804688, -0.0009405612945556641, -0.0006499290466308594, -0.0003592967987060547, -6.866455078125e-05, 0.0002219676971435547, 0.0005125999450683594, 0.0008032321929931641, 0.0010938644409179688, 0.0013844966888427734, 0.0016751289367675781, 0.001965761184692383, 0.0022563934326171875, 0.002547025680541992, 0.002837657928466797, 0.0031282901763916016, 0.0034189224243164062, 0.003709554672241211, 0.004000186920166016, 0.00429081916809082, 0.004581451416015625, 0.00487208366394043, 0.005162715911865234, 0.005453348159790039, 0.005743980407714844, 0.0060346126556396484, 0.006325244903564453, 0.006615877151489258, 0.0069065093994140625, 0.007197141647338867, 0.007487773895263672, 0.0077784061431884766, 0.008069038391113281, 0.008359670639038086, 0.00865030288696289, 0.008940935134887695, 0.0092315673828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 11.0, 7.0, 11.0, 15.0, 22.0, 36.0, 49.0, 61.0, 98.0, 184.0, 282.0, 634.0, 1757.0, 6254.0, 31777.0, 698826.0, 3364615.0, 74578.0, 10566.0, 2712.0, 828.0, 400.0, 195.0, 110.0, 76.0, 55.0, 39.0, 22.0, 12.0, 17.0, 9.0, 4.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03253173828125, -0.03145408630371094, -0.030376434326171875, -0.029298782348632812, -0.02822113037109375, -0.027143478393554688, -0.026065826416015625, -0.024988174438476562, -0.0239105224609375, -0.022832870483398438, -0.021755218505859375, -0.020677566528320312, -0.01959991455078125, -0.018522262573242188, -0.017444610595703125, -0.016366958618164062, -0.015289306640625, -0.014211654663085938, -0.013134002685546875, -0.012056350708007812, -0.01097869873046875, -0.009901046752929688, -0.008823394775390625, -0.0077457427978515625, -0.0066680908203125, -0.0055904388427734375, -0.004512786865234375, -0.0034351348876953125, -0.00235748291015625, -0.0012798309326171875, -0.000202178955078125, 0.0008754730224609375, 0.001953125, 0.0030307769775390625, 0.004108428955078125, 0.0051860809326171875, 0.00626373291015625, 0.0073413848876953125, 0.008419036865234375, 0.009496688842773438, 0.0105743408203125, 0.011651992797851562, 0.012729644775390625, 0.013807296752929688, 0.01488494873046875, 0.015962600708007812, 0.017040252685546875, 0.018117904663085938, 0.019195556640625, 0.020273208618164062, 0.021350860595703125, 0.022428512573242188, 0.02350616455078125, 0.024583816528320312, 0.025661468505859375, 0.026739120483398438, 0.0278167724609375, 0.028894424438476562, 0.029972076416015625, 0.031049728393554688, 0.03212738037109375, 0.03320503234863281, 0.034282684326171875, 0.03536033630371094, 0.03643798828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 8.0, 2.0, 9.0, 10.0, 17.0, 22.0, 21.0, 52.0, 119.0, 233.0, 724.0, 1599.0, 719.0, 261.0, 141.0, 60.0, 28.0, 14.0, 13.0, 9.0, 5.0, 2.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01491546630859375, -0.014537572860717773, -0.014159679412841797, -0.01378178596496582, -0.013403892517089844, -0.013025999069213867, -0.01264810562133789, -0.012270212173461914, -0.011892318725585938, -0.011514425277709961, -0.011136531829833984, -0.010758638381958008, -0.010380744934082031, -0.010002851486206055, -0.009624958038330078, -0.009247064590454102, -0.008869171142578125, -0.008491277694702148, -0.008113384246826172, -0.007735490798950195, -0.007357597351074219, -0.006979703903198242, -0.006601810455322266, -0.006223917007446289, -0.0058460235595703125, -0.005468130111694336, -0.005090236663818359, -0.004712343215942383, -0.004334449768066406, -0.00395655632019043, -0.003578662872314453, -0.0032007694244384766, -0.0028228759765625, -0.0024449825286865234, -0.002067089080810547, -0.0016891956329345703, -0.0013113021850585938, -0.0009334087371826172, -0.0005555152893066406, -0.00017762184143066406, 0.0002002716064453125, 0.0005781650543212891, 0.0009560585021972656, 0.0013339519500732422, 0.0017118453979492188, 0.0020897388458251953, 0.002467632293701172, 0.0028455257415771484, 0.003223419189453125, 0.0036013126373291016, 0.003979206085205078, 0.004357099533081055, 0.004734992980957031, 0.005112886428833008, 0.005490779876708984, 0.005868673324584961, 0.0062465667724609375, 0.006624460220336914, 0.007002353668212891, 0.007380247116088867, 0.007758140563964844, 0.00813603401184082, 0.008513927459716797, 0.008891820907592773, 0.00926971435546875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 49.0, 340.0, 493.0, 103.0, 18.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24192523956298828, -0.23437495529651642, -0.22682467103004456, -0.2192743867635727, -0.21172410249710083, -0.20417381823062897, -0.1966235339641571, -0.18907324969768524, -0.18152296543121338, -0.17397268116474152, -0.16642239689826965, -0.1588721126317978, -0.15132182836532593, -0.14377154409885406, -0.1362212598323822, -0.12867097556591034, -0.12112069129943848, -0.11357040703296661, -0.10602012276649475, -0.09846983850002289, -0.09091955423355103, -0.08336926996707916, -0.0758189857006073, -0.06826870143413544, -0.060718417167663574, -0.05316813290119171, -0.04561784863471985, -0.038067564368247986, -0.030517280101776123, -0.02296699583530426, -0.015416711568832397, -0.007866427302360535, -0.0003161430358886719, 0.007234141230583191, 0.014784425497055054, 0.022334709763526917, 0.02988499402999878, 0.03743527829647064, 0.044985562562942505, 0.05253584682941437, 0.06008613109588623, 0.0676364153623581, 0.07518669962882996, 0.08273698389530182, 0.09028726816177368, 0.09783755242824554, 0.10538783669471741, 0.11293812096118927, 0.12048840522766113, 0.128038689494133, 0.13558897376060486, 0.14313925802707672, 0.15068954229354858, 0.15823982656002045, 0.1657901108264923, 0.17334039509296417, 0.18089067935943604, 0.1884409636259079, 0.19599124789237976, 0.20354153215885162, 0.2110918164253235, 0.21864210069179535, 0.2261923849582672, 0.23374266922473907, 0.24129295349121094]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 9.0, 5.0, 8.0, 9.0, 20.0, 18.0, 30.0, 46.0, 53.0, 59.0, 61.0, 54.0, 56.0, 73.0, 61.0, 68.0, 61.0, 52.0, 46.0, 47.0, 41.0, 34.0, 29.0, 14.0, 6.0, 13.0, 10.0, 4.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030660152435302734, -0.029400061815977097, -0.028139973059296608, -0.02687988430261612, -0.02561979368329048, -0.024359703063964844, -0.023099614307284355, -0.021839525550603867, -0.02057943493127823, -0.01931934431195259, -0.018059255555272102, -0.016799166798591614, -0.015539076179265976, -0.014278986491262913, -0.01301889680325985, -0.011758807115256786, -0.010498717427253723, -0.00923862773925066, -0.007978538051247597, -0.0067184483632445335, -0.00545835867524147, -0.004198268987238407, -0.002938179299235344, -0.0016780896112322807, -0.00041799992322921753, 0.0008420897647738457, 0.002102179452776909, 0.003362269140779972, 0.004622358828783035, 0.0058824485167860985, 0.007142538204789162, 0.008402627892792225, 0.009662717580795288, 0.010922807268798351, 0.012182896956801414, 0.013442986644804478, 0.014703076332807541, 0.01596316695213318, 0.017223255708813667, 0.018483344465494156, 0.019743435084819794, 0.02100352570414543, 0.02226361446082592, 0.02352370321750641, 0.024783793836832047, 0.026043884456157684, 0.027303973212838173, 0.02856406196951866, 0.0298241525888443, 0.031084243208169937, 0.032344333827495575, 0.033604420721530914, 0.03486451134085655, 0.03612460196018219, 0.03738468885421753, 0.03864477947354317, 0.039904870092868805, 0.04116496071219444, 0.04242505133152008, 0.04368513822555542, 0.04494522884488106, 0.046205319464206696, 0.047465406358242035, 0.04872549697756767, 0.04998558759689331]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 7.0, 3.0, 0.0, 4.0, 10.0, 10.0, 15.0, 14.0, 22.0, 30.0, 52.0, 79.0, 81.0, 128.0, 195.0, 290.0, 412.0, 732.0, 1275.0, 2494.0, 5932.0, 16201.0, 52594.0, 220383.0, 499032.0, 179790.0, 44252.0, 13941.0, 5190.0, 2275.0, 1147.0, 682.0, 414.0, 253.0, 175.0, 133.0, 94.0, 74.0, 36.0, 40.0, 19.0, 19.0, 8.0, 10.0, 7.0, 2.0, 4.0, 2.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023345947265625, -0.02252483367919922, -0.021703720092773438, -0.020882606506347656, -0.020061492919921875, -0.019240379333496094, -0.018419265747070312, -0.01759815216064453, -0.01677703857421875, -0.01595592498779297, -0.015134811401367188, -0.014313697814941406, -0.013492584228515625, -0.012671470642089844, -0.011850357055664062, -0.011029243469238281, -0.0102081298828125, -0.009387016296386719, -0.008565902709960938, -0.007744789123535156, -0.006923675537109375, -0.006102561950683594, -0.0052814483642578125, -0.004460334777832031, -0.00363922119140625, -0.0028181076049804688, -0.0019969940185546875, -0.0011758804321289062, -0.000354766845703125, 0.00046634674072265625, 0.0012874603271484375, 0.0021085739135742188, 0.0029296875, 0.0037508010864257812, 0.0045719146728515625, 0.005393028259277344, 0.006214141845703125, 0.007035255432128906, 0.007856369018554688, 0.008677482604980469, 0.00949859619140625, 0.010319709777832031, 0.011140823364257812, 0.011961936950683594, 0.012783050537109375, 0.013604164123535156, 0.014425277709960938, 0.015246391296386719, 0.0160675048828125, 0.01688861846923828, 0.017709732055664062, 0.018530845642089844, 0.019351959228515625, 0.020173072814941406, 0.020994186401367188, 0.02181529998779297, 0.02263641357421875, 0.02345752716064453, 0.024278640747070312, 0.025099754333496094, 0.025920867919921875, 0.026741981506347656, 0.027563095092773438, 0.02838420867919922, 0.029205322265625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 22.0, 32.0, 25.0, 45.0, 59.0, 67.0, 77.0, 82.0, 99.0, 96.0, 84.0, 80.0, 66.0, 48.0, 38.0, 20.0, 15.0, 10.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01035308837890625, -0.010053515434265137, -0.009753942489624023, -0.00945436954498291, -0.009154796600341797, -0.008855223655700684, -0.00855565071105957, -0.008256077766418457, -0.007956504821777344, -0.0076569318771362305, -0.007357358932495117, -0.007057785987854004, -0.006758213043212891, -0.006458640098571777, -0.006159067153930664, -0.005859494209289551, -0.0055599212646484375, -0.005260348320007324, -0.004960775375366211, -0.004661202430725098, -0.004361629486083984, -0.004062056541442871, -0.003762483596801758, -0.0034629106521606445, -0.0031633377075195312, -0.002863764762878418, -0.0025641918182373047, -0.0022646188735961914, -0.001965045928955078, -0.0016654729843139648, -0.0013659000396728516, -0.0010663270950317383, -0.000766754150390625, -0.0004671812057495117, -0.00016760826110839844, 0.00013196468353271484, 0.0004315376281738281, 0.0007311105728149414, 0.0010306835174560547, 0.001330256462097168, 0.0016298294067382812, 0.0019294023513793945, 0.002228975296020508, 0.002528548240661621, 0.0028281211853027344, 0.0031276941299438477, 0.003427267074584961, 0.0037268400192260742, 0.0040264129638671875, 0.004325985908508301, 0.004625558853149414, 0.004925131797790527, 0.005224704742431641, 0.005524277687072754, 0.005823850631713867, 0.0061234235763549805, 0.006422996520996094, 0.006722569465637207, 0.00702214241027832, 0.007321715354919434, 0.007621288299560547, 0.00792086124420166, 0.008220434188842773, 0.008520007133483887, 0.008819580078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 8.0, 9.0, 18.0, 12.0, 24.0, 54.0, 79.0, 115.0, 164.0, 313.0, 447.0, 772.0, 1397.0, 2821.0, 5248.0, 10415.0, 22571.0, 51811.0, 132114.0, 308350.0, 296456.0, 124113.0, 48887.0, 21403.0, 9916.0, 5115.0, 2564.0, 1410.0, 788.0, 413.0, 265.0, 181.0, 106.0, 68.0, 26.0, 25.0, 24.0, 17.0, 10.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01358795166015625, -0.013118863105773926, -0.012649774551391602, -0.012180685997009277, -0.011711597442626953, -0.011242508888244629, -0.010773420333862305, -0.01030433177947998, -0.009835243225097656, -0.009366154670715332, -0.008897066116333008, -0.008427977561950684, -0.00795888900756836, -0.007489800453186035, -0.007020711898803711, -0.006551623344421387, -0.0060825347900390625, -0.005613446235656738, -0.005144357681274414, -0.00467526912689209, -0.004206180572509766, -0.0037370920181274414, -0.003268003463745117, -0.002798914909362793, -0.0023298263549804688, -0.0018607378005981445, -0.0013916492462158203, -0.0009225606918334961, -0.0004534721374511719, 1.5616416931152344e-05, 0.00048470497131347656, 0.0009537935256958008, 0.001422882080078125, 0.0018919706344604492, 0.0023610591888427734, 0.0028301477432250977, 0.003299236297607422, 0.003768324851989746, 0.00423741340637207, 0.0047065019607543945, 0.005175590515136719, 0.005644679069519043, 0.006113767623901367, 0.006582856178283691, 0.007051944732666016, 0.00752103328704834, 0.007990121841430664, 0.008459210395812988, 0.008928298950195312, 0.009397387504577637, 0.009866476058959961, 0.010335564613342285, 0.01080465316772461, 0.011273741722106934, 0.011742830276489258, 0.012211918830871582, 0.012681007385253906, 0.01315009593963623, 0.013619184494018555, 0.014088273048400879, 0.014557361602783203, 0.015026450157165527, 0.015495538711547852, 0.015964627265930176, 0.0164337158203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 8.0, 2.0, 5.0, 5.0, 12.0, 11.0, 9.0, 16.0, 21.0, 21.0, 26.0, 29.0, 31.0, 38.0, 41.0, 47.0, 41.0, 31.0, 53.0, 50.0, 39.0, 51.0, 35.0, 43.0, 44.0, 30.0, 34.0, 44.0, 33.0, 21.0, 28.0, 24.0, 16.0, 13.0, 8.0, 17.0, 11.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.022216796875, -0.0215914249420166, -0.020966053009033203, -0.020340681076049805, -0.019715309143066406, -0.019089937210083008, -0.01846456527709961, -0.01783919334411621, -0.017213821411132812, -0.016588449478149414, -0.015963077545166016, -0.015337705612182617, -0.014712333679199219, -0.01408696174621582, -0.013461589813232422, -0.012836217880249023, -0.012210845947265625, -0.011585474014282227, -0.010960102081298828, -0.01033473014831543, -0.009709358215332031, -0.009083986282348633, -0.008458614349365234, -0.007833242416381836, -0.0072078704833984375, -0.006582498550415039, -0.005957126617431641, -0.005331754684448242, -0.004706382751464844, -0.004081010818481445, -0.003455638885498047, -0.0028302669525146484, -0.00220489501953125, -0.0015795230865478516, -0.0009541511535644531, -0.0003287792205810547, 0.00029659271240234375, 0.0009219646453857422, 0.0015473365783691406, 0.002172708511352539, 0.0027980804443359375, 0.003423452377319336, 0.004048824310302734, 0.004674196243286133, 0.005299568176269531, 0.00592494010925293, 0.006550312042236328, 0.0071756839752197266, 0.007801055908203125, 0.008426427841186523, 0.009051799774169922, 0.00967717170715332, 0.010302543640136719, 0.010927915573120117, 0.011553287506103516, 0.012178659439086914, 0.012804031372070312, 0.013429403305053711, 0.01405477523803711, 0.014680147171020508, 0.015305519104003906, 0.015930891036987305, 0.016556262969970703, 0.0171816349029541, 0.0178070068359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 11.0, 9.0, 18.0, 26.0, 42.0, 55.0, 72.0, 148.0, 259.0, 797.0, 2870.0, 17326.0, 275662.0, 686320.0, 56574.0, 5967.0, 1445.0, 423.0, 213.0, 128.0, 63.0, 37.0, 32.0, 15.0, 10.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.0213165283203125, -0.02082347869873047, -0.020330429077148438, -0.019837379455566406, -0.019344329833984375, -0.018851280212402344, -0.018358230590820312, -0.01786518096923828, -0.01737213134765625, -0.01687908172607422, -0.016386032104492188, -0.015892982482910156, -0.015399932861328125, -0.014906883239746094, -0.014413833618164062, -0.013920783996582031, -0.013427734375, -0.012934684753417969, -0.012441635131835938, -0.011948585510253906, -0.011455535888671875, -0.010962486267089844, -0.010469436645507812, -0.009976387023925781, -0.00948333740234375, -0.008990287780761719, -0.008497238159179688, -0.008004188537597656, -0.007511138916015625, -0.007018089294433594, -0.0065250396728515625, -0.006031990051269531, -0.0055389404296875, -0.005045890808105469, -0.0045528411865234375, -0.004059791564941406, -0.003566741943359375, -0.0030736923217773438, -0.0025806427001953125, -0.0020875930786132812, -0.00159454345703125, -0.0011014938354492188, -0.0006084442138671875, -0.00011539459228515625, 0.000377655029296875, 0.0008707046508789062, 0.0013637542724609375, 0.0018568038940429688, 0.002349853515625, 0.0028429031372070312, 0.0033359527587890625, 0.0038290023803710938, 0.004322052001953125, 0.004815101623535156, 0.0053081512451171875, 0.005801200866699219, 0.00629425048828125, 0.006787300109863281, 0.0072803497314453125, 0.007773399353027344, 0.008266448974609375, 0.008759498596191406, 0.009252548217773438, 0.009745597839355469, 0.0102386474609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 8.0, 25.0, 37.0, 90.0, 122.0, 121.0, 179.0, 156.0, 107.0, 66.0, 42.0, 27.0, 16.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.09566879272461e-05, -8.674152195453644e-05, -8.252635598182678e-05, -7.831119000911713e-05, -7.409602403640747e-05, -6.988085806369781e-05, -6.566569209098816e-05, -6.14505261182785e-05, -5.723536014556885e-05, -5.302019417285919e-05, -4.8805028200149536e-05, -4.458986222743988e-05, -4.0374696254730225e-05, -3.615953028202057e-05, -3.194436430931091e-05, -2.7729198336601257e-05, -2.35140323638916e-05, -1.9298866391181946e-05, -1.508370041847229e-05, -1.0868534445762634e-05, -6.6533684730529785e-06, -2.4382025003433228e-06, 1.776963472366333e-06, 5.992129445075989e-06, 1.0207295417785645e-05, 1.44224613904953e-05, 1.8637627363204956e-05, 2.2852793335914612e-05, 2.7067959308624268e-05, 3.128312528133392e-05, 3.549829125404358e-05, 3.9713457226753235e-05, 4.392862319946289e-05, 4.8143789172172546e-05, 5.23589551448822e-05, 5.657412111759186e-05, 6.0789287090301514e-05, 6.500445306301117e-05, 6.921961903572083e-05, 7.343478500843048e-05, 7.764995098114014e-05, 8.186511695384979e-05, 8.608028292655945e-05, 9.02954488992691e-05, 9.451061487197876e-05, 9.872578084468842e-05, 0.00010294094681739807, 0.00010715611279010773, 0.00011137127876281738, 0.00011558644473552704, 0.0001198016107082367, 0.00012401677668094635, 0.000128231942653656, 0.00013244710862636566, 0.00013666227459907532, 0.00014087744057178497, 0.00014509260654449463, 0.00014930777251720428, 0.00015352293848991394, 0.0001577381044626236, 0.00016195327043533325, 0.0001661684364080429, 0.00017038360238075256, 0.00017459876835346222, 0.00017881393432617188]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 5.0, 5.0, 6.0, 10.0, 26.0, 40.0, 37.0, 64.0, 148.0, 232.0, 392.0, 816.0, 1824.0, 5059.0, 18182.0, 94837.0, 435400.0, 390626.0, 77710.0, 15380.0, 4506.0, 1593.0, 711.0, 403.0, 209.0, 132.0, 71.0, 45.0, 24.0, 16.0, 16.0, 9.0, 6.0, 2.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00962066650390625, -0.009309768676757812, -0.008998870849609375, -0.008687973022460938, -0.0083770751953125, -0.008066177368164062, -0.007755279541015625, -0.0074443817138671875, -0.00713348388671875, -0.0068225860595703125, -0.006511688232421875, -0.0062007904052734375, -0.005889892578125, -0.0055789947509765625, -0.005268096923828125, -0.0049571990966796875, -0.00464630126953125, -0.0043354034423828125, -0.004024505615234375, -0.0037136077880859375, -0.0034027099609375, -0.0030918121337890625, -0.002780914306640625, -0.0024700164794921875, -0.00215911865234375, -0.0018482208251953125, -0.001537322998046875, -0.0012264251708984375, -0.00091552734375, -0.0006046295166015625, -0.000293731689453125, 1.71661376953125e-05, 0.00032806396484375, 0.0006389617919921875, 0.000949859619140625, 0.0012607574462890625, 0.0015716552734375, 0.0018825531005859375, 0.002193450927734375, 0.0025043487548828125, 0.00281524658203125, 0.0031261444091796875, 0.003437042236328125, 0.0037479400634765625, 0.004058837890625, 0.0043697357177734375, 0.004680633544921875, 0.0049915313720703125, 0.00530242919921875, 0.0056133270263671875, 0.005924224853515625, 0.0062351226806640625, 0.0065460205078125, 0.0068569183349609375, 0.007167816162109375, 0.0074787139892578125, 0.00778961181640625, 0.008100509643554688, 0.008411407470703125, 0.008722305297851562, 0.009033203125, 0.009344100952148438, 0.009654998779296875, 0.009965896606445312, 0.01027679443359375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 7.0, 4.0, 8.0, 13.0, 18.0, 24.0, 21.0, 31.0, 40.0, 57.0, 63.0, 82.0, 71.0, 89.0, 104.0, 75.0, 70.0, 47.0, 49.0, 27.0, 26.0, 14.0, 11.0, 15.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00922393798828125, -0.00894784927368164, -0.008671760559082031, -0.008395671844482422, -0.008119583129882812, -0.007843494415283203, -0.007567405700683594, -0.007291316986083984, -0.007015228271484375, -0.006739139556884766, -0.006463050842285156, -0.006186962127685547, -0.0059108734130859375, -0.005634784698486328, -0.005358695983886719, -0.005082607269287109, -0.0048065185546875, -0.004530429840087891, -0.004254341125488281, -0.003978252410888672, -0.0037021636962890625, -0.003426074981689453, -0.0031499862670898438, -0.0028738975524902344, -0.002597808837890625, -0.0023217201232910156, -0.0020456314086914062, -0.0017695426940917969, -0.0014934539794921875, -0.0012173652648925781, -0.0009412765502929688, -0.0006651878356933594, -0.00038909912109375, -0.00011301040649414062, 0.00016307830810546875, 0.0004391670227050781, 0.0007152557373046875, 0.0009913444519042969, 0.0012674331665039062, 0.0015435218811035156, 0.001819610595703125, 0.0020956993103027344, 0.0023717880249023438, 0.002647876739501953, 0.0029239654541015625, 0.003200054168701172, 0.0034761428833007812, 0.0037522315979003906, 0.0040283203125, 0.004304409027099609, 0.004580497741699219, 0.004856586456298828, 0.0051326751708984375, 0.005408763885498047, 0.005684852600097656, 0.005960941314697266, 0.006237030029296875, 0.006513118743896484, 0.006789207458496094, 0.007065296173095703, 0.0073413848876953125, 0.007617473602294922, 0.007893562316894531, 0.00816965103149414, 0.00844573974609375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 7.0, 13.0, 10.0, 25.0, 47.0, 71.0, 135.0, 167.0, 181.0, 152.0, 91.0, 46.0, 25.0, 11.0, 12.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17151640355587006, -0.16563548147678375, -0.15975457429885864, -0.15387365221977234, -0.14799273014068604, -0.14211180806159973, -0.13623088598251343, -0.13034997880458832, -0.12446905672550201, -0.11858813464641571, -0.11270722001791, -0.1068263053894043, -0.100945383310318, -0.09506446123123169, -0.08918354660272598, -0.08330263197422028, -0.07742170989513397, -0.07154078781604767, -0.06565987318754196, -0.059778954833745956, -0.05389803647994995, -0.048017118126153946, -0.04213619977235794, -0.036255281418561935, -0.03037436306476593, -0.024493444710969925, -0.01861252635717392, -0.012731608003377914, -0.006850689649581909, -0.0009697712957859039, 0.004911147058010101, 0.010792065411806107, 0.016672998666763306, 0.02255391702055931, 0.028434835374355316, 0.03431575372815132, 0.04019667208194733, 0.04607759043574333, 0.05195850878953934, 0.05783942714333534, 0.06372034549713135, 0.06960126757621765, 0.07548218220472336, 0.08136309683322906, 0.08724401891231537, 0.09312494099140167, 0.09900585561990738, 0.10488677024841309, 0.11076769232749939, 0.1166486144065857, 0.1225295290350914, 0.1284104436635971, 0.1342913657426834, 0.14017228782176971, 0.14605319499969482, 0.15193411707878113, 0.15781503915786743, 0.16369596123695374, 0.16957688331604004, 0.17545779049396515, 0.18133871257305145, 0.18721963465213776, 0.19310054183006287, 0.19898146390914917, 0.20486238598823547]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 9.0, 5.0, 9.0, 12.0, 16.0, 26.0, 21.0, 32.0, 34.0, 41.0, 32.0, 34.0, 44.0, 40.0, 41.0, 48.0, 70.0, 50.0, 44.0, 56.0, 41.0, 41.0, 30.0, 36.0, 34.0, 29.0, 20.0, 20.0, 13.0, 7.0, 15.0, 11.0, 10.0, 5.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1271079182624817, -0.12351687997579575, -0.1199258416891098, -0.11633481085300446, -0.11274377256631851, -0.10915273427963257, -0.10556170344352722, -0.10197066515684128, -0.09837962687015533, -0.09478858858346939, -0.09119755029678345, -0.0876065194606781, -0.08401548117399216, -0.08042444288730621, -0.07683341205120087, -0.07324237376451492, -0.06965133547782898, -0.06606029719114304, -0.06246926262974739, -0.058878228068351746, -0.0552871897816658, -0.05169615149497986, -0.04810511693358421, -0.04451408237218857, -0.040923044085502625, -0.03733200579881668, -0.033740971237421036, -0.03014993481338024, -0.026558898389339447, -0.022967861965298653, -0.01937682554125786, -0.015785789117217064, -0.01219475269317627, -0.008603716269135475, -0.005012679845094681, -0.0014216434210538864, 0.002169393002986908, 0.005760429427027702, 0.009351465851068497, 0.012942502275109291, 0.016533538699150085, 0.02012457512319088, 0.023715611547231674, 0.02730664797127247, 0.030897684395313263, 0.03448872268199921, 0.03807975724339485, 0.0416707918047905, 0.04526183009147644, 0.048852868378162384, 0.05244390293955803, 0.056034937500953674, 0.05962597578763962, 0.06321701407432556, 0.06680804491043091, 0.07039908319711685, 0.0739901214838028, 0.07758115977048874, 0.08117219805717468, 0.08476322889328003, 0.08835426717996597, 0.09194530546665192, 0.09553633630275726, 0.0991273745894432, 0.10271841287612915]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 9.0, 21.0, 46.0, 129.0, 392.0, 1756.0, 18710.0, 4050333.0, 118152.0, 3811.0, 633.0, 195.0, 68.0, 22.0, 9.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033111572265625, -0.030286312103271484, -0.02746105194091797, -0.024635791778564453, -0.021810531616210938, -0.018985271453857422, -0.016160011291503906, -0.01333475112915039, -0.010509490966796875, -0.007684230804443359, -0.004858970642089844, -0.002033710479736328, 0.0007915496826171875, 0.003616809844970703, 0.006442070007324219, 0.009267330169677734, 0.01209259033203125, 0.014917850494384766, 0.01774311065673828, 0.020568370819091797, 0.023393630981445312, 0.026218891143798828, 0.029044151306152344, 0.03186941146850586, 0.034694671630859375, 0.03751993179321289, 0.040345191955566406, 0.04317045211791992, 0.04599571228027344, 0.04882097244262695, 0.05164623260498047, 0.054471492767333984, 0.0572967529296875, 0.060122013092041016, 0.06294727325439453, 0.06577253341674805, 0.06859779357910156, 0.07142305374145508, 0.0742483139038086, 0.07707357406616211, 0.07989883422851562, 0.08272409439086914, 0.08554935455322266, 0.08837461471557617, 0.09119987487792969, 0.0940251350402832, 0.09685039520263672, 0.09967565536499023, 0.10250091552734375, 0.10532617568969727, 0.10815143585205078, 0.1109766960144043, 0.11380195617675781, 0.11662721633911133, 0.11945247650146484, 0.12227773666381836, 0.12510299682617188, 0.1279282569885254, 0.1307535171508789, 0.13357877731323242, 0.13640403747558594, 0.13922929763793945, 0.14205455780029297, 0.14487981796264648, 0.147705078125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 5.0, 20.0, 23.0, 35.0, 37.0, 36.0, 62.0, 90.0, 72.0, 77.0, 74.0, 75.0, 78.0, 68.0, 65.0, 58.0, 35.0, 32.0, 15.0, 11.0, 7.0, 5.0, 8.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0101165771484375, -0.009822249412536621, -0.009527921676635742, -0.009233593940734863, -0.008939266204833984, -0.008644938468933105, -0.008350610733032227, -0.008056282997131348, -0.007761955261230469, -0.00746762752532959, -0.007173299789428711, -0.006878972053527832, -0.006584644317626953, -0.006290316581726074, -0.005995988845825195, -0.005701661109924316, -0.0054073333740234375, -0.005113005638122559, -0.00481867790222168, -0.004524350166320801, -0.004230022430419922, -0.003935694694519043, -0.003641366958618164, -0.003347039222717285, -0.0030527114868164062, -0.0027583837509155273, -0.0024640560150146484, -0.0021697282791137695, -0.0018754005432128906, -0.0015810728073120117, -0.0012867450714111328, -0.000992417335510254, -0.000698089599609375, -0.0004037618637084961, -0.00010943412780761719, 0.00018489360809326172, 0.0004792213439941406, 0.0007735490798950195, 0.0010678768157958984, 0.0013622045516967773, 0.0016565322875976562, 0.0019508600234985352, 0.002245187759399414, 0.002539515495300293, 0.002833843231201172, 0.0031281709671020508, 0.0034224987030029297, 0.0037168264389038086, 0.0040111541748046875, 0.004305481910705566, 0.004599809646606445, 0.004894137382507324, 0.005188465118408203, 0.005482792854309082, 0.005777120590209961, 0.00607144832611084, 0.006365776062011719, 0.006660103797912598, 0.0069544315338134766, 0.0072487592697143555, 0.007543087005615234, 0.007837414741516113, 0.008131742477416992, 0.008426070213317871, 0.00872039794921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 10.0, 9.0, 19.0, 14.0, 20.0, 36.0, 53.0, 69.0, 104.0, 155.0, 260.0, 478.0, 968.0, 2444.0, 7560.0, 33018.0, 339032.0, 3566965.0, 207091.0, 25252.0, 6310.0, 2194.0, 871.0, 469.0, 260.0, 176.0, 128.0, 96.0, 56.0, 32.0, 36.0, 23.0, 10.0, 11.0, 14.0, 17.0, 4.0, 5.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.02435302734375, -0.023496150970458984, -0.02263927459716797, -0.021782398223876953, -0.020925521850585938, -0.020068645477294922, -0.019211769104003906, -0.01835489273071289, -0.017498016357421875, -0.01664113998413086, -0.015784263610839844, -0.014927387237548828, -0.014070510864257812, -0.013213634490966797, -0.012356758117675781, -0.011499881744384766, -0.01064300537109375, -0.009786128997802734, -0.008929252624511719, -0.008072376251220703, -0.0072154998779296875, -0.006358623504638672, -0.005501747131347656, -0.004644870758056641, -0.003787994384765625, -0.0029311180114746094, -0.0020742416381835938, -0.0012173652648925781, -0.0003604888916015625, 0.0004963874816894531, 0.0013532638549804688, 0.0022101402282714844, 0.0030670166015625, 0.003923892974853516, 0.004780769348144531, 0.005637645721435547, 0.0064945220947265625, 0.007351398468017578, 0.008208274841308594, 0.00906515121459961, 0.009922027587890625, 0.01077890396118164, 0.011635780334472656, 0.012492656707763672, 0.013349533081054688, 0.014206409454345703, 0.015063285827636719, 0.015920162200927734, 0.01677703857421875, 0.017633914947509766, 0.01849079132080078, 0.019347667694091797, 0.020204544067382812, 0.021061420440673828, 0.021918296813964844, 0.02277517318725586, 0.023632049560546875, 0.02448892593383789, 0.025345802307128906, 0.026202678680419922, 0.027059555053710938, 0.027916431427001953, 0.02877330780029297, 0.029630184173583984, 0.030487060546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 9.0, 13.0, 28.0, 27.0, 47.0, 59.0, 156.0, 317.0, 766.0, 1451.0, 634.0, 257.0, 119.0, 72.0, 40.0, 29.0, 18.0, 8.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00760650634765625, -0.007213711738586426, -0.0068209171295166016, -0.006428122520446777, -0.006035327911376953, -0.005642533302307129, -0.005249738693237305, -0.0048569440841674805, -0.004464149475097656, -0.004071354866027832, -0.003678560256958008, -0.0032857656478881836, -0.0028929710388183594, -0.002500176429748535, -0.002107381820678711, -0.0017145872116088867, -0.0013217926025390625, -0.0009289979934692383, -0.0005362033843994141, -0.00014340877532958984, 0.0002493858337402344, 0.0006421804428100586, 0.0010349750518798828, 0.001427769660949707, 0.0018205642700195312, 0.0022133588790893555, 0.0026061534881591797, 0.002998948097229004, 0.003391742706298828, 0.0037845373153686523, 0.0041773319244384766, 0.004570126533508301, 0.004962921142578125, 0.005355715751647949, 0.0057485103607177734, 0.006141304969787598, 0.006534099578857422, 0.006926894187927246, 0.00731968879699707, 0.0077124834060668945, 0.008105278015136719, 0.008498072624206543, 0.008890867233276367, 0.009283661842346191, 0.009676456451416016, 0.01006925106048584, 0.010462045669555664, 0.010854840278625488, 0.011247634887695312, 0.011640429496765137, 0.012033224105834961, 0.012426018714904785, 0.01281881332397461, 0.013211607933044434, 0.013604402542114258, 0.013997197151184082, 0.014389991760253906, 0.01478278636932373, 0.015175580978393555, 0.015568375587463379, 0.015961170196533203, 0.016353964805603027, 0.01674675941467285, 0.017139554023742676, 0.0175323486328125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 9.0, 100.0, 415.0, 371.0, 90.0, 13.0, 10.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.34768426418304443, -0.34057748317718506, -0.3334707021713257, -0.3263639509677887, -0.3192571699619293, -0.31215038895606995, -0.30504360795021057, -0.2979368567466736, -0.2908300757408142, -0.28372329473495483, -0.27661651372909546, -0.26950976252555847, -0.2624029815196991, -0.2552962005138397, -0.24818943440914154, -0.24108265340328217, -0.23397588729858398, -0.2268691062927246, -0.21976234018802643, -0.21265555918216705, -0.20554879307746887, -0.1984420120716095, -0.19133524596691132, -0.18422846496105194, -0.17712168395519257, -0.1700149029493332, -0.162908136844635, -0.15580135583877563, -0.14869458973407745, -0.14158780872821808, -0.1344810426235199, -0.12737426161766052, -0.12026749551296234, -0.11316072195768356, -0.10605394840240479, -0.09894717484712601, -0.09184040129184723, -0.08473362028598785, -0.07762685418128967, -0.0705200731754303, -0.06341330707073212, -0.05630653351545334, -0.04919975996017456, -0.04209298640489578, -0.034986212849617004, -0.027879435569047928, -0.02077266201376915, -0.013665888458490372, -0.006559111177921295, 0.0005476628430187702, 0.007654436863958836, 0.014761211350560188, 0.021867984905838966, 0.028974760323762894, 0.03608153387904167, 0.04318830743432045, 0.05029508098959923, 0.057401854544878006, 0.06450863182544708, 0.07161540538072586, 0.07872217893600464, 0.08582895249128342, 0.0929357260465622, 0.10004249960184097, 0.10714927315711975]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 3.0, 14.0, 10.0, 14.0, 17.0, 30.0, 35.0, 47.0, 56.0, 47.0, 61.0, 51.0, 74.0, 76.0, 69.0, 50.0, 63.0, 46.0, 50.0, 40.0, 27.0, 37.0, 22.0, 16.0, 11.0, 16.0, 10.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03694802522659302, -0.03555016219615936, -0.03415229916572571, -0.03275443613529205, -0.0313565731048584, -0.029958710074424744, -0.02856084704399109, -0.027162984013557434, -0.02576512098312378, -0.024367257952690125, -0.02296939492225647, -0.021571531891822815, -0.02017366886138916, -0.018775805830955505, -0.01737794280052185, -0.015980079770088196, -0.014582216739654541, -0.013184353709220886, -0.011786490678787231, -0.010388627648353577, -0.008990764617919922, -0.007592901587486267, -0.006195038557052612, -0.0047971755266189575, -0.0033993124961853027, -0.002001449465751648, -0.0006035864353179932, 0.0007942765951156616, 0.0021921396255493164, 0.003590002655982971, 0.004987865686416626, 0.006385728716850281, 0.0077835917472839355, 0.00918145477771759, 0.010579317808151245, 0.0119771808385849, 0.013375043869018555, 0.01477290689945221, 0.016170769929885864, 0.01756863296031952, 0.018966495990753174, 0.02036435902118683, 0.021762222051620483, 0.023160085082054138, 0.024557948112487793, 0.025955811142921448, 0.027353674173355103, 0.028751537203788757, 0.030149400234222412, 0.03154726326465607, 0.03294512629508972, 0.034342989325523376, 0.03574085235595703, 0.037138715386390686, 0.03853657841682434, 0.039934441447257996, 0.04133230447769165, 0.042730167508125305, 0.04412803053855896, 0.045525893568992615, 0.04692375659942627, 0.048321619629859924, 0.04971948266029358, 0.051117345690727234, 0.05251520872116089]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 10.0, 5.0, 9.0, 10.0, 20.0, 22.0, 31.0, 32.0, 48.0, 75.0, 116.0, 151.0, 250.0, 392.0, 731.0, 1314.0, 2555.0, 5505.0, 13615.0, 45158.0, 284295.0, 573536.0, 84667.0, 20831.0, 7721.0, 3436.0, 1637.0, 914.0, 529.0, 298.0, 178.0, 136.0, 66.0, 78.0, 43.0, 35.0, 29.0, 13.0, 13.0, 15.0, 11.0, 4.0, 7.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.048919677734375, -0.047489166259765625, -0.04605865478515625, -0.044628143310546875, -0.0431976318359375, -0.041767120361328125, -0.04033660888671875, -0.038906097412109375, -0.0374755859375, -0.036045074462890625, -0.03461456298828125, -0.033184051513671875, -0.0317535400390625, -0.030323028564453125, -0.02889251708984375, -0.027462005615234375, -0.026031494140625, -0.024600982666015625, -0.02317047119140625, -0.021739959716796875, -0.0203094482421875, -0.018878936767578125, -0.01744842529296875, -0.016017913818359375, -0.01458740234375, -0.013156890869140625, -0.01172637939453125, -0.010295867919921875, -0.0088653564453125, -0.007434844970703125, -0.00600433349609375, -0.004573822021484375, -0.003143310546875, -0.001712799072265625, -0.00028228759765625, 0.001148223876953125, 0.0025787353515625, 0.004009246826171875, 0.00543975830078125, 0.006870269775390625, 0.00830078125, 0.009731292724609375, 0.01116180419921875, 0.012592315673828125, 0.0140228271484375, 0.015453338623046875, 0.01688385009765625, 0.018314361572265625, 0.019744873046875, 0.021175384521484375, 0.02260589599609375, 0.024036407470703125, 0.0254669189453125, 0.026897430419921875, 0.02832794189453125, 0.029758453369140625, 0.03118896484375, 0.032619476318359375, 0.03404998779296875, 0.035480499267578125, 0.0369110107421875, 0.038341522216796875, 0.03977203369140625, 0.041202545166015625, 0.042633056640625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 0.0, 6.0, 6.0, 7.0, 15.0, 19.0, 32.0, 29.0, 40.0, 58.0, 62.0, 70.0, 78.0, 83.0, 60.0, 60.0, 55.0, 68.0, 63.0, 54.0, 47.0, 24.0, 19.0, 14.0, 7.0, 6.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.00827789306640625, -0.008011341094970703, -0.007744789123535156, -0.007478237152099609, -0.0072116851806640625, -0.006945133209228516, -0.006678581237792969, -0.006412029266357422, -0.006145477294921875, -0.005878925323486328, -0.005612373352050781, -0.005345821380615234, -0.0050792694091796875, -0.004812717437744141, -0.004546165466308594, -0.004279613494873047, -0.0040130615234375, -0.003746509552001953, -0.0034799575805664062, -0.0032134056091308594, -0.0029468536376953125, -0.0026803016662597656, -0.0024137496948242188, -0.002147197723388672, -0.001880645751953125, -0.0016140937805175781, -0.0013475418090820312, -0.0010809898376464844, -0.0008144378662109375, -0.0005478858947753906, -0.00028133392333984375, -1.4781951904296875e-05, 0.00025177001953125, 0.0005183219909667969, 0.0007848739624023438, 0.0010514259338378906, 0.0013179779052734375, 0.0015845298767089844, 0.0018510818481445312, 0.002117633819580078, 0.002384185791015625, 0.002650737762451172, 0.0029172897338867188, 0.0031838417053222656, 0.0034503936767578125, 0.0037169456481933594, 0.003983497619628906, 0.004250049591064453, 0.0045166015625, 0.004783153533935547, 0.005049705505371094, 0.005316257476806641, 0.0055828094482421875, 0.005849361419677734, 0.006115913391113281, 0.006382465362548828, 0.006649017333984375, 0.006915569305419922, 0.007182121276855469, 0.007448673248291016, 0.0077152252197265625, 0.00798177719116211, 0.008248329162597656, 0.008514881134033203, 0.00878143310546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 3.0, 8.0, 11.0, 16.0, 18.0, 29.0, 33.0, 43.0, 80.0, 96.0, 150.0, 248.0, 356.0, 572.0, 1015.0, 1757.0, 3078.0, 5950.0, 12223.0, 28059.0, 76167.0, 250063.0, 422668.0, 155181.0, 50828.0, 20264.0, 9105.0, 4534.0, 2417.0, 1367.0, 772.0, 495.0, 313.0, 208.0, 122.0, 82.0, 71.0, 44.0, 32.0, 15.0, 18.0, 16.0, 8.0, 5.0, 3.0, 7.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0], "bins": [-0.020111083984375, -0.019524812698364258, -0.018938541412353516, -0.018352270126342773, -0.01776599884033203, -0.01717972755432129, -0.016593456268310547, -0.016007184982299805, -0.015420913696289062, -0.01483464241027832, -0.014248371124267578, -0.013662099838256836, -0.013075828552246094, -0.012489557266235352, -0.01190328598022461, -0.011317014694213867, -0.010730743408203125, -0.010144472122192383, -0.00955820083618164, -0.008971929550170898, -0.008385658264160156, -0.007799386978149414, -0.007213115692138672, -0.00662684440612793, -0.0060405731201171875, -0.005454301834106445, -0.004868030548095703, -0.004281759262084961, -0.0036954879760742188, -0.0031092166900634766, -0.0025229454040527344, -0.0019366741180419922, -0.00135040283203125, -0.0007641315460205078, -0.00017786026000976562, 0.00040841102600097656, 0.0009946823120117188, 0.001580953598022461, 0.002167224884033203, 0.0027534961700439453, 0.0033397674560546875, 0.00392603874206543, 0.004512310028076172, 0.005098581314086914, 0.005684852600097656, 0.0062711238861083984, 0.006857395172119141, 0.007443666458129883, 0.008029937744140625, 0.008616209030151367, 0.00920248031616211, 0.009788751602172852, 0.010375022888183594, 0.010961294174194336, 0.011547565460205078, 0.01213383674621582, 0.012720108032226562, 0.013306379318237305, 0.013892650604248047, 0.014478921890258789, 0.015065193176269531, 0.015651464462280273, 0.016237735748291016, 0.016824007034301758, 0.0174102783203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 8.0, 10.0, 6.0, 9.0, 17.0, 20.0, 25.0, 34.0, 37.0, 51.0, 36.0, 41.0, 36.0, 46.0, 48.0, 64.0, 46.0, 43.0, 52.0, 44.0, 47.0, 45.0, 35.0, 25.0, 32.0, 27.0, 25.0, 18.0, 10.0, 11.0, 6.0, 11.0, 8.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02093505859375, -0.020252227783203125, -0.01956939697265625, -0.018886566162109375, -0.0182037353515625, -0.017520904541015625, -0.01683807373046875, -0.016155242919921875, -0.015472412109375, -0.014789581298828125, -0.01410675048828125, -0.013423919677734375, -0.0127410888671875, -0.012058258056640625, -0.01137542724609375, -0.010692596435546875, -0.010009765625, -0.009326934814453125, -0.00864410400390625, -0.007961273193359375, -0.0072784423828125, -0.006595611572265625, -0.00591278076171875, -0.005229949951171875, -0.004547119140625, -0.003864288330078125, -0.00318145751953125, -0.002498626708984375, -0.0018157958984375, -0.001132965087890625, -0.00045013427734375, 0.000232696533203125, 0.00091552734375, 0.001598358154296875, 0.00228118896484375, 0.002964019775390625, 0.0036468505859375, 0.004329681396484375, 0.00501251220703125, 0.005695343017578125, 0.006378173828125, 0.007061004638671875, 0.00774383544921875, 0.008426666259765625, 0.0091094970703125, 0.009792327880859375, 0.01047515869140625, 0.011157989501953125, 0.0118408203125, 0.012523651123046875, 0.01320648193359375, 0.013889312744140625, 0.0145721435546875, 0.015254974365234375, 0.01593780517578125, 0.016620635986328125, 0.017303466796875, 0.017986297607421875, 0.01866912841796875, 0.019351959228515625, 0.0200347900390625, 0.020717620849609375, 0.02140045166015625, 0.022083282470703125, 0.02276611328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 13.0, 9.0, 13.0, 11.0, 22.0, 21.0, 19.0, 32.0, 41.0, 55.0, 87.0, 124.0, 188.0, 419.0, 931.0, 3531.0, 52239.0, 951563.0, 34519.0, 2928.0, 799.0, 368.0, 191.0, 130.0, 72.0, 56.0, 40.0, 26.0, 30.0, 17.0, 11.0, 12.0, 7.0, 3.0, 12.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.033111572265625, -0.03217744827270508, -0.031243324279785156, -0.030309200286865234, -0.029375076293945312, -0.02844095230102539, -0.02750682830810547, -0.026572704315185547, -0.025638580322265625, -0.024704456329345703, -0.02377033233642578, -0.02283620834350586, -0.021902084350585938, -0.020967960357666016, -0.020033836364746094, -0.019099712371826172, -0.01816558837890625, -0.017231464385986328, -0.016297340393066406, -0.015363216400146484, -0.014429092407226562, -0.01349496841430664, -0.012560844421386719, -0.011626720428466797, -0.010692596435546875, -0.009758472442626953, -0.008824348449707031, -0.00789022445678711, -0.0069561004638671875, -0.006021976470947266, -0.005087852478027344, -0.004153728485107422, -0.0032196044921875, -0.002285480499267578, -0.0013513565063476562, -0.0004172325134277344, 0.0005168914794921875, 0.0014510154724121094, 0.0023851394653320312, 0.003319263458251953, 0.004253387451171875, 0.005187511444091797, 0.006121635437011719, 0.007055759429931641, 0.007989883422851562, 0.008924007415771484, 0.009858131408691406, 0.010792255401611328, 0.01172637939453125, 0.012660503387451172, 0.013594627380371094, 0.014528751373291016, 0.015462875366210938, 0.01639699935913086, 0.01733112335205078, 0.018265247344970703, 0.019199371337890625, 0.020133495330810547, 0.02106761932373047, 0.02200174331665039, 0.022935867309570312, 0.023869991302490234, 0.024804115295410156, 0.025738239288330078, 0.02667236328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 14.0, 37.0, 98.0, 327.0, 358.0, 121.0, 33.0, 11.0, 10.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002512931823730469, -0.00023876875638961792, -0.00022624433040618896, -0.00021371990442276, -0.00020119547843933105, -0.0001886710524559021, -0.00017614662647247314, -0.0001636222004890442, -0.00015109777450561523, -0.00013857334852218628, -0.00012604892253875732, -0.00011352449655532837, -0.00010100007057189941, -8.847564458847046e-05, -7.59512186050415e-05, -6.342679262161255e-05, -5.0902366638183594e-05, -3.837794065475464e-05, -2.5853514671325684e-05, -1.3329088687896729e-05, -8.046627044677734e-07, 1.1719763278961182e-05, 2.4244189262390137e-05, 3.676861524581909e-05, 4.929304122924805e-05, 6.1817467212677e-05, 7.434189319610596e-05, 8.686631917953491e-05, 9.939074516296387e-05, 0.00011191517114639282, 0.00012443959712982178, 0.00013696402311325073, 0.0001494884490966797, 0.00016201287508010864, 0.0001745373010635376, 0.00018706172704696655, 0.0001995861530303955, 0.00021211057901382446, 0.00022463500499725342, 0.00023715943098068237, 0.00024968385696411133, 0.0002622082829475403, 0.00027473270893096924, 0.0002872571349143982, 0.00029978156089782715, 0.0003123059868812561, 0.00032483041286468506, 0.000337354838848114, 0.00034987926483154297, 0.0003624036908149719, 0.0003749281167984009, 0.00038745254278182983, 0.0003999769687652588, 0.00041250139474868774, 0.0004250258207321167, 0.00043755024671554565, 0.0004500746726989746, 0.00046259909868240356, 0.0004751235246658325, 0.0004876479506492615, 0.0005001723766326904, 0.0005126968026161194, 0.0005252212285995483, 0.0005377456545829773, 0.0005502700805664062]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 5.0, 1.0, 11.0, 15.0, 42.0, 69.0, 140.0, 323.0, 854.0, 3520.0, 52898.0, 946788.0, 39454.0, 3140.0, 760.0, 260.0, 123.0, 53.0, 36.0, 24.0, 16.0, 7.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033477783203125, -0.03262948989868164, -0.03178119659423828, -0.030932903289794922, -0.030084609985351562, -0.029236316680908203, -0.028388023376464844, -0.027539730072021484, -0.026691436767578125, -0.025843143463134766, -0.024994850158691406, -0.024146556854248047, -0.023298263549804688, -0.022449970245361328, -0.02160167694091797, -0.02075338363647461, -0.01990509033203125, -0.01905679702758789, -0.01820850372314453, -0.017360210418701172, -0.016511917114257812, -0.015663623809814453, -0.014815330505371094, -0.013967037200927734, -0.013118743896484375, -0.012270450592041016, -0.011422157287597656, -0.010573863983154297, -0.009725570678710938, -0.008877277374267578, -0.008028984069824219, -0.007180690765380859, -0.0063323974609375, -0.005484104156494141, -0.004635810852050781, -0.003787517547607422, -0.0029392242431640625, -0.002090930938720703, -0.0012426376342773438, -0.0003943443298339844, 0.000453948974609375, 0.0013022422790527344, 0.0021505355834960938, 0.002998828887939453, 0.0038471221923828125, 0.004695415496826172, 0.005543708801269531, 0.006392002105712891, 0.00724029541015625, 0.00808858871459961, 0.008936882019042969, 0.009785175323486328, 0.010633468627929688, 0.011481761932373047, 0.012330055236816406, 0.013178348541259766, 0.014026641845703125, 0.014874935150146484, 0.015723228454589844, 0.016571521759033203, 0.017419815063476562, 0.018268108367919922, 0.01911640167236328, 0.01996469497680664, 0.02081298828125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 7.0, 8.0, 16.0, 24.0, 42.0, 79.0, 123.0, 168.0, 181.0, 149.0, 90.0, 51.0, 26.0, 12.0, 9.0, 5.0, 4.0, 4.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.032867431640625, -0.03218567371368408, -0.031503915786743164, -0.030822157859802246, -0.030140399932861328, -0.02945864200592041, -0.028776884078979492, -0.028095126152038574, -0.027413368225097656, -0.02673161029815674, -0.02604985237121582, -0.025368094444274902, -0.024686336517333984, -0.024004578590393066, -0.02332282066345215, -0.02264106273651123, -0.021959304809570312, -0.021277546882629395, -0.020595788955688477, -0.01991403102874756, -0.01923227310180664, -0.018550515174865723, -0.017868757247924805, -0.017186999320983887, -0.01650524139404297, -0.01582348346710205, -0.015141725540161133, -0.014459967613220215, -0.013778209686279297, -0.013096451759338379, -0.012414693832397461, -0.011732935905456543, -0.011051177978515625, -0.010369420051574707, -0.009687662124633789, -0.009005904197692871, -0.008324146270751953, -0.007642388343811035, -0.006960630416870117, -0.006278872489929199, -0.005597114562988281, -0.004915356636047363, -0.004233598709106445, -0.0035518407821655273, -0.0028700828552246094, -0.0021883249282836914, -0.0015065670013427734, -0.0008248090744018555, -0.0001430511474609375, 0.0005387067794799805, 0.0012204647064208984, 0.0019022226333618164, 0.0025839805603027344, 0.0032657384872436523, 0.00394749641418457, 0.004629254341125488, 0.005311012268066406, 0.005992770195007324, 0.006674528121948242, 0.00735628604888916, 0.008038043975830078, 0.008719801902770996, 0.009401559829711914, 0.010083317756652832, 0.01076507568359375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 30.0, 63.0, 222.0, 385.0, 194.0, 81.0, 17.0, 10.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24824097752571106, -0.23308803141117096, -0.21793508529663086, -0.20278215408325195, -0.18762919306755066, -0.17247626185417175, -0.15732331573963165, -0.14217036962509155, -0.12701742351055145, -0.11186447739601135, -0.09671153128147125, -0.08155859261751175, -0.06640564650297165, -0.05125270038843155, -0.036099761724472046, -0.020946815609931946, -0.005793869495391846, 0.009359074756503105, 0.024512019008398056, 0.03966496139764786, 0.05481790751218796, 0.06997085362672806, 0.08512379229068756, 0.10027673840522766, 0.11542968451976776, 0.13058263063430786, 0.14573557674884796, 0.16088852286338806, 0.17604145407676697, 0.19119441509246826, 0.20634734630584717, 0.22150029242038727, 0.23665326833724976, 0.25180619955062866, 0.26695916056632996, 0.28211209177970886, 0.29726505279541016, 0.31241798400878906, 0.32757091522216797, 0.34272387623786926, 0.35787683725357056, 0.37302976846694946, 0.38818272948265076, 0.40333566069602966, 0.41848862171173096, 0.43364155292510986, 0.44879448413848877, 0.46394744515419006, 0.47910037636756897, 0.4942533075809479, 0.5094062685966492, 0.5245591998100281, 0.539712131023407, 0.5548651218414307, 0.5700180530548096, 0.5851709842681885, 0.6003239154815674, 0.6154768466949463, 0.6306297779083252, 0.6457827687263489, 0.6609356999397278, 0.6760886311531067, 0.6912415623664856, 0.7063945531845093, 0.7215474843978882]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 11.0, 5.0, 11.0, 9.0, 15.0, 15.0, 15.0, 13.0, 18.0, 20.0, 28.0, 26.0, 31.0, 31.0, 38.0, 33.0, 36.0, 35.0, 41.0, 52.0, 42.0, 38.0, 33.0, 41.0, 41.0, 41.0, 26.0, 28.0, 27.0, 26.0, 32.0, 23.0, 18.0, 14.0, 15.0, 16.0, 8.0, 8.0, 5.0, 7.0, 9.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08281546831130981, -0.0800701454281807, -0.07732482254505157, -0.07457949221134186, -0.07183416932821274, -0.06908884644508362, -0.0663435161113739, -0.06359819322824478, -0.06085287034511566, -0.05810754746198654, -0.05536222085356712, -0.052616894245147705, -0.049871571362018585, -0.047126248478889465, -0.04438092187047005, -0.04163559526205063, -0.03889027237892151, -0.03614494949579239, -0.03339962288737297, -0.0306542981415987, -0.027908973395824432, -0.025163648650050163, -0.022418323904275894, -0.019672999158501625, -0.016927674412727356, -0.014182349666953087, -0.011437024921178818, -0.008691700175404549, -0.0059463754296302795, -0.0032010506838560104, -0.00045572593808174133, 0.0022895988076925278, 0.005034923553466797, 0.007780248299241066, 0.010525573045015335, 0.013270897790789604, 0.016016222536563873, 0.018761547282338142, 0.02150687202811241, 0.02425219677388668, 0.02699752151966095, 0.02974284626543522, 0.03248817101120949, 0.035233497619628906, 0.037978820502758026, 0.040724143385887146, 0.043469469994306564, 0.04621479660272598, 0.0489601194858551, 0.05170544236898422, 0.05445076897740364, 0.05719609558582306, 0.05994141846895218, 0.0626867413520813, 0.06543207168579102, 0.06817739456892014, 0.07092271745204926, 0.07366804033517838, 0.0764133632183075, 0.07915869355201721, 0.08190401643514633, 0.08464933931827545, 0.08739466965198517, 0.09013999253511429, 0.09288531541824341]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 4.0, 12.0, 20.0, 18.0, 48.0, 57.0, 125.0, 169.0, 341.0, 732.0, 1769.0, 6132.0, 45814.0, 3948748.0, 174330.0, 11026.0, 2826.0, 1057.0, 449.0, 255.0, 143.0, 76.0, 52.0, 24.0, 11.0, 11.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05950927734375, -0.057793617248535156, -0.05607795715332031, -0.05436229705810547, -0.052646636962890625, -0.05093097686767578, -0.04921531677246094, -0.047499656677246094, -0.04578399658203125, -0.044068336486816406, -0.04235267639160156, -0.04063701629638672, -0.038921356201171875, -0.03720569610595703, -0.03549003601074219, -0.033774375915527344, -0.0320587158203125, -0.030343055725097656, -0.028627395629882812, -0.02691173553466797, -0.025196075439453125, -0.02348041534423828, -0.021764755249023438, -0.020049095153808594, -0.01833343505859375, -0.016617774963378906, -0.014902114868164062, -0.013186454772949219, -0.011470794677734375, -0.009755134582519531, -0.008039474487304688, -0.006323814392089844, -0.004608154296875, -0.0028924942016601562, -0.0011768341064453125, 0.0005388259887695312, 0.002254486083984375, 0.003970146179199219, 0.0056858062744140625, 0.007401466369628906, 0.00911712646484375, 0.010832786560058594, 0.012548446655273438, 0.014264106750488281, 0.015979766845703125, 0.01769542694091797, 0.019411087036132812, 0.021126747131347656, 0.0228424072265625, 0.024558067321777344, 0.026273727416992188, 0.02798938751220703, 0.029705047607421875, 0.03142070770263672, 0.03313636779785156, 0.034852027893066406, 0.03656768798828125, 0.038283348083496094, 0.03999900817871094, 0.04171466827392578, 0.043430328369140625, 0.04514598846435547, 0.04686164855957031, 0.048577308654785156, 0.05029296875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 5.0, 6.0, 6.0, 7.0, 12.0, 21.0, 22.0, 36.0, 50.0, 43.0, 60.0, 70.0, 78.0, 76.0, 74.0, 78.0, 65.0, 56.0, 59.0, 55.0, 35.0, 22.0, 19.0, 11.0, 8.0, 11.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.00853729248046875, -0.008262872695922852, -0.007988452911376953, -0.007714033126831055, -0.007439613342285156, -0.007165193557739258, -0.006890773773193359, -0.006616353988647461, -0.0063419342041015625, -0.006067514419555664, -0.005793094635009766, -0.005518674850463867, -0.005244255065917969, -0.00496983528137207, -0.004695415496826172, -0.0044209957122802734, -0.004146575927734375, -0.0038721561431884766, -0.003597736358642578, -0.0033233165740966797, -0.0030488967895507812, -0.002774477005004883, -0.0025000572204589844, -0.002225637435913086, -0.0019512176513671875, -0.001676797866821289, -0.0014023780822753906, -0.0011279582977294922, -0.0008535385131835938, -0.0005791187286376953, -0.0003046989440917969, -3.0279159545898438e-05, 0.000244140625, 0.0005185604095458984, 0.0007929801940917969, 0.0010673999786376953, 0.0013418197631835938, 0.0016162395477294922, 0.0018906593322753906, 0.002165079116821289, 0.0024394989013671875, 0.002713918685913086, 0.0029883384704589844, 0.003262758255004883, 0.0035371780395507812, 0.0038115978240966797, 0.004086017608642578, 0.0043604373931884766, 0.004634857177734375, 0.0049092769622802734, 0.005183696746826172, 0.00545811653137207, 0.005732536315917969, 0.006006956100463867, 0.006281375885009766, 0.006555795669555664, 0.0068302154541015625, 0.007104635238647461, 0.007379055023193359, 0.007653474807739258, 0.007927894592285156, 0.008202314376831055, 0.008476734161376953, 0.008751153945922852, 0.00902557373046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 11.0, 9.0, 27.0, 40.0, 89.0, 172.0, 296.0, 577.0, 1353.0, 3643.0, 16714.0, 389293.0, 3726253.0, 45508.0, 6388.0, 2041.0, 906.0, 436.0, 238.0, 123.0, 80.0, 47.0, 12.0, 13.0, 7.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0335693359375, -0.032183170318603516, -0.03079700469970703, -0.029410839080810547, -0.028024673461914062, -0.026638507843017578, -0.025252342224121094, -0.02386617660522461, -0.022480010986328125, -0.02109384536743164, -0.019707679748535156, -0.018321514129638672, -0.016935348510742188, -0.015549182891845703, -0.014163017272949219, -0.012776851654052734, -0.01139068603515625, -0.010004520416259766, -0.008618354797363281, -0.007232189178466797, -0.0058460235595703125, -0.004459857940673828, -0.0030736923217773438, -0.0016875267028808594, -0.000301361083984375, 0.0010848045349121094, 0.0024709701538085938, 0.003857135772705078, 0.0052433013916015625, 0.006629467010498047, 0.008015632629394531, 0.009401798248291016, 0.0107879638671875, 0.012174129486083984, 0.013560295104980469, 0.014946460723876953, 0.016332626342773438, 0.017718791961669922, 0.019104957580566406, 0.02049112319946289, 0.021877288818359375, 0.02326345443725586, 0.024649620056152344, 0.026035785675048828, 0.027421951293945312, 0.028808116912841797, 0.03019428253173828, 0.031580448150634766, 0.03296661376953125, 0.034352779388427734, 0.03573894500732422, 0.0371251106262207, 0.03851127624511719, 0.03989744186401367, 0.041283607482910156, 0.04266977310180664, 0.044055938720703125, 0.04544210433959961, 0.046828269958496094, 0.04821443557739258, 0.04960060119628906, 0.05098676681518555, 0.05237293243408203, 0.053759098052978516, 0.055145263671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 9.0, 15.0, 26.0, 87.0, 188.0, 804.0, 2233.0, 467.0, 143.0, 51.0, 19.0, 12.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0225067138671875, -0.021919727325439453, -0.021332740783691406, -0.02074575424194336, -0.020158767700195312, -0.019571781158447266, -0.01898479461669922, -0.018397808074951172, -0.017810821533203125, -0.017223834991455078, -0.01663684844970703, -0.016049861907958984, -0.015462875366210938, -0.01487588882446289, -0.014288902282714844, -0.013701915740966797, -0.01311492919921875, -0.012527942657470703, -0.011940956115722656, -0.01135396957397461, -0.010766983032226562, -0.010179996490478516, -0.009593009948730469, -0.009006023406982422, -0.008419036865234375, -0.007832050323486328, -0.007245063781738281, -0.006658077239990234, -0.0060710906982421875, -0.005484104156494141, -0.004897117614746094, -0.004310131072998047, -0.00372314453125, -0.003136157989501953, -0.0025491714477539062, -0.0019621849060058594, -0.0013751983642578125, -0.0007882118225097656, -0.00020122528076171875, 0.0003857612609863281, 0.000972747802734375, 0.0015597343444824219, 0.0021467208862304688, 0.0027337074279785156, 0.0033206939697265625, 0.003907680511474609, 0.004494667053222656, 0.005081653594970703, 0.00566864013671875, 0.006255626678466797, 0.006842613220214844, 0.007429599761962891, 0.008016586303710938, 0.008603572845458984, 0.009190559387207031, 0.009777545928955078, 0.010364532470703125, 0.010951519012451172, 0.011538505554199219, 0.012125492095947266, 0.012712478637695312, 0.01329946517944336, 0.013886451721191406, 0.014473438262939453, 0.0150604248046875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 13.0, 36.0, 59.0, 120.0, 195.0, 216.0, 180.0, 86.0, 48.0, 15.0, 14.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09401434659957886, -0.09120509773492813, -0.0883958488702774, -0.08558660745620728, -0.08277735859155655, -0.07996810972690582, -0.0771588608622551, -0.07434961199760437, -0.07154036313295364, -0.06873111426830292, -0.06592186540365219, -0.06311261653900146, -0.06030337139964104, -0.05749412626028061, -0.05468487739562988, -0.051875628530979156, -0.04906638339161873, -0.046257134526968, -0.043447889387607574, -0.04063864052295685, -0.03782939165830612, -0.035020142793655396, -0.03221089765429497, -0.02940164878964424, -0.026592401787638664, -0.023783154785633087, -0.02097390592098236, -0.018164658918976784, -0.015355410985648632, -0.01254616305232048, -0.009736916050314903, -0.006927667185664177, -0.0041184201836586, -0.0013091724831610918, 0.0015000752173364162, 0.004309322685003281, 0.007118570618331432, 0.009927818551659584, 0.012737065553665161, 0.015546314418315887, 0.018355561420321465, 0.02116480842232704, 0.023974057286977768, 0.026783304288983345, 0.029592551290988922, 0.03240180015563965, 0.035211049020290375, 0.0380202978849411, 0.04082954302430153, 0.043638791888952255, 0.04644803702831268, 0.04925728589296341, 0.052066534757614136, 0.05487578362226486, 0.05768502876162529, 0.060494277626276016, 0.06330352276563644, 0.06611277163028717, 0.0689220204949379, 0.07173126935958862, 0.07454051077365875, 0.07734975963830948, 0.0801590085029602, 0.08296825736761093, 0.08577750623226166]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 7.0, 5.0, 14.0, 9.0, 10.0, 17.0, 31.0, 27.0, 31.0, 38.0, 41.0, 51.0, 55.0, 48.0, 55.0, 53.0, 69.0, 63.0, 52.0, 59.0, 39.0, 29.0, 51.0, 17.0, 33.0, 25.0, 20.0, 12.0, 12.0, 11.0, 4.0, 2.0, 5.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0357738733291626, -0.03460797667503357, -0.03344208002090454, -0.03227618709206581, -0.031110290437936783, -0.029944393783807755, -0.028778498992323875, -0.027612604200839996, -0.026446707546710968, -0.02528081089258194, -0.02411491610109806, -0.02294902130961418, -0.021783124655485153, -0.020617228001356125, -0.019451333209872246, -0.018285438418388367, -0.01711954176425934, -0.01595364511013031, -0.014787750318646431, -0.013621854595839977, -0.012455958873033524, -0.01129006315022707, -0.010124167427420616, -0.008958271704614162, -0.007792375981807709, -0.006626480259001255, -0.005460584536194801, -0.004294688813388348, -0.003128793090581894, -0.00196289736777544, -0.0007970016449689865, 0.0003688940778374672, 0.001534789800643921, 0.0027006855234503746, 0.0038665812462568283, 0.005032476969063282, 0.006198372691869736, 0.007364268414676189, 0.008530164137482643, 0.009696059860289097, 0.01086195558309555, 0.012027851305902004, 0.013193747028708458, 0.014359642751514912, 0.015525538474321365, 0.016691435128450394, 0.017857329919934273, 0.019023224711418152, 0.02018912136554718, 0.02135501801967621, 0.022520912811160088, 0.023686807602643967, 0.024852704256772995, 0.026018600910902023, 0.027184495702385902, 0.02835039049386978, 0.02951628714799881, 0.030682183802127838, 0.031848080456256866, 0.033013973385095596, 0.034179870039224625, 0.03534576669335365, 0.03651165962219238, 0.03767755627632141, 0.03884345293045044]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 12.0, 15.0, 20.0, 21.0, 27.0, 35.0, 66.0, 101.0, 158.0, 259.0, 490.0, 1032.0, 2381.0, 6378.0, 23540.0, 204386.0, 711946.0, 76451.0, 13482.0, 4257.0, 1706.0, 708.0, 420.0, 230.0, 144.0, 75.0, 57.0, 46.0, 22.0, 29.0, 19.0, 13.0, 8.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05413818359375, -0.05246257781982422, -0.05078697204589844, -0.049111366271972656, -0.047435760498046875, -0.045760154724121094, -0.04408454895019531, -0.04240894317626953, -0.04073333740234375, -0.03905773162841797, -0.03738212585449219, -0.035706520080566406, -0.034030914306640625, -0.032355308532714844, -0.030679702758789062, -0.02900409698486328, -0.0273284912109375, -0.02565288543701172, -0.023977279663085938, -0.022301673889160156, -0.020626068115234375, -0.018950462341308594, -0.017274856567382812, -0.015599250793457031, -0.01392364501953125, -0.012248039245605469, -0.010572433471679688, -0.008896827697753906, -0.007221221923828125, -0.005545616149902344, -0.0038700103759765625, -0.0021944046020507812, -0.000518798828125, 0.0011568069458007812, 0.0028324127197265625, 0.004508018493652344, 0.006183624267578125, 0.007859230041503906, 0.009534835815429688, 0.011210441589355469, 0.01288604736328125, 0.014561653137207031, 0.016237258911132812, 0.017912864685058594, 0.019588470458984375, 0.021264076232910156, 0.022939682006835938, 0.02461528778076172, 0.0262908935546875, 0.02796649932861328, 0.029642105102539062, 0.031317710876464844, 0.032993316650390625, 0.034668922424316406, 0.03634452819824219, 0.03802013397216797, 0.03969573974609375, 0.04137134552001953, 0.04304695129394531, 0.044722557067871094, 0.046398162841796875, 0.048073768615722656, 0.04974937438964844, 0.05142498016357422, 0.0531005859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 10.0, 12.0, 18.0, 22.0, 35.0, 48.0, 48.0, 63.0, 67.0, 77.0, 72.0, 96.0, 85.0, 58.0, 50.0, 57.0, 53.0, 26.0, 25.0, 17.0, 13.0, 11.0, 6.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.009124755859375, -0.00883948802947998, -0.008554220199584961, -0.008268952369689941, -0.007983684539794922, -0.007698416709899902, -0.007413148880004883, -0.007127881050109863, -0.006842613220214844, -0.006557345390319824, -0.006272077560424805, -0.005986809730529785, -0.005701541900634766, -0.005416274070739746, -0.0051310062408447266, -0.004845738410949707, -0.0045604705810546875, -0.004275202751159668, -0.0039899349212646484, -0.003704667091369629, -0.0034193992614746094, -0.00313413143157959, -0.0028488636016845703, -0.0025635957717895508, -0.0022783279418945312, -0.0019930601119995117, -0.0017077922821044922, -0.0014225244522094727, -0.0011372566223144531, -0.0008519887924194336, -0.0005667209625244141, -0.00028145313262939453, 3.814697265625e-06, 0.00028908252716064453, 0.0005743503570556641, 0.0008596181869506836, 0.0011448860168457031, 0.0014301538467407227, 0.0017154216766357422, 0.0020006895065307617, 0.0022859573364257812, 0.0025712251663208008, 0.0028564929962158203, 0.00314176082611084, 0.0034270286560058594, 0.003712296485900879, 0.0039975643157958984, 0.004282832145690918, 0.0045680999755859375, 0.004853367805480957, 0.0051386356353759766, 0.005423903465270996, 0.005709171295166016, 0.005994439125061035, 0.006279706954956055, 0.006564974784851074, 0.006850242614746094, 0.007135510444641113, 0.007420778274536133, 0.007706046104431152, 0.007991313934326172, 0.008276581764221191, 0.008561849594116211, 0.00884711742401123, 0.00913238525390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 6.0, 11.0, 18.0, 19.0, 23.0, 49.0, 63.0, 110.0, 130.0, 206.0, 312.0, 477.0, 831.0, 1376.0, 2174.0, 3720.0, 6636.0, 12590.0, 26632.0, 65750.0, 189221.0, 375256.0, 222853.0, 77494.0, 30539.0, 14300.0, 7359.0, 4029.0, 2374.0, 1479.0, 907.0, 570.0, 317.0, 223.0, 140.0, 108.0, 72.0, 53.0, 39.0, 22.0, 14.0, 16.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.014068603515625, -0.01362311840057373, -0.013177633285522461, -0.012732148170471191, -0.012286663055419922, -0.011841177940368652, -0.011395692825317383, -0.010950207710266113, -0.010504722595214844, -0.010059237480163574, -0.009613752365112305, -0.009168267250061035, -0.008722782135009766, -0.008277297019958496, -0.007831811904907227, -0.007386326789855957, -0.0069408416748046875, -0.006495356559753418, -0.0060498714447021484, -0.005604386329650879, -0.005158901214599609, -0.00471341609954834, -0.00426793098449707, -0.0038224458694458008, -0.0033769607543945312, -0.0029314756393432617, -0.002485990524291992, -0.0020405054092407227, -0.0015950202941894531, -0.0011495351791381836, -0.0007040500640869141, -0.00025856494903564453, 0.000186920166015625, 0.0006324052810668945, 0.001077890396118164, 0.0015233755111694336, 0.001968860626220703, 0.0024143457412719727, 0.002859830856323242, 0.0033053159713745117, 0.0037508010864257812, 0.004196286201477051, 0.00464177131652832, 0.00508725643157959, 0.005532741546630859, 0.005978226661682129, 0.0064237117767333984, 0.006869196891784668, 0.0073146820068359375, 0.007760167121887207, 0.008205652236938477, 0.008651137351989746, 0.009096622467041016, 0.009542107582092285, 0.009987592697143555, 0.010433077812194824, 0.010878562927246094, 0.011324048042297363, 0.011769533157348633, 0.012215018272399902, 0.012660503387451172, 0.013105988502502441, 0.013551473617553711, 0.01399695873260498, 0.01444244384765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 6.0, 7.0, 5.0, 15.0, 16.0, 18.0, 17.0, 27.0, 26.0, 37.0, 24.0, 32.0, 38.0, 47.0, 38.0, 47.0, 38.0, 54.0, 37.0, 34.0, 32.0, 45.0, 25.0, 37.0, 44.0, 30.0, 29.0, 36.0, 26.0, 16.0, 23.0, 16.0, 14.0, 15.0, 9.0, 9.0, 3.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0182037353515625, -0.0176239013671875, -0.0170440673828125, -0.0164642333984375, -0.0158843994140625, -0.0153045654296875, -0.0147247314453125, -0.0141448974609375, -0.0135650634765625, -0.0129852294921875, -0.0124053955078125, -0.0118255615234375, -0.0112457275390625, -0.0106658935546875, -0.0100860595703125, -0.0095062255859375, -0.0089263916015625, -0.0083465576171875, -0.0077667236328125, -0.0071868896484375, -0.0066070556640625, -0.0060272216796875, -0.0054473876953125, -0.0048675537109375, -0.0042877197265625, -0.0037078857421875, -0.0031280517578125, -0.0025482177734375, -0.0019683837890625, -0.0013885498046875, -0.0008087158203125, -0.0002288818359375, 0.0003509521484375, 0.0009307861328125, 0.0015106201171875, 0.0020904541015625, 0.0026702880859375, 0.0032501220703125, 0.0038299560546875, 0.0044097900390625, 0.0049896240234375, 0.0055694580078125, 0.0061492919921875, 0.0067291259765625, 0.0073089599609375, 0.0078887939453125, 0.0084686279296875, 0.0090484619140625, 0.0096282958984375, 0.0102081298828125, 0.0107879638671875, 0.0113677978515625, 0.0119476318359375, 0.0125274658203125, 0.0131072998046875, 0.0136871337890625, 0.0142669677734375, 0.0148468017578125, 0.0154266357421875, 0.0160064697265625, 0.0165863037109375, 0.0171661376953125, 0.0177459716796875, 0.0183258056640625, 0.0189056396484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 3.0, 2.0, 17.0, 21.0, 28.0, 47.0, 73.0, 113.0, 159.0, 288.0, 566.0, 1378.0, 6406.0, 86122.0, 852532.0, 91367.0, 6617.0, 1437.0, 591.0, 302.0, 171.0, 113.0, 89.0, 33.0, 35.0, 15.0, 11.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0264434814453125, -0.025790691375732422, -0.025137901306152344, -0.024485111236572266, -0.023832321166992188, -0.02317953109741211, -0.02252674102783203, -0.021873950958251953, -0.021221160888671875, -0.020568370819091797, -0.01991558074951172, -0.01926279067993164, -0.018610000610351562, -0.017957210540771484, -0.017304420471191406, -0.016651630401611328, -0.01599884033203125, -0.015346050262451172, -0.014693260192871094, -0.014040470123291016, -0.013387680053710938, -0.01273488998413086, -0.012082099914550781, -0.011429309844970703, -0.010776519775390625, -0.010123729705810547, -0.009470939636230469, -0.00881814956665039, -0.008165359497070312, -0.007512569427490234, -0.006859779357910156, -0.006206989288330078, -0.00555419921875, -0.004901409149169922, -0.004248619079589844, -0.0035958290100097656, -0.0029430389404296875, -0.0022902488708496094, -0.0016374588012695312, -0.0009846687316894531, -0.000331878662109375, 0.0003209114074707031, 0.0009737014770507812, 0.0016264915466308594, 0.0022792816162109375, 0.0029320716857910156, 0.0035848617553710938, 0.004237651824951172, 0.00489044189453125, 0.005543231964111328, 0.006196022033691406, 0.006848812103271484, 0.0075016021728515625, 0.00815439224243164, 0.008807182312011719, 0.009459972381591797, 0.010112762451171875, 0.010765552520751953, 0.011418342590332031, 0.01207113265991211, 0.012723922729492188, 0.013376712799072266, 0.014029502868652344, 0.014682292938232422, 0.0153350830078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 42.0, 216.0, 415.0, 238.0, 63.0, 23.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002067089080810547, -0.00019494816660881042, -0.00018318742513656616, -0.0001714266836643219, -0.00015966594219207764, -0.00014790520071983337, -0.0001361444592475891, -0.00012438371777534485, -0.00011262297630310059, -0.00010086223483085632, -8.910149335861206e-05, -7.73407518863678e-05, -6.558001041412354e-05, -5.381926894187927e-05, -4.205852746963501e-05, -3.0297785997390747e-05, -1.8537044525146484e-05, -6.776303052902222e-06, 4.984438419342041e-06, 1.6745179891586304e-05, 2.8505921363830566e-05, 4.026666283607483e-05, 5.202740430831909e-05, 6.378814578056335e-05, 7.554888725280762e-05, 8.730962872505188e-05, 9.907037019729614e-05, 0.0001108311116695404, 0.00012259185314178467, 0.00013435259461402893, 0.0001461133360862732, 0.00015787407755851746, 0.00016963481903076172, 0.00018139556050300598, 0.00019315630197525024, 0.0002049170434474945, 0.00021667778491973877, 0.00022843852639198303, 0.0002401992678642273, 0.00025196000933647156, 0.0002637207508087158, 0.0002754814922809601, 0.00028724223375320435, 0.0002990029752254486, 0.00031076371669769287, 0.00032252445816993713, 0.0003342851996421814, 0.00034604594111442566, 0.0003578066825866699, 0.0003695674240589142, 0.00038132816553115845, 0.0003930889070034027, 0.00040484964847564697, 0.00041661038994789124, 0.0004283711314201355, 0.00044013187289237976, 0.000451892614364624, 0.0004636533558368683, 0.00047541409730911255, 0.0004871748387813568, 0.0004989355802536011, 0.0005106963217258453, 0.0005224570631980896, 0.0005342178046703339, 0.0005459785461425781]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 12.0, 18.0, 21.0, 34.0, 64.0, 96.0, 236.0, 735.0, 3552.0, 53993.0, 873160.0, 109971.0, 5090.0, 984.0, 312.0, 114.0, 55.0, 37.0, 19.0, 6.0, 13.0, 7.0, 2.0, 9.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.016510009765625, -0.015838623046875, -0.015167236328125, -0.014495849609375, -0.013824462890625, -0.013153076171875, -0.012481689453125, -0.011810302734375, -0.011138916015625, -0.010467529296875, -0.009796142578125, -0.009124755859375, -0.008453369140625, -0.007781982421875, -0.007110595703125, -0.006439208984375, -0.005767822265625, -0.005096435546875, -0.004425048828125, -0.003753662109375, -0.003082275390625, -0.002410888671875, -0.001739501953125, -0.001068115234375, -0.000396728515625, 0.000274658203125, 0.000946044921875, 0.001617431640625, 0.002288818359375, 0.002960205078125, 0.003631591796875, 0.004302978515625, 0.004974365234375, 0.005645751953125, 0.006317138671875, 0.006988525390625, 0.007659912109375, 0.008331298828125, 0.009002685546875, 0.009674072265625, 0.010345458984375, 0.011016845703125, 0.011688232421875, 0.012359619140625, 0.013031005859375, 0.013702392578125, 0.014373779296875, 0.015045166015625, 0.015716552734375, 0.016387939453125, 0.017059326171875, 0.017730712890625, 0.018402099609375, 0.019073486328125, 0.019744873046875, 0.020416259765625, 0.021087646484375, 0.021759033203125, 0.022430419921875, 0.023101806640625, 0.023773193359375, 0.024444580078125, 0.025115966796875, 0.025787353515625, 0.026458740234375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 5.0, 8.0, 3.0, 9.0, 7.0, 19.0, 24.0, 39.0, 66.0, 90.0, 90.0, 120.0, 114.0, 105.0, 94.0, 73.0, 44.0, 22.0, 16.0, 17.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01251983642578125, -0.012058854103088379, -0.011597871780395508, -0.011136889457702637, -0.010675907135009766, -0.010214924812316895, -0.009753942489624023, -0.009292960166931152, -0.008831977844238281, -0.00837099552154541, -0.007910013198852539, -0.007449030876159668, -0.006988048553466797, -0.006527066230773926, -0.006066083908081055, -0.005605101585388184, -0.0051441192626953125, -0.004683136940002441, -0.00422215461730957, -0.0037611722946166992, -0.003300189971923828, -0.002839207649230957, -0.002378225326538086, -0.0019172430038452148, -0.0014562606811523438, -0.0009952783584594727, -0.0005342960357666016, -7.331371307373047e-05, 0.0003876686096191406, 0.0008486509323120117, 0.0013096332550048828, 0.001770615577697754, 0.002231597900390625, 0.002692580223083496, 0.003153562545776367, 0.0036145448684692383, 0.004075527191162109, 0.0045365095138549805, 0.0049974918365478516, 0.005458474159240723, 0.005919456481933594, 0.006380438804626465, 0.006841421127319336, 0.007302403450012207, 0.007763385772705078, 0.00822436809539795, 0.00868535041809082, 0.009146332740783691, 0.009607315063476562, 0.010068297386169434, 0.010529279708862305, 0.010990262031555176, 0.011451244354248047, 0.011912226676940918, 0.012373208999633789, 0.01283419132232666, 0.013295173645019531, 0.013756155967712402, 0.014217138290405273, 0.014678120613098145, 0.015139102935791016, 0.015600085258483887, 0.016061067581176758, 0.01652204990386963, 0.0169830322265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 27.0, 128.0, 387.0, 358.0, 82.0, 18.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2876220643520355, -0.2707435190677643, -0.25386497378349304, -0.2369864284992218, -0.22010788321495056, -0.20322933793067932, -0.1863507777452469, -0.16947223246097565, -0.1525936871767044, -0.13571514189243317, -0.11883659660816193, -0.10195804387331009, -0.08507949858903885, -0.06820095330476761, -0.05132240056991577, -0.03444385528564453, -0.01756531000137329, -0.0006867628544569016, 0.016191784292459488, 0.03307033330202103, 0.04994887858629227, 0.06682742387056351, 0.08370597660541534, 0.10058452188968658, 0.11746306717395782, 0.13434161245822906, 0.1512201577425003, 0.16809871792793274, 0.18497726321220398, 0.20185580849647522, 0.21873435378074646, 0.2356128990650177, 0.25249141454696655, 0.2693699598312378, 0.28624850511550903, 0.3031270503997803, 0.3200055956840515, 0.33688414096832275, 0.353762686252594, 0.37064123153686523, 0.3875197768211365, 0.4043983221054077, 0.42127686738967896, 0.4381554126739502, 0.45503395795822144, 0.4719125032424927, 0.4887910485267639, 0.5056695938110352, 0.5225481986999512, 0.5394267439842224, 0.5563052892684937, 0.5731838345527649, 0.5900623798370361, 0.6069409251213074, 0.6238194704055786, 0.6406980156898499, 0.6575765609741211, 0.6744551062583923, 0.6913336515426636, 0.7082121968269348, 0.725090742111206, 0.7419692873954773, 0.7588478326797485, 0.7757263779640198, 0.792604923248291]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 4.0, 6.0, 13.0, 10.0, 13.0, 10.0, 17.0, 13.0, 14.0, 22.0, 27.0, 28.0, 34.0, 36.0, 37.0, 31.0, 32.0, 30.0, 33.0, 38.0, 46.0, 32.0, 41.0, 39.0, 42.0, 31.0, 32.0, 27.0, 30.0, 29.0, 21.0, 28.0, 25.0, 10.0, 19.0, 11.0, 11.0, 10.0, 10.0, 8.0, 11.0, 7.0, 2.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0826493501663208, -0.08013132959604263, -0.07761330902576447, -0.0750952959060669, -0.07257727533578873, -0.07005925476551056, -0.06754124164581299, -0.06502322107553482, -0.06250520050525665, -0.059987179934978485, -0.057469163089990616, -0.05495114624500275, -0.05243312567472458, -0.04991510510444641, -0.04739708825945854, -0.04487907141447067, -0.042361050844192505, -0.03984303027391434, -0.03732501342892647, -0.0348069965839386, -0.03228897601366043, -0.029770957306027412, -0.027252938598394394, -0.024734919890761375, -0.022216901183128357, -0.01969888247549534, -0.01718086376786232, -0.014662845060229301, -0.012144826352596283, -0.009626807644963264, -0.007108788937330246, -0.0045907702296972275, -0.002072751522064209, 0.0004452671855688095, 0.002963285893201828, 0.0054813046008348465, 0.007999323308467865, 0.010517342016100883, 0.013035360723733902, 0.01555337943136692, 0.01807139813899994, 0.020589416846632957, 0.023107435554265976, 0.025625454261898994, 0.028143472969532013, 0.03066149167716503, 0.03317951038479805, 0.03569752722978592, 0.03821554780006409, 0.040733568370342255, 0.043251585215330124, 0.04576960206031799, 0.04828762263059616, 0.05080564320087433, 0.0533236600458622, 0.05584167689085007, 0.058359697461128235, 0.0608777180314064, 0.06339573860168457, 0.06591375172138214, 0.06843177229166031, 0.07094979286193848, 0.07346780598163605, 0.07598582655191422, 0.07850384712219238]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 10.0, 11.0, 7.0, 18.0, 29.0, 37.0, 49.0, 56.0, 91.0, 115.0, 179.0, 205.0, 320.0, 454.0, 658.0, 1010.0, 1741.0, 3376.0, 7807.0, 27939.0, 376597.0, 3690174.0, 59534.0, 12701.0, 4853.0, 2322.0, 1344.0, 840.0, 517.0, 396.0, 230.0, 183.0, 146.0, 76.0, 73.0, 51.0, 37.0, 24.0, 24.0, 14.0, 6.0, 12.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.040679931640625, -0.03955650329589844, -0.038433074951171875, -0.03730964660644531, -0.03618621826171875, -0.03506278991699219, -0.033939361572265625, -0.03281593322753906, -0.0316925048828125, -0.030569076538085938, -0.029445648193359375, -0.028322219848632812, -0.02719879150390625, -0.026075363159179688, -0.024951934814453125, -0.023828506469726562, -0.022705078125, -0.021581649780273438, -0.020458221435546875, -0.019334793090820312, -0.01821136474609375, -0.017087936401367188, -0.015964508056640625, -0.014841079711914062, -0.0137176513671875, -0.012594223022460938, -0.011470794677734375, -0.010347366333007812, -0.00922393798828125, -0.008100509643554688, -0.006977081298828125, -0.0058536529541015625, -0.004730224609375, -0.0036067962646484375, -0.002483367919921875, -0.0013599395751953125, -0.00023651123046875, 0.0008869171142578125, 0.002010345458984375, 0.0031337738037109375, 0.0042572021484375, 0.0053806304931640625, 0.006504058837890625, 0.0076274871826171875, 0.00875091552734375, 0.009874343872070312, 0.010997772216796875, 0.012121200561523438, 0.01324462890625, 0.014368057250976562, 0.015491485595703125, 0.016614913940429688, 0.01773834228515625, 0.018861770629882812, 0.019985198974609375, 0.021108627319335938, 0.0222320556640625, 0.023355484008789062, 0.024478912353515625, 0.025602340698242188, 0.02672576904296875, 0.027849197387695312, 0.028972625732421875, 0.030096054077148438, 0.031219482421875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 15.0, 16.0, 21.0, 16.0, 32.0, 39.0, 38.0, 53.0, 73.0, 69.0, 93.0, 84.0, 65.0, 67.0, 71.0, 63.0, 45.0, 35.0, 23.0, 13.0, 18.0, 15.0, 9.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.0093231201171875, -0.00903463363647461, -0.008746147155761719, -0.008457660675048828, -0.008169174194335938, -0.007880687713623047, -0.007592201232910156, -0.007303714752197266, -0.007015228271484375, -0.006726741790771484, -0.006438255310058594, -0.006149768829345703, -0.0058612823486328125, -0.005572795867919922, -0.005284309387207031, -0.004995822906494141, -0.00470733642578125, -0.004418849945068359, -0.004130363464355469, -0.003841876983642578, -0.0035533905029296875, -0.003264904022216797, -0.0029764175415039062, -0.0026879310607910156, -0.002399444580078125, -0.0021109580993652344, -0.0018224716186523438, -0.0015339851379394531, -0.0012454986572265625, -0.0009570121765136719, -0.0006685256958007812, -0.0003800392150878906, -9.1552734375e-05, 0.00019693374633789062, 0.00048542022705078125, 0.0007739067077636719, 0.0010623931884765625, 0.0013508796691894531, 0.0016393661499023438, 0.0019278526306152344, 0.002216339111328125, 0.0025048255920410156, 0.0027933120727539062, 0.003081798553466797, 0.0033702850341796875, 0.003658771514892578, 0.003947257995605469, 0.004235744476318359, 0.00452423095703125, 0.004812717437744141, 0.005101203918457031, 0.005389690399169922, 0.0056781768798828125, 0.005966663360595703, 0.006255149841308594, 0.006543636322021484, 0.006832122802734375, 0.007120609283447266, 0.007409095764160156, 0.007697582244873047, 0.007986068725585938, 0.008274555206298828, 0.008563041687011719, 0.00885152816772461, 0.0091400146484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 8.0, 19.0, 30.0, 52.0, 86.0, 145.0, 311.0, 634.0, 1478.0, 4115.0, 15039.0, 133832.0, 3918551.0, 100459.0, 13228.0, 3627.0, 1375.0, 599.0, 343.0, 154.0, 93.0, 53.0, 32.0, 12.0, 13.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.053741455078125, -0.05260896682739258, -0.051476478576660156, -0.050343990325927734, -0.04921150207519531, -0.04807901382446289, -0.04694652557373047, -0.04581403732299805, -0.044681549072265625, -0.0435490608215332, -0.04241657257080078, -0.04128408432006836, -0.04015159606933594, -0.039019107818603516, -0.037886619567871094, -0.03675413131713867, -0.03562164306640625, -0.03448915481567383, -0.033356666564941406, -0.032224178314208984, -0.031091690063476562, -0.02995920181274414, -0.02882671356201172, -0.027694225311279297, -0.026561737060546875, -0.025429248809814453, -0.02429676055908203, -0.02316427230834961, -0.022031784057617188, -0.020899295806884766, -0.019766807556152344, -0.018634319305419922, -0.0175018310546875, -0.016369342803955078, -0.015236854553222656, -0.014104366302490234, -0.012971878051757812, -0.01183938980102539, -0.010706901550292969, -0.009574413299560547, -0.008441925048828125, -0.007309436798095703, -0.006176948547363281, -0.005044460296630859, -0.0039119720458984375, -0.0027794837951660156, -0.0016469955444335938, -0.0005145072937011719, 0.00061798095703125, 0.0017504692077636719, 0.0028829574584960938, 0.004015445709228516, 0.0051479339599609375, 0.006280422210693359, 0.007412910461425781, 0.008545398712158203, 0.009677886962890625, 0.010810375213623047, 0.011942863464355469, 0.01307535171508789, 0.014207839965820312, 0.015340328216552734, 0.016472816467285156, 0.017605304718017578, 0.01873779296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 10.0, 13.0, 28.0, 36.0, 61.0, 165.0, 555.0, 2315.0, 554.0, 169.0, 66.0, 31.0, 22.0, 13.0, 11.0, 3.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009490966796875, -0.009069204330444336, -0.008647441864013672, -0.008225679397583008, -0.007803916931152344, -0.00738215446472168, -0.006960391998291016, -0.0065386295318603516, -0.0061168670654296875, -0.0056951045989990234, -0.005273342132568359, -0.004851579666137695, -0.004429817199707031, -0.004008054733276367, -0.003586292266845703, -0.003164529800415039, -0.002742767333984375, -0.002321004867553711, -0.0018992424011230469, -0.0014774799346923828, -0.0010557174682617188, -0.0006339550018310547, -0.00021219253540039062, 0.00020956993103027344, 0.0006313323974609375, 0.0010530948638916016, 0.0014748573303222656, 0.0018966197967529297, 0.0023183822631835938, 0.002740144729614258, 0.003161907196044922, 0.003583669662475586, 0.00400543212890625, 0.004427194595336914, 0.004848957061767578, 0.005270719528198242, 0.005692481994628906, 0.00611424446105957, 0.006536006927490234, 0.0069577693939208984, 0.0073795318603515625, 0.0078012943267822266, 0.00822305679321289, 0.008644819259643555, 0.009066581726074219, 0.009488344192504883, 0.009910106658935547, 0.010331869125366211, 0.010753631591796875, 0.011175394058227539, 0.011597156524658203, 0.012018918991088867, 0.012440681457519531, 0.012862443923950195, 0.01328420639038086, 0.013705968856811523, 0.014127731323242188, 0.014549493789672852, 0.014971256256103516, 0.01539301872253418, 0.015814781188964844, 0.016236543655395508, 0.016658306121826172, 0.017080068588256836, 0.0175018310546875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 25.0, 84.0, 278.0, 331.0, 167.0, 60.0, 19.0, 13.0, 5.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09847377240657806, -0.09486760944128036, -0.09126145392656326, -0.08765529096126556, -0.08404913544654846, -0.08044297248125076, -0.07683680951595306, -0.07323065400123596, -0.06962449103593826, -0.06601832807064056, -0.06241217255592346, -0.05880600959062576, -0.05519985035061836, -0.05159369111061096, -0.04798752814531326, -0.04438136890530586, -0.04077520966529846, -0.03716905042529106, -0.03356289118528366, -0.029956728219985962, -0.02635056897997856, -0.02274440973997116, -0.01913824863731861, -0.015532087534666061, -0.011925928294658661, -0.008319768123328686, -0.004713607951998711, -0.0011074477806687355, 0.0024987123906612396, 0.00610487163066864, 0.00971103273332119, 0.01331719383597374, 0.01692335307598114, 0.02052951231598854, 0.02413567341864109, 0.02774183452129364, 0.03134799376130104, 0.03495415300130844, 0.03856031596660614, 0.04216647520661354, 0.04577263444662094, 0.04937879368662834, 0.05298495292663574, 0.05659111589193344, 0.06019727513194084, 0.06380343437194824, 0.06740959733724594, 0.07101576030254364, 0.07462191581726074, 0.07822807878255844, 0.08183423429727554, 0.08544039726257324, 0.08904655277729034, 0.09265271574258804, 0.09625887870788574, 0.09986503422260284, 0.10347119718790054, 0.10707736015319824, 0.11068351566791534, 0.11428967863321304, 0.11789584159851074, 0.12150199711322784, 0.12510815262794495, 0.12871432304382324, 0.13232047855854034]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 9.0, 8.0, 15.0, 12.0, 14.0, 23.0, 37.0, 32.0, 21.0, 37.0, 33.0, 42.0, 41.0, 46.0, 43.0, 49.0, 48.0, 50.0, 50.0, 36.0, 47.0, 40.0, 38.0, 38.0, 29.0, 20.0, 24.0, 22.0, 19.0, 13.0, 12.0, 10.0, 11.0, 2.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.023458898067474365, -0.022695351392030716, -0.021931806579232216, -0.021168261766433716, -0.020404715090990067, -0.019641168415546417, -0.018877623602747917, -0.018114078789949417, -0.017350532114505768, -0.01658698543906212, -0.01582344062626362, -0.015059894882142544, -0.014296349138021469, -0.013532803393900394, -0.01276925764977932, -0.012005711905658245, -0.01124216616153717, -0.010478620417416096, -0.009715074673295021, -0.008951528929173946, -0.008187983185052872, -0.007424437440931797, -0.006660891696810722, -0.005897345952689648, -0.005133800208568573, -0.004370254464447498, -0.0036067087203264236, -0.002843162976205349, -0.0020796172320842743, -0.0013160714879631996, -0.0005525257438421249, 0.00021102000027894974, 0.0009745657444000244, 0.001738111488521099, 0.0025016572326421738, 0.0032652029767632484, 0.004028748720884323, 0.004792294465005398, 0.0055558402091264725, 0.006319385953247547, 0.007082931697368622, 0.007846477441489697, 0.008610023185610771, 0.009373568929731846, 0.01013711467385292, 0.010900660417973995, 0.01166420616209507, 0.012427751906216145, 0.01319129765033722, 0.013954843394458294, 0.014718389138579369, 0.015481934882700443, 0.016245480626821518, 0.017009027302265167, 0.017772572115063667, 0.018536116927862167, 0.019299663603305817, 0.020063210278749466, 0.020826755091547966, 0.021590299904346466, 0.022353846579790115, 0.023117393255233765, 0.023880938068032265, 0.024644482880830765, 0.025408029556274414]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 8.0, 5.0, 16.0, 20.0, 32.0, 45.0, 56.0, 100.0, 127.0, 233.0, 375.0, 583.0, 960.0, 1744.0, 3589.0, 7602.0, 18063.0, 51291.0, 164968.0, 385804.0, 272961.0, 88605.0, 29311.0, 11461.0, 4927.0, 2458.0, 1256.0, 762.0, 412.0, 284.0, 171.0, 116.0, 78.0, 47.0, 19.0, 28.0, 17.0, 9.0, 8.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0174560546875, -0.016888141632080078, -0.016320228576660156, -0.015752315521240234, -0.015184402465820312, -0.01461648941040039, -0.014048576354980469, -0.013480663299560547, -0.012912750244140625, -0.012344837188720703, -0.011776924133300781, -0.01120901107788086, -0.010641098022460938, -0.010073184967041016, -0.009505271911621094, -0.008937358856201172, -0.00836944580078125, -0.007801532745361328, -0.007233619689941406, -0.006665706634521484, -0.0060977935791015625, -0.005529880523681641, -0.004961967468261719, -0.004394054412841797, -0.003826141357421875, -0.003258228302001953, -0.0026903152465820312, -0.0021224021911621094, -0.0015544891357421875, -0.0009865760803222656, -0.00041866302490234375, 0.00014925003051757812, 0.0007171630859375, 0.0012850761413574219, 0.0018529891967773438, 0.0024209022521972656, 0.0029888153076171875, 0.0035567283630371094, 0.004124641418457031, 0.004692554473876953, 0.005260467529296875, 0.005828380584716797, 0.006396293640136719, 0.006964206695556641, 0.0075321197509765625, 0.008100032806396484, 0.008667945861816406, 0.009235858917236328, 0.00980377197265625, 0.010371685028076172, 0.010939598083496094, 0.011507511138916016, 0.012075424194335938, 0.01264333724975586, 0.013211250305175781, 0.013779163360595703, 0.014347076416015625, 0.014914989471435547, 0.015482902526855469, 0.01605081558227539, 0.016618728637695312, 0.017186641693115234, 0.017754554748535156, 0.018322467803955078, 0.018890380859375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 14.0, 12.0, 20.0, 21.0, 26.0, 44.0, 47.0, 76.0, 87.0, 72.0, 82.0, 74.0, 68.0, 71.0, 75.0, 48.0, 40.0, 36.0, 25.0, 12.0, 18.0, 7.0, 6.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0098419189453125, -0.009534358978271484, -0.009226799011230469, -0.008919239044189453, -0.008611679077148438, -0.008304119110107422, -0.007996559143066406, -0.007688999176025391, -0.007381439208984375, -0.007073879241943359, -0.006766319274902344, -0.006458759307861328, -0.0061511993408203125, -0.005843639373779297, -0.005536079406738281, -0.005228519439697266, -0.00492095947265625, -0.004613399505615234, -0.004305839538574219, -0.003998279571533203, -0.0036907196044921875, -0.003383159637451172, -0.0030755996704101562, -0.0027680397033691406, -0.002460479736328125, -0.0021529197692871094, -0.0018453598022460938, -0.0015377998352050781, -0.0012302398681640625, -0.0009226799011230469, -0.0006151199340820312, -0.0003075599670410156, 0.0, 0.0003075599670410156, 0.0006151199340820312, 0.0009226799011230469, 0.0012302398681640625, 0.0015377998352050781, 0.0018453598022460938, 0.0021529197692871094, 0.002460479736328125, 0.0027680397033691406, 0.0030755996704101562, 0.003383159637451172, 0.0036907196044921875, 0.003998279571533203, 0.004305839538574219, 0.004613399505615234, 0.00492095947265625, 0.005228519439697266, 0.005536079406738281, 0.005843639373779297, 0.0061511993408203125, 0.006458759307861328, 0.006766319274902344, 0.007073879241943359, 0.007381439208984375, 0.007688999176025391, 0.007996559143066406, 0.008304119110107422, 0.008611679077148438, 0.008919239044189453, 0.009226799011230469, 0.009534358978271484, 0.0098419189453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 2.0, 5.0, 10.0, 10.0, 14.0, 21.0, 14.0, 45.0, 22.0, 44.0, 66.0, 91.0, 150.0, 210.0, 383.0, 640.0, 1168.0, 2436.0, 5525.0, 13738.0, 37113.0, 122773.0, 388178.0, 329737.0, 95432.0, 30145.0, 11292.0, 4599.0, 2137.0, 1025.0, 554.0, 319.0, 201.0, 122.0, 78.0, 63.0, 46.0, 33.0, 33.0, 22.0, 12.0, 10.0, 10.0, 14.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.01491546630859375, -0.014432787895202637, -0.013950109481811523, -0.01346743106842041, -0.012984752655029297, -0.012502074241638184, -0.01201939582824707, -0.011536717414855957, -0.011054039001464844, -0.01057136058807373, -0.010088682174682617, -0.009606003761291504, -0.00912332534790039, -0.008640646934509277, -0.008157968521118164, -0.007675290107727051, -0.0071926116943359375, -0.006709933280944824, -0.006227254867553711, -0.005744576454162598, -0.005261898040771484, -0.004779219627380371, -0.004296541213989258, -0.0038138628005981445, -0.0033311843872070312, -0.002848505973815918, -0.0023658275604248047, -0.0018831491470336914, -0.0014004707336425781, -0.0009177923202514648, -0.00043511390686035156, 4.756450653076172e-05, 0.000530242919921875, 0.0010129213333129883, 0.0014955997467041016, 0.001978278160095215, 0.002460956573486328, 0.0029436349868774414, 0.0034263134002685547, 0.003908991813659668, 0.004391670227050781, 0.0048743486404418945, 0.005357027053833008, 0.005839705467224121, 0.006322383880615234, 0.006805062294006348, 0.007287740707397461, 0.007770419120788574, 0.008253097534179688, 0.0087357759475708, 0.009218454360961914, 0.009701132774353027, 0.01018381118774414, 0.010666489601135254, 0.011149168014526367, 0.01163184642791748, 0.012114524841308594, 0.012597203254699707, 0.01307988166809082, 0.013562560081481934, 0.014045238494873047, 0.01452791690826416, 0.015010595321655273, 0.015493273735046387, 0.0159759521484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 4.0, 2.0, 6.0, 7.0, 4.0, 7.0, 5.0, 7.0, 6.0, 20.0, 16.0, 14.0, 24.0, 15.0, 22.0, 24.0, 32.0, 29.0, 35.0, 38.0, 33.0, 36.0, 48.0, 46.0, 41.0, 42.0, 34.0, 33.0, 53.0, 38.0, 38.0, 35.0, 31.0, 21.0, 16.0, 27.0, 12.0, 19.0, 17.0, 16.0, 12.0, 5.0, 8.0, 10.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0228118896484375, -0.02215099334716797, -0.021490097045898438, -0.020829200744628906, -0.020168304443359375, -0.019507408142089844, -0.018846511840820312, -0.01818561553955078, -0.01752471923828125, -0.01686382293701172, -0.016202926635742188, -0.015542030334472656, -0.014881134033203125, -0.014220237731933594, -0.013559341430664062, -0.012898445129394531, -0.012237548828125, -0.011576652526855469, -0.010915756225585938, -0.010254859924316406, -0.009593963623046875, -0.008933067321777344, -0.008272171020507812, -0.007611274719238281, -0.00695037841796875, -0.006289482116699219, -0.0056285858154296875, -0.004967689514160156, -0.004306793212890625, -0.0036458969116210938, -0.0029850006103515625, -0.0023241043090820312, -0.0016632080078125, -0.0010023117065429688, -0.0003414154052734375, 0.00031948089599609375, 0.000980377197265625, 0.0016412734985351562, 0.0023021697998046875, 0.0029630661010742188, 0.00362396240234375, 0.004284858703613281, 0.0049457550048828125, 0.005606651306152344, 0.006267547607421875, 0.006928443908691406, 0.0075893402099609375, 0.008250236511230469, 0.0089111328125, 0.009572029113769531, 0.010232925415039062, 0.010893821716308594, 0.011554718017578125, 0.012215614318847656, 0.012876510620117188, 0.013537406921386719, 0.01419830322265625, 0.014859199523925781, 0.015520095825195312, 0.016180992126464844, 0.016841888427734375, 0.017502784729003906, 0.018163681030273438, 0.01882457733154297, 0.0194854736328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 2.0, 4.0, 6.0, 13.0, 25.0, 56.0, 141.0, 373.0, 1212.0, 4344.0, 23214.0, 330968.0, 631794.0, 46813.0, 6992.0, 1693.0, 542.0, 182.0, 91.0, 47.0, 16.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0176239013671875, -0.01714956760406494, -0.016675233840942383, -0.016200900077819824, -0.015726566314697266, -0.015252232551574707, -0.014777898788452148, -0.01430356502532959, -0.013829231262207031, -0.013354897499084473, -0.012880563735961914, -0.012406229972839355, -0.011931896209716797, -0.011457562446594238, -0.01098322868347168, -0.010508894920349121, -0.010034561157226562, -0.009560227394104004, -0.009085893630981445, -0.008611559867858887, -0.008137226104736328, -0.0076628923416137695, -0.007188558578491211, -0.006714224815368652, -0.006239891052246094, -0.005765557289123535, -0.0052912235260009766, -0.004816889762878418, -0.004342555999755859, -0.0038682222366333008, -0.003393888473510742, -0.0029195547103881836, -0.002445220947265625, -0.0019708871841430664, -0.0014965534210205078, -0.0010222196578979492, -0.0005478858947753906, -7.355213165283203e-05, 0.00040078163146972656, 0.0008751153945922852, 0.0013494491577148438, 0.0018237829208374023, 0.002298116683959961, 0.0027724504470825195, 0.003246784210205078, 0.0037211179733276367, 0.004195451736450195, 0.004669785499572754, 0.0051441192626953125, 0.005618453025817871, 0.00609278678894043, 0.006567120552062988, 0.007041454315185547, 0.0075157880783081055, 0.007990121841430664, 0.008464455604553223, 0.008938789367675781, 0.00941312313079834, 0.009887456893920898, 0.010361790657043457, 0.010836124420166016, 0.011310458183288574, 0.011784791946411133, 0.012259125709533691, 0.01273345947265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 8.0, 5.0, 22.0, 38.0, 87.0, 143.0, 223.0, 189.0, 146.0, 72.0, 45.0, 19.0, 10.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00018453598022460938, -0.00018042884767055511, -0.00017632171511650085, -0.0001722145825624466, -0.00016810745000839233, -0.00016400031745433807, -0.0001598931849002838, -0.00015578605234622955, -0.0001516789197921753, -0.00014757178723812103, -0.00014346465468406677, -0.0001393575221300125, -0.00013525038957595825, -0.000131143257021904, -0.00012703612446784973, -0.00012292899191379547, -0.00011882185935974121, -0.00011471472680568695, -0.00011060759425163269, -0.00010650046169757843, -0.00010239332914352417, -9.828619658946991e-05, -9.417906403541565e-05, -9.007193148136139e-05, -8.596479892730713e-05, -8.185766637325287e-05, -7.775053381919861e-05, -7.364340126514435e-05, -6.953626871109009e-05, -6.542913615703583e-05, -6.132200360298157e-05, -5.721487104892731e-05, -5.310773849487305e-05, -4.900060594081879e-05, -4.4893473386764526e-05, -4.0786340832710266e-05, -3.6679208278656006e-05, -3.2572075724601746e-05, -2.8464943170547485e-05, -2.4357810616493225e-05, -2.0250678062438965e-05, -1.6143545508384705e-05, -1.2036412954330444e-05, -7.929280400276184e-06, -3.822147846221924e-06, 2.849847078323364e-07, 4.392117261886597e-06, 8.499249815940857e-06, 1.2606382369995117e-05, 1.6713514924049377e-05, 2.0820647478103638e-05, 2.4927780032157898e-05, 2.9034912586212158e-05, 3.314204514026642e-05, 3.724917769432068e-05, 4.135631024837494e-05, 4.54634428024292e-05, 4.957057535648346e-05, 5.367770791053772e-05, 5.778484046459198e-05, 6.189197301864624e-05, 6.59991055727005e-05, 7.010623812675476e-05, 7.421337068080902e-05, 7.832050323486328e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 11.0, 16.0, 25.0, 38.0, 60.0, 94.0, 156.0, 327.0, 802.0, 3004.0, 20742.0, 381664.0, 599855.0, 35693.0, 4183.0, 1053.0, 360.0, 177.0, 113.0, 61.0, 38.0, 28.0, 18.0, 9.0, 8.0, 4.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0208892822265625, -0.02035510540008545, -0.0198209285736084, -0.019286751747131348, -0.018752574920654297, -0.018218398094177246, -0.017684221267700195, -0.017150044441223145, -0.016615867614746094, -0.016081690788269043, -0.015547513961791992, -0.015013337135314941, -0.01447916030883789, -0.01394498348236084, -0.013410806655883789, -0.012876629829406738, -0.012342453002929688, -0.011808276176452637, -0.011274099349975586, -0.010739922523498535, -0.010205745697021484, -0.009671568870544434, -0.009137392044067383, -0.008603215217590332, -0.008069038391113281, -0.0075348615646362305, -0.00700068473815918, -0.006466507911682129, -0.005932331085205078, -0.005398154258728027, -0.0048639774322509766, -0.004329800605773926, -0.003795623779296875, -0.0032614469528198242, -0.0027272701263427734, -0.0021930932998657227, -0.0016589164733886719, -0.001124739646911621, -0.0005905628204345703, -5.638599395751953e-05, 0.00047779083251953125, 0.001011967658996582, 0.0015461444854736328, 0.0020803213119506836, 0.0026144981384277344, 0.003148674964904785, 0.003682851791381836, 0.004217028617858887, 0.0047512054443359375, 0.005285382270812988, 0.005819559097290039, 0.00635373592376709, 0.006887912750244141, 0.007422089576721191, 0.007956266403198242, 0.008490443229675293, 0.009024620056152344, 0.009558796882629395, 0.010092973709106445, 0.010627150535583496, 0.011161327362060547, 0.011695504188537598, 0.012229681015014648, 0.0127638578414917, 0.01329803466796875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 8.0, 21.0, 25.0, 39.0, 42.0, 60.0, 84.0, 91.0, 95.0, 105.0, 109.0, 77.0, 67.0, 59.0, 35.0, 36.0, 21.0, 6.0, 11.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01519775390625, -0.01482999324798584, -0.01446223258972168, -0.01409447193145752, -0.01372671127319336, -0.0133589506149292, -0.012991189956665039, -0.012623429298400879, -0.012255668640136719, -0.011887907981872559, -0.011520147323608398, -0.011152386665344238, -0.010784626007080078, -0.010416865348815918, -0.010049104690551758, -0.009681344032287598, -0.009313583374023438, -0.008945822715759277, -0.008578062057495117, -0.008210301399230957, -0.007842540740966797, -0.007474780082702637, -0.0071070194244384766, -0.006739258766174316, -0.006371498107910156, -0.006003737449645996, -0.005635976791381836, -0.005268216133117676, -0.004900455474853516, -0.0045326948165893555, -0.004164934158325195, -0.003797173500061035, -0.003429412841796875, -0.003061652183532715, -0.0026938915252685547, -0.0023261308670043945, -0.0019583702087402344, -0.0015906095504760742, -0.001222848892211914, -0.0008550882339477539, -0.00048732757568359375, -0.0001195669174194336, 0.00024819374084472656, 0.0006159543991088867, 0.0009837150573730469, 0.001351475715637207, 0.0017192363739013672, 0.0020869970321655273, 0.0024547576904296875, 0.0028225183486938477, 0.003190279006958008, 0.003558039665222168, 0.003925800323486328, 0.004293560981750488, 0.0046613216400146484, 0.005029082298278809, 0.005396842956542969, 0.005764603614807129, 0.006132364273071289, 0.006500124931335449, 0.006867885589599609, 0.0072356462478637695, 0.00760340690612793, 0.00797116756439209, 0.00833892822265625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 10.0, 40.0, 220.0, 413.0, 249.0, 64.0, 16.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7612881064414978, -0.7459147572517395, -0.730541467666626, -0.7151681184768677, -0.6997948288917542, -0.6844214797019958, -0.6690481901168823, -0.653674840927124, -0.6383015513420105, -0.6229282021522522, -0.6075549125671387, -0.5921815633773804, -0.5768082737922668, -0.5614349246025085, -0.546061635017395, -0.5306882858276367, -0.5153149366378784, -0.4999416172504425, -0.4845682978630066, -0.4691949784755707, -0.45382165908813477, -0.43844833970069885, -0.42307502031326294, -0.40770167112350464, -0.3923283815383911, -0.3769550621509552, -0.3615817427635193, -0.3462084233760834, -0.33083510398864746, -0.31546178460121155, -0.30008846521377563, -0.28471511602401733, -0.2693418562412262, -0.2539685368537903, -0.23859521746635437, -0.22322189807891846, -0.20784857869148254, -0.19247525930404663, -0.17710192501544952, -0.1617286056280136, -0.1463552862405777, -0.13098196685314178, -0.11560864746570587, -0.10023532062768936, -0.08486200124025345, -0.06948868185281754, -0.054115355014801025, -0.03874203562736511, -0.0233687162399292, -0.007995394989848137, 0.007377926260232925, 0.022751249372959137, 0.03812456876039505, 0.05349788814783096, 0.06887121498584747, 0.08424453437328339, 0.0996178537607193, 0.11499117314815521, 0.13036449253559113, 0.14573782682418823, 0.16111114621162415, 0.17648446559906006, 0.19185778498649597, 0.20723110437393188, 0.2226044237613678]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 5.0, 6.0, 10.0, 8.0, 5.0, 11.0, 10.0, 15.0, 14.0, 12.0, 19.0, 20.0, 21.0, 20.0, 26.0, 27.0, 32.0, 28.0, 32.0, 32.0, 35.0, 44.0, 44.0, 36.0, 54.0, 46.0, 38.0, 33.0, 33.0, 27.0, 29.0, 25.0, 28.0, 25.0, 13.0, 23.0, 18.0, 12.0, 17.0, 18.0, 15.0, 6.0, 6.0, 7.0, 8.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.10703080892562866, -0.10381944477558136, -0.10060808807611465, -0.09739673137664795, -0.09418536722660065, -0.09097400307655334, -0.08776264637708664, -0.08455128967761993, -0.08133992552757263, -0.07812856137752533, -0.07491720467805862, -0.07170584797859192, -0.06849448382854462, -0.06528311967849731, -0.06207176297903061, -0.058860402554273605, -0.0556490421295166, -0.0524376817047596, -0.049226321280002594, -0.04601496085524559, -0.042803600430488586, -0.03959224000573158, -0.03638087958097458, -0.033169519156217575, -0.02995815873146057, -0.026746798306703568, -0.023535437881946564, -0.02032407745718956, -0.017112717032432556, -0.013901356607675552, -0.010689996182918549, -0.007478635758161545, -0.004267275333404541, -0.0010559149086475372, 0.0021554455161094666, 0.00536680594086647, 0.008578166365623474, 0.011789526790380478, 0.015000887215137482, 0.018212247639894485, 0.02142360806465149, 0.024634968489408493, 0.027846328914165497, 0.0310576893389225, 0.034269049763679504, 0.03748041018843651, 0.04069177061319351, 0.043903131037950516, 0.04711449146270752, 0.05032585188746452, 0.05353721231222153, 0.05674857273697853, 0.059959933161735535, 0.06317129731178284, 0.06638265401124954, 0.06959401071071625, 0.07280537486076355, 0.07601673901081085, 0.07922809571027756, 0.08243945240974426, 0.08565081655979156, 0.08886218070983887, 0.09207353740930557, 0.09528489410877228, 0.09849625825881958]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 12.0, 14.0, 10.0, 18.0, 28.0, 30.0, 38.0, 78.0, 142.0, 248.0, 400.0, 681.0, 1333.0, 2883.0, 7645.0, 34391.0, 2496242.0, 1604704.0, 31994.0, 7432.0, 2801.0, 1328.0, 684.0, 390.0, 244.0, 144.0, 108.0, 58.0, 57.0, 37.0, 21.0, 19.0, 15.0, 6.0, 11.0, 8.0, 1.0, 7.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0295867919921875, -0.028631925582885742, -0.027677059173583984, -0.026722192764282227, -0.02576732635498047, -0.02481245994567871, -0.023857593536376953, -0.022902727127075195, -0.021947860717773438, -0.02099299430847168, -0.020038127899169922, -0.019083261489868164, -0.018128395080566406, -0.01717352867126465, -0.01621866226196289, -0.015263795852661133, -0.014308929443359375, -0.013354063034057617, -0.01239919662475586, -0.011444330215454102, -0.010489463806152344, -0.009534597396850586, -0.008579730987548828, -0.00762486457824707, -0.0066699981689453125, -0.005715131759643555, -0.004760265350341797, -0.003805398941040039, -0.0028505325317382812, -0.0018956661224365234, -0.0009407997131347656, 1.4066696166992188e-05, 0.00096893310546875, 0.0019237995147705078, 0.0028786659240722656, 0.0038335323333740234, 0.004788398742675781, 0.005743265151977539, 0.006698131561279297, 0.007652997970581055, 0.008607864379882812, 0.00956273078918457, 0.010517597198486328, 0.011472463607788086, 0.012427330017089844, 0.013382196426391602, 0.01433706283569336, 0.015291929244995117, 0.016246795654296875, 0.017201662063598633, 0.01815652847290039, 0.01911139488220215, 0.020066261291503906, 0.021021127700805664, 0.021975994110107422, 0.02293086051940918, 0.023885726928710938, 0.024840593338012695, 0.025795459747314453, 0.02675032615661621, 0.02770519256591797, 0.028660058975219727, 0.029614925384521484, 0.030569791793823242, 0.031524658203125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 13.0, 16.0, 15.0, 20.0, 36.0, 40.0, 52.0, 65.0, 76.0, 60.0, 86.0, 79.0, 78.0, 63.0, 87.0, 53.0, 34.0, 33.0, 28.0, 17.0, 8.0, 12.0, 7.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0106048583984375, -0.010284423828125, -0.0099639892578125, -0.0096435546875, -0.0093231201171875, -0.009002685546875, -0.0086822509765625, -0.00836181640625, -0.0080413818359375, -0.007720947265625, -0.0074005126953125, -0.007080078125, -0.0067596435546875, -0.006439208984375, -0.0061187744140625, -0.00579833984375, -0.0054779052734375, -0.005157470703125, -0.0048370361328125, -0.0045166015625, -0.0041961669921875, -0.003875732421875, -0.0035552978515625, -0.00323486328125, -0.0029144287109375, -0.002593994140625, -0.0022735595703125, -0.001953125, -0.0016326904296875, -0.001312255859375, -0.0009918212890625, -0.00067138671875, -0.0003509521484375, -3.0517578125e-05, 0.0002899169921875, 0.0006103515625, 0.0009307861328125, 0.001251220703125, 0.0015716552734375, 0.00189208984375, 0.0022125244140625, 0.002532958984375, 0.0028533935546875, 0.003173828125, 0.0034942626953125, 0.003814697265625, 0.0041351318359375, 0.00445556640625, 0.0047760009765625, 0.005096435546875, 0.0054168701171875, 0.0057373046875, 0.0060577392578125, 0.006378173828125, 0.0066986083984375, 0.00701904296875, 0.0073394775390625, 0.007659912109375, 0.0079803466796875, 0.00830078125, 0.0086212158203125, 0.008941650390625, 0.0092620849609375, 0.00958251953125, 0.0099029541015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 15.0, 10.0, 30.0, 35.0, 48.0, 82.0, 111.0, 209.0, 377.0, 832.0, 2342.0, 8810.0, 79299.0, 3963939.0, 122603.0, 10998.0, 2618.0, 928.0, 404.0, 231.0, 125.0, 86.0, 52.0, 40.0, 16.0, 15.0, 13.0, 4.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03179931640625, -0.03075885772705078, -0.029718399047851562, -0.028677940368652344, -0.027637481689453125, -0.026597023010253906, -0.025556564331054688, -0.02451610565185547, -0.02347564697265625, -0.02243518829345703, -0.021394729614257812, -0.020354270935058594, -0.019313812255859375, -0.018273353576660156, -0.017232894897460938, -0.01619243621826172, -0.0151519775390625, -0.014111518859863281, -0.013071060180664062, -0.012030601501464844, -0.010990142822265625, -0.009949684143066406, -0.008909225463867188, -0.007868766784667969, -0.00682830810546875, -0.005787849426269531, -0.0047473907470703125, -0.0037069320678710938, -0.002666473388671875, -0.0016260147094726562, -0.0005855560302734375, 0.00045490264892578125, 0.001495361328125, 0.0025358200073242188, 0.0035762786865234375, 0.004616737365722656, 0.005657196044921875, 0.006697654724121094, 0.0077381134033203125, 0.008778572082519531, 0.00981903076171875, 0.010859489440917969, 0.011899948120117188, 0.012940406799316406, 0.013980865478515625, 0.015021324157714844, 0.016061782836914062, 0.01710224151611328, 0.0181427001953125, 0.01918315887451172, 0.020223617553710938, 0.021264076232910156, 0.022304534912109375, 0.023344993591308594, 0.024385452270507812, 0.02542591094970703, 0.02646636962890625, 0.02750682830810547, 0.028547286987304688, 0.029587745666503906, 0.030628204345703125, 0.031668663024902344, 0.03270912170410156, 0.03374958038330078, 0.0347900390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 13.0, 18.0, 44.0, 98.0, 428.0, 2772.0, 468.0, 111.0, 50.0, 28.0, 17.0, 8.0, 5.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01068115234375, -0.01007223129272461, -0.009463310241699219, -0.008854389190673828, -0.008245468139648438, -0.007636547088623047, -0.007027626037597656, -0.006418704986572266, -0.005809783935546875, -0.005200862884521484, -0.004591941833496094, -0.003983020782470703, -0.0033740997314453125, -0.002765178680419922, -0.0021562576293945312, -0.0015473365783691406, -0.00093841552734375, -0.0003294944763183594, 0.00027942657470703125, 0.0008883476257324219, 0.0014972686767578125, 0.002106189727783203, 0.0027151107788085938, 0.0033240318298339844, 0.003932952880859375, 0.004541873931884766, 0.005150794982910156, 0.005759716033935547, 0.0063686370849609375, 0.006977558135986328, 0.007586479187011719, 0.00819540023803711, 0.0088043212890625, 0.00941324234008789, 0.010022163391113281, 0.010631084442138672, 0.011240005493164062, 0.011848926544189453, 0.012457847595214844, 0.013066768646240234, 0.013675689697265625, 0.014284610748291016, 0.014893531799316406, 0.015502452850341797, 0.016111373901367188, 0.016720294952392578, 0.01732921600341797, 0.01793813705444336, 0.01854705810546875, 0.01915597915649414, 0.01976490020751953, 0.020373821258544922, 0.020982742309570312, 0.021591663360595703, 0.022200584411621094, 0.022809505462646484, 0.023418426513671875, 0.024027347564697266, 0.024636268615722656, 0.025245189666748047, 0.025854110717773438, 0.026463031768798828, 0.02707195281982422, 0.02768087387084961, 0.028289794921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 8.0, 49.0, 253.0, 471.0, 163.0, 33.0, 9.0, 1.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07124335318803787, -0.06655369699001312, -0.06186404079198837, -0.05717438459396362, -0.05248472839593887, -0.047795072197914124, -0.04310541972517967, -0.03841576352715492, -0.03372610732913017, -0.029036451131105423, -0.024346794933080673, -0.019657140597701073, -0.014967484399676323, -0.010277828201651573, -0.005588173866271973, -0.0008985176682472229, 0.003791138529777527, 0.008480794727802277, 0.013170449994504452, 0.017860105261206627, 0.022549761459231377, 0.027239417657256126, 0.03192907199263573, 0.03661872819066048, 0.041308384388685226, 0.045998040586709976, 0.050687696784734726, 0.05537734925746918, 0.06006700545549393, 0.06475666165351868, 0.06944631785154343, 0.07413597404956818, 0.07882562279701233, 0.08351527899503708, 0.08820493519306183, 0.09289459139108658, 0.09758424758911133, 0.10227390378713608, 0.10696355998516083, 0.11165320873260498, 0.11634287238121033, 0.12103252857923508, 0.12572218477725983, 0.13041183352470398, 0.13510149717330933, 0.13979114592075348, 0.14448080956935883, 0.14917045831680298, 0.15386012196540833, 0.15854977071285248, 0.16323943436145782, 0.16792908310890198, 0.17261874675750732, 0.17730839550495148, 0.18199805915355682, 0.18668770790100098, 0.19137735664844513, 0.19606700539588928, 0.20075666904449463, 0.20544631779193878, 0.21013598144054413, 0.21482563018798828, 0.21951529383659363, 0.22420494258403778, 0.22889460623264313]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 13.0, 11.0, 21.0, 34.0, 42.0, 40.0, 64.0, 67.0, 77.0, 80.0, 88.0, 82.0, 65.0, 56.0, 71.0, 48.0, 43.0, 26.0, 19.0, 11.0, 7.0, 6.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05135703086853027, -0.04979030415415764, -0.048223577439785004, -0.04665685072541237, -0.045090124011039734, -0.0435233972966671, -0.041956670582294464, -0.04038994386792183, -0.038823217153549194, -0.03725649043917656, -0.035689763724803925, -0.03412303701043129, -0.032556310296058655, -0.03098958358168602, -0.029422856867313385, -0.02785613015294075, -0.026289403438568115, -0.02472267672419548, -0.023155950009822845, -0.02158922329545021, -0.020022496581077576, -0.01845576986670494, -0.016889043152332306, -0.015322316437959671, -0.013755589723587036, -0.012188863009214401, -0.010622136294841766, -0.009055409580469131, -0.007488682866096497, -0.005921956151723862, -0.004355229437351227, -0.002788502722978592, -0.001221776008605957, 0.00034495070576667786, 0.0019116774201393127, 0.0034784041345119476, 0.0050451308488845825, 0.006611857563257217, 0.008178584277629852, 0.009745310992002487, 0.011312037706375122, 0.012878764420747757, 0.014445491135120392, 0.016012217849493027, 0.01757894456386566, 0.019145671278238297, 0.02071239799261093, 0.022279124706983566, 0.0238458514213562, 0.025412578135728836, 0.02697930485010147, 0.028546031564474106, 0.03011275827884674, 0.031679484993219376, 0.03324621170759201, 0.034812938421964645, 0.03637966513633728, 0.037946391850709915, 0.03951311856508255, 0.041079845279455185, 0.04264657199382782, 0.044213298708200455, 0.04578002542257309, 0.047346752136945724, 0.04891347885131836]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 11.0, 8.0, 30.0, 28.0, 68.0, 126.0, 245.0, 445.0, 971.0, 2325.0, 6706.0, 24331.0, 148814.0, 664139.0, 162780.0, 26040.0, 7054.0, 2429.0, 1022.0, 447.0, 231.0, 120.0, 71.0, 44.0, 19.0, 15.0, 14.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0262908935546875, -0.025429487228393555, -0.02456808090209961, -0.023706674575805664, -0.02284526824951172, -0.021983861923217773, -0.021122455596923828, -0.020261049270629883, -0.019399642944335938, -0.018538236618041992, -0.017676830291748047, -0.0168154239654541, -0.015954017639160156, -0.015092611312866211, -0.014231204986572266, -0.01336979866027832, -0.012508392333984375, -0.01164698600769043, -0.010785579681396484, -0.009924173355102539, -0.009062767028808594, -0.008201360702514648, -0.007339954376220703, -0.006478548049926758, -0.0056171417236328125, -0.004755735397338867, -0.003894329071044922, -0.0030329227447509766, -0.0021715164184570312, -0.001310110092163086, -0.0004487037658691406, 0.0004127025604248047, 0.00127410888671875, 0.0021355152130126953, 0.0029969215393066406, 0.003858327865600586, 0.004719734191894531, 0.0055811405181884766, 0.006442546844482422, 0.007303953170776367, 0.008165359497070312, 0.009026765823364258, 0.009888172149658203, 0.010749578475952148, 0.011610984802246094, 0.012472391128540039, 0.013333797454833984, 0.01419520378112793, 0.015056610107421875, 0.01591801643371582, 0.016779422760009766, 0.01764082908630371, 0.018502235412597656, 0.0193636417388916, 0.020225048065185547, 0.021086454391479492, 0.021947860717773438, 0.022809267044067383, 0.023670673370361328, 0.024532079696655273, 0.02539348602294922, 0.026254892349243164, 0.02711629867553711, 0.027977705001831055, 0.028839111328125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 17.0, 22.0, 24.0, 33.0, 49.0, 60.0, 62.0, 87.0, 78.0, 76.0, 82.0, 91.0, 76.0, 61.0, 47.0, 35.0, 21.0, 22.0, 7.0, 9.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.01198577880859375, -0.01162874698638916, -0.01127171516418457, -0.01091468334197998, -0.01055765151977539, -0.0102006196975708, -0.009843587875366211, -0.009486556053161621, -0.009129524230957031, -0.008772492408752441, -0.008415460586547852, -0.008058428764343262, -0.007701396942138672, -0.007344365119934082, -0.006987333297729492, -0.006630301475524902, -0.0062732696533203125, -0.005916237831115723, -0.005559206008911133, -0.005202174186706543, -0.004845142364501953, -0.004488110542297363, -0.0041310787200927734, -0.0037740468978881836, -0.0034170150756835938, -0.003059983253479004, -0.002702951431274414, -0.0023459196090698242, -0.0019888877868652344, -0.0016318559646606445, -0.0012748241424560547, -0.0009177923202514648, -0.000560760498046875, -0.00020372867584228516, 0.0001533031463623047, 0.0005103349685668945, 0.0008673667907714844, 0.0012243986129760742, 0.001581430435180664, 0.001938462257385254, 0.0022954940795898438, 0.0026525259017944336, 0.0030095577239990234, 0.0033665895462036133, 0.003723621368408203, 0.004080653190612793, 0.004437685012817383, 0.004794716835021973, 0.0051517486572265625, 0.005508780479431152, 0.005865812301635742, 0.006222844123840332, 0.006579875946044922, 0.006936907768249512, 0.0072939395904541016, 0.007650971412658691, 0.008008003234863281, 0.008365035057067871, 0.008722066879272461, 0.00907909870147705, 0.00943613052368164, 0.00979316234588623, 0.01015019416809082, 0.01050722599029541, 0.0108642578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 11.0, 23.0, 30.0, 21.0, 48.0, 51.0, 78.0, 103.0, 189.0, 255.0, 510.0, 1010.0, 2282.0, 6585.0, 25805.0, 147570.0, 674208.0, 152240.0, 26091.0, 6805.0, 2348.0, 962.0, 493.0, 276.0, 167.0, 114.0, 78.0, 49.0, 24.0, 29.0, 16.0, 22.0, 11.0, 8.0, 7.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0215301513671875, -0.02090620994567871, -0.020282268524169922, -0.019658327102661133, -0.019034385681152344, -0.018410444259643555, -0.017786502838134766, -0.017162561416625977, -0.016538619995117188, -0.0159146785736084, -0.01529073715209961, -0.01466679573059082, -0.014042854309082031, -0.013418912887573242, -0.012794971466064453, -0.012171030044555664, -0.011547088623046875, -0.010923147201538086, -0.010299205780029297, -0.009675264358520508, -0.009051322937011719, -0.00842738151550293, -0.007803440093994141, -0.0071794986724853516, -0.0065555572509765625, -0.0059316158294677734, -0.005307674407958984, -0.004683732986450195, -0.004059791564941406, -0.003435850143432617, -0.002811908721923828, -0.002187967300415039, -0.00156402587890625, -0.0009400844573974609, -0.0003161430358886719, 0.0003077983856201172, 0.0009317398071289062, 0.0015556812286376953, 0.0021796226501464844, 0.0028035640716552734, 0.0034275054931640625, 0.0040514469146728516, 0.004675388336181641, 0.00529932975769043, 0.005923271179199219, 0.006547212600708008, 0.007171154022216797, 0.007795095443725586, 0.008419036865234375, 0.009042978286743164, 0.009666919708251953, 0.010290861129760742, 0.010914802551269531, 0.01153874397277832, 0.01216268539428711, 0.012786626815795898, 0.013410568237304688, 0.014034509658813477, 0.014658451080322266, 0.015282392501831055, 0.015906333923339844, 0.016530275344848633, 0.017154216766357422, 0.01777815818786621, 0.018402099609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 11.0, 9.0, 6.0, 7.0, 7.0, 15.0, 18.0, 23.0, 13.0, 21.0, 24.0, 32.0, 47.0, 34.0, 51.0, 42.0, 48.0, 49.0, 49.0, 48.0, 54.0, 46.0, 49.0, 61.0, 39.0, 36.0, 34.0, 20.0, 24.0, 14.0, 11.0, 13.0, 12.0, 9.0, 4.0, 1.0, 9.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.027374267578125, -0.026536226272583008, -0.025698184967041016, -0.024860143661499023, -0.02402210235595703, -0.02318406105041504, -0.022346019744873047, -0.021507978439331055, -0.020669937133789062, -0.01983189582824707, -0.018993854522705078, -0.018155813217163086, -0.017317771911621094, -0.0164797306060791, -0.01564168930053711, -0.014803647994995117, -0.013965606689453125, -0.013127565383911133, -0.01228952407836914, -0.011451482772827148, -0.010613441467285156, -0.009775400161743164, -0.008937358856201172, -0.00809931755065918, -0.0072612762451171875, -0.006423234939575195, -0.005585193634033203, -0.004747152328491211, -0.003909111022949219, -0.0030710697174072266, -0.0022330284118652344, -0.0013949871063232422, -0.00055694580078125, 0.0002810955047607422, 0.0011191368103027344, 0.0019571781158447266, 0.0027952194213867188, 0.003633260726928711, 0.004471302032470703, 0.005309343338012695, 0.0061473846435546875, 0.00698542594909668, 0.007823467254638672, 0.008661508560180664, 0.009499549865722656, 0.010337591171264648, 0.01117563247680664, 0.012013673782348633, 0.012851715087890625, 0.013689756393432617, 0.01452779769897461, 0.015365839004516602, 0.016203880310058594, 0.017041921615600586, 0.017879962921142578, 0.01871800422668457, 0.019556045532226562, 0.020394086837768555, 0.021232128143310547, 0.02207016944885254, 0.02290821075439453, 0.023746252059936523, 0.024584293365478516, 0.025422334671020508, 0.0262603759765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 5.0, 2.0, 1.0, 4.0, 6.0, 10.0, 21.0, 31.0, 38.0, 90.0, 148.0, 306.0, 776.0, 3190.0, 55984.0, 950201.0, 33840.0, 2586.0, 689.0, 298.0, 118.0, 84.0, 52.0, 21.0, 20.0, 20.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0285491943359375, -0.027843236923217773, -0.027137279510498047, -0.02643132209777832, -0.025725364685058594, -0.025019407272338867, -0.02431344985961914, -0.023607492446899414, -0.022901535034179688, -0.02219557762145996, -0.021489620208740234, -0.020783662796020508, -0.02007770538330078, -0.019371747970581055, -0.018665790557861328, -0.0179598331451416, -0.017253875732421875, -0.01654791831970215, -0.015841960906982422, -0.015136003494262695, -0.014430046081542969, -0.013724088668823242, -0.013018131256103516, -0.012312173843383789, -0.011606216430664062, -0.010900259017944336, -0.01019430160522461, -0.009488344192504883, -0.008782386779785156, -0.00807642936706543, -0.007370471954345703, -0.0066645145416259766, -0.00595855712890625, -0.0052525997161865234, -0.004546642303466797, -0.0038406848907470703, -0.0031347274780273438, -0.002428770065307617, -0.0017228126525878906, -0.001016855239868164, -0.0003108978271484375, 0.00039505958557128906, 0.0011010169982910156, 0.0018069744110107422, 0.0025129318237304688, 0.0032188892364501953, 0.003924846649169922, 0.0046308040618896484, 0.005336761474609375, 0.0060427188873291016, 0.006748676300048828, 0.007454633712768555, 0.008160591125488281, 0.008866548538208008, 0.009572505950927734, 0.010278463363647461, 0.010984420776367188, 0.011690378189086914, 0.01239633560180664, 0.013102293014526367, 0.013808250427246094, 0.01451420783996582, 0.015220165252685547, 0.015926122665405273, 0.016632080078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 7.0, 15.0, 10.0, 20.0, 28.0, 20.0, 41.0, 44.0, 63.0, 70.0, 87.0, 92.0, 90.0, 93.0, 78.0, 55.0, 37.0, 37.0, 33.0, 25.0, 17.0, 11.0, 7.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.516145706176758e-05, -7.336307317018509e-05, -7.15646892786026e-05, -6.976630538702011e-05, -6.796792149543762e-05, -6.616953760385513e-05, -6.437115371227264e-05, -6.257276982069016e-05, -6.0774385929107666e-05, -5.897600203752518e-05, -5.717761814594269e-05, -5.53792342543602e-05, -5.358085036277771e-05, -5.178246647119522e-05, -4.998408257961273e-05, -4.818569868803024e-05, -4.6387314796447754e-05, -4.4588930904865265e-05, -4.2790547013282776e-05, -4.099216312170029e-05, -3.91937792301178e-05, -3.739539533853531e-05, -3.559701144695282e-05, -3.379862755537033e-05, -3.200024366378784e-05, -3.0201859772205353e-05, -2.8403475880622864e-05, -2.6605091989040375e-05, -2.4806708097457886e-05, -2.3008324205875397e-05, -2.1209940314292908e-05, -1.941155642271042e-05, -1.761317253112793e-05, -1.581478863954544e-05, -1.4016404747962952e-05, -1.2218020856380463e-05, -1.0419636964797974e-05, -8.621253073215485e-06, -6.822869181632996e-06, -5.024485290050507e-06, -3.2261013984680176e-06, -1.4277175068855286e-06, 3.7066638469696045e-07, 2.1690502762794495e-06, 3.9674341678619385e-06, 5.7658180594444275e-06, 7.5642019510269165e-06, 9.362585842609406e-06, 1.1160969734191895e-05, 1.2959353625774384e-05, 1.4757737517356873e-05, 1.655612140893936e-05, 1.835450530052185e-05, 2.015288919210434e-05, 2.195127308368683e-05, 2.3749656975269318e-05, 2.5548040866851807e-05, 2.7346424758434296e-05, 2.9144808650016785e-05, 3.0943192541599274e-05, 3.274157643318176e-05, 3.453996032476425e-05, 3.633834421634674e-05, 3.813672810792923e-05, 3.993511199951172e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 5.0, 4.0, 6.0, 14.0, 11.0, 22.0, 44.0, 106.0, 224.0, 571.0, 2224.0, 20108.0, 785772.0, 230656.0, 6886.0, 1214.0, 370.0, 137.0, 83.0, 39.0, 26.0, 12.0, 8.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02301025390625, -0.02240157127380371, -0.021792888641357422, -0.021184206008911133, -0.020575523376464844, -0.019966840744018555, -0.019358158111572266, -0.018749475479125977, -0.018140792846679688, -0.0175321102142334, -0.01692342758178711, -0.01631474494934082, -0.01570606231689453, -0.015097379684448242, -0.014488697052001953, -0.013880014419555664, -0.013271331787109375, -0.012662649154663086, -0.012053966522216797, -0.011445283889770508, -0.010836601257324219, -0.01022791862487793, -0.00961923599243164, -0.009010553359985352, -0.008401870727539062, -0.0077931880950927734, -0.007184505462646484, -0.006575822830200195, -0.005967140197753906, -0.005358457565307617, -0.004749774932861328, -0.004141092300415039, -0.00353240966796875, -0.002923727035522461, -0.002315044403076172, -0.0017063617706298828, -0.0010976791381835938, -0.0004889965057373047, 0.00011968612670898438, 0.0007283687591552734, 0.0013370513916015625, 0.0019457340240478516, 0.0025544166564941406, 0.0031630992889404297, 0.0037717819213867188, 0.004380464553833008, 0.004989147186279297, 0.005597829818725586, 0.006206512451171875, 0.006815195083618164, 0.007423877716064453, 0.008032560348510742, 0.008641242980957031, 0.00924992561340332, 0.00985860824584961, 0.010467290878295898, 0.011075973510742188, 0.011684656143188477, 0.012293338775634766, 0.012902021408081055, 0.013510704040527344, 0.014119386672973633, 0.014728069305419922, 0.015336751937866211, 0.0159454345703125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 9.0, 21.0, 49.0, 131.0, 240.0, 257.0, 161.0, 65.0, 26.0, 8.0, 7.0, 4.0, 5.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0288543701171875, -0.028097152709960938, -0.027339935302734375, -0.026582717895507812, -0.02582550048828125, -0.025068283081054688, -0.024311065673828125, -0.023553848266601562, -0.022796630859375, -0.022039413452148438, -0.021282196044921875, -0.020524978637695312, -0.01976776123046875, -0.019010543823242188, -0.018253326416015625, -0.017496109008789062, -0.0167388916015625, -0.015981674194335938, -0.015224456787109375, -0.014467239379882812, -0.01371002197265625, -0.012952804565429688, -0.012195587158203125, -0.011438369750976562, -0.01068115234375, -0.009923934936523438, -0.009166717529296875, -0.008409500122070312, -0.00765228271484375, -0.0068950653076171875, -0.006137847900390625, -0.0053806304931640625, -0.0046234130859375, -0.0038661956787109375, -0.003108978271484375, -0.0023517608642578125, -0.00159454345703125, -0.0008373260498046875, -8.0108642578125e-05, 0.0006771087646484375, 0.001434326171875, 0.0021915435791015625, 0.002948760986328125, 0.0037059783935546875, 0.00446319580078125, 0.0052204132080078125, 0.005977630615234375, 0.0067348480224609375, 0.0074920654296875, 0.008249282836914062, 0.009006500244140625, 0.009763717651367188, 0.01052093505859375, 0.011278152465820312, 0.012035369873046875, 0.012792587280273438, 0.0135498046875, 0.014307022094726562, 0.015064239501953125, 0.015821456909179688, 0.01657867431640625, 0.017335891723632812, 0.018093109130859375, 0.018850326538085938, 0.0196075439453125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 9.0, 14.0, 53.0, 200.0, 378.0, 254.0, 76.0, 19.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.6090952157974243, -0.5977507829666138, -0.5864062905311584, -0.5750618577003479, -0.5637174248695374, -0.5523729920387268, -0.5410284996032715, -0.5296840667724609, -0.5183396339416504, -0.5069952011108398, -0.4956507384777069, -0.484306275844574, -0.4729618430137634, -0.4616173803806305, -0.45027291774749756, -0.438928484916687, -0.4275840222835541, -0.41623955965042114, -0.4048951268196106, -0.39355066418647766, -0.3822062313556671, -0.3708617687225342, -0.35951733589172363, -0.3481728732585907, -0.33682841062545776, -0.32548394799232483, -0.3141395151615143, -0.30279505252838135, -0.2914506196975708, -0.28010615706443787, -0.26876169443130493, -0.2574172616004944, -0.24607279896736145, -0.2347283512353897, -0.22338390350341797, -0.21203944087028503, -0.2006950080394745, -0.18935054540634155, -0.1780060976743698, -0.16666164994239807, -0.15531720221042633, -0.1439727544784546, -0.13262830674648285, -0.12128385156393051, -0.10993940383195877, -0.09859495609998703, -0.08725050091743469, -0.07590605318546295, -0.06456160545349121, -0.05321715772151947, -0.04187270626425743, -0.030528254806995392, -0.01918380707502365, -0.00783935934305191, 0.0035050958395004272, 0.014849543571472168, 0.02619399130344391, 0.03753843903541565, 0.04888289049267769, 0.06022734194993973, 0.07157178968191147, 0.08291623741388321, 0.09426069259643555, 0.10560514032840729, 0.11694958806037903]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 7.0, 6.0, 7.0, 1.0, 15.0, 11.0, 13.0, 18.0, 17.0, 17.0, 23.0, 25.0, 24.0, 37.0, 34.0, 38.0, 39.0, 36.0, 28.0, 35.0, 59.0, 48.0, 45.0, 52.0, 37.0, 44.0, 37.0, 30.0, 24.0, 24.0, 17.0, 22.0, 26.0, 16.0, 18.0, 15.0, 14.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12144136428833008, -0.1178487241268158, -0.11425607651472092, -0.11066343635320663, -0.10707078874111176, -0.10347814857959747, -0.09988550841808319, -0.09629286825656891, -0.09270022064447403, -0.08910758048295975, -0.08551493287086487, -0.08192229270935059, -0.0783296525478363, -0.07473700493574142, -0.07114436477422714, -0.06755171716213226, -0.06395907700061798, -0.0603664331138134, -0.05677378922700882, -0.05318114906549454, -0.04958850517868996, -0.045995861291885376, -0.042403221130371094, -0.03881057724356651, -0.03521793335676193, -0.03162528946995735, -0.02803264744579792, -0.02444000542163849, -0.020847361534833908, -0.017254717648029327, -0.013662075623869896, -0.010069433599710464, -0.006476789712905884, -0.0028841467574238777, 0.0007084961980581284, 0.004301139153540134, 0.00789378210902214, 0.011486425995826721, 0.015079068019986153, 0.018671710044145584, 0.022264353930950165, 0.025856997817754745, 0.029449639841914177, 0.03304228186607361, 0.03663492575287819, 0.04022756963968277, 0.04382020980119705, 0.04741285368800163, 0.05100549757480621, 0.054598141461610794, 0.058190785348415375, 0.06178342550992966, 0.06537607312202454, 0.06896871328353882, 0.0725613534450531, 0.07615399360656738, 0.07974664121866226, 0.08333928138017654, 0.08693192899227142, 0.0905245691537857, 0.09411720931529999, 0.09770985692739487, 0.10130249708890915, 0.10489514470100403, 0.10848778486251831]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 10.0, 14.0, 27.0, 27.0, 51.0, 72.0, 90.0, 140.0, 196.0, 284.0, 479.0, 1079.0, 5532.0, 288604.0, 3886530.0, 8139.0, 1398.0, 592.0, 329.0, 216.0, 159.0, 92.0, 68.0, 50.0, 29.0, 24.0, 15.0, 5.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0272064208984375, -0.025915861129760742, -0.024625301361083984, -0.023334741592407227, -0.02204418182373047, -0.02075362205505371, -0.019463062286376953, -0.018172502517700195, -0.016881942749023438, -0.01559138298034668, -0.014300823211669922, -0.013010263442993164, -0.011719703674316406, -0.010429143905639648, -0.00913858413696289, -0.007848024368286133, -0.006557464599609375, -0.005266904830932617, -0.003976345062255859, -0.0026857852935791016, -0.0013952255249023438, -0.00010466575622558594, 0.0011858940124511719, 0.0024764537811279297, 0.0037670135498046875, 0.005057573318481445, 0.006348133087158203, 0.007638692855834961, 0.008929252624511719, 0.010219812393188477, 0.011510372161865234, 0.012800931930541992, 0.01409149169921875, 0.015382051467895508, 0.016672611236572266, 0.017963171005249023, 0.01925373077392578, 0.02054429054260254, 0.021834850311279297, 0.023125410079956055, 0.024415969848632812, 0.02570652961730957, 0.026997089385986328, 0.028287649154663086, 0.029578208923339844, 0.0308687686920166, 0.03215932846069336, 0.03344988822937012, 0.034740447998046875, 0.03603100776672363, 0.03732156753540039, 0.03861212730407715, 0.039902687072753906, 0.041193246841430664, 0.04248380661010742, 0.04377436637878418, 0.04506492614746094, 0.046355485916137695, 0.04764604568481445, 0.04893660545349121, 0.05022716522216797, 0.05151772499084473, 0.052808284759521484, 0.05409884452819824, 0.055389404296875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 8.0, 10.0, 17.0, 23.0, 29.0, 30.0, 53.0, 61.0, 78.0, 89.0, 73.0, 84.0, 95.0, 75.0, 63.0, 54.0, 48.0, 25.0, 28.0, 10.0, 10.0, 5.0, 14.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0119171142578125, -0.01154792308807373, -0.011178731918334961, -0.010809540748596191, -0.010440349578857422, -0.010071158409118652, -0.009701967239379883, -0.009332776069641113, -0.008963584899902344, -0.008594393730163574, -0.008225202560424805, -0.007856011390686035, -0.007486820220947266, -0.007117629051208496, -0.0067484378814697266, -0.006379246711730957, -0.0060100555419921875, -0.005640864372253418, -0.0052716732025146484, -0.004902482032775879, -0.004533290863037109, -0.00416409969329834, -0.0037949085235595703, -0.0034257173538208008, -0.0030565261840820312, -0.0026873350143432617, -0.002318143844604492, -0.0019489526748657227, -0.0015797615051269531, -0.0012105703353881836, -0.0008413791656494141, -0.00047218799591064453, -0.000102996826171875, 0.00026619434356689453, 0.0006353855133056641, 0.0010045766830444336, 0.0013737678527832031, 0.0017429590225219727, 0.002112150192260742, 0.0024813413619995117, 0.0028505325317382812, 0.0032197237014770508, 0.0035889148712158203, 0.00395810604095459, 0.004327297210693359, 0.004696488380432129, 0.0050656795501708984, 0.005434870719909668, 0.0058040618896484375, 0.006173253059387207, 0.0065424442291259766, 0.006911635398864746, 0.007280826568603516, 0.007650017738342285, 0.008019208908081055, 0.008388400077819824, 0.008757591247558594, 0.009126782417297363, 0.009495973587036133, 0.009865164756774902, 0.010234355926513672, 0.010603547096252441, 0.010972738265991211, 0.01134192943572998, 0.01171112060546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 8.0, 9.0, 11.0, 17.0, 34.0, 44.0, 70.0, 103.0, 172.0, 350.0, 846.0, 2712.0, 17414.0, 3924044.0, 235864.0, 9459.0, 1868.0, 594.0, 259.0, 135.0, 104.0, 58.0, 41.0, 25.0, 14.0, 9.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0237274169921875, -0.02284407615661621, -0.021960735321044922, -0.021077394485473633, -0.020194053649902344, -0.019310712814331055, -0.018427371978759766, -0.017544031143188477, -0.016660690307617188, -0.0157773494720459, -0.01489400863647461, -0.01401066780090332, -0.013127326965332031, -0.012243986129760742, -0.011360645294189453, -0.010477304458618164, -0.009593963623046875, -0.008710622787475586, -0.007827281951904297, -0.006943941116333008, -0.006060600280761719, -0.00517725944519043, -0.004293918609619141, -0.0034105777740478516, -0.0025272369384765625, -0.0016438961029052734, -0.0007605552673339844, 0.0001227855682373047, 0.0010061264038085938, 0.0018894672393798828, 0.002772808074951172, 0.003656148910522461, 0.00453948974609375, 0.005422830581665039, 0.006306171417236328, 0.007189512252807617, 0.008072853088378906, 0.008956193923950195, 0.009839534759521484, 0.010722875595092773, 0.011606216430664062, 0.012489557266235352, 0.01337289810180664, 0.01425623893737793, 0.015139579772949219, 0.016022920608520508, 0.016906261444091797, 0.017789602279663086, 0.018672943115234375, 0.019556283950805664, 0.020439624786376953, 0.021322965621948242, 0.02220630645751953, 0.02308964729309082, 0.02397298812866211, 0.0248563289642334, 0.025739669799804688, 0.026623010635375977, 0.027506351470947266, 0.028389692306518555, 0.029273033142089844, 0.030156373977661133, 0.031039714813232422, 0.03192305564880371, 0.032806396484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 11.0, 20.0, 37.0, 110.0, 585.0, 3111.0, 112.0, 42.0, 22.0, 12.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002635955810546875, -0.0024725794792175293, -0.0023092031478881836, -0.002145826816558838, -0.001982450485229492, -0.0018190741539001465, -0.0016556978225708008, -0.001492321491241455, -0.0013289451599121094, -0.0011655688285827637, -0.001002192497253418, -0.0008388161659240723, -0.0006754398345947266, -0.0005120635032653809, -0.00034868717193603516, -0.00018531084060668945, -2.193450927734375e-05, 0.00014144182205200195, 0.00030481815338134766, 0.00046819448471069336, 0.0006315708160400391, 0.0007949471473693848, 0.0009583234786987305, 0.0011216998100280762, 0.0012850761413574219, 0.0014484524726867676, 0.0016118288040161133, 0.001775205135345459, 0.0019385814666748047, 0.0021019577980041504, 0.002265334129333496, 0.002428710460662842, 0.0025920867919921875, 0.002755463123321533, 0.002918839454650879, 0.0030822157859802246, 0.0032455921173095703, 0.003408968448638916, 0.0035723447799682617, 0.0037357211112976074, 0.003899097442626953, 0.004062473773956299, 0.0042258501052856445, 0.00438922643661499, 0.004552602767944336, 0.004715979099273682, 0.004879355430603027, 0.005042731761932373, 0.005206108093261719, 0.0053694844245910645, 0.00553286075592041, 0.005696237087249756, 0.0058596134185791016, 0.006022989749908447, 0.006186366081237793, 0.006349742412567139, 0.006513118743896484, 0.00667649507522583, 0.006839871406555176, 0.0070032477378845215, 0.007166624069213867, 0.007330000400543213, 0.007493376731872559, 0.007656753063201904, 0.00782012939453125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 15.0, 60.0, 186.0, 283.0, 275.0, 124.0, 42.0, 12.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014445389620959759, -0.013472361490130424, -0.012499332427978516, -0.011526304297149181, -0.010553276166319847, -0.009580247104167938, -0.008607218973338604, -0.007634190376847982, -0.006661161780357361, -0.005688133183866739, -0.004715104587376118, -0.0037420764565467834, -0.002769047860056162, -0.0017960192635655403, -0.0008229911327362061, 0.0001500374637544155, 0.001123066060245037, 0.0020960946567356586, 0.0030691230203956366, 0.0040421513840556145, 0.005015179980546236, 0.005988208577036858, 0.006961236707866192, 0.007934264838695526, 0.008907293900847435, 0.00988032203167677, 0.010853351093828678, 0.011826379224658012, 0.012799408286809921, 0.013772436417639256, 0.01474546454846859, 0.0157184936106205, 0.01669152081012726, 0.017664549872279167, 0.018637577071785927, 0.019610606133937836, 0.020583635196089745, 0.021556664258241653, 0.022529691457748413, 0.023502720519900322, 0.02447574958205223, 0.02544877864420414, 0.0264218058437109, 0.027394834905862808, 0.028367863968014717, 0.029340893030166626, 0.030313920229673386, 0.031286947429180145, 0.0322599783539772, 0.03323300555348396, 0.03420603647828102, 0.03517906367778778, 0.03615209087729454, 0.0371251218020916, 0.03809814900159836, 0.03907117620110512, 0.04004420340061188, 0.04101723060011864, 0.041990261524915695, 0.042963288724422455, 0.043936315923929214, 0.04490934684872627, 0.04588237404823303, 0.04685540124773979, 0.04782843217253685]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 4.0, 6.0, 6.0, 7.0, 9.0, 18.0, 10.0, 13.0, 20.0, 27.0, 27.0, 34.0, 32.0, 25.0, 30.0, 44.0, 54.0, 39.0, 38.0, 44.0, 42.0, 31.0, 43.0, 38.0, 38.0, 21.0, 27.0, 35.0, 38.0, 17.0, 22.0, 23.0, 21.0, 16.0, 19.0, 13.0, 18.0, 13.0, 3.0, 5.0, 2.0, 4.0, 5.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.005124390125274658, -0.004947606474161148, -0.004770822823047638, -0.004594039171934128, -0.004417255520820618, -0.0042404718697071075, -0.004063688218593597, -0.0038869045674800873, -0.003710120916366577, -0.003533337265253067, -0.003356553614139557, -0.0031797699630260468, -0.0030029863119125366, -0.0028262026607990265, -0.0026494190096855164, -0.0024726353585720062, -0.002295851707458496, -0.002119068056344986, -0.0019422844052314758, -0.0017655007541179657, -0.0015887171030044556, -0.0014119334518909454, -0.0012351498007774353, -0.0010583661496639252, -0.000881582498550415, -0.0007047988474369049, -0.0005280151963233948, -0.00035123154520988464, -0.0001744478940963745, 2.33575701713562e-06, 0.00017911940813064575, 0.0003559030592441559, 0.000532686710357666, 0.0007094703614711761, 0.0008862540125846863, 0.0010630376636981964, 0.0012398213148117065, 0.0014166049659252167, 0.0015933886170387268, 0.001770172268152237, 0.001946955919265747, 0.002123739570379257, 0.0023005232214927673, 0.0024773068726062775, 0.0026540905237197876, 0.0028308741748332977, 0.003007657825946808, 0.003184441477060318, 0.003361225128173828, 0.0035380087792873383, 0.0037147924304008484, 0.0038915760815143585, 0.004068359732627869, 0.004245143383741379, 0.004421927034854889, 0.004598710685968399, 0.004775494337081909, 0.004952277988195419, 0.0051290616393089294, 0.00530584529042244, 0.00548262894153595, 0.00565941259264946, 0.00583619624376297, 0.00601297989487648, 0.00618976354598999]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 6.0, 11.0, 19.0, 31.0, 63.0, 97.0, 148.0, 307.0, 646.0, 1400.0, 3678.0, 12006.0, 51816.0, 295143.0, 526358.0, 122334.0, 23720.0, 6539.0, 2273.0, 951.0, 488.0, 207.0, 126.0, 68.0, 43.0, 20.0, 14.0, 14.0, 7.0, 5.0, 3.0, 0.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0216217041015625, -0.020929813385009766, -0.02023792266845703, -0.019546031951904297, -0.018854141235351562, -0.018162250518798828, -0.017470359802246094, -0.01677846908569336, -0.016086578369140625, -0.01539468765258789, -0.014702796936035156, -0.014010906219482422, -0.013319015502929688, -0.012627124786376953, -0.011935234069824219, -0.011243343353271484, -0.01055145263671875, -0.009859561920166016, -0.009167671203613281, -0.008475780487060547, -0.0077838897705078125, -0.007091999053955078, -0.006400108337402344, -0.005708217620849609, -0.005016326904296875, -0.004324436187744141, -0.0036325454711914062, -0.002940654754638672, -0.0022487640380859375, -0.0015568733215332031, -0.0008649826049804688, -0.00017309188842773438, 0.000518798828125, 0.0012106895446777344, 0.0019025802612304688, 0.002594470977783203, 0.0032863616943359375, 0.003978252410888672, 0.004670143127441406, 0.005362033843994141, 0.006053924560546875, 0.006745815277099609, 0.007437705993652344, 0.008129596710205078, 0.008821487426757812, 0.009513378143310547, 0.010205268859863281, 0.010897159576416016, 0.01158905029296875, 0.012280941009521484, 0.012972831726074219, 0.013664722442626953, 0.014356613159179688, 0.015048503875732422, 0.015740394592285156, 0.01643228530883789, 0.017124176025390625, 0.01781606674194336, 0.018507957458496094, 0.019199848175048828, 0.019891738891601562, 0.020583629608154297, 0.02127552032470703, 0.021967411041259766, 0.0226593017578125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 8.0, 14.0, 17.0, 23.0, 28.0, 38.0, 48.0, 64.0, 66.0, 74.0, 71.0, 100.0, 83.0, 81.0, 63.0, 57.0, 42.0, 29.0, 29.0, 10.0, 15.0, 6.0, 14.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.011871337890625, -0.011504530906677246, -0.011137723922729492, -0.010770916938781738, -0.010404109954833984, -0.01003730297088623, -0.009670495986938477, -0.009303689002990723, -0.008936882019042969, -0.008570075035095215, -0.008203268051147461, -0.007836461067199707, -0.007469654083251953, -0.007102847099304199, -0.006736040115356445, -0.006369233131408691, -0.0060024261474609375, -0.005635619163513184, -0.00526881217956543, -0.004902005195617676, -0.004535198211669922, -0.004168391227722168, -0.003801584243774414, -0.00343477725982666, -0.0030679702758789062, -0.0027011632919311523, -0.0023343563079833984, -0.0019675493240356445, -0.0016007423400878906, -0.0012339353561401367, -0.0008671283721923828, -0.0005003213882446289, -0.000133514404296875, 0.0002332925796508789, 0.0006000995635986328, 0.0009669065475463867, 0.0013337135314941406, 0.0017005205154418945, 0.0020673274993896484, 0.0024341344833374023, 0.0028009414672851562, 0.00316774845123291, 0.003534555435180664, 0.003901362419128418, 0.004268169403076172, 0.004634976387023926, 0.00500178337097168, 0.005368590354919434, 0.0057353973388671875, 0.006102204322814941, 0.006469011306762695, 0.006835818290710449, 0.007202625274658203, 0.007569432258605957, 0.007936239242553711, 0.008303046226501465, 0.008669853210449219, 0.009036660194396973, 0.009403467178344727, 0.00977027416229248, 0.010137081146240234, 0.010503888130187988, 0.010870695114135742, 0.011237502098083496, 0.01160430908203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 7.0, 9.0, 18.0, 18.0, 18.0, 32.0, 28.0, 51.0, 40.0, 69.0, 82.0, 122.0, 183.0, 293.0, 618.0, 1310.0, 3445.0, 11023.0, 44694.0, 269462.0, 574229.0, 110190.0, 22139.0, 6177.0, 2172.0, 837.0, 384.0, 260.0, 153.0, 125.0, 76.0, 64.0, 51.0, 35.0, 25.0, 23.0, 12.0, 16.0, 10.0, 11.0, 8.0, 4.0, 7.0, 0.0, 7.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.0186614990234375, -0.018132328987121582, -0.017603158950805664, -0.017073988914489746, -0.016544818878173828, -0.01601564884185791, -0.015486478805541992, -0.014957308769226074, -0.014428138732910156, -0.013898968696594238, -0.01336979866027832, -0.012840628623962402, -0.012311458587646484, -0.011782288551330566, -0.011253118515014648, -0.01072394847869873, -0.010194778442382812, -0.009665608406066895, -0.009136438369750977, -0.008607268333435059, -0.00807809829711914, -0.007548928260803223, -0.007019758224487305, -0.006490588188171387, -0.005961418151855469, -0.005432248115539551, -0.004903078079223633, -0.004373908042907715, -0.003844738006591797, -0.003315567970275879, -0.002786397933959961, -0.002257227897644043, -0.001728057861328125, -0.001198887825012207, -0.0006697177886962891, -0.0001405477523803711, 0.0003886222839355469, 0.0009177923202514648, 0.0014469623565673828, 0.0019761323928833008, 0.0025053024291992188, 0.0030344724655151367, 0.0035636425018310547, 0.004092812538146973, 0.004621982574462891, 0.005151152610778809, 0.0056803226470947266, 0.0062094926834106445, 0.0067386627197265625, 0.0072678327560424805, 0.0077970027923583984, 0.008326172828674316, 0.008855342864990234, 0.009384512901306152, 0.00991368293762207, 0.010442852973937988, 0.010972023010253906, 0.011501193046569824, 0.012030363082885742, 0.01255953311920166, 0.013088703155517578, 0.013617873191833496, 0.014147043228149414, 0.014676213264465332, 0.01520538330078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 6.0, 4.0, 13.0, 6.0, 13.0, 20.0, 21.0, 23.0, 34.0, 26.0, 39.0, 32.0, 37.0, 40.0, 53.0, 43.0, 44.0, 51.0, 46.0, 43.0, 42.0, 40.0, 49.0, 29.0, 25.0, 37.0, 31.0, 27.0, 22.0, 17.0, 13.0, 16.0, 11.0, 7.0, 5.0, 8.0, 10.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0249176025390625, -0.0241391658782959, -0.023360729217529297, -0.022582292556762695, -0.021803855895996094, -0.021025419235229492, -0.02024698257446289, -0.01946854591369629, -0.018690109252929688, -0.017911672592163086, -0.017133235931396484, -0.016354799270629883, -0.015576362609863281, -0.01479792594909668, -0.014019489288330078, -0.013241052627563477, -0.012462615966796875, -0.011684179306030273, -0.010905742645263672, -0.01012730598449707, -0.009348869323730469, -0.008570432662963867, -0.007791996002197266, -0.007013559341430664, -0.0062351226806640625, -0.005456686019897461, -0.004678249359130859, -0.003899812698364258, -0.0031213760375976562, -0.0023429393768310547, -0.0015645027160644531, -0.0007860660552978516, -7.62939453125e-06, 0.0007708072662353516, 0.0015492439270019531, 0.0023276805877685547, 0.0031061172485351562, 0.003884553909301758, 0.004662990570068359, 0.005441427230834961, 0.0062198638916015625, 0.006998300552368164, 0.007776737213134766, 0.008555173873901367, 0.009333610534667969, 0.01011204719543457, 0.010890483856201172, 0.011668920516967773, 0.012447357177734375, 0.013225793838500977, 0.014004230499267578, 0.01478266716003418, 0.015561103820800781, 0.016339540481567383, 0.017117977142333984, 0.017896413803100586, 0.018674850463867188, 0.01945328712463379, 0.02023172378540039, 0.021010160446166992, 0.021788597106933594, 0.022567033767700195, 0.023345470428466797, 0.0241239070892334, 0.02490234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 11.0, 14.0, 12.0, 26.0, 15.0, 34.0, 62.0, 95.0, 117.0, 191.0, 298.0, 512.0, 946.0, 1720.0, 3780.0, 9064.0, 25353.0, 80406.0, 279222.0, 429702.0, 147974.0, 43308.0, 14624.0, 5484.0, 2650.0, 1208.0, 637.0, 369.0, 257.0, 161.0, 87.0, 58.0, 45.0, 33.0, 22.0, 13.0, 10.0, 12.0, 2.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004711151123046875, -0.004560351371765137, -0.0044095516204833984, -0.00425875186920166, -0.004107952117919922, -0.003957152366638184, -0.0038063526153564453, -0.003655552864074707, -0.0035047531127929688, -0.0033539533615112305, -0.003203153610229492, -0.003052353858947754, -0.0029015541076660156, -0.0027507543563842773, -0.002599954605102539, -0.0024491548538208008, -0.0022983551025390625, -0.0021475553512573242, -0.001996755599975586, -0.0018459558486938477, -0.0016951560974121094, -0.001544356346130371, -0.0013935565948486328, -0.0012427568435668945, -0.0010919570922851562, -0.000941157341003418, -0.0007903575897216797, -0.0006395578384399414, -0.0004887580871582031, -0.00033795833587646484, -0.00018715858459472656, -3.635883331298828e-05, 0.00011444091796875, 0.0002652406692504883, 0.00041604042053222656, 0.0005668401718139648, 0.0007176399230957031, 0.0008684396743774414, 0.0010192394256591797, 0.001170039176940918, 0.0013208389282226562, 0.0014716386795043945, 0.0016224384307861328, 0.001773238182067871, 0.0019240379333496094, 0.0020748376846313477, 0.002225637435913086, 0.0023764371871948242, 0.0025272369384765625, 0.0026780366897583008, 0.002828836441040039, 0.0029796361923217773, 0.0031304359436035156, 0.003281235694885254, 0.003432035446166992, 0.0035828351974487305, 0.0037336349487304688, 0.003884434700012207, 0.004035234451293945, 0.004186034202575684, 0.004336833953857422, 0.00448763370513916, 0.0046384334564208984, 0.004789233207702637, 0.004940032958984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 8.0, 2.0, 14.0, 12.0, 12.0, 21.0, 20.0, 23.0, 36.0, 41.0, 47.0, 67.0, 71.0, 75.0, 64.0, 67.0, 68.0, 54.0, 47.0, 39.0, 41.0, 24.0, 33.0, 12.0, 22.0, 27.0, 10.0, 11.0, 4.0, 10.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.839897155761719e-05, -4.697777330875397e-05, -4.555657505989075e-05, -4.413537681102753e-05, -4.271417856216431e-05, -4.1292980313301086e-05, -3.9871782064437866e-05, -3.8450583815574646e-05, -3.7029385566711426e-05, -3.5608187317848206e-05, -3.4186989068984985e-05, -3.2765790820121765e-05, -3.1344592571258545e-05, -2.9923394322395325e-05, -2.8502196073532104e-05, -2.7080997824668884e-05, -2.5659799575805664e-05, -2.4238601326942444e-05, -2.2817403078079224e-05, -2.1396204829216003e-05, -1.9975006580352783e-05, -1.8553808331489563e-05, -1.7132610082626343e-05, -1.5711411833763123e-05, -1.4290213584899902e-05, -1.2869015336036682e-05, -1.1447817087173462e-05, -1.0026618838310242e-05, -8.605420589447021e-06, -7.184222340583801e-06, -5.763024091720581e-06, -4.341825842857361e-06, -2.9206275939941406e-06, -1.4994293451309204e-06, -7.82310962677002e-08, 1.34296715259552e-06, 2.7641654014587402e-06, 4.1853636503219604e-06, 5.606561899185181e-06, 7.027760148048401e-06, 8.448958396911621e-06, 9.870156645774841e-06, 1.1291354894638062e-05, 1.2712553143501282e-05, 1.4133751392364502e-05, 1.5554949641227722e-05, 1.6976147890090942e-05, 1.8397346138954163e-05, 1.9818544387817383e-05, 2.1239742636680603e-05, 2.2660940885543823e-05, 2.4082139134407043e-05, 2.5503337383270264e-05, 2.6924535632133484e-05, 2.8345733880996704e-05, 2.9766932129859924e-05, 3.1188130378723145e-05, 3.2609328627586365e-05, 3.4030526876449585e-05, 3.5451725125312805e-05, 3.6872923374176025e-05, 3.8294121623039246e-05, 3.9715319871902466e-05, 4.1136518120765686e-05, 4.2557716369628906e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 10.0, 9.0, 20.0, 40.0, 56.0, 116.0, 206.0, 454.0, 989.0, 2380.0, 6911.0, 24605.0, 119501.0, 515687.0, 300963.0, 56189.0, 13335.0, 4104.0, 1565.0, 692.0, 313.0, 155.0, 91.0, 54.0, 31.0, 20.0, 18.0, 7.0, 8.0, 7.0, 5.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00650787353515625, -0.006289303302764893, -0.006070733070373535, -0.005852162837982178, -0.00563359260559082, -0.005415022373199463, -0.0051964521408081055, -0.004977881908416748, -0.004759311676025391, -0.004540741443634033, -0.004322171211242676, -0.004103600978851318, -0.003885030746459961, -0.0036664605140686035, -0.003447890281677246, -0.0032293200492858887, -0.0030107498168945312, -0.002792179584503174, -0.0025736093521118164, -0.002355039119720459, -0.0021364688873291016, -0.0019178986549377441, -0.0016993284225463867, -0.0014807581901550293, -0.0012621879577636719, -0.0010436177253723145, -0.000825047492980957, -0.0006064772605895996, -0.0003879070281982422, -0.00016933679580688477, 4.9233436584472656e-05, 0.0002678036689758301, 0.0004863739013671875, 0.0007049441337585449, 0.0009235143661499023, 0.0011420845985412598, 0.0013606548309326172, 0.0015792250633239746, 0.001797795295715332, 0.0020163655281066895, 0.002234935760498047, 0.0024535059928894043, 0.0026720762252807617, 0.002890646457672119, 0.0031092166900634766, 0.003327786922454834, 0.0035463571548461914, 0.003764927387237549, 0.003983497619628906, 0.004202067852020264, 0.004420638084411621, 0.0046392083168029785, 0.004857778549194336, 0.005076348781585693, 0.005294919013977051, 0.005513489246368408, 0.005732059478759766, 0.005950629711151123, 0.0061691999435424805, 0.006387770175933838, 0.006606340408325195, 0.006824910640716553, 0.00704348087310791, 0.007262051105499268, 0.007480621337890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 6.0, 6.0, 9.0, 5.0, 10.0, 12.0, 22.0, 19.0, 37.0, 29.0, 41.0, 51.0, 55.0, 47.0, 86.0, 72.0, 72.0, 67.0, 67.0, 47.0, 49.0, 40.0, 34.0, 31.0, 22.0, 13.0, 13.0, 11.0, 5.0, 9.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005908966064453125, -0.005712628364562988, -0.0055162906646728516, -0.005319952964782715, -0.005123615264892578, -0.004927277565002441, -0.004730939865112305, -0.004534602165222168, -0.004338264465332031, -0.0041419267654418945, -0.003945589065551758, -0.003749251365661621, -0.0035529136657714844, -0.0033565759658813477, -0.003160238265991211, -0.0029639005661010742, -0.0027675628662109375, -0.0025712251663208008, -0.002374887466430664, -0.0021785497665405273, -0.0019822120666503906, -0.001785874366760254, -0.0015895366668701172, -0.0013931989669799805, -0.0011968612670898438, -0.001000523567199707, -0.0008041858673095703, -0.0006078481674194336, -0.0004115104675292969, -0.00021517276763916016, -1.8835067749023438e-05, 0.00017750263214111328, 0.00037384033203125, 0.0005701780319213867, 0.0007665157318115234, 0.0009628534317016602, 0.0011591911315917969, 0.0013555288314819336, 0.0015518665313720703, 0.001748204231262207, 0.0019445419311523438, 0.0021408796310424805, 0.002337217330932617, 0.002533555030822754, 0.0027298927307128906, 0.0029262304306030273, 0.003122568130493164, 0.0033189058303833008, 0.0035152435302734375, 0.0037115812301635742, 0.003907918930053711, 0.004104256629943848, 0.004300594329833984, 0.004496932029724121, 0.004693269729614258, 0.0048896074295043945, 0.005085945129394531, 0.005282282829284668, 0.005478620529174805, 0.005674958229064941, 0.005871295928955078, 0.006067633628845215, 0.0062639713287353516, 0.006460309028625488, 0.006656646728515625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 3.0, 14.0, 20.0, 26.0, 50.0, 60.0, 66.0, 102.0, 124.0, 116.0, 107.0, 81.0, 78.0, 45.0, 34.0, 29.0, 15.0, 6.0, 7.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06379878520965576, -0.06030626222491264, -0.056813742965459824, -0.053321219980716705, -0.049828700721263885, -0.04633617773652077, -0.04284365475177765, -0.03935113549232483, -0.03585861623287201, -0.03236609324812889, -0.02887357398867607, -0.025381051003932953, -0.021888531744480133, -0.018396008759737015, -0.014903487637639046, -0.011410966515541077, -0.007918443530797958, -0.004425922408699989, -0.000933400820940733, 0.0025591207668185234, 0.0060516418889164925, 0.009544163942337036, 0.013036685064435005, 0.016529206186532974, 0.020021727308630943, 0.023514248430728912, 0.02700676955282688, 0.03049929067492485, 0.03399181365966797, 0.03748433291912079, 0.04097685590386391, 0.044469378888607025, 0.047961898148059845, 0.05145442113280296, 0.05494694039225578, 0.0584394633769989, 0.06193198263645172, 0.06542450189590454, 0.06891702860593796, 0.07240954786539078, 0.0759020671248436, 0.07939458638429642, 0.08288711309432983, 0.08637963235378265, 0.08987215161323547, 0.0933646708726883, 0.09685719758272171, 0.10034971684217453, 0.10384224355220795, 0.10733476281166077, 0.11082728952169418, 0.114319808781147, 0.11781232804059982, 0.12130485475063324, 0.12479737401008606, 0.12828989326953888, 0.1317824125289917, 0.13527493178844452, 0.13876745104789734, 0.14225997030735016, 0.14575250446796417, 0.149245023727417, 0.1527375429868698, 0.15623006224632263, 0.15972258150577545]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 8.0, 3.0, 8.0, 10.0, 9.0, 18.0, 13.0, 14.0, 17.0, 20.0, 22.0, 25.0, 25.0, 24.0, 19.0, 39.0, 34.0, 33.0, 47.0, 47.0, 58.0, 37.0, 55.0, 47.0, 40.0, 37.0, 30.0, 33.0, 27.0, 30.0, 20.0, 26.0, 12.0, 16.0, 14.0, 14.0, 4.0, 12.0, 7.0, 6.0, 8.0, 5.0, 7.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.10489803552627563, -0.10159571468830109, -0.09829338639974594, -0.0949910581111908, -0.09168873727321625, -0.0883864164352417, -0.08508408814668655, -0.08178175985813141, -0.07847943902015686, -0.07517711818218231, -0.07187478989362717, -0.06857246160507202, -0.06527014076709747, -0.061967816203832626, -0.05866549164056778, -0.05536316707730293, -0.052060842514038086, -0.04875851795077324, -0.04545619338750839, -0.042153868824243546, -0.0388515442609787, -0.03554921969771385, -0.032246895134449005, -0.02894457057118416, -0.02564224600791931, -0.022339921444654465, -0.019037596881389618, -0.01573527231812477, -0.012432947754859924, -0.009130623191595078, -0.005828298628330231, -0.002525974065065384, 0.0007763504981994629, 0.00407867506146431, 0.0073809996247291565, 0.010683324187994003, 0.01398564875125885, 0.017287973314523697, 0.020590297877788544, 0.02389262244105339, 0.027194947004318237, 0.030497271567583084, 0.03379959613084793, 0.03710192069411278, 0.040404245257377625, 0.04370656982064247, 0.04700889438390732, 0.050311218947172165, 0.05361354351043701, 0.05691586807370186, 0.060218192636966705, 0.06352052092552185, 0.0668228417634964, 0.07012516260147095, 0.07342749089002609, 0.07672981917858124, 0.08003214001655579, 0.08333446085453033, 0.08663678914308548, 0.08993911743164062, 0.09324143826961517, 0.09654375910758972, 0.09984608739614487, 0.10314841568470001, 0.10645073652267456]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 9.0, 7.0, 7.0, 19.0, 24.0, 31.0, 47.0, 56.0, 70.0, 126.0, 210.0, 506.0, 1325.0, 5765.0, 70562.0, 4085396.0, 24730.0, 3433.0, 980.0, 374.0, 178.0, 105.0, 57.0, 66.0, 43.0, 25.0, 16.0, 19.0, 17.0, 16.0, 10.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.0379638671875, -0.03697371482849121, -0.03598356246948242, -0.03499341011047363, -0.034003257751464844, -0.033013105392456055, -0.032022953033447266, -0.031032800674438477, -0.030042648315429688, -0.0290524959564209, -0.02806234359741211, -0.02707219123840332, -0.02608203887939453, -0.025091886520385742, -0.024101734161376953, -0.023111581802368164, -0.022121429443359375, -0.021131277084350586, -0.020141124725341797, -0.019150972366333008, -0.01816082000732422, -0.01717066764831543, -0.01618051528930664, -0.015190362930297852, -0.014200210571289062, -0.013210058212280273, -0.012219905853271484, -0.011229753494262695, -0.010239601135253906, -0.009249448776245117, -0.008259296417236328, -0.007269144058227539, -0.00627899169921875, -0.005288839340209961, -0.004298686981201172, -0.003308534622192383, -0.0023183822631835938, -0.0013282299041748047, -0.0003380775451660156, 0.0006520748138427734, 0.0016422271728515625, 0.0026323795318603516, 0.0036225318908691406, 0.00461268424987793, 0.005602836608886719, 0.006592988967895508, 0.007583141326904297, 0.008573293685913086, 0.009563446044921875, 0.010553598403930664, 0.011543750762939453, 0.012533903121948242, 0.013524055480957031, 0.01451420783996582, 0.01550436019897461, 0.0164945125579834, 0.017484664916992188, 0.018474817276000977, 0.019464969635009766, 0.020455121994018555, 0.021445274353027344, 0.022435426712036133, 0.023425579071044922, 0.02441573143005371, 0.0254058837890625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 11.0, 11.0, 13.0, 18.0, 35.0, 36.0, 45.0, 72.0, 71.0, 69.0, 76.0, 79.0, 95.0, 84.0, 69.0, 49.0, 50.0, 21.0, 23.0, 21.0, 11.0, 10.0, 8.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.01168060302734375, -0.011319279670715332, -0.010957956314086914, -0.010596632957458496, -0.010235309600830078, -0.00987398624420166, -0.009512662887573242, -0.009151339530944824, -0.008790016174316406, -0.008428692817687988, -0.00806736946105957, -0.007706046104431152, -0.007344722747802734, -0.006983399391174316, -0.0066220760345458984, -0.0062607526779174805, -0.0058994293212890625, -0.0055381059646606445, -0.0051767826080322266, -0.004815459251403809, -0.004454135894775391, -0.004092812538146973, -0.0037314891815185547, -0.0033701658248901367, -0.0030088424682617188, -0.0026475191116333008, -0.002286195755004883, -0.0019248723983764648, -0.0015635490417480469, -0.001202225685119629, -0.0008409023284912109, -0.00047957897186279297, -0.000118255615234375, 0.00024306774139404297, 0.0006043910980224609, 0.0009657144546508789, 0.0013270378112792969, 0.0016883611679077148, 0.002049684524536133, 0.0024110078811645508, 0.0027723312377929688, 0.0031336545944213867, 0.0034949779510498047, 0.0038563013076782227, 0.004217624664306641, 0.004578948020935059, 0.0049402713775634766, 0.0053015947341918945, 0.0056629180908203125, 0.0060242414474487305, 0.0063855648040771484, 0.006746888160705566, 0.007108211517333984, 0.007469534873962402, 0.00783085823059082, 0.008192181587219238, 0.008553504943847656, 0.008914828300476074, 0.009276151657104492, 0.00963747501373291, 0.009998798370361328, 0.010360121726989746, 0.010721445083618164, 0.011082768440246582, 0.011444091796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 11.0, 8.0, 9.0, 16.0, 27.0, 34.0, 46.0, 86.0, 142.0, 189.0, 359.0, 700.0, 1467.0, 3334.0, 8996.0, 35438.0, 841806.0, 3246878.0, 38692.0, 9560.0, 3449.0, 1409.0, 699.0, 388.0, 220.0, 122.0, 68.0, 34.0, 29.0, 22.0, 17.0, 6.0, 10.0, 9.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01016998291015625, -0.009763598442077637, -0.009357213973999023, -0.00895082950592041, -0.008544445037841797, -0.008138060569763184, -0.00773167610168457, -0.007325291633605957, -0.006918907165527344, -0.0065125226974487305, -0.006106138229370117, -0.005699753761291504, -0.005293369293212891, -0.004886984825134277, -0.004480600357055664, -0.004074215888977051, -0.0036678314208984375, -0.0032614469528198242, -0.002855062484741211, -0.0024486780166625977, -0.0020422935485839844, -0.001635909080505371, -0.0012295246124267578, -0.0008231401443481445, -0.00041675567626953125, -1.0371208190917969e-05, 0.0003960132598876953, 0.0008023977279663086, 0.0012087821960449219, 0.0016151666641235352, 0.0020215511322021484, 0.0024279356002807617, 0.002834320068359375, 0.0032407045364379883, 0.0036470890045166016, 0.004053473472595215, 0.004459857940673828, 0.004866242408752441, 0.005272626876831055, 0.005679011344909668, 0.006085395812988281, 0.0064917802810668945, 0.006898164749145508, 0.007304549217224121, 0.007710933685302734, 0.008117318153381348, 0.008523702621459961, 0.008930087089538574, 0.009336471557617188, 0.0097428560256958, 0.010149240493774414, 0.010555624961853027, 0.01096200942993164, 0.011368393898010254, 0.011774778366088867, 0.01218116283416748, 0.012587547302246094, 0.012993931770324707, 0.01340031623840332, 0.013806700706481934, 0.014213085174560547, 0.01461946964263916, 0.015025854110717773, 0.015432238578796387, 0.015838623046875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 10.0, 11.0, 12.0, 11.0, 28.0, 28.0, 43.0, 82.0, 309.0, 2869.0, 396.0, 122.0, 54.0, 27.0, 16.0, 11.0, 10.0, 5.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0019426345825195312, -0.0018527060747146606, -0.00176277756690979, -0.0016728490591049194, -0.0015829205513000488, -0.0014929920434951782, -0.0014030635356903076, -0.001313135027885437, -0.0012232065200805664, -0.0011332780122756958, -0.0010433495044708252, -0.0009534209966659546, -0.000863492488861084, -0.0007735639810562134, -0.0006836354732513428, -0.0005937069654464722, -0.0005037784576416016, -0.00041384994983673096, -0.00032392144203186035, -0.00023399293422698975, -0.00014406442642211914, -5.4135918617248535e-05, 3.579258918762207e-05, 0.00012572109699249268, 0.00021564960479736328, 0.0003055781126022339, 0.0003955066204071045, 0.0004854351282119751, 0.0005753636360168457, 0.0006652921438217163, 0.0007552206516265869, 0.0008451491594314575, 0.0009350776672363281, 0.0010250061750411987, 0.0011149346828460693, 0.00120486319065094, 0.0012947916984558105, 0.0013847202062606812, 0.0014746487140655518, 0.0015645772218704224, 0.001654505729675293, 0.0017444342374801636, 0.0018343627452850342, 0.0019242912530899048, 0.0020142197608947754, 0.002104148268699646, 0.0021940767765045166, 0.002284005284309387, 0.002373933792114258, 0.0024638622999191284, 0.002553790807723999, 0.0026437193155288696, 0.0027336478233337402, 0.002823576331138611, 0.0029135048389434814, 0.003003433346748352, 0.0030933618545532227, 0.0031832903623580933, 0.003273218870162964, 0.0033631473779678345, 0.003453075885772705, 0.0035430043935775757, 0.0036329329013824463, 0.003722861409187317, 0.0038127899169921875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 11.0, 59.0, 147.0, 250.0, 244.0, 182.0, 75.0, 22.0, 7.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013111122883856297, -0.012131751514971256, -0.011152379214763641, -0.010173007845878601, -0.00919363647699356, -0.00821426510810852, -0.007234893273562193, -0.006255521439015865, -0.005276150070130825, -0.004296778701245785, -0.003317406866699457, -0.0023380352649837732, -0.0013586636632680893, -0.000379292294383049, 0.0006000795401632786, 0.0015794513747096062, 0.0025588227435946465, 0.0035381943453103304, 0.004517565947026014, 0.005496937781572342, 0.006476309150457382, 0.0074556805193424225, 0.008435051888227463, 0.009414424188435078, 0.010393795557320118, 0.011373166926205158, 0.012352539226412773, 0.013331910595297813, 0.014311281964182854, 0.015290653333067894, 0.016270024701952934, 0.017249397933483124, 0.018228769302368164, 0.019208140671253204, 0.020187512040138245, 0.021166883409023285, 0.022146254777908325, 0.023125626146793365, 0.024104999378323555, 0.025084370747208595, 0.026063742116093636, 0.027043113484978676, 0.028022484853863716, 0.029001856222748756, 0.029981229454278946, 0.030960600823163986, 0.031939972192049026, 0.03291934356093407, 0.03389871492981911, 0.03487808629870415, 0.03585745766758919, 0.03683682903647423, 0.03781620040535927, 0.03879557177424431, 0.03977494314312935, 0.04075431823730469, 0.04173368960618973, 0.04271306097507477, 0.04369243234395981, 0.04467180371284485, 0.04565117508172989, 0.04663054645061493, 0.04760991781949997, 0.04858928918838501, 0.04956866055727005]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 7.0, 9.0, 7.0, 16.0, 14.0, 12.0, 24.0, 22.0, 26.0, 28.0, 33.0, 28.0, 33.0, 31.0, 42.0, 45.0, 50.0, 37.0, 41.0, 42.0, 32.0, 32.0, 48.0, 38.0, 41.0, 39.0, 33.0, 34.0, 28.0, 22.0, 20.0, 18.0, 10.0, 9.0, 10.0, 6.0, 7.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0068076252937316895, -0.006594793871045113, -0.006381962448358536, -0.006169131025671959, -0.005956299602985382, -0.005743468180298805, -0.005530636757612228, -0.0053178053349256516, -0.005104973912239075, -0.004892142489552498, -0.004679311066865921, -0.004466479644179344, -0.004253648221492767, -0.0040408167988061905, -0.0038279853761196136, -0.003615153953433037, -0.00340232253074646, -0.003189491108059883, -0.0029766596853733063, -0.0027638282626867294, -0.0025509968400001526, -0.0023381654173135757, -0.002125333994626999, -0.001912502571940422, -0.0016996711492538452, -0.0014868397265672684, -0.0012740083038806915, -0.0010611768811941147, -0.0008483454585075378, -0.000635514035820961, -0.00042268261313438416, -0.0002098511904478073, 2.9802322387695312e-06, 0.00021581165492534637, 0.0004286430776119232, 0.0006414745002985001, 0.0008543059229850769, 0.0010671373456716537, 0.0012799687683582306, 0.0014928001910448074, 0.0017056316137313843, 0.0019184630364179611, 0.002131294459104538, 0.002344125881791115, 0.0025569573044776917, 0.0027697887271642685, 0.0029826201498508453, 0.003195451572537422, 0.003408282995223999, 0.003621114417910576, 0.0038339458405971527, 0.0040467772632837296, 0.004259608685970306, 0.004472440108656883, 0.00468527153134346, 0.004898102954030037, 0.005110934376716614, 0.005323765799403191, 0.0055365972220897675, 0.005749428644776344, 0.005962260067462921, 0.006175091490149498, 0.006387922912836075, 0.006600754335522652, 0.0068135857582092285]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 5.0, 9.0, 16.0, 21.0, 30.0, 70.0, 96.0, 188.0, 297.0, 620.0, 1269.0, 2930.0, 8025.0, 27429.0, 129946.0, 508565.0, 290458.0, 56177.0, 14161.0, 4537.0, 1838.0, 846.0, 457.0, 253.0, 135.0, 66.0, 32.0, 25.0, 23.0, 8.0, 9.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01425933837890625, -0.013726115226745605, -0.013192892074584961, -0.012659668922424316, -0.012126445770263672, -0.011593222618103027, -0.011059999465942383, -0.010526776313781738, -0.009993553161621094, -0.00946033000946045, -0.008927106857299805, -0.00839388370513916, -0.007860660552978516, -0.007327437400817871, -0.0067942142486572266, -0.006260991096496582, -0.0057277679443359375, -0.005194544792175293, -0.0046613216400146484, -0.004128098487854004, -0.0035948753356933594, -0.003061652183532715, -0.0025284290313720703, -0.0019952058792114258, -0.0014619827270507812, -0.0009287595748901367, -0.0003955364227294922, 0.00013768672943115234, 0.0006709098815917969, 0.0012041330337524414, 0.001737356185913086, 0.0022705793380737305, 0.002803802490234375, 0.0033370256423950195, 0.003870248794555664, 0.004403471946716309, 0.004936695098876953, 0.005469918251037598, 0.006003141403198242, 0.006536364555358887, 0.007069587707519531, 0.007602810859680176, 0.00813603401184082, 0.008669257164001465, 0.00920248031616211, 0.009735703468322754, 0.010268926620483398, 0.010802149772644043, 0.011335372924804688, 0.011868596076965332, 0.012401819229125977, 0.012935042381286621, 0.013468265533447266, 0.01400148868560791, 0.014534711837768555, 0.0150679349899292, 0.015601158142089844, 0.01613438129425049, 0.016667604446411133, 0.017200827598571777, 0.017734050750732422, 0.018267273902893066, 0.01880049705505371, 0.019333720207214355, 0.019866943359375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 10.0, 7.0, 13.0, 16.0, 23.0, 30.0, 39.0, 47.0, 66.0, 76.0, 65.0, 82.0, 72.0, 87.0, 73.0, 75.0, 50.0, 40.0, 37.0, 22.0, 20.0, 12.0, 13.0, 9.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.01165008544921875, -0.011289715766906738, -0.010929346084594727, -0.010568976402282715, -0.010208606719970703, -0.009848237037658691, -0.00948786735534668, -0.009127497673034668, -0.008767127990722656, -0.008406758308410645, -0.008046388626098633, -0.007686018943786621, -0.007325649261474609, -0.006965279579162598, -0.006604909896850586, -0.006244540214538574, -0.0058841705322265625, -0.005523800849914551, -0.005163431167602539, -0.004803061485290527, -0.004442691802978516, -0.004082322120666504, -0.003721952438354492, -0.0033615827560424805, -0.0030012130737304688, -0.002640843391418457, -0.0022804737091064453, -0.0019201040267944336, -0.0015597343444824219, -0.0011993646621704102, -0.0008389949798583984, -0.0004786252975463867, -0.000118255615234375, 0.00024211406707763672, 0.0006024837493896484, 0.0009628534317016602, 0.0013232231140136719, 0.0016835927963256836, 0.0020439624786376953, 0.002404332160949707, 0.0027647018432617188, 0.0031250715255737305, 0.003485441207885742, 0.003845810890197754, 0.004206180572509766, 0.004566550254821777, 0.004926919937133789, 0.005287289619445801, 0.0056476593017578125, 0.006008028984069824, 0.006368398666381836, 0.006728768348693848, 0.007089138031005859, 0.007449507713317871, 0.007809877395629883, 0.008170247077941895, 0.008530616760253906, 0.008890986442565918, 0.00925135612487793, 0.009611725807189941, 0.009972095489501953, 0.010332465171813965, 0.010692834854125977, 0.011053204536437988, 0.01141357421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 11.0, 6.0, 9.0, 18.0, 14.0, 32.0, 47.0, 73.0, 104.0, 176.0, 255.0, 482.0, 1293.0, 4566.0, 37138.0, 579583.0, 394196.0, 24748.0, 3530.0, 1072.0, 436.0, 275.0, 135.0, 92.0, 86.0, 56.0, 25.0, 20.0, 13.0, 12.0, 19.0, 9.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02362060546875, -0.022924184799194336, -0.022227764129638672, -0.021531343460083008, -0.020834922790527344, -0.02013850212097168, -0.019442081451416016, -0.01874566078186035, -0.018049240112304688, -0.017352819442749023, -0.01665639877319336, -0.015959978103637695, -0.015263557434082031, -0.014567136764526367, -0.013870716094970703, -0.013174295425415039, -0.012477874755859375, -0.011781454086303711, -0.011085033416748047, -0.010388612747192383, -0.009692192077636719, -0.008995771408081055, -0.00829935073852539, -0.0076029300689697266, -0.0069065093994140625, -0.0062100887298583984, -0.005513668060302734, -0.00481724739074707, -0.004120826721191406, -0.003424406051635742, -0.002727985382080078, -0.002031564712524414, -0.00133514404296875, -0.0006387233734130859, 5.7697296142578125e-05, 0.0007541179656982422, 0.0014505386352539062, 0.0021469593048095703, 0.0028433799743652344, 0.0035398006439208984, 0.0042362213134765625, 0.0049326419830322266, 0.005629062652587891, 0.006325483322143555, 0.007021903991699219, 0.007718324661254883, 0.008414745330810547, 0.009111166000366211, 0.009807586669921875, 0.010504007339477539, 0.011200428009033203, 0.011896848678588867, 0.012593269348144531, 0.013289690017700195, 0.01398611068725586, 0.014682531356811523, 0.015378952026367188, 0.01607537269592285, 0.016771793365478516, 0.01746821403503418, 0.018164634704589844, 0.018861055374145508, 0.019557476043701172, 0.020253896713256836, 0.0209503173828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 10.0, 9.0, 11.0, 4.0, 17.0, 13.0, 18.0, 19.0, 18.0, 20.0, 39.0, 29.0, 39.0, 39.0, 51.0, 38.0, 42.0, 45.0, 43.0, 46.0, 44.0, 37.0, 56.0, 40.0, 39.0, 24.0, 44.0, 33.0, 20.0, 23.0, 11.0, 19.0, 7.0, 17.0, 9.0, 4.0, 9.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.022735595703125, -0.021991729736328125, -0.02124786376953125, -0.020503997802734375, -0.0197601318359375, -0.019016265869140625, -0.01827239990234375, -0.017528533935546875, -0.01678466796875, -0.016040802001953125, -0.01529693603515625, -0.014553070068359375, -0.0138092041015625, -0.013065338134765625, -0.01232147216796875, -0.011577606201171875, -0.010833740234375, -0.010089874267578125, -0.00934600830078125, -0.008602142333984375, -0.0078582763671875, -0.007114410400390625, -0.00637054443359375, -0.005626678466796875, -0.0048828125, -0.004138946533203125, -0.00339508056640625, -0.002651214599609375, -0.0019073486328125, -0.001163482666015625, -0.00041961669921875, 0.000324249267578125, 0.001068115234375, 0.001811981201171875, 0.00255584716796875, 0.003299713134765625, 0.0040435791015625, 0.004787445068359375, 0.00553131103515625, 0.006275177001953125, 0.00701904296875, 0.007762908935546875, 0.00850677490234375, 0.009250640869140625, 0.0099945068359375, 0.010738372802734375, 0.01148223876953125, 0.012226104736328125, 0.012969970703125, 0.013713836669921875, 0.01445770263671875, 0.015201568603515625, 0.0159454345703125, 0.016689300537109375, 0.01743316650390625, 0.018177032470703125, 0.0189208984375, 0.019664764404296875, 0.02040863037109375, 0.021152496337890625, 0.0218963623046875, 0.022640228271484375, 0.02338409423828125, 0.024127960205078125, 0.024871826171875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 11.0, 2.0, 15.0, 18.0, 30.0, 61.0, 102.0, 223.0, 564.0, 2281.0, 24377.0, 839414.0, 173789.0, 5980.0, 1026.0, 339.0, 144.0, 71.0, 51.0, 25.0, 18.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01187896728515625, -0.011450886726379395, -0.011022806167602539, -0.010594725608825684, -0.010166645050048828, -0.009738564491271973, -0.009310483932495117, -0.008882403373718262, -0.008454322814941406, -0.00802624225616455, -0.007598161697387695, -0.00717008113861084, -0.006742000579833984, -0.006313920021057129, -0.0058858394622802734, -0.005457758903503418, -0.0050296783447265625, -0.004601597785949707, -0.0041735172271728516, -0.003745436668395996, -0.0033173561096191406, -0.002889275550842285, -0.0024611949920654297, -0.0020331144332885742, -0.0016050338745117188, -0.0011769533157348633, -0.0007488727569580078, -0.00032079219818115234, 0.00010728836059570312, 0.0005353689193725586, 0.0009634494781494141, 0.0013915300369262695, 0.001819610595703125, 0.0022476911544799805, 0.002675771713256836, 0.0031038522720336914, 0.003531932830810547, 0.003960013389587402, 0.004388093948364258, 0.004816174507141113, 0.005244255065917969, 0.005672335624694824, 0.00610041618347168, 0.006528496742248535, 0.006956577301025391, 0.007384657859802246, 0.007812738418579102, 0.008240818977355957, 0.008668899536132812, 0.009096980094909668, 0.009525060653686523, 0.009953141212463379, 0.010381221771240234, 0.01080930233001709, 0.011237382888793945, 0.0116654634475708, 0.012093544006347656, 0.012521624565124512, 0.012949705123901367, 0.013377785682678223, 0.013805866241455078, 0.014233946800231934, 0.014662027359008789, 0.015090107917785645, 0.0155181884765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 8.0, 4.0, 8.0, 13.0, 20.0, 16.0, 19.0, 28.0, 24.0, 37.0, 37.0, 73.0, 48.0, 71.0, 55.0, 73.0, 87.0, 62.0, 56.0, 32.0, 40.0, 36.0, 29.0, 27.0, 26.0, 13.0, 11.0, 8.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5643577575683594e-05, -3.442354500293732e-05, -3.320351243019104e-05, -3.198347985744476e-05, -3.0763447284698486e-05, -2.954341471195221e-05, -2.8323382139205933e-05, -2.7103349566459656e-05, -2.588331699371338e-05, -2.4663284420967102e-05, -2.3443251848220825e-05, -2.222321927547455e-05, -2.100318670272827e-05, -1.9783154129981995e-05, -1.8563121557235718e-05, -1.734308898448944e-05, -1.6123056411743164e-05, -1.4903023838996887e-05, -1.368299126625061e-05, -1.2462958693504333e-05, -1.1242926120758057e-05, -1.002289354801178e-05, -8.802860975265503e-06, -7.582828402519226e-06, -6.362795829772949e-06, -5.142763257026672e-06, -3.9227306842803955e-06, -2.7026981115341187e-06, -1.4826655387878418e-06, -2.6263296604156494e-07, 9.57399606704712e-07, 2.1774321794509888e-06, 3.3974647521972656e-06, 4.6174973249435425e-06, 5.837529897689819e-06, 7.057562470436096e-06, 8.277595043182373e-06, 9.49762761592865e-06, 1.0717660188674927e-05, 1.1937692761421204e-05, 1.315772533416748e-05, 1.4377757906913757e-05, 1.5597790479660034e-05, 1.681782305240631e-05, 1.8037855625152588e-05, 1.9257888197898865e-05, 2.047792077064514e-05, 2.169795334339142e-05, 2.2917985916137695e-05, 2.4138018488883972e-05, 2.535805106163025e-05, 2.6578083634376526e-05, 2.7798116207122803e-05, 2.901814877986908e-05, 3.0238181352615356e-05, 3.145821392536163e-05, 3.267824649810791e-05, 3.389827907085419e-05, 3.5118311643600464e-05, 3.633834421634674e-05, 3.755837678909302e-05, 3.8778409361839294e-05, 3.999844193458557e-05, 4.121847450733185e-05, 4.2438507080078125e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 11.0, 18.0, 29.0, 34.0, 89.0, 184.0, 407.0, 957.0, 3586.0, 31584.0, 735521.0, 261322.0, 11436.0, 2063.0, 717.0, 285.0, 151.0, 57.0, 37.0, 13.0, 14.0, 11.0, 7.0, 10.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.013671875, -0.013300418853759766, -0.012928962707519531, -0.012557506561279297, -0.012186050415039062, -0.011814594268798828, -0.011443138122558594, -0.01107168197631836, -0.010700225830078125, -0.01032876968383789, -0.009957313537597656, -0.009585857391357422, -0.009214401245117188, -0.008842945098876953, -0.008471488952636719, -0.008100032806396484, -0.00772857666015625, -0.007357120513916016, -0.006985664367675781, -0.006614208221435547, -0.0062427520751953125, -0.005871295928955078, -0.005499839782714844, -0.005128383636474609, -0.004756927490234375, -0.004385471343994141, -0.004014015197753906, -0.003642559051513672, -0.0032711029052734375, -0.002899646759033203, -0.0025281906127929688, -0.0021567344665527344, -0.0017852783203125, -0.0014138221740722656, -0.0010423660278320312, -0.0006709098815917969, -0.0002994537353515625, 7.200241088867188e-05, 0.00044345855712890625, 0.0008149147033691406, 0.001186370849609375, 0.0015578269958496094, 0.0019292831420898438, 0.002300739288330078, 0.0026721954345703125, 0.003043651580810547, 0.0034151077270507812, 0.0037865638732910156, 0.00415802001953125, 0.004529476165771484, 0.004900932312011719, 0.005272388458251953, 0.0056438446044921875, 0.006015300750732422, 0.006386756896972656, 0.006758213043212891, 0.007129669189453125, 0.007501125335693359, 0.007872581481933594, 0.008244037628173828, 0.008615493774414062, 0.008986949920654297, 0.009358406066894531, 0.009729862213134766, 0.010101318359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 11.0, 10.0, 22.0, 33.0, 63.0, 135.0, 168.0, 162.0, 155.0, 96.0, 63.0, 44.0, 13.0, 15.0, 3.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017608642578125, -0.017150521278381348, -0.016692399978637695, -0.016234278678894043, -0.01577615737915039, -0.015318036079406738, -0.014859914779663086, -0.014401793479919434, -0.013943672180175781, -0.013485550880432129, -0.013027429580688477, -0.012569308280944824, -0.012111186981201172, -0.01165306568145752, -0.011194944381713867, -0.010736823081970215, -0.010278701782226562, -0.00982058048248291, -0.009362459182739258, -0.008904337882995605, -0.008446216583251953, -0.0079880952835083, -0.0075299739837646484, -0.007071852684020996, -0.006613731384277344, -0.006155610084533691, -0.005697488784790039, -0.005239367485046387, -0.004781246185302734, -0.004323124885559082, -0.0038650035858154297, -0.0034068822860717773, -0.002948760986328125, -0.0024906396865844727, -0.0020325183868408203, -0.001574397087097168, -0.0011162757873535156, -0.0006581544876098633, -0.00020003318786621094, 0.0002580881118774414, 0.0007162094116210938, 0.001174330711364746, 0.0016324520111083984, 0.0020905733108520508, 0.002548694610595703, 0.0030068159103393555, 0.003464937210083008, 0.00392305850982666, 0.0043811798095703125, 0.004839301109313965, 0.005297422409057617, 0.0057555437088012695, 0.006213665008544922, 0.006671786308288574, 0.0071299076080322266, 0.007588028907775879, 0.008046150207519531, 0.008504271507263184, 0.008962392807006836, 0.009420514106750488, 0.00987863540649414, 0.010336756706237793, 0.010794878005981445, 0.011252999305725098, 0.01171112060546875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 12.0, 19.0, 28.0, 73.0, 153.0, 227.0, 205.0, 148.0, 73.0, 33.0, 15.0, 9.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06512139737606049, -0.05953649431467056, -0.05395159125328064, -0.04836668819189072, -0.04278178513050079, -0.03719688206911087, -0.03161197900772095, -0.026027075946331024, -0.0204421728849411, -0.014857269823551178, -0.009272366762161255, -0.003687463700771332, 0.0018974393606185913, 0.007482342422008514, 0.013067245483398438, 0.01865214854478836, 0.024237051606178284, 0.029821954667568207, 0.03540685772895813, 0.04099176079034805, 0.046576663851737976, 0.0521615669131279, 0.05774646997451782, 0.06333137303590775, 0.06891627609729767, 0.07450117915868759, 0.08008608222007751, 0.08567098528146744, 0.09125588834285736, 0.09684079140424728, 0.10242569446563721, 0.10801059752702713, 0.11359548568725586, 0.11918038874864578, 0.1247652918100357, 0.13035020232200623, 0.13593509793281555, 0.14151999354362488, 0.1471049040555954, 0.15268981456756592, 0.15827471017837524, 0.16385960578918457, 0.1694445163011551, 0.1750294268131256, 0.18061432242393494, 0.18619921803474426, 0.19178412854671478, 0.1973690390586853, 0.20295393466949463, 0.20853883028030396, 0.21412374079227448, 0.219708651304245, 0.22529354691505432, 0.23087844252586365, 0.23646335303783417, 0.2420482635498047, 0.247633159160614, 0.25321805477142334, 0.25880295038223267, 0.2643878757953644, 0.2699727714061737, 0.27555766701698303, 0.28114259243011475, 0.2867274880409241, 0.2923123836517334]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 9.0, 9.0, 8.0, 7.0, 8.0, 9.0, 20.0, 20.0, 18.0, 19.0, 30.0, 27.0, 38.0, 39.0, 41.0, 41.0, 46.0, 53.0, 63.0, 50.0, 41.0, 50.0, 46.0, 38.0, 43.0, 30.0, 29.0, 32.0, 22.0, 24.0, 17.0, 9.0, 11.0, 8.0, 11.0, 10.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11191123723983765, -0.10828864574432373, -0.10466606169939041, -0.10104347765445709, -0.09742088615894318, -0.09379829466342926, -0.09017571061849594, -0.08655312657356262, -0.0829305350780487, -0.07930794358253479, -0.07568535953760147, -0.07206277549266815, -0.06844018399715424, -0.06481759250164032, -0.061195008456707, -0.05757242068648338, -0.053949832916259766, -0.05032724514603615, -0.04670465737581253, -0.04308206960558891, -0.039459481835365295, -0.03583689406514168, -0.03221430629491806, -0.028591718524694443, -0.024969130754470825, -0.021346542984247208, -0.01772395521402359, -0.014101367443799973, -0.010478779673576355, -0.006856191903352737, -0.00323360413312912, 0.0003889836370944977, 0.004011571407318115, 0.007634159177541733, 0.01125674694776535, 0.014879334717988968, 0.018501922488212585, 0.022124510258436203, 0.02574709802865982, 0.029369685798883438, 0.032992273569107056, 0.03661486133933067, 0.04023744910955429, 0.04386003687977791, 0.047482624650001526, 0.05110521242022514, 0.05472780019044876, 0.05835038796067238, 0.061972975730895996, 0.06559556722640991, 0.06921815127134323, 0.07284073531627655, 0.07646332681179047, 0.08008591830730438, 0.0837085023522377, 0.08733108639717102, 0.09095367789268494, 0.09457626938819885, 0.09819885343313217, 0.10182143747806549, 0.1054440289735794, 0.10906662046909332, 0.11268920451402664, 0.11631178855895996, 0.11993438005447388]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 8.0, 5.0, 11.0, 14.0, 21.0, 29.0, 28.0, 30.0, 49.0, 62.0, 105.0, 137.0, 264.0, 1190.0, 19721.0, 4163829.0, 7350.0, 714.0, 220.0, 128.0, 84.0, 54.0, 44.0, 40.0, 24.0, 22.0, 20.0, 17.0, 11.0, 16.0, 4.0, 7.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.055572509765625, -0.05380105972290039, -0.05202960968017578, -0.05025815963745117, -0.04848670959472656, -0.04671525955200195, -0.044943809509277344, -0.043172359466552734, -0.041400909423828125, -0.039629459381103516, -0.037858009338378906, -0.0360865592956543, -0.03431510925292969, -0.03254365921020508, -0.03077220916748047, -0.02900075912475586, -0.02722930908203125, -0.02545785903930664, -0.02368640899658203, -0.021914958953857422, -0.020143508911132812, -0.018372058868408203, -0.016600608825683594, -0.014829158782958984, -0.013057708740234375, -0.011286258697509766, -0.009514808654785156, -0.007743358612060547, -0.0059719085693359375, -0.004200458526611328, -0.0024290084838867188, -0.0006575584411621094, 0.0011138916015625, 0.0028853416442871094, 0.004656791687011719, 0.006428241729736328, 0.008199691772460938, 0.009971141815185547, 0.011742591857910156, 0.013514041900634766, 0.015285491943359375, 0.017056941986083984, 0.018828392028808594, 0.020599842071533203, 0.022371292114257812, 0.024142742156982422, 0.02591419219970703, 0.02768564224243164, 0.02945709228515625, 0.03122854232788086, 0.03299999237060547, 0.03477144241333008, 0.03654289245605469, 0.0383143424987793, 0.040085792541503906, 0.041857242584228516, 0.043628692626953125, 0.045400142669677734, 0.047171592712402344, 0.04894304275512695, 0.05071449279785156, 0.05248594284057617, 0.05425739288330078, 0.05602884292602539, 0.05780029296875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 10.0, 10.0, 6.0, 26.0, 20.0, 41.0, 45.0, 52.0, 60.0, 62.0, 68.0, 79.0, 73.0, 80.0, 69.0, 71.0, 52.0, 43.0, 30.0, 17.0, 21.0, 15.0, 12.0, 11.0, 8.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0112457275390625, -0.010895609855651855, -0.010545492172241211, -0.010195374488830566, -0.009845256805419922, -0.009495139122009277, -0.009145021438598633, -0.008794903755187988, -0.008444786071777344, -0.0080946683883667, -0.007744550704956055, -0.00739443302154541, -0.007044315338134766, -0.006694197654724121, -0.0063440799713134766, -0.005993962287902832, -0.0056438446044921875, -0.005293726921081543, -0.0049436092376708984, -0.004593491554260254, -0.004243373870849609, -0.003893256187438965, -0.0035431385040283203, -0.0031930208206176758, -0.0028429031372070312, -0.0024927854537963867, -0.002142667770385742, -0.0017925500869750977, -0.0014424324035644531, -0.0010923147201538086, -0.0007421970367431641, -0.00039207935333251953, -4.1961669921875e-05, 0.00030815601348876953, 0.0006582736968994141, 0.0010083913803100586, 0.0013585090637207031, 0.0017086267471313477, 0.002058744430541992, 0.0024088621139526367, 0.0027589797973632812, 0.0031090974807739258, 0.0034592151641845703, 0.003809332847595215, 0.004159450531005859, 0.004509568214416504, 0.0048596858978271484, 0.005209803581237793, 0.0055599212646484375, 0.005910038948059082, 0.0062601566314697266, 0.006610274314880371, 0.006960391998291016, 0.00731050968170166, 0.007660627365112305, 0.00801074504852295, 0.008360862731933594, 0.008710980415344238, 0.009061098098754883, 0.009411215782165527, 0.009761333465576172, 0.010111451148986816, 0.010461568832397461, 0.010811686515808105, 0.01116180419921875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 8.0, 5.0, 6.0, 8.0, 7.0, 16.0, 19.0, 32.0, 45.0, 47.0, 60.0, 90.0, 116.0, 168.0, 250.0, 434.0, 826.0, 2021.0, 7761.0, 63252.0, 4076242.0, 33925.0, 5428.0, 1595.0, 678.0, 343.0, 259.0, 162.0, 123.0, 93.0, 60.0, 62.0, 44.0, 32.0, 18.0, 14.0, 17.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0226593017578125, -0.02193737030029297, -0.021215438842773438, -0.020493507385253906, -0.019771575927734375, -0.019049644470214844, -0.018327713012695312, -0.01760578155517578, -0.01688385009765625, -0.01616191864013672, -0.015439987182617188, -0.014718055725097656, -0.013996124267578125, -0.013274192810058594, -0.012552261352539062, -0.011830329895019531, -0.0111083984375, -0.010386466979980469, -0.009664535522460938, -0.008942604064941406, -0.008220672607421875, -0.007498741149902344, -0.0067768096923828125, -0.006054878234863281, -0.00533294677734375, -0.004611015319824219, -0.0038890838623046875, -0.0031671524047851562, -0.002445220947265625, -0.0017232894897460938, -0.0010013580322265625, -0.00027942657470703125, 0.0004425048828125, 0.0011644363403320312, 0.0018863677978515625, 0.0026082992553710938, 0.003330230712890625, 0.004052162170410156, 0.0047740936279296875, 0.005496025085449219, 0.00621795654296875, 0.006939888000488281, 0.0076618194580078125, 0.008383750915527344, 0.009105682373046875, 0.009827613830566406, 0.010549545288085938, 0.011271476745605469, 0.011993408203125, 0.012715339660644531, 0.013437271118164062, 0.014159202575683594, 0.014881134033203125, 0.015603065490722656, 0.016324996948242188, 0.01704692840576172, 0.01776885986328125, 0.01849079132080078, 0.019212722778320312, 0.019934654235839844, 0.020656585693359375, 0.021378517150878906, 0.022100448608398438, 0.02282238006591797, 0.0235443115234375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 15.0, 41.0, 276.0, 3646.0, 58.0, 26.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0102386474609375, -0.009910345077514648, -0.009582042694091797, -0.009253740310668945, -0.008925437927246094, -0.008597135543823242, -0.00826883316040039, -0.007940530776977539, -0.0076122283935546875, -0.007283926010131836, -0.006955623626708984, -0.006627321243286133, -0.006299018859863281, -0.00597071647644043, -0.005642414093017578, -0.0053141117095947266, -0.004985809326171875, -0.0046575069427490234, -0.004329204559326172, -0.00400090217590332, -0.0036725997924804688, -0.003344297409057617, -0.0030159950256347656, -0.002687692642211914, -0.0023593902587890625, -0.002031087875366211, -0.0017027854919433594, -0.0013744831085205078, -0.0010461807250976562, -0.0007178783416748047, -0.0003895759582519531, -6.127357482910156e-05, 0.00026702880859375, 0.0005953311920166016, 0.0009236335754394531, 0.0012519359588623047, 0.0015802383422851562, 0.0019085407257080078, 0.0022368431091308594, 0.002565145492553711, 0.0028934478759765625, 0.003221750259399414, 0.0035500526428222656, 0.003878355026245117, 0.004206657409667969, 0.00453495979309082, 0.004863262176513672, 0.0051915645599365234, 0.005519866943359375, 0.0058481693267822266, 0.006176471710205078, 0.00650477409362793, 0.006833076477050781, 0.007161378860473633, 0.007489681243896484, 0.007817983627319336, 0.008146286010742188, 0.008474588394165039, 0.00880289077758789, 0.009131193161010742, 0.009459495544433594, 0.009787797927856445, 0.010116100311279297, 0.010444402694702148, 0.010772705078125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 7.0, 19.0, 58.0, 241.0, 417.0, 200.0, 45.0, 9.0, 10.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043829768896102905, -0.04223943129181862, -0.040649089962244034, -0.03905875235795975, -0.03746841475367546, -0.035878077149391174, -0.03428773581981659, -0.0326973982155323, -0.031107060611248016, -0.02951672114431858, -0.027926383540034294, -0.02633604407310486, -0.024745706468820572, -0.023155367001891136, -0.0215650275349617, -0.019974689930677414, -0.018384350463747978, -0.016794010996818542, -0.015203673392534256, -0.01361333392560482, -0.012022996321320534, -0.010432656854391098, -0.008842318318784237, -0.007251979783177376, -0.005661641247570515, -0.0040713027119636536, -0.002480963943526149, -0.000890625175088644, 0.0006997133605182171, 0.0022900523617863655, 0.0038803908973932266, 0.005470729433000088, 0.007061067968606949, 0.00865140650421381, 0.010241745039820671, 0.011832084506750107, 0.013422422111034393, 0.015012761577963829, 0.016603101044893265, 0.01819343864917755, 0.019783776253461838, 0.021374115720391273, 0.02296445332467556, 0.024554792791604996, 0.026145130395889282, 0.027735469862818718, 0.029325809329748154, 0.03091614693403244, 0.032506488263607025, 0.03409682586789131, 0.0356871671974659, 0.03727750480175018, 0.03886784240603447, 0.040458180010318756, 0.04204852133989334, 0.04363885894417763, 0.045229196548461914, 0.0468195341527462, 0.048409875482320786, 0.05000021308660507, 0.05159055069088936, 0.053180888295173645, 0.05477122962474823, 0.056361567229032516, 0.0579519048333168]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 8.0, 8.0, 9.0, 13.0, 13.0, 16.0, 20.0, 22.0, 23.0, 25.0, 30.0, 34.0, 34.0, 34.0, 40.0, 39.0, 40.0, 47.0, 48.0, 35.0, 46.0, 35.0, 41.0, 40.0, 45.0, 35.0, 29.0, 24.0, 27.0, 29.0, 14.0, 23.0, 14.0, 10.0, 19.0, 7.0, 9.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007561683654785156, -0.007277561351656914, -0.006993439048528671, -0.006709316745400429, -0.006425194442272186, -0.006141072139143944, -0.005856949836015701, -0.005572827532887459, -0.005288705229759216, -0.005004582926630974, -0.004720460623502731, -0.004436338320374489, -0.004152216017246246, -0.003868093714118004, -0.0035839714109897614, -0.003299849107861519, -0.0030157268047332764, -0.002731604501605034, -0.0024474821984767914, -0.002163359895348549, -0.0018792375922203064, -0.001595115289092064, -0.0013109929859638214, -0.001026870682835579, -0.0007427483797073364, -0.00045862607657909393, -0.00017450377345085144, 0.00010961852967739105, 0.00039374083280563354, 0.000677863135933876, 0.0009619854390621185, 0.001246107742190361, 0.0015302300453186035, 0.001814352348446846, 0.0020984746515750885, 0.002382596954703331, 0.0026667192578315735, 0.002950841560959816, 0.0032349638640880585, 0.003519086167216301, 0.0038032084703445435, 0.004087330773472786, 0.0043714530766010284, 0.004655575379729271, 0.004939697682857513, 0.005223819985985756, 0.005507942289113998, 0.005792064592242241, 0.006076186895370483, 0.006360309198498726, 0.006644431501626968, 0.006928553804755211, 0.007212676107883453, 0.007496798411011696, 0.007780920714139938, 0.00806504301726818, 0.008349165320396423, 0.008633287623524666, 0.008917409926652908, 0.00920153222978115, 0.009485654532909393, 0.009769776836037636, 0.010053899139165878, 0.01033802144229412, 0.010622143745422363]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 5.0, 7.0, 4.0, 7.0, 5.0, 10.0, 14.0, 14.0, 22.0, 26.0, 41.0, 45.0, 62.0, 107.0, 161.0, 222.0, 377.0, 590.0, 961.0, 1674.0, 3019.0, 6610.0, 16765.0, 51856.0, 173009.0, 384996.0, 272527.0, 88731.0, 27354.0, 9678.0, 4222.0, 2143.0, 1199.0, 716.0, 464.0, 279.0, 220.0, 121.0, 74.0, 54.0, 40.0, 27.0, 30.0, 14.0, 10.0, 7.0, 11.0, 7.0, 2.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0], "bins": [-0.01042938232421875, -0.010100603103637695, -0.00977182388305664, -0.009443044662475586, -0.009114265441894531, -0.008785486221313477, -0.008456707000732422, -0.008127927780151367, -0.0077991485595703125, -0.007470369338989258, -0.007141590118408203, -0.0068128108978271484, -0.006484031677246094, -0.006155252456665039, -0.005826473236083984, -0.00549769401550293, -0.005168914794921875, -0.00484013557434082, -0.004511356353759766, -0.004182577133178711, -0.0038537979125976562, -0.0035250186920166016, -0.003196239471435547, -0.002867460250854492, -0.0025386810302734375, -0.002209901809692383, -0.0018811225891113281, -0.0015523433685302734, -0.0012235641479492188, -0.0008947849273681641, -0.0005660057067871094, -0.0002372264862060547, 9.1552734375e-05, 0.0004203319549560547, 0.0007491111755371094, 0.001077890396118164, 0.0014066696166992188, 0.0017354488372802734, 0.002064228057861328, 0.002393007278442383, 0.0027217864990234375, 0.003050565719604492, 0.003379344940185547, 0.0037081241607666016, 0.004036903381347656, 0.004365682601928711, 0.004694461822509766, 0.00502324104309082, 0.005352020263671875, 0.00568079948425293, 0.006009578704833984, 0.006338357925415039, 0.006667137145996094, 0.0069959163665771484, 0.007324695587158203, 0.007653474807739258, 0.007982254028320312, 0.008311033248901367, 0.008639812469482422, 0.008968591690063477, 0.009297370910644531, 0.009626150131225586, 0.00995492935180664, 0.010283708572387695, 0.01061248779296875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 8.0, 8.0, 13.0, 24.0, 23.0, 38.0, 44.0, 47.0, 61.0, 61.0, 57.0, 75.0, 78.0, 72.0, 69.0, 61.0, 61.0, 46.0, 25.0, 29.0, 27.0, 11.0, 14.0, 17.0, 9.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0114898681640625, -0.011134624481201172, -0.010779380798339844, -0.010424137115478516, -0.010068893432617188, -0.00971364974975586, -0.009358406066894531, -0.009003162384033203, -0.008647918701171875, -0.008292675018310547, -0.007937431335449219, -0.007582187652587891, -0.0072269439697265625, -0.006871700286865234, -0.006516456604003906, -0.006161212921142578, -0.00580596923828125, -0.005450725555419922, -0.005095481872558594, -0.004740238189697266, -0.0043849945068359375, -0.004029750823974609, -0.0036745071411132812, -0.003319263458251953, -0.002964019775390625, -0.002608776092529297, -0.0022535324096679688, -0.0018982887268066406, -0.0015430450439453125, -0.0011878013610839844, -0.0008325576782226562, -0.0004773139953613281, -0.0001220703125, 0.00023317337036132812, 0.0005884170532226562, 0.0009436607360839844, 0.0012989044189453125, 0.0016541481018066406, 0.0020093917846679688, 0.002364635467529297, 0.002719879150390625, 0.003075122833251953, 0.0034303665161132812, 0.0037856101989746094, 0.0041408538818359375, 0.004496097564697266, 0.004851341247558594, 0.005206584930419922, 0.00556182861328125, 0.005917072296142578, 0.006272315979003906, 0.006627559661865234, 0.0069828033447265625, 0.007338047027587891, 0.007693290710449219, 0.008048534393310547, 0.008403778076171875, 0.008759021759033203, 0.009114265441894531, 0.00946950912475586, 0.009824752807617188, 0.010179996490478516, 0.010535240173339844, 0.010890483856201172, 0.0112457275390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 10.0, 8.0, 17.0, 21.0, 39.0, 50.0, 70.0, 104.0, 150.0, 236.0, 385.0, 727.0, 1389.0, 3331.0, 10541.0, 76245.0, 724587.0, 202902.0, 18874.0, 4737.0, 1838.0, 933.0, 519.0, 280.0, 181.0, 107.0, 66.0, 55.0, 39.0, 34.0, 10.0, 15.0, 8.0, 12.0, 5.0, 3.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196685791015625, -0.01904773712158203, -0.018426895141601562, -0.017806053161621094, -0.017185211181640625, -0.016564369201660156, -0.015943527221679688, -0.015322685241699219, -0.01470184326171875, -0.014081001281738281, -0.013460159301757812, -0.012839317321777344, -0.012218475341796875, -0.011597633361816406, -0.010976791381835938, -0.010355949401855469, -0.009735107421875, -0.009114265441894531, -0.008493423461914062, -0.007872581481933594, -0.007251739501953125, -0.006630897521972656, -0.0060100555419921875, -0.005389213562011719, -0.00476837158203125, -0.004147529602050781, -0.0035266876220703125, -0.0029058456420898438, -0.002285003662109375, -0.0016641616821289062, -0.0010433197021484375, -0.00042247772216796875, 0.0001983642578125, 0.0008192062377929688, 0.0014400482177734375, 0.0020608901977539062, 0.002681732177734375, 0.0033025741577148438, 0.0039234161376953125, 0.004544258117675781, 0.00516510009765625, 0.005785942077636719, 0.0064067840576171875, 0.007027626037597656, 0.007648468017578125, 0.008269309997558594, 0.008890151977539062, 0.009510993957519531, 0.0101318359375, 0.010752677917480469, 0.011373519897460938, 0.011994361877441406, 0.012615203857421875, 0.013236045837402344, 0.013856887817382812, 0.014477729797363281, 0.01509857177734375, 0.01571941375732422, 0.016340255737304688, 0.016961097717285156, 0.017581939697265625, 0.018202781677246094, 0.018823623657226562, 0.01944446563720703, 0.0200653076171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 11.0, 8.0, 11.0, 15.0, 20.0, 21.0, 33.0, 23.0, 32.0, 35.0, 39.0, 60.0, 52.0, 62.0, 52.0, 53.0, 61.0, 57.0, 53.0, 46.0, 35.0, 41.0, 38.0, 21.0, 27.0, 23.0, 17.0, 14.0, 12.0, 3.0, 9.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0345458984375, -0.03341341018676758, -0.032280921936035156, -0.031148433685302734, -0.030015945434570312, -0.02888345718383789, -0.02775096893310547, -0.026618480682373047, -0.025485992431640625, -0.024353504180908203, -0.02322101593017578, -0.02208852767944336, -0.020956039428710938, -0.019823551177978516, -0.018691062927246094, -0.017558574676513672, -0.01642608642578125, -0.015293598175048828, -0.014161109924316406, -0.013028621673583984, -0.011896133422851562, -0.01076364517211914, -0.009631156921386719, -0.008498668670654297, -0.007366180419921875, -0.006233692169189453, -0.005101203918457031, -0.003968715667724609, -0.0028362274169921875, -0.0017037391662597656, -0.0005712509155273438, 0.0005612373352050781, 0.0016937255859375, 0.002826213836669922, 0.003958702087402344, 0.005091190338134766, 0.0062236785888671875, 0.007356166839599609, 0.008488655090332031, 0.009621143341064453, 0.010753631591796875, 0.011886119842529297, 0.013018608093261719, 0.01415109634399414, 0.015283584594726562, 0.016416072845458984, 0.017548561096191406, 0.018681049346923828, 0.01981353759765625, 0.020946025848388672, 0.022078514099121094, 0.023211002349853516, 0.024343490600585938, 0.02547597885131836, 0.02660846710205078, 0.027740955352783203, 0.028873443603515625, 0.030005931854248047, 0.03113842010498047, 0.03227090835571289, 0.03340339660644531, 0.034535884857177734, 0.035668373107910156, 0.03680086135864258, 0.037933349609375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 8.0, 4.0, 3.0, 15.0, 19.0, 18.0, 21.0, 34.0, 37.0, 72.0, 109.0, 166.0, 267.0, 440.0, 962.0, 2219.0, 6360.0, 104578.0, 912457.0, 14186.0, 3467.0, 1427.0, 710.0, 353.0, 218.0, 148.0, 72.0, 53.0, 37.0, 27.0, 14.0, 7.0, 12.0, 8.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.027862548828125, -0.027133703231811523, -0.026404857635498047, -0.02567601203918457, -0.024947166442871094, -0.024218320846557617, -0.02348947525024414, -0.022760629653930664, -0.022031784057617188, -0.02130293846130371, -0.020574092864990234, -0.019845247268676758, -0.01911640167236328, -0.018387556076049805, -0.017658710479736328, -0.01692986488342285, -0.016201019287109375, -0.015472173690795898, -0.014743328094482422, -0.014014482498168945, -0.013285636901855469, -0.012556791305541992, -0.011827945709228516, -0.011099100112915039, -0.010370254516601562, -0.009641408920288086, -0.00891256332397461, -0.008183717727661133, -0.007454872131347656, -0.00672602653503418, -0.005997180938720703, -0.0052683353424072266, -0.00453948974609375, -0.0038106441497802734, -0.003081798553466797, -0.0023529529571533203, -0.0016241073608398438, -0.0008952617645263672, -0.00016641616821289062, 0.0005624294281005859, 0.0012912750244140625, 0.002020120620727539, 0.0027489662170410156, 0.003477811813354492, 0.004206657409667969, 0.004935503005981445, 0.005664348602294922, 0.0063931941986083984, 0.007122039794921875, 0.007850885391235352, 0.008579730987548828, 0.009308576583862305, 0.010037422180175781, 0.010766267776489258, 0.011495113372802734, 0.012223958969116211, 0.012952804565429688, 0.013681650161743164, 0.01441049575805664, 0.015139341354370117, 0.015868186950683594, 0.01659703254699707, 0.017325878143310547, 0.018054723739624023, 0.0187835693359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 10.0, 10.0, 4.0, 14.0, 14.0, 27.0, 35.0, 42.0, 72.0, 85.0, 134.0, 151.0, 123.0, 79.0, 64.0, 37.0, 31.0, 23.0, 12.0, 8.0, 4.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984306335449219e-05, -5.7806260883808136e-05, -5.5769458413124084e-05, -5.373265594244003e-05, -5.169585347175598e-05, -4.965905100107193e-05, -4.762224853038788e-05, -4.558544605970383e-05, -4.3548643589019775e-05, -4.1511841118335724e-05, -3.947503864765167e-05, -3.743823617696762e-05, -3.540143370628357e-05, -3.336463123559952e-05, -3.1327828764915466e-05, -2.9291026294231415e-05, -2.7254223823547363e-05, -2.5217421352863312e-05, -2.318061888217926e-05, -2.114381641149521e-05, -1.9107013940811157e-05, -1.7070211470127106e-05, -1.5033408999443054e-05, -1.2996606528759003e-05, -1.0959804058074951e-05, -8.9230015873909e-06, -6.886199116706848e-06, -4.849396646022797e-06, -2.812594175338745e-06, -7.757917046546936e-07, 1.261010766029358e-06, 3.2978132367134094e-06, 5.334615707397461e-06, 7.3714181780815125e-06, 9.408220648765564e-06, 1.1445023119449615e-05, 1.3481825590133667e-05, 1.551862806081772e-05, 1.755543053150177e-05, 1.959223300218582e-05, 2.1629035472869873e-05, 2.3665837943553925e-05, 2.5702640414237976e-05, 2.7739442884922028e-05, 2.977624535560608e-05, 3.181304782629013e-05, 3.384985029697418e-05, 3.5886652767658234e-05, 3.7923455238342285e-05, 3.996025770902634e-05, 4.199706017971039e-05, 4.403386265039444e-05, 4.607066512107849e-05, 4.810746759176254e-05, 5.0144270062446594e-05, 5.2181072533130646e-05, 5.42178750038147e-05, 5.625467747449875e-05, 5.82914799451828e-05, 6.032828241586685e-05, 6.23650848865509e-05, 6.440188735723495e-05, 6.6438689827919e-05, 6.847549229860306e-05, 7.051229476928711e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 13.0, 12.0, 25.0, 40.0, 52.0, 92.0, 152.0, 254.0, 510.0, 981.0, 2325.0, 6759.0, 112213.0, 901373.0, 17106.0, 3597.0, 1480.0, 661.0, 341.0, 198.0, 129.0, 76.0, 35.0, 36.0, 21.0, 15.0, 5.0, 7.0, 4.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01873779296875, -0.018074512481689453, -0.017411231994628906, -0.01674795150756836, -0.016084671020507812, -0.015421390533447266, -0.014758110046386719, -0.014094829559326172, -0.013431549072265625, -0.012768268585205078, -0.012104988098144531, -0.011441707611083984, -0.010778427124023438, -0.01011514663696289, -0.009451866149902344, -0.008788585662841797, -0.00812530517578125, -0.007462024688720703, -0.006798744201660156, -0.006135463714599609, -0.0054721832275390625, -0.004808902740478516, -0.004145622253417969, -0.003482341766357422, -0.002819061279296875, -0.002155780792236328, -0.0014925003051757812, -0.0008292198181152344, -0.0001659393310546875, 0.0004973411560058594, 0.0011606216430664062, 0.0018239021301269531, 0.0024871826171875, 0.003150463104248047, 0.0038137435913085938, 0.004477024078369141, 0.0051403045654296875, 0.005803585052490234, 0.006466865539550781, 0.007130146026611328, 0.007793426513671875, 0.008456707000732422, 0.009119987487792969, 0.009783267974853516, 0.010446548461914062, 0.01110982894897461, 0.011773109436035156, 0.012436389923095703, 0.01309967041015625, 0.013762950897216797, 0.014426231384277344, 0.01508951187133789, 0.015752792358398438, 0.016416072845458984, 0.01707935333251953, 0.017742633819580078, 0.018405914306640625, 0.019069194793701172, 0.01973247528076172, 0.020395755767822266, 0.021059036254882812, 0.02172231674194336, 0.022385597229003906, 0.023048877716064453, 0.023712158203125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 9.0, 25.0, 165.0, 571.0, 155.0, 25.0, 8.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07025146484375, -0.06842756271362305, -0.0666036605834961, -0.06477975845336914, -0.06295585632324219, -0.061131954193115234, -0.05930805206298828, -0.05748414993286133, -0.055660247802734375, -0.05383634567260742, -0.05201244354248047, -0.050188541412353516, -0.04836463928222656, -0.04654073715209961, -0.044716835021972656, -0.0428929328918457, -0.04106903076171875, -0.0392451286315918, -0.037421226501464844, -0.03559732437133789, -0.03377342224121094, -0.031949520111083984, -0.03012561798095703, -0.028301715850830078, -0.026477813720703125, -0.024653911590576172, -0.02283000946044922, -0.021006107330322266, -0.019182205200195312, -0.01735830307006836, -0.015534400939941406, -0.013710498809814453, -0.0118865966796875, -0.010062694549560547, -0.008238792419433594, -0.006414890289306641, -0.0045909881591796875, -0.0027670860290527344, -0.0009431838989257812, 0.0008807182312011719, 0.002704620361328125, 0.004528522491455078, 0.006352424621582031, 0.008176326751708984, 0.010000228881835938, 0.01182413101196289, 0.013648033142089844, 0.015471935272216797, 0.01729583740234375, 0.019119739532470703, 0.020943641662597656, 0.02276754379272461, 0.024591445922851562, 0.026415348052978516, 0.02823925018310547, 0.030063152313232422, 0.031887054443359375, 0.03371095657348633, 0.03553485870361328, 0.037358760833740234, 0.03918266296386719, 0.04100656509399414, 0.042830467224121094, 0.04465436935424805, 0.046478271484375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 16.0, 22.0, 24.0, 42.0, 73.0, 125.0, 159.0, 216.0, 172.0, 88.0, 24.0, 19.0, 10.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2453514188528061, -0.23803828656673431, -0.23072515428066254, -0.22341202199459076, -0.2160988748073578, -0.208785742521286, -0.20147261023521423, -0.19415947794914246, -0.18684634566307068, -0.1795332133769989, -0.17222008109092712, -0.16490694880485535, -0.15759381651878357, -0.1502806842327118, -0.14296753704547882, -0.13565440475940704, -0.12834127247333527, -0.12102814018726349, -0.11371500790119171, -0.10640186816453934, -0.09908873587846756, -0.09177560359239578, -0.08446246385574341, -0.07714933156967163, -0.06983619928359985, -0.06252306699752808, -0.055209930986166, -0.047896794974803925, -0.04058366268873215, -0.03327053040266037, -0.025957394391298294, -0.018644258379936218, -0.011331140995025635, -0.004018006846308708, 0.0032951273024082184, 0.010608261451125145, 0.01792139559984207, 0.02523452788591385, 0.032547663897275925, 0.039860799908638, 0.04717393219470978, 0.054487064480781555, 0.06180020049214363, 0.0691133365035057, 0.07642646878957748, 0.08373960107564926, 0.09105274081230164, 0.09836587309837341, 0.10567900538444519, 0.11299213767051697, 0.12030526995658875, 0.12761840224266052, 0.1349315345287323, 0.14224466681480408, 0.14955781400203705, 0.15687094628810883, 0.1641840785741806, 0.17149721086025238, 0.17881034314632416, 0.18612347543239594, 0.1934366226196289, 0.20074975490570068, 0.20806288719177246, 0.21537601947784424, 0.22268915176391602]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 7.0, 11.0, 5.0, 9.0, 11.0, 8.0, 16.0, 21.0, 25.0, 18.0, 26.0, 35.0, 43.0, 40.0, 40.0, 52.0, 53.0, 50.0, 57.0, 49.0, 46.0, 51.0, 44.0, 43.0, 43.0, 35.0, 22.0, 26.0, 14.0, 17.0, 25.0, 21.0, 12.0, 6.0, 4.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.19137269258499146, -0.1856820285320282, -0.17999134957790375, -0.1743006855249405, -0.16861000657081604, -0.16291934251785278, -0.15722867846488953, -0.15153801441192627, -0.14584733545780182, -0.14015667140483856, -0.1344659924507141, -0.12877532839775085, -0.123084656894207, -0.11739398539066315, -0.11170332133769989, -0.10601264983415604, -0.10032197833061218, -0.09463130682706833, -0.08894063532352448, -0.08324997127056122, -0.07755929976701736, -0.07186862826347351, -0.06617796421051025, -0.0604872927069664, -0.054796621203422546, -0.04910594969987869, -0.04341528192162514, -0.03772461414337158, -0.03203394263982773, -0.026343272998929024, -0.02065260335803032, -0.014961935579776764, -0.00927126407623291, -0.0035805944353342056, 0.002110075205564499, 0.007800744846463203, 0.013491414487361908, 0.019182084128260612, 0.024872753769159317, 0.030563421547412872, 0.036254093050956726, 0.04194476455450058, 0.047635432332754135, 0.05332610011100769, 0.059016771614551544, 0.0647074431180954, 0.07039810717105865, 0.07608877867460251, 0.08177945017814636, 0.08747012168169022, 0.09316079318523407, 0.09885145723819733, 0.10454212874174118, 0.11023280024528503, 0.11592346429824829, 0.12161413580179214, 0.127304807305336, 0.13299547135829926, 0.1386861503124237, 0.14437681436538696, 0.15006747841835022, 0.15575815737247467, 0.16144882142543793, 0.16713950037956238, 0.17283016443252563]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 6.0, 8.0, 9.0, 21.0, 11.0, 22.0, 28.0, 44.0, 57.0, 117.0, 128.0, 213.0, 356.0, 778.0, 1924.0, 8189.0, 130059.0, 4026011.0, 20309.0, 3491.0, 1152.0, 487.0, 277.0, 176.0, 112.0, 75.0, 60.0, 49.0, 23.0, 16.0, 21.0, 14.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.025238037109375, -0.02434396743774414, -0.02344989776611328, -0.022555828094482422, -0.021661758422851562, -0.020767688751220703, -0.019873619079589844, -0.018979549407958984, -0.018085479736328125, -0.017191410064697266, -0.016297340393066406, -0.015403270721435547, -0.014509201049804688, -0.013615131378173828, -0.012721061706542969, -0.01182699203491211, -0.01093292236328125, -0.01003885269165039, -0.009144783020019531, -0.008250713348388672, -0.0073566436767578125, -0.006462574005126953, -0.005568504333496094, -0.004674434661865234, -0.003780364990234375, -0.0028862953186035156, -0.0019922256469726562, -0.0010981559753417969, -0.0002040863037109375, 0.0006899833679199219, 0.0015840530395507812, 0.0024781227111816406, 0.0033721923828125, 0.004266262054443359, 0.005160331726074219, 0.006054401397705078, 0.0069484710693359375, 0.007842540740966797, 0.008736610412597656, 0.009630680084228516, 0.010524749755859375, 0.011418819427490234, 0.012312889099121094, 0.013206958770751953, 0.014101028442382812, 0.014995098114013672, 0.01588916778564453, 0.01678323745727539, 0.01767730712890625, 0.01857137680053711, 0.01946544647216797, 0.020359516143798828, 0.021253585815429688, 0.022147655487060547, 0.023041725158691406, 0.023935794830322266, 0.024829864501953125, 0.025723934173583984, 0.026618003845214844, 0.027512073516845703, 0.028406143188476562, 0.029300212860107422, 0.03019428253173828, 0.03108835220336914, 0.031982421875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 6.0, 8.0, 13.0, 25.0, 26.0, 25.0, 36.0, 42.0, 42.0, 61.0, 53.0, 65.0, 60.0, 75.0, 72.0, 76.0, 73.0, 54.0, 48.0, 34.0, 27.0, 15.0, 13.0, 11.0, 6.0, 9.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.011749267578125, -0.011382579803466797, -0.011015892028808594, -0.01064920425415039, -0.010282516479492188, -0.009915828704833984, -0.009549140930175781, -0.009182453155517578, -0.008815765380859375, -0.008449077606201172, -0.008082389831542969, -0.007715702056884766, -0.0073490142822265625, -0.006982326507568359, -0.006615638732910156, -0.006248950958251953, -0.00588226318359375, -0.005515575408935547, -0.005148887634277344, -0.004782199859619141, -0.0044155120849609375, -0.004048824310302734, -0.0036821365356445312, -0.003315448760986328, -0.002948760986328125, -0.002582073211669922, -0.0022153854370117188, -0.0018486976623535156, -0.0014820098876953125, -0.0011153221130371094, -0.0007486343383789062, -0.0003819465637207031, -1.52587890625e-05, 0.0003514289855957031, 0.0007181167602539062, 0.0010848045349121094, 0.0014514923095703125, 0.0018181800842285156, 0.0021848678588867188, 0.002551555633544922, 0.002918243408203125, 0.003284931182861328, 0.0036516189575195312, 0.004018306732177734, 0.0043849945068359375, 0.004751682281494141, 0.005118370056152344, 0.005485057830810547, 0.00585174560546875, 0.006218433380126953, 0.006585121154785156, 0.006951808929443359, 0.0073184967041015625, 0.007685184478759766, 0.008051872253417969, 0.008418560028076172, 0.008785247802734375, 0.009151935577392578, 0.009518623352050781, 0.009885311126708984, 0.010251998901367188, 0.01061868667602539, 0.010985374450683594, 0.011352062225341797, 0.01171875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 5.0, 10.0, 17.0, 16.0, 26.0, 35.0, 43.0, 65.0, 79.0, 106.0, 164.0, 250.0, 556.0, 2839.0, 3088217.0, 1097657.0, 2703.0, 617.0, 292.0, 161.0, 104.0, 81.0, 59.0, 48.0, 36.0, 33.0, 21.0, 8.0, 8.0, 7.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08837890625, -0.08577919006347656, -0.08317947387695312, -0.08057975769042969, -0.07798004150390625, -0.07538032531738281, -0.07278060913085938, -0.07018089294433594, -0.0675811767578125, -0.06498146057128906, -0.062381744384765625, -0.05978202819824219, -0.05718231201171875, -0.05458259582519531, -0.051982879638671875, -0.04938316345214844, -0.046783447265625, -0.04418373107910156, -0.041584014892578125, -0.03898429870605469, -0.03638458251953125, -0.03378486633300781, -0.031185150146484375, -0.028585433959960938, -0.0259857177734375, -0.023386001586914062, -0.020786285400390625, -0.018186569213867188, -0.01558685302734375, -0.012987136840820312, -0.010387420654296875, -0.0077877044677734375, -0.00518798828125, -0.0025882720947265625, 1.1444091796875e-05, 0.0026111602783203125, 0.00521087646484375, 0.0078105926513671875, 0.010410308837890625, 0.013010025024414062, 0.0156097412109375, 0.018209457397460938, 0.020809173583984375, 0.023408889770507812, 0.02600860595703125, 0.028608322143554688, 0.031208038330078125, 0.03380775451660156, 0.036407470703125, 0.03900718688964844, 0.041606903076171875, 0.04420661926269531, 0.04680633544921875, 0.04940605163574219, 0.052005767822265625, 0.05460548400878906, 0.0572052001953125, 0.05980491638183594, 0.062404632568359375, 0.06500434875488281, 0.06760406494140625, 0.07020378112792969, 0.07280349731445312, 0.07540321350097656, 0.0780029296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 27.0, 113.0, 3807.0, 95.0, 18.0, 13.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.045654296875, -0.044499874114990234, -0.04334545135498047, -0.0421910285949707, -0.04103660583496094, -0.03988218307495117, -0.038727760314941406, -0.03757333755493164, -0.036418914794921875, -0.03526449203491211, -0.034110069274902344, -0.03295564651489258, -0.03180122375488281, -0.030646800994873047, -0.02949237823486328, -0.028337955474853516, -0.02718353271484375, -0.026029109954833984, -0.02487468719482422, -0.023720264434814453, -0.022565841674804688, -0.021411418914794922, -0.020256996154785156, -0.01910257339477539, -0.017948150634765625, -0.01679372787475586, -0.015639305114746094, -0.014484882354736328, -0.013330459594726562, -0.012176036834716797, -0.011021614074707031, -0.009867191314697266, -0.0087127685546875, -0.007558345794677734, -0.006403923034667969, -0.005249500274658203, -0.0040950775146484375, -0.002940654754638672, -0.0017862319946289062, -0.0006318092346191406, 0.000522613525390625, 0.0016770362854003906, 0.0028314590454101562, 0.003985881805419922, 0.0051403045654296875, 0.006294727325439453, 0.007449150085449219, 0.008603572845458984, 0.00975799560546875, 0.010912418365478516, 0.012066841125488281, 0.013221263885498047, 0.014375686645507812, 0.015530109405517578, 0.016684532165527344, 0.01783895492553711, 0.018993377685546875, 0.02014780044555664, 0.021302223205566406, 0.022456645965576172, 0.023611068725585938, 0.024765491485595703, 0.02591991424560547, 0.027074337005615234, 0.028228759765625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 6.0, 7.0, 16.0, 24.0, 28.0, 45.0, 80.0, 112.0, 177.0, 186.0, 125.0, 95.0, 37.0, 27.0, 11.0, 11.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0940178856253624, -0.09185920655727386, -0.08970052003860474, -0.0875418409705162, -0.08538316190242767, -0.08322447538375854, -0.08106579631567001, -0.07890711724758148, -0.07674843072891235, -0.07458975166082382, -0.0724310651421547, -0.07027238607406616, -0.06811370700597763, -0.0659550279378891, -0.06379634141921997, -0.06163766235113144, -0.05947898328304291, -0.05732030048966408, -0.055161621421575546, -0.053002938628196716, -0.050844259560108185, -0.048685576766729355, -0.046526893973350525, -0.04436821490526199, -0.04220953211188316, -0.040050849318504333, -0.0378921702504158, -0.03573348745703697, -0.03357480466365814, -0.03141612559556961, -0.02925744280219078, -0.0270987618714571, -0.02494008094072342, -0.02278140000998974, -0.020622719079256058, -0.018464036285877228, -0.016305355355143547, -0.014146674424409866, -0.011987992562353611, -0.009829310700297356, -0.007670629769563675, -0.005511948373168707, -0.003353266976773739, -0.0011945855803787708, 0.0009640958160161972, 0.003122776746749878, 0.005281458608806133, 0.007440140470862389, 0.00959882140159607, 0.01175750233232975, 0.013916184194386005, 0.01607486605644226, 0.01823354698717594, 0.020392227917909622, 0.022550910711288452, 0.024709591642022133, 0.026868272572755814, 0.029026953503489494, 0.031185634434223175, 0.033344317227602005, 0.035503000020980835, 0.037661679089069366, 0.039820361882448196, 0.041979044675827026, 0.04413772374391556]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 4.0, 9.0, 3.0, 6.0, 9.0, 4.0, 10.0, 17.0, 15.0, 18.0, 30.0, 27.0, 40.0, 33.0, 34.0, 36.0, 44.0, 44.0, 56.0, 61.0, 51.0, 56.0, 35.0, 45.0, 50.0, 47.0, 39.0, 31.0, 30.0, 19.0, 15.0, 15.0, 11.0, 19.0, 11.0, 10.0, 5.0, 4.0, 0.0, 4.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.04304862022399902, -0.04181289300322533, -0.04057716578245163, -0.039341434836387634, -0.03810570761561394, -0.03686998039484024, -0.035634249448776245, -0.03439852222800255, -0.03316279500722885, -0.031927067786455154, -0.03069133870303631, -0.029455609619617462, -0.028219882398843765, -0.02698415517807007, -0.025748426094651222, -0.024512697011232376, -0.02327696979045868, -0.022041242569684982, -0.020805513486266136, -0.01956978440284729, -0.018334057182073593, -0.017098329961299896, -0.01586260087788105, -0.014626872725784779, -0.013391144573688507, -0.012155416421592236, -0.010919688269495964, -0.009683960117399693, -0.008448231965303421, -0.0072125038132071495, -0.005976775661110878, -0.0047410475090146065, -0.003505319356918335, -0.0022695912048220634, -0.001033863052725792, 0.00020186509937047958, 0.001437593251466751, 0.0026733214035630226, 0.003909049555659294, 0.005144777707755566, 0.006380505859851837, 0.007616234011948109, 0.00885196216404438, 0.010087690316140652, 0.011323418468236923, 0.012559146620333195, 0.013794874772429466, 0.015030602924525738, 0.01626633107662201, 0.017502058297395706, 0.018737787380814552, 0.0199735164642334, 0.021209243685007095, 0.022444970905780792, 0.02368069998919964, 0.024916429072618484, 0.02615215629339218, 0.02738788351416588, 0.028623612597584724, 0.02985934168100357, 0.031095068901777267, 0.032330796122550964, 0.03356652706861496, 0.03480225428938866, 0.036037981510162354]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 9.0, 8.0, 8.0, 12.0, 18.0, 29.0, 50.0, 80.0, 131.0, 228.0, 491.0, 915.0, 2146.0, 5461.0, 15966.0, 60552.0, 267183.0, 489332.0, 152906.0, 35860.0, 10434.0, 3647.0, 1510.0, 726.0, 353.0, 189.0, 133.0, 53.0, 35.0, 27.0, 16.0, 14.0, 12.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0173797607421875, -0.01687324047088623, -0.01636672019958496, -0.01586019992828369, -0.015353679656982422, -0.014847159385681152, -0.014340639114379883, -0.013834118843078613, -0.013327598571777344, -0.012821078300476074, -0.012314558029174805, -0.011808037757873535, -0.011301517486572266, -0.010794997215270996, -0.010288476943969727, -0.009781956672668457, -0.009275436401367188, -0.008768916130065918, -0.008262395858764648, -0.007755875587463379, -0.007249355316162109, -0.00674283504486084, -0.00623631477355957, -0.005729794502258301, -0.005223274230957031, -0.004716753959655762, -0.004210233688354492, -0.0037037134170532227, -0.003197193145751953, -0.0026906728744506836, -0.002184152603149414, -0.0016776323318481445, -0.001171112060546875, -0.0006645917892456055, -0.00015807151794433594, 0.0003484487533569336, 0.0008549690246582031, 0.0013614892959594727, 0.0018680095672607422, 0.0023745298385620117, 0.0028810501098632812, 0.0033875703811645508, 0.0038940906524658203, 0.00440061092376709, 0.004907131195068359, 0.005413651466369629, 0.0059201717376708984, 0.006426692008972168, 0.0069332122802734375, 0.007439732551574707, 0.007946252822875977, 0.008452773094177246, 0.008959293365478516, 0.009465813636779785, 0.009972333908081055, 0.010478854179382324, 0.010985374450683594, 0.011491894721984863, 0.011998414993286133, 0.012504935264587402, 0.013011455535888672, 0.013517975807189941, 0.014024496078491211, 0.01453101634979248, 0.01503753662109375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 8.0, 8.0, 11.0, 16.0, 28.0, 20.0, 35.0, 42.0, 46.0, 44.0, 59.0, 65.0, 58.0, 73.0, 55.0, 69.0, 70.0, 61.0, 45.0, 43.0, 36.0, 22.0, 26.0, 8.0, 9.0, 8.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0116729736328125, -0.01130211353302002, -0.010931253433227539, -0.010560393333435059, -0.010189533233642578, -0.009818673133850098, -0.009447813034057617, -0.009076952934265137, -0.008706092834472656, -0.008335232734680176, -0.007964372634887695, -0.007593512535095215, -0.007222652435302734, -0.006851792335510254, -0.0064809322357177734, -0.006110072135925293, -0.0057392120361328125, -0.005368351936340332, -0.0049974918365478516, -0.004626631736755371, -0.004255771636962891, -0.00388491153717041, -0.0035140514373779297, -0.0031431913375854492, -0.0027723312377929688, -0.0024014711380004883, -0.002030611038208008, -0.0016597509384155273, -0.0012888908386230469, -0.0009180307388305664, -0.0005471706390380859, -0.00017631053924560547, 0.000194549560546875, 0.0005654096603393555, 0.0009362697601318359, 0.0013071298599243164, 0.0016779899597167969, 0.0020488500595092773, 0.002419710159301758, 0.0027905702590942383, 0.0031614303588867188, 0.0035322904586791992, 0.0039031505584716797, 0.00427401065826416, 0.004644870758056641, 0.005015730857849121, 0.0053865909576416016, 0.005757451057434082, 0.0061283111572265625, 0.006499171257019043, 0.0068700313568115234, 0.007240891456604004, 0.007611751556396484, 0.007982611656188965, 0.008353471755981445, 0.008724331855773926, 0.009095191955566406, 0.009466052055358887, 0.009836912155151367, 0.010207772254943848, 0.010578632354736328, 0.010949492454528809, 0.011320352554321289, 0.01169121265411377, 0.01206207275390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 5.0, 5.0, 6.0, 11.0, 14.0, 23.0, 27.0, 48.0, 57.0, 81.0, 145.0, 177.0, 265.0, 500.0, 931.0, 2032.0, 6234.0, 32699.0, 365442.0, 574691.0, 51342.0, 8540.0, 2614.0, 1076.0, 575.0, 339.0, 188.0, 148.0, 91.0, 67.0, 51.0, 31.0, 18.0, 20.0, 14.0, 5.0, 9.0, 5.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0209197998046875, -0.020175457000732422, -0.019431114196777344, -0.018686771392822266, -0.017942428588867188, -0.01719808578491211, -0.01645374298095703, -0.015709400177001953, -0.014965057373046875, -0.014220714569091797, -0.013476371765136719, -0.01273202896118164, -0.011987686157226562, -0.011243343353271484, -0.010499000549316406, -0.009754657745361328, -0.00901031494140625, -0.008265972137451172, -0.007521629333496094, -0.006777286529541016, -0.0060329437255859375, -0.005288600921630859, -0.004544258117675781, -0.003799915313720703, -0.003055572509765625, -0.002311229705810547, -0.0015668869018554688, -0.0008225440979003906, -7.82012939453125e-05, 0.0006661415100097656, 0.0014104843139648438, 0.002154827117919922, 0.002899169921875, 0.003643512725830078, 0.004387855529785156, 0.005132198333740234, 0.0058765411376953125, 0.006620883941650391, 0.007365226745605469, 0.008109569549560547, 0.008853912353515625, 0.009598255157470703, 0.010342597961425781, 0.01108694076538086, 0.011831283569335938, 0.012575626373291016, 0.013319969177246094, 0.014064311981201172, 0.01480865478515625, 0.015552997589111328, 0.016297340393066406, 0.017041683197021484, 0.017786026000976562, 0.01853036880493164, 0.01927471160888672, 0.020019054412841797, 0.020763397216796875, 0.021507740020751953, 0.02225208282470703, 0.02299642562866211, 0.023740768432617188, 0.024485111236572266, 0.025229454040527344, 0.025973796844482422, 0.0267181396484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 14.0, 9.0, 7.0, 8.0, 19.0, 28.0, 34.0, 45.0, 45.0, 47.0, 65.0, 54.0, 52.0, 62.0, 61.0, 63.0, 59.0, 59.0, 44.0, 43.0, 36.0, 27.0, 29.0, 30.0, 18.0, 13.0, 7.0, 5.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04315185546875, -0.041759490966796875, -0.04036712646484375, -0.038974761962890625, -0.0375823974609375, -0.036190032958984375, -0.03479766845703125, -0.033405303955078125, -0.032012939453125, -0.030620574951171875, -0.02922821044921875, -0.027835845947265625, -0.0264434814453125, -0.025051116943359375, -0.02365875244140625, -0.022266387939453125, -0.0208740234375, -0.019481658935546875, -0.01808929443359375, -0.016696929931640625, -0.0153045654296875, -0.013912200927734375, -0.01251983642578125, -0.011127471923828125, -0.009735107421875, -0.008342742919921875, -0.00695037841796875, -0.005558013916015625, -0.0041656494140625, -0.002773284912109375, -0.00138092041015625, 1.1444091796875e-05, 0.00140380859375, 0.002796173095703125, 0.00418853759765625, 0.005580902099609375, 0.0069732666015625, 0.008365631103515625, 0.00975799560546875, 0.011150360107421875, 0.012542724609375, 0.013935089111328125, 0.01532745361328125, 0.016719818115234375, 0.0181121826171875, 0.019504547119140625, 0.02089691162109375, 0.022289276123046875, 0.023681640625, 0.025074005126953125, 0.02646636962890625, 0.027858734130859375, 0.0292510986328125, 0.030643463134765625, 0.03203582763671875, 0.033428192138671875, 0.034820556640625, 0.036212921142578125, 0.03760528564453125, 0.038997650146484375, 0.0403900146484375, 0.041782379150390625, 0.04317474365234375, 0.044567108154296875, 0.04595947265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 4.0, 7.0, 7.0, 20.0, 18.0, 22.0, 31.0, 44.0, 89.0, 130.0, 290.0, 678.0, 1947.0, 8825.0, 96126.0, 840866.0, 87886.0, 8382.0, 1816.0, 694.0, 272.0, 152.0, 84.0, 37.0, 30.0, 25.0, 27.0, 10.0, 9.0, 9.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.014251708984375, -0.013899683952331543, -0.013547658920288086, -0.013195633888244629, -0.012843608856201172, -0.012491583824157715, -0.012139558792114258, -0.0117875337600708, -0.011435508728027344, -0.011083483695983887, -0.01073145866394043, -0.010379433631896973, -0.010027408599853516, -0.009675383567810059, -0.009323358535766602, -0.008971333503723145, -0.008619308471679688, -0.00826728343963623, -0.007915258407592773, -0.007563233375549316, -0.007211208343505859, -0.006859183311462402, -0.006507158279418945, -0.006155133247375488, -0.005803108215332031, -0.005451083183288574, -0.005099058151245117, -0.00474703311920166, -0.004395008087158203, -0.004042983055114746, -0.003690958023071289, -0.003338932991027832, -0.002986907958984375, -0.002634882926940918, -0.002282857894897461, -0.001930832862854004, -0.0015788078308105469, -0.0012267827987670898, -0.0008747577667236328, -0.0005227327346801758, -0.00017070770263671875, 0.00018131732940673828, 0.0005333423614501953, 0.0008853673934936523, 0.0012373924255371094, 0.0015894174575805664, 0.0019414424896240234, 0.0022934675216674805, 0.0026454925537109375, 0.0029975175857543945, 0.0033495426177978516, 0.0037015676498413086, 0.004053592681884766, 0.004405617713928223, 0.00475764274597168, 0.005109667778015137, 0.005461692810058594, 0.005813717842102051, 0.006165742874145508, 0.006517767906188965, 0.006869792938232422, 0.007221817970275879, 0.007573843002319336, 0.007925868034362793, 0.00827789306640625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 11.0, 8.0, 16.0, 14.0, 24.0, 28.0, 41.0, 41.0, 70.0, 84.0, 72.0, 109.0, 99.0, 90.0, 67.0, 57.0, 34.0, 36.0, 25.0, 14.0, 18.0, 8.0, 7.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3272972106933594e-05, -4.185270518064499e-05, -4.0432438254356384e-05, -3.901217132806778e-05, -3.7591904401779175e-05, -3.617163747549057e-05, -3.4751370549201965e-05, -3.333110362291336e-05, -3.1910836696624756e-05, -3.049056977033615e-05, -2.9070302844047546e-05, -2.765003591775894e-05, -2.6229768991470337e-05, -2.4809502065181732e-05, -2.3389235138893127e-05, -2.1968968212604523e-05, -2.0548701286315918e-05, -1.9128434360027313e-05, -1.770816743373871e-05, -1.6287900507450104e-05, -1.4867633581161499e-05, -1.3447366654872894e-05, -1.202709972858429e-05, -1.0606832802295685e-05, -9.18656587600708e-06, -7.766298949718475e-06, -6.346032023429871e-06, -4.925765097141266e-06, -3.505498170852661e-06, -2.0852312445640564e-06, -6.649643182754517e-07, 7.553026080131531e-07, 2.175569534301758e-06, 3.5958364605903625e-06, 5.016103386878967e-06, 6.436370313167572e-06, 7.856637239456177e-06, 9.276904165744781e-06, 1.0697171092033386e-05, 1.2117438018321991e-05, 1.3537704944610596e-05, 1.49579718708992e-05, 1.6378238797187805e-05, 1.779850572347641e-05, 1.9218772649765015e-05, 2.063903957605362e-05, 2.2059306502342224e-05, 2.347957342863083e-05, 2.4899840354919434e-05, 2.632010728120804e-05, 2.7740374207496643e-05, 2.9160641133785248e-05, 3.058090806007385e-05, 3.200117498636246e-05, 3.342144191265106e-05, 3.484170883893967e-05, 3.626197576522827e-05, 3.7682242691516876e-05, 3.910250961780548e-05, 4.0522776544094086e-05, 4.194304347038269e-05, 4.3363310396671295e-05, 4.47835773229599e-05, 4.6203844249248505e-05, 4.762411117553711e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 8.0, 19.0, 23.0, 49.0, 65.0, 133.0, 285.0, 706.0, 2518.0, 18554.0, 719232.0, 294034.0, 10024.0, 1784.0, 572.0, 240.0, 132.0, 65.0, 36.0, 21.0, 11.0, 11.0, 10.0, 10.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0208282470703125, -0.020342469215393066, -0.019856691360473633, -0.0193709135055542, -0.018885135650634766, -0.018399357795715332, -0.0179135799407959, -0.017427802085876465, -0.01694202423095703, -0.016456246376037598, -0.015970468521118164, -0.01548469066619873, -0.014998912811279297, -0.014513134956359863, -0.01402735710144043, -0.013541579246520996, -0.013055801391601562, -0.012570023536682129, -0.012084245681762695, -0.011598467826843262, -0.011112689971923828, -0.010626912117004395, -0.010141134262084961, -0.009655356407165527, -0.009169578552246094, -0.00868380069732666, -0.008198022842407227, -0.007712244987487793, -0.007226467132568359, -0.006740689277648926, -0.006254911422729492, -0.005769133567810059, -0.005283355712890625, -0.004797577857971191, -0.004311800003051758, -0.0038260221481323242, -0.0033402442932128906, -0.002854466438293457, -0.0023686885833740234, -0.0018829107284545898, -0.0013971328735351562, -0.0009113550186157227, -0.00042557716369628906, 6.020069122314453e-05, 0.0005459785461425781, 0.0010317564010620117, 0.0015175342559814453, 0.002003312110900879, 0.0024890899658203125, 0.002974867820739746, 0.0034606456756591797, 0.003946423530578613, 0.004432201385498047, 0.0049179792404174805, 0.005403757095336914, 0.005889534950256348, 0.006375312805175781, 0.006861090660095215, 0.0073468685150146484, 0.007832646369934082, 0.008318424224853516, 0.00880420207977295, 0.009289979934692383, 0.009775757789611816, 0.01026153564453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 5.0, 6.0, 12.0, 11.0, 21.0, 38.0, 33.0, 71.0, 80.0, 117.0, 165.0, 151.0, 102.0, 73.0, 47.0, 31.0, 16.0, 10.0, 11.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007404327392578125, -0.006900966167449951, -0.006397604942321777, -0.0058942437171936035, -0.00539088249206543, -0.004887521266937256, -0.004384160041809082, -0.003880798816680908, -0.0033774375915527344, -0.0028740763664245605, -0.0023707151412963867, -0.0018673539161682129, -0.001363992691040039, -0.0008606314659118652, -0.0003572702407836914, 0.00014609098434448242, 0.0006494522094726562, 0.00115281343460083, 0.001656174659729004, 0.0021595358848571777, 0.0026628971099853516, 0.0031662583351135254, 0.0036696195602416992, 0.004172980785369873, 0.004676342010498047, 0.005179703235626221, 0.0056830644607543945, 0.006186425685882568, 0.006689786911010742, 0.007193148136138916, 0.00769650936126709, 0.008199870586395264, 0.008703231811523438, 0.009206593036651611, 0.009709954261779785, 0.010213315486907959, 0.010716676712036133, 0.011220037937164307, 0.01172339916229248, 0.012226760387420654, 0.012730121612548828, 0.013233482837677002, 0.013736844062805176, 0.01424020528793335, 0.014743566513061523, 0.015246927738189697, 0.01575028896331787, 0.016253650188446045, 0.01675701141357422, 0.017260372638702393, 0.017763733863830566, 0.01826709508895874, 0.018770456314086914, 0.019273817539215088, 0.01977717876434326, 0.020280539989471436, 0.02078390121459961, 0.021287262439727783, 0.021790623664855957, 0.02229398488998413, 0.022797346115112305, 0.02330070734024048, 0.023804068565368652, 0.024307429790496826, 0.024810791015625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 4.0, 2.0, 4.0, 10.0, 12.0, 26.0, 38.0, 69.0, 106.0, 159.0, 164.0, 165.0, 113.0, 56.0, 37.0, 12.0, 12.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13776442408561707, -0.13234345614910126, -0.12692247331142426, -0.12150149792432785, -0.11608052253723145, -0.11065954715013504, -0.10523857176303864, -0.09981760382652283, -0.09439662098884583, -0.08897564560174942, -0.08355467021465302, -0.07813369482755661, -0.0727127194404602, -0.0672917440533638, -0.061870772391557693, -0.05644979700446129, -0.05102882534265518, -0.04560784995555878, -0.04018687456846237, -0.03476589918136597, -0.02934492565691471, -0.023923950269818306, -0.01850297674536705, -0.013082001358270645, -0.00766102597117424, -0.0022400510497391224, 0.0031809238716959953, 0.008601898327469826, 0.01402287371456623, 0.019443849101662636, 0.02486482262611389, 0.030285798013210297, 0.0357067734003067, 0.04112774878740311, 0.04654872417449951, 0.05196969956159592, 0.05739067494869232, 0.06281165033578873, 0.06823262572288513, 0.07365359365940094, 0.07907457649707794, 0.08449555188417435, 0.08991652727127075, 0.09533750265836716, 0.10075847804546356, 0.10617945343255997, 0.11160042881965637, 0.11702139675617218, 0.12244237214326859, 0.127863347530365, 0.1332843154668808, 0.1387052983045578, 0.1441262662410736, 0.1495472490787506, 0.15496821701526642, 0.16038919985294342, 0.16581016778945923, 0.17123113572597504, 0.17665211856365204, 0.18207308650016785, 0.18749406933784485, 0.19291503727436066, 0.19833602011203766, 0.20375698804855347, 0.20917797088623047]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 6.0, 4.0, 6.0, 11.0, 8.0, 17.0, 15.0, 18.0, 21.0, 41.0, 26.0, 49.0, 47.0, 48.0, 57.0, 55.0, 51.0, 47.0, 50.0, 40.0, 59.0, 57.0, 38.0, 30.0, 29.0, 34.0, 28.0, 20.0, 15.0, 13.0, 18.0, 7.0, 13.0, 10.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15233856439590454, -0.1469634473323822, -0.14158833026885986, -0.13621321320533752, -0.13083809614181519, -0.12546297907829285, -0.12008786201477051, -0.11471274495124817, -0.10933762788772583, -0.10396251082420349, -0.09858739376068115, -0.09321227669715881, -0.08783715963363647, -0.08246204257011414, -0.0770869255065918, -0.07171180844306946, -0.06633669137954712, -0.06096157431602478, -0.05558645725250244, -0.0502113401889801, -0.044836223125457764, -0.039461106061935425, -0.034085988998413086, -0.028710871934890747, -0.023335754871368408, -0.01796063780784607, -0.01258552074432373, -0.007210403680801392, -0.0018352866172790527, 0.003539830446243286, 0.008914947509765625, 0.014290064573287964, 0.019665181636810303, 0.02504029870033264, 0.03041541576385498, 0.03579053282737732, 0.04116564989089966, 0.046540766954422, 0.051915884017944336, 0.057291001081466675, 0.06266611814498901, 0.06804123520851135, 0.07341635227203369, 0.07879146933555603, 0.08416658639907837, 0.08954170346260071, 0.09491682052612305, 0.10029193758964539, 0.10566705465316772, 0.11104217171669006, 0.1164172887802124, 0.12179240584373474, 0.12716752290725708, 0.13254263997077942, 0.13791775703430176, 0.1432928740978241, 0.14866799116134644, 0.15404310822486877, 0.1594182252883911, 0.16479334235191345, 0.1701684594154358, 0.17554357647895813, 0.18091869354248047, 0.1862938106060028, 0.19166892766952515]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [7.0, 8.0, 17.0, 40.0, 77.0, 121.0, 285.0, 672.0, 1619.0, 4491.0, 17174.0, 131301.0, 3785033.0, 223609.0, 20859.0, 5392.0, 1946.0, 758.0, 392.0, 196.0, 111.0, 78.0, 55.0, 23.0, 14.0, 10.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0088653564453125, -0.008160829544067383, -0.007456302642822266, -0.0067517757415771484, -0.006047248840332031, -0.005342721939086914, -0.004638195037841797, -0.00393366813659668, -0.0032291412353515625, -0.0025246143341064453, -0.0018200874328613281, -0.001115560531616211, -0.00041103363037109375, 0.00029349327087402344, 0.0009980201721191406, 0.0017025470733642578, 0.002407073974609375, 0.003111600875854492, 0.0038161277770996094, 0.0045206546783447266, 0.005225181579589844, 0.005929708480834961, 0.006634235382080078, 0.007338762283325195, 0.008043289184570312, 0.00874781608581543, 0.009452342987060547, 0.010156869888305664, 0.010861396789550781, 0.011565923690795898, 0.012270450592041016, 0.012974977493286133, 0.01367950439453125, 0.014384031295776367, 0.015088558197021484, 0.0157930850982666, 0.01649761199951172, 0.017202138900756836, 0.017906665802001953, 0.01861119270324707, 0.019315719604492188, 0.020020246505737305, 0.020724773406982422, 0.02142930030822754, 0.022133827209472656, 0.022838354110717773, 0.02354288101196289, 0.024247407913208008, 0.024951934814453125, 0.025656461715698242, 0.02636098861694336, 0.027065515518188477, 0.027770042419433594, 0.02847456932067871, 0.029179096221923828, 0.029883623123168945, 0.030588150024414062, 0.03129267692565918, 0.0319972038269043, 0.032701730728149414, 0.03340625762939453, 0.03411078453063965, 0.034815311431884766, 0.03551983833312988, 0.036224365234375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 9.0, 6.0, 4.0, 6.0, 17.0, 15.0, 21.0, 35.0, 34.0, 43.0, 66.0, 79.0, 68.0, 69.0, 80.0, 84.0, 75.0, 76.0, 49.0, 31.0, 39.0, 34.0, 21.0, 12.0, 16.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010650634765625, -0.010231256484985352, -0.009811878204345703, -0.009392499923706055, -0.008973121643066406, -0.008553743362426758, -0.00813436508178711, -0.007714986801147461, -0.0072956085205078125, -0.006876230239868164, -0.006456851959228516, -0.006037473678588867, -0.005618095397949219, -0.00519871711730957, -0.004779338836669922, -0.0043599605560302734, -0.003940582275390625, -0.0035212039947509766, -0.003101825714111328, -0.0026824474334716797, -0.0022630691528320312, -0.0018436908721923828, -0.0014243125915527344, -0.001004934310913086, -0.0005855560302734375, -0.00016617774963378906, 0.0002532005310058594, 0.0006725788116455078, 0.0010919570922851562, 0.0015113353729248047, 0.0019307136535644531, 0.0023500919342041016, 0.00276947021484375, 0.0031888484954833984, 0.003608226776123047, 0.004027605056762695, 0.004446983337402344, 0.004866361618041992, 0.005285739898681641, 0.005705118179321289, 0.0061244964599609375, 0.006543874740600586, 0.006963253021240234, 0.007382631301879883, 0.007802009582519531, 0.00822138786315918, 0.008640766143798828, 0.009060144424438477, 0.009479522705078125, 0.009898900985717773, 0.010318279266357422, 0.01073765754699707, 0.011157035827636719, 0.011576414108276367, 0.011995792388916016, 0.012415170669555664, 0.012834548950195312, 0.013253927230834961, 0.01367330551147461, 0.014092683792114258, 0.014512062072753906, 0.014931440353393555, 0.015350818634033203, 0.01577019691467285, 0.0161895751953125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 19.0, 14.0, 26.0, 29.0, 49.0, 88.0, 163.0, 363.0, 1428.0, 9925.0, 158524.0, 3965390.0, 51900.0, 4863.0, 874.0, 282.0, 107.0, 73.0, 40.0, 32.0, 16.0, 17.0, 13.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.035736083984375, -0.03455781936645508, -0.033379554748535156, -0.032201290130615234, -0.031023025512695312, -0.02984476089477539, -0.02866649627685547, -0.027488231658935547, -0.026309967041015625, -0.025131702423095703, -0.02395343780517578, -0.02277517318725586, -0.021596908569335938, -0.020418643951416016, -0.019240379333496094, -0.018062114715576172, -0.01688385009765625, -0.015705585479736328, -0.014527320861816406, -0.013349056243896484, -0.012170791625976562, -0.01099252700805664, -0.009814262390136719, -0.008635997772216797, -0.007457733154296875, -0.006279468536376953, -0.005101203918457031, -0.003922939300537109, -0.0027446746826171875, -0.0015664100646972656, -0.00038814544677734375, 0.0007901191711425781, 0.0019683837890625, 0.003146648406982422, 0.004324913024902344, 0.005503177642822266, 0.0066814422607421875, 0.00785970687866211, 0.009037971496582031, 0.010216236114501953, 0.011394500732421875, 0.012572765350341797, 0.013751029968261719, 0.01492929458618164, 0.016107559204101562, 0.017285823822021484, 0.018464088439941406, 0.019642353057861328, 0.02082061767578125, 0.021998882293701172, 0.023177146911621094, 0.024355411529541016, 0.025533676147460938, 0.02671194076538086, 0.02789020538330078, 0.029068470001220703, 0.030246734619140625, 0.03142499923706055, 0.03260326385498047, 0.03378152847290039, 0.03495979309082031, 0.036138057708740234, 0.037316322326660156, 0.03849458694458008, 0.0396728515625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 8.0, 3.0, 3.0, 13.0, 13.0, 17.0, 27.0, 42.0, 67.0, 165.0, 457.0, 1282.0, 1158.0, 361.0, 172.0, 82.0, 42.0, 36.0, 31.0, 16.0, 17.0, 12.0, 9.0, 9.0, 2.0, 6.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022491455078125, -0.021789073944091797, -0.021086692810058594, -0.02038431167602539, -0.019681930541992188, -0.018979549407958984, -0.01827716827392578, -0.017574787139892578, -0.016872406005859375, -0.016170024871826172, -0.015467643737792969, -0.014765262603759766, -0.014062881469726562, -0.01336050033569336, -0.012658119201660156, -0.011955738067626953, -0.01125335693359375, -0.010550975799560547, -0.009848594665527344, -0.00914621353149414, -0.008443832397460938, -0.007741451263427734, -0.007039070129394531, -0.006336688995361328, -0.005634307861328125, -0.004931926727294922, -0.004229545593261719, -0.0035271644592285156, -0.0028247833251953125, -0.0021224021911621094, -0.0014200210571289062, -0.0007176399230957031, -1.52587890625e-05, 0.0006871223449707031, 0.0013895034790039062, 0.0020918846130371094, 0.0027942657470703125, 0.0034966468811035156, 0.004199028015136719, 0.004901409149169922, 0.005603790283203125, 0.006306171417236328, 0.007008552551269531, 0.007710933685302734, 0.008413314819335938, 0.00911569595336914, 0.009818077087402344, 0.010520458221435547, 0.01122283935546875, 0.011925220489501953, 0.012627601623535156, 0.01332998275756836, 0.014032363891601562, 0.014734745025634766, 0.015437126159667969, 0.016139507293701172, 0.016841888427734375, 0.017544269561767578, 0.01824665069580078, 0.018949031829833984, 0.019651412963867188, 0.02035379409790039, 0.021056175231933594, 0.021758556365966797, 0.0224609375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 14.0, 36.0, 125.0, 278.0, 325.0, 148.0, 38.0, 10.0, 7.0, 3.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1583833396434784, -0.14961114525794983, -0.14083895087242126, -0.1320667564868927, -0.12329456210136414, -0.11452236771583557, -0.105750173330307, -0.09697797894477844, -0.08820578455924988, -0.07943359017372131, -0.07066139578819275, -0.061889201402664185, -0.05311700701713562, -0.044344812631607056, -0.03557261824607849, -0.026800423860549927, -0.018028229475021362, -0.009256035089492798, -0.0004838407039642334, 0.008288353681564331, 0.017060548067092896, 0.02583274245262146, 0.034604936838150024, 0.04337713122367859, 0.05214932560920715, 0.06092151999473572, 0.06969371438026428, 0.07846590876579285, 0.08723810315132141, 0.09601029753684998, 0.10478249192237854, 0.1135546863079071, 0.12232691049575806, 0.13109910488128662, 0.13987129926681519, 0.14864349365234375, 0.15741568803787231, 0.16618788242340088, 0.17496007680892944, 0.183732271194458, 0.19250446557998657, 0.20127665996551514, 0.2100488543510437, 0.21882104873657227, 0.22759324312210083, 0.2363654375076294, 0.24513763189315796, 0.2539098262786865, 0.2626820206642151, 0.27145421504974365, 0.2802264094352722, 0.2889986038208008, 0.29777079820632935, 0.3065429925918579, 0.3153151869773865, 0.32408738136291504, 0.3328595757484436, 0.34163177013397217, 0.35040396451950073, 0.3591761589050293, 0.36794835329055786, 0.3767205476760864, 0.385492742061615, 0.39426493644714355, 0.4030371308326721]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 8.0, 17.0, 12.0, 10.0, 13.0, 18.0, 36.0, 31.0, 30.0, 44.0, 53.0, 64.0, 46.0, 52.0, 52.0, 61.0, 46.0, 50.0, 56.0, 44.0, 45.0, 46.0, 30.0, 28.0, 28.0, 24.0, 11.0, 14.0, 7.0, 6.0, 8.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10541015863418579, -0.1023077666759491, -0.0992053747177124, -0.09610298275947571, -0.09300059080123901, -0.08989819884300232, -0.08679580688476562, -0.08369341492652893, -0.08059102296829224, -0.07748863101005554, -0.07438623905181885, -0.07128384709358215, -0.06818145513534546, -0.06507906317710876, -0.06197667121887207, -0.058874279260635376, -0.05577188730239868, -0.05266949534416199, -0.04956710338592529, -0.0464647114276886, -0.043362319469451904, -0.04025992751121521, -0.037157535552978516, -0.03405514359474182, -0.030952751636505127, -0.027850359678268433, -0.02474796772003174, -0.021645575761795044, -0.01854318380355835, -0.015440791845321655, -0.012338399887084961, -0.009236007928848267, -0.006133615970611572, -0.003031224012374878, 7.11679458618164e-05, 0.0031735599040985107, 0.006275951862335205, 0.0093783438205719, 0.012480735778808594, 0.015583127737045288, 0.018685519695281982, 0.021787911653518677, 0.02489030361175537, 0.027992695569992065, 0.03109508752822876, 0.034197479486465454, 0.03729987144470215, 0.04040226340293884, 0.04350465536117554, 0.04660704731941223, 0.049709439277648926, 0.05281183123588562, 0.055914223194122314, 0.05901661515235901, 0.0621190071105957, 0.0652213990688324, 0.06832379102706909, 0.07142618298530579, 0.07452857494354248, 0.07763096690177917, 0.08073335886001587, 0.08383575081825256, 0.08693814277648926, 0.09004053473472595, 0.09314292669296265]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 15.0, 21.0, 28.0, 39.0, 55.0, 89.0, 121.0, 194.0, 263.0, 426.0, 748.0, 1243.0, 2160.0, 3930.0, 7568.0, 15461.0, 35413.0, 83618.0, 200074.0, 324560.0, 211293.0, 89665.0, 37650.0, 16361.0, 7959.0, 4086.0, 2201.0, 1263.0, 730.0, 446.0, 275.0, 198.0, 140.0, 83.0, 55.0, 39.0, 27.0, 21.0, 7.0, 2.0, 5.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0097808837890625, -0.00946056842803955, -0.009140253067016602, -0.008819937705993652, -0.008499622344970703, -0.008179306983947754, -0.007858991622924805, -0.0075386762619018555, -0.007218360900878906, -0.006898045539855957, -0.006577730178833008, -0.006257414817810059, -0.005937099456787109, -0.00561678409576416, -0.005296468734741211, -0.004976153373718262, -0.0046558380126953125, -0.004335522651672363, -0.004015207290649414, -0.003694891929626465, -0.0033745765686035156, -0.0030542612075805664, -0.002733945846557617, -0.002413630485534668, -0.0020933151245117188, -0.0017729997634887695, -0.0014526844024658203, -0.001132369041442871, -0.0008120536804199219, -0.0004917383193969727, -0.00017142295837402344, 0.00014889240264892578, 0.000469207763671875, 0.0007895231246948242, 0.0011098384857177734, 0.0014301538467407227, 0.0017504692077636719, 0.002070784568786621, 0.0023910999298095703, 0.0027114152908325195, 0.0030317306518554688, 0.003352046012878418, 0.003672361373901367, 0.003992676734924316, 0.004312992095947266, 0.004633307456970215, 0.004953622817993164, 0.005273938179016113, 0.0055942535400390625, 0.005914568901062012, 0.006234884262084961, 0.00655519962310791, 0.006875514984130859, 0.007195830345153809, 0.007516145706176758, 0.007836461067199707, 0.008156776428222656, 0.008477091789245605, 0.008797407150268555, 0.009117722511291504, 0.009438037872314453, 0.009758353233337402, 0.010078668594360352, 0.0103989839553833, 0.01071929931640625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 4.0, 6.0, 14.0, 10.0, 27.0, 32.0, 39.0, 37.0, 43.0, 60.0, 50.0, 67.0, 63.0, 66.0, 73.0, 64.0, 74.0, 54.0, 38.0, 46.0, 35.0, 18.0, 21.0, 14.0, 10.0, 11.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.01113128662109375, -0.01076650619506836, -0.010401725769042969, -0.010036945343017578, -0.009672164916992188, -0.009307384490966797, -0.008942604064941406, -0.008577823638916016, -0.008213043212890625, -0.007848262786865234, -0.007483482360839844, -0.007118701934814453, -0.0067539215087890625, -0.006389141082763672, -0.006024360656738281, -0.005659580230712891, -0.0052947998046875, -0.004930019378662109, -0.004565238952636719, -0.004200458526611328, -0.0038356781005859375, -0.003470897674560547, -0.0031061172485351562, -0.0027413368225097656, -0.002376556396484375, -0.0020117759704589844, -0.0016469955444335938, -0.0012822151184082031, -0.0009174346923828125, -0.0005526542663574219, -0.00018787384033203125, 0.00017690658569335938, 0.00054168701171875, 0.0009064674377441406, 0.0012712478637695312, 0.0016360282897949219, 0.0020008087158203125, 0.002365589141845703, 0.0027303695678710938, 0.0030951499938964844, 0.003459930419921875, 0.0038247108459472656, 0.004189491271972656, 0.004554271697998047, 0.0049190521240234375, 0.005283832550048828, 0.005648612976074219, 0.006013393402099609, 0.006378173828125, 0.006742954254150391, 0.007107734680175781, 0.007472515106201172, 0.007837295532226562, 0.008202075958251953, 0.008566856384277344, 0.008931636810302734, 0.009296417236328125, 0.009661197662353516, 0.010025978088378906, 0.010390758514404297, 0.010755538940429688, 0.011120319366455078, 0.011485099792480469, 0.01184988021850586, 0.01221466064453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 10.0, 7.0, 12.0, 29.0, 43.0, 69.0, 115.0, 201.0, 360.0, 672.0, 1335.0, 3707.0, 19807.0, 378063.0, 608874.0, 27551.0, 4390.0, 1571.0, 760.0, 384.0, 237.0, 140.0, 73.0, 57.0, 27.0, 23.0, 14.0, 8.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.039215087890625, -0.03821134567260742, -0.037207603454589844, -0.036203861236572266, -0.03520011901855469, -0.03419637680053711, -0.03319263458251953, -0.03218889236450195, -0.031185150146484375, -0.030181407928466797, -0.02917766571044922, -0.02817392349243164, -0.027170181274414062, -0.026166439056396484, -0.025162696838378906, -0.024158954620361328, -0.02315521240234375, -0.022151470184326172, -0.021147727966308594, -0.020143985748291016, -0.019140243530273438, -0.01813650131225586, -0.01713275909423828, -0.016129016876220703, -0.015125274658203125, -0.014121532440185547, -0.013117790222167969, -0.01211404800415039, -0.011110305786132812, -0.010106563568115234, -0.009102821350097656, -0.008099079132080078, -0.0070953369140625, -0.006091594696044922, -0.005087852478027344, -0.004084110260009766, -0.0030803680419921875, -0.0020766258239746094, -0.0010728836059570312, -6.914138793945312e-05, 0.000934600830078125, 0.0019383430480957031, 0.0029420852661132812, 0.003945827484130859, 0.0049495697021484375, 0.005953311920166016, 0.006957054138183594, 0.007960796356201172, 0.00896453857421875, 0.009968280792236328, 0.010972023010253906, 0.011975765228271484, 0.012979507446289062, 0.01398324966430664, 0.014986991882324219, 0.015990734100341797, 0.016994476318359375, 0.017998218536376953, 0.01900196075439453, 0.02000570297241211, 0.021009445190429688, 0.022013187408447266, 0.023016929626464844, 0.024020671844482422, 0.0250244140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 6.0, 13.0, 6.0, 15.0, 22.0, 23.0, 15.0, 22.0, 34.0, 44.0, 41.0, 31.0, 58.0, 41.0, 51.0, 38.0, 37.0, 46.0, 38.0, 47.0, 47.0, 59.0, 27.0, 45.0, 23.0, 27.0, 23.0, 22.0, 16.0, 10.0, 14.0, 10.0, 7.0, 6.0, 4.0, 3.0, 13.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0308837890625, -0.029927968978881836, -0.028972148895263672, -0.028016328811645508, -0.027060508728027344, -0.02610468864440918, -0.025148868560791016, -0.02419304847717285, -0.023237228393554688, -0.022281408309936523, -0.02132558822631836, -0.020369768142700195, -0.01941394805908203, -0.018458127975463867, -0.017502307891845703, -0.01654648780822754, -0.015590667724609375, -0.014634847640991211, -0.013679027557373047, -0.012723207473754883, -0.011767387390136719, -0.010811567306518555, -0.00985574722290039, -0.008899927139282227, -0.007944107055664062, -0.0069882869720458984, -0.006032466888427734, -0.00507664680480957, -0.004120826721191406, -0.003165006637573242, -0.002209186553955078, -0.001253366470336914, -0.00029754638671875, 0.0006582736968994141, 0.0016140937805175781, 0.002569913864135742, 0.0035257339477539062, 0.00448155403137207, 0.005437374114990234, 0.0063931941986083984, 0.0073490142822265625, 0.008304834365844727, 0.00926065444946289, 0.010216474533081055, 0.011172294616699219, 0.012128114700317383, 0.013083934783935547, 0.014039754867553711, 0.014995574951171875, 0.01595139503479004, 0.016907215118408203, 0.017863035202026367, 0.01881885528564453, 0.019774675369262695, 0.02073049545288086, 0.021686315536499023, 0.022642135620117188, 0.02359795570373535, 0.024553775787353516, 0.02550959587097168, 0.026465415954589844, 0.027421236038208008, 0.028377056121826172, 0.029332876205444336, 0.0302886962890625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 12.0, 11.0, 17.0, 24.0, 16.0, 41.0, 40.0, 77.0, 121.0, 250.0, 373.0, 747.0, 1545.0, 4424.0, 30148.0, 985486.0, 18566.0, 3685.0, 1380.0, 631.0, 352.0, 210.0, 133.0, 67.0, 66.0, 27.0, 24.0, 17.0, 15.0, 4.0, 9.0, 4.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.037750244140625, -0.03665351867675781, -0.035556793212890625, -0.03446006774902344, -0.03336334228515625, -0.03226661682128906, -0.031169891357421875, -0.030073165893554688, -0.0289764404296875, -0.027879714965820312, -0.026782989501953125, -0.025686264038085938, -0.02458953857421875, -0.023492813110351562, -0.022396087646484375, -0.021299362182617188, -0.02020263671875, -0.019105911254882812, -0.018009185791015625, -0.016912460327148438, -0.01581573486328125, -0.014719009399414062, -0.013622283935546875, -0.012525558471679688, -0.0114288330078125, -0.010332107543945312, -0.009235382080078125, -0.008138656616210938, -0.00704193115234375, -0.0059452056884765625, -0.004848480224609375, -0.0037517547607421875, -0.002655029296875, -0.0015583038330078125, -0.000461578369140625, 0.0006351470947265625, 0.00173187255859375, 0.0028285980224609375, 0.003925323486328125, 0.0050220489501953125, 0.0061187744140625, 0.0072154998779296875, 0.008312225341796875, 0.009408950805664062, 0.01050567626953125, 0.011602401733398438, 0.012699127197265625, 0.013795852661132812, 0.014892578125, 0.015989303588867188, 0.017086029052734375, 0.018182754516601562, 0.01927947998046875, 0.020376205444335938, 0.021472930908203125, 0.022569656372070312, 0.0236663818359375, 0.024763107299804688, 0.025859832763671875, 0.026956558227539062, 0.02805328369140625, 0.029150009155273438, 0.030246734619140625, 0.03134346008300781, 0.032440185546875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 9.0, 8.0, 14.0, 8.0, 19.0, 18.0, 23.0, 41.0, 37.0, 62.0, 62.0, 59.0, 87.0, 87.0, 65.0, 63.0, 57.0, 62.0, 33.0, 31.0, 35.0, 28.0, 8.0, 12.0, 9.0, 10.0, 7.0, 7.0, 3.0, 1.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6716461181640625e-05, -3.55355441570282e-05, -3.435462713241577e-05, -3.3173710107803345e-05, -3.199279308319092e-05, -3.081187605857849e-05, -2.9630959033966064e-05, -2.8450042009353638e-05, -2.726912498474121e-05, -2.6088207960128784e-05, -2.4907290935516357e-05, -2.372637391090393e-05, -2.2545456886291504e-05, -2.1364539861679077e-05, -2.018362283706665e-05, -1.9002705812454224e-05, -1.7821788787841797e-05, -1.664087176322937e-05, -1.5459954738616943e-05, -1.4279037714004517e-05, -1.309812068939209e-05, -1.1917203664779663e-05, -1.0736286640167236e-05, -9.55536961555481e-06, -8.374452590942383e-06, -7.193535566329956e-06, -6.012618541717529e-06, -4.8317015171051025e-06, -3.6507844924926758e-06, -2.469867467880249e-06, -1.2889504432678223e-06, -1.0803341865539551e-07, 1.0728836059570312e-06, 2.253800630569458e-06, 3.4347176551818848e-06, 4.6156346797943115e-06, 5.796551704406738e-06, 6.977468729019165e-06, 8.158385753631592e-06, 9.339302778244019e-06, 1.0520219802856445e-05, 1.1701136827468872e-05, 1.2882053852081299e-05, 1.4062970876693726e-05, 1.5243887901306152e-05, 1.642480492591858e-05, 1.7605721950531006e-05, 1.8786638975143433e-05, 1.996755599975586e-05, 2.1148473024368286e-05, 2.2329390048980713e-05, 2.351030707359314e-05, 2.4691224098205566e-05, 2.5872141122817993e-05, 2.705305814743042e-05, 2.8233975172042847e-05, 2.9414892196655273e-05, 3.05958092212677e-05, 3.177672624588013e-05, 3.2957643270492554e-05, 3.413856029510498e-05, 3.531947731971741e-05, 3.6500394344329834e-05, 3.768131136894226e-05, 3.886222839355469e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 10.0, 9.0, 11.0, 15.0, 21.0, 32.0, 39.0, 58.0, 109.0, 224.0, 674.0, 2017.0, 12253.0, 979585.0, 48095.0, 3717.0, 944.0, 334.0, 143.0, 102.0, 50.0, 19.0, 25.0, 9.0, 13.0, 7.0, 10.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0418701171875, -0.04069709777832031, -0.039524078369140625, -0.03835105895996094, -0.03717803955078125, -0.03600502014160156, -0.034832000732421875, -0.03365898132324219, -0.0324859619140625, -0.03131294250488281, -0.030139923095703125, -0.028966903686523438, -0.02779388427734375, -0.026620864868164062, -0.025447845458984375, -0.024274826049804688, -0.023101806640625, -0.021928787231445312, -0.020755767822265625, -0.019582748413085938, -0.01840972900390625, -0.017236709594726562, -0.016063690185546875, -0.014890670776367188, -0.0137176513671875, -0.012544631958007812, -0.011371612548828125, -0.010198593139648438, -0.00902557373046875, -0.007852554321289062, -0.006679534912109375, -0.0055065155029296875, -0.00433349609375, -0.0031604766845703125, -0.001987457275390625, -0.0008144378662109375, 0.00035858154296875, 0.0015316009521484375, 0.002704620361328125, 0.0038776397705078125, 0.0050506591796875, 0.0062236785888671875, 0.007396697998046875, 0.008569717407226562, 0.00974273681640625, 0.010915756225585938, 0.012088775634765625, 0.013261795043945312, 0.014434814453125, 0.015607833862304688, 0.016780853271484375, 0.017953872680664062, 0.01912689208984375, 0.020299911499023438, 0.021472930908203125, 0.022645950317382812, 0.0238189697265625, 0.024991989135742188, 0.026165008544921875, 0.027338027954101562, 0.02851104736328125, 0.029684066772460938, 0.030857086181640625, 0.03203010559082031, 0.033203125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 14.0, 20.0, 59.0, 106.0, 251.0, 246.0, 155.0, 71.0, 24.0, 18.0, 8.0, 0.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0364990234375, -0.03554248809814453, -0.03458595275878906, -0.033629417419433594, -0.032672882080078125, -0.031716346740722656, -0.030759811401367188, -0.02980327606201172, -0.02884674072265625, -0.02789020538330078, -0.026933670043945312, -0.025977134704589844, -0.025020599365234375, -0.024064064025878906, -0.023107528686523438, -0.02215099334716797, -0.0211944580078125, -0.02023792266845703, -0.019281387329101562, -0.018324851989746094, -0.017368316650390625, -0.016411781311035156, -0.015455245971679688, -0.014498710632324219, -0.01354217529296875, -0.012585639953613281, -0.011629104614257812, -0.010672569274902344, -0.009716033935546875, -0.008759498596191406, -0.0078029632568359375, -0.006846427917480469, -0.005889892578125, -0.004933357238769531, -0.0039768218994140625, -0.0030202865600585938, -0.002063751220703125, -0.0011072158813476562, -0.0001506805419921875, 0.0008058547973632812, 0.00176239013671875, 0.0027189254760742188, 0.0036754608154296875, 0.004631996154785156, 0.005588531494140625, 0.006545066833496094, 0.0075016021728515625, 0.008458137512207031, 0.0094146728515625, 0.010371208190917969, 0.011327743530273438, 0.012284278869628906, 0.013240814208984375, 0.014197349548339844, 0.015153884887695312, 0.01611042022705078, 0.01706695556640625, 0.01802349090576172, 0.018980026245117188, 0.019936561584472656, 0.020893096923828125, 0.021849632263183594, 0.022806167602539062, 0.02376270294189453, 0.02471923828125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 9.0, 14.0, 51.0, 206.0, 455.0, 217.0, 32.0, 9.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.1172791719436646, -1.0975604057312012, -1.0778415203094482, -1.0581227540969849, -1.038403868675232, -1.0186851024627686, -0.9989662170410156, -0.9792473912239075, -0.9595285654067993, -0.9398097395896912, -0.920090913772583, -0.9003720879554749, -0.8806532621383667, -0.8609344363212585, -0.8412156105041504, -0.8214967846870422, -0.8017779588699341, -0.7820591330528259, -0.7623403072357178, -0.7426214814186096, -0.7229026556015015, -0.7031838297843933, -0.6834650039672852, -0.663746178150177, -0.6440274119377136, -0.6243085861206055, -0.6045897603034973, -0.5848709344863892, -0.565152108669281, -0.5454332828521729, -0.5257144570350647, -0.5059956312179565, -0.486276775598526, -0.46655794978141785, -0.4468391239643097, -0.42712029814720154, -0.4074014723300934, -0.38768264651298523, -0.36796385049819946, -0.3482450246810913, -0.32852619886398315, -0.308807373046875, -0.28908854722976685, -0.2693697214126587, -0.24965089559555054, -0.22993206977844238, -0.21021325886249542, -0.19049443304538727, -0.17077559232711792, -0.15105676651000977, -0.1313379406929016, -0.11161912232637405, -0.0919002965092659, -0.07218147069215775, -0.05246265232563019, -0.032743826508522034, -0.01302500069141388, 0.006693823263049126, 0.02641264721751213, 0.04613146930932999, 0.06585029512643814, 0.0855691209435463, 0.10528793931007385, 0.125006765127182, 0.14472559094429016]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 7.0, 11.0, 11.0, 18.0, 18.0, 16.0, 23.0, 23.0, 27.0, 31.0, 38.0, 39.0, 51.0, 58.0, 51.0, 58.0, 46.0, 49.0, 45.0, 36.0, 46.0, 40.0, 42.0, 44.0, 15.0, 17.0, 20.0, 15.0, 18.0, 17.0, 18.0, 10.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12390303611755371, -0.11959967762231827, -0.11529632657766342, -0.11099296808242798, -0.10668961703777313, -0.10238625854253769, -0.09808290004730225, -0.0937795490026474, -0.08947619050741196, -0.08517283201217651, -0.08086948096752167, -0.07656612247228622, -0.07226276397705078, -0.06795941293239594, -0.06365605443716049, -0.05935269966721535, -0.0550493448972702, -0.05074599012732506, -0.04644263535737991, -0.04213927686214447, -0.037835922092199326, -0.03353256732225418, -0.029229210689663887, -0.024925854057073593, -0.02062249928712845, -0.016319144517183304, -0.01201578788459301, -0.007712432183325291, -0.0034090764820575714, 0.0008942782878875732, 0.005197634920477867, 0.009500991553068161, 0.013804346323013306, 0.01810770109295845, 0.022411057725548744, 0.026714414358139038, 0.031017769128084183, 0.03532112389802933, 0.03962448239326477, 0.043927837163209915, 0.04823119193315506, 0.052534546703100204, 0.05683790147304535, 0.06114125996828079, 0.06544461846351624, 0.06974796950817108, 0.07405132800340652, 0.07835468649864197, 0.08265803754329681, 0.08696139603853226, 0.0912647470831871, 0.09556810557842255, 0.09987145662307739, 0.10417481511831284, 0.10847817361354828, 0.11278152465820312, 0.11708488315343857, 0.12138824164867401, 0.12569159269332886, 0.1299949437379837, 0.13429830968379974, 0.1386016607284546, 0.14290501177310944, 0.14720837771892548, 0.15151172876358032]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 30.0, 97.0, 315.0, 3732431.0, 461009.0, 299.0, 81.0, 22.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09100341796875, -0.07580280303955078, -0.06060218811035156, -0.045401573181152344, -0.030200958251953125, -0.015000343322753906, 0.0002002716064453125, 0.015400886535644531, 0.03060150146484375, 0.04580211639404297, 0.06100273132324219, 0.0762033462524414, 0.09140396118164062, 0.10660457611083984, 0.12180519104003906, 0.13700580596923828, 0.1522064208984375, 0.16740703582763672, 0.18260765075683594, 0.19780826568603516, 0.21300888061523438, 0.2282094955444336, 0.2434101104736328, 0.25861072540283203, 0.27381134033203125, 0.28901195526123047, 0.3042125701904297, 0.3194131851196289, 0.3346138000488281, 0.34981441497802734, 0.36501502990722656, 0.3802156448364258, 0.395416259765625, 0.4106168746948242, 0.42581748962402344, 0.44101810455322266, 0.4562187194824219, 0.4714193344116211, 0.4866199493408203, 0.5018205642700195, 0.5170211791992188, 0.532221794128418, 0.5474224090576172, 0.5626230239868164, 0.5778236389160156, 0.5930242538452148, 0.6082248687744141, 0.6234254837036133, 0.6386260986328125, 0.6538267135620117, 0.6690273284912109, 0.6842279434204102, 0.6994285583496094, 0.7146291732788086, 0.7298297882080078, 0.745030403137207, 0.7602310180664062, 0.7754316329956055, 0.7906322479248047, 0.8058328628540039, 0.8210334777832031, 0.8362340927124023, 0.8514347076416016, 0.8666353225708008, 0.8818359375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 8.0, 5.0, 13.0, 14.0, 16.0, 33.0, 39.0, 54.0, 57.0, 74.0, 68.0, 63.0, 67.0, 91.0, 78.0, 71.0, 40.0, 44.0, 39.0, 27.0, 25.0, 27.0, 14.0, 12.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01158905029296875, -0.0111846923828125, -0.01078033447265625, -0.0103759765625, -0.00997161865234375, -0.0095672607421875, -0.00916290283203125, -0.008758544921875, -0.00835418701171875, -0.0079498291015625, -0.00754547119140625, -0.00714111328125, -0.00673675537109375, -0.0063323974609375, -0.00592803955078125, -0.005523681640625, -0.00511932373046875, -0.0047149658203125, -0.00431060791015625, -0.00390625, -0.00350189208984375, -0.0030975341796875, -0.00269317626953125, -0.002288818359375, -0.00188446044921875, -0.0014801025390625, -0.00107574462890625, -0.00067138671875, -0.00026702880859375, 0.0001373291015625, 0.00054168701171875, 0.000946044921875, 0.00135040283203125, 0.0017547607421875, 0.00215911865234375, 0.0025634765625, 0.00296783447265625, 0.0033721923828125, 0.00377655029296875, 0.004180908203125, 0.00458526611328125, 0.0049896240234375, 0.00539398193359375, 0.00579833984375, 0.00620269775390625, 0.0066070556640625, 0.00701141357421875, 0.007415771484375, 0.00782012939453125, 0.0082244873046875, 0.00862884521484375, 0.009033203125, 0.00943756103515625, 0.0098419189453125, 0.01024627685546875, 0.010650634765625, 0.01105499267578125, 0.0114593505859375, 0.01186370849609375, 0.01226806640625, 0.01267242431640625, 0.0130767822265625, 0.01348114013671875, 0.013885498046875, 0.01428985595703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 14.0, 21.0, 39.0, 75.0, 120.0, 288.0, 993.0, 10205.0, 3995052.0, 182189.0, 4138.0, 726.0, 217.0, 114.0, 48.0, 20.0, 10.0, 7.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07452392578125, -0.07238340377807617, -0.07024288177490234, -0.06810235977172852, -0.06596183776855469, -0.06382131576538086, -0.06168079376220703, -0.0595402717590332, -0.057399749755859375, -0.05525922775268555, -0.05311870574951172, -0.05097818374633789, -0.04883766174316406, -0.046697139739990234, -0.044556617736816406, -0.04241609573364258, -0.04027557373046875, -0.03813505172729492, -0.035994529724121094, -0.033854007720947266, -0.03171348571777344, -0.02957296371459961, -0.02743244171142578, -0.025291919708251953, -0.023151397705078125, -0.021010875701904297, -0.01887035369873047, -0.01672983169555664, -0.014589309692382812, -0.012448787689208984, -0.010308265686035156, -0.008167743682861328, -0.0060272216796875, -0.003886699676513672, -0.0017461776733398438, 0.0003943443298339844, 0.0025348663330078125, 0.004675388336181641, 0.006815910339355469, 0.008956432342529297, 0.011096954345703125, 0.013237476348876953, 0.015377998352050781, 0.01751852035522461, 0.019659042358398438, 0.021799564361572266, 0.023940086364746094, 0.026080608367919922, 0.02822113037109375, 0.030361652374267578, 0.032502174377441406, 0.034642696380615234, 0.03678321838378906, 0.03892374038696289, 0.04106426239013672, 0.04320478439331055, 0.045345306396484375, 0.0474858283996582, 0.04962635040283203, 0.05176687240600586, 0.05390739440917969, 0.056047916412353516, 0.058188438415527344, 0.06032896041870117, 0.062469482421875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 14.0, 26.0, 50.0, 126.0, 602.0, 2282.0, 687.0, 158.0, 59.0, 28.0, 9.0, 12.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047454833984375, -0.04615640640258789, -0.04485797882080078, -0.04355955123901367, -0.04226112365722656, -0.04096269607543945, -0.039664268493652344, -0.038365840911865234, -0.037067413330078125, -0.035768985748291016, -0.034470558166503906, -0.0331721305847168, -0.03187370300292969, -0.030575275421142578, -0.02927684783935547, -0.02797842025756836, -0.02667999267578125, -0.02538156509399414, -0.02408313751220703, -0.022784709930419922, -0.021486282348632812, -0.020187854766845703, -0.018889427185058594, -0.017590999603271484, -0.016292572021484375, -0.014994144439697266, -0.013695716857910156, -0.012397289276123047, -0.011098861694335938, -0.009800434112548828, -0.008502006530761719, -0.007203578948974609, -0.0059051513671875, -0.004606723785400391, -0.0033082962036132812, -0.002009868621826172, -0.0007114410400390625, 0.0005869865417480469, 0.0018854141235351562, 0.0031838417053222656, 0.004482269287109375, 0.005780696868896484, 0.007079124450683594, 0.008377552032470703, 0.009675979614257812, 0.010974407196044922, 0.012272834777832031, 0.01357126235961914, 0.01486968994140625, 0.01616811752319336, 0.01746654510498047, 0.018764972686767578, 0.020063400268554688, 0.021361827850341797, 0.022660255432128906, 0.023958683013916016, 0.025257110595703125, 0.026555538177490234, 0.027853965759277344, 0.029152393341064453, 0.030450820922851562, 0.03174924850463867, 0.03304767608642578, 0.03434610366821289, 0.03564453125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 7.0, 31.0, 106.0, 325.0, 335.0, 119.0, 41.0, 13.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28381311893463135, -0.27367180585861206, -0.2635304927825928, -0.2533891499042511, -0.2432478368282318, -0.23310652375221252, -0.22296521067619324, -0.21282389760017395, -0.20268256962299347, -0.19254125654697418, -0.1823999285697937, -0.17225861549377441, -0.16211730241775513, -0.15197597444057465, -0.14183466136455536, -0.13169333338737488, -0.12155202031135559, -0.1114106997847557, -0.10126937925815582, -0.09112806618213654, -0.08098674565553665, -0.07084542512893677, -0.06070410832762718, -0.050562791526317596, -0.04042147099971771, -0.030280152335762978, -0.020138833671808243, -0.009997515007853508, 0.0001438036561012268, 0.01028512418270111, 0.020426440984010696, 0.030567757785320282, 0.040709108114242554, 0.05085042864084244, 0.06099174544215202, 0.07113306224346161, 0.08127438277006149, 0.09141570329666138, 0.10155701637268066, 0.11169833689928055, 0.12183965742588043, 0.13198097050189972, 0.1421222984790802, 0.1522636115550995, 0.16240492463111877, 0.17254625260829926, 0.18268756568431854, 0.19282889366149902, 0.2029702067375183, 0.2131115198135376, 0.22325284779071808, 0.23339416086673737, 0.24353548884391785, 0.25367680191993713, 0.2638181149959564, 0.2739594280719757, 0.2841007709503174, 0.29424208402633667, 0.30438339710235596, 0.31452473998069763, 0.3246660530567169, 0.3348073661327362, 0.3449486792087555, 0.3550899922847748, 0.36523130536079407]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 8.0, 4.0, 12.0, 23.0, 25.0, 36.0, 41.0, 61.0, 47.0, 55.0, 67.0, 76.0, 66.0, 73.0, 75.0, 63.0, 52.0, 48.0, 39.0, 33.0, 27.0, 18.0, 18.0, 14.0, 8.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.13489288091659546, -0.13153484463691711, -0.12817679345607758, -0.12481874972581863, -0.12146070599555969, -0.11810266226530075, -0.11474461853504181, -0.11138657480478287, -0.10802853107452393, -0.10467048734426498, -0.10131244361400604, -0.0979543998837471, -0.09459635615348816, -0.09123831242322922, -0.08788026869297028, -0.08452222496271133, -0.08116418123245239, -0.07780613750219345, -0.07444809377193451, -0.07109005004167557, -0.06773200631141663, -0.06437396258115768, -0.06101591885089874, -0.0576578751206398, -0.05429983139038086, -0.05094178766012192, -0.047583743929862976, -0.044225700199604034, -0.04086765646934509, -0.03750961273908615, -0.03415156900882721, -0.030793525278568268, -0.027435481548309326, -0.024077437818050385, -0.020719394087791443, -0.0173613503575325, -0.01400330662727356, -0.010645262897014618, -0.007287219166755676, -0.003929175436496735, -0.000571131706237793, 0.0027869120240211487, 0.00614495575428009, 0.009502999484539032, 0.012861043214797974, 0.016219086945056915, 0.019577130675315857, 0.0229351744055748, 0.02629321813583374, 0.029651261866092682, 0.033009305596351624, 0.036367349326610565, 0.03972539305686951, 0.04308343678712845, 0.04644148051738739, 0.04979952424764633, 0.05315756797790527, 0.056515611708164215, 0.05987365543842316, 0.0632316991686821, 0.06658974289894104, 0.06994778662919998, 0.07330583035945892, 0.07666387408971786, 0.0800219178199768]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 9.0, 16.0, 47.0, 113.0, 360.0, 1297.0, 5971.0, 38052.0, 374656.0, 556760.0, 60301.0, 8454.0, 1820.0, 451.0, 141.0, 56.0, 18.0, 12.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0295867919921875, -0.028453588485717773, -0.027320384979248047, -0.02618718147277832, -0.025053977966308594, -0.023920774459838867, -0.02278757095336914, -0.021654367446899414, -0.020521163940429688, -0.01938796043395996, -0.018254756927490234, -0.017121553421020508, -0.01598834991455078, -0.014855146408081055, -0.013721942901611328, -0.012588739395141602, -0.011455535888671875, -0.010322332382202148, -0.009189128875732422, -0.008055925369262695, -0.006922721862792969, -0.005789518356323242, -0.004656314849853516, -0.003523111343383789, -0.0023899078369140625, -0.001256704330444336, -0.00012350082397460938, 0.0010097026824951172, 0.0021429061889648438, 0.0032761096954345703, 0.004409313201904297, 0.0055425167083740234, 0.00667572021484375, 0.0078089237213134766, 0.008942127227783203, 0.01007533073425293, 0.011208534240722656, 0.012341737747192383, 0.01347494125366211, 0.014608144760131836, 0.015741348266601562, 0.01687455177307129, 0.018007755279541016, 0.019140958786010742, 0.02027416229248047, 0.021407365798950195, 0.022540569305419922, 0.02367377281188965, 0.024806976318359375, 0.0259401798248291, 0.027073383331298828, 0.028206586837768555, 0.02933979034423828, 0.030472993850708008, 0.031606197357177734, 0.03273940086364746, 0.03387260437011719, 0.035005807876586914, 0.03613901138305664, 0.03727221488952637, 0.038405418395996094, 0.03953862190246582, 0.04067182540893555, 0.04180502891540527, 0.042938232421875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 10.0, 6.0, 3.0, 2.0, 7.0, 10.0, 14.0, 19.0, 33.0, 28.0, 36.0, 47.0, 60.0, 51.0, 56.0, 53.0, 65.0, 71.0, 76.0, 43.0, 51.0, 46.0, 43.0, 47.0, 30.0, 16.0, 24.0, 19.0, 13.0, 10.0, 5.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01038360595703125, -0.010024189949035645, -0.009664773941040039, -0.009305357933044434, -0.008945941925048828, -0.008586525917053223, -0.008227109909057617, -0.007867693901062012, -0.007508277893066406, -0.007148861885070801, -0.006789445877075195, -0.00643002986907959, -0.006070613861083984, -0.005711197853088379, -0.0053517818450927734, -0.004992365837097168, -0.0046329498291015625, -0.004273533821105957, -0.0039141178131103516, -0.003554701805114746, -0.0031952857971191406, -0.002835869789123535, -0.0024764537811279297, -0.0021170377731323242, -0.0017576217651367188, -0.0013982057571411133, -0.0010387897491455078, -0.0006793737411499023, -0.0003199577331542969, 3.9458274841308594e-05, 0.00039887428283691406, 0.0007582902908325195, 0.001117706298828125, 0.0014771223068237305, 0.001836538314819336, 0.0021959543228149414, 0.002555370330810547, 0.0029147863388061523, 0.003274202346801758, 0.0036336183547973633, 0.003993034362792969, 0.004352450370788574, 0.00471186637878418, 0.005071282386779785, 0.005430698394775391, 0.005790114402770996, 0.0061495304107666016, 0.006508946418762207, 0.0068683624267578125, 0.007227778434753418, 0.0075871944427490234, 0.007946610450744629, 0.008306026458740234, 0.00866544246673584, 0.009024858474731445, 0.00938427448272705, 0.009743690490722656, 0.010103106498718262, 0.010462522506713867, 0.010821938514709473, 0.011181354522705078, 0.011540770530700684, 0.011900186538696289, 0.012259602546691895, 0.0126190185546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 8.0, 2.0, 7.0, 9.0, 11.0, 17.0, 23.0, 25.0, 47.0, 57.0, 77.0, 111.0, 159.0, 260.0, 429.0, 681.0, 1369.0, 2992.0, 8699.0, 37126.0, 223505.0, 622363.0, 118215.0, 21723.0, 5794.0, 2150.0, 1037.0, 618.0, 360.0, 228.0, 134.0, 94.0, 59.0, 47.0, 28.0, 18.0, 14.0, 14.0, 15.0, 4.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0235595703125, -0.022807598114013672, -0.022055625915527344, -0.021303653717041016, -0.020551681518554688, -0.01979970932006836, -0.01904773712158203, -0.018295764923095703, -0.017543792724609375, -0.016791820526123047, -0.01603984832763672, -0.01528787612915039, -0.014535903930664062, -0.013783931732177734, -0.013031959533691406, -0.012279987335205078, -0.01152801513671875, -0.010776042938232422, -0.010024070739746094, -0.009272098541259766, -0.008520126342773438, -0.007768154144287109, -0.007016181945800781, -0.006264209747314453, -0.005512237548828125, -0.004760265350341797, -0.004008293151855469, -0.0032563209533691406, -0.0025043487548828125, -0.0017523765563964844, -0.0010004043579101562, -0.0002484321594238281, 0.0005035400390625, 0.0012555122375488281, 0.0020074844360351562, 0.0027594566345214844, 0.0035114288330078125, 0.004263401031494141, 0.005015373229980469, 0.005767345428466797, 0.006519317626953125, 0.007271289825439453, 0.008023262023925781, 0.00877523422241211, 0.009527206420898438, 0.010279178619384766, 0.011031150817871094, 0.011783123016357422, 0.01253509521484375, 0.013287067413330078, 0.014039039611816406, 0.014791011810302734, 0.015542984008789062, 0.01629495620727539, 0.01704692840576172, 0.017798900604248047, 0.018550872802734375, 0.019302845001220703, 0.02005481719970703, 0.02080678939819336, 0.021558761596679688, 0.022310733795166016, 0.023062705993652344, 0.023814678192138672, 0.024566650390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 7.0, 7.0, 11.0, 11.0, 15.0, 18.0, 10.0, 28.0, 44.0, 25.0, 38.0, 42.0, 41.0, 49.0, 53.0, 66.0, 53.0, 68.0, 57.0, 59.0, 47.0, 42.0, 31.0, 31.0, 36.0, 23.0, 26.0, 12.0, 18.0, 9.0, 15.0, 5.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036529541015625, -0.035308837890625, -0.034088134765625, -0.032867431640625, -0.031646728515625, -0.030426025390625, -0.029205322265625, -0.027984619140625, -0.026763916015625, -0.025543212890625, -0.024322509765625, -0.023101806640625, -0.021881103515625, -0.020660400390625, -0.019439697265625, -0.018218994140625, -0.016998291015625, -0.015777587890625, -0.014556884765625, -0.013336181640625, -0.012115478515625, -0.010894775390625, -0.009674072265625, -0.008453369140625, -0.007232666015625, -0.006011962890625, -0.004791259765625, -0.003570556640625, -0.002349853515625, -0.001129150390625, 9.1552734375e-05, 0.001312255859375, 0.002532958984375, 0.003753662109375, 0.004974365234375, 0.006195068359375, 0.007415771484375, 0.008636474609375, 0.009857177734375, 0.011077880859375, 0.012298583984375, 0.013519287109375, 0.014739990234375, 0.015960693359375, 0.017181396484375, 0.018402099609375, 0.019622802734375, 0.020843505859375, 0.022064208984375, 0.023284912109375, 0.024505615234375, 0.025726318359375, 0.026947021484375, 0.028167724609375, 0.029388427734375, 0.030609130859375, 0.031829833984375, 0.033050537109375, 0.034271240234375, 0.035491943359375, 0.036712646484375, 0.037933349609375, 0.039154052734375, 0.040374755859375, 0.041595458984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 13.0, 16.0, 35.0, 54.0, 115.0, 285.0, 1018.0, 9019.0, 1021959.0, 14256.0, 1198.0, 315.0, 125.0, 63.0, 35.0, 15.0, 16.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07177734375, -0.0694284439086914, -0.06707954406738281, -0.06473064422607422, -0.062381744384765625, -0.06003284454345703, -0.05768394470214844, -0.055335044860839844, -0.05298614501953125, -0.050637245178222656, -0.04828834533691406, -0.04593944549560547, -0.043590545654296875, -0.04124164581298828, -0.03889274597167969, -0.036543846130371094, -0.0341949462890625, -0.031846046447753906, -0.029497146606445312, -0.02714824676513672, -0.024799346923828125, -0.02245044708251953, -0.020101547241210938, -0.017752647399902344, -0.01540374755859375, -0.013054847717285156, -0.010705947875976562, -0.008357048034667969, -0.006008148193359375, -0.0036592483520507812, -0.0013103485107421875, 0.0010385513305664062, 0.003387451171875, 0.005736351013183594, 0.008085250854492188, 0.010434150695800781, 0.012783050537109375, 0.015131950378417969, 0.017480850219726562, 0.019829750061035156, 0.02217864990234375, 0.024527549743652344, 0.026876449584960938, 0.02922534942626953, 0.031574249267578125, 0.03392314910888672, 0.03627204895019531, 0.038620948791503906, 0.0409698486328125, 0.043318748474121094, 0.04566764831542969, 0.04801654815673828, 0.050365447998046875, 0.05271434783935547, 0.05506324768066406, 0.057412147521972656, 0.05976104736328125, 0.062109947204589844, 0.06445884704589844, 0.06680774688720703, 0.06915664672851562, 0.07150554656982422, 0.07385444641113281, 0.0762033462524414, 0.07855224609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 9.0, 9.0, 6.0, 16.0, 18.0, 31.0, 64.0, 90.0, 154.0, 187.0, 157.0, 102.0, 54.0, 31.0, 21.0, 16.0, 9.0, 7.0, 9.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.716085433959961e-05, -5.463138222694397e-05, -5.210191011428833e-05, -4.957243800163269e-05, -4.704296588897705e-05, -4.451349377632141e-05, -4.198402166366577e-05, -3.945454955101013e-05, -3.692507743835449e-05, -3.439560532569885e-05, -3.186613321304321e-05, -2.9336661100387573e-05, -2.6807188987731934e-05, -2.4277716875076294e-05, -2.1748244762420654e-05, -1.9218772649765015e-05, -1.6689300537109375e-05, -1.4159828424453735e-05, -1.1630356311798096e-05, -9.100884199142456e-06, -6.571412086486816e-06, -4.041939973831177e-06, -1.5124678611755371e-06, 1.0170042514801025e-06, 3.546476364135742e-06, 6.075948476791382e-06, 8.605420589447021e-06, 1.1134892702102661e-05, 1.36643648147583e-05, 1.619383692741394e-05, 1.872330904006958e-05, 2.125278115272522e-05, 2.378225326538086e-05, 2.63117253780365e-05, 2.884119749069214e-05, 3.137066960334778e-05, 3.390014171600342e-05, 3.642961382865906e-05, 3.89590859413147e-05, 4.148855805397034e-05, 4.4018030166625977e-05, 4.6547502279281616e-05, 4.9076974391937256e-05, 5.1606446504592896e-05, 5.4135918617248535e-05, 5.6665390729904175e-05, 5.9194862842559814e-05, 6.172433495521545e-05, 6.42538070678711e-05, 6.678327918052673e-05, 6.931275129318237e-05, 7.184222340583801e-05, 7.437169551849365e-05, 7.690116763114929e-05, 7.943063974380493e-05, 8.196011185646057e-05, 8.448958396911621e-05, 8.701905608177185e-05, 8.954852819442749e-05, 9.207800030708313e-05, 9.460747241973877e-05, 9.713694453239441e-05, 9.966641664505005e-05, 0.00010219588875770569, 0.00010472536087036133]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 6.0, 18.0, 20.0, 34.0, 64.0, 129.0, 240.0, 621.0, 2007.0, 10558.0, 610759.0, 411721.0, 9510.0, 1818.0, 557.0, 220.0, 105.0, 56.0, 41.0, 18.0, 13.0, 11.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04248046875, -0.04136180877685547, -0.04024314880371094, -0.039124488830566406, -0.038005828857421875, -0.036887168884277344, -0.03576850891113281, -0.03464984893798828, -0.03353118896484375, -0.03241252899169922, -0.03129386901855469, -0.030175209045410156, -0.029056549072265625, -0.027937889099121094, -0.026819229125976562, -0.02570056915283203, -0.0245819091796875, -0.02346324920654297, -0.022344589233398438, -0.021225929260253906, -0.020107269287109375, -0.018988609313964844, -0.017869949340820312, -0.01675128936767578, -0.01563262939453125, -0.014513969421386719, -0.013395309448242188, -0.012276649475097656, -0.011157989501953125, -0.010039329528808594, -0.008920669555664062, -0.007802009582519531, -0.006683349609375, -0.005564689636230469, -0.0044460296630859375, -0.0033273696899414062, -0.002208709716796875, -0.0010900497436523438, 2.86102294921875e-05, 0.0011472702026367188, 0.00226593017578125, 0.0033845901489257812, 0.0045032501220703125, 0.005621910095214844, 0.006740570068359375, 0.007859230041503906, 0.008977890014648438, 0.010096549987792969, 0.0112152099609375, 0.012333869934082031, 0.013452529907226562, 0.014571189880371094, 0.015689849853515625, 0.016808509826660156, 0.017927169799804688, 0.01904582977294922, 0.02016448974609375, 0.02128314971923828, 0.022401809692382812, 0.023520469665527344, 0.024639129638671875, 0.025757789611816406, 0.026876449584960938, 0.02799510955810547, 0.02911376953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 11.0, 18.0, 21.0, 35.0, 44.0, 67.0, 121.0, 142.0, 152.0, 120.0, 92.0, 54.0, 37.0, 23.0, 15.0, 9.0, 9.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0221099853515625, -0.021422863006591797, -0.020735740661621094, -0.02004861831665039, -0.019361495971679688, -0.018674373626708984, -0.01798725128173828, -0.017300128936767578, -0.016613006591796875, -0.015925884246826172, -0.015238761901855469, -0.014551639556884766, -0.013864517211914062, -0.01317739486694336, -0.012490272521972656, -0.011803150177001953, -0.01111602783203125, -0.010428905487060547, -0.009741783142089844, -0.00905466079711914, -0.008367538452148438, -0.007680416107177734, -0.006993293762207031, -0.006306171417236328, -0.005619049072265625, -0.004931926727294922, -0.004244804382324219, -0.0035576820373535156, -0.0028705596923828125, -0.0021834373474121094, -0.0014963150024414062, -0.0008091926574707031, -0.0001220703125, 0.0005650520324707031, 0.0012521743774414062, 0.0019392967224121094, 0.0026264190673828125, 0.0033135414123535156, 0.004000663757324219, 0.004687786102294922, 0.005374908447265625, 0.006062030792236328, 0.006749153137207031, 0.007436275482177734, 0.008123397827148438, 0.00881052017211914, 0.009497642517089844, 0.010184764862060547, 0.01087188720703125, 0.011559009552001953, 0.012246131896972656, 0.01293325424194336, 0.013620376586914062, 0.014307498931884766, 0.014994621276855469, 0.015681743621826172, 0.016368865966796875, 0.017055988311767578, 0.01774311065673828, 0.018430233001708984, 0.019117355346679688, 0.01980447769165039, 0.020491600036621094, 0.021178722381591797, 0.0218658447265625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 8.0, 27.0, 50.0, 226.0, 432.0, 192.0, 44.0, 11.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6043671369552612, -0.5868990421295166, -0.5694310069084167, -0.5519629120826721, -0.5344948768615723, -0.5170267820358276, -0.4995587170124054, -0.48209065198898315, -0.4646225869655609, -0.44715452194213867, -0.42968645691871643, -0.4122183918952942, -0.39475029706954956, -0.3772822618484497, -0.3598141670227051, -0.34234610199928284, -0.3248780369758606, -0.30740997195243835, -0.2899419069290161, -0.27247384190559387, -0.25500577688217163, -0.2375376969575882, -0.22006961703300476, -0.20260155200958252, -0.18513348698616028, -0.16766542196273804, -0.1501973569393158, -0.13272927701473236, -0.11526121199131012, -0.09779314696788788, -0.08032507449388504, -0.0628570020198822, -0.04538893699645996, -0.02792086824774742, -0.010452799499034882, 0.007015269249677658, 0.024483337998390198, 0.04195140302181244, 0.05941947549581528, 0.07688754796981812, 0.09435561299324036, 0.1118236780166626, 0.12929174304008484, 0.14675982296466827, 0.16422788798809052, 0.18169595301151276, 0.1991640329360962, 0.21663209795951843, 0.23410016298294067, 0.2515682280063629, 0.26903629302978516, 0.2865043580532074, 0.30397242307662964, 0.32144051790237427, 0.3389085829257965, 0.35637664794921875, 0.373844712972641, 0.39131277799606323, 0.4087808430194855, 0.4262489080429077, 0.44371700286865234, 0.4611850380897522, 0.4786531329154968, 0.49612119793891907, 0.5135892629623413]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 7.0, 10.0, 12.0, 27.0, 13.0, 26.0, 29.0, 45.0, 59.0, 39.0, 49.0, 63.0, 65.0, 84.0, 64.0, 65.0, 49.0, 51.0, 44.0, 37.0, 45.0, 28.0, 20.0, 21.0, 12.0, 10.0, 6.0, 9.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20341086387634277, -0.1973525434732437, -0.19129422307014465, -0.1852359175682068, -0.17917759716510773, -0.17311927676200867, -0.1670609712600708, -0.16100265085697174, -0.15494433045387268, -0.14888601005077362, -0.14282768964767456, -0.1367693841457367, -0.13071106374263763, -0.12465274333953857, -0.11859443038702011, -0.11253611743450165, -0.10647779703140259, -0.10041947662830353, -0.09436116367578506, -0.0883028507232666, -0.08224453032016754, -0.07618620991706848, -0.07012789696455002, -0.06406958401203156, -0.058011263608932495, -0.051952946931123734, -0.04589463025331497, -0.03983631357550621, -0.03377799689769745, -0.027719680219888687, -0.021661363542079926, -0.015603046864271164, -0.009544730186462402, -0.0034864135086536407, 0.002571903169155121, 0.008630219846963882, 0.014688536524772644, 0.020746853202581406, 0.026805169880390167, 0.03286348655819893, 0.03892180323600769, 0.04498011991381645, 0.051038436591625214, 0.057096753269433975, 0.06315506994724274, 0.0692133903503418, 0.07527170330286026, 0.08133001625537872, 0.08738833665847778, 0.09344665706157684, 0.0995049700140953, 0.10556328296661377, 0.11162160336971283, 0.11767992377281189, 0.12373823672533035, 0.12979654967784882, 0.13585487008094788, 0.14191319048404694, 0.147971510887146, 0.15402981638908386, 0.16008813679218292, 0.16614645719528198, 0.17220476269721985, 0.1782630831003189, 0.18432140350341797]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 5.0, 21.0, 32.0, 89.0, 251.0, 1931.0, 854319.0, 3334114.0, 3082.0, 308.0, 81.0, 31.0, 16.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0271148681640625, -0.024419546127319336, -0.021724224090576172, -0.019028902053833008, -0.016333580017089844, -0.01363825798034668, -0.010942935943603516, -0.008247613906860352, -0.0055522918701171875, -0.0028569698333740234, -0.00016164779663085938, 0.0025336742401123047, 0.005228996276855469, 0.007924318313598633, 0.010619640350341797, 0.013314962387084961, 0.016010284423828125, 0.01870560646057129, 0.021400928497314453, 0.024096250534057617, 0.02679157257080078, 0.029486894607543945, 0.03218221664428711, 0.03487753868103027, 0.03757286071777344, 0.0402681827545166, 0.042963504791259766, 0.04565882682800293, 0.048354148864746094, 0.05104947090148926, 0.05374479293823242, 0.056440114974975586, 0.05913543701171875, 0.061830759048461914, 0.06452608108520508, 0.06722140312194824, 0.0699167251586914, 0.07261204719543457, 0.07530736923217773, 0.0780026912689209, 0.08069801330566406, 0.08339333534240723, 0.08608865737915039, 0.08878397941589355, 0.09147930145263672, 0.09417462348937988, 0.09686994552612305, 0.09956526756286621, 0.10226058959960938, 0.10495591163635254, 0.1076512336730957, 0.11034655570983887, 0.11304187774658203, 0.1157371997833252, 0.11843252182006836, 0.12112784385681152, 0.12382316589355469, 0.12651848793029785, 0.12921380996704102, 0.13190913200378418, 0.13460445404052734, 0.1372997760772705, 0.13999509811401367, 0.14269042015075684, 0.1453857421875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 4.0, 10.0, 18.0, 20.0, 53.0, 53.0, 82.0, 107.0, 103.0, 131.0, 123.0, 80.0, 68.0, 56.0, 30.0, 18.0, 16.0, 13.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.025299072265625, -0.024700641632080078, -0.024102210998535156, -0.023503780364990234, -0.022905349731445312, -0.02230691909790039, -0.02170848846435547, -0.021110057830810547, -0.020511627197265625, -0.019913196563720703, -0.01931476593017578, -0.01871633529663086, -0.018117904663085938, -0.017519474029541016, -0.016921043395996094, -0.016322612762451172, -0.01572418212890625, -0.015125751495361328, -0.014527320861816406, -0.013928890228271484, -0.013330459594726562, -0.01273202896118164, -0.012133598327636719, -0.011535167694091797, -0.010936737060546875, -0.010338306427001953, -0.009739875793457031, -0.00914144515991211, -0.008543014526367188, -0.007944583892822266, -0.007346153259277344, -0.006747722625732422, -0.0061492919921875, -0.005550861358642578, -0.004952430725097656, -0.004354000091552734, -0.0037555694580078125, -0.0031571388244628906, -0.0025587081909179688, -0.001960277557373047, -0.001361846923828125, -0.0007634162902832031, -0.00016498565673828125, 0.0004334449768066406, 0.0010318756103515625, 0.0016303062438964844, 0.0022287368774414062, 0.002827167510986328, 0.00342559814453125, 0.004024028778076172, 0.004622459411621094, 0.005220890045166016, 0.0058193206787109375, 0.006417751312255859, 0.007016181945800781, 0.007614612579345703, 0.008213043212890625, 0.008811473846435547, 0.009409904479980469, 0.01000833511352539, 0.010606765747070312, 0.011205196380615234, 0.011803627014160156, 0.012402057647705078, 0.01300048828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 10.0, 4.0, 4.0, 10.0, 10.0, 32.0, 29.0, 51.0, 75.0, 109.0, 172.0, 333.0, 783.0, 2320.0, 10972.0, 98863.0, 3742569.0, 306755.0, 23892.0, 4566.0, 1448.0, 551.0, 227.0, 164.0, 95.0, 71.0, 46.0, 33.0, 22.0, 15.0, 17.0, 7.0, 13.0, 5.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0285186767578125, -0.02752375602722168, -0.02652883529663086, -0.02553391456604004, -0.02453899383544922, -0.0235440731048584, -0.022549152374267578, -0.021554231643676758, -0.020559310913085938, -0.019564390182495117, -0.018569469451904297, -0.017574548721313477, -0.016579627990722656, -0.015584707260131836, -0.014589786529541016, -0.013594865798950195, -0.012599945068359375, -0.011605024337768555, -0.010610103607177734, -0.009615182876586914, -0.008620262145996094, -0.0076253414154052734, -0.006630420684814453, -0.005635499954223633, -0.0046405792236328125, -0.003645658493041992, -0.002650737762451172, -0.0016558170318603516, -0.0006608963012695312, 0.00033402442932128906, 0.0013289451599121094, 0.0023238658905029297, 0.00331878662109375, 0.00431370735168457, 0.005308628082275391, 0.006303548812866211, 0.007298469543457031, 0.008293390274047852, 0.009288311004638672, 0.010283231735229492, 0.011278152465820312, 0.012273073196411133, 0.013267993927001953, 0.014262914657592773, 0.015257835388183594, 0.016252756118774414, 0.017247676849365234, 0.018242597579956055, 0.019237518310546875, 0.020232439041137695, 0.021227359771728516, 0.022222280502319336, 0.023217201232910156, 0.024212121963500977, 0.025207042694091797, 0.026201963424682617, 0.027196884155273438, 0.028191804885864258, 0.029186725616455078, 0.0301816463470459, 0.03117656707763672, 0.03217148780822754, 0.03316640853881836, 0.03416132926940918, 0.03515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 9.0, 10.0, 8.0, 13.0, 21.0, 31.0, 43.0, 87.0, 171.0, 322.0, 747.0, 1140.0, 723.0, 310.0, 157.0, 70.0, 64.0, 36.0, 24.0, 22.0, 12.0, 11.0, 14.0, 8.0, 6.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0191497802734375, -0.01833367347717285, -0.017517566680908203, -0.016701459884643555, -0.015885353088378906, -0.015069246292114258, -0.01425313949584961, -0.013437032699584961, -0.012620925903320312, -0.011804819107055664, -0.010988712310791016, -0.010172605514526367, -0.009356498718261719, -0.00854039192199707, -0.007724285125732422, -0.0069081783294677734, -0.006092071533203125, -0.0052759647369384766, -0.004459857940673828, -0.0036437511444091797, -0.0028276443481445312, -0.002011537551879883, -0.0011954307556152344, -0.00037932395935058594, 0.0004367828369140625, 0.001252889633178711, 0.0020689964294433594, 0.002885103225708008, 0.0037012100219726562, 0.004517316818237305, 0.005333423614501953, 0.0061495304107666016, 0.00696563720703125, 0.0077817440032958984, 0.008597850799560547, 0.009413957595825195, 0.010230064392089844, 0.011046171188354492, 0.01186227798461914, 0.012678384780883789, 0.013494491577148438, 0.014310598373413086, 0.015126705169677734, 0.015942811965942383, 0.01675891876220703, 0.01757502555847168, 0.018391132354736328, 0.019207239151000977, 0.020023345947265625, 0.020839452743530273, 0.021655559539794922, 0.02247166633605957, 0.02328777313232422, 0.024103879928588867, 0.024919986724853516, 0.025736093521118164, 0.026552200317382812, 0.02736830711364746, 0.02818441390991211, 0.029000520706176758, 0.029816627502441406, 0.030632734298706055, 0.0314488410949707, 0.03226494789123535, 0.0330810546875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 16.0, 27.0, 59.0, 154.0, 244.0, 269.0, 116.0, 54.0, 20.0, 15.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38885754346847534, -0.377643883228302, -0.3664301931858063, -0.35521653294563293, -0.3440028429031372, -0.33278918266296387, -0.32157549262046814, -0.3103618323802948, -0.2991481423377991, -0.28793448209762573, -0.27672079205513, -0.26550713181495667, -0.25429344177246094, -0.2430797666311264, -0.23186609148979187, -0.22065243124961853, -0.209438756108284, -0.19822508096694946, -0.18701140582561493, -0.1757977306842804, -0.16458405554294586, -0.15337038040161133, -0.142156720161438, -0.13094303011894226, -0.11972936242818832, -0.10851568728685379, -0.09730201214551926, -0.08608834445476532, -0.07487466931343079, -0.06366099417209625, -0.05244731903076172, -0.041233643889427185, -0.03001996874809265, -0.018806293606758118, -0.007592620328068733, 0.0036210529506206512, 0.014834728091955185, 0.02604840323328972, 0.037262074649333954, 0.04847574979066849, 0.05968942493200302, 0.07090310007333755, 0.08211677521467209, 0.09333044290542603, 0.10454411804676056, 0.11575779318809509, 0.12697146832942963, 0.13818514347076416, 0.1493988186120987, 0.16061249375343323, 0.17182616889476776, 0.1830398440361023, 0.19425351917743683, 0.20546719431877136, 0.2166808545589447, 0.22789454460144043, 0.23910820484161377, 0.2503218650817871, 0.26153555512428284, 0.2727492153644562, 0.2839629054069519, 0.29517656564712524, 0.30639025568962097, 0.3176039159297943, 0.32881760597229004]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 10.0, 11.0, 16.0, 9.0, 32.0, 32.0, 29.0, 42.0, 46.0, 56.0, 62.0, 74.0, 65.0, 69.0, 63.0, 59.0, 61.0, 49.0, 39.0, 34.0, 31.0, 23.0, 26.0, 19.0, 11.0, 7.0, 9.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0763278603553772, -0.07244311273097992, -0.06855837255716324, -0.06467363238334656, -0.06078888475894928, -0.0569041408598423, -0.05301939696073532, -0.04913465306162834, -0.04524990916252136, -0.04136516526341438, -0.037480421364307404, -0.033595677465200424, -0.029710933566093445, -0.025826189666986465, -0.021941445767879486, -0.018056701868772507, -0.014171957969665527, -0.010287214070558548, -0.006402470171451569, -0.0025177262723445892, 0.0013670176267623901, 0.0052517615258693695, 0.009136505424976349, 0.013021249324083328, 0.016905993223190308, 0.020790737122297287, 0.024675481021404266, 0.028560224920511246, 0.032444968819618225, 0.036329712718725204, 0.040214456617832184, 0.04409920051693916, 0.04798394441604614, 0.05186868831515312, 0.0557534322142601, 0.05963817611336708, 0.06352292001247406, 0.06740766763687134, 0.07129240781068802, 0.0751771479845047, 0.07906189560890198, 0.08294664323329926, 0.08683138340711594, 0.09071612358093262, 0.0946008712053299, 0.09848561882972717, 0.10237035900354385, 0.10625509917736053, 0.11013984680175781, 0.11402459442615509, 0.11790933459997177, 0.12179407477378845, 0.12567882239818573, 0.129563570022583, 0.1334483027458191, 0.13733305037021637, 0.14121779799461365, 0.14510254561901093, 0.1489872932434082, 0.1528720259666443, 0.15675677359104156, 0.16064152121543884, 0.16452625393867493, 0.1684110015630722, 0.17229574918746948]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 7.0, 9.0, 12.0, 21.0, 39.0, 51.0, 81.0, 138.0, 295.0, 477.0, 818.0, 1563.0, 3449.0, 7411.0, 18769.0, 49220.0, 133941.0, 315071.0, 308639.0, 129113.0, 47218.0, 18033.0, 7430.0, 3299.0, 1541.0, 828.0, 488.0, 238.0, 131.0, 69.0, 49.0, 39.0, 29.0, 8.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01456451416015625, -0.014078736305236816, -0.013592958450317383, -0.01310718059539795, -0.012621402740478516, -0.012135624885559082, -0.011649847030639648, -0.011164069175720215, -0.010678291320800781, -0.010192513465881348, -0.009706735610961914, -0.00922095775604248, -0.008735179901123047, -0.008249402046203613, -0.00776362419128418, -0.007277846336364746, -0.0067920684814453125, -0.006306290626525879, -0.005820512771606445, -0.005334734916687012, -0.004848957061767578, -0.0043631792068481445, -0.003877401351928711, -0.0033916234970092773, -0.0029058456420898438, -0.00242006778717041, -0.0019342899322509766, -0.001448512077331543, -0.0009627342224121094, -0.0004769563674926758, 8.821487426757812e-06, 0.0004945993423461914, 0.000980377197265625, 0.0014661550521850586, 0.0019519329071044922, 0.0024377107620239258, 0.0029234886169433594, 0.003409266471862793, 0.0038950443267822266, 0.00438082218170166, 0.004866600036621094, 0.005352377891540527, 0.005838155746459961, 0.0063239336013793945, 0.006809711456298828, 0.007295489311218262, 0.007781267166137695, 0.008267045021057129, 0.008752822875976562, 0.009238600730895996, 0.00972437858581543, 0.010210156440734863, 0.010695934295654297, 0.01118171215057373, 0.011667490005493164, 0.012153267860412598, 0.012639045715332031, 0.013124823570251465, 0.013610601425170898, 0.014096379280090332, 0.014582157135009766, 0.0150679349899292, 0.015553712844848633, 0.016039490699768066, 0.0165252685546875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 11.0, 7.0, 15.0, 22.0, 20.0, 53.0, 44.0, 49.0, 54.0, 52.0, 82.0, 75.0, 66.0, 73.0, 71.0, 59.0, 57.0, 41.0, 34.0, 21.0, 19.0, 16.0, 14.0, 5.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01149749755859375, -0.011115193367004395, -0.010732889175415039, -0.010350584983825684, -0.009968280792236328, -0.009585976600646973, -0.009203672409057617, -0.008821368217468262, -0.008439064025878906, -0.00805675983428955, -0.007674455642700195, -0.00729215145111084, -0.006909847259521484, -0.006527543067932129, -0.0061452388763427734, -0.005762934684753418, -0.0053806304931640625, -0.004998326301574707, -0.0046160221099853516, -0.004233717918395996, -0.0038514137268066406, -0.003469109535217285, -0.0030868053436279297, -0.0027045011520385742, -0.0023221969604492188, -0.0019398927688598633, -0.0015575885772705078, -0.0011752843856811523, -0.0007929801940917969, -0.0004106760025024414, -2.8371810913085938e-05, 0.00035393238067626953, 0.000736236572265625, 0.0011185407638549805, 0.001500844955444336, 0.0018831491470336914, 0.002265453338623047, 0.0026477575302124023, 0.003030061721801758, 0.0034123659133911133, 0.0037946701049804688, 0.004176974296569824, 0.00455927848815918, 0.004941582679748535, 0.005323886871337891, 0.005706191062927246, 0.0060884952545166016, 0.006470799446105957, 0.0068531036376953125, 0.007235407829284668, 0.0076177120208740234, 0.008000016212463379, 0.008382320404052734, 0.00876462459564209, 0.009146928787231445, 0.0095292329788208, 0.009911537170410156, 0.010293841361999512, 0.010676145553588867, 0.011058449745178223, 0.011440753936767578, 0.011823058128356934, 0.012205362319946289, 0.012587666511535645, 0.012969970703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 3.0, 12.0, 21.0, 34.0, 49.0, 61.0, 75.0, 123.0, 200.0, 302.0, 420.0, 733.0, 1309.0, 2703.0, 8259.0, 47312.0, 572006.0, 364614.0, 37598.0, 7153.0, 2396.0, 1169.0, 660.0, 425.0, 282.0, 200.0, 135.0, 90.0, 48.0, 35.0, 32.0, 23.0, 13.0, 10.0, 14.0, 4.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029754638671875, -0.028689861297607422, -0.027625083923339844, -0.026560306549072266, -0.025495529174804688, -0.02443075180053711, -0.02336597442626953, -0.022301197052001953, -0.021236419677734375, -0.020171642303466797, -0.01910686492919922, -0.01804208755493164, -0.016977310180664062, -0.015912532806396484, -0.014847755432128906, -0.013782978057861328, -0.01271820068359375, -0.011653423309326172, -0.010588645935058594, -0.009523868560791016, -0.008459091186523438, -0.007394313812255859, -0.006329536437988281, -0.005264759063720703, -0.004199981689453125, -0.003135204315185547, -0.0020704269409179688, -0.0010056495666503906, 5.91278076171875e-05, 0.0011239051818847656, 0.0021886825561523438, 0.003253459930419922, 0.0043182373046875, 0.005383014678955078, 0.006447792053222656, 0.007512569427490234, 0.008577346801757812, 0.00964212417602539, 0.010706901550292969, 0.011771678924560547, 0.012836456298828125, 0.013901233673095703, 0.014966011047363281, 0.01603078842163086, 0.017095565795898438, 0.018160343170166016, 0.019225120544433594, 0.020289897918701172, 0.02135467529296875, 0.022419452667236328, 0.023484230041503906, 0.024549007415771484, 0.025613784790039062, 0.02667856216430664, 0.02774333953857422, 0.028808116912841797, 0.029872894287109375, 0.030937671661376953, 0.03200244903564453, 0.03306722640991211, 0.03413200378417969, 0.035196781158447266, 0.036261558532714844, 0.03732633590698242, 0.03839111328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 8.0, 1.0, 5.0, 9.0, 8.0, 11.0, 14.0, 12.0, 17.0, 25.0, 23.0, 35.0, 39.0, 38.0, 43.0, 50.0, 56.0, 43.0, 43.0, 56.0, 56.0, 40.0, 59.0, 45.0, 33.0, 43.0, 28.0, 36.0, 28.0, 15.0, 19.0, 18.0, 5.0, 15.0, 10.0, 4.0, 5.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034759521484375, -0.03357553482055664, -0.03239154815673828, -0.031207561492919922, -0.030023574829101562, -0.028839588165283203, -0.027655601501464844, -0.026471614837646484, -0.025287628173828125, -0.024103641510009766, -0.022919654846191406, -0.021735668182373047, -0.020551681518554688, -0.019367694854736328, -0.01818370819091797, -0.01699972152709961, -0.01581573486328125, -0.01463174819946289, -0.013447761535644531, -0.012263774871826172, -0.011079788208007812, -0.009895801544189453, -0.008711814880371094, -0.007527828216552734, -0.006343841552734375, -0.005159854888916016, -0.003975868225097656, -0.002791881561279297, -0.0016078948974609375, -0.0004239082336425781, 0.0007600784301757812, 0.0019440650939941406, 0.0031280517578125, 0.004312038421630859, 0.005496025085449219, 0.006680011749267578, 0.007863998413085938, 0.009047985076904297, 0.010231971740722656, 0.011415958404541016, 0.012599945068359375, 0.013783931732177734, 0.014967918395996094, 0.016151905059814453, 0.017335891723632812, 0.018519878387451172, 0.01970386505126953, 0.02088785171508789, 0.02207183837890625, 0.02325582504272461, 0.02443981170654297, 0.025623798370361328, 0.026807785034179688, 0.027991771697998047, 0.029175758361816406, 0.030359745025634766, 0.031543731689453125, 0.032727718353271484, 0.033911705017089844, 0.0350956916809082, 0.03627967834472656, 0.03746366500854492, 0.03864765167236328, 0.03983163833618164, 0.041015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 4.0, 10.0, 25.0, 19.0, 41.0, 57.0, 77.0, 132.0, 200.0, 349.0, 534.0, 997.0, 2023.0, 4055.0, 9874.0, 32661.0, 809053.0, 155283.0, 19701.0, 6889.0, 3005.0, 1488.0, 845.0, 439.0, 288.0, 159.0, 123.0, 59.0, 61.0, 25.0, 18.0, 24.0, 8.0, 8.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029693603515625, -0.028760194778442383, -0.027826786041259766, -0.02689337730407715, -0.02595996856689453, -0.025026559829711914, -0.024093151092529297, -0.02315974235534668, -0.022226333618164062, -0.021292924880981445, -0.020359516143798828, -0.01942610740661621, -0.018492698669433594, -0.017559289932250977, -0.01662588119506836, -0.015692472457885742, -0.014759063720703125, -0.013825654983520508, -0.01289224624633789, -0.011958837509155273, -0.011025428771972656, -0.010092020034790039, -0.009158611297607422, -0.008225202560424805, -0.0072917938232421875, -0.00635838508605957, -0.005424976348876953, -0.004491567611694336, -0.0035581588745117188, -0.0026247501373291016, -0.0016913414001464844, -0.0007579326629638672, 0.00017547607421875, 0.0011088848114013672, 0.0020422935485839844, 0.0029757022857666016, 0.003909111022949219, 0.004842519760131836, 0.005775928497314453, 0.00670933723449707, 0.0076427459716796875, 0.008576154708862305, 0.009509563446044922, 0.010442972183227539, 0.011376380920410156, 0.012309789657592773, 0.01324319839477539, 0.014176607131958008, 0.015110015869140625, 0.016043424606323242, 0.01697683334350586, 0.017910242080688477, 0.018843650817871094, 0.01977705955505371, 0.020710468292236328, 0.021643877029418945, 0.022577285766601562, 0.02351069450378418, 0.024444103240966797, 0.025377511978149414, 0.02631092071533203, 0.02724432945251465, 0.028177738189697266, 0.029111146926879883, 0.0300445556640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 5.0, 1.0, 10.0, 5.0, 2.0, 9.0, 12.0, 12.0, 15.0, 25.0, 23.0, 19.0, 22.0, 26.0, 52.0, 48.0, 46.0, 82.0, 64.0, 66.0, 84.0, 59.0, 53.0, 39.0, 31.0, 30.0, 24.0, 11.0, 14.0, 18.0, 12.0, 11.0, 12.0, 8.0, 11.0, 6.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.731250762939453e-05, -3.618840128183365e-05, -3.5064294934272766e-05, -3.3940188586711884e-05, -3.2816082239151e-05, -3.169197589159012e-05, -3.0567869544029236e-05, -2.9443763196468353e-05, -2.831965684890747e-05, -2.7195550501346588e-05, -2.6071444153785706e-05, -2.4947337806224823e-05, -2.382323145866394e-05, -2.2699125111103058e-05, -2.1575018763542175e-05, -2.0450912415981293e-05, -1.932680606842041e-05, -1.8202699720859528e-05, -1.7078593373298645e-05, -1.5954487025737762e-05, -1.483038067817688e-05, -1.3706274330615997e-05, -1.2582167983055115e-05, -1.1458061635494232e-05, -1.033395528793335e-05, -9.209848940372467e-06, -8.085742592811584e-06, -6.961636245250702e-06, -5.837529897689819e-06, -4.713423550128937e-06, -3.589317202568054e-06, -2.4652108550071716e-06, -1.341104507446289e-06, -2.169981598854065e-07, 9.071081876754761e-07, 2.0312145352363586e-06, 3.155320882797241e-06, 4.279427230358124e-06, 5.403533577919006e-06, 6.527639925479889e-06, 7.651746273040771e-06, 8.775852620601654e-06, 9.899958968162537e-06, 1.102406531572342e-05, 1.2148171663284302e-05, 1.3272278010845184e-05, 1.4396384358406067e-05, 1.552049070596695e-05, 1.6644597053527832e-05, 1.7768703401088715e-05, 1.8892809748649597e-05, 2.001691609621048e-05, 2.1141022443771362e-05, 2.2265128791332245e-05, 2.3389235138893127e-05, 2.451334148645401e-05, 2.5637447834014893e-05, 2.6761554181575775e-05, 2.7885660529136658e-05, 2.900976687669754e-05, 3.0133873224258423e-05, 3.1257979571819305e-05, 3.238208591938019e-05, 3.350619226694107e-05, 3.463029861450195e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 8.0, 5.0, 3.0, 6.0, 7.0, 17.0, 37.0, 42.0, 68.0, 109.0, 142.0, 244.0, 435.0, 894.0, 1984.0, 4529.0, 12148.0, 43350.0, 878638.0, 78943.0, 16224.0, 5979.0, 2360.0, 1019.0, 540.0, 283.0, 188.0, 125.0, 74.0, 47.0, 31.0, 16.0, 16.0, 10.0, 11.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0281524658203125, -0.027202367782592773, -0.026252269744873047, -0.02530217170715332, -0.024352073669433594, -0.023401975631713867, -0.02245187759399414, -0.021501779556274414, -0.020551681518554688, -0.01960158348083496, -0.018651485443115234, -0.017701387405395508, -0.01675128936767578, -0.015801191329956055, -0.014851093292236328, -0.013900995254516602, -0.012950897216796875, -0.012000799179077148, -0.011050701141357422, -0.010100603103637695, -0.009150505065917969, -0.008200407028198242, -0.007250308990478516, -0.006300210952758789, -0.0053501129150390625, -0.004400014877319336, -0.0034499168395996094, -0.002499818801879883, -0.0015497207641601562, -0.0005996227264404297, 0.0003504753112792969, 0.0013005733489990234, 0.00225067138671875, 0.0032007694244384766, 0.004150867462158203, 0.00510096549987793, 0.006051063537597656, 0.007001161575317383, 0.00795125961303711, 0.008901357650756836, 0.009851455688476562, 0.010801553726196289, 0.011751651763916016, 0.012701749801635742, 0.013651847839355469, 0.014601945877075195, 0.015552043914794922, 0.01650214195251465, 0.017452239990234375, 0.0184023380279541, 0.019352436065673828, 0.020302534103393555, 0.02125263214111328, 0.022202730178833008, 0.023152828216552734, 0.02410292625427246, 0.025053024291992188, 0.026003122329711914, 0.02695322036743164, 0.027903318405151367, 0.028853416442871094, 0.02980351448059082, 0.030753612518310547, 0.03170371055603027, 0.03265380859375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 4.0, 5.0, 8.0, 3.0, 5.0, 7.0, 14.0, 12.0, 18.0, 22.0, 38.0, 84.0, 132.0, 143.0, 153.0, 100.0, 76.0, 38.0, 31.0, 24.0, 5.0, 10.0, 9.0, 13.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.02227783203125, -0.021637916564941406, -0.020998001098632812, -0.02035808563232422, -0.019718170166015625, -0.01907825469970703, -0.018438339233398438, -0.017798423767089844, -0.01715850830078125, -0.016518592834472656, -0.015878677368164062, -0.015238761901855469, -0.014598846435546875, -0.013958930969238281, -0.013319015502929688, -0.012679100036621094, -0.0120391845703125, -0.011399269104003906, -0.010759353637695312, -0.010119438171386719, -0.009479522705078125, -0.008839607238769531, -0.008199691772460938, -0.007559776306152344, -0.00691986083984375, -0.006279945373535156, -0.0056400299072265625, -0.005000114440917969, -0.004360198974609375, -0.0037202835083007812, -0.0030803680419921875, -0.0024404525756835938, -0.001800537109375, -0.0011606216430664062, -0.0005207061767578125, 0.00011920928955078125, 0.000759124755859375, 0.0013990402221679688, 0.0020389556884765625, 0.0026788711547851562, 0.00331878662109375, 0.003958702087402344, 0.0045986175537109375, 0.005238533020019531, 0.005878448486328125, 0.006518363952636719, 0.0071582794189453125, 0.007798194885253906, 0.0084381103515625, 0.009078025817871094, 0.009717941284179688, 0.010357856750488281, 0.010997772216796875, 0.011637687683105469, 0.012277603149414062, 0.012917518615722656, 0.01355743408203125, 0.014197349548339844, 0.014837265014648438, 0.015477180480957031, 0.016117095947265625, 0.01675701141357422, 0.017396926879882812, 0.018036842346191406, 0.0186767578125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 3.0, 13.0, 14.0, 33.0, 64.0, 106.0, 217.0, 250.0, 149.0, 79.0, 38.0, 14.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34992358088493347, -0.33544108271598816, -0.32095855474472046, -0.30647605657577515, -0.29199355840682983, -0.2775110602378845, -0.2630285620689392, -0.2485460340976715, -0.2340635359287262, -0.21958103775978088, -0.20509852468967438, -0.19061601161956787, -0.17613351345062256, -0.16165101528167725, -0.14716850221157074, -0.13268598914146423, -0.11820349097251892, -0.10372098535299301, -0.0892384797334671, -0.07475597411394119, -0.06027346849441528, -0.045790962874889374, -0.031308457255363464, -0.016825951635837555, -0.0023434460163116455, 0.012139059603214264, 0.026621565222740173, 0.04110407084226608, 0.05558657646179199, 0.0700690820813179, 0.08455158770084381, 0.09903409332036972, 0.11351662874221802, 0.12799912691116333, 0.14248163998126984, 0.15696415305137634, 0.17144665122032166, 0.18592914938926697, 0.20041166245937347, 0.21489417552947998, 0.2293766736984253, 0.2438591718673706, 0.2583416700363159, 0.2728241980075836, 0.28730669617652893, 0.30178919434547424, 0.31627172231674194, 0.33075422048568726, 0.34523671865463257, 0.3597192168235779, 0.3742017149925232, 0.3886842429637909, 0.4031667411327362, 0.4176492393016815, 0.4321317672729492, 0.44661426544189453, 0.46109676361083984, 0.47557926177978516, 0.49006175994873047, 0.5045442581176758, 0.5190267562866211, 0.5335093140602112, 0.5479918122291565, 0.5624743103981018, 0.5769568085670471]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 4.0, 6.0, 7.0, 7.0, 12.0, 5.0, 17.0, 9.0, 18.0, 25.0, 16.0, 24.0, 21.0, 24.0, 34.0, 30.0, 42.0, 49.0, 53.0, 72.0, 64.0, 55.0, 51.0, 37.0, 37.0, 33.0, 30.0, 28.0, 17.0, 27.0, 24.0, 25.0, 19.0, 18.0, 7.0, 11.0, 7.0, 10.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.1523405909538269, -0.14789266884326935, -0.1434447467327118, -0.13899683952331543, -0.13454891741275787, -0.13010099530220032, -0.12565307319164276, -0.1212051510810852, -0.11675723642110825, -0.11230931431055069, -0.10786139965057373, -0.10341347754001617, -0.09896555542945862, -0.09451764076948166, -0.0900697186589241, -0.08562180399894714, -0.08117388188838959, -0.07672595977783203, -0.07227804511785507, -0.06783012300729752, -0.06338220834732056, -0.058934286236763, -0.054486364126205444, -0.05003844574093819, -0.04559052735567093, -0.04114260897040367, -0.036694690585136414, -0.03224676847457886, -0.0277988500893116, -0.023350931704044342, -0.018903011456131935, -0.014455091208219528, -0.01000717282295227, -0.005559253506362438, -0.001111334189772606, 0.0033365851268172264, 0.007784504443407059, 0.012232422828674316, 0.016680343076586723, 0.02112826332449913, 0.025576181709766388, 0.030024100095033646, 0.0344720184803009, 0.03891994059085846, 0.04336785897612572, 0.047815777361392975, 0.05226369947195053, 0.05671161785721779, 0.061159536242485046, 0.0656074583530426, 0.07005537301301956, 0.07450329512357712, 0.07895120978355408, 0.08339913189411163, 0.08784705400466919, 0.09229497611522675, 0.0967428907752037, 0.10119081288576126, 0.10563872754573822, 0.11008664965629578, 0.11453457176685333, 0.11898248642683029, 0.12343040853738785, 0.1278783231973648, 0.13232624530792236]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 5.0, 7.0, 13.0, 9.0, 17.0, 23.0, 37.0, 49.0, 97.0, 157.0, 390.0, 923.0, 3225.0, 16037.0, 222408.0, 3701788.0, 226687.0, 17071.0, 3444.0, 1057.0, 369.0, 189.0, 85.0, 57.0, 28.0, 26.0, 16.0, 10.0, 8.0, 7.0, 9.0, 6.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028961181640625, -0.028011798858642578, -0.027062416076660156, -0.026113033294677734, -0.025163650512695312, -0.02421426773071289, -0.02326488494873047, -0.022315502166748047, -0.021366119384765625, -0.020416736602783203, -0.01946735382080078, -0.01851797103881836, -0.017568588256835938, -0.016619205474853516, -0.015669822692871094, -0.014720439910888672, -0.01377105712890625, -0.012821674346923828, -0.011872291564941406, -0.010922908782958984, -0.009973526000976562, -0.00902414321899414, -0.008074760437011719, -0.007125377655029297, -0.006175994873046875, -0.005226612091064453, -0.004277229309082031, -0.0033278465270996094, -0.0023784637451171875, -0.0014290809631347656, -0.00047969818115234375, 0.0004696846008300781, 0.0014190673828125, 0.002368450164794922, 0.0033178329467773438, 0.004267215728759766, 0.0052165985107421875, 0.006165981292724609, 0.007115364074707031, 0.008064746856689453, 0.009014129638671875, 0.009963512420654297, 0.010912895202636719, 0.01186227798461914, 0.012811660766601562, 0.013761043548583984, 0.014710426330566406, 0.015659809112548828, 0.01660919189453125, 0.017558574676513672, 0.018507957458496094, 0.019457340240478516, 0.020406723022460938, 0.02135610580444336, 0.02230548858642578, 0.023254871368408203, 0.024204254150390625, 0.025153636932373047, 0.02610301971435547, 0.02705240249633789, 0.028001785278320312, 0.028951168060302734, 0.029900550842285156, 0.030849933624267578, 0.03179931640625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 4.0, 6.0, 12.0, 7.0, 17.0, 17.0, 19.0, 17.0, 32.0, 41.0, 47.0, 40.0, 50.0, 49.0, 62.0, 78.0, 52.0, 58.0, 53.0, 44.0, 38.0, 56.0, 38.0, 30.0, 25.0, 22.0, 16.0, 20.0, 15.0, 9.0, 12.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.010162353515625, -0.009826183319091797, -0.009490013122558594, -0.00915384292602539, -0.008817672729492188, -0.008481502532958984, -0.008145332336425781, -0.007809162139892578, -0.007472991943359375, -0.007136821746826172, -0.006800651550292969, -0.006464481353759766, -0.0061283111572265625, -0.005792140960693359, -0.005455970764160156, -0.005119800567626953, -0.00478363037109375, -0.004447460174560547, -0.004111289978027344, -0.0037751197814941406, -0.0034389495849609375, -0.0031027793884277344, -0.0027666091918945312, -0.002430438995361328, -0.002094268798828125, -0.0017580986022949219, -0.0014219284057617188, -0.0010857582092285156, -0.0007495880126953125, -0.0004134178161621094, -7.724761962890625e-05, 0.0002589225769042969, 0.0005950927734375, 0.0009312629699707031, 0.0012674331665039062, 0.0016036033630371094, 0.0019397735595703125, 0.0022759437561035156, 0.0026121139526367188, 0.002948284149169922, 0.003284454345703125, 0.003620624542236328, 0.003956794738769531, 0.004292964935302734, 0.0046291351318359375, 0.004965305328369141, 0.005301475524902344, 0.005637645721435547, 0.00597381591796875, 0.006309986114501953, 0.006646156311035156, 0.006982326507568359, 0.0073184967041015625, 0.007654666900634766, 0.007990837097167969, 0.008327007293701172, 0.008663177490234375, 0.008999347686767578, 0.009335517883300781, 0.009671688079833984, 0.010007858276367188, 0.01034402847290039, 0.010680198669433594, 0.011016368865966797, 0.0113525390625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 7.0, 5.0, 5.0, 4.0, 4.0, 12.0, 14.0, 12.0, 19.0, 21.0, 24.0, 35.0, 47.0, 56.0, 74.0, 115.0, 179.0, 234.0, 394.0, 750.0, 1820.0, 7063.0, 72126.0, 3873252.0, 220439.0, 12747.0, 2381.0, 913.0, 454.0, 269.0, 162.0, 139.0, 105.0, 81.0, 71.0, 59.0, 40.0, 30.0, 24.0, 22.0, 20.0, 15.0, 12.0, 14.0, 4.0, 8.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.040985107421875, -0.03950309753417969, -0.038021087646484375, -0.03653907775878906, -0.03505706787109375, -0.03357505798339844, -0.032093048095703125, -0.030611038208007812, -0.0291290283203125, -0.027647018432617188, -0.026165008544921875, -0.024682998657226562, -0.02320098876953125, -0.021718978881835938, -0.020236968994140625, -0.018754959106445312, -0.01727294921875, -0.015790939331054688, -0.014308929443359375, -0.012826919555664062, -0.01134490966796875, -0.009862899780273438, -0.008380889892578125, -0.0068988800048828125, -0.0054168701171875, -0.0039348602294921875, -0.002452850341796875, -0.0009708404541015625, 0.00051116943359375, 0.0019931793212890625, 0.003475189208984375, 0.0049571990966796875, 0.006439208984375, 0.007921218872070312, 0.009403228759765625, 0.010885238647460938, 0.01236724853515625, 0.013849258422851562, 0.015331268310546875, 0.016813278198242188, 0.0182952880859375, 0.019777297973632812, 0.021259307861328125, 0.022741317749023438, 0.02422332763671875, 0.025705337524414062, 0.027187347412109375, 0.028669357299804688, 0.0301513671875, 0.03163337707519531, 0.033115386962890625, 0.03459739685058594, 0.03607940673828125, 0.03756141662597656, 0.039043426513671875, 0.04052543640136719, 0.0420074462890625, 0.04348945617675781, 0.044971466064453125, 0.04645347595214844, 0.04793548583984375, 0.04941749572753906, 0.050899505615234375, 0.05238151550292969, 0.053863525390625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 10.0, 18.0, 42.0, 57.0, 105.0, 191.0, 660.0, 1452.0, 947.0, 306.0, 119.0, 62.0, 33.0, 22.0, 13.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.041717529296875, -0.04035615921020508, -0.038994789123535156, -0.037633419036865234, -0.03627204895019531, -0.03491067886352539, -0.03354930877685547, -0.03218793869018555, -0.030826568603515625, -0.029465198516845703, -0.02810382843017578, -0.02674245834350586, -0.025381088256835938, -0.024019718170166016, -0.022658348083496094, -0.021296977996826172, -0.01993560791015625, -0.018574237823486328, -0.017212867736816406, -0.015851497650146484, -0.014490127563476562, -0.01312875747680664, -0.011767387390136719, -0.010406017303466797, -0.009044647216796875, -0.007683277130126953, -0.006321907043457031, -0.004960536956787109, -0.0035991668701171875, -0.0022377967834472656, -0.0008764266967773438, 0.0004849433898925781, 0.0018463134765625, 0.003207683563232422, 0.004569053649902344, 0.005930423736572266, 0.0072917938232421875, 0.00865316390991211, 0.010014533996582031, 0.011375904083251953, 0.012737274169921875, 0.014098644256591797, 0.015460014343261719, 0.01682138442993164, 0.018182754516601562, 0.019544124603271484, 0.020905494689941406, 0.022266864776611328, 0.02362823486328125, 0.024989604949951172, 0.026350975036621094, 0.027712345123291016, 0.029073715209960938, 0.03043508529663086, 0.03179645538330078, 0.0331578254699707, 0.034519195556640625, 0.03588056564331055, 0.03724193572998047, 0.03860330581665039, 0.03996467590332031, 0.041326045989990234, 0.042687416076660156, 0.04404878616333008, 0.04541015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 2.0, 3.0, 6.0, 1.0, 7.0, 12.0, 19.0, 49.0, 86.0, 143.0, 196.0, 186.0, 125.0, 58.0, 52.0, 20.0, 9.0, 11.0, 10.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26120105385780334, -0.2501150965690613, -0.2390291690826416, -0.22794322669506073, -0.21685728430747986, -0.205771341919899, -0.19468539953231812, -0.18359945714473724, -0.17251351475715637, -0.1614275723695755, -0.15034162998199463, -0.13925568759441376, -0.12816974520683289, -0.11708380281925201, -0.10599786043167114, -0.09491191804409027, -0.0838259756565094, -0.07274003326892853, -0.061654090881347656, -0.050568148493766785, -0.03948220610618591, -0.02839626371860504, -0.01731032133102417, -0.006224378943443298, 0.004861563444137573, 0.015947505831718445, 0.027033448219299316, 0.03811939060688019, 0.04920533299446106, 0.06029127538204193, 0.0713772177696228, 0.08246316015720367, 0.09354913234710693, 0.1046350747346878, 0.11572101712226868, 0.12680695950984955, 0.13789290189743042, 0.1489788442850113, 0.16006478667259216, 0.17115072906017303, 0.1822366714477539, 0.19332261383533478, 0.20440855622291565, 0.21549449861049652, 0.2265804409980774, 0.23766638338565826, 0.24875232577323914, 0.2598382830619812, 0.2709242105484009, 0.28201013803482056, 0.2930960953235626, 0.3041820526123047, 0.31526798009872437, 0.32635390758514404, 0.3374398648738861, 0.3485258221626282, 0.35961174964904785, 0.37069767713546753, 0.3817836344242096, 0.39286959171295166, 0.40395551919937134, 0.415041446685791, 0.4261274039745331, 0.43721336126327515, 0.4482992887496948]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 1.0, 11.0, 17.0, 18.0, 29.0, 32.0, 40.0, 79.0, 81.0, 103.0, 98.0, 79.0, 110.0, 62.0, 82.0, 42.0, 34.0, 32.0, 27.0, 10.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21377688646316528, -0.2059030681848526, -0.19802924990653992, -0.19015543162822723, -0.18228161334991455, -0.17440779507160187, -0.16653397679328918, -0.1586601436138153, -0.15078634023666382, -0.14291252195835114, -0.13503870368003845, -0.12716488540172577, -0.11929106712341309, -0.1114172488451004, -0.10354342311620712, -0.09566960483789444, -0.08779577910900116, -0.07992196083068848, -0.0720481425523758, -0.06417432427406311, -0.05630050227046013, -0.048426683992147446, -0.040552861988544464, -0.03267904371023178, -0.024805225431919098, -0.016931407153606415, -0.009057587012648582, -0.0011837668716907501, 0.006690051406621933, 0.014563869684934616, 0.022437691688537598, 0.03031150996685028, 0.038185328245162964, 0.04605914652347565, 0.05393296480178833, 0.06180678680539131, 0.0696806013584137, 0.07755441963672638, 0.08542824536561966, 0.09330206364393234, 0.10117588192224503, 0.10904970020055771, 0.11692351847887039, 0.12479734420776367, 0.13267116248607635, 0.14054498076438904, 0.14841879904270172, 0.1562926173210144, 0.1641664355993271, 0.17204025387763977, 0.17991407215595245, 0.18778789043426514, 0.19566170871257782, 0.2035355269908905, 0.21140936017036438, 0.21928316354751587, 0.22715699672698975, 0.23503081500530243, 0.2429046332836151, 0.250778466463089, 0.2586522698402405, 0.26652610301971436, 0.27439990639686584, 0.2822737395763397, 0.2901475429534912]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 8.0, 9.0, 18.0, 22.0, 28.0, 49.0, 66.0, 126.0, 195.0, 264.0, 479.0, 831.0, 1393.0, 2662.0, 5221.0, 11265.0, 26559.0, 66984.0, 179805.0, 368039.0, 234540.0, 88095.0, 34003.0, 14207.0, 6417.0, 3289.0, 1639.0, 898.0, 560.0, 349.0, 185.0, 112.0, 66.0, 58.0, 32.0, 20.0, 16.0, 11.0, 8.0, 6.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169677734375, -0.016375303268432617, -0.015782833099365234, -0.015190362930297852, -0.014597892761230469, -0.014005422592163086, -0.013412952423095703, -0.01282048225402832, -0.012228012084960938, -0.011635541915893555, -0.011043071746826172, -0.010450601577758789, -0.009858131408691406, -0.009265661239624023, -0.00867319107055664, -0.008080720901489258, -0.007488250732421875, -0.006895780563354492, -0.006303310394287109, -0.0057108402252197266, -0.005118370056152344, -0.004525899887084961, -0.003933429718017578, -0.0033409595489501953, -0.0027484893798828125, -0.0021560192108154297, -0.0015635490417480469, -0.0009710788726806641, -0.00037860870361328125, 0.00021386146545410156, 0.0008063316345214844, 0.0013988018035888672, 0.00199127197265625, 0.002583742141723633, 0.0031762123107910156, 0.0037686824798583984, 0.004361152648925781, 0.004953622817993164, 0.005546092987060547, 0.00613856315612793, 0.0067310333251953125, 0.007323503494262695, 0.007915973663330078, 0.008508443832397461, 0.009100914001464844, 0.009693384170532227, 0.01028585433959961, 0.010878324508666992, 0.011470794677734375, 0.012063264846801758, 0.01265573501586914, 0.013248205184936523, 0.013840675354003906, 0.014433145523071289, 0.015025615692138672, 0.015618085861206055, 0.016210556030273438, 0.01680302619934082, 0.017395496368408203, 0.017987966537475586, 0.01858043670654297, 0.01917290687561035, 0.019765377044677734, 0.020357847213745117, 0.0209503173828125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 10.0, 4.0, 11.0, 15.0, 13.0, 18.0, 20.0, 30.0, 23.0, 30.0, 32.0, 34.0, 40.0, 49.0, 59.0, 59.0, 49.0, 64.0, 45.0, 50.0, 39.0, 49.0, 32.0, 34.0, 25.0, 31.0, 31.0, 21.0, 16.0, 16.0, 11.0, 8.0, 6.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00959014892578125, -0.009249091148376465, -0.00890803337097168, -0.008566975593566895, -0.00822591781616211, -0.007884860038757324, -0.007543802261352539, -0.007202744483947754, -0.006861686706542969, -0.006520628929138184, -0.0061795711517333984, -0.005838513374328613, -0.005497455596923828, -0.005156397819519043, -0.004815340042114258, -0.004474282264709473, -0.0041332244873046875, -0.0037921667098999023, -0.003451108932495117, -0.003110051155090332, -0.002768993377685547, -0.0024279356002807617, -0.0020868778228759766, -0.0017458200454711914, -0.0014047622680664062, -0.001063704490661621, -0.0007226467132568359, -0.0003815889358520508, -4.0531158447265625e-05, 0.00030052661895751953, 0.0006415843963623047, 0.0009826421737670898, 0.001323699951171875, 0.0016647577285766602, 0.0020058155059814453, 0.0023468732833862305, 0.0026879310607910156, 0.0030289888381958008, 0.003370046615600586, 0.003711104393005371, 0.004052162170410156, 0.004393219947814941, 0.0047342777252197266, 0.005075335502624512, 0.005416393280029297, 0.005757451057434082, 0.006098508834838867, 0.006439566612243652, 0.0067806243896484375, 0.007121682167053223, 0.007462739944458008, 0.007803797721862793, 0.008144855499267578, 0.008485913276672363, 0.008826971054077148, 0.009168028831481934, 0.009509086608886719, 0.009850144386291504, 0.010191202163696289, 0.010532259941101074, 0.01087331771850586, 0.011214375495910645, 0.01155543327331543, 0.011896491050720215, 0.012237548828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 7.0, 3.0, 12.0, 12.0, 10.0, 16.0, 16.0, 40.0, 57.0, 77.0, 85.0, 177.0, 243.0, 361.0, 563.0, 979.0, 2043.0, 5293.0, 21134.0, 160722.0, 746464.0, 88120.0, 13964.0, 4103.0, 1682.0, 807.0, 536.0, 352.0, 199.0, 123.0, 88.0, 73.0, 46.0, 42.0, 30.0, 27.0, 12.0, 10.0, 11.0, 5.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.050445556640625, -0.04897785186767578, -0.04751014709472656, -0.046042442321777344, -0.044574737548828125, -0.043107032775878906, -0.04163932800292969, -0.04017162322998047, -0.03870391845703125, -0.03723621368408203, -0.03576850891113281, -0.034300804138183594, -0.032833099365234375, -0.031365394592285156, -0.029897689819335938, -0.02842998504638672, -0.0269622802734375, -0.02549457550048828, -0.024026870727539062, -0.022559165954589844, -0.021091461181640625, -0.019623756408691406, -0.018156051635742188, -0.01668834686279297, -0.01522064208984375, -0.013752937316894531, -0.012285232543945312, -0.010817527770996094, -0.009349822998046875, -0.007882118225097656, -0.0064144134521484375, -0.004946708679199219, -0.00347900390625, -0.0020112991333007812, -0.0005435943603515625, 0.0009241104125976562, 0.002391815185546875, 0.0038595199584960938, 0.0053272247314453125, 0.006794929504394531, 0.00826263427734375, 0.009730339050292969, 0.011198043823242188, 0.012665748596191406, 0.014133453369140625, 0.015601158142089844, 0.017068862915039062, 0.01853656768798828, 0.0200042724609375, 0.02147197723388672, 0.022939682006835938, 0.024407386779785156, 0.025875091552734375, 0.027342796325683594, 0.028810501098632812, 0.03027820587158203, 0.03174591064453125, 0.03321361541748047, 0.03468132019042969, 0.036149024963378906, 0.037616729736328125, 0.039084434509277344, 0.04055213928222656, 0.04201984405517578, 0.043487548828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 1.0, 6.0, 4.0, 7.0, 12.0, 15.0, 15.0, 20.0, 24.0, 19.0, 29.0, 32.0, 32.0, 49.0, 50.0, 43.0, 58.0, 60.0, 55.0, 64.0, 37.0, 48.0, 36.0, 39.0, 37.0, 34.0, 34.0, 19.0, 17.0, 25.0, 17.0, 13.0, 12.0, 6.0, 5.0, 2.0, 7.0, 3.0, 6.0, 4.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04266357421875, -0.04126167297363281, -0.039859771728515625, -0.03845787048339844, -0.03705596923828125, -0.03565406799316406, -0.034252166748046875, -0.03285026550292969, -0.0314483642578125, -0.030046463012695312, -0.028644561767578125, -0.027242660522460938, -0.02584075927734375, -0.024438858032226562, -0.023036956787109375, -0.021635055541992188, -0.020233154296875, -0.018831253051757812, -0.017429351806640625, -0.016027450561523438, -0.01462554931640625, -0.013223648071289062, -0.011821746826171875, -0.010419845581054688, -0.0090179443359375, -0.0076160430908203125, -0.006214141845703125, -0.0048122406005859375, -0.00341033935546875, -0.0020084381103515625, -0.000606536865234375, 0.0007953643798828125, 0.002197265625, 0.0035991668701171875, 0.005001068115234375, 0.0064029693603515625, 0.00780487060546875, 0.009206771850585938, 0.010608673095703125, 0.012010574340820312, 0.0134124755859375, 0.014814376831054688, 0.016216278076171875, 0.017618179321289062, 0.01902008056640625, 0.020421981811523438, 0.021823883056640625, 0.023225784301757812, 0.024627685546875, 0.026029586791992188, 0.027431488037109375, 0.028833389282226562, 0.03023529052734375, 0.03163719177246094, 0.033039093017578125, 0.03444099426269531, 0.0358428955078125, 0.03724479675292969, 0.038646697998046875, 0.04004859924316406, 0.04145050048828125, 0.04285240173339844, 0.044254302978515625, 0.04565620422363281, 0.04705810546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 12.0, 14.0, 37.0, 46.0, 79.0, 171.0, 332.0, 832.0, 2329.0, 8283.0, 38475.0, 716601.0, 248560.0, 24152.0, 5619.0, 1762.0, 671.0, 267.0, 130.0, 78.0, 49.0, 24.0, 9.0, 6.0, 4.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.03802490234375, -0.037137746810913086, -0.03625059127807617, -0.03536343574523926, -0.034476280212402344, -0.03358912467956543, -0.032701969146728516, -0.0318148136138916, -0.030927658081054688, -0.030040502548217773, -0.02915334701538086, -0.028266191482543945, -0.02737903594970703, -0.026491880416870117, -0.025604724884033203, -0.02471756935119629, -0.023830413818359375, -0.02294325828552246, -0.022056102752685547, -0.021168947219848633, -0.02028179168701172, -0.019394636154174805, -0.01850748062133789, -0.017620325088500977, -0.016733169555664062, -0.01584601402282715, -0.014958858489990234, -0.01407170295715332, -0.013184547424316406, -0.012297391891479492, -0.011410236358642578, -0.010523080825805664, -0.00963592529296875, -0.008748769760131836, -0.007861614227294922, -0.006974458694458008, -0.006087303161621094, -0.00520014762878418, -0.004312992095947266, -0.0034258365631103516, -0.0025386810302734375, -0.0016515254974365234, -0.0007643699645996094, 0.0001227855682373047, 0.0010099411010742188, 0.0018970966339111328, 0.002784252166748047, 0.003671407699584961, 0.004558563232421875, 0.005445718765258789, 0.006332874298095703, 0.007220029830932617, 0.008107185363769531, 0.008994340896606445, 0.00988149642944336, 0.010768651962280273, 0.011655807495117188, 0.012542963027954102, 0.013430118560791016, 0.01431727409362793, 0.015204429626464844, 0.016091585159301758, 0.016978740692138672, 0.017865896224975586, 0.0187530517578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 7.0, 5.0, 7.0, 4.0, 9.0, 11.0, 8.0, 15.0, 9.0, 24.0, 17.0, 19.0, 35.0, 45.0, 78.0, 79.0, 84.0, 103.0, 76.0, 70.0, 58.0, 48.0, 28.0, 33.0, 26.0, 10.0, 16.0, 10.0, 6.0, 12.0, 11.0, 8.0, 8.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.9577484130859375e-05, -3.827642649412155e-05, -3.697536885738373e-05, -3.5674311220645905e-05, -3.437325358390808e-05, -3.307219594717026e-05, -3.1771138310432434e-05, -3.047008067369461e-05, -2.9169023036956787e-05, -2.7867965400218964e-05, -2.656690776348114e-05, -2.5265850126743317e-05, -2.3964792490005493e-05, -2.266373485326767e-05, -2.1362677216529846e-05, -2.0061619579792023e-05, -1.87605619430542e-05, -1.7459504306316376e-05, -1.6158446669578552e-05, -1.4857389032840729e-05, -1.3556331396102905e-05, -1.2255273759365082e-05, -1.0954216122627258e-05, -9.653158485889435e-06, -8.352100849151611e-06, -7.051043212413788e-06, -5.749985575675964e-06, -4.448927938938141e-06, -3.1478703022003174e-06, -1.846812665462494e-06, -5.457550287246704e-07, 7.553026080131531e-07, 2.0563602447509766e-06, 3.3574178814888e-06, 4.6584755182266235e-06, 5.959533154964447e-06, 7.2605907917022705e-06, 8.561648428440094e-06, 9.862706065177917e-06, 1.1163763701915741e-05, 1.2464821338653564e-05, 1.3765878975391388e-05, 1.5066936612129211e-05, 1.6367994248867035e-05, 1.766905188560486e-05, 1.8970109522342682e-05, 2.0271167159080505e-05, 2.157222479581833e-05, 2.2873282432556152e-05, 2.4174340069293976e-05, 2.54753977060318e-05, 2.6776455342769623e-05, 2.8077512979507446e-05, 2.937857061624527e-05, 3.067962825298309e-05, 3.198068588972092e-05, 3.328174352645874e-05, 3.4582801163196564e-05, 3.588385879993439e-05, 3.718491643667221e-05, 3.8485974073410034e-05, 3.978703171014786e-05, 4.108808934688568e-05, 4.2389146983623505e-05, 4.369020462036133e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 16.0, 22.0, 34.0, 48.0, 72.0, 113.0, 236.0, 458.0, 902.0, 2177.0, 6422.0, 26110.0, 201963.0, 728515.0, 62507.0, 12449.0, 3782.0, 1331.0, 642.0, 306.0, 182.0, 98.0, 57.0, 33.0, 26.0, 20.0, 9.0, 6.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01611328125, -0.015420198440551758, -0.014727115631103516, -0.014034032821655273, -0.013340950012207031, -0.012647867202758789, -0.011954784393310547, -0.011261701583862305, -0.010568618774414062, -0.00987553596496582, -0.009182453155517578, -0.008489370346069336, -0.007796287536621094, -0.0071032047271728516, -0.006410121917724609, -0.005717039108276367, -0.005023956298828125, -0.004330873489379883, -0.0036377906799316406, -0.0029447078704833984, -0.0022516250610351562, -0.001558542251586914, -0.0008654594421386719, -0.0001723766326904297, 0.0005207061767578125, 0.0012137889862060547, 0.0019068717956542969, 0.002599954605102539, 0.0032930374145507812, 0.0039861202239990234, 0.004679203033447266, 0.005372285842895508, 0.00606536865234375, 0.006758451461791992, 0.007451534271240234, 0.008144617080688477, 0.008837699890136719, 0.009530782699584961, 0.010223865509033203, 0.010916948318481445, 0.011610031127929688, 0.01230311393737793, 0.012996196746826172, 0.013689279556274414, 0.014382362365722656, 0.015075445175170898, 0.01576852798461914, 0.016461610794067383, 0.017154693603515625, 0.017847776412963867, 0.01854085922241211, 0.01923394203186035, 0.019927024841308594, 0.020620107650756836, 0.021313190460205078, 0.02200627326965332, 0.022699356079101562, 0.023392438888549805, 0.024085521697998047, 0.02477860450744629, 0.02547168731689453, 0.026164770126342773, 0.026857852935791016, 0.027550935745239258, 0.0282440185546875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 7.0, 4.0, 10.0, 13.0, 26.0, 33.0, 42.0, 64.0, 81.0, 104.0, 145.0, 128.0, 92.0, 84.0, 51.0, 36.0, 22.0, 19.0, 16.0, 12.0, 1.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0260162353515625, -0.02534627914428711, -0.02467632293701172, -0.024006366729736328, -0.023336410522460938, -0.022666454315185547, -0.021996498107910156, -0.021326541900634766, -0.020656585693359375, -0.019986629486083984, -0.019316673278808594, -0.018646717071533203, -0.017976760864257812, -0.017306804656982422, -0.01663684844970703, -0.01596689224243164, -0.01529693603515625, -0.01462697982788086, -0.013957023620605469, -0.013287067413330078, -0.012617111206054688, -0.011947154998779297, -0.011277198791503906, -0.010607242584228516, -0.009937286376953125, -0.009267330169677734, -0.008597373962402344, -0.007927417755126953, -0.0072574615478515625, -0.006587505340576172, -0.005917549133300781, -0.005247592926025391, -0.00457763671875, -0.003907680511474609, -0.0032377243041992188, -0.002567768096923828, -0.0018978118896484375, -0.0012278556823730469, -0.0005578994750976562, 0.00011205673217773438, 0.000782012939453125, 0.0014519691467285156, 0.0021219253540039062, 0.002791881561279297, 0.0034618377685546875, 0.004131793975830078, 0.004801750183105469, 0.005471706390380859, 0.00614166259765625, 0.006811618804931641, 0.007481575012207031, 0.008151531219482422, 0.008821487426757812, 0.009491443634033203, 0.010161399841308594, 0.010831356048583984, 0.011501312255859375, 0.012171268463134766, 0.012841224670410156, 0.013511180877685547, 0.014181137084960938, 0.014851093292236328, 0.015521049499511719, 0.01619100570678711, 0.0168609619140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 14.0, 33.0, 73.0, 161.0, 294.0, 196.0, 99.0, 54.0, 26.0, 11.0, 7.0, 4.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40993165969848633, -0.396430641412735, -0.38292965292930603, -0.3694286346435547, -0.35592764616012573, -0.3424266278743744, -0.32892560958862305, -0.3154246211051941, -0.30192360281944275, -0.2884225845336914, -0.27492159605026245, -0.2614205777645111, -0.24791957437992096, -0.2344185709953308, -0.22091755270957947, -0.20741654932498932, -0.19391554594039917, -0.18041454255580902, -0.16691353917121887, -0.15341252088546753, -0.13991151750087738, -0.12641051411628723, -0.11290950328111649, -0.09940849244594574, -0.08590748906135559, -0.07240648567676544, -0.058905474841594696, -0.04540446773171425, -0.0319034606218338, -0.018402457237243652, -0.0049014464020729065, 0.00859956443309784, 0.022100597620010376, 0.03560160472989082, 0.04910261183977127, 0.06260362267494202, 0.07610462605953217, 0.08960562944412231, 0.10310664027929306, 0.1166076511144638, 0.13010865449905396, 0.1436096578836441, 0.15711066126823425, 0.1706116795539856, 0.18411268293857574, 0.1976136863231659, 0.21111470460891724, 0.22461570799350739, 0.23811671137809753, 0.2516177296638489, 0.26511871814727783, 0.2786197364330292, 0.2921207547187805, 0.3056217432022095, 0.3191227614879608, 0.33262377977371216, 0.3461247682571411, 0.35962578654289246, 0.3731267750263214, 0.38662779331207275, 0.4001287817955017, 0.41362980008125305, 0.4271308183670044, 0.44063180685043335, 0.4541328251361847]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 9.0, 5.0, 8.0, 9.0, 18.0, 15.0, 21.0, 19.0, 18.0, 19.0, 30.0, 25.0, 39.0, 32.0, 63.0, 75.0, 77.0, 82.0, 67.0, 48.0, 46.0, 29.0, 26.0, 27.0, 25.0, 18.0, 17.0, 17.0, 24.0, 14.0, 14.0, 9.0, 9.0, 8.0, 10.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18436723947525024, -0.17846879363059998, -0.1725703328847885, -0.16667188704013824, -0.16077342629432678, -0.1548749804496765, -0.14897653460502625, -0.14307808876037598, -0.13717962801456451, -0.13128118216991425, -0.12538272142410278, -0.11948427557945251, -0.11358582228422165, -0.10768736898899078, -0.10178892314434052, -0.09589046984910965, -0.08999201655387878, -0.08409356325864792, -0.07819510996341705, -0.07229666411876678, -0.06639821082353592, -0.060499757528305054, -0.05460130795836449, -0.04870285838842392, -0.042804405093193054, -0.03690595179796219, -0.03100750222802162, -0.025109050795435905, -0.01921059936285019, -0.013312147930264473, -0.007413696497678757, -0.0015152469277381897, 0.004383206367492676, 0.010281657800078392, 0.01618010923266411, 0.022078560665249825, 0.02797701209783554, 0.033875465393066406, 0.03977391496300697, 0.04567236453294754, 0.051570817828178406, 0.05746927112340927, 0.06336772441864014, 0.0692661702632904, 0.07516462355852127, 0.08106307685375214, 0.0869615226984024, 0.09285997599363327, 0.09875842928886414, 0.104656882584095, 0.11055533587932587, 0.11645378172397614, 0.122352235019207, 0.12825068831443787, 0.13414913415908813, 0.1400475800037384, 0.14594604074954987, 0.15184448659420013, 0.1577429473400116, 0.16364139318466187, 0.16953983902931213, 0.1754382997751236, 0.18133674561977386, 0.18723520636558533, 0.1931336522102356]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 8.0, 10.0, 10.0, 25.0, 25.0, 40.0, 70.0, 116.0, 224.0, 460.0, 1090.0, 2679.0, 9222.0, 50327.0, 1202807.0, 2811959.0, 94845.0, 14009.0, 3845.0, 1340.0, 537.0, 257.0, 126.0, 87.0, 52.0, 32.0, 23.0, 17.0, 6.0, 8.0, 3.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0276031494140625, -0.026655912399291992, -0.025708675384521484, -0.024761438369750977, -0.02381420135498047, -0.02286696434020996, -0.021919727325439453, -0.020972490310668945, -0.020025253295898438, -0.01907801628112793, -0.018130779266357422, -0.017183542251586914, -0.016236305236816406, -0.015289068222045898, -0.01434183120727539, -0.013394594192504883, -0.012447357177734375, -0.011500120162963867, -0.01055288314819336, -0.009605646133422852, -0.008658409118652344, -0.007711172103881836, -0.006763935089111328, -0.00581669807434082, -0.0048694610595703125, -0.003922224044799805, -0.002974987030029297, -0.002027750015258789, -0.0010805130004882812, -0.00013327598571777344, 0.0008139610290527344, 0.0017611980438232422, 0.00270843505859375, 0.003655672073364258, 0.004602909088134766, 0.0055501461029052734, 0.006497383117675781, 0.007444620132446289, 0.008391857147216797, 0.009339094161987305, 0.010286331176757812, 0.01123356819152832, 0.012180805206298828, 0.013128042221069336, 0.014075279235839844, 0.015022516250610352, 0.01596975326538086, 0.016916990280151367, 0.017864227294921875, 0.018811464309692383, 0.01975870132446289, 0.0207059383392334, 0.021653175354003906, 0.022600412368774414, 0.023547649383544922, 0.02449488639831543, 0.025442123413085938, 0.026389360427856445, 0.027336597442626953, 0.02828383445739746, 0.02923107147216797, 0.030178308486938477, 0.031125545501708984, 0.03207278251647949, 0.03302001953125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 8.0, 5.0, 13.0, 12.0, 11.0, 22.0, 23.0, 38.0, 38.0, 27.0, 42.0, 47.0, 50.0, 51.0, 60.0, 52.0, 53.0, 65.0, 48.0, 60.0, 40.0, 41.0, 38.0, 27.0, 27.0, 20.0, 18.0, 14.0, 9.0, 8.0, 6.0, 7.0, 2.0, 3.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01012420654296875, -0.00977480411529541, -0.00942540168762207, -0.00907599925994873, -0.00872659683227539, -0.00837719440460205, -0.008027791976928711, -0.007678389549255371, -0.007328987121582031, -0.006979584693908691, -0.0066301822662353516, -0.006280779838562012, -0.005931377410888672, -0.005581974983215332, -0.005232572555541992, -0.004883170127868652, -0.0045337677001953125, -0.004184365272521973, -0.003834962844848633, -0.003485560417175293, -0.003136157989501953, -0.0027867555618286133, -0.0024373531341552734, -0.0020879507064819336, -0.0017385482788085938, -0.001389145851135254, -0.001039743423461914, -0.0006903409957885742, -0.0003409385681152344, 8.463859558105469e-06, 0.0003578662872314453, 0.0007072687149047852, 0.001056671142578125, 0.0014060735702514648, 0.0017554759979248047, 0.0021048784255981445, 0.0024542808532714844, 0.0028036832809448242, 0.003153085708618164, 0.003502488136291504, 0.0038518905639648438, 0.004201292991638184, 0.0045506954193115234, 0.004900097846984863, 0.005249500274658203, 0.005598902702331543, 0.005948305130004883, 0.006297707557678223, 0.0066471099853515625, 0.006996512413024902, 0.007345914840698242, 0.007695317268371582, 0.008044719696044922, 0.008394122123718262, 0.008743524551391602, 0.009092926979064941, 0.009442329406738281, 0.009791731834411621, 0.010141134262084961, 0.0104905366897583, 0.01083993911743164, 0.01118934154510498, 0.01153874397277832, 0.01188814640045166, 0.012237548828125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 8.0, 8.0, 20.0, 13.0, 17.0, 28.0, 34.0, 43.0, 58.0, 88.0, 96.0, 130.0, 207.0, 317.0, 469.0, 872.0, 2513.0, 40351.0, 4107131.0, 36695.0, 2488.0, 878.0, 537.0, 352.0, 234.0, 175.0, 123.0, 98.0, 82.0, 55.0, 37.0, 29.0, 18.0, 22.0, 18.0, 7.0, 7.0, 5.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09112548828125, -0.08792686462402344, -0.08472824096679688, -0.08152961730957031, -0.07833099365234375, -0.07513236999511719, -0.07193374633789062, -0.06873512268066406, -0.0655364990234375, -0.06233787536621094, -0.059139251708984375, -0.05594062805175781, -0.05274200439453125, -0.04954338073730469, -0.046344757080078125, -0.04314613342285156, -0.039947509765625, -0.03674888610839844, -0.033550262451171875, -0.030351638793945312, -0.02715301513671875, -0.023954391479492188, -0.020755767822265625, -0.017557144165039062, -0.0143585205078125, -0.011159896850585938, -0.007961273193359375, -0.0047626495361328125, -0.00156402587890625, 0.0016345977783203125, 0.004833221435546875, 0.008031845092773438, 0.01123046875, 0.014429092407226562, 0.017627716064453125, 0.020826339721679688, 0.02402496337890625, 0.027223587036132812, 0.030422210693359375, 0.03362083435058594, 0.0368194580078125, 0.04001808166503906, 0.043216705322265625, 0.04641532897949219, 0.04961395263671875, 0.05281257629394531, 0.056011199951171875, 0.05920982360839844, 0.062408447265625, 0.06560707092285156, 0.06880569458007812, 0.07200431823730469, 0.07520294189453125, 0.07840156555175781, 0.08160018920898438, 0.08479881286621094, 0.0879974365234375, 0.09119606018066406, 0.09439468383789062, 0.09759330749511719, 0.10079193115234375, 0.10399055480957031, 0.10718917846679688, 0.11038780212402344, 0.11358642578125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 12.0, 43.0, 91.0, 330.0, 1937.0, 1369.0, 185.0, 63.0, 20.0, 6.0, 10.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0833740234375, -0.08037853240966797, -0.07738304138183594, -0.0743875503540039, -0.07139205932617188, -0.06839656829833984, -0.06540107727050781, -0.06240558624267578, -0.05941009521484375, -0.05641460418701172, -0.05341911315917969, -0.050423622131347656, -0.047428131103515625, -0.044432640075683594, -0.04143714904785156, -0.03844165802001953, -0.0354461669921875, -0.03245067596435547, -0.029455184936523438, -0.026459693908691406, -0.023464202880859375, -0.020468711853027344, -0.017473220825195312, -0.014477729797363281, -0.01148223876953125, -0.008486747741699219, -0.0054912567138671875, -0.0024957656860351562, 0.000499725341796875, 0.0034952163696289062, 0.0064907073974609375, 0.009486198425292969, 0.012481689453125, 0.015477180480957031, 0.018472671508789062, 0.021468162536621094, 0.024463653564453125, 0.027459144592285156, 0.030454635620117188, 0.03345012664794922, 0.03644561767578125, 0.03944110870361328, 0.04243659973144531, 0.045432090759277344, 0.048427581787109375, 0.051423072814941406, 0.05441856384277344, 0.05741405487060547, 0.0604095458984375, 0.06340503692626953, 0.06640052795410156, 0.0693960189819336, 0.07239151000976562, 0.07538700103759766, 0.07838249206542969, 0.08137798309326172, 0.08437347412109375, 0.08736896514892578, 0.09036445617675781, 0.09335994720458984, 0.09635543823242188, 0.0993509292602539, 0.10234642028808594, 0.10534191131591797, 0.10833740234375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 16.0, 33.0, 113.0, 247.0, 349.0, 134.0, 56.0, 14.0, 8.0, 9.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4741882085800171, -0.44468289613723755, -0.4151776134967804, -0.38567230105400085, -0.3561669886112213, -0.32666170597076416, -0.2971563935279846, -0.2676510810852051, -0.23814578354358673, -0.20864048600196838, -0.17913517355918884, -0.1496298760175705, -0.12012457102537155, -0.09061926603317261, -0.06111396849155426, -0.03160865604877472, -0.002103358507156372, 0.027401944622397423, 0.05690724775195122, 0.08641254901885986, 0.11591785401105881, 0.14542315900325775, 0.1749284565448761, 0.20443376898765564, 0.233939066529274, 0.26344436407089233, 0.2929496765136719, 0.3224549889564514, 0.35196027159690857, 0.3814655840396881, 0.41097086668014526, 0.4404761791229248, 0.46998149156570435, 0.4994868040084839, 0.5289921164512634, 0.558497428894043, 0.5880026817321777, 0.6175079941749573, 0.6470133066177368, 0.6765186190605164, 0.7060239315032959, 0.7355292439460754, 0.765034556388855, 0.7945398092269897, 0.8240451216697693, 0.8535504341125488, 0.8830557465553284, 0.9125610589981079, 0.9420663118362427, 0.9715716242790222, 1.0010769367218018, 1.0305821895599365, 1.0600875616073608, 1.0895928144454956, 1.11909818649292, 1.1486034393310547, 1.178108811378479, 1.2076140642166138, 1.237119436264038, 1.2666246891021729, 1.2961300611495972, 1.325635313987732, 1.3551406860351562, 1.384645938873291, 1.4141511917114258]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 8.0, 6.0, 9.0, 8.0, 11.0, 13.0, 19.0, 20.0, 30.0, 37.0, 41.0, 54.0, 49.0, 55.0, 64.0, 73.0, 45.0, 50.0, 43.0, 56.0, 49.0, 54.0, 39.0, 25.0, 21.0, 20.0, 24.0, 14.0, 16.0, 13.0, 11.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2241661548614502, -0.21562409400939941, -0.20708203315734863, -0.19853997230529785, -0.18999791145324707, -0.1814558506011963, -0.1729138046503067, -0.16437174379825592, -0.15582968294620514, -0.14728762209415436, -0.13874556124210358, -0.1302035003900528, -0.12166144698858261, -0.11311938613653183, -0.10457733273506165, -0.09603527188301086, -0.08749321103096008, -0.0789511501789093, -0.07040908932685852, -0.061867035925388336, -0.053324975073337555, -0.044782914221286774, -0.03624085709452629, -0.027698799967765808, -0.019156739115715027, -0.010614680126309395, -0.002072621136903763, 0.006469437852501869, 0.015011496841907501, 0.023553557693958282, 0.032095614820718765, 0.04063767194747925, 0.04917973279953003, 0.05772179365158081, 0.06626385450363159, 0.07480590790510178, 0.08334796875715256, 0.09189002960920334, 0.10043208301067352, 0.1089741438627243, 0.11751620471477509, 0.12605826556682587, 0.13460032641887665, 0.14314238727092743, 0.15168443322181702, 0.1602264940738678, 0.16876855492591858, 0.17731061577796936, 0.18585267663002014, 0.19439473748207092, 0.2029367983341217, 0.21147885918617249, 0.22002092003822327, 0.22856298089027405, 0.23710502684116364, 0.24564708769321442, 0.254189133644104, 0.2627311944961548, 0.27127325534820557, 0.27981531620025635, 0.28835737705230713, 0.2968994379043579, 0.3054414987564087, 0.3139835596084595, 0.32252562046051025]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 6.0, 13.0, 20.0, 17.0, 45.0, 56.0, 97.0, 122.0, 201.0, 355.0, 605.0, 1058.0, 2053.0, 4155.0, 9560.0, 24353.0, 75055.0, 259993.0, 429047.0, 162863.0, 48184.0, 16926.0, 7000.0, 3100.0, 1533.0, 853.0, 491.0, 266.0, 175.0, 106.0, 75.0, 40.0, 43.0, 23.0, 15.0, 13.0, 7.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.032196044921875, -0.031229496002197266, -0.03026294708251953, -0.029296398162841797, -0.028329849243164062, -0.027363300323486328, -0.026396751403808594, -0.02543020248413086, -0.024463653564453125, -0.02349710464477539, -0.022530555725097656, -0.021564006805419922, -0.020597457885742188, -0.019630908966064453, -0.01866436004638672, -0.017697811126708984, -0.01673126220703125, -0.015764713287353516, -0.014798164367675781, -0.013831615447998047, -0.012865066528320312, -0.011898517608642578, -0.010931968688964844, -0.00996541976928711, -0.008998870849609375, -0.00803232192993164, -0.007065773010253906, -0.006099224090576172, -0.0051326751708984375, -0.004166126251220703, -0.0031995773315429688, -0.0022330284118652344, -0.0012664794921875, -0.0002999305725097656, 0.0006666183471679688, 0.0016331672668457031, 0.0025997161865234375, 0.003566265106201172, 0.004532814025878906, 0.005499362945556641, 0.006465911865234375, 0.007432460784912109, 0.008399009704589844, 0.009365558624267578, 0.010332107543945312, 0.011298656463623047, 0.012265205383300781, 0.013231754302978516, 0.01419830322265625, 0.015164852142333984, 0.01613140106201172, 0.017097949981689453, 0.018064498901367188, 0.019031047821044922, 0.019997596740722656, 0.02096414566040039, 0.021930694580078125, 0.02289724349975586, 0.023863792419433594, 0.024830341339111328, 0.025796890258789062, 0.026763439178466797, 0.02772998809814453, 0.028696537017822266, 0.0296630859375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 3.0, 10.0, 4.0, 10.0, 9.0, 25.0, 25.0, 11.0, 21.0, 22.0, 26.0, 41.0, 26.0, 36.0, 29.0, 45.0, 58.0, 51.0, 52.0, 55.0, 45.0, 45.0, 40.0, 39.0, 23.0, 37.0, 42.0, 25.0, 13.0, 20.0, 21.0, 16.0, 12.0, 15.0, 11.0, 7.0, 12.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.01372528076171875, -0.01329505443572998, -0.012864828109741211, -0.012434601783752441, -0.012004375457763672, -0.011574149131774902, -0.011143922805786133, -0.010713696479797363, -0.010283470153808594, -0.009853243827819824, -0.009423017501831055, -0.008992791175842285, -0.008562564849853516, -0.008132338523864746, -0.0077021121978759766, -0.007271885871887207, -0.0068416595458984375, -0.006411433219909668, -0.0059812068939208984, -0.005550980567932129, -0.005120754241943359, -0.00469052791595459, -0.00426030158996582, -0.0038300752639770508, -0.0033998489379882812, -0.0029696226119995117, -0.002539396286010742, -0.0021091699600219727, -0.0016789436340332031, -0.0012487173080444336, -0.0008184909820556641, -0.00038826465606689453, 4.1961669921875e-05, 0.00047218799591064453, 0.0009024143218994141, 0.0013326406478881836, 0.0017628669738769531, 0.0021930932998657227, 0.002623319625854492, 0.0030535459518432617, 0.0034837722778320312, 0.003913998603820801, 0.00434422492980957, 0.00477445125579834, 0.005204677581787109, 0.005634903907775879, 0.0060651302337646484, 0.006495356559753418, 0.0069255828857421875, 0.007355809211730957, 0.0077860355377197266, 0.008216261863708496, 0.008646488189697266, 0.009076714515686035, 0.009506940841674805, 0.009937167167663574, 0.010367393493652344, 0.010797619819641113, 0.011227846145629883, 0.011658072471618652, 0.012088298797607422, 0.012518525123596191, 0.012948751449584961, 0.01337897777557373, 0.0138092041015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 12.0, 6.0, 13.0, 13.0, 21.0, 36.0, 40.0, 75.0, 119.0, 229.0, 452.0, 874.0, 1746.0, 4621.0, 18179.0, 145191.0, 775161.0, 82439.0, 12538.0, 3629.0, 1544.0, 720.0, 364.0, 196.0, 123.0, 73.0, 35.0, 27.0, 18.0, 18.0, 6.0, 7.0, 4.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07696533203125, -0.07458877563476562, -0.07221221923828125, -0.06983566284179688, -0.0674591064453125, -0.06508255004882812, -0.06270599365234375, -0.060329437255859375, -0.057952880859375, -0.055576324462890625, -0.05319976806640625, -0.050823211669921875, -0.0484466552734375, -0.046070098876953125, -0.04369354248046875, -0.041316986083984375, -0.0389404296875, -0.036563873291015625, -0.03418731689453125, -0.031810760498046875, -0.0294342041015625, -0.027057647705078125, -0.02468109130859375, -0.022304534912109375, -0.019927978515625, -0.017551422119140625, -0.01517486572265625, -0.012798309326171875, -0.0104217529296875, -0.008045196533203125, -0.00566864013671875, -0.003292083740234375, -0.00091552734375, 0.001461029052734375, 0.00383758544921875, 0.006214141845703125, 0.0085906982421875, 0.010967254638671875, 0.01334381103515625, 0.015720367431640625, 0.018096923828125, 0.020473480224609375, 0.02285003662109375, 0.025226593017578125, 0.0276031494140625, 0.029979705810546875, 0.03235626220703125, 0.034732818603515625, 0.037109375, 0.039485931396484375, 0.04186248779296875, 0.044239044189453125, 0.0466156005859375, 0.048992156982421875, 0.05136871337890625, 0.053745269775390625, 0.056121826171875, 0.058498382568359375, 0.06087493896484375, 0.06325149536132812, 0.0656280517578125, 0.06800460815429688, 0.07038116455078125, 0.07275772094726562, 0.07513427734375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 12.0, 14.0, 10.0, 23.0, 35.0, 23.0, 35.0, 30.0, 52.0, 63.0, 84.0, 71.0, 84.0, 80.0, 65.0, 74.0, 49.0, 47.0, 40.0, 25.0, 18.0, 15.0, 8.0, 13.0, 10.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0633544921875, -0.06029510498046875, -0.0572357177734375, -0.05417633056640625, -0.051116943359375, -0.04805755615234375, -0.0449981689453125, -0.04193878173828125, -0.03887939453125, -0.03582000732421875, -0.0327606201171875, -0.02970123291015625, -0.026641845703125, -0.02358245849609375, -0.0205230712890625, -0.01746368408203125, -0.014404296875, -0.01134490966796875, -0.0082855224609375, -0.00522613525390625, -0.002166748046875, 0.00089263916015625, 0.0039520263671875, 0.00701141357421875, 0.01007080078125, 0.01313018798828125, 0.0161895751953125, 0.01924896240234375, 0.022308349609375, 0.02536773681640625, 0.0284271240234375, 0.03148651123046875, 0.0345458984375, 0.03760528564453125, 0.0406646728515625, 0.04372406005859375, 0.046783447265625, 0.04984283447265625, 0.0529022216796875, 0.05596160888671875, 0.05902099609375, 0.06208038330078125, 0.0651397705078125, 0.06819915771484375, 0.071258544921875, 0.07431793212890625, 0.0773773193359375, 0.08043670654296875, 0.08349609375, 0.08655548095703125, 0.0896148681640625, 0.09267425537109375, 0.095733642578125, 0.09879302978515625, 0.1018524169921875, 0.10491180419921875, 0.10797119140625, 0.11103057861328125, 0.1140899658203125, 0.11714935302734375, 0.120208740234375, 0.12326812744140625, 0.1263275146484375, 0.12938690185546875, 0.1324462890625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 23.0, 24.0, 24.0, 34.0, 52.0, 89.0, 124.0, 195.0, 304.0, 445.0, 721.0, 1274.0, 2110.0, 4122.0, 8420.0, 21594.0, 82501.0, 701314.0, 168395.0, 33037.0, 11686.0, 5277.0, 2749.0, 1583.0, 893.0, 517.0, 356.0, 214.0, 141.0, 97.0, 65.0, 44.0, 37.0, 24.0, 16.0, 13.0, 2.0, 9.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.032012939453125, -0.031062602996826172, -0.030112266540527344, -0.029161930084228516, -0.028211593627929688, -0.02726125717163086, -0.02631092071533203, -0.025360584259033203, -0.024410247802734375, -0.023459911346435547, -0.02250957489013672, -0.02155923843383789, -0.020608901977539062, -0.019658565521240234, -0.018708229064941406, -0.017757892608642578, -0.01680755615234375, -0.015857219696044922, -0.014906883239746094, -0.013956546783447266, -0.013006210327148438, -0.01205587387084961, -0.011105537414550781, -0.010155200958251953, -0.009204864501953125, -0.008254528045654297, -0.007304191589355469, -0.006353855133056641, -0.0054035186767578125, -0.004453182220458984, -0.0035028457641601562, -0.002552509307861328, -0.0016021728515625, -0.0006518363952636719, 0.00029850006103515625, 0.0012488365173339844, 0.0021991729736328125, 0.0031495094299316406, 0.004099845886230469, 0.005050182342529297, 0.006000518798828125, 0.006950855255126953, 0.007901191711425781, 0.00885152816772461, 0.009801864624023438, 0.010752201080322266, 0.011702537536621094, 0.012652873992919922, 0.01360321044921875, 0.014553546905517578, 0.015503883361816406, 0.016454219818115234, 0.017404556274414062, 0.01835489273071289, 0.01930522918701172, 0.020255565643310547, 0.021205902099609375, 0.022156238555908203, 0.02310657501220703, 0.02405691146850586, 0.025007247924804688, 0.025957584381103516, 0.026907920837402344, 0.027858257293701172, 0.02880859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 12.0, 14.0, 19.0, 24.0, 30.0, 39.0, 63.0, 76.0, 74.0, 98.0, 94.0, 98.0, 87.0, 57.0, 50.0, 46.0, 31.0, 24.0, 23.0, 13.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0067901611328125e-05, -4.876870661973953e-05, -4.746951162815094e-05, -4.617031663656235e-05, -4.4871121644973755e-05, -4.357192665338516e-05, -4.227273166179657e-05, -4.097353667020798e-05, -3.9674341678619385e-05, -3.837514668703079e-05, -3.70759516954422e-05, -3.577675670385361e-05, -3.4477561712265015e-05, -3.317836672067642e-05, -3.187917172908783e-05, -3.057997673749924e-05, -2.9280781745910645e-05, -2.7981586754322052e-05, -2.668239176273346e-05, -2.5383196771144867e-05, -2.4084001779556274e-05, -2.2784806787967682e-05, -2.148561179637909e-05, -2.0186416804790497e-05, -1.8887221813201904e-05, -1.7588026821613312e-05, -1.628883183002472e-05, -1.4989636838436127e-05, -1.3690441846847534e-05, -1.2391246855258942e-05, -1.1092051863670349e-05, -9.792856872081757e-06, -8.493661880493164e-06, -7.1944668889045715e-06, -5.895271897315979e-06, -4.5960769057273865e-06, -3.296881914138794e-06, -1.9976869225502014e-06, -6.984919309616089e-07, 6.007030606269836e-07, 1.8998980522155762e-06, 3.1990930438041687e-06, 4.498288035392761e-06, 5.797483026981354e-06, 7.096678018569946e-06, 8.395873010158539e-06, 9.695068001747131e-06, 1.0994262993335724e-05, 1.2293457984924316e-05, 1.3592652976512909e-05, 1.4891847968101501e-05, 1.6191042959690094e-05, 1.7490237951278687e-05, 1.878943294286728e-05, 2.008862793445587e-05, 2.1387822926044464e-05, 2.2687017917633057e-05, 2.398621290922165e-05, 2.5285407900810242e-05, 2.6584602892398834e-05, 2.7883797883987427e-05, 2.918299287557602e-05, 3.0482187867164612e-05, 3.1781382858753204e-05, 3.30805778503418e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 9.0, 9.0, 4.0, 20.0, 22.0, 22.0, 55.0, 71.0, 93.0, 183.0, 343.0, 629.0, 1225.0, 2911.0, 7396.0, 25433.0, 157855.0, 750720.0, 75801.0, 16178.0, 5298.0, 2085.0, 1013.0, 492.0, 284.0, 171.0, 81.0, 38.0, 36.0, 16.0, 14.0, 18.0, 4.0, 8.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.036468505859375, -0.03530454635620117, -0.034140586853027344, -0.032976627349853516, -0.03181266784667969, -0.03064870834350586, -0.02948474884033203, -0.028320789337158203, -0.027156829833984375, -0.025992870330810547, -0.02482891082763672, -0.02366495132446289, -0.022500991821289062, -0.021337032318115234, -0.020173072814941406, -0.019009113311767578, -0.01784515380859375, -0.016681194305419922, -0.015517234802246094, -0.014353275299072266, -0.013189315795898438, -0.01202535629272461, -0.010861396789550781, -0.009697437286376953, -0.008533477783203125, -0.007369518280029297, -0.006205558776855469, -0.005041599273681641, -0.0038776397705078125, -0.0027136802673339844, -0.0015497207641601562, -0.0003857612609863281, 0.0007781982421875, 0.0019421577453613281, 0.0031061172485351562, 0.004270076751708984, 0.0054340362548828125, 0.006597995758056641, 0.007761955261230469, 0.008925914764404297, 0.010089874267578125, 0.011253833770751953, 0.012417793273925781, 0.01358175277709961, 0.014745712280273438, 0.015909671783447266, 0.017073631286621094, 0.018237590789794922, 0.01940155029296875, 0.020565509796142578, 0.021729469299316406, 0.022893428802490234, 0.024057388305664062, 0.02522134780883789, 0.02638530731201172, 0.027549266815185547, 0.028713226318359375, 0.029877185821533203, 0.03104114532470703, 0.03220510482788086, 0.03336906433105469, 0.034533023834228516, 0.035696983337402344, 0.03686094284057617, 0.03802490234375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 8.0, 23.0, 23.0, 23.0, 25.0, 50.0, 54.0, 72.0, 113.0, 131.0, 108.0, 77.0, 68.0, 56.0, 34.0, 21.0, 22.0, 10.0, 7.0, 8.0, 5.0, 8.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0350341796875, -0.03402376174926758, -0.033013343811035156, -0.032002925872802734, -0.030992507934570312, -0.02998208999633789, -0.02897167205810547, -0.027961254119873047, -0.026950836181640625, -0.025940418243408203, -0.02493000030517578, -0.02391958236694336, -0.022909164428710938, -0.021898746490478516, -0.020888328552246094, -0.019877910614013672, -0.01886749267578125, -0.017857074737548828, -0.016846656799316406, -0.015836238861083984, -0.014825820922851562, -0.01381540298461914, -0.012804985046386719, -0.011794567108154297, -0.010784149169921875, -0.009773731231689453, -0.008763313293457031, -0.007752895355224609, -0.0067424774169921875, -0.005732059478759766, -0.004721641540527344, -0.003711223602294922, -0.0027008056640625, -0.0016903877258300781, -0.0006799697875976562, 0.0003304481506347656, 0.0013408660888671875, 0.0023512840270996094, 0.0033617019653320312, 0.004372119903564453, 0.005382537841796875, 0.006392955780029297, 0.007403373718261719, 0.00841379165649414, 0.009424209594726562, 0.010434627532958984, 0.011445045471191406, 0.012455463409423828, 0.01346588134765625, 0.014476299285888672, 0.015486717224121094, 0.016497135162353516, 0.017507553100585938, 0.01851797103881836, 0.01952838897705078, 0.020538806915283203, 0.021549224853515625, 0.022559642791748047, 0.02357006072998047, 0.02458047866821289, 0.025590896606445312, 0.026601314544677734, 0.027611732482910156, 0.028622150421142578, 0.029632568359375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 3.0, 8.0, 4.0, 20.0, 18.0, 33.0, 65.0, 108.0, 145.0, 316.0, 143.0, 62.0, 32.0, 16.0, 7.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.09871506690979, -1.0755971670150757, -1.0524792671203613, -1.0293612480163574, -1.006243348121643, -0.9831254482269287, -0.9600075483322144, -0.9368896484375, -0.9137716889381409, -0.8906537890434265, -0.8675358295440674, -0.844417929649353, -0.8213000297546387, -0.7981820702552795, -0.7750641703605652, -0.751946210861206, -0.7288283109664917, -0.7057104110717773, -0.6825924515724182, -0.6594745516777039, -0.6363565921783447, -0.6132386922836304, -0.590120792388916, -0.5670028924942017, -0.5438849329948425, -0.5207670331001282, -0.49764907360076904, -0.4745311737060547, -0.45141324400901794, -0.4282953143119812, -0.40517741441726685, -0.3820594847202301, -0.35894155502319336, -0.3358236253261566, -0.3127056956291199, -0.2895877957344055, -0.2664698660373688, -0.24335193634033203, -0.22023402154445648, -0.19711610674858093, -0.1739981770515442, -0.15088024735450745, -0.1277623325586319, -0.10464441031217575, -0.0815264880657196, -0.05840856581926346, -0.03529064357280731, -0.012172728776931763, 0.01094520092010498, 0.03406312316656113, 0.05718104541301727, 0.08029896765947342, 0.10341688990592957, 0.1265348196029663, 0.14965273439884186, 0.1727706491947174, 0.19588857889175415, 0.2190065085887909, 0.24212442338466644, 0.265242338180542, 0.28836026787757874, 0.3114781975746155, 0.33459609746932983, 0.3577140271663666, 0.3808319568634033]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 11.0, 10.0, 2.0, 9.0, 14.0, 13.0, 20.0, 14.0, 26.0, 32.0, 22.0, 20.0, 28.0, 23.0, 29.0, 47.0, 59.0, 82.0, 94.0, 81.0, 47.0, 44.0, 36.0, 31.0, 28.0, 22.0, 18.0, 21.0, 20.0, 18.0, 10.0, 8.0, 15.0, 12.0, 6.0, 6.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.392331600189209, -0.3809349834918976, -0.3695383369922638, -0.3581417202949524, -0.3467450737953186, -0.3353484570980072, -0.3239518404006958, -0.312555193901062, -0.3011585772037506, -0.2897619605064392, -0.2783653140068054, -0.266968697309494, -0.25557205080986023, -0.24417543411254883, -0.23277880251407623, -0.22138217091560364, -0.20998553931713104, -0.19858890771865845, -0.18719227612018585, -0.17579564452171326, -0.16439902782440186, -0.15300239622592926, -0.14160576462745667, -0.13020914793014526, -0.11881250888109207, -0.10741587728261948, -0.09601925313472748, -0.08462262153625488, -0.07322598993778229, -0.06182936578989029, -0.050432734191417694, -0.039036110043525696, -0.0276394784450531, -0.016242850571870804, -0.004846220836043358, 0.006550408899784088, 0.017947036772966385, 0.02934366464614868, 0.04074029624462128, 0.052136920392513275, 0.06353355199098587, 0.07493018358945847, 0.08632680773735046, 0.09772343933582306, 0.10912007093429565, 0.12051669508218765, 0.13191333413124084, 0.14330995082855225, 0.15470658242702484, 0.16610321402549744, 0.17749984562397003, 0.18889647722244263, 0.20029309391975403, 0.21168972551822662, 0.22308635711669922, 0.23448297381401062, 0.2458796203136444, 0.2572762370109558, 0.2686728835105896, 0.280069500207901, 0.2914661467075348, 0.3028627634048462, 0.31425940990448, 0.3256560266017914, 0.3370526432991028]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 2.0, 6.0, 8.0, 16.0, 16.0, 31.0, 38.0, 51.0, 67.0, 117.0, 149.0, 218.0, 352.0, 496.0, 881.0, 1499.0, 2864.0, 6477.0, 17613.0, 68809.0, 507979.0, 2823147.0, 648314.0, 81105.0, 19679.0, 6936.0, 3176.0, 1598.0, 949.0, 543.0, 364.0, 231.0, 166.0, 107.0, 76.0, 60.0, 36.0, 31.0, 24.0, 8.0, 16.0, 7.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.026611328125, -0.025793790817260742, -0.024976253509521484, -0.024158716201782227, -0.02334117889404297, -0.02252364158630371, -0.021706104278564453, -0.020888566970825195, -0.020071029663085938, -0.01925349235534668, -0.018435955047607422, -0.017618417739868164, -0.016800880432128906, -0.01598334312438965, -0.01516580581665039, -0.014348268508911133, -0.013530731201171875, -0.012713193893432617, -0.01189565658569336, -0.011078119277954102, -0.010260581970214844, -0.009443044662475586, -0.008625507354736328, -0.00780797004699707, -0.0069904327392578125, -0.006172895431518555, -0.005355358123779297, -0.004537820816040039, -0.0037202835083007812, -0.0029027462005615234, -0.0020852088928222656, -0.0012676715850830078, -0.00045013427734375, 0.0003674030303955078, 0.0011849403381347656, 0.0020024776458740234, 0.0028200149536132812, 0.003637552261352539, 0.004455089569091797, 0.005272626876831055, 0.0060901641845703125, 0.00690770149230957, 0.007725238800048828, 0.008542776107788086, 0.009360313415527344, 0.010177850723266602, 0.01099538803100586, 0.011812925338745117, 0.012630462646484375, 0.013447999954223633, 0.01426553726196289, 0.015083074569702148, 0.015900611877441406, 0.016718149185180664, 0.017535686492919922, 0.01835322380065918, 0.019170761108398438, 0.019988298416137695, 0.020805835723876953, 0.02162337303161621, 0.02244091033935547, 0.023258447647094727, 0.024075984954833984, 0.024893522262573242, 0.0257110595703125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 6.0, 2.0, 9.0, 16.0, 9.0, 23.0, 21.0, 31.0, 28.0, 31.0, 38.0, 43.0, 40.0, 54.0, 51.0, 61.0, 55.0, 62.0, 58.0, 52.0, 43.0, 39.0, 40.0, 21.0, 28.0, 29.0, 15.0, 17.0, 20.0, 12.0, 6.0, 8.0, 11.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.018829345703125, -0.018265247344970703, -0.017701148986816406, -0.01713705062866211, -0.016572952270507812, -0.016008853912353516, -0.015444755554199219, -0.014880657196044922, -0.014316558837890625, -0.013752460479736328, -0.013188362121582031, -0.012624263763427734, -0.012060165405273438, -0.01149606704711914, -0.010931968688964844, -0.010367870330810547, -0.00980377197265625, -0.009239673614501953, -0.008675575256347656, -0.00811147689819336, -0.0075473785400390625, -0.006983280181884766, -0.006419181823730469, -0.005855083465576172, -0.005290985107421875, -0.004726886749267578, -0.004162788391113281, -0.0035986900329589844, -0.0030345916748046875, -0.0024704933166503906, -0.0019063949584960938, -0.0013422966003417969, -0.0007781982421875, -0.00021409988403320312, 0.00034999847412109375, 0.0009140968322753906, 0.0014781951904296875, 0.0020422935485839844, 0.0026063919067382812, 0.003170490264892578, 0.003734588623046875, 0.004298686981201172, 0.004862785339355469, 0.005426883697509766, 0.0059909820556640625, 0.006555080413818359, 0.007119178771972656, 0.007683277130126953, 0.00824737548828125, 0.008811473846435547, 0.009375572204589844, 0.00993967056274414, 0.010503768920898438, 0.011067867279052734, 0.011631965637207031, 0.012196063995361328, 0.012760162353515625, 0.013324260711669922, 0.013888359069824219, 0.014452457427978516, 0.015016555786132812, 0.01558065414428711, 0.016144752502441406, 0.016708850860595703, 0.01727294921875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 17.0, 33.0, 74.0, 185.0, 518.0, 2669.0, 2584356.0, 1603086.0, 2467.0, 535.0, 209.0, 75.0, 36.0, 15.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3236846923828125, -0.313873291015625, -0.3040618896484375, -0.29425048828125, -0.2844390869140625, -0.274627685546875, -0.2648162841796875, -0.2550048828125, -0.2451934814453125, -0.235382080078125, -0.2255706787109375, -0.21575927734375, -0.2059478759765625, -0.196136474609375, -0.1863250732421875, -0.176513671875, -0.1667022705078125, -0.156890869140625, -0.1470794677734375, -0.13726806640625, -0.1274566650390625, -0.117645263671875, -0.1078338623046875, -0.0980224609375, -0.0882110595703125, -0.078399658203125, -0.0685882568359375, -0.05877685546875, -0.0489654541015625, -0.039154052734375, -0.0293426513671875, -0.01953125, -0.0097198486328125, 9.1552734375e-05, 0.0099029541015625, 0.01971435546875, 0.0295257568359375, 0.039337158203125, 0.0491485595703125, 0.0589599609375, 0.0687713623046875, 0.078582763671875, 0.0883941650390625, 0.09820556640625, 0.1080169677734375, 0.117828369140625, 0.1276397705078125, 0.137451171875, 0.1472625732421875, 0.157073974609375, 0.1668853759765625, 0.17669677734375, 0.1865081787109375, 0.196319580078125, 0.2061309814453125, 0.2159423828125, 0.2257537841796875, 0.235565185546875, 0.2453765869140625, 0.25518798828125, 0.2649993896484375, 0.274810791015625, 0.2846221923828125, 0.29443359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 21.0, 43.0, 94.0, 491.0, 2556.0, 673.0, 114.0, 35.0, 20.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1182861328125, -0.11326789855957031, -0.10824966430664062, -0.10323143005371094, -0.09821319580078125, -0.09319496154785156, -0.08817672729492188, -0.08315849304199219, -0.0781402587890625, -0.07312202453613281, -0.06810379028320312, -0.06308555603027344, -0.05806732177734375, -0.05304908752441406, -0.048030853271484375, -0.04301261901855469, -0.037994384765625, -0.03297615051269531, -0.027957916259765625, -0.022939682006835938, -0.01792144775390625, -0.012903213500976562, -0.007884979248046875, -0.0028667449951171875, 0.0021514892578125, 0.0071697235107421875, 0.012187957763671875, 0.017206192016601562, 0.02222442626953125, 0.027242660522460938, 0.032260894775390625, 0.03727912902832031, 0.04229736328125, 0.04731559753417969, 0.052333831787109375, 0.05735206604003906, 0.06237030029296875, 0.06738853454589844, 0.07240676879882812, 0.07742500305175781, 0.0824432373046875, 0.08746147155761719, 0.09247970581054688, 0.09749794006347656, 0.10251617431640625, 0.10753440856933594, 0.11255264282226562, 0.11757087707519531, 0.122589111328125, 0.1276073455810547, 0.13262557983398438, 0.13764381408691406, 0.14266204833984375, 0.14768028259277344, 0.15269851684570312, 0.1577167510986328, 0.1627349853515625, 0.1677532196044922, 0.17277145385742188, 0.17778968811035156, 0.18280792236328125, 0.18782615661621094, 0.19284439086914062, 0.1978626251220703, 0.202880859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 11.0, 18.0, 26.0, 49.0, 85.0, 120.0, 183.0, 160.0, 124.0, 101.0, 51.0, 25.0, 15.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3671375513076782, -0.3498218059539795, -0.33250606060028076, -0.31519031524658203, -0.2978745698928833, -0.28055882453918457, -0.26324307918548584, -0.2459273487329483, -0.22861160337924957, -0.21129585802555084, -0.1939801126718521, -0.17666438221931458, -0.15934863686561584, -0.14203289151191711, -0.12471714615821838, -0.10740140080451965, -0.09008565545082092, -0.07276991009712219, -0.05545416846871376, -0.03813842684030533, -0.020822681486606598, -0.0035069361329078674, 0.013808801770210266, 0.031124547123908997, 0.04844029247760773, 0.06575603783130646, 0.08307178318500519, 0.10038752108812332, 0.11770326644182205, 0.13501900434494019, 0.15233474969863892, 0.16965049505233765, 0.18696624040603638, 0.2042819857597351, 0.22159773111343384, 0.23891347646713257, 0.2562292218208313, 0.27354496717453003, 0.29086071252822876, 0.3081764578819275, 0.3254922032356262, 0.34280794858932495, 0.3601236939430237, 0.3774394392967224, 0.39475518465042114, 0.4120709300041199, 0.4293866753578186, 0.44670242071151733, 0.4640181362628937, 0.4813338816165924, 0.49864962697029114, 0.5159653425216675, 0.5332810878753662, 0.5505968332290649, 0.5679125785827637, 0.5852283239364624, 0.6025440692901611, 0.6198598146438599, 0.6371755599975586, 0.6544913053512573, 0.671807050704956, 0.6891227960586548, 0.7064385414123535, 0.7237542867660522, 0.741070032119751]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 7.0, 5.0, 6.0, 12.0, 7.0, 15.0, 15.0, 15.0, 15.0, 15.0, 17.0, 22.0, 43.0, 31.0, 39.0, 37.0, 35.0, 42.0, 46.0, 45.0, 47.0, 53.0, 46.0, 38.0, 38.0, 40.0, 28.0, 40.0, 35.0, 30.0, 26.0, 22.0, 14.0, 16.0, 13.0, 8.0, 6.0, 7.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.26610541343688965, -0.2573443651199341, -0.2485833317041397, -0.23982229828834534, -0.23106126487255096, -0.2223002314567566, -0.21353918313980103, -0.20477814972400665, -0.19601711630821228, -0.1872560828924179, -0.17849503457546234, -0.16973400115966797, -0.1609729677438736, -0.15221193432807922, -0.14345088601112366, -0.13468985259532928, -0.12592880427837372, -0.11716776341199875, -0.10840672999620438, -0.0996456891298294, -0.09088465571403503, -0.08212361484766006, -0.0733625739812851, -0.06460154056549072, -0.05584049969911575, -0.04707946255803108, -0.03831842541694641, -0.02955738455057144, -0.02079634740948677, -0.0120353102684021, -0.00327426940202713, 0.005486767739057541, 0.014247804880142212, 0.023008842021226883, 0.031769879162311554, 0.04053092002868652, 0.049291957169771194, 0.058052994310855865, 0.06681403517723083, 0.07557506859302521, 0.08433610945940018, 0.09309715032577515, 0.10185818374156952, 0.11061922460794449, 0.11938026547431946, 0.12814129889011383, 0.1369023323059082, 0.14566338062286377, 0.15442441403865814, 0.16318544745445251, 0.17194649577140808, 0.18070752918720245, 0.18946856260299683, 0.1982296109199524, 0.20699064433574677, 0.21575167775154114, 0.2245127260684967, 0.23327375948429108, 0.24203480780124664, 0.250795841217041, 0.2595568895339966, 0.26831790804862976, 0.2770789563655853, 0.2858400046825409, 0.2946010231971741]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 10.0, 8.0, 15.0, 19.0, 35.0, 53.0, 75.0, 132.0, 217.0, 434.0, 808.0, 1722.0, 3671.0, 8857.0, 23093.0, 69371.0, 244115.0, 452873.0, 165279.0, 48846.0, 16588.0, 6480.0, 2939.0, 1287.0, 705.0, 385.0, 215.0, 123.0, 69.0, 42.0, 27.0, 25.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0303497314453125, -0.029239892959594727, -0.028130054473876953, -0.02702021598815918, -0.025910377502441406, -0.024800539016723633, -0.02369070053100586, -0.022580862045288086, -0.021471023559570312, -0.02036118507385254, -0.019251346588134766, -0.018141508102416992, -0.01703166961669922, -0.015921831130981445, -0.014811992645263672, -0.013702154159545898, -0.012592315673828125, -0.011482477188110352, -0.010372638702392578, -0.009262800216674805, -0.008152961730957031, -0.007043123245239258, -0.005933284759521484, -0.004823446273803711, -0.0037136077880859375, -0.002603769302368164, -0.0014939308166503906, -0.0003840923309326172, 0.0007257461547851562, 0.0018355846405029297, 0.002945423126220703, 0.0040552616119384766, 0.00516510009765625, 0.0062749385833740234, 0.007384777069091797, 0.00849461555480957, 0.009604454040527344, 0.010714292526245117, 0.01182413101196289, 0.012933969497680664, 0.014043807983398438, 0.015153646469116211, 0.016263484954833984, 0.017373323440551758, 0.01848316192626953, 0.019593000411987305, 0.020702838897705078, 0.02181267738342285, 0.022922515869140625, 0.0240323543548584, 0.025142192840576172, 0.026252031326293945, 0.02736186981201172, 0.028471708297729492, 0.029581546783447266, 0.03069138526916504, 0.03180122375488281, 0.032911062240600586, 0.03402090072631836, 0.03513073921203613, 0.036240577697753906, 0.03735041618347168, 0.03846025466918945, 0.03957009315490723, 0.040679931640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 6.0, 11.0, 13.0, 18.0, 15.0, 13.0, 18.0, 20.0, 35.0, 30.0, 35.0, 59.0, 50.0, 53.0, 63.0, 66.0, 63.0, 53.0, 54.0, 56.0, 45.0, 38.0, 35.0, 29.0, 28.0, 21.0, 17.0, 9.0, 15.0, 9.0, 3.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0231475830078125, -0.022438526153564453, -0.021729469299316406, -0.02102041244506836, -0.020311355590820312, -0.019602298736572266, -0.01889324188232422, -0.018184185028076172, -0.017475128173828125, -0.016766071319580078, -0.01605701446533203, -0.015347957611083984, -0.014638900756835938, -0.01392984390258789, -0.013220787048339844, -0.012511730194091797, -0.01180267333984375, -0.011093616485595703, -0.010384559631347656, -0.00967550277709961, -0.008966445922851562, -0.008257389068603516, -0.007548332214355469, -0.006839275360107422, -0.006130218505859375, -0.005421161651611328, -0.004712104797363281, -0.004003047943115234, -0.0032939910888671875, -0.0025849342346191406, -0.0018758773803710938, -0.0011668205261230469, -0.000457763671875, 0.0002512931823730469, 0.0009603500366210938, 0.0016694068908691406, 0.0023784637451171875, 0.0030875205993652344, 0.0037965774536132812, 0.004505634307861328, 0.005214691162109375, 0.005923748016357422, 0.006632804870605469, 0.007341861724853516, 0.008050918579101562, 0.00875997543334961, 0.009469032287597656, 0.010178089141845703, 0.01088714599609375, 0.011596202850341797, 0.012305259704589844, 0.01301431655883789, 0.013723373413085938, 0.014432430267333984, 0.015141487121582031, 0.015850543975830078, 0.016559600830078125, 0.017268657684326172, 0.01797771453857422, 0.018686771392822266, 0.019395828247070312, 0.02010488510131836, 0.020813941955566406, 0.021522998809814453, 0.0222320556640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 4.0, 9.0, 8.0, 11.0, 24.0, 27.0, 36.0, 41.0, 64.0, 59.0, 93.0, 145.0, 228.0, 362.0, 440.0, 945.0, 2134.0, 6123.0, 25575.0, 187258.0, 731433.0, 73006.0, 13064.0, 3806.0, 1500.0, 740.0, 420.0, 260.0, 208.0, 144.0, 105.0, 59.0, 52.0, 31.0, 32.0, 20.0, 23.0, 17.0, 10.0, 9.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0], "bins": [-0.07611083984375, -0.07389068603515625, -0.0716705322265625, -0.06945037841796875, -0.067230224609375, -0.06501007080078125, -0.0627899169921875, -0.06056976318359375, -0.058349609375, -0.05612945556640625, -0.0539093017578125, -0.05168914794921875, -0.049468994140625, -0.04724884033203125, -0.0450286865234375, -0.04280853271484375, -0.04058837890625, -0.03836822509765625, -0.0361480712890625, -0.03392791748046875, -0.031707763671875, -0.02948760986328125, -0.0272674560546875, -0.02504730224609375, -0.0228271484375, -0.02060699462890625, -0.0183868408203125, -0.01616668701171875, -0.013946533203125, -0.01172637939453125, -0.0095062255859375, -0.00728607177734375, -0.00506591796875, -0.00284576416015625, -0.0006256103515625, 0.00159454345703125, 0.003814697265625, 0.00603485107421875, 0.0082550048828125, 0.01047515869140625, 0.0126953125, 0.01491546630859375, 0.0171356201171875, 0.01935577392578125, 0.021575927734375, 0.02379608154296875, 0.0260162353515625, 0.02823638916015625, 0.03045654296875, 0.03267669677734375, 0.0348968505859375, 0.03711700439453125, 0.039337158203125, 0.04155731201171875, 0.0437774658203125, 0.04599761962890625, 0.0482177734375, 0.05043792724609375, 0.0526580810546875, 0.05487823486328125, 0.057098388671875, 0.05931854248046875, 0.0615386962890625, 0.06375885009765625, 0.06597900390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 8.0, 5.0, 11.0, 10.0, 10.0, 14.0, 10.0, 14.0, 16.0, 27.0, 21.0, 44.0, 20.0, 35.0, 50.0, 46.0, 36.0, 53.0, 54.0, 46.0, 51.0, 57.0, 40.0, 52.0, 46.0, 37.0, 28.0, 26.0, 20.0, 19.0, 20.0, 13.0, 6.0, 14.0, 5.0, 9.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0831298828125, -0.08056926727294922, -0.07800865173339844, -0.07544803619384766, -0.07288742065429688, -0.0703268051147461, -0.06776618957519531, -0.06520557403564453, -0.06264495849609375, -0.06008434295654297, -0.05752372741699219, -0.054963111877441406, -0.052402496337890625, -0.049841880798339844, -0.04728126525878906, -0.04472064971923828, -0.0421600341796875, -0.03959941864013672, -0.03703880310058594, -0.034478187561035156, -0.031917572021484375, -0.029356956481933594, -0.026796340942382812, -0.02423572540283203, -0.02167510986328125, -0.01911449432373047, -0.016553878784179688, -0.013993263244628906, -0.011432647705078125, -0.008872032165527344, -0.0063114166259765625, -0.0037508010864257812, -0.001190185546875, 0.0013704299926757812, 0.0039310455322265625, 0.006491661071777344, 0.009052276611328125, 0.011612892150878906, 0.014173507690429688, 0.01673412322998047, 0.01929473876953125, 0.02185535430908203, 0.024415969848632812, 0.026976585388183594, 0.029537200927734375, 0.032097816467285156, 0.03465843200683594, 0.03721904754638672, 0.0397796630859375, 0.04234027862548828, 0.04490089416503906, 0.047461509704589844, 0.050022125244140625, 0.052582740783691406, 0.05514335632324219, 0.05770397186279297, 0.06026458740234375, 0.06282520294189453, 0.06538581848144531, 0.0679464340209961, 0.07050704956054688, 0.07306766510009766, 0.07562828063964844, 0.07818889617919922, 0.08074951171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 9.0, 11.0, 12.0, 11.0, 31.0, 18.0, 63.0, 93.0, 190.0, 300.0, 776.0, 1934.0, 6042.0, 25309.0, 172434.0, 764960.0, 59278.0, 11684.0, 3222.0, 1145.0, 479.0, 232.0, 125.0, 69.0, 41.0, 26.0, 13.0, 10.0, 10.0, 4.0, 4.0, 5.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02838134765625, -0.027210712432861328, -0.026040077209472656, -0.024869441986083984, -0.023698806762695312, -0.02252817153930664, -0.02135753631591797, -0.020186901092529297, -0.019016265869140625, -0.017845630645751953, -0.01667499542236328, -0.01550436019897461, -0.014333724975585938, -0.013163089752197266, -0.011992454528808594, -0.010821819305419922, -0.00965118408203125, -0.008480548858642578, -0.007309913635253906, -0.006139278411865234, -0.0049686431884765625, -0.0037980079650878906, -0.0026273727416992188, -0.0014567375183105469, -0.000286102294921875, 0.0008845329284667969, 0.0020551681518554688, 0.0032258033752441406, 0.0043964385986328125, 0.005567073822021484, 0.006737709045410156, 0.007908344268798828, 0.0090789794921875, 0.010249614715576172, 0.011420249938964844, 0.012590885162353516, 0.013761520385742188, 0.01493215560913086, 0.01610279083251953, 0.017273426055908203, 0.018444061279296875, 0.019614696502685547, 0.02078533172607422, 0.02195596694946289, 0.023126602172851562, 0.024297237396240234, 0.025467872619628906, 0.026638507843017578, 0.02780914306640625, 0.028979778289794922, 0.030150413513183594, 0.031321048736572266, 0.03249168395996094, 0.03366231918334961, 0.03483295440673828, 0.03600358963012695, 0.037174224853515625, 0.0383448600769043, 0.03951549530029297, 0.04068613052368164, 0.04185676574707031, 0.043027400970458984, 0.044198036193847656, 0.04536867141723633, 0.046539306640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 1.0, 7.0, 7.0, 14.0, 21.0, 29.0, 41.0, 53.0, 60.0, 88.0, 90.0, 94.0, 99.0, 87.0, 73.0, 51.0, 50.0, 35.0, 25.0, 13.0, 12.0, 7.0, 7.0, 7.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.035234451293945e-05, -3.919471055269241e-05, -3.8037076592445374e-05, -3.6879442632198334e-05, -3.5721808671951294e-05, -3.4564174711704254e-05, -3.3406540751457214e-05, -3.2248906791210175e-05, -3.1091272830963135e-05, -2.9933638870716095e-05, -2.8776004910469055e-05, -2.7618370950222015e-05, -2.6460736989974976e-05, -2.5303103029727936e-05, -2.4145469069480896e-05, -2.2987835109233856e-05, -2.1830201148986816e-05, -2.0672567188739777e-05, -1.9514933228492737e-05, -1.8357299268245697e-05, -1.7199665307998657e-05, -1.6042031347751617e-05, -1.4884397387504578e-05, -1.3726763427257538e-05, -1.2569129467010498e-05, -1.1411495506763458e-05, -1.0253861546516418e-05, -9.096227586269379e-06, -7.938593626022339e-06, -6.780959665775299e-06, -5.623325705528259e-06, -4.4656917452812195e-06, -3.3080577850341797e-06, -2.15042382478714e-06, -9.927898645401e-07, 1.648440957069397e-07, 1.3224780559539795e-06, 2.4801120162010193e-06, 3.637745976448059e-06, 4.795379936695099e-06, 5.953013896942139e-06, 7.1106478571891785e-06, 8.268281817436218e-06, 9.425915777683258e-06, 1.0583549737930298e-05, 1.1741183698177338e-05, 1.2898817658424377e-05, 1.4056451618671417e-05, 1.5214085578918457e-05, 1.6371719539165497e-05, 1.7529353499412537e-05, 1.8686987459659576e-05, 1.9844621419906616e-05, 2.1002255380153656e-05, 2.2159889340400696e-05, 2.3317523300647736e-05, 2.4475157260894775e-05, 2.5632791221141815e-05, 2.6790425181388855e-05, 2.7948059141635895e-05, 2.9105693101882935e-05, 3.0263327062129974e-05, 3.1420961022377014e-05, 3.2578594982624054e-05, 3.3736228942871094e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 15.0, 21.0, 28.0, 63.0, 95.0, 158.0, 319.0, 659.0, 1820.0, 5634.0, 25978.0, 254355.0, 708372.0, 39510.0, 7682.0, 2226.0, 831.0, 373.0, 170.0, 88.0, 48.0, 36.0, 23.0, 13.0, 10.0, 7.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04168701171875, -0.04034709930419922, -0.03900718688964844, -0.037667274475097656, -0.036327362060546875, -0.034987449645996094, -0.03364753723144531, -0.03230762481689453, -0.03096771240234375, -0.02962779998779297, -0.028287887573242188, -0.026947975158691406, -0.025608062744140625, -0.024268150329589844, -0.022928237915039062, -0.02158832550048828, -0.0202484130859375, -0.01890850067138672, -0.017568588256835938, -0.016228675842285156, -0.014888763427734375, -0.013548851013183594, -0.012208938598632812, -0.010869026184082031, -0.00952911376953125, -0.008189201354980469, -0.0068492889404296875, -0.005509376525878906, -0.004169464111328125, -0.0028295516967773438, -0.0014896392822265625, -0.00014972686767578125, 0.001190185546875, 0.0025300979614257812, 0.0038700103759765625, 0.005209922790527344, 0.006549835205078125, 0.007889747619628906, 0.009229660034179688, 0.010569572448730469, 0.01190948486328125, 0.013249397277832031, 0.014589309692382812, 0.015929222106933594, 0.017269134521484375, 0.018609046936035156, 0.019948959350585938, 0.02128887176513672, 0.0226287841796875, 0.02396869659423828, 0.025308609008789062, 0.026648521423339844, 0.027988433837890625, 0.029328346252441406, 0.030668258666992188, 0.03200817108154297, 0.03334808349609375, 0.03468799591064453, 0.03602790832519531, 0.037367820739746094, 0.038707733154296875, 0.040047645568847656, 0.04138755798339844, 0.04272747039794922, 0.0440673828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 4.0, 5.0, 14.0, 13.0, 12.0, 22.0, 27.0, 43.0, 66.0, 84.0, 98.0, 166.0, 143.0, 75.0, 66.0, 42.0, 29.0, 27.0, 19.0, 8.0, 7.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0261993408203125, -0.0251767635345459, -0.024154186248779297, -0.023131608963012695, -0.022109031677246094, -0.021086454391479492, -0.02006387710571289, -0.01904129981994629, -0.018018722534179688, -0.016996145248413086, -0.015973567962646484, -0.014950990676879883, -0.013928413391113281, -0.01290583610534668, -0.011883258819580078, -0.010860681533813477, -0.009838104248046875, -0.008815526962280273, -0.007792949676513672, -0.00677037239074707, -0.005747795104980469, -0.004725217819213867, -0.0037026405334472656, -0.002680063247680664, -0.0016574859619140625, -0.0006349086761474609, 0.0003876686096191406, 0.0014102458953857422, 0.0024328231811523438, 0.0034554004669189453, 0.004477977752685547, 0.0055005550384521484, 0.00652313232421875, 0.0075457096099853516, 0.008568286895751953, 0.009590864181518555, 0.010613441467285156, 0.011636018753051758, 0.01265859603881836, 0.013681173324584961, 0.014703750610351562, 0.015726327896118164, 0.016748905181884766, 0.017771482467651367, 0.01879405975341797, 0.01981663703918457, 0.020839214324951172, 0.021861791610717773, 0.022884368896484375, 0.023906946182250977, 0.024929523468017578, 0.02595210075378418, 0.02697467803955078, 0.027997255325317383, 0.029019832611083984, 0.030042409896850586, 0.031064987182617188, 0.03208756446838379, 0.03311014175415039, 0.03413271903991699, 0.035155296325683594, 0.036177873611450195, 0.0372004508972168, 0.0382230281829834, 0.03924560546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 8.0, 11.0, 32.0, 61.0, 120.0, 277.0, 291.0, 107.0, 38.0, 21.0, 7.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.2841212749481201, -1.25989830493927, -1.23567533493042, -1.2114523649215698, -1.1872293949127197, -1.1630065441131592, -1.138783574104309, -1.114560604095459, -1.0903376340866089, -1.0661146640777588, -1.0418916940689087, -1.0176687240600586, -0.9934458136558533, -0.9692228436470032, -0.9449999332427979, -0.9207769632339478, -0.8965539932250977, -0.8723310232162476, -0.8481080532073975, -0.8238851428031921, -0.799662172794342, -0.7754392027854919, -0.7512162923812866, -0.7269933223724365, -0.7027703523635864, -0.6785473823547363, -0.6543244123458862, -0.6301015019416809, -0.6058785319328308, -0.5816555619239807, -0.5574326515197754, -0.5332096815109253, -0.5089866518974304, -0.4847636818885803, -0.4605407416820526, -0.4363178014755249, -0.4120948314666748, -0.3878718614578247, -0.363648921251297, -0.3394259810447693, -0.3152030110359192, -0.2909800410270691, -0.2667571008205414, -0.24253414571285248, -0.21831119060516357, -0.19408823549747467, -0.16986528038978577, -0.14564232528209686, -0.12141937017440796, -0.09719641506671906, -0.07297345995903015, -0.04875050485134125, -0.024527549743652344, -0.00030459463596343994, 0.023918360471725464, 0.04814131557941437, 0.07236427068710327, 0.09658722579479218, 0.12081018090248108, 0.14503313601016998, 0.1692560911178589, 0.1934790462255478, 0.2177020013332367, 0.2419249564409256, 0.2661479115486145]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 2.0, 4.0, 7.0, 2.0, 7.0, 7.0, 11.0, 8.0, 8.0, 15.0, 21.0, 19.0, 21.0, 22.0, 32.0, 30.0, 23.0, 35.0, 28.0, 62.0, 115.0, 113.0, 61.0, 42.0, 32.0, 40.0, 22.0, 25.0, 27.0, 22.0, 22.0, 19.0, 8.0, 11.0, 11.0, 11.0, 6.0, 12.0, 7.0, 6.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.3943328261375427, -0.38268956542015076, -0.3710463345050812, -0.3594030737876892, -0.34775984287261963, -0.33611658215522766, -0.3244733214378357, -0.3128300905227661, -0.30118682980537415, -0.2895435690879822, -0.2779003381729126, -0.26625707745552063, -0.25461381673812866, -0.24297058582305908, -0.23132732510566711, -0.21968407928943634, -0.20804083347320557, -0.1963975876569748, -0.18475434184074402, -0.17311108112335205, -0.16146783530712128, -0.1498245894908905, -0.13818132877349854, -0.12653808295726776, -0.11489483714103699, -0.10325159132480621, -0.09160833805799484, -0.07996508479118347, -0.0683218389749527, -0.056678589433431625, -0.04503533989191055, -0.03339208662509918, -0.021748840808868408, -0.010105591267347336, 0.0015376582741737366, 0.013180907815694809, 0.02482415735721588, 0.036467406898736954, 0.048110656440258026, 0.0597539097070694, 0.07139715552330017, 0.08304040133953094, 0.09468365460634232, 0.10632690787315369, 0.11797015368938446, 0.12961339950561523, 0.1412566602230072, 0.15289990603923798, 0.16454315185546875, 0.17618639767169952, 0.1878296434879303, 0.19947290420532227, 0.21111615002155304, 0.2227593958377838, 0.23440265655517578, 0.24604590237140656, 0.25768914818763733, 0.2693324089050293, 0.2809756398200989, 0.29261890053749084, 0.3042621612548828, 0.3159053921699524, 0.32754865288734436, 0.33919191360473633, 0.3508351445198059]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 10.0, 11.0, 14.0, 18.0, 17.0, 27.0, 38.0, 49.0, 70.0, 105.0, 147.0, 247.0, 342.0, 557.0, 900.0, 1594.0, 3057.0, 6366.0, 16977.0, 74818.0, 715767.0, 2893330.0, 404477.0, 50916.0, 13207.0, 5143.0, 2496.0, 1326.0, 791.0, 465.0, 310.0, 194.0, 143.0, 89.0, 65.0, 44.0, 31.0, 28.0, 22.0, 26.0, 10.0, 9.0, 11.0, 3.0, 4.0, 2.0, 0.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03668212890625, -0.03551340103149414, -0.03434467315673828, -0.03317594528198242, -0.03200721740722656, -0.030838489532470703, -0.029669761657714844, -0.028501033782958984, -0.027332305908203125, -0.026163578033447266, -0.024994850158691406, -0.023826122283935547, -0.022657394409179688, -0.021488666534423828, -0.02031993865966797, -0.01915121078491211, -0.01798248291015625, -0.01681375503540039, -0.01564502716064453, -0.014476299285888672, -0.013307571411132812, -0.012138843536376953, -0.010970115661621094, -0.009801387786865234, -0.008632659912109375, -0.007463932037353516, -0.006295204162597656, -0.005126476287841797, -0.0039577484130859375, -0.002789020538330078, -0.0016202926635742188, -0.0004515647888183594, 0.0007171630859375, 0.0018858909606933594, 0.0030546188354492188, 0.004223346710205078, 0.0053920745849609375, 0.006560802459716797, 0.007729530334472656, 0.008898258209228516, 0.010066986083984375, 0.011235713958740234, 0.012404441833496094, 0.013573169708251953, 0.014741897583007812, 0.015910625457763672, 0.01707935333251953, 0.01824808120727539, 0.01941680908203125, 0.02058553695678711, 0.02175426483154297, 0.022922992706298828, 0.024091720581054688, 0.025260448455810547, 0.026429176330566406, 0.027597904205322266, 0.028766632080078125, 0.029935359954833984, 0.031104087829589844, 0.0322728157043457, 0.03344154357910156, 0.03461027145385742, 0.03577899932861328, 0.03694772720336914, 0.038116455078125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 4.0, 7.0, 9.0, 13.0, 4.0, 24.0, 18.0, 22.0, 30.0, 35.0, 32.0, 47.0, 54.0, 54.0, 51.0, 59.0, 66.0, 46.0, 52.0, 39.0, 46.0, 47.0, 36.0, 40.0, 29.0, 23.0, 20.0, 18.0, 13.0, 14.0, 8.0, 7.0, 6.0, 5.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02337646484375, -0.02267765998840332, -0.02197885513305664, -0.02128005027770996, -0.02058124542236328, -0.0198824405670166, -0.019183635711669922, -0.018484830856323242, -0.017786026000976562, -0.017087221145629883, -0.016388416290283203, -0.015689611434936523, -0.014990806579589844, -0.014292001724243164, -0.013593196868896484, -0.012894392013549805, -0.012195587158203125, -0.011496782302856445, -0.010797977447509766, -0.010099172592163086, -0.009400367736816406, -0.008701562881469727, -0.008002758026123047, -0.007303953170776367, -0.0066051483154296875, -0.005906343460083008, -0.005207538604736328, -0.0045087337493896484, -0.0038099288940429688, -0.003111124038696289, -0.0024123191833496094, -0.0017135143280029297, -0.00101470947265625, -0.0003159046173095703, 0.0003829002380371094, 0.001081705093383789, 0.0017805099487304688, 0.0024793148040771484, 0.003178119659423828, 0.003876924514770508, 0.0045757293701171875, 0.005274534225463867, 0.005973339080810547, 0.0066721439361572266, 0.007370948791503906, 0.008069753646850586, 0.008768558502197266, 0.009467363357543945, 0.010166168212890625, 0.010864973068237305, 0.011563777923583984, 0.012262582778930664, 0.012961387634277344, 0.013660192489624023, 0.014358997344970703, 0.015057802200317383, 0.015756607055664062, 0.016455411911010742, 0.017154216766357422, 0.0178530216217041, 0.01855182647705078, 0.01925063133239746, 0.01994943618774414, 0.02064824104309082, 0.0213470458984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 9.0, 12.0, 32.0, 61.0, 105.0, 304.0, 716.0, 2384.0, 19290.0, 4144639.0, 22623.0, 2683.0, 862.0, 312.0, 137.0, 63.0, 15.0, 13.0, 7.0, 8.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28515625, -0.2763862609863281, -0.26761627197265625, -0.2588462829589844, -0.2500762939453125, -0.24130630493164062, -0.23253631591796875, -0.22376632690429688, -0.214996337890625, -0.20622634887695312, -0.19745635986328125, -0.18868637084960938, -0.1799163818359375, -0.17114639282226562, -0.16237640380859375, -0.15360641479492188, -0.14483642578125, -0.13606643676757812, -0.12729644775390625, -0.11852645874023438, -0.1097564697265625, -0.10098648071289062, -0.09221649169921875, -0.08344650268554688, -0.074676513671875, -0.06590652465820312, -0.05713653564453125, -0.048366546630859375, -0.0395965576171875, -0.030826568603515625, -0.02205657958984375, -0.013286590576171875, -0.0045166015625, 0.004253387451171875, 0.01302337646484375, 0.021793365478515625, 0.0305633544921875, 0.039333343505859375, 0.04810333251953125, 0.056873321533203125, 0.065643310546875, 0.07441329956054688, 0.08318328857421875, 0.09195327758789062, 0.1007232666015625, 0.10949325561523438, 0.11826324462890625, 0.12703323364257812, 0.13580322265625, 0.14457321166992188, 0.15334320068359375, 0.16211318969726562, 0.1708831787109375, 0.17965316772460938, 0.18842315673828125, 0.19719314575195312, 0.205963134765625, 0.21473312377929688, 0.22350311279296875, 0.23227310180664062, 0.2410430908203125, 0.24981307983398438, 0.25858306884765625, 0.2673530578613281, 0.276123046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 18.0, 58.0, 123.0, 599.0, 2263.0, 746.0, 150.0, 53.0, 23.0, 14.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.188720703125, -0.1827392578125, -0.1767578125, -0.1707763671875, -0.164794921875, -0.1588134765625, -0.15283203125, -0.1468505859375, -0.140869140625, -0.1348876953125, -0.12890625, -0.1229248046875, -0.116943359375, -0.1109619140625, -0.10498046875, -0.0989990234375, -0.093017578125, -0.0870361328125, -0.0810546875, -0.0750732421875, -0.069091796875, -0.0631103515625, -0.05712890625, -0.0511474609375, -0.045166015625, -0.0391845703125, -0.033203125, -0.0272216796875, -0.021240234375, -0.0152587890625, -0.00927734375, -0.0032958984375, 0.002685546875, 0.0086669921875, 0.0146484375, 0.0206298828125, 0.026611328125, 0.0325927734375, 0.03857421875, 0.0445556640625, 0.050537109375, 0.0565185546875, 0.0625, 0.0684814453125, 0.074462890625, 0.0804443359375, 0.08642578125, 0.0924072265625, 0.098388671875, 0.1043701171875, 0.1103515625, 0.1163330078125, 0.122314453125, 0.1282958984375, 0.13427734375, 0.1402587890625, 0.146240234375, 0.1522216796875, 0.158203125, 0.1641845703125, 0.170166015625, 0.1761474609375, 0.18212890625, 0.1881103515625, 0.194091796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 9.0, 23.0, 57.0, 139.0, 308.0, 245.0, 120.0, 43.0, 25.0, 15.0, 7.0, 2.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5114376544952393, -0.4679955840110779, -0.4245535135269165, -0.3811114430427551, -0.33766937255859375, -0.2942273020744324, -0.2507852017879486, -0.20734313130378723, -0.16390106081962585, -0.12045899033546448, -0.0770169124007225, -0.03357483446598053, 0.009867236018180847, 0.053309306502342224, 0.0967513918876648, 0.14019346237182617, 0.18363553285598755, 0.22707760334014893, 0.2705196738243103, 0.3139617443084717, 0.35740381479263306, 0.40084588527679443, 0.4442879855632782, 0.4877300560474396, 0.5311721563339233, 0.5746142268180847, 0.6180562973022461, 0.6614983677864075, 0.7049404382705688, 0.7483825087547302, 0.7918245792388916, 0.8352667093276978, 0.8787087202072144, 0.9221507906913757, 0.9655928611755371, 1.0090349912643433, 1.0524770021438599, 1.095919132232666, 1.1393611431121826, 1.1828032732009888, 1.2262452840805054, 1.2696874141693115, 1.3131294250488281, 1.3565715551376343, 1.4000135660171509, 1.443455696105957, 1.4868977069854736, 1.5303398370742798, 1.573781967163086, 1.617224097251892, 1.6606661081314087, 1.7041082382202148, 1.7475502490997314, 1.7909923791885376, 1.8344343900680542, 1.8778765201568604, 1.921318531036377, 1.964760661125183, 2.0082027912139893, 2.051644802093506, 2.0950868129730225, 2.138528823852539, 2.1819710731506348, 2.2254130840301514, 2.268855094909668]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 12.0, 15.0, 12.0, 17.0, 22.0, 26.0, 37.0, 41.0, 41.0, 83.0, 51.0, 61.0, 50.0, 70.0, 55.0, 56.0, 58.0, 48.0, 40.0, 46.0, 37.0, 39.0, 21.0, 20.0, 11.0, 10.0, 5.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.693741500377655, -0.6767563819885254, -0.6597713232040405, -0.6427862048149109, -0.6258010864257812, -0.6088159680366516, -0.591830849647522, -0.5748457908630371, -0.5578606724739075, -0.5408755540847778, -0.523890495300293, -0.5069053769111633, -0.4899202585220337, -0.47293514013290405, -0.4559500515460968, -0.43896496295928955, -0.4219798445701599, -0.4049947261810303, -0.388009637594223, -0.37102454900741577, -0.35403943061828613, -0.3370543122291565, -0.32006922364234924, -0.303084135055542, -0.28609901666641235, -0.2691138982772827, -0.25212880969047546, -0.23514370620250702, -0.21815860271453857, -0.20117349922657013, -0.18418839573860168, -0.16720329225063324, -0.15021824836730957, -0.13323314487934113, -0.11624804139137268, -0.09926293790340424, -0.08227783441543579, -0.06529273092746735, -0.0483076274394989, -0.03132252395153046, -0.014337420463562012, 0.002647683024406433, 0.019632786512374878, 0.03661789000034332, 0.05360299348831177, 0.07058809697628021, 0.08757320046424866, 0.1045583039522171, 0.12154340744018555, 0.138528510928154, 0.15551361441612244, 0.17249871790409088, 0.18948382139205933, 0.20646892488002777, 0.22345402836799622, 0.24043913185596466, 0.2574242353439331, 0.27440935373306274, 0.29139444231987, 0.30837953090667725, 0.3253646492958069, 0.3423497676849365, 0.3593348562717438, 0.376319944858551, 0.39330506324768066]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 9.0, 10.0, 15.0, 14.0, 36.0, 72.0, 115.0, 183.0, 354.0, 660.0, 1340.0, 2893.0, 7600.0, 23547.0, 92293.0, 467965.0, 352607.0, 68905.0, 18717.0, 6279.0, 2462.0, 1134.0, 605.0, 306.0, 165.0, 112.0, 62.0, 36.0, 28.0, 7.0, 10.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0584716796875, -0.05657958984375, -0.0546875, -0.05279541015625, -0.0509033203125, -0.04901123046875, -0.047119140625, -0.04522705078125, -0.0433349609375, -0.04144287109375, -0.03955078125, -0.03765869140625, -0.0357666015625, -0.03387451171875, -0.031982421875, -0.03009033203125, -0.0281982421875, -0.02630615234375, -0.0244140625, -0.02252197265625, -0.0206298828125, -0.01873779296875, -0.016845703125, -0.01495361328125, -0.0130615234375, -0.01116943359375, -0.00927734375, -0.00738525390625, -0.0054931640625, -0.00360107421875, -0.001708984375, 0.00018310546875, 0.0020751953125, 0.00396728515625, 0.005859375, 0.00775146484375, 0.0096435546875, 0.01153564453125, 0.013427734375, 0.01531982421875, 0.0172119140625, 0.01910400390625, 0.02099609375, 0.02288818359375, 0.0247802734375, 0.02667236328125, 0.028564453125, 0.03045654296875, 0.0323486328125, 0.03424072265625, 0.0361328125, 0.03802490234375, 0.0399169921875, 0.04180908203125, 0.043701171875, 0.04559326171875, 0.0474853515625, 0.04937744140625, 0.05126953125, 0.05316162109375, 0.0550537109375, 0.05694580078125, 0.058837890625, 0.06072998046875, 0.0626220703125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 5.0, 8.0, 6.0, 11.0, 10.0, 19.0, 16.0, 21.0, 17.0, 22.0, 34.0, 28.0, 31.0, 34.0, 54.0, 43.0, 47.0, 52.0, 45.0, 64.0, 61.0, 42.0, 43.0, 28.0, 38.0, 32.0, 34.0, 25.0, 21.0, 17.0, 13.0, 9.0, 9.0, 13.0, 11.0, 4.0, 7.0, 7.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0236358642578125, -0.022861242294311523, -0.022086620330810547, -0.02131199836730957, -0.020537376403808594, -0.019762754440307617, -0.01898813247680664, -0.018213510513305664, -0.017438888549804688, -0.01666426658630371, -0.015889644622802734, -0.015115022659301758, -0.014340400695800781, -0.013565778732299805, -0.012791156768798828, -0.012016534805297852, -0.011241912841796875, -0.010467290878295898, -0.009692668914794922, -0.008918046951293945, -0.008143424987792969, -0.007368803024291992, -0.006594181060791016, -0.005819559097290039, -0.0050449371337890625, -0.004270315170288086, -0.0034956932067871094, -0.002721071243286133, -0.0019464492797851562, -0.0011718273162841797, -0.0003972053527832031, 0.00037741661071777344, 0.00115203857421875, 0.0019266605377197266, 0.002701282501220703, 0.0034759044647216797, 0.004250526428222656, 0.005025148391723633, 0.005799770355224609, 0.006574392318725586, 0.0073490142822265625, 0.008123636245727539, 0.008898258209228516, 0.009672880172729492, 0.010447502136230469, 0.011222124099731445, 0.011996746063232422, 0.012771368026733398, 0.013545989990234375, 0.014320611953735352, 0.015095233917236328, 0.015869855880737305, 0.01664447784423828, 0.017419099807739258, 0.018193721771240234, 0.01896834373474121, 0.019742965698242188, 0.020517587661743164, 0.02129220962524414, 0.022066831588745117, 0.022841453552246094, 0.02361607551574707, 0.024390697479248047, 0.025165319442749023, 0.02593994140625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 7.0, 4.0, 8.0, 6.0, 17.0, 21.0, 26.0, 53.0, 58.0, 77.0, 85.0, 132.0, 166.0, 288.0, 454.0, 758.0, 1310.0, 3275.0, 11348.0, 98363.0, 859900.0, 58055.0, 8281.0, 2572.0, 1252.0, 670.0, 403.0, 281.0, 192.0, 124.0, 98.0, 58.0, 43.0, 42.0, 31.0, 15.0, 15.0, 11.0, 8.0, 7.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.096435546875, -0.09304046630859375, -0.0896453857421875, -0.08625030517578125, -0.082855224609375, -0.07946014404296875, -0.0760650634765625, -0.07266998291015625, -0.06927490234375, -0.06587982177734375, -0.0624847412109375, -0.05908966064453125, -0.055694580078125, -0.05229949951171875, -0.0489044189453125, -0.04550933837890625, -0.0421142578125, -0.03871917724609375, -0.0353240966796875, -0.03192901611328125, -0.028533935546875, -0.02513885498046875, -0.0217437744140625, -0.01834869384765625, -0.01495361328125, -0.01155853271484375, -0.0081634521484375, -0.00476837158203125, -0.001373291015625, 0.00202178955078125, 0.0054168701171875, 0.00881195068359375, 0.01220703125, 0.01560211181640625, 0.0189971923828125, 0.02239227294921875, 0.025787353515625, 0.02918243408203125, 0.0325775146484375, 0.03597259521484375, 0.03936767578125, 0.04276275634765625, 0.0461578369140625, 0.04955291748046875, 0.052947998046875, 0.05634307861328125, 0.0597381591796875, 0.06313323974609375, 0.0665283203125, 0.06992340087890625, 0.0733184814453125, 0.07671356201171875, 0.080108642578125, 0.08350372314453125, 0.0868988037109375, 0.09029388427734375, 0.09368896484375, 0.09708404541015625, 0.1004791259765625, 0.10387420654296875, 0.107269287109375, 0.11066436767578125, 0.1140594482421875, 0.11745452880859375, 0.120849609375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 2.0, 3.0, 7.0, 8.0, 14.0, 11.0, 18.0, 17.0, 29.0, 26.0, 37.0, 50.0, 54.0, 51.0, 69.0, 63.0, 69.0, 64.0, 55.0, 67.0, 46.0, 49.0, 37.0, 25.0, 28.0, 20.0, 15.0, 15.0, 6.0, 11.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.13761138916015625, -0.1337432861328125, -0.12987518310546875, -0.126007080078125, -0.12213897705078125, -0.1182708740234375, -0.11440277099609375, -0.11053466796875, -0.10666656494140625, -0.1027984619140625, -0.09893035888671875, -0.095062255859375, -0.09119415283203125, -0.0873260498046875, -0.08345794677734375, -0.07958984375, -0.07572174072265625, -0.0718536376953125, -0.06798553466796875, -0.064117431640625, -0.06024932861328125, -0.0563812255859375, -0.05251312255859375, -0.04864501953125, -0.04477691650390625, -0.0409088134765625, -0.03704071044921875, -0.033172607421875, -0.02930450439453125, -0.0254364013671875, -0.02156829833984375, -0.0177001953125, -0.01383209228515625, -0.0099639892578125, -0.00609588623046875, -0.002227783203125, 0.00164031982421875, 0.0055084228515625, 0.00937652587890625, 0.01324462890625, 0.01711273193359375, 0.0209808349609375, 0.02484893798828125, 0.028717041015625, 0.03258514404296875, 0.0364532470703125, 0.04032135009765625, 0.044189453125, 0.04805755615234375, 0.0519256591796875, 0.05579376220703125, 0.059661865234375, 0.06352996826171875, 0.0673980712890625, 0.07126617431640625, 0.07513427734375, 0.07900238037109375, 0.0828704833984375, 0.08673858642578125, 0.090606689453125, 0.09447479248046875, 0.0983428955078125, 0.10221099853515625, 0.1060791015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 6.0, 22.0, 24.0, 42.0, 102.0, 250.0, 810.0, 4070.0, 47007.0, 947486.0, 43478.0, 3954.0, 829.0, 264.0, 102.0, 45.0, 23.0, 11.0, 8.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0501708984375, -0.04827690124511719, -0.046382904052734375, -0.04448890686035156, -0.04259490966796875, -0.04070091247558594, -0.038806915283203125, -0.03691291809082031, -0.0350189208984375, -0.03312492370605469, -0.031230926513671875, -0.029336929321289062, -0.02744293212890625, -0.025548934936523438, -0.023654937744140625, -0.021760940551757812, -0.019866943359375, -0.017972946166992188, -0.016078948974609375, -0.014184951782226562, -0.01229095458984375, -0.010396957397460938, -0.008502960205078125, -0.0066089630126953125, -0.0047149658203125, -0.0028209686279296875, -0.000926971435546875, 0.0009670257568359375, 0.00286102294921875, 0.0047550201416015625, 0.006649017333984375, 0.008543014526367188, 0.01043701171875, 0.012331008911132812, 0.014225006103515625, 0.016119003295898438, 0.01801300048828125, 0.019906997680664062, 0.021800994873046875, 0.023694992065429688, 0.0255889892578125, 0.027482986450195312, 0.029376983642578125, 0.03127098083496094, 0.03316497802734375, 0.03505897521972656, 0.036952972412109375, 0.03884696960449219, 0.040740966796875, 0.04263496398925781, 0.044528961181640625, 0.04642295837402344, 0.04831695556640625, 0.05021095275878906, 0.052104949951171875, 0.05399894714355469, 0.0558929443359375, 0.05778694152832031, 0.059680938720703125, 0.06157493591308594, 0.06346893310546875, 0.06536293029785156, 0.06725692749023438, 0.06915092468261719, 0.071044921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 7.0, 20.0, 26.0, 25.0, 41.0, 55.0, 93.0, 92.0, 147.0, 128.0, 106.0, 78.0, 48.0, 29.0, 30.0, 21.0, 17.0, 6.0, 8.0, 6.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6803226470947266e-05, -5.496945232152939e-05, -5.313567817211151e-05, -5.1301904022693634e-05, -4.946812987327576e-05, -4.763435572385788e-05, -4.580058157444e-05, -4.3966807425022125e-05, -4.213303327560425e-05, -4.029925912618637e-05, -3.8465484976768494e-05, -3.6631710827350616e-05, -3.479793667793274e-05, -3.296416252851486e-05, -3.1130388379096985e-05, -2.9296614229679108e-05, -2.746284008026123e-05, -2.5629065930843353e-05, -2.3795291781425476e-05, -2.19615176320076e-05, -2.012774348258972e-05, -1.8293969333171844e-05, -1.6460195183753967e-05, -1.462642103433609e-05, -1.2792646884918213e-05, -1.0958872735500336e-05, -9.125098586082458e-06, -7.291324436664581e-06, -5.457550287246704e-06, -3.623776137828827e-06, -1.7900019884109497e-06, 4.377216100692749e-08, 1.8775463104248047e-06, 3.711320459842682e-06, 5.545094609260559e-06, 7.378868758678436e-06, 9.212642908096313e-06, 1.104641705751419e-05, 1.2880191206932068e-05, 1.4713965356349945e-05, 1.6547739505767822e-05, 1.83815136551857e-05, 2.0215287804603577e-05, 2.2049061954021454e-05, 2.388283610343933e-05, 2.5716610252857208e-05, 2.7550384402275085e-05, 2.9384158551692963e-05, 3.121793270111084e-05, 3.305170685052872e-05, 3.4885480999946594e-05, 3.671925514936447e-05, 3.855302929878235e-05, 4.0386803448200226e-05, 4.22205775976181e-05, 4.405435174703598e-05, 4.588812589645386e-05, 4.7721900045871735e-05, 4.955567419528961e-05, 5.138944834470749e-05, 5.3223222494125366e-05, 5.5056996643543243e-05, 5.689077079296112e-05, 5.8724544942379e-05, 6.0558319091796875e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 3.0, 0.0, 4.0, 6.0, 6.0, 10.0, 11.0, 20.0, 27.0, 44.0, 61.0, 92.0, 114.0, 191.0, 295.0, 498.0, 1092.0, 2437.0, 7127.0, 32042.0, 479452.0, 480584.0, 32005.0, 7333.0, 2543.0, 1075.0, 574.0, 334.0, 183.0, 134.0, 72.0, 59.0, 34.0, 19.0, 24.0, 17.0, 10.0, 3.0, 4.0, 8.0, 1.0, 2.0, 0.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034637451171875, -0.033555030822753906, -0.03247261047363281, -0.03139019012451172, -0.030307769775390625, -0.02922534942626953, -0.028142929077148438, -0.027060508728027344, -0.02597808837890625, -0.024895668029785156, -0.023813247680664062, -0.02273082733154297, -0.021648406982421875, -0.02056598663330078, -0.019483566284179688, -0.018401145935058594, -0.0173187255859375, -0.016236305236816406, -0.015153884887695312, -0.014071464538574219, -0.012989044189453125, -0.011906623840332031, -0.010824203491210938, -0.009741783142089844, -0.00865936279296875, -0.007576942443847656, -0.0064945220947265625, -0.005412101745605469, -0.004329681396484375, -0.0032472610473632812, -0.0021648406982421875, -0.0010824203491210938, 0.0, 0.0010824203491210938, 0.0021648406982421875, 0.0032472610473632812, 0.004329681396484375, 0.005412101745605469, 0.0064945220947265625, 0.007576942443847656, 0.00865936279296875, 0.009741783142089844, 0.010824203491210938, 0.011906623840332031, 0.012989044189453125, 0.014071464538574219, 0.015153884887695312, 0.016236305236816406, 0.0173187255859375, 0.018401145935058594, 0.019483566284179688, 0.02056598663330078, 0.021648406982421875, 0.02273082733154297, 0.023813247680664062, 0.024895668029785156, 0.02597808837890625, 0.027060508728027344, 0.028142929077148438, 0.02922534942626953, 0.030307769775390625, 0.03139019012451172, 0.03247261047363281, 0.033555030822753906, 0.034637451171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 8.0, 6.0, 14.0, 12.0, 28.0, 34.0, 41.0, 61.0, 81.0, 109.0, 155.0, 121.0, 77.0, 76.0, 51.0, 27.0, 17.0, 23.0, 12.0, 10.0, 2.0, 9.0, 11.0, 8.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03265380859375, -0.03165006637573242, -0.030646324157714844, -0.029642581939697266, -0.028638839721679688, -0.02763509750366211, -0.02663135528564453, -0.025627613067626953, -0.024623870849609375, -0.023620128631591797, -0.02261638641357422, -0.02161264419555664, -0.020608901977539062, -0.019605159759521484, -0.018601417541503906, -0.017597675323486328, -0.01659393310546875, -0.015590190887451172, -0.014586448669433594, -0.013582706451416016, -0.012578964233398438, -0.01157522201538086, -0.010571479797363281, -0.009567737579345703, -0.008563995361328125, -0.007560253143310547, -0.006556510925292969, -0.005552768707275391, -0.0045490264892578125, -0.0035452842712402344, -0.0025415420532226562, -0.0015377998352050781, -0.0005340576171875, 0.0004696846008300781, 0.0014734268188476562, 0.0024771690368652344, 0.0034809112548828125, 0.004484653472900391, 0.005488395690917969, 0.006492137908935547, 0.007495880126953125, 0.008499622344970703, 0.009503364562988281, 0.01050710678100586, 0.011510848999023438, 0.012514591217041016, 0.013518333435058594, 0.014522075653076172, 0.01552581787109375, 0.016529560089111328, 0.017533302307128906, 0.018537044525146484, 0.019540786743164062, 0.02054452896118164, 0.02154827117919922, 0.022552013397216797, 0.023555755615234375, 0.024559497833251953, 0.02556324005126953, 0.02656698226928711, 0.027570724487304688, 0.028574466705322266, 0.029578208923339844, 0.030581951141357422, 0.031585693359375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 17.0, 76.0, 567.0, 271.0, 47.0, 17.0, 8.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193838596343994, -1.25588858127594, -1.1923933029174805, -1.1288981437683105, -1.065402865409851, -1.0019075870513916, -0.9384123682975769, -0.8749171495437622, -0.8114218711853027, -0.7479265928268433, -0.6844313740730286, -0.6209361553192139, -0.5574408769607544, -0.4939456284046173, -0.4304503798484802, -0.36695513129234314, -0.30345988273620605, -0.23996463418006897, -0.17646938562393188, -0.1129741370677948, -0.049478888511657715, 0.01401636004447937, 0.07751160860061646, 0.14100685715675354, 0.20450210571289062, 0.2679973542690277, 0.3314926028251648, 0.3949878513813019, 0.45848309993743896, 0.5219783782958984, 0.5854735970497131, 0.6489688158035278, 0.7124638557434082, 0.7759591341018677, 0.8394543528556824, 0.9029495716094971, 0.9664448499679565, 1.029940128326416, 1.093435287475586, 1.1569305658340454, 1.2204258441925049, 1.2839211225509644, 1.3474164009094238, 1.4109115600585938, 1.4744068384170532, 1.5379021167755127, 1.6013972759246826, 1.664892554283142, 1.7283878326416016, 1.791883111000061, 1.8553783893585205, 1.9188735485076904, 1.98236882686615, 2.0458641052246094, 2.1093592643737793, 2.1728546619415283, 2.2363498210906982, 2.299844980239868, 2.363340377807617, 2.426835536956787, 2.490330696105957, 2.553826093673706, 2.617321252822876, 2.680816650390625, 2.744311809539795]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 2.0, 2.0, 7.0, 5.0, 8.0, 12.0, 15.0, 8.0, 18.0, 18.0, 19.0, 20.0, 29.0, 30.0, 29.0, 41.0, 40.0, 69.0, 132.0, 132.0, 61.0, 28.0, 36.0, 30.0, 24.0, 25.0, 18.0, 22.0, 25.0, 16.0, 11.0, 9.0, 12.0, 11.0, 10.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.48429399728775024, -0.4708324074745178, -0.457370787858963, -0.4439091980457306, -0.4304475784301758, -0.41698598861694336, -0.40352439880371094, -0.3900628089904785, -0.3766011893749237, -0.3631395995616913, -0.3496779799461365, -0.33621639013290405, -0.32275480031967163, -0.3092931807041168, -0.2958315908908844, -0.2823699712753296, -0.26890838146209717, -0.25544679164886475, -0.24198517203330994, -0.22852358222007751, -0.2150619775056839, -0.20160037279129028, -0.18813878297805786, -0.17467717826366425, -0.16121557354927063, -0.14775396883487701, -0.1342923641204834, -0.12083077430725098, -0.10736916959285736, -0.09390756487846375, -0.08044596761465073, -0.06698437035083771, -0.05352276563644409, -0.040061164647340775, -0.026599563658237457, -0.01313796266913414, 0.00032363831996917725, 0.013785243034362793, 0.027246840298175812, 0.04070843756198883, 0.054170042276382446, 0.06763164699077606, 0.08109324425458908, 0.0945548415184021, 0.10801644623279572, 0.12147805094718933, 0.13493964076042175, 0.14840124547481537, 0.16186285018920898, 0.1753244549036026, 0.18878605961799622, 0.20224764943122864, 0.21570925414562225, 0.22917085886001587, 0.2426324486732483, 0.2560940384864807, 0.2695556581020355, 0.28301724791526794, 0.29647886753082275, 0.3099404573440552, 0.3234020471572876, 0.3368636667728424, 0.35032525658607483, 0.36378687620162964, 0.37724846601486206]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 10.0, 8.0, 12.0, 14.0, 18.0, 24.0, 22.0, 42.0, 55.0, 73.0, 111.0, 134.0, 220.0, 319.0, 437.0, 709.0, 1031.0, 1725.0, 2976.0, 5783.0, 12320.0, 34171.0, 146050.0, 914523.0, 2302571.0, 619008.0, 102839.0, 26839.0, 10447.0, 4915.0, 2528.0, 1486.0, 960.0, 572.0, 395.0, 268.0, 218.0, 121.0, 97.0, 65.0, 54.0, 40.0, 22.0, 16.0, 16.0, 10.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04571533203125, -0.04430389404296875, -0.0428924560546875, -0.04148101806640625, -0.040069580078125, -0.03865814208984375, -0.0372467041015625, -0.03583526611328125, -0.034423828125, -0.03301239013671875, -0.0316009521484375, -0.03018951416015625, -0.028778076171875, -0.02736663818359375, -0.0259552001953125, -0.02454376220703125, -0.02313232421875, -0.02172088623046875, -0.0203094482421875, -0.01889801025390625, -0.017486572265625, -0.01607513427734375, -0.0146636962890625, -0.01325225830078125, -0.0118408203125, -0.01042938232421875, -0.0090179443359375, -0.00760650634765625, -0.006195068359375, -0.00478363037109375, -0.0033721923828125, -0.00196075439453125, -0.00054931640625, 0.00086212158203125, 0.0022735595703125, 0.00368499755859375, 0.005096435546875, 0.00650787353515625, 0.0079193115234375, 0.00933074951171875, 0.0107421875, 0.01215362548828125, 0.0135650634765625, 0.01497650146484375, 0.016387939453125, 0.01779937744140625, 0.0192108154296875, 0.02062225341796875, 0.02203369140625, 0.02344512939453125, 0.0248565673828125, 0.02626800537109375, 0.027679443359375, 0.02909088134765625, 0.0305023193359375, 0.03191375732421875, 0.0333251953125, 0.03473663330078125, 0.0361480712890625, 0.03755950927734375, 0.038970947265625, 0.04038238525390625, 0.0417938232421875, 0.04320526123046875, 0.04461669921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 2.0, 9.0, 8.0, 9.0, 8.0, 19.0, 17.0, 17.0, 23.0, 28.0, 29.0, 31.0, 26.0, 28.0, 41.0, 36.0, 43.0, 47.0, 54.0, 36.0, 53.0, 50.0, 45.0, 37.0, 35.0, 36.0, 28.0, 34.0, 31.0, 22.0, 15.0, 12.0, 13.0, 13.0, 11.0, 14.0, 10.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0208740234375, -0.0202028751373291, -0.019531726837158203, -0.018860578536987305, -0.018189430236816406, -0.017518281936645508, -0.01684713363647461, -0.01617598533630371, -0.015504837036132812, -0.014833688735961914, -0.014162540435791016, -0.013491392135620117, -0.012820243835449219, -0.01214909553527832, -0.011477947235107422, -0.010806798934936523, -0.010135650634765625, -0.009464502334594727, -0.008793354034423828, -0.00812220573425293, -0.007451057434082031, -0.006779909133911133, -0.006108760833740234, -0.005437612533569336, -0.0047664642333984375, -0.004095315933227539, -0.0034241676330566406, -0.002753019332885742, -0.0020818710327148438, -0.0014107227325439453, -0.0007395744323730469, -6.842613220214844e-05, 0.00060272216796875, 0.0012738704681396484, 0.0019450187683105469, 0.0026161670684814453, 0.0032873153686523438, 0.003958463668823242, 0.004629611968994141, 0.005300760269165039, 0.0059719085693359375, 0.006643056869506836, 0.007314205169677734, 0.007985353469848633, 0.008656501770019531, 0.00932765007019043, 0.009998798370361328, 0.010669946670532227, 0.011341094970703125, 0.012012243270874023, 0.012683391571044922, 0.01335453987121582, 0.014025688171386719, 0.014696836471557617, 0.015367984771728516, 0.016039133071899414, 0.016710281372070312, 0.01738142967224121, 0.01805257797241211, 0.018723726272583008, 0.019394874572753906, 0.020066022872924805, 0.020737171173095703, 0.0214083194732666, 0.0220794677734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 11.0, 27.0, 43.0, 75.0, 123.0, 303.0, 709.0, 2084.0, 22637.0, 4139692.0, 25199.0, 2100.0, 684.0, 271.0, 132.0, 74.0, 42.0, 22.0, 16.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3798828125, -0.3681983947753906, -0.35651397705078125, -0.3448295593261719, -0.3331451416015625, -0.3214607238769531, -0.30977630615234375, -0.2980918884277344, -0.286407470703125, -0.2747230529785156, -0.26303863525390625, -0.2513542175292969, -0.2396697998046875, -0.22798538208007812, -0.21630096435546875, -0.20461654663085938, -0.19293212890625, -0.18124771118164062, -0.16956329345703125, -0.15787887573242188, -0.1461944580078125, -0.13451004028320312, -0.12282562255859375, -0.11114120483398438, -0.099456787109375, -0.08777236938476562, -0.07608795166015625, -0.06440353393554688, -0.0527191162109375, -0.041034698486328125, -0.02935028076171875, -0.017665863037109375, -0.0059814453125, 0.005702972412109375, 0.01738739013671875, 0.029071807861328125, 0.0407562255859375, 0.052440643310546875, 0.06412506103515625, 0.07580947875976562, 0.087493896484375, 0.09917831420898438, 0.11086273193359375, 0.12254714965820312, 0.1342315673828125, 0.14591598510742188, 0.15760040283203125, 0.16928482055664062, 0.18096923828125, 0.19265365600585938, 0.20433807373046875, 0.21602249145507812, 0.2277069091796875, 0.23939132690429688, 0.25107574462890625, 0.2627601623535156, 0.274444580078125, 0.2861289978027344, 0.29781341552734375, 0.3094978332519531, 0.3211822509765625, 0.3328666687011719, 0.34455108642578125, 0.3562355041503906, 0.367919921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 12.0, 21.0, 45.0, 70.0, 159.0, 449.0, 1259.0, 1291.0, 437.0, 181.0, 75.0, 35.0, 14.0, 10.0, 9.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2127685546875, -0.20542335510253906, -0.19807815551757812, -0.1907329559326172, -0.18338775634765625, -0.1760425567626953, -0.16869735717773438, -0.16135215759277344, -0.1540069580078125, -0.14666175842285156, -0.13931655883789062, -0.1319713592529297, -0.12462615966796875, -0.11728096008300781, -0.10993576049804688, -0.10259056091308594, -0.095245361328125, -0.08790016174316406, -0.08055496215820312, -0.07320976257324219, -0.06586456298828125, -0.05851936340332031, -0.051174163818359375, -0.04382896423339844, -0.0364837646484375, -0.029138565063476562, -0.021793365478515625, -0.014448165893554688, -0.00710296630859375, 0.0002422332763671875, 0.007587432861328125, 0.014932632446289062, 0.02227783203125, 0.029623031616210938, 0.036968231201171875, 0.04431343078613281, 0.05165863037109375, 0.05900382995605469, 0.06634902954101562, 0.07369422912597656, 0.0810394287109375, 0.08838462829589844, 0.09572982788085938, 0.10307502746582031, 0.11042022705078125, 0.11776542663574219, 0.12511062622070312, 0.13245582580566406, 0.139801025390625, 0.14714622497558594, 0.15449142456054688, 0.1618366241455078, 0.16918182373046875, 0.1765270233154297, 0.18387222290039062, 0.19121742248535156, 0.1985626220703125, 0.20590782165527344, 0.21325302124023438, 0.2205982208251953, 0.22794342041015625, 0.2352886199951172, 0.24263381958007812, 0.24997901916503906, 0.25732421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 9.0, 10.0, 11.0, 28.0, 58.0, 94.0, 186.0, 231.0, 147.0, 90.0, 50.0, 23.0, 23.0, 16.0, 3.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.906980037689209, -1.858508825302124, -1.8100374937057495, -1.761566162109375, -1.71309494972229, -1.664623737335205, -1.6161524057388306, -1.567681074142456, -1.519209861755371, -1.4707386493682861, -1.4222673177719116, -1.373795986175537, -1.3253247737884521, -1.2768535614013672, -1.2283822298049927, -1.1799108982086182, -1.1314396858215332, -1.0829684734344482, -1.0344971418380737, -0.986025869846344, -0.9375545978546143, -0.8890833258628845, -0.8406120538711548, -0.792140781879425, -0.7436695098876953, -0.6951982378959656, -0.6467269659042358, -0.5982556939125061, -0.5497844219207764, -0.5013131499290466, -0.4528418779373169, -0.40437060594558716, -0.3558993339538574, -0.3074280619621277, -0.25895678997039795, -0.2104855179786682, -0.16201424598693848, -0.11354297399520874, -0.065071702003479, -0.016600430011749268, 0.03187084197998047, 0.0803421139717102, 0.12881338596343994, 0.17728465795516968, 0.22575592994689941, 0.27422720193862915, 0.3226984739303589, 0.3711697459220886, 0.41964101791381836, 0.4681122899055481, 0.5165835618972778, 0.5650548338890076, 0.6135261058807373, 0.661997377872467, 0.7104686498641968, 0.7589399218559265, 0.8074111938476562, 0.855882465839386, 0.9043537378311157, 0.9528250098228455, 1.0012962818145752, 1.0497674942016602, 1.0982388257980347, 1.1467101573944092, 1.1951813697814941]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 16.0, 10.0, 9.0, 16.0, 16.0, 21.0, 31.0, 42.0, 44.0, 46.0, 71.0, 82.0, 84.0, 73.0, 70.0, 48.0, 43.0, 34.0, 39.0, 39.0, 43.0, 35.0, 11.0, 22.0, 12.0, 16.0, 7.0, 1.0, 7.0, 0.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7830135822296143, -0.7581965327262878, -0.7333794832229614, -0.708562433719635, -0.6837453842163086, -0.658928394317627, -0.6341113448143005, -0.6092942953109741, -0.5844772458076477, -0.5596601963043213, -0.5348431468009949, -0.5100260972976685, -0.48520907759666443, -0.460392028093338, -0.435575008392334, -0.41075795888900757, -0.38594090938568115, -0.36112385988235474, -0.3363068103790283, -0.3114897906780243, -0.2866727411746979, -0.26185569167137146, -0.23703865706920624, -0.21222162246704102, -0.1874045729637146, -0.16258752346038818, -0.13777048885822296, -0.11295344680547714, -0.08813640475273132, -0.0633193626999855, -0.038502320647239685, -0.013685286045074463, 0.011131763458251953, 0.03594880551099777, 0.06076584756374359, 0.08558288961648941, 0.11039993166923523, 0.13521698117256165, 0.16003401577472687, 0.1848510503768921, 0.2096680998802185, 0.23448514938354492, 0.25930219888687134, 0.28411921858787537, 0.3089362680912018, 0.3337533175945282, 0.3585703372955322, 0.38338738679885864, 0.40820443630218506, 0.4330214858055115, 0.4578385353088379, 0.4826555550098419, 0.5074726343154907, 0.5322896242141724, 0.5571066737174988, 0.5819237232208252, 0.6067407727241516, 0.631557822227478, 0.6563748717308044, 0.6811919212341309, 0.7060089111328125, 0.7308259606361389, 0.7556430101394653, 0.7804600596427917, 0.8052771091461182]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 11.0, 14.0, 23.0, 26.0, 45.0, 65.0, 109.0, 146.0, 207.0, 384.0, 584.0, 1050.0, 1622.0, 3131.0, 6303.0, 13667.0, 34567.0, 110591.0, 599656.0, 190814.0, 49594.0, 18355.0, 8398.0, 3907.0, 2174.0, 1188.0, 708.0, 398.0, 300.0, 175.0, 119.0, 59.0, 43.0, 29.0, 24.0, 17.0, 17.0, 9.0, 6.0, 1.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04937744140625, -0.04791116714477539, -0.04644489288330078, -0.04497861862182617, -0.04351234436035156, -0.04204607009887695, -0.040579795837402344, -0.039113521575927734, -0.037647247314453125, -0.036180973052978516, -0.034714698791503906, -0.0332484245300293, -0.03178215026855469, -0.030315876007080078, -0.02884960174560547, -0.02738332748413086, -0.02591705322265625, -0.02445077896118164, -0.02298450469970703, -0.021518230438232422, -0.020051956176757812, -0.018585681915283203, -0.017119407653808594, -0.015653133392333984, -0.014186859130859375, -0.012720584869384766, -0.011254310607910156, -0.009788036346435547, -0.008321762084960938, -0.006855487823486328, -0.005389213562011719, -0.003922939300537109, -0.0024566650390625, -0.0009903907775878906, 0.00047588348388671875, 0.0019421577453613281, 0.0034084320068359375, 0.004874706268310547, 0.006340980529785156, 0.007807254791259766, 0.009273529052734375, 0.010739803314208984, 0.012206077575683594, 0.013672351837158203, 0.015138626098632812, 0.016604900360107422, 0.01807117462158203, 0.01953744888305664, 0.02100372314453125, 0.02246999740600586, 0.02393627166748047, 0.025402545928955078, 0.026868820190429688, 0.028335094451904297, 0.029801368713378906, 0.031267642974853516, 0.032733917236328125, 0.034200191497802734, 0.035666465759277344, 0.03713274002075195, 0.03859901428222656, 0.04006528854370117, 0.04153156280517578, 0.04299783706665039, 0.044464111328125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 7.0, 8.0, 14.0, 16.0, 13.0, 17.0, 21.0, 19.0, 24.0, 35.0, 48.0, 53.0, 50.0, 74.0, 69.0, 64.0, 74.0, 58.0, 52.0, 36.0, 38.0, 45.0, 27.0, 31.0, 25.0, 16.0, 10.0, 10.0, 6.0, 5.0, 5.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039276123046875, -0.03801727294921875, -0.0367584228515625, -0.03549957275390625, -0.03424072265625, -0.03298187255859375, -0.0317230224609375, -0.03046417236328125, -0.029205322265625, -0.02794647216796875, -0.0266876220703125, -0.02542877197265625, -0.024169921875, -0.02291107177734375, -0.0216522216796875, -0.02039337158203125, -0.019134521484375, -0.01787567138671875, -0.0166168212890625, -0.01535797119140625, -0.01409912109375, -0.01284027099609375, -0.0115814208984375, -0.01032257080078125, -0.009063720703125, -0.00780487060546875, -0.0065460205078125, -0.00528717041015625, -0.0040283203125, -0.00276947021484375, -0.0015106201171875, -0.00025177001953125, 0.001007080078125, 0.00226593017578125, 0.0035247802734375, 0.00478363037109375, 0.00604248046875, 0.00730133056640625, 0.0085601806640625, 0.00981903076171875, 0.011077880859375, 0.01233673095703125, 0.0135955810546875, 0.01485443115234375, 0.01611328125, 0.01737213134765625, 0.0186309814453125, 0.01988983154296875, 0.021148681640625, 0.02240753173828125, 0.0236663818359375, 0.02492523193359375, 0.02618408203125, 0.02744293212890625, 0.0287017822265625, 0.02996063232421875, 0.031219482421875, 0.03247833251953125, 0.0337371826171875, 0.03499603271484375, 0.0362548828125, 0.03751373291015625, 0.0387725830078125, 0.04003143310546875, 0.041290283203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 5.0, 13.0, 17.0, 18.0, 28.0, 51.0, 66.0, 100.0, 126.0, 206.0, 324.0, 679.0, 1731.0, 6224.0, 42306.0, 926645.0, 58738.0, 7588.0, 1948.0, 721.0, 394.0, 191.0, 117.0, 83.0, 61.0, 36.0, 28.0, 17.0, 22.0, 15.0, 7.0, 7.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0982666015625, -0.09542369842529297, -0.09258079528808594, -0.0897378921508789, -0.08689498901367188, -0.08405208587646484, -0.08120918273925781, -0.07836627960205078, -0.07552337646484375, -0.07268047332763672, -0.06983757019042969, -0.06699466705322266, -0.06415176391601562, -0.061308860778808594, -0.05846595764160156, -0.05562305450439453, -0.0527801513671875, -0.04993724822998047, -0.04709434509277344, -0.044251441955566406, -0.041408538818359375, -0.038565635681152344, -0.03572273254394531, -0.03287982940673828, -0.03003692626953125, -0.02719402313232422, -0.024351119995117188, -0.021508216857910156, -0.018665313720703125, -0.015822410583496094, -0.012979507446289062, -0.010136604309082031, -0.007293701171875, -0.004450798034667969, -0.0016078948974609375, 0.0012350082397460938, 0.004077911376953125, 0.006920814514160156, 0.009763717651367188, 0.012606620788574219, 0.01544952392578125, 0.01829242706298828, 0.021135330200195312, 0.023978233337402344, 0.026821136474609375, 0.029664039611816406, 0.03250694274902344, 0.03534984588623047, 0.0381927490234375, 0.04103565216064453, 0.04387855529785156, 0.046721458435058594, 0.049564361572265625, 0.052407264709472656, 0.05525016784667969, 0.05809307098388672, 0.06093597412109375, 0.06377887725830078, 0.06662178039550781, 0.06946468353271484, 0.07230758666992188, 0.0751504898071289, 0.07799339294433594, 0.08083629608154297, 0.08367919921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 8.0, 4.0, 2.0, 7.0, 13.0, 8.0, 11.0, 10.0, 7.0, 9.0, 15.0, 15.0, 21.0, 29.0, 25.0, 29.0, 18.0, 41.0, 48.0, 66.0, 57.0, 63.0, 66.0, 48.0, 69.0, 49.0, 34.0, 35.0, 33.0, 23.0, 25.0, 20.0, 10.0, 11.0, 12.0, 14.0, 11.0, 8.0, 10.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10498046875, -0.10138893127441406, -0.09779739379882812, -0.09420585632324219, -0.09061431884765625, -0.08702278137207031, -0.08343124389648438, -0.07983970642089844, -0.0762481689453125, -0.07265663146972656, -0.06906509399414062, -0.06547355651855469, -0.06188201904296875, -0.05829048156738281, -0.054698944091796875, -0.05110740661621094, -0.047515869140625, -0.04392433166503906, -0.040332794189453125, -0.03674125671386719, -0.03314971923828125, -0.029558181762695312, -0.025966644287109375, -0.022375106811523438, -0.0187835693359375, -0.015192031860351562, -0.011600494384765625, -0.008008956909179688, -0.00441741943359375, -0.0008258819580078125, 0.002765655517578125, 0.0063571929931640625, 0.00994873046875, 0.013540267944335938, 0.017131805419921875, 0.020723342895507812, 0.02431488037109375, 0.027906417846679688, 0.031497955322265625, 0.03508949279785156, 0.0386810302734375, 0.04227256774902344, 0.045864105224609375, 0.04945564270019531, 0.05304718017578125, 0.05663871765136719, 0.060230255126953125, 0.06382179260253906, 0.067413330078125, 0.07100486755371094, 0.07459640502929688, 0.07818794250488281, 0.08177947998046875, 0.08537101745605469, 0.08896255493164062, 0.09255409240722656, 0.0961456298828125, 0.09973716735839844, 0.10332870483398438, 0.10692024230957031, 0.11051177978515625, 0.11410331726074219, 0.11769485473632812, 0.12128639221191406, 0.1248779296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 11.0, 10.0, 16.0, 12.0, 18.0, 24.0, 19.0, 31.0, 35.0, 69.0, 75.0, 149.0, 233.0, 373.0, 850.0, 1991.0, 5816.0, 21517.0, 234638.0, 747798.0, 24342.0, 6239.0, 2169.0, 916.0, 499.0, 228.0, 148.0, 82.0, 48.0, 41.0, 22.0, 24.0, 16.0, 25.0, 14.0, 10.0, 10.0, 9.0, 5.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0124969482421875, -0.01206660270690918, -0.01163625717163086, -0.011205911636352539, -0.010775566101074219, -0.010345220565795898, -0.009914875030517578, -0.009484529495239258, -0.009054183959960938, -0.008623838424682617, -0.008193492889404297, -0.0077631473541259766, -0.007332801818847656, -0.006902456283569336, -0.006472110748291016, -0.006041765213012695, -0.005611419677734375, -0.005181074142456055, -0.004750728607177734, -0.004320383071899414, -0.0038900375366210938, -0.0034596920013427734, -0.003029346466064453, -0.002599000930786133, -0.0021686553955078125, -0.0017383098602294922, -0.0013079643249511719, -0.0008776187896728516, -0.00044727325439453125, -1.6927719116210938e-05, 0.0004134178161621094, 0.0008437633514404297, 0.00127410888671875, 0.0017044544219970703, 0.0021347999572753906, 0.002565145492553711, 0.0029954910278320312, 0.0034258365631103516, 0.003856182098388672, 0.004286527633666992, 0.0047168731689453125, 0.005147218704223633, 0.005577564239501953, 0.0060079097747802734, 0.006438255310058594, 0.006868600845336914, 0.007298946380615234, 0.007729291915893555, 0.008159637451171875, 0.008589982986450195, 0.009020328521728516, 0.009450674057006836, 0.009881019592285156, 0.010311365127563477, 0.010741710662841797, 0.011172056198120117, 0.011602401733398438, 0.012032747268676758, 0.012463092803955078, 0.012893438339233398, 0.013323783874511719, 0.013754129409790039, 0.01418447494506836, 0.01461482048034668, 0.015045166015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 7.0, 5.0, 3.0, 5.0, 4.0, 0.0, 0.0, 7.0, 3.0, 6.0, 3.0, 7.0, 5.0, 11.0, 9.0, 8.0, 14.0, 7.0, 25.0, 17.0, 17.0, 24.0, 22.0, 35.0, 62.0, 52.0, 72.0, 67.0, 63.0, 72.0, 64.0, 51.0, 37.0, 28.0, 22.0, 16.0, 19.0, 15.0, 14.0, 11.0, 9.0, 12.0, 11.0, 7.0, 4.0, 10.0, 5.0, 4.0, 8.0, 3.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-3.1828880310058594e-05, -3.0780211091041565e-05, -2.9731541872024536e-05, -2.8682872653007507e-05, -2.763420343399048e-05, -2.658553421497345e-05, -2.553686499595642e-05, -2.4488195776939392e-05, -2.3439526557922363e-05, -2.2390857338905334e-05, -2.1342188119888306e-05, -2.0293518900871277e-05, -1.9244849681854248e-05, -1.819618046283722e-05, -1.714751124382019e-05, -1.609884202480316e-05, -1.5050172805786133e-05, -1.4001503586769104e-05, -1.2952834367752075e-05, -1.1904165148735046e-05, -1.0855495929718018e-05, -9.806826710700989e-06, -8.75815749168396e-06, -7.709488272666931e-06, -6.660819053649902e-06, -5.6121498346328735e-06, -4.563480615615845e-06, -3.514811396598816e-06, -2.466142177581787e-06, -1.4174729585647583e-06, -3.688037395477295e-07, 6.798654794692993e-07, 1.7285346984863281e-06, 2.777203917503357e-06, 3.825873136520386e-06, 4.8745423555374146e-06, 5.923211574554443e-06, 6.971880793571472e-06, 8.020550012588501e-06, 9.06921923160553e-06, 1.0117888450622559e-05, 1.1166557669639587e-05, 1.2215226888656616e-05, 1.3263896107673645e-05, 1.4312565326690674e-05, 1.5361234545707703e-05, 1.640990376472473e-05, 1.745857298374176e-05, 1.850724220275879e-05, 1.9555911421775818e-05, 2.0604580640792847e-05, 2.1653249859809875e-05, 2.2701919078826904e-05, 2.3750588297843933e-05, 2.4799257516860962e-05, 2.584792673587799e-05, 2.689659595489502e-05, 2.794526517391205e-05, 2.8993934392929077e-05, 3.0042603611946106e-05, 3.1091272830963135e-05, 3.2139942049980164e-05, 3.318861126899719e-05, 3.423728048801422e-05, 3.528594970703125e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 6.0, 15.0, 28.0, 42.0, 76.0, 121.0, 258.0, 512.0, 1013.0, 2219.0, 5824.0, 18446.0, 123960.0, 844511.0, 35796.0, 9439.0, 3340.0, 1477.0, 660.0, 347.0, 206.0, 94.0, 49.0, 48.0, 17.0, 10.0, 10.0, 10.0, 10.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0118408203125, -0.011371374130249023, -0.010901927947998047, -0.01043248176574707, -0.009963035583496094, -0.009493589401245117, -0.00902414321899414, -0.008554697036743164, -0.008085250854492188, -0.007615804672241211, -0.007146358489990234, -0.006676912307739258, -0.006207466125488281, -0.005738019943237305, -0.005268573760986328, -0.0047991275787353516, -0.004329681396484375, -0.0038602352142333984, -0.003390789031982422, -0.0029213428497314453, -0.0024518966674804688, -0.001982450485229492, -0.0015130043029785156, -0.001043558120727539, -0.0005741119384765625, -0.00010466575622558594, 0.0003647804260253906, 0.0008342266082763672, 0.0013036727905273438, 0.0017731189727783203, 0.002242565155029297, 0.0027120113372802734, 0.00318145751953125, 0.0036509037017822266, 0.004120349884033203, 0.00458979606628418, 0.005059242248535156, 0.005528688430786133, 0.005998134613037109, 0.006467580795288086, 0.0069370269775390625, 0.007406473159790039, 0.007875919342041016, 0.008345365524291992, 0.008814811706542969, 0.009284257888793945, 0.009753704071044922, 0.010223150253295898, 0.010692596435546875, 0.011162042617797852, 0.011631488800048828, 0.012100934982299805, 0.012570381164550781, 0.013039827346801758, 0.013509273529052734, 0.013978719711303711, 0.014448165893554688, 0.014917612075805664, 0.01538705825805664, 0.015856504440307617, 0.016325950622558594, 0.01679539680480957, 0.017264842987060547, 0.017734289169311523, 0.0182037353515625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 4.0, 1.0, 4.0, 13.0, 15.0, 12.0, 22.0, 15.0, 40.0, 56.0, 75.0, 118.0, 174.0, 158.0, 71.0, 58.0, 40.0, 19.0, 19.0, 13.0, 12.0, 9.0, 8.0, 8.0, 8.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01062774658203125, -0.010226130485534668, -0.009824514389038086, -0.009422898292541504, -0.009021282196044922, -0.00861966609954834, -0.008218050003051758, -0.007816433906555176, -0.007414817810058594, -0.007013201713562012, -0.00661158561706543, -0.006209969520568848, -0.005808353424072266, -0.005406737327575684, -0.0050051212310791016, -0.0046035051345825195, -0.0042018890380859375, -0.0038002729415893555, -0.0033986568450927734, -0.0029970407485961914, -0.0025954246520996094, -0.0021938085556030273, -0.0017921924591064453, -0.0013905763626098633, -0.0009889602661132812, -0.0005873441696166992, -0.0001857280731201172, 0.00021588802337646484, 0.0006175041198730469, 0.001019120216369629, 0.001420736312866211, 0.001822352409362793, 0.002223968505859375, 0.002625584602355957, 0.003027200698852539, 0.003428816795349121, 0.003830432891845703, 0.004232048988342285, 0.004633665084838867, 0.005035281181335449, 0.005436897277832031, 0.005838513374328613, 0.006240129470825195, 0.006641745567321777, 0.007043361663818359, 0.007444977760314941, 0.007846593856811523, 0.008248209953308105, 0.008649826049804688, 0.00905144214630127, 0.009453058242797852, 0.009854674339294434, 0.010256290435791016, 0.010657906532287598, 0.01105952262878418, 0.011461138725280762, 0.011862754821777344, 0.012264370918273926, 0.012665987014770508, 0.01306760311126709, 0.013469219207763672, 0.013870835304260254, 0.014272451400756836, 0.014674067497253418, 0.01507568359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 11.0, 23.0, 37.0, 62.0, 98.0, 530.0, 105.0, 59.0, 21.0, 28.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5285054445266724, -0.5099209547042847, -0.4913364350795746, -0.4727519154548645, -0.4541674256324768, -0.4355829060077667, -0.41699838638305664, -0.39841389656066895, -0.37982940673828125, -0.36124488711357117, -0.34266039729118347, -0.3240758776664734, -0.3054913878440857, -0.2869068682193756, -0.2683223485946655, -0.24973785877227783, -0.23115333914756775, -0.21256883442401886, -0.19398432970046997, -0.1753998100757599, -0.1568153202533722, -0.1382308006286621, -0.11964629590511322, -0.10106179118156433, -0.08247728645801544, -0.06389278173446655, -0.045308273285627365, -0.026723764836788177, -0.008139260113239288, 0.0104452446103096, 0.029029756784439087, 0.047614261507987976, 0.06619876623153687, 0.08478327095508575, 0.10336777567863464, 0.12195228785276413, 0.14053678512573242, 0.1591213047504425, 0.1777058094739914, 0.19629031419754028, 0.21487481892108917, 0.23345932364463806, 0.25204384326934814, 0.27062833309173584, 0.2892128527164459, 0.3077973425388336, 0.3263818621635437, 0.3449663519859314, 0.3635508716106415, 0.38213539123535156, 0.40071988105773926, 0.41930440068244934, 0.43788889050483704, 0.4564734101295471, 0.4750578999519348, 0.4936424195766449, 0.512226939201355, 0.5308114290237427, 0.5493959784507751, 0.5679804682731628, 0.5865649580955505, 0.6051494479179382, 0.6237339973449707, 0.6423184871673584, 0.6609029769897461]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 0.0, 3.0, 2.0, 6.0, 10.0, 2.0, 5.0, 6.0, 6.0, 8.0, 8.0, 9.0, 10.0, 14.0, 12.0, 21.0, 27.0, 19.0, 33.0, 26.0, 47.0, 247.0, 186.0, 49.0, 31.0, 33.0, 16.0, 17.0, 20.0, 19.0, 18.0, 16.0, 12.0, 8.0, 5.0, 11.0, 14.0, 10.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3634147047996521, -0.35235968232154846, -0.3413046598434448, -0.3302496075630188, -0.31919458508491516, -0.3081395626068115, -0.2970845401287079, -0.28602951765060425, -0.2749744653701782, -0.2639194428920746, -0.25286442041397095, -0.24180938303470612, -0.23075434565544128, -0.21969932317733765, -0.208644300699234, -0.19758926331996918, -0.18653424084186554, -0.1754792183637619, -0.16442418098449707, -0.15336915850639343, -0.1423141211271286, -0.13125909864902496, -0.12020406872034073, -0.1091490387916565, -0.09809400886297226, -0.08703897893428802, -0.07598394900560379, -0.06492891907691956, -0.05387389287352562, -0.042818862944841385, -0.03176383674144745, -0.020708806812763214, -0.00965377688407898, 0.0014012521132826805, 0.01245628111064434, 0.023511309176683426, 0.03456633910536766, 0.045621369034051895, 0.05667639523744583, 0.06773142516613007, 0.0787864550948143, 0.08984148502349854, 0.10089651495218277, 0.111951544880867, 0.12300656735897064, 0.13406160473823547, 0.1451166272163391, 0.15617164969444275, 0.16722668707370758, 0.17828170955181122, 0.18933674693107605, 0.2003917694091797, 0.21144680678844452, 0.22250182926654816, 0.233556866645813, 0.24461188912391663, 0.25566691160202026, 0.2667219340801239, 0.27777695655822754, 0.28883200883865356, 0.2998870313167572, 0.31094205379486084, 0.3219970762729645, 0.3330520987510681, 0.34410715103149414]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 3.0, 6.0, 9.0, 14.0, 12.0, 15.0, 19.0, 30.0, 31.0, 30.0, 36.0, 52.0, 278.0, 179.0, 50.0, 50.0, 44.0, 30.0, 27.0, 19.0, 16.0, 11.0, 8.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05078125, -0.04928159713745117, -0.047781944274902344, -0.046282291412353516, -0.04478263854980469, -0.04328298568725586, -0.04178333282470703, -0.0402836799621582, -0.038784027099609375, -0.03728437423706055, -0.03578472137451172, -0.03428506851196289, -0.03278541564941406, -0.031285762786865234, -0.029786109924316406, -0.028286457061767578, -0.02678680419921875, -0.025287151336669922, -0.023787498474121094, -0.022287845611572266, -0.020788192749023438, -0.01928853988647461, -0.01778888702392578, -0.016289234161376953, -0.014789581298828125, -0.013289928436279297, -0.011790275573730469, -0.01029062271118164, -0.008790969848632812, -0.007291316986083984, -0.005791664123535156, -0.004292011260986328, -0.0027923583984375, -0.0012927055358886719, 0.00020694732666015625, 0.0017066001892089844, 0.0032062530517578125, 0.004705905914306641, 0.006205558776855469, 0.007705211639404297, 0.009204864501953125, 0.010704517364501953, 0.012204170227050781, 0.01370382308959961, 0.015203475952148438, 0.016703128814697266, 0.018202781677246094, 0.019702434539794922, 0.02120208740234375, 0.022701740264892578, 0.024201393127441406, 0.025701045989990234, 0.027200698852539062, 0.02870035171508789, 0.03020000457763672, 0.03169965744018555, 0.033199310302734375, 0.0346989631652832, 0.03619861602783203, 0.03769826889038086, 0.03919792175292969, 0.040697574615478516, 0.042197227478027344, 0.04369688034057617, 0.045196533203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 12.0, 12.0, 17.0, 36.0, 51.0, 108.0, 222.0, 566.0, 2161.0, 17307.0, 8355371.0, 10165.0, 1615.0, 448.0, 230.0, 100.0, 58.0, 42.0, 16.0, 10.0, 5.0, 8.0, 10.0, 2.0, 5.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35434266924858093, -0.33778855204582214, -0.32123440504074097, -0.3046802878379822, -0.2881261706352234, -0.2715720534324646, -0.2550179064273834, -0.23846378922462463, -0.22190965712070465, -0.20535552501678467, -0.18880140781402588, -0.1722472757101059, -0.1556931436061859, -0.13913902640342712, -0.12258489429950714, -0.10603076964616776, -0.08947664499282837, -0.07292252033948898, -0.0563683919608593, -0.039814263582229614, -0.02326013892889023, -0.006706014275550842, 0.00984811782836914, 0.026402242481708527, 0.04295636713504791, 0.0595104917883873, 0.07606461644172668, 0.09261874854564667, 0.10917287319898605, 0.12572699785232544, 0.14228112995624542, 0.1588352620601654, 0.1753893494606018, 0.1919434815645218, 0.20849759876728058, 0.22505173087120056, 0.24160584807395935, 0.2581599950790405, 0.2747141122817993, 0.2912682294845581, 0.3078223466873169, 0.3243764638900757, 0.34093061089515686, 0.35748472809791565, 0.37403884530067444, 0.3905929923057556, 0.4071471095085144, 0.4237012267112732, 0.44025537371635437, 0.45680949091911316, 0.47336363792419434, 0.4899177551269531, 0.5064718723297119, 0.5230259895324707, 0.5395801067352295, 0.5561342835426331, 0.5726884007453918, 0.5892425179481506, 0.6057966351509094, 0.622350811958313, 0.6389049291610718, 0.6554590463638306, 0.6720131635665894, 0.6885672807693481, 0.7051213979721069]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 5.0, 4.0, 4.0, 0.0, 4.0, 7.0, 2.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 5.0, 2.0, 5.0, 4.0, 5.0, 3.0, 2.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5080909729003906, -0.4912363290786743, -0.474381685256958, -0.4575270414352417, -0.4406723976135254, -0.4238177537918091, -0.4069631099700928, -0.39010846614837646, -0.37325382232666016, -0.35639917850494385, -0.33954453468322754, -0.32268989086151123, -0.3058352470397949, -0.2889806032180786, -0.2721259593963623, -0.255271315574646, -0.2384166717529297, -0.22156202793121338, -0.20470738410949707, -0.18785274028778076, -0.17099809646606445, -0.15414345264434814, -0.13728880882263184, -0.12043416500091553, -0.10357952117919922, -0.08672487735748291, -0.0698702335357666, -0.05301558971405029, -0.036160945892333984, -0.019306302070617676, -0.002451658248901367, 0.014402985572814941, 0.03125762939453125, 0.04811227321624756, 0.06496691703796387, 0.08182156085968018, 0.09867620468139648, 0.11553084850311279, 0.1323854923248291, 0.1492401361465454, 0.16609477996826172, 0.18294942378997803, 0.19980406761169434, 0.21665871143341064, 0.23351335525512695, 0.25036799907684326, 0.26722264289855957, 0.2840772867202759, 0.3009319305419922, 0.3177865743637085, 0.3346412181854248, 0.3514958620071411, 0.3683505058288574, 0.38520514965057373, 0.40205979347229004, 0.41891443729400635, 0.43576908111572266, 0.45262372493743896, 0.4694783687591553, 0.4863330125808716, 0.5031876564025879, 0.5200423002243042, 0.5368969440460205, 0.5537515878677368, 0.5706062316894531]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 19.0, 23.0, 27.0, 50.0, 74.0, 113.0, 212.0, 357.0, 640.0, 1372.0, 3283.0, 10211.0, 46988.0, 264898.0, 159290.0, 26047.0, 6291.0, 2188.0, 940.0, 503.0, 249.0, 170.0, 101.0, 59.0, 38.0, 27.0, 19.0, 13.0, 8.0, 8.0, 6.0, 7.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.465087890625, -0.4500007629394531, -0.43491363525390625, -0.4198265075683594, -0.4047393798828125, -0.3896522521972656, -0.37456512451171875, -0.3594779968261719, -0.344390869140625, -0.3293037414550781, -0.31421661376953125, -0.2991294860839844, -0.2840423583984375, -0.2689552307128906, -0.25386810302734375, -0.23878097534179688, -0.22369384765625, -0.20860671997070312, -0.19351959228515625, -0.17843246459960938, -0.1633453369140625, -0.14825820922851562, -0.13317108154296875, -0.11808395385742188, -0.102996826171875, -0.08790969848632812, -0.07282257080078125, -0.057735443115234375, -0.0426483154296875, -0.027561187744140625, -0.01247406005859375, 0.002613067626953125, 0.0177001953125, 0.032787322998046875, 0.04787445068359375, 0.06296157836914062, 0.0780487060546875, 0.09313583374023438, 0.10822296142578125, 0.12331008911132812, 0.138397216796875, 0.15348434448242188, 0.16857147216796875, 0.18365859985351562, 0.1987457275390625, 0.21383285522460938, 0.22891998291015625, 0.24400711059570312, 0.25909423828125, 0.2741813659667969, 0.28926849365234375, 0.3043556213378906, 0.3194427490234375, 0.3345298767089844, 0.34961700439453125, 0.3647041320800781, 0.379791259765625, 0.3948783874511719, 0.40996551513671875, 0.4250526428222656, 0.4401397705078125, 0.4552268981933594, 0.47031402587890625, 0.4854011535644531, 0.50048828125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 8.0, 7.0, 11.0, 16.0, 16.0, 19.0, 23.0, 33.0, 43.0, 40.0, 59.0, 67.0, 56.0, 71.0, 56.0, 75.0, 66.0, 72.0, 56.0, 37.0, 34.0, 26.0, 21.0, 15.0, 9.0, 13.0, 6.0, 8.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.04473876953125, -0.043469905853271484, -0.04220104217529297, -0.04093217849731445, -0.03966331481933594, -0.03839445114135742, -0.037125587463378906, -0.03585672378540039, -0.034587860107421875, -0.03331899642944336, -0.032050132751464844, -0.030781269073486328, -0.029512405395507812, -0.028243541717529297, -0.02697467803955078, -0.025705814361572266, -0.02443695068359375, -0.023168087005615234, -0.02189922332763672, -0.020630359649658203, -0.019361495971679688, -0.018092632293701172, -0.016823768615722656, -0.01555490493774414, -0.014286041259765625, -0.01301717758178711, -0.011748313903808594, -0.010479450225830078, -0.009210586547851562, -0.007941722869873047, -0.006672859191894531, -0.005403995513916016, -0.0041351318359375, -0.0028662681579589844, -0.0015974044799804688, -0.0003285408020019531, 0.0009403228759765625, 0.002209186553955078, 0.0034780502319335938, 0.004746913909912109, 0.006015777587890625, 0.007284641265869141, 0.008553504943847656, 0.009822368621826172, 0.011091232299804688, 0.012360095977783203, 0.013628959655761719, 0.014897823333740234, 0.01616668701171875, 0.017435550689697266, 0.01870441436767578, 0.019973278045654297, 0.021242141723632812, 0.022511005401611328, 0.023779869079589844, 0.02504873275756836, 0.026317596435546875, 0.02758646011352539, 0.028855323791503906, 0.030124187469482422, 0.03139305114746094, 0.03266191482543945, 0.03393077850341797, 0.035199642181396484, 0.036468505859375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 6.0, 4.0, 3.0, 2.0, 2.0, 8.0, 11.0, 6.0, 11.0, 24.0, 26.0, 43.0, 57.0, 37.0, 54.0, 38.0, 38.0, 27.0, 18.0, 13.0, 10.0, 12.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2834893763065338, -0.27606239914894104, -0.26863542199134827, -0.2612084448337555, -0.2537814676761627, -0.24635447561740875, -0.23892749845981598, -0.2315005213022232, -0.22407352924346924, -0.21664655208587646, -0.2092195749282837, -0.20179259777069092, -0.19436560571193695, -0.18693862855434418, -0.1795116513967514, -0.17208467423915863, -0.16465769708156586, -0.15723071992397308, -0.1498037427663803, -0.14237675070762634, -0.13494977355003357, -0.1275227963924408, -0.12009581923484802, -0.11266884207725525, -0.10524185746908188, -0.0978148803114891, -0.09038789570331573, -0.08296091854572296, -0.07553394138813019, -0.06810695677995682, -0.060679979622364044, -0.05325299873948097, -0.04582600295543671, -0.038399022072553635, -0.030972043052315712, -0.02354506403207779, -0.016118083149194717, -0.008691102266311646, -0.001264125108718872, 0.0061628557741642, 0.013589836657047272, 0.021016817539930344, 0.028443796560168266, 0.03587077558040619, 0.04329775646328926, 0.05072473734617233, 0.058151714503765106, 0.06557869911193848, 0.07300567626953125, 0.08043265342712402, 0.0878596380352974, 0.09528661519289017, 0.10271359980106354, 0.11014057695865631, 0.11756755411624908, 0.12499453127384186, 0.13242152333259583, 0.1398485004901886, 0.14727547764778137, 0.15470245480537415, 0.1621294468641281, 0.1695564240217209, 0.17698340117931366, 0.18441037833690643, 0.1918373554944992]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 6.0, 2.0, 5.0, 7.0, 4.0, 10.0, 25.0, 39.0, 75.0, 86.0, 102.0, 58.0, 20.0, 6.0, 6.0, 11.0, 4.0, 7.0, 2.0, 4.0, 0.0, 2.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2557032108306885, -0.24675419926643372, -0.23780518770217896, -0.2288561761379242, -0.21990716457366943, -0.21095815300941467, -0.2020091414451599, -0.19306012988090515, -0.1841111183166504, -0.17516210675239563, -0.16621309518814087, -0.1572640836238861, -0.14831507205963135, -0.1393660604953766, -0.13041704893112183, -0.12146802991628647, -0.11251901090145111, -0.10356999933719635, -0.09462098777294159, -0.08567197620868683, -0.07672296464443207, -0.06777395308017731, -0.05882493406534195, -0.04987592250108719, -0.04092691093683243, -0.03197789937257767, -0.023028885945677757, -0.014079872518777847, -0.0051308609545230865, 0.003818150609731674, 0.012767165899276733, 0.021716177463531494, 0.030665189027786255, 0.039614200592041016, 0.048563212156295776, 0.057512227445840836, 0.0664612352848053, 0.07541024684906006, 0.08435926586389542, 0.09330827742815018, 0.10225728899240494, 0.1112063005566597, 0.12015531212091446, 0.12910433113574982, 0.13805334270000458, 0.14700235426425934, 0.1559513658285141, 0.16490037739276886, 0.17384938895702362, 0.18279840052127838, 0.19174741208553314, 0.2006964236497879, 0.20964543521404266, 0.21859444677829742, 0.22754347324371338, 0.23649248480796814, 0.2454414963722229, 0.25439050793647766, 0.2633395195007324, 0.2722885310649872, 0.28123754262924194, 0.2901865541934967, 0.29913556575775146, 0.3080845773220062, 0.317033588886261]}, "train/train_runtime": 4778.2339, "train/train_samples_per_second": 5.972, "train/train_steps_per_second": 0.062, "train/total_flos": 0.0, "train/train_loss": 4.439775107284186, "eval/loss": 4.222483158111572, "eval/wer": 2.421539071796906, "eval/runtime": 946.7625, "eval/samples_per_second": 2.791, "eval/steps_per_second": 0.233} \ No newline at end of file