diff --git "a/wandb/run-20220303_055131-e96a3lxb/files/wandb-summary.json" "b/wandb/run-20220303_055131-e96a3lxb/files/wandb-summary.json" --- "a/wandb/run-20220303_055131-e96a3lxb/files/wandb-summary.json" +++ "b/wandb/run-20220303_055131-e96a3lxb/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.8899, "train/learning_rate": 0.0008900000000000001, "train/epoch": 1.0, "train/global_step": 446, "_runtime": 6619, "_timestamp": 1646293310, "_step": 447, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 78.0, 357.0, 439.0, 109.0, 16.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.88333511352539, -41.3859977722168, -36.88865661621094, -32.391319274902344, -27.893980026245117, -23.39664077758789, -18.899303436279297, -14.40196418762207, -9.904624938964844, -5.407286167144775, -0.909947395324707, 3.587390899658203, 8.08473014831543, 12.582069396972656, 17.07940673828125, 21.576745986938477, 26.074085235595703, 30.57142448425293, 35.068763732910156, 39.56610107421875, 44.063438415527344, 48.5607795715332, 53.0581169128418, 57.555458068847656, 62.05279541015625, 66.55013275146484, 71.04747009277344, 75.54481506347656, 80.04215240478516, 84.53948974609375, 89.03682708740234, 93.53416442871094, 98.03150939941406, 102.52884674072266, 107.02618408203125, 111.52352905273438, 116.02086639404297, 120.51820373535156, 125.01554107666016, 129.51287841796875, 134.01022338867188, 138.507568359375, 143.00489807128906, 147.5022430419922, 151.99957275390625, 156.49691772460938, 160.9942626953125, 165.49159240722656, 169.98892211914062, 174.48626708984375, 178.9835968017578, 183.48094177246094, 187.978271484375, 192.47561645507812, 196.97296142578125, 201.4702911376953, 205.96763610839844, 210.46498107910156, 214.96231079101562, 219.45965576171875, 223.9569854736328, 228.45433044433594, 232.95166015625, 237.44900512695312, 241.94635009765625]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 5.0, 5.0, 6.0, 4.0, 13.0, 15.0, 9.0, 19.0, 13.0, 18.0, 24.0, 32.0, 28.0, 30.0, 34.0, 30.0, 39.0, 52.0, 42.0, 51.0, 46.0, 47.0, 32.0, 44.0, 44.0, 39.0, 38.0, 33.0, 22.0, 35.0, 24.0, 21.0, 18.0, 16.0, 12.0, 20.0, 10.0, 8.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.24918365478516, -62.14531326293945, -60.04144287109375, -57.93757247924805, -55.833702087402344, -53.729827880859375, -51.62595748901367, -49.52208709716797, -47.418216705322266, -45.31434631347656, -43.21047592163086, -41.106605529785156, -39.00273132324219, -36.89886474609375, -34.79499053955078, -32.69112014770508, -30.587249755859375, -28.483379364013672, -26.37950897216797, -24.275636672973633, -22.17176628112793, -20.067895889282227, -17.96402359008789, -15.860153198242188, -13.756282806396484, -11.652412414550781, -9.548541069030762, -7.4446702003479, -5.340799331665039, -3.236928939819336, -1.1330575942993164, 0.9708137512207031, 3.0746917724609375, 5.178562641143799, 7.28243350982666, 9.38630485534668, 11.490175247192383, 13.594045639038086, 15.697916984558105, 17.801788330078125, 19.905658721923828, 22.00952911376953, 24.113399505615234, 26.21727180480957, 28.321142196655273, 30.425012588500977, 32.52888488769531, 34.632755279541016, 36.73662567138672, 38.84049606323242, 40.944366455078125, 43.04823684692383, 45.15210723876953, 47.2559814453125, 49.3598518371582, 51.463722229003906, 53.56759262084961, 55.67146301269531, 57.775333404541016, 59.87920379638672, 61.98307800292969, 64.08694458007812, 66.1908187866211, 68.29469299316406, 70.3985595703125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 4.0, 5.0, 12.0, 9.0, 6.0, 15.0, 15.0, 22.0, 16.0, 27.0, 21.0, 36.0, 35.0, 33.0, 40.0, 38.0, 56.0, 56.0, 51.0, 45.0, 40.0, 51.0, 59.0, 53.0, 35.0, 32.0, 33.0, 22.0, 24.0, 27.0, 21.0, 19.0, 12.0, 8.0, 6.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.623046875, -1.576690673828125, -1.53033447265625, -1.483978271484375, -1.4376220703125, -1.391265869140625, -1.34490966796875, -1.298553466796875, -1.252197265625, -1.205841064453125, -1.15948486328125, -1.113128662109375, -1.0667724609375, -1.020416259765625, -0.97406005859375, -0.927703857421875, -0.88134765625, -0.834991455078125, -0.78863525390625, -0.742279052734375, -0.6959228515625, -0.649566650390625, -0.60321044921875, -0.556854248046875, -0.510498046875, -0.464141845703125, -0.41778564453125, -0.371429443359375, -0.3250732421875, -0.278717041015625, -0.23236083984375, -0.186004638671875, -0.1396484375, -0.093292236328125, -0.04693603515625, -0.000579833984375, 0.0457763671875, 0.092132568359375, 0.13848876953125, 0.184844970703125, 0.231201171875, 0.277557373046875, 0.32391357421875, 0.370269775390625, 0.4166259765625, 0.462982177734375, 0.50933837890625, 0.555694580078125, 0.60205078125, 0.648406982421875, 0.69476318359375, 0.741119384765625, 0.7874755859375, 0.833831787109375, 0.88018798828125, 0.926544189453125, 0.972900390625, 1.019256591796875, 1.06561279296875, 1.111968994140625, 1.1583251953125, 1.204681396484375, 1.25103759765625, 1.297393798828125, 1.34375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 8.0, 8.0, 14.0, 22.0, 23.0, 27.0, 35.0, 59.0, 87.0, 118.0, 153.0, 214.0, 327.0, 478.0, 749.0, 1145.0, 2014.0, 4292.0, 15400.0, 281478.0, 3816804.0, 54896.0, 8421.0, 2970.0, 1630.0, 1027.0, 609.0, 383.0, 259.0, 185.0, 139.0, 90.0, 68.0, 30.0, 39.0, 20.0, 17.0, 11.0, 8.0, 6.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.734375, -14.3046875, -13.875, -13.4453125, -13.015625, -12.5859375, -12.15625, -11.7265625, -11.296875, -10.8671875, -10.4375, -10.0078125, -9.578125, -9.1484375, -8.71875, -8.2890625, -7.859375, -7.4296875, -7.0, -6.5703125, -6.140625, -5.7109375, -5.28125, -4.8515625, -4.421875, -3.9921875, -3.5625, -3.1328125, -2.703125, -2.2734375, -1.84375, -1.4140625, -0.984375, -0.5546875, -0.125, 0.3046875, 0.734375, 1.1640625, 1.59375, 2.0234375, 2.453125, 2.8828125, 3.3125, 3.7421875, 4.171875, 4.6015625, 5.03125, 5.4609375, 5.890625, 6.3203125, 6.75, 7.1796875, 7.609375, 8.0390625, 8.46875, 8.8984375, 9.328125, 9.7578125, 10.1875, 10.6171875, 11.046875, 11.4765625, 11.90625, 12.3359375, 12.765625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 16.0, 33.0, 58.0, 145.0, 434.0, 1106.0, 1332.0, 520.0, 190.0, 116.0, 49.0, 28.0, 24.0, 14.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3203125, -9.9085693359375, -9.496826171875, -9.0850830078125, -8.67333984375, -8.2615966796875, -7.849853515625, -7.4381103515625, -7.0263671875, -6.6146240234375, -6.202880859375, -5.7911376953125, -5.37939453125, -4.9676513671875, -4.555908203125, -4.1441650390625, -3.732421875, -3.3206787109375, -2.908935546875, -2.4971923828125, -2.08544921875, -1.6737060546875, -1.261962890625, -0.8502197265625, -0.4384765625, -0.0267333984375, 0.385009765625, 0.7967529296875, 1.20849609375, 1.6202392578125, 2.031982421875, 2.4437255859375, 2.85546875, 3.2672119140625, 3.678955078125, 4.0906982421875, 4.50244140625, 4.9141845703125, 5.325927734375, 5.7376708984375, 6.1494140625, 6.5611572265625, 6.972900390625, 7.3846435546875, 7.79638671875, 8.2081298828125, 8.619873046875, 9.0316162109375, 9.443359375, 9.8551025390625, 10.266845703125, 10.6785888671875, 11.09033203125, 11.5020751953125, 11.913818359375, 12.3255615234375, 12.7373046875, 13.1490478515625, 13.560791015625, 13.9725341796875, 14.38427734375, 14.7960205078125, 15.207763671875, 15.6195068359375, 16.03125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 21.0, 46.0, 100.0, 222.0, 704.0, 4200.0, 3430448.0, 754313.0, 3127.0, 680.0, 208.0, 103.0, 59.0, 18.0, 9.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.09375, -39.845703125, -38.59765625, -37.349609375, -36.1015625, -34.853515625, -33.60546875, -32.357421875, -31.109375, -29.861328125, -28.61328125, -27.365234375, -26.1171875, -24.869140625, -23.62109375, -22.373046875, -21.125, -19.876953125, -18.62890625, -17.380859375, -16.1328125, -14.884765625, -13.63671875, -12.388671875, -11.140625, -9.892578125, -8.64453125, -7.396484375, -6.1484375, -4.900390625, -3.65234375, -2.404296875, -1.15625, 0.091796875, 1.33984375, 2.587890625, 3.8359375, 5.083984375, 6.33203125, 7.580078125, 8.828125, 10.076171875, 11.32421875, 12.572265625, 13.8203125, 15.068359375, 16.31640625, 17.564453125, 18.8125, 20.060546875, 21.30859375, 22.556640625, 23.8046875, 25.052734375, 26.30078125, 27.548828125, 28.796875, 30.044921875, 31.29296875, 32.541015625, 33.7890625, 35.037109375, 36.28515625, 37.533203125, 38.78125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 49.0, 579.0, 350.0, 31.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.93313598632812, -176.4544677734375, -172.97579956054688, -169.4971160888672, -166.01844787597656, -162.53977966308594, -159.0611114501953, -155.5824432373047, -152.103759765625, -148.62509155273438, -145.14642333984375, -141.66773986816406, -138.18907165527344, -134.7104034423828, -131.2317352294922, -127.75306701660156, -124.27439880371094, -120.79573059082031, -117.31705474853516, -113.83838653564453, -110.35971069335938, -106.88104248046875, -103.40237426757812, -99.9237060546875, -96.44503021240234, -92.96636199951172, -89.48768615722656, -86.00901794433594, -82.53034973144531, -79.05167388916016, -75.57300567626953, -72.09432983398438, -68.61566162109375, -65.13699340820312, -61.65831756591797, -58.179649353027344, -54.70097732543945, -51.22230529785156, -47.74363708496094, -44.26496505737305, -40.78628921508789, -37.3076171875, -33.828948974609375, -30.350276947021484, -26.871604919433594, -23.392932891845703, -19.914262771606445, -16.435592651367188, -12.956920623779297, -9.478249549865723, -5.999578475952148, -2.520907402038574, 0.957763671875, 4.436435699462891, 7.915105819702148, 11.393775939941406, 14.872447967529297, 18.351119995117188, 21.829790115356445, 25.308460235595703, 28.787132263183594, 32.265804290771484, 35.744476318359375, 39.22314453125, 42.70181655883789]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 13.0, 10.0, 12.0, 12.0, 18.0, 21.0, 27.0, 25.0, 33.0, 31.0, 45.0, 37.0, 47.0, 41.0, 51.0, 51.0, 50.0, 48.0, 38.0, 32.0, 46.0, 37.0, 41.0, 28.0, 25.0, 30.0, 25.0, 17.0, 18.0, 14.0, 17.0, 13.0, 5.0, 7.0, 8.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-32.39892578125, -31.52111053466797, -30.64329719543457, -29.76548194885254, -28.88766860961914, -28.00985336303711, -27.132038116455078, -26.254222869873047, -25.37640953063965, -24.498594284057617, -23.62078094482422, -22.742965698242188, -21.865150451660156, -20.987337112426758, -20.109521865844727, -19.231708526611328, -18.353893280029297, -17.476078033447266, -16.598264694213867, -15.720449447631836, -14.842635154724121, -13.964820861816406, -13.087005615234375, -12.20919132232666, -11.331377029418945, -10.45356273651123, -9.575748443603516, -8.697933197021484, -7.8201189041137695, -6.942304611206055, -6.064489841461182, -5.186675071716309, -4.308860778808594, -3.4310462474823, -2.553231716156006, -1.675417184829712, -0.797602653503418, 0.08021163940429688, 0.9580264091491699, 1.835841178894043, 2.713655471801758, 3.5914700031280518, 4.469284534454346, 5.347099304199219, 6.224913597106934, 7.102727890014648, 7.9805426597595215, 8.858357429504395, 9.73617172241211, 10.613986015319824, 11.491800308227539, 12.36961555480957, 13.247429847717285, 14.125244140625, 15.003059387207031, 15.880873680114746, 16.75868797302246, 17.636503219604492, 18.51431655883789, 19.392131805419922, 20.269947052001953, 21.14776039123535, 22.025575637817383, 22.90338897705078, 23.781204223632812]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 5.0, 10.0, 10.0, 11.0, 12.0, 17.0, 14.0, 21.0, 15.0, 22.0, 25.0, 24.0, 34.0, 28.0, 34.0, 47.0, 32.0, 43.0, 37.0, 45.0, 46.0, 43.0, 47.0, 33.0, 42.0, 41.0, 41.0, 30.0, 36.0, 16.0, 28.0, 22.0, 17.0, 6.0, 10.0, 15.0, 10.0, 7.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.263580322265625, -1.22247314453125, -1.181365966796875, -1.1402587890625, -1.099151611328125, -1.05804443359375, -1.016937255859375, -0.975830078125, -0.934722900390625, -0.89361572265625, -0.852508544921875, -0.8114013671875, -0.770294189453125, -0.72918701171875, -0.688079833984375, -0.64697265625, -0.605865478515625, -0.56475830078125, -0.523651123046875, -0.4825439453125, -0.441436767578125, -0.40032958984375, -0.359222412109375, -0.318115234375, -0.277008056640625, -0.23590087890625, -0.194793701171875, -0.1536865234375, -0.112579345703125, -0.07147216796875, -0.030364990234375, 0.0107421875, 0.051849365234375, 0.09295654296875, 0.134063720703125, 0.1751708984375, 0.216278076171875, 0.25738525390625, 0.298492431640625, 0.339599609375, 0.380706787109375, 0.42181396484375, 0.462921142578125, 0.5040283203125, 0.545135498046875, 0.58624267578125, 0.627349853515625, 0.66845703125, 0.709564208984375, 0.75067138671875, 0.791778564453125, 0.8328857421875, 0.873992919921875, 0.91510009765625, 0.956207275390625, 0.997314453125, 1.038421630859375, 1.07952880859375, 1.120635986328125, 1.1617431640625, 1.202850341796875, 1.24395751953125, 1.285064697265625, 1.326171875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 14.0, 15.0, 35.0, 42.0, 76.0, 103.0, 142.0, 196.0, 294.0, 365.0, 605.0, 749.0, 1160.0, 1664.0, 2315.0, 3193.0, 4615.0, 6763.0, 9570.0, 14080.0, 20448.0, 30487.0, 45823.0, 71224.0, 121589.0, 285192.0, 167951.0, 89186.0, 55384.0, 36603.0, 24311.0, 16765.0, 11318.0, 7985.0, 5487.0, 3838.0, 2670.0, 1879.0, 1309.0, 959.0, 616.0, 485.0, 329.0, 206.0, 170.0, 110.0, 72.0, 51.0, 47.0, 22.0, 17.0, 9.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.05267333984375, -0.05101299285888672, -0.04935264587402344, -0.047692298889160156, -0.046031951904296875, -0.044371604919433594, -0.04271125793457031, -0.04105091094970703, -0.03939056396484375, -0.03773021697998047, -0.03606986999511719, -0.034409523010253906, -0.032749176025390625, -0.031088829040527344, -0.029428482055664062, -0.02776813507080078, -0.0261077880859375, -0.02444744110107422, -0.022787094116210938, -0.021126747131347656, -0.019466400146484375, -0.017806053161621094, -0.016145706176757812, -0.014485359191894531, -0.01282501220703125, -0.011164665222167969, -0.009504318237304688, -0.007843971252441406, -0.006183624267578125, -0.004523277282714844, -0.0028629302978515625, -0.0012025833129882812, 0.000457763671875, 0.0021181106567382812, 0.0037784576416015625, 0.005438804626464844, 0.007099151611328125, 0.008759498596191406, 0.010419845581054688, 0.012080192565917969, 0.01374053955078125, 0.015400886535644531, 0.017061233520507812, 0.018721580505371094, 0.020381927490234375, 0.022042274475097656, 0.023702621459960938, 0.02536296844482422, 0.0270233154296875, 0.02868366241455078, 0.030344009399414062, 0.032004356384277344, 0.033664703369140625, 0.035325050354003906, 0.03698539733886719, 0.03864574432373047, 0.04030609130859375, 0.04196643829345703, 0.04362678527832031, 0.045287132263183594, 0.046947479248046875, 0.048607826232910156, 0.05026817321777344, 0.05192852020263672, 0.0535888671875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 6.0, 14.0, 6.0, 17.0, 15.0, 22.0, 14.0, 20.0, 26.0, 21.0, 22.0, 34.0, 28.0, 38.0, 38.0, 33.0, 37.0, 40.0, 37.0, 1059.0, 30.0, 37.0, 40.0, 46.0, 24.0, 45.0, 44.0, 21.0, 30.0, 23.0, 16.0, 17.0, 17.0, 22.0, 11.0, 18.0, 10.0, 13.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-1.1484375, -1.1159591674804688, -1.0834808349609375, -1.0510025024414062, -1.018524169921875, -0.9860458374023438, -0.9535675048828125, -0.9210891723632812, -0.88861083984375, -0.8561325073242188, -0.8236541748046875, -0.7911758422851562, -0.758697509765625, -0.7262191772460938, -0.6937408447265625, -0.6612625122070312, -0.6287841796875, -0.5963058471679688, -0.5638275146484375, -0.5313491821289062, -0.498870849609375, -0.46639251708984375, -0.4339141845703125, -0.40143585205078125, -0.36895751953125, -0.33647918701171875, -0.3040008544921875, -0.27152252197265625, -0.239044189453125, -0.20656585693359375, -0.1740875244140625, -0.14160919189453125, -0.109130859375, -0.07665252685546875, -0.0441741943359375, -0.01169586181640625, 0.020782470703125, 0.05326080322265625, 0.0857391357421875, 0.11821746826171875, 0.15069580078125, 0.18317413330078125, 0.2156524658203125, 0.24813079833984375, 0.280609130859375, 0.31308746337890625, 0.3455657958984375, 0.37804412841796875, 0.4105224609375, 0.44300079345703125, 0.4754791259765625, 0.5079574584960938, 0.540435791015625, 0.5729141235351562, 0.6053924560546875, 0.6378707885742188, 0.67034912109375, 0.7028274536132812, 0.7353057861328125, 0.7677841186523438, 0.800262451171875, 0.8327407836914062, 0.8652191162109375, 0.8976974487304688, 0.93017578125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 14.0, 12.0, 22.0, 28.0, 52.0, 74.0, 117.0, 174.0, 274.0, 397.0, 648.0, 959.0, 1443.0, 2241.0, 3181.0, 4811.0, 7156.0, 10479.0, 15665.0, 23829.0, 36829.0, 60243.0, 104412.0, 209741.0, 1314786.0, 116389.0, 66129.0, 40194.0, 25405.0, 16956.0, 11252.0, 7694.0, 5118.0, 3496.0, 2347.0, 1553.0, 1013.0, 686.0, 450.0, 268.0, 229.0, 120.0, 99.0, 51.0, 42.0, 21.0, 14.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031280517578125, -0.030274391174316406, -0.029268264770507812, -0.02826213836669922, -0.027256011962890625, -0.02624988555908203, -0.025243759155273438, -0.024237632751464844, -0.02323150634765625, -0.022225379943847656, -0.021219253540039062, -0.02021312713623047, -0.019207000732421875, -0.01820087432861328, -0.017194747924804688, -0.016188621520996094, -0.0151824951171875, -0.014176368713378906, -0.013170242309570312, -0.012164115905761719, -0.011157989501953125, -0.010151863098144531, -0.009145736694335938, -0.008139610290527344, -0.00713348388671875, -0.006127357482910156, -0.0051212310791015625, -0.004115104675292969, -0.003108978271484375, -0.0021028518676757812, -0.0010967254638671875, -9.059906005859375e-05, 0.00091552734375, 0.0019216537475585938, 0.0029277801513671875, 0.003933906555175781, 0.004940032958984375, 0.005946159362792969, 0.0069522857666015625, 0.007958412170410156, 0.00896453857421875, 0.009970664978027344, 0.010976791381835938, 0.011982917785644531, 0.012989044189453125, 0.013995170593261719, 0.015001296997070312, 0.016007423400878906, 0.0170135498046875, 0.018019676208496094, 0.019025802612304688, 0.02003192901611328, 0.021038055419921875, 0.02204418182373047, 0.023050308227539062, 0.024056434631347656, 0.02506256103515625, 0.026068687438964844, 0.027074813842773438, 0.02808094024658203, 0.029087066650390625, 0.03009319305419922, 0.031099319458007812, 0.032105445861816406, 0.033111572265625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 9.0, 4.0, 12.0, 15.0, 8.0, 0.0, 13.0, 16.0, 17.0, 29.0, 61.0, 69.0, 437.0, 94.0, 61.0, 34.0, 0.0, 17.0, 15.0, 15.0, 14.0, 5.0, 10.0, 6.0, 9.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.086162567138672e-06, -2.032145857810974e-06, -1.9781291484832764e-06, -1.9241124391555786e-06, -1.8700957298278809e-06, -1.816079020500183e-06, -1.7620623111724854e-06, -1.7080456018447876e-06, -1.6540288925170898e-06, -1.600012183189392e-06, -1.5459954738616943e-06, -1.4919787645339966e-06, -1.4379620552062988e-06, -1.383945345878601e-06, -1.3299286365509033e-06, -1.2759119272232056e-06, -1.2218952178955078e-06, -1.16787850856781e-06, -1.1138617992401123e-06, -1.0598450899124146e-06, -1.0058283805847168e-06, -9.51811671257019e-07, -8.977949619293213e-07, -8.437782526016235e-07, -7.897615432739258e-07, -7.35744833946228e-07, -6.817281246185303e-07, -6.277114152908325e-07, -5.736947059631348e-07, -5.19677996635437e-07, -4.6566128730773926e-07, -4.116445779800415e-07, -3.5762786865234375e-07, -3.03611159324646e-07, -2.4959444999694824e-07, -1.955777406692505e-07, -1.4156103134155273e-07, -8.754432201385498e-08, -3.3527612686157227e-08, 2.0489096641540527e-08, 7.450580596923828e-08, 1.2852251529693604e-07, 1.825392246246338e-07, 2.3655593395233154e-07, 2.905726432800293e-07, 3.4458935260772705e-07, 3.986060619354248e-07, 4.5262277126312256e-07, 5.066394805908203e-07, 5.606561899185181e-07, 6.146728992462158e-07, 6.686896085739136e-07, 7.227063179016113e-07, 7.767230272293091e-07, 8.307397365570068e-07, 8.847564458847046e-07, 9.387731552124023e-07, 9.927898645401e-07, 1.0468065738677979e-06, 1.1008232831954956e-06, 1.1548399925231934e-06, 1.2088567018508911e-06, 1.2628734111785889e-06, 1.3168901205062866e-06, 1.3709068298339844e-06]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 3.0, 4.0, 7.0, 5.0, 12.0, 12.0, 19.0, 31.0, 25.0, 33.0, 45.0, 47.0, 71.0, 84.0, 142.0, 356.0, 3177.0, 1042735.0, 949.0, 321.0, 121.0, 68.0, 59.0, 45.0, 26.0, 44.0, 19.0, 19.0, 15.0, 13.0, 9.0, 8.0, 4.0, 3.0, 7.0, 8.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1888484954833984e-05, -3.07643786072731e-05, -2.964027225971222e-05, -2.8516165912151337e-05, -2.7392059564590454e-05, -2.626795321702957e-05, -2.514384686946869e-05, -2.4019740521907806e-05, -2.2895634174346924e-05, -2.177152782678604e-05, -2.064742147922516e-05, -1.9523315131664276e-05, -1.8399208784103394e-05, -1.727510243654251e-05, -1.615099608898163e-05, -1.5026889741420746e-05, -1.3902783393859863e-05, -1.277867704629898e-05, -1.1654570698738098e-05, -1.0530464351177216e-05, -9.406358003616333e-06, -8.28225165605545e-06, -7.158145308494568e-06, -6.034038960933685e-06, -4.909932613372803e-06, -3.78582626581192e-06, -2.6617199182510376e-06, -1.537613570690155e-06, -4.1350722312927246e-07, 7.105991244316101e-07, 1.8347054719924927e-06, 2.9588118195533752e-06, 4.082918167114258e-06, 5.20702451467514e-06, 6.331130862236023e-06, 7.4552372097969055e-06, 8.579343557357788e-06, 9.70344990491867e-06, 1.0827556252479553e-05, 1.1951662600040436e-05, 1.3075768947601318e-05, 1.4199875295162201e-05, 1.5323981642723083e-05, 1.6448087990283966e-05, 1.757219433784485e-05, 1.869630068540573e-05, 1.9820407032966614e-05, 2.0944513380527496e-05, 2.206861972808838e-05, 2.319272607564926e-05, 2.4316832423210144e-05, 2.5440938770771027e-05, 2.656504511833191e-05, 2.7689151465892792e-05, 2.8813257813453674e-05, 2.9937364161014557e-05, 3.106147050857544e-05, 3.218557685613632e-05, 3.3309683203697205e-05, 3.443378955125809e-05, 3.555789589881897e-05, 3.668200224637985e-05, 3.7806108593940735e-05, 3.893021494150162e-05, 4.00543212890625e-05]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 69.0, 915.0, 34.0], "bins": [-5.084586973680416e-06, -5.0030935199174564e-06, -4.921600066154497e-06, -4.840106612391537e-06, -4.758613158628577e-06, -4.677119250118267e-06, -4.595625796355307e-06, -4.514132342592347e-06, -4.432638888829388e-06, -4.351145435066428e-06, -4.269651981303468e-06, -4.188158527540509e-06, -4.106665073777549e-06, -4.025171620014589e-06, -3.94367816625163e-06, -3.862184257741319e-06, -3.7806910313520348e-06, -3.699197577589075e-06, -3.6177041238261154e-06, -3.5362104426894803e-06, -3.4547169889265206e-06, -3.373223535163561e-06, -3.291730081400601e-06, -3.2102366276376415e-06, -3.128743173874682e-06, -3.047249720111722e-06, -2.9657562663487624e-06, -2.8842628125858027e-06, -2.8027691314491676e-06, -2.721275677686208e-06, -2.6397822239232482e-06, -2.5582887701602885e-06, -2.4767950890236534e-06, -2.3953016352606937e-06, -2.313808181497734e-06, -2.2323147277347744e-06, -2.1508210465981392e-06, -2.0693275928351795e-06, -1.98783413907222e-06, -1.9063406853092602e-06, -1.8248472315463005e-06, -1.7433537777833408e-06, -1.6618602103335434e-06, -1.5803667565705837e-06, -1.4988731891207863e-06, -1.4173797353578266e-06, -1.3358862815948669e-06, -1.2543928278319072e-06, -1.1728992603821098e-06, -1.09140580661915e-06, -1.0099122391693527e-06, -9.28418785406393e-07, -8.469252748000144e-07, -7.654317641936359e-07, -6.839383104306762e-07, -6.024447998242977e-07, -5.209512892179191e-07, -4.3945777861154056e-07, -3.5796429642687144e-07, -2.764708142422023e-07, -1.9497730363582377e-07, -1.1348379302944522e-07, -3.1990339266485535e-08, 4.9503171339893015e-08, 1.3099668194627156e-07]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 72.0, 0.0, 0.0, 0.0, 0.0, 137.0, 0.0, 0.0, 0.0, 0.0, 0.0, 522.0, 0.0, 0.0, 0.0, 0.0, 151.0, 0.0, 0.0, 0.0, 0.0, 67.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.46451997756958e-07, -3.3527612686157227e-07, -3.241002559661865e-07, -3.129243850708008e-07, -3.0174851417541504e-07, -2.905726432800293e-07, -2.7939677238464355e-07, -2.682209014892578e-07, -2.5704503059387207e-07, -2.4586915969848633e-07, -2.3469328880310059e-07, -2.2351741790771484e-07, -2.123415470123291e-07, -2.0116567611694336e-07, -1.8998980522155762e-07, -1.7881393432617188e-07, -1.6763806343078613e-07, -1.564621925354004e-07, -1.4528632164001465e-07, -1.341104507446289e-07, -1.2293457984924316e-07, -1.1175870895385742e-07, -1.0058283805847168e-07, -8.940696716308594e-08, -7.82310962677002e-08, -6.705522537231445e-08, -5.587935447692871e-08, -4.470348358154297e-08, -3.3527612686157227e-08, -2.2351741790771484e-08, -1.1175870895385742e-08, 0.0, 1.1175870895385742e-08, 2.2351741790771484e-08, 3.3527612686157227e-08, 4.470348358154297e-08, 5.587935447692871e-08, 6.705522537231445e-08, 7.82310962677002e-08, 8.940696716308594e-08, 1.0058283805847168e-07, 1.1175870895385742e-07, 1.2293457984924316e-07, 1.341104507446289e-07, 1.4528632164001465e-07, 1.564621925354004e-07, 1.6763806343078613e-07, 1.7881393432617188e-07, 1.8998980522155762e-07, 2.0116567611694336e-07, 2.123415470123291e-07, 2.2351741790771484e-07, 2.3469328880310059e-07, 2.4586915969848633e-07, 2.5704503059387207e-07, 2.682209014892578e-07, 2.7939677238464355e-07, 2.905726432800293e-07, 3.0174851417541504e-07, 3.129243850708008e-07, 3.241002559661865e-07, 3.3527612686157227e-07, 3.46451997756958e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 5.0, 10.0, 10.0, 11.0, 12.0, 17.0, 14.0, 21.0, 15.0, 22.0, 25.0, 24.0, 34.0, 28.0, 34.0, 47.0, 32.0, 43.0, 37.0, 45.0, 46.0, 43.0, 47.0, 33.0, 42.0, 41.0, 41.0, 30.0, 36.0, 16.0, 28.0, 22.0, 17.0, 6.0, 10.0, 15.0, 10.0, 7.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.263580322265625, -1.22247314453125, -1.181365966796875, -1.1402587890625, -1.099151611328125, -1.05804443359375, -1.016937255859375, -0.975830078125, -0.934722900390625, -0.89361572265625, -0.852508544921875, -0.8114013671875, -0.770294189453125, -0.72918701171875, -0.688079833984375, -0.64697265625, -0.605865478515625, -0.56475830078125, -0.523651123046875, -0.4825439453125, -0.441436767578125, -0.40032958984375, -0.359222412109375, -0.318115234375, -0.277008056640625, -0.23590087890625, -0.194793701171875, -0.1536865234375, -0.112579345703125, -0.07147216796875, -0.030364990234375, 0.0107421875, 0.051849365234375, 0.09295654296875, 0.134063720703125, 0.1751708984375, 0.216278076171875, 0.25738525390625, 0.298492431640625, 0.339599609375, 0.380706787109375, 0.42181396484375, 0.462921142578125, 0.5040283203125, 0.545135498046875, 0.58624267578125, 0.627349853515625, 0.66845703125, 0.709564208984375, 0.75067138671875, 0.791778564453125, 0.8328857421875, 0.873992919921875, 0.91510009765625, 0.956207275390625, 0.997314453125, 1.038421630859375, 1.07952880859375, 1.120635986328125, 1.1617431640625, 1.202850341796875, 1.24395751953125, 1.285064697265625, 1.326171875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 10.0, 7.0, 11.0, 16.0, 16.0, 35.0, 39.0, 40.0, 57.0, 102.0, 137.0, 151.0, 245.0, 315.0, 426.0, 582.0, 866.0, 1294.0, 2044.0, 3274.0, 6004.0, 12985.0, 37024.0, 141360.0, 492528.0, 249060.0, 61222.0, 18974.0, 8032.0, 4234.0, 2419.0, 1557.0, 996.0, 723.0, 496.0, 342.0, 247.0, 184.0, 133.0, 101.0, 75.0, 54.0, 33.0, 30.0, 27.0, 18.0, 12.0, 8.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.3515625, -6.1630859375, -5.974609375, -5.7861328125, -5.59765625, -5.4091796875, -5.220703125, -5.0322265625, -4.84375, -4.6552734375, -4.466796875, -4.2783203125, -4.08984375, -3.9013671875, -3.712890625, -3.5244140625, -3.3359375, -3.1474609375, -2.958984375, -2.7705078125, -2.58203125, -2.3935546875, -2.205078125, -2.0166015625, -1.828125, -1.6396484375, -1.451171875, -1.2626953125, -1.07421875, -0.8857421875, -0.697265625, -0.5087890625, -0.3203125, -0.1318359375, 0.056640625, 0.2451171875, 0.43359375, 0.6220703125, 0.810546875, 0.9990234375, 1.1875, 1.3759765625, 1.564453125, 1.7529296875, 1.94140625, 2.1298828125, 2.318359375, 2.5068359375, 2.6953125, 2.8837890625, 3.072265625, 3.2607421875, 3.44921875, 3.6376953125, 3.826171875, 4.0146484375, 4.203125, 4.3916015625, 4.580078125, 4.7685546875, 4.95703125, 5.1455078125, 5.333984375, 5.5224609375, 5.7109375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 7.0, 9.0, 12.0, 11.0, 14.0, 19.0, 17.0, 25.0, 26.0, 34.0, 28.0, 44.0, 52.0, 78.0, 112.0, 181.0, 876.0, 782.0, 178.0, 106.0, 80.0, 65.0, 53.0, 44.0, 33.0, 27.0, 26.0, 17.0, 25.0, 16.0, 6.0, 13.0, 4.0, 10.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.03125, -4.8740234375, -4.716796875, -4.5595703125, -4.40234375, -4.2451171875, -4.087890625, -3.9306640625, -3.7734375, -3.6162109375, -3.458984375, -3.3017578125, -3.14453125, -2.9873046875, -2.830078125, -2.6728515625, -2.515625, -2.3583984375, -2.201171875, -2.0439453125, -1.88671875, -1.7294921875, -1.572265625, -1.4150390625, -1.2578125, -1.1005859375, -0.943359375, -0.7861328125, -0.62890625, -0.4716796875, -0.314453125, -0.1572265625, 0.0, 0.1572265625, 0.314453125, 0.4716796875, 0.62890625, 0.7861328125, 0.943359375, 1.1005859375, 1.2578125, 1.4150390625, 1.572265625, 1.7294921875, 1.88671875, 2.0439453125, 2.201171875, 2.3583984375, 2.515625, 2.6728515625, 2.830078125, 2.9873046875, 3.14453125, 3.3017578125, 3.458984375, 3.6162109375, 3.7734375, 3.9306640625, 4.087890625, 4.2451171875, 4.40234375, 4.5595703125, 4.716796875, 4.8740234375, 5.03125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 9.0, 5.0, 6.0, 10.0, 15.0, 15.0, 18.0, 28.0, 34.0, 42.0, 40.0, 68.0, 124.0, 294.0, 1321.0, 275110.0, 2864907.0, 2791.0, 389.0, 139.0, 77.0, 60.0, 28.0, 36.0, 29.0, 13.0, 13.0, 20.0, 15.0, 13.0, 6.0, 10.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.921875, -23.177734375, -22.43359375, -21.689453125, -20.9453125, -20.201171875, -19.45703125, -18.712890625, -17.96875, -17.224609375, -16.48046875, -15.736328125, -14.9921875, -14.248046875, -13.50390625, -12.759765625, -12.015625, -11.271484375, -10.52734375, -9.783203125, -9.0390625, -8.294921875, -7.55078125, -6.806640625, -6.0625, -5.318359375, -4.57421875, -3.830078125, -3.0859375, -2.341796875, -1.59765625, -0.853515625, -0.109375, 0.634765625, 1.37890625, 2.123046875, 2.8671875, 3.611328125, 4.35546875, 5.099609375, 5.84375, 6.587890625, 7.33203125, 8.076171875, 8.8203125, 9.564453125, 10.30859375, 11.052734375, 11.796875, 12.541015625, 13.28515625, 14.029296875, 14.7734375, 15.517578125, 16.26171875, 17.005859375, 17.75, 18.494140625, 19.23828125, 19.982421875, 20.7265625, 21.470703125, 22.21484375, 22.958984375, 23.703125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [968.0, 47.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.007070064544678, 1.9058313369750977, 7.818732738494873, 13.731634140014648, 19.644535064697266, 25.557435989379883, 31.470338821411133, 37.38323974609375, 43.296142578125, 49.20904541015625, 55.121944427490234, 61.034847259521484, 66.94774627685547, 72.86064910888672, 78.77355194091797, 84.68644714355469, 90.59934997558594, 96.51225280761719, 102.42515563964844, 108.33805847167969, 114.2509536743164, 120.16385650634766, 126.0767593383789, 131.98965454101562, 137.90255737304688, 143.81546020507812, 149.72836303710938, 155.64126586914062, 161.55416870117188, 167.46707153320312, 173.37997436523438, 179.29286193847656, 185.2057647705078, 191.11866760253906, 197.0315704345703, 202.94447326660156, 208.8573760986328, 214.770263671875, 220.68316650390625, 226.5960693359375, 232.50897216796875, 238.421875, 244.33477783203125, 250.2476806640625, 256.16058349609375, 262.073486328125, 267.98638916015625, 273.8992919921875, 279.81219482421875, 285.72509765625, 291.63800048828125, 297.5509033203125, 303.46380615234375, 309.376708984375, 315.28961181640625, 321.2025146484375, 327.1153869628906, 333.0282897949219, 338.9411926269531, 344.8540954589844, 350.7669982910156, 356.6799011230469, 362.5928039550781, 368.5057067871094, 374.4186096191406]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 8.0, 12.0, 6.0, 18.0, 17.0, 18.0, 20.0, 19.0, 26.0, 27.0, 35.0, 32.0, 38.0, 37.0, 34.0, 46.0, 38.0, 41.0, 36.0, 40.0, 42.0, 44.0, 41.0, 38.0, 32.0, 30.0, 33.0, 22.0, 26.0, 25.0, 21.0, 14.0, 12.0, 11.0, 10.0, 10.0, 7.0, 12.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.260639190673828, -17.712726593017578, -17.164812088012695, -16.616899490356445, -16.068984985351562, -15.521072387695312, -14.973158836364746, -14.42524528503418, -13.877331733703613, -13.329418182373047, -12.78150463104248, -12.233591079711914, -11.685678482055664, -11.137763977050781, -10.589851379394531, -10.041937828063965, -9.494024276733398, -8.946110725402832, -8.398197174072266, -7.850284099578857, -7.302370548248291, -6.754456996917725, -6.206543922424316, -5.65863037109375, -5.110716819763184, -4.562803268432617, -4.014889717102051, -3.4669766426086426, -2.919063091278076, -2.3711495399475098, -1.8232362270355225, -1.2753229141235352, -0.7274112701416016, -0.1794978380203247, 0.36841559410095215, 0.916329026222229, 1.4642424583435059, 2.0121560096740723, 2.5600693225860596, 3.107982635498047, 3.6558961868286133, 4.20380973815918, 4.751723289489746, 5.299636363983154, 5.847549915313721, 6.395463466644287, 6.943376541137695, 7.491290092468262, 8.039203643798828, 8.587117195129395, 9.135030746459961, 9.682944297790527, 10.230857849121094, 10.778770446777344, 11.32668399810791, 11.874597549438477, 12.422511100769043, 12.97042465209961, 13.518338203430176, 14.066251754760742, 14.614164352416992, 15.162078857421875, 15.709991455078125, 16.257904052734375, 16.805818557739258]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 10.0, 7.0, 11.0, 8.0, 11.0, 19.0, 13.0, 18.0, 18.0, 26.0, 21.0, 23.0, 22.0, 29.0, 38.0, 36.0, 37.0, 37.0, 36.0, 41.0, 42.0, 44.0, 34.0, 47.0, 34.0, 31.0, 41.0, 33.0, 29.0, 31.0, 33.0, 21.0, 18.0, 15.0, 13.0, 10.0, 13.0, 6.0, 9.0, 10.0, 7.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.318359375, -1.2775726318359375, -1.236785888671875, -1.1959991455078125, -1.15521240234375, -1.1144256591796875, -1.073638916015625, -1.0328521728515625, -0.9920654296875, -0.9512786865234375, -0.910491943359375, -0.8697052001953125, -0.82891845703125, -0.7881317138671875, -0.747344970703125, -0.7065582275390625, -0.665771484375, -0.6249847412109375, -0.584197998046875, -0.5434112548828125, -0.50262451171875, -0.4618377685546875, -0.421051025390625, -0.3802642822265625, -0.3394775390625, -0.2986907958984375, -0.257904052734375, -0.2171173095703125, -0.17633056640625, -0.1355438232421875, -0.094757080078125, -0.0539703369140625, -0.01318359375, 0.0276031494140625, 0.068389892578125, 0.1091766357421875, 0.14996337890625, 0.1907501220703125, 0.231536865234375, 0.2723236083984375, 0.3131103515625, 0.3538970947265625, 0.394683837890625, 0.4354705810546875, 0.47625732421875, 0.5170440673828125, 0.557830810546875, 0.5986175537109375, 0.639404296875, 0.6801910400390625, 0.720977783203125, 0.7617645263671875, 0.80255126953125, 0.8433380126953125, 0.884124755859375, 0.9249114990234375, 0.9656982421875, 1.0064849853515625, 1.047271728515625, 1.0880584716796875, 1.12884521484375, 1.1696319580078125, 1.210418701171875, 1.2512054443359375, 1.2919921875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 4.0, 7.0, 9.0, 15.0, 15.0, 16.0, 34.0, 44.0, 46.0, 61.0, 93.0, 109.0, 160.0, 244.0, 322.0, 524.0, 1096.0, 3307.0, 20050.0, 430954.0, 3553585.0, 167514.0, 11330.0, 2331.0, 861.0, 439.0, 340.0, 205.0, 162.0, 85.0, 91.0, 67.0, 33.0, 33.0, 30.0, 19.0, 10.0, 8.0, 10.0, 3.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.6171875, -10.3170166015625, -10.016845703125, -9.7166748046875, -9.41650390625, -9.1163330078125, -8.816162109375, -8.5159912109375, -8.2158203125, -7.9156494140625, -7.615478515625, -7.3153076171875, -7.01513671875, -6.7149658203125, -6.414794921875, -6.1146240234375, -5.814453125, -5.5142822265625, -5.214111328125, -4.9139404296875, -4.61376953125, -4.3135986328125, -4.013427734375, -3.7132568359375, -3.4130859375, -3.1129150390625, -2.812744140625, -2.5125732421875, -2.21240234375, -1.9122314453125, -1.612060546875, -1.3118896484375, -1.01171875, -0.7115478515625, -0.411376953125, -0.1112060546875, 0.18896484375, 0.4891357421875, 0.789306640625, 1.0894775390625, 1.3896484375, 1.6898193359375, 1.989990234375, 2.2901611328125, 2.59033203125, 2.8905029296875, 3.190673828125, 3.4908447265625, 3.791015625, 4.0911865234375, 4.391357421875, 4.6915283203125, 4.99169921875, 5.2918701171875, 5.592041015625, 5.8922119140625, 6.1923828125, 6.4925537109375, 6.792724609375, 7.0928955078125, 7.39306640625, 7.6932373046875, 7.993408203125, 8.2935791015625, 8.59375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 11.0, 33.0, 42.0, 80.0, 157.0, 272.0, 579.0, 826.0, 872.0, 505.0, 328.0, 159.0, 95.0, 45.0, 24.0, 24.0, 7.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-12.3515625, -12.082763671875, -11.81396484375, -11.545166015625, -11.2763671875, -11.007568359375, -10.73876953125, -10.469970703125, -10.201171875, -9.932373046875, -9.66357421875, -9.394775390625, -9.1259765625, -8.857177734375, -8.58837890625, -8.319580078125, -8.05078125, -7.781982421875, -7.51318359375, -7.244384765625, -6.9755859375, -6.706787109375, -6.43798828125, -6.169189453125, -5.900390625, -5.631591796875, -5.36279296875, -5.093994140625, -4.8251953125, -4.556396484375, -4.28759765625, -4.018798828125, -3.75, -3.481201171875, -3.21240234375, -2.943603515625, -2.6748046875, -2.406005859375, -2.13720703125, -1.868408203125, -1.599609375, -1.330810546875, -1.06201171875, -0.793212890625, -0.5244140625, -0.255615234375, 0.01318359375, 0.281982421875, 0.55078125, 0.819580078125, 1.08837890625, 1.357177734375, 1.6259765625, 1.894775390625, 2.16357421875, 2.432373046875, 2.701171875, 2.969970703125, 3.23876953125, 3.507568359375, 3.7763671875, 4.045166015625, 4.31396484375, 4.582763671875, 4.8515625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 12.0, 11.0, 14.0, 31.0, 49.0, 94.0, 208.0, 410.0, 969.0, 3104.0, 15609.0, 303122.0, 3514074.0, 335446.0, 16152.0, 3120.0, 989.0, 422.0, 194.0, 108.0, 53.0, 29.0, 20.0, 11.0, 5.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.875, -16.412841796875, -15.95068359375, -15.488525390625, -15.0263671875, -14.564208984375, -14.10205078125, -13.639892578125, -13.177734375, -12.715576171875, -12.25341796875, -11.791259765625, -11.3291015625, -10.866943359375, -10.40478515625, -9.942626953125, -9.48046875, -9.018310546875, -8.55615234375, -8.093994140625, -7.6318359375, -7.169677734375, -6.70751953125, -6.245361328125, -5.783203125, -5.321044921875, -4.85888671875, -4.396728515625, -3.9345703125, -3.472412109375, -3.01025390625, -2.548095703125, -2.0859375, -1.623779296875, -1.16162109375, -0.699462890625, -0.2373046875, 0.224853515625, 0.68701171875, 1.149169921875, 1.611328125, 2.073486328125, 2.53564453125, 2.997802734375, 3.4599609375, 3.922119140625, 4.38427734375, 4.846435546875, 5.30859375, 5.770751953125, 6.23291015625, 6.695068359375, 7.1572265625, 7.619384765625, 8.08154296875, 8.543701171875, 9.005859375, 9.468017578125, 9.93017578125, 10.392333984375, 10.8544921875, 11.316650390625, 11.77880859375, 12.240966796875, 12.703125]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 31.0, 155.0, 305.0, 328.0, 154.0, 28.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.87224197387695, -43.86967086791992, -41.867095947265625, -39.864524841308594, -37.8619499206543, -35.859378814697266, -33.85680389404297, -31.854232788085938, -29.851659774780273, -27.84908676147461, -25.846513748168945, -23.84394073486328, -21.84136962890625, -19.838794708251953, -17.836223602294922, -15.833650588989258, -13.831077575683594, -11.82850456237793, -9.825931549072266, -7.823359489440918, -5.820786476135254, -3.81821346282959, -1.8156414031982422, 0.18693161010742188, 2.189504623413086, 4.19207763671875, 6.194650173187256, 8.197222709655762, 10.199795722961426, 12.20236873626709, 14.204940795898438, 16.2075138092041, 18.21009063720703, 20.212663650512695, 22.21523666381836, 24.21780776977539, 26.220382690429688, 28.22295379638672, 30.225526809692383, 32.22809982299805, 34.230674743652344, 36.233245849609375, 38.23582077026367, 40.2383918762207, 42.240966796875, 44.24353790283203, 46.24610900878906, 48.24868392944336, 50.25125503540039, 52.25382614135742, 54.25640106201172, 56.25897216796875, 58.26154708862305, 60.26411819458008, 62.266693115234375, 64.2692642211914, 66.27183532714844, 68.27440643310547, 70.2769775390625, 72.27955627441406, 74.2821273803711, 76.28469848632812, 78.28726959228516, 80.28984069824219, 82.29241943359375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 4.0, 4.0, 0.0, 3.0, 6.0, 6.0, 8.0, 9.0, 12.0, 20.0, 17.0, 13.0, 21.0, 26.0, 29.0, 28.0, 31.0, 29.0, 28.0, 46.0, 41.0, 44.0, 47.0, 34.0, 46.0, 33.0, 47.0, 33.0, 26.0, 28.0, 42.0, 31.0, 25.0, 21.0, 31.0, 21.0, 34.0, 14.0, 20.0, 9.0, 10.0, 6.0, 9.0, 3.0, 9.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.536693572998047, -12.05055046081543, -11.564407348632812, -11.078264236450195, -10.592121124267578, -10.105978012084961, -9.619834899902344, -9.13369083404541, -8.647547721862793, -8.161404609680176, -7.675261497497559, -7.189118385314941, -6.702974796295166, -6.216831684112549, -5.730688571929932, -5.244544982910156, -4.758402347564697, -4.27225923538208, -3.786115884780884, -3.2999727725982666, -2.8138294219970703, -2.327686309814453, -1.841543197631836, -1.3553998470306396, -0.8692567348480225, -0.3831135332584381, 0.10302966833114624, 0.5891728401184082, 1.075316071510315, 1.5614593029022217, 2.047602415084839, 2.533745765686035, 3.0198888778686523, 3.5060319900512695, 3.992175340652466, 4.478318214416504, 4.964461803436279, 5.4506049156188965, 5.936748027801514, 6.422891616821289, 6.909034729003906, 7.395177841186523, 7.881320953369141, 8.367464065551758, 8.853607177734375, 9.339750289916992, 9.82589340209961, 10.312037467956543, 10.798179626464844, 11.284322738647461, 11.770465850830078, 12.256608963012695, 12.742752075195312, 13.22889518737793, 13.715038299560547, 14.20118236541748, 14.687325477600098, 15.173468589782715, 15.659611701965332, 16.145755767822266, 16.631898880004883, 17.1180419921875, 17.604185104370117, 18.090328216552734, 18.57647132873535]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 2.0, 6.0, 8.0, 4.0, 13.0, 9.0, 12.0, 20.0, 13.0, 16.0, 16.0, 22.0, 25.0, 20.0, 25.0, 37.0, 37.0, 36.0, 37.0, 36.0, 35.0, 52.0, 45.0, 44.0, 43.0, 42.0, 44.0, 31.0, 34.0, 38.0, 22.0, 27.0, 25.0, 18.0, 15.0, 20.0, 11.0, 14.0, 10.0, 7.0, 7.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3359375, -1.2928619384765625, -1.249786376953125, -1.2067108154296875, -1.16363525390625, -1.1205596923828125, -1.077484130859375, -1.0344085693359375, -0.9913330078125, -0.9482574462890625, -0.905181884765625, -0.8621063232421875, -0.81903076171875, -0.7759552001953125, -0.732879638671875, -0.6898040771484375, -0.646728515625, -0.6036529541015625, -0.560577392578125, -0.5175018310546875, -0.47442626953125, -0.4313507080078125, -0.388275146484375, -0.3451995849609375, -0.3021240234375, -0.2590484619140625, -0.215972900390625, -0.1728973388671875, -0.12982177734375, -0.0867462158203125, -0.043670654296875, -0.0005950927734375, 0.04248046875, 0.0855560302734375, 0.128631591796875, 0.1717071533203125, 0.21478271484375, 0.2578582763671875, 0.300933837890625, 0.3440093994140625, 0.3870849609375, 0.4301605224609375, 0.473236083984375, 0.5163116455078125, 0.55938720703125, 0.6024627685546875, 0.645538330078125, 0.6886138916015625, 0.731689453125, 0.7747650146484375, 0.817840576171875, 0.8609161376953125, 0.90399169921875, 0.9470672607421875, 0.990142822265625, 1.0332183837890625, 1.0762939453125, 1.1193695068359375, 1.162445068359375, 1.2055206298828125, 1.24859619140625, 1.2916717529296875, 1.334747314453125, 1.3778228759765625, 1.4208984375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 13.0, 8.0, 22.0, 34.0, 44.0, 81.0, 124.0, 170.0, 262.0, 374.0, 600.0, 847.0, 1299.0, 1907.0, 2779.0, 4209.0, 6167.0, 9428.0, 14311.0, 22408.0, 35821.0, 59177.0, 104697.0, 244588.0, 267200.0, 107883.0, 60822.0, 36675.0, 22996.0, 14560.0, 9678.0, 6318.0, 4277.0, 2862.0, 1918.0, 1317.0, 869.0, 622.0, 382.0, 271.0, 182.0, 128.0, 72.0, 54.0, 36.0, 25.0, 18.0, 6.0, 7.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057281494140625, -0.0554351806640625, -0.0535888671875, -0.0517425537109375, -0.049896240234375, -0.0480499267578125, -0.04620361328125, -0.0443572998046875, -0.042510986328125, -0.0406646728515625, -0.038818359375, -0.0369720458984375, -0.035125732421875, -0.0332794189453125, -0.03143310546875, -0.0295867919921875, -0.027740478515625, -0.0258941650390625, -0.0240478515625, -0.0222015380859375, -0.020355224609375, -0.0185089111328125, -0.01666259765625, -0.0148162841796875, -0.012969970703125, -0.0111236572265625, -0.00927734375, -0.0074310302734375, -0.005584716796875, -0.0037384033203125, -0.00189208984375, -4.57763671875e-05, 0.001800537109375, 0.0036468505859375, 0.0054931640625, 0.0073394775390625, 0.009185791015625, 0.0110321044921875, 0.01287841796875, 0.0147247314453125, 0.016571044921875, 0.0184173583984375, 0.020263671875, 0.0221099853515625, 0.023956298828125, 0.0258026123046875, 0.02764892578125, 0.0294952392578125, 0.031341552734375, 0.0331878662109375, 0.0350341796875, 0.0368804931640625, 0.038726806640625, 0.0405731201171875, 0.04241943359375, 0.0442657470703125, 0.046112060546875, 0.0479583740234375, 0.0498046875, 0.0516510009765625, 0.053497314453125, 0.0553436279296875, 0.05718994140625, 0.0590362548828125, 0.060882568359375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 2.0, 6.0, 5.0, 13.0, 8.0, 12.0, 11.0, 14.0, 12.0, 22.0, 24.0, 20.0, 27.0, 30.0, 23.0, 46.0, 27.0, 41.0, 39.0, 46.0, 42.0, 1067.0, 33.0, 25.0, 31.0, 36.0, 46.0, 38.0, 31.0, 36.0, 32.0, 23.0, 18.0, 23.0, 26.0, 16.0, 10.0, 5.0, 11.0, 10.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.17578125, -1.1416778564453125, -1.107574462890625, -1.0734710693359375, -1.03936767578125, -1.0052642822265625, -0.971160888671875, -0.9370574951171875, -0.9029541015625, -0.8688507080078125, -0.834747314453125, -0.8006439208984375, -0.76654052734375, -0.7324371337890625, -0.698333740234375, -0.6642303466796875, -0.630126953125, -0.5960235595703125, -0.561920166015625, -0.5278167724609375, -0.49371337890625, -0.4596099853515625, -0.425506591796875, -0.3914031982421875, -0.3572998046875, -0.3231964111328125, -0.289093017578125, -0.2549896240234375, -0.22088623046875, -0.1867828369140625, -0.152679443359375, -0.1185760498046875, -0.08447265625, -0.0503692626953125, -0.016265869140625, 0.0178375244140625, 0.05194091796875, 0.0860443115234375, 0.120147705078125, 0.1542510986328125, 0.1883544921875, 0.2224578857421875, 0.256561279296875, 0.2906646728515625, 0.32476806640625, 0.3588714599609375, 0.392974853515625, 0.4270782470703125, 0.461181640625, 0.4952850341796875, 0.529388427734375, 0.5634918212890625, 0.59759521484375, 0.6316986083984375, 0.665802001953125, 0.6999053955078125, 0.7340087890625, 0.7681121826171875, 0.802215576171875, 0.8363189697265625, 0.87042236328125, 0.9045257568359375, 0.938629150390625, 0.9727325439453125, 1.0068359375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 5.0, 15.0, 19.0, 26.0, 46.0, 63.0, 102.0, 151.0, 235.0, 322.0, 490.0, 749.0, 1109.0, 1530.0, 2254.0, 3375.0, 4805.0, 6972.0, 10548.0, 15341.0, 23550.0, 36394.0, 59221.0, 100810.0, 200481.0, 1325062.0, 116858.0, 66706.0, 40883.0, 25893.0, 17302.0, 11260.0, 7711.0, 5313.0, 3634.0, 2483.0, 1736.0, 1169.0, 807.0, 560.0, 374.0, 259.0, 186.0, 116.0, 74.0, 49.0, 34.0, 22.0, 11.0, 9.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03204345703125, -0.031013965606689453, -0.029984474182128906, -0.02895498275756836, -0.027925491333007812, -0.026895999908447266, -0.02586650848388672, -0.024837017059326172, -0.023807525634765625, -0.022778034210205078, -0.02174854278564453, -0.020719051361083984, -0.019689559936523438, -0.01866006851196289, -0.017630577087402344, -0.016601085662841797, -0.01557159423828125, -0.014542102813720703, -0.013512611389160156, -0.01248311996459961, -0.011453628540039062, -0.010424137115478516, -0.009394645690917969, -0.008365154266357422, -0.007335662841796875, -0.006306171417236328, -0.005276679992675781, -0.004247188568115234, -0.0032176971435546875, -0.0021882057189941406, -0.0011587142944335938, -0.00012922286987304688, 0.0009002685546875, 0.0019297599792480469, 0.0029592514038085938, 0.003988742828369141, 0.0050182342529296875, 0.006047725677490234, 0.007077217102050781, 0.008106708526611328, 0.009136199951171875, 0.010165691375732422, 0.011195182800292969, 0.012224674224853516, 0.013254165649414062, 0.01428365707397461, 0.015313148498535156, 0.016342639923095703, 0.01737213134765625, 0.018401622772216797, 0.019431114196777344, 0.02046060562133789, 0.021490097045898438, 0.022519588470458984, 0.02354907989501953, 0.024578571319580078, 0.025608062744140625, 0.026637554168701172, 0.02766704559326172, 0.028696537017822266, 0.029726028442382812, 0.03075551986694336, 0.031785011291503906, 0.03281450271606445, 0.033843994140625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 8.0, 0.0, 6.0, 14.0, 0.0, 11.0, 33.0, 0.0, 43.0, 98.0, 565.0, 0.0, 90.0, 53.0, 0.0, 23.0, 22.0, 10.0, 0.0, 10.0, 4.0, 0.0, 5.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2097880244255066e-06, -1.16787850856781e-06, -1.1259689927101135e-06, -1.084059476852417e-06, -1.0421499609947205e-06, -1.000240445137024e-06, -9.583309292793274e-07, -9.164214134216309e-07, -8.745118975639343e-07, -8.326023817062378e-07, -7.906928658485413e-07, -7.487833499908447e-07, -7.068738341331482e-07, -6.649643182754517e-07, -6.230548024177551e-07, -5.811452865600586e-07, -5.392357707023621e-07, -4.973262548446655e-07, -4.55416738986969e-07, -4.1350722312927246e-07, -3.7159770727157593e-07, -3.296881914138794e-07, -2.8777867555618286e-07, -2.4586915969848633e-07, -2.039596438407898e-07, -1.6205012798309326e-07, -1.2014061212539673e-07, -7.82310962677002e-08, -3.632158041000366e-08, 5.587935447692871e-09, 4.7497451305389404e-08, 8.940696716308594e-08, 1.3131648302078247e-07, 1.73225998878479e-07, 2.1513551473617554e-07, 2.5704503059387207e-07, 2.989545464515686e-07, 3.4086406230926514e-07, 3.8277357816696167e-07, 4.246830940246582e-07, 4.6659260988235474e-07, 5.085021257400513e-07, 5.504116415977478e-07, 5.923211574554443e-07, 6.342306733131409e-07, 6.761401891708374e-07, 7.180497050285339e-07, 7.599592208862305e-07, 8.01868736743927e-07, 8.437782526016235e-07, 8.856877684593201e-07, 9.275972843170166e-07, 9.695068001747131e-07, 1.0114163160324097e-06, 1.0533258318901062e-06, 1.0952353477478027e-06, 1.1371448636054993e-06, 1.1790543794631958e-06, 1.2209638953208923e-06, 1.2628734111785889e-06, 1.3047829270362854e-06, 1.346692442893982e-06, 1.3886019587516785e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 8.0, 8.0, 1.0, 3.0, 3.0, 3.0, 11.0, 13.0, 11.0, 26.0, 32.0, 31.0, 59.0, 89.0, 187.0, 648.0, 72994.0, 972601.0, 1259.0, 200.0, 117.0, 60.0, 49.0, 30.0, 20.0, 21.0, 19.0, 4.0, 9.0, 5.0, 4.0, 7.0, 6.0, 4.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9371509552001953e-05, -1.87065452337265e-05, -1.804158091545105e-05, -1.7376616597175598e-05, -1.6711652278900146e-05, -1.6046687960624695e-05, -1.5381723642349243e-05, -1.4716759324073792e-05, -1.405179500579834e-05, -1.3386830687522888e-05, -1.2721866369247437e-05, -1.2056902050971985e-05, -1.1391937732696533e-05, -1.0726973414421082e-05, -1.006200909614563e-05, -9.397044777870178e-06, -8.732080459594727e-06, -8.067116141319275e-06, -7.402151823043823e-06, -6.737187504768372e-06, -6.07222318649292e-06, -5.407258868217468e-06, -4.742294549942017e-06, -4.077330231666565e-06, -3.4123659133911133e-06, -2.7474015951156616e-06, -2.08243727684021e-06, -1.4174729585647583e-06, -7.525086402893066e-07, -8.754432201385498e-08, 5.774199962615967e-07, 1.2423843145370483e-06, 1.9073486328125e-06, 2.5723129510879517e-06, 3.2372772693634033e-06, 3.902241587638855e-06, 4.567205905914307e-06, 5.232170224189758e-06, 5.89713454246521e-06, 6.562098860740662e-06, 7.227063179016113e-06, 7.892027497291565e-06, 8.556991815567017e-06, 9.221956133842468e-06, 9.88692045211792e-06, 1.0551884770393372e-05, 1.1216849088668823e-05, 1.1881813406944275e-05, 1.2546777725219727e-05, 1.3211742043495178e-05, 1.387670636177063e-05, 1.4541670680046082e-05, 1.5206634998321533e-05, 1.5871599316596985e-05, 1.6536563634872437e-05, 1.7201527953147888e-05, 1.786649227142334e-05, 1.853145658969879e-05, 1.9196420907974243e-05, 1.9861385226249695e-05, 2.0526349544525146e-05, 2.1191313862800598e-05, 2.185627818107605e-05, 2.25212424993515e-05, 2.3186206817626953e-05]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 15.0, 9.0, 12.0, 7.0, 7.0, 18.0, 14.0, 11.0, 805.0, 20.0, 15.0, 12.0, 14.0, 7.0, 7.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.351340443989102e-07, -1.303858283563386e-07, -1.2563761231376702e-07, -1.2088939627119544e-07, -1.1614118733405121e-07, -1.1139297129147963e-07, -1.066447623543354e-07, -1.0189654631176381e-07, -9.714833026919223e-08, -9.240011422662064e-08, -8.765189818404906e-08, -8.290368924690483e-08, -7.815547320433325e-08, -7.340725716176166e-08, -6.865904822461744e-08, -6.391083218204585e-08, -5.9162616139474267e-08, -5.441440009690268e-08, -4.9666187607044776e-08, -4.491797511718687e-08, -4.0169759074615285e-08, -3.54215430320437e-08, -3.0673330542185795e-08, -2.592511805232789e-08, -2.1176902009756304e-08, -1.642868774354156e-08, -1.1680473477326814e-08, -6.9322592111120684e-09, -2.184044944897323e-09, 2.564169321317422e-09, 7.3123835875321674e-09, 1.2060596077390073e-08, 1.6808812119961658e-08, 2.1557026386176403e-08, 2.630524065239115e-08, 3.1053453142249055e-08, 3.580166918482064e-08, 4.0549885227392224e-08, 4.529809771725013e-08, 5.0046310207108036e-08, 5.479452624967962e-08, 5.9542742292251205e-08, 6.429095833482279e-08, 6.903916727196702e-08, 7.37873833145386e-08, 7.853559935711019e-08, 8.328380829425441e-08, 8.8032024336826e-08, 9.278024037939758e-08, 9.752845642196917e-08, 1.0227667246454075e-07, 1.0702488140168498e-07, 1.1177309744425656e-07, 1.1652131348682815e-07, 1.2126952242397238e-07, 1.2601773846654396e-07, 1.3076595450911555e-07, 1.3551417055168713e-07, 1.4026238659425871e-07, 1.450106026368303e-07, 1.4975881867940188e-07, 1.5450702051111875e-07, 1.5925523655369034e-07, 1.6400345259626192e-07, 1.687516686388335e-07]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 815.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 2.0, 6.0, 8.0, 4.0, 13.0, 9.0, 12.0, 20.0, 13.0, 16.0, 16.0, 22.0, 25.0, 20.0, 25.0, 37.0, 37.0, 36.0, 37.0, 36.0, 35.0, 52.0, 45.0, 44.0, 43.0, 42.0, 44.0, 31.0, 34.0, 38.0, 22.0, 27.0, 25.0, 18.0, 15.0, 20.0, 11.0, 14.0, 10.0, 7.0, 7.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3359375, -1.2928619384765625, -1.249786376953125, -1.2067108154296875, -1.16363525390625, -1.1205596923828125, -1.077484130859375, -1.0344085693359375, -0.9913330078125, -0.9482574462890625, -0.905181884765625, -0.8621063232421875, -0.81903076171875, -0.7759552001953125, -0.732879638671875, -0.6898040771484375, -0.646728515625, -0.6036529541015625, -0.560577392578125, -0.5175018310546875, -0.47442626953125, -0.4313507080078125, -0.388275146484375, -0.3451995849609375, -0.3021240234375, -0.2590484619140625, -0.215972900390625, -0.1728973388671875, -0.12982177734375, -0.0867462158203125, -0.043670654296875, -0.0005950927734375, 0.04248046875, 0.0855560302734375, 0.128631591796875, 0.1717071533203125, 0.21478271484375, 0.2578582763671875, 0.300933837890625, 0.3440093994140625, 0.3870849609375, 0.4301605224609375, 0.473236083984375, 0.5163116455078125, 0.55938720703125, 0.6024627685546875, 0.645538330078125, 0.6886138916015625, 0.731689453125, 0.7747650146484375, 0.817840576171875, 0.8609161376953125, 0.90399169921875, 0.9470672607421875, 0.990142822265625, 1.0332183837890625, 1.0762939453125, 1.1193695068359375, 1.162445068359375, 1.2055206298828125, 1.24859619140625, 1.2916717529296875, 1.334747314453125, 1.3778228759765625, 1.4208984375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 9.0, 8.0, 30.0, 36.0, 70.0, 77.0, 121.0, 211.0, 263.0, 432.0, 682.0, 1033.0, 1595.0, 2490.0, 4184.0, 7699.0, 14349.0, 29584.0, 66354.0, 157552.0, 368903.0, 221806.0, 89549.0, 39856.0, 18386.0, 9696.0, 5271.0, 3071.0, 1835.0, 1149.0, 764.0, 479.0, 329.0, 225.0, 154.0, 94.0, 76.0, 33.0, 30.0, 18.0, 13.0, 10.0, 9.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.974609375, -1.915985107421875, -1.85736083984375, -1.798736572265625, -1.7401123046875, -1.681488037109375, -1.62286376953125, -1.564239501953125, -1.505615234375, -1.446990966796875, -1.38836669921875, -1.329742431640625, -1.2711181640625, -1.212493896484375, -1.15386962890625, -1.095245361328125, -1.03662109375, -0.977996826171875, -0.91937255859375, -0.860748291015625, -0.8021240234375, -0.743499755859375, -0.68487548828125, -0.626251220703125, -0.567626953125, -0.509002685546875, -0.45037841796875, -0.391754150390625, -0.3331298828125, -0.274505615234375, -0.21588134765625, -0.157257080078125, -0.0986328125, -0.040008544921875, 0.01861572265625, 0.077239990234375, 0.1358642578125, 0.194488525390625, 0.25311279296875, 0.311737060546875, 0.370361328125, 0.428985595703125, 0.48760986328125, 0.546234130859375, 0.6048583984375, 0.663482666015625, 0.72210693359375, 0.780731201171875, 0.83935546875, 0.897979736328125, 0.95660400390625, 1.015228271484375, 1.0738525390625, 1.132476806640625, 1.19110107421875, 1.249725341796875, 1.308349609375, 1.366973876953125, 1.42559814453125, 1.484222412109375, 1.5428466796875, 1.601470947265625, 1.66009521484375, 1.718719482421875, 1.77734375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 2.0, 6.0, 4.0, 13.0, 11.0, 5.0, 17.0, 17.0, 39.0, 30.0, 30.0, 34.0, 46.0, 46.0, 54.0, 65.0, 110.0, 210.0, 1562.0, 212.0, 101.0, 74.0, 55.0, 48.0, 34.0, 52.0, 33.0, 27.0, 11.0, 27.0, 14.0, 9.0, 8.0, 14.0, 5.0, 2.0, 4.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.05078125, -4.8797607421875, -4.708740234375, -4.5377197265625, -4.36669921875, -4.1956787109375, -4.024658203125, -3.8536376953125, -3.6826171875, -3.5115966796875, -3.340576171875, -3.1695556640625, -2.99853515625, -2.8275146484375, -2.656494140625, -2.4854736328125, -2.314453125, -2.1434326171875, -1.972412109375, -1.8013916015625, -1.63037109375, -1.4593505859375, -1.288330078125, -1.1173095703125, -0.9462890625, -0.7752685546875, -0.604248046875, -0.4332275390625, -0.26220703125, -0.0911865234375, 0.079833984375, 0.2508544921875, 0.421875, 0.5928955078125, 0.763916015625, 0.9349365234375, 1.10595703125, 1.2769775390625, 1.447998046875, 1.6190185546875, 1.7900390625, 1.9610595703125, 2.132080078125, 2.3031005859375, 2.47412109375, 2.6451416015625, 2.816162109375, 2.9871826171875, 3.158203125, 3.3292236328125, 3.500244140625, 3.6712646484375, 3.84228515625, 4.0133056640625, 4.184326171875, 4.3553466796875, 4.5263671875, 4.6973876953125, 4.868408203125, 5.0394287109375, 5.21044921875, 5.3814697265625, 5.552490234375, 5.7235107421875, 5.89453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 3.0, 1.0, 6.0, 9.0, 6.0, 13.0, 11.0, 15.0, 18.0, 24.0, 45.0, 53.0, 53.0, 83.0, 181.0, 438.0, 1653.0, 35859.0, 2998039.0, 105260.0, 2801.0, 493.0, 219.0, 122.0, 76.0, 37.0, 43.0, 35.0, 25.0, 23.0, 13.0, 7.0, 12.0, 7.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.828125, -13.4285888671875, -13.029052734375, -12.6295166015625, -12.22998046875, -11.8304443359375, -11.430908203125, -11.0313720703125, -10.6318359375, -10.2322998046875, -9.832763671875, -9.4332275390625, -9.03369140625, -8.6341552734375, -8.234619140625, -7.8350830078125, -7.435546875, -7.0360107421875, -6.636474609375, -6.2369384765625, -5.83740234375, -5.4378662109375, -5.038330078125, -4.6387939453125, -4.2392578125, -3.8397216796875, -3.440185546875, -3.0406494140625, -2.64111328125, -2.2415771484375, -1.842041015625, -1.4425048828125, -1.04296875, -0.6434326171875, -0.243896484375, 0.1556396484375, 0.55517578125, 0.9547119140625, 1.354248046875, 1.7537841796875, 2.1533203125, 2.5528564453125, 2.952392578125, 3.3519287109375, 3.75146484375, 4.1510009765625, 4.550537109375, 4.9500732421875, 5.349609375, 5.7491455078125, 6.148681640625, 6.5482177734375, 6.94775390625, 7.3472900390625, 7.746826171875, 8.1463623046875, 8.5458984375, 8.9454345703125, 9.344970703125, 9.7445068359375, 10.14404296875, 10.5435791015625, 10.943115234375, 11.3426513671875, 11.7421875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 15.0, 26.0, 43.0, 95.0, 158.0, 206.0, 180.0, 121.0, 75.0, 48.0, 22.0, 10.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.23815155029297, -15.808196067810059, -15.378240585327148, -14.948284149169922, -14.518328666687012, -14.088373184204102, -13.658417701721191, -13.228462219238281, -12.798505783081055, -12.368550300598145, -11.938594818115234, -11.508638381958008, -11.078682899475098, -10.648727416992188, -10.218771934509277, -9.788816452026367, -9.358860969543457, -8.928905487060547, -8.498950004577637, -8.068994522094727, -7.6390380859375, -7.20908260345459, -6.77912712097168, -6.3491716384887695, -5.919215679168701, -5.489260196685791, -5.059304237365723, -4.6293487548828125, -4.199393272399902, -3.769437313079834, -3.339481830596924, -2.9095261096954346, -2.4795703887939453, -2.049614667892456, -1.6196590662002563, -1.1897034645080566, -0.7597477436065674, -0.3297920227050781, 0.10016345977783203, 0.5301191806793213, 0.9600749015808105, 1.3900306224822998, 1.8199862241744995, 2.249941825866699, 2.6798975467681885, 3.1098532676696777, 3.539808750152588, 3.969764471054077, 4.399720191955566, 4.829675674438477, 5.259631633758545, 5.689587116241455, 6.119543075561523, 6.549498558044434, 6.979454040527344, 7.409409523010254, 7.839365482330322, 8.26932144165039, 8.6992769241333, 9.129232406616211, 9.559187889099121, 9.989143371582031, 10.419099807739258, 10.849055290222168, 11.279010772705078]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 15.0, 10.0, 18.0, 19.0, 23.0, 22.0, 18.0, 14.0, 22.0, 23.0, 36.0, 35.0, 41.0, 40.0, 47.0, 42.0, 42.0, 51.0, 34.0, 42.0, 41.0, 41.0, 26.0, 43.0, 35.0, 30.0, 28.0, 25.0, 20.0, 24.0, 22.0, 13.0, 17.0, 12.0, 9.0, 5.0, 2.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.803150177001953, -16.246971130371094, -15.69079303741455, -15.134614944458008, -14.578435897827148, -14.022256851196289, -13.466078758239746, -12.909900665283203, -12.353721618652344, -11.797542572021484, -11.241364479064941, -10.685186386108398, -10.129007339477539, -9.57282829284668, -9.016650199890137, -8.460472106933594, -7.904293060302734, -7.348114490509033, -6.791935920715332, -6.235757350921631, -5.67957878112793, -5.1234002113342285, -4.567221641540527, -4.011043071746826, -3.454864501953125, -2.898685932159424, -2.3425073623657227, -1.7863287925720215, -1.2301502227783203, -0.6739716529846191, -0.11779308319091797, 0.4383854866027832, 0.9945621490478516, 1.5507407188415527, 2.106919288635254, 2.663097858428955, 3.2192764282226562, 3.7754549980163574, 4.331633567810059, 4.88781213760376, 5.443990707397461, 6.000169277191162, 6.556347846984863, 7.1125264167785645, 7.668704986572266, 8.224884033203125, 8.781062126159668, 9.337240219116211, 9.89341926574707, 10.44959831237793, 11.005776405334473, 11.561954498291016, 12.118133544921875, 12.674312591552734, 13.230490684509277, 13.78666877746582, 14.34284782409668, 14.899026870727539, 15.455204963684082, 16.011383056640625, 16.567562103271484, 17.123741149902344, 17.679920196533203, 18.23609733581543, 18.79227638244629]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 6.0, 11.0, 10.0, 17.0, 20.0, 10.0, 17.0, 17.0, 22.0, 23.0, 21.0, 25.0, 34.0, 37.0, 29.0, 42.0, 40.0, 41.0, 39.0, 41.0, 42.0, 51.0, 43.0, 35.0, 41.0, 42.0, 22.0, 25.0, 25.0, 22.0, 21.0, 24.0, 11.0, 15.0, 16.0, 9.0, 9.0, 7.0, 8.0, 9.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.302734375, -1.259521484375, -1.21630859375, -1.173095703125, -1.1298828125, -1.086669921875, -1.04345703125, -1.000244140625, -0.95703125, -0.913818359375, -0.87060546875, -0.827392578125, -0.7841796875, -0.740966796875, -0.69775390625, -0.654541015625, -0.611328125, -0.568115234375, -0.52490234375, -0.481689453125, -0.4384765625, -0.395263671875, -0.35205078125, -0.308837890625, -0.265625, -0.222412109375, -0.17919921875, -0.135986328125, -0.0927734375, -0.049560546875, -0.00634765625, 0.036865234375, 0.080078125, 0.123291015625, 0.16650390625, 0.209716796875, 0.2529296875, 0.296142578125, 0.33935546875, 0.382568359375, 0.42578125, 0.468994140625, 0.51220703125, 0.555419921875, 0.5986328125, 0.641845703125, 0.68505859375, 0.728271484375, 0.771484375, 0.814697265625, 0.85791015625, 0.901123046875, 0.9443359375, 0.987548828125, 1.03076171875, 1.073974609375, 1.1171875, 1.160400390625, 1.20361328125, 1.246826171875, 1.2900390625, 1.333251953125, 1.37646484375, 1.419677734375, 1.462890625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 11.0, 5.0, 8.0, 5.0, 14.0, 10.0, 14.0, 22.0, 23.0, 35.0, 30.0, 35.0, 41.0, 49.0, 60.0, 107.0, 140.0, 258.0, 521.0, 1206.0, 3735.0, 15942.0, 100318.0, 966413.0, 2725662.0, 326187.0, 41724.0, 7769.0, 2090.0, 722.0, 377.0, 191.0, 102.0, 87.0, 69.0, 61.0, 35.0, 29.0, 34.0, 31.0, 19.0, 14.0, 19.0, 17.0, 11.0, 15.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.32421875, -6.1341552734375, -5.944091796875, -5.7540283203125, -5.56396484375, -5.3739013671875, -5.183837890625, -4.9937744140625, -4.8037109375, -4.6136474609375, -4.423583984375, -4.2335205078125, -4.04345703125, -3.8533935546875, -3.663330078125, -3.4732666015625, -3.283203125, -3.0931396484375, -2.903076171875, -2.7130126953125, -2.52294921875, -2.3328857421875, -2.142822265625, -1.9527587890625, -1.7626953125, -1.5726318359375, -1.382568359375, -1.1925048828125, -1.00244140625, -0.8123779296875, -0.622314453125, -0.4322509765625, -0.2421875, -0.0521240234375, 0.137939453125, 0.3280029296875, 0.51806640625, 0.7081298828125, 0.898193359375, 1.0882568359375, 1.2783203125, 1.4683837890625, 1.658447265625, 1.8485107421875, 2.03857421875, 2.2286376953125, 2.418701171875, 2.6087646484375, 2.798828125, 2.9888916015625, 3.178955078125, 3.3690185546875, 3.55908203125, 3.7491455078125, 3.939208984375, 4.1292724609375, 4.3193359375, 4.5093994140625, 4.699462890625, 4.8895263671875, 5.07958984375, 5.2696533203125, 5.459716796875, 5.6497802734375, 5.83984375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 9.0, 18.0, 27.0, 25.0, 54.0, 80.0, 142.0, 208.0, 306.0, 466.0, 677.0, 667.0, 481.0, 328.0, 216.0, 155.0, 81.0, 52.0, 37.0, 17.0, 11.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.696533203125, -8.47900390625, -8.261474609375, -8.0439453125, -7.826416015625, -7.60888671875, -7.391357421875, -7.173828125, -6.956298828125, -6.73876953125, -6.521240234375, -6.3037109375, -6.086181640625, -5.86865234375, -5.651123046875, -5.43359375, -5.216064453125, -4.99853515625, -4.781005859375, -4.5634765625, -4.345947265625, -4.12841796875, -3.910888671875, -3.693359375, -3.475830078125, -3.25830078125, -3.040771484375, -2.8232421875, -2.605712890625, -2.38818359375, -2.170654296875, -1.953125, -1.735595703125, -1.51806640625, -1.300537109375, -1.0830078125, -0.865478515625, -0.64794921875, -0.430419921875, -0.212890625, 0.004638671875, 0.22216796875, 0.439697265625, 0.6572265625, 0.874755859375, 1.09228515625, 1.309814453125, 1.52734375, 1.744873046875, 1.96240234375, 2.179931640625, 2.3974609375, 2.614990234375, 2.83251953125, 3.050048828125, 3.267578125, 3.485107421875, 3.70263671875, 3.920166015625, 4.1376953125, 4.355224609375, 4.57275390625, 4.790283203125, 5.0078125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 10.0, 22.0, 30.0, 55.0, 97.0, 152.0, 290.0, 535.0, 1161.0, 2696.0, 9550.0, 55497.0, 497295.0, 2770106.0, 757435.0, 80811.0, 12502.0, 3316.0, 1325.0, 599.0, 346.0, 187.0, 104.0, 59.0, 32.0, 20.0, 13.0, 9.0, 10.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.40625, -9.08837890625, -8.7705078125, -8.45263671875, -8.134765625, -7.81689453125, -7.4990234375, -7.18115234375, -6.86328125, -6.54541015625, -6.2275390625, -5.90966796875, -5.591796875, -5.27392578125, -4.9560546875, -4.63818359375, -4.3203125, -4.00244140625, -3.6845703125, -3.36669921875, -3.048828125, -2.73095703125, -2.4130859375, -2.09521484375, -1.77734375, -1.45947265625, -1.1416015625, -0.82373046875, -0.505859375, -0.18798828125, 0.1298828125, 0.44775390625, 0.765625, 1.08349609375, 1.4013671875, 1.71923828125, 2.037109375, 2.35498046875, 2.6728515625, 2.99072265625, 3.30859375, 3.62646484375, 3.9443359375, 4.26220703125, 4.580078125, 4.89794921875, 5.2158203125, 5.53369140625, 5.8515625, 6.16943359375, 6.4873046875, 6.80517578125, 7.123046875, 7.44091796875, 7.7587890625, 8.07666015625, 8.39453125, 8.71240234375, 9.0302734375, 9.34814453125, 9.666015625, 9.98388671875, 10.3017578125, 10.61962890625, 10.9375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 18.0, 51.0, 119.0, 224.0, 255.0, 171.0, 105.0, 57.0, 11.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.57279205322266, -92.76798248291016, -90.96317291259766, -89.15836334228516, -87.35355377197266, -85.54873657226562, -83.74392700195312, -81.93911743164062, -80.13430786132812, -78.32949829101562, -76.52468872070312, -74.71987915039062, -72.91506958007812, -71.11026000976562, -69.3054428100586, -67.5006332397461, -65.6958236694336, -63.891014099121094, -62.086204528808594, -60.28139114379883, -58.47658157348633, -56.67177200317383, -54.86696243286133, -53.06214904785156, -51.25734329223633, -49.45253372192383, -47.64772415161133, -45.84291076660156, -44.03810119628906, -42.23329162597656, -40.42848205566406, -38.62367248535156, -36.81885528564453, -35.01404571533203, -33.20923614501953, -31.4044246673584, -29.599613189697266, -27.794803619384766, -25.989994049072266, -24.185182571411133, -22.380374908447266, -20.575565338134766, -18.770753860473633, -16.965944290161133, -15.1611328125, -13.3563232421875, -11.551512718200684, -9.746702194213867, -7.941890716552734, -6.137080192565918, -4.332269668579102, -2.5274596214294434, -0.722649097442627, 1.0821609497070312, 2.8869714736938477, 4.691781997680664, 6.4965925216674805, 8.301403045654297, 10.106213569641113, 11.91102409362793, 13.71583366394043, 15.520644187927246, 17.325454711914062, 19.130264282226562, 20.935075759887695]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 5.0, 3.0, 4.0, 7.0, 3.0, 15.0, 17.0, 19.0, 25.0, 23.0, 30.0, 27.0, 37.0, 49.0, 38.0, 51.0, 30.0, 48.0, 39.0, 43.0, 43.0, 39.0, 41.0, 34.0, 46.0, 36.0, 44.0, 27.0, 19.0, 29.0, 19.0, 15.0, 21.0, 21.0, 10.0, 13.0, 12.0, 7.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.511360168457031, -14.975646018981934, -14.439931869506836, -13.904217720031738, -13.36850357055664, -12.83279037475586, -12.297076225280762, -11.761362075805664, -11.225647926330566, -10.689933776855469, -10.154219627380371, -9.618505477905273, -9.082792282104492, -8.547077178955078, -8.011363983154297, -7.475649833679199, -6.939935684204102, -6.404221534729004, -5.868507385253906, -5.332793712615967, -4.797079563140869, -4.2613654136657715, -3.725651502609253, -3.1899375915527344, -2.6542234420776367, -2.118509292602539, -1.5827953815460205, -1.0470813512802124, -0.5113673210144043, 0.02434682846069336, 0.5600607395172119, 1.0957746505737305, 1.631490707397461, 2.1672048568725586, 2.702918767929077, 3.2386326789855957, 3.7743468284606934, 4.310060977935791, 4.8457746505737305, 5.381488800048828, 5.917202949523926, 6.452917098999023, 6.988631248474121, 7.5243449211120605, 8.06005859375, 8.595773696899414, 9.131486892700195, 9.667201042175293, 10.20291519165039, 10.738629341125488, 11.274343490600586, 11.810057640075684, 12.345771789550781, 12.881484985351562, 13.41719913482666, 13.952913284301758, 14.488627433776855, 15.024341583251953, 15.56005573272705, 16.09576988220215, 16.63148307800293, 17.167198181152344, 17.702911376953125, 18.238624572753906, 18.77433967590332]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 5.0, 1.0, 5.0, 8.0, 9.0, 7.0, 10.0, 16.0, 16.0, 18.0, 17.0, 18.0, 15.0, 20.0, 24.0, 22.0, 30.0, 37.0, 41.0, 31.0, 34.0, 42.0, 45.0, 50.0, 41.0, 31.0, 36.0, 37.0, 32.0, 37.0, 37.0, 22.0, 30.0, 23.0, 20.0, 25.0, 16.0, 26.0, 10.0, 11.0, 12.0, 7.0, 11.0, 6.0, 3.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2446746826171875, -1.201263427734375, -1.1578521728515625, -1.11444091796875, -1.0710296630859375, -1.027618408203125, -0.9842071533203125, -0.9407958984375, -0.8973846435546875, -0.853973388671875, -0.8105621337890625, -0.76715087890625, -0.7237396240234375, -0.680328369140625, -0.6369171142578125, -0.593505859375, -0.5500946044921875, -0.506683349609375, -0.4632720947265625, -0.41986083984375, -0.3764495849609375, -0.333038330078125, -0.2896270751953125, -0.2462158203125, -0.2028045654296875, -0.159393310546875, -0.1159820556640625, -0.07257080078125, -0.0291595458984375, 0.014251708984375, 0.0576629638671875, 0.10107421875, 0.1444854736328125, 0.187896728515625, 0.2313079833984375, 0.27471923828125, 0.3181304931640625, 0.361541748046875, 0.4049530029296875, 0.4483642578125, 0.4917755126953125, 0.535186767578125, 0.5785980224609375, 0.62200927734375, 0.6654205322265625, 0.708831787109375, 0.7522430419921875, 0.795654296875, 0.8390655517578125, 0.882476806640625, 0.9258880615234375, 0.96929931640625, 1.0127105712890625, 1.056121826171875, 1.0995330810546875, 1.1429443359375, 1.1863555908203125, 1.229766845703125, 1.2731781005859375, 1.31658935546875, 1.3600006103515625, 1.403411865234375, 1.4468231201171875, 1.490234375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 12.0, 14.0, 30.0, 46.0, 54.0, 80.0, 122.0, 193.0, 281.0, 408.0, 666.0, 970.0, 1472.0, 2155.0, 3313.0, 4941.0, 7601.0, 11340.0, 17061.0, 26755.0, 42617.0, 70110.0, 127787.0, 329288.0, 171468.0, 86725.0, 51588.0, 31743.0, 20413.0, 13183.0, 8743.0, 5836.0, 3852.0, 2608.0, 1724.0, 1119.0, 743.0, 523.0, 323.0, 204.0, 154.0, 97.0, 79.0, 41.0, 22.0, 15.0, 11.0, 11.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05242919921875, -0.05066347122192383, -0.048897743225097656, -0.047132015228271484, -0.04536628723144531, -0.04360055923461914, -0.04183483123779297, -0.0400691032409668, -0.038303375244140625, -0.03653764724731445, -0.03477191925048828, -0.03300619125366211, -0.031240463256835938, -0.029474735260009766, -0.027709007263183594, -0.025943279266357422, -0.02417755126953125, -0.022411823272705078, -0.020646095275878906, -0.018880367279052734, -0.017114639282226562, -0.01534891128540039, -0.013583183288574219, -0.011817455291748047, -0.010051727294921875, -0.008285999298095703, -0.006520271301269531, -0.004754543304443359, -0.0029888153076171875, -0.0012230873107910156, 0.0005426406860351562, 0.002308368682861328, 0.0040740966796875, 0.005839824676513672, 0.007605552673339844, 0.009371280670166016, 0.011137008666992188, 0.01290273666381836, 0.014668464660644531, 0.016434192657470703, 0.018199920654296875, 0.019965648651123047, 0.02173137664794922, 0.02349710464477539, 0.025262832641601562, 0.027028560638427734, 0.028794288635253906, 0.030560016632080078, 0.03232574462890625, 0.03409147262573242, 0.035857200622558594, 0.037622928619384766, 0.03938865661621094, 0.04115438461303711, 0.04292011260986328, 0.04468584060668945, 0.046451568603515625, 0.0482172966003418, 0.04998302459716797, 0.05174875259399414, 0.05351448059082031, 0.055280208587646484, 0.057045936584472656, 0.05881166458129883, 0.060577392578125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 3.0, 6.0, 3.0, 8.0, 8.0, 7.0, 3.0, 8.0, 4.0, 11.0, 16.0, 17.0, 22.0, 15.0, 21.0, 28.0, 32.0, 33.0, 31.0, 23.0, 36.0, 39.0, 33.0, 30.0, 39.0, 1052.0, 40.0, 32.0, 56.0, 28.0, 31.0, 27.0, 26.0, 24.0, 37.0, 31.0, 25.0, 27.0, 16.0, 13.0, 16.0, 11.0, 12.0, 8.0, 7.0, 5.0, 11.0, 5.0, 1.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0], "bins": [-1.0693359375, -1.0385665893554688, -1.0077972412109375, -0.9770278930664062, -0.946258544921875, -0.9154891967773438, -0.8847198486328125, -0.8539505004882812, -0.82318115234375, -0.7924118041992188, -0.7616424560546875, -0.7308731079101562, -0.700103759765625, -0.6693344116210938, -0.6385650634765625, -0.6077957153320312, -0.5770263671875, -0.5462570190429688, -0.5154876708984375, -0.48471832275390625, -0.453948974609375, -0.42317962646484375, -0.3924102783203125, -0.36164093017578125, -0.33087158203125, -0.30010223388671875, -0.2693328857421875, -0.23856353759765625, -0.207794189453125, -0.17702484130859375, -0.1462554931640625, -0.11548614501953125, -0.084716796875, -0.05394744873046875, -0.0231781005859375, 0.00759124755859375, 0.038360595703125, 0.06912994384765625, 0.0998992919921875, 0.13066864013671875, 0.16143798828125, 0.19220733642578125, 0.2229766845703125, 0.25374603271484375, 0.284515380859375, 0.31528472900390625, 0.3460540771484375, 0.37682342529296875, 0.4075927734375, 0.43836212158203125, 0.4691314697265625, 0.49990081787109375, 0.530670166015625, 0.5614395141601562, 0.5922088623046875, 0.6229782104492188, 0.65374755859375, 0.6845169067382812, 0.7152862548828125, 0.7460556030273438, 0.776824951171875, 0.8075942993164062, 0.8383636474609375, 0.8691329956054688, 0.89990234375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 5.0, 8.0, 9.0, 24.0, 31.0, 40.0, 76.0, 119.0, 164.0, 250.0, 341.0, 457.0, 699.0, 966.0, 1372.0, 1898.0, 2797.0, 3862.0, 5617.0, 7950.0, 11622.0, 17324.0, 25612.0, 38688.0, 60277.0, 101850.0, 205014.0, 1302357.0, 113214.0, 65740.0, 41555.0, 27662.0, 18295.0, 12567.0, 8662.0, 5941.0, 4074.0, 3000.0, 2061.0, 1578.0, 1004.0, 737.0, 517.0, 390.0, 228.0, 179.0, 113.0, 81.0, 39.0, 26.0, 18.0, 15.0, 9.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0291290283203125, -0.02819204330444336, -0.02725505828857422, -0.026318073272705078, -0.025381088256835938, -0.024444103240966797, -0.023507118225097656, -0.022570133209228516, -0.021633148193359375, -0.020696163177490234, -0.019759178161621094, -0.018822193145751953, -0.017885208129882812, -0.016948223114013672, -0.01601123809814453, -0.01507425308227539, -0.01413726806640625, -0.01320028305053711, -0.012263298034667969, -0.011326313018798828, -0.010389328002929688, -0.009452342987060547, -0.008515357971191406, -0.007578372955322266, -0.006641387939453125, -0.005704402923583984, -0.004767417907714844, -0.003830432891845703, -0.0028934478759765625, -0.001956462860107422, -0.0010194778442382812, -8.249282836914062e-05, 0.0008544921875, 0.0017914772033691406, 0.0027284622192382812, 0.003665447235107422, 0.0046024322509765625, 0.005539417266845703, 0.006476402282714844, 0.007413387298583984, 0.008350372314453125, 0.009287357330322266, 0.010224342346191406, 0.011161327362060547, 0.012098312377929688, 0.013035297393798828, 0.013972282409667969, 0.01490926742553711, 0.01584625244140625, 0.01678323745727539, 0.01772022247314453, 0.018657207489013672, 0.019594192504882812, 0.020531177520751953, 0.021468162536621094, 0.022405147552490234, 0.023342132568359375, 0.024279117584228516, 0.025216102600097656, 0.026153087615966797, 0.027090072631835938, 0.028027057647705078, 0.02896404266357422, 0.02990102767944336, 0.0308380126953125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 8.0, 0.0, 30.0, 0.0, 35.0, 0.0, 0.0, 108.0, 0.0, 635.0, 0.0, 105.0, 0.0, 0.0, 26.0, 0.0, 19.0, 0.0, 0.0, 11.0, 0.0, 5.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-8.940696716308594e-07, -8.689239621162415e-07, -8.437782526016235e-07, -8.186325430870056e-07, -7.934868335723877e-07, -7.683411240577698e-07, -7.431954145431519e-07, -7.180497050285339e-07, -6.92903995513916e-07, -6.677582859992981e-07, -6.426125764846802e-07, -6.174668669700623e-07, -5.923211574554443e-07, -5.671754479408264e-07, -5.420297384262085e-07, -5.168840289115906e-07, -4.917383193969727e-07, -4.6659260988235474e-07, -4.414469003677368e-07, -4.163011908531189e-07, -3.91155481338501e-07, -3.6600977182388306e-07, -3.4086406230926514e-07, -3.157183527946472e-07, -2.905726432800293e-07, -2.654269337654114e-07, -2.4028122425079346e-07, -2.1513551473617554e-07, -1.8998980522155762e-07, -1.648440957069397e-07, -1.3969838619232178e-07, -1.1455267667770386e-07, -8.940696716308594e-08, -6.426125764846802e-08, -3.91155481338501e-08, -1.3969838619232178e-08, 1.1175870895385742e-08, 3.632158041000366e-08, 6.146728992462158e-08, 8.66129994392395e-08, 1.1175870895385742e-07, 1.3690441846847534e-07, 1.6205012798309326e-07, 1.8719583749771118e-07, 2.123415470123291e-07, 2.3748725652694702e-07, 2.6263296604156494e-07, 2.8777867555618286e-07, 3.129243850708008e-07, 3.380700945854187e-07, 3.632158041000366e-07, 3.8836151361465454e-07, 4.1350722312927246e-07, 4.386529326438904e-07, 4.637986421585083e-07, 4.889443516731262e-07, 5.140900611877441e-07, 5.392357707023621e-07, 5.6438148021698e-07, 5.895271897315979e-07, 6.146728992462158e-07, 6.398186087608337e-07, 6.649643182754517e-07, 6.901100277900696e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 11.0, 5.0, 4.0, 5.0, 10.0, 15.0, 8.0, 21.0, 21.0, 56.0, 35.0, 98.0, 88.0, 476.0, 4928.0, 883851.0, 156435.0, 1773.0, 370.0, 71.0, 72.0, 21.0, 56.0, 11.0, 22.0, 17.0, 18.0, 7.0, 2.0, 11.0, 6.0, 5.0, 3.0, 2.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.3470649719238281e-05, -1.3084150850772858e-05, -1.2697651982307434e-05, -1.231115311384201e-05, -1.1924654245376587e-05, -1.1538155376911163e-05, -1.115165650844574e-05, -1.0765157639980316e-05, -1.0378658771514893e-05, -9.992159903049469e-06, -9.605661034584045e-06, -9.219162166118622e-06, -8.832663297653198e-06, -8.446164429187775e-06, -8.059665560722351e-06, -7.673166692256927e-06, -7.286667823791504e-06, -6.90016895532608e-06, -6.513670086860657e-06, -6.127171218395233e-06, -5.7406723499298096e-06, -5.354173481464386e-06, -4.967674612998962e-06, -4.581175744533539e-06, -4.194676876068115e-06, -3.8081780076026917e-06, -3.421679139137268e-06, -3.0351802706718445e-06, -2.648681402206421e-06, -2.2621825337409973e-06, -1.8756836652755737e-06, -1.4891847968101501e-06, -1.1026859283447266e-06, -7.16187059879303e-07, -3.296881914138794e-07, 5.681067705154419e-08, 4.4330954551696777e-07, 8.298084139823914e-07, 1.216307282447815e-06, 1.6028061509132385e-06, 1.989305019378662e-06, 2.3758038878440857e-06, 2.7623027563095093e-06, 3.148801624774933e-06, 3.5353004932403564e-06, 3.92179936170578e-06, 4.308298230171204e-06, 4.694797098636627e-06, 5.081295967102051e-06, 5.467794835567474e-06, 5.854293704032898e-06, 6.2407925724983215e-06, 6.627291440963745e-06, 7.013790309429169e-06, 7.400289177894592e-06, 7.786788046360016e-06, 8.17328691482544e-06, 8.559785783290863e-06, 8.946284651756287e-06, 9.33278352022171e-06, 9.719282388687134e-06, 1.0105781257152557e-05, 1.0492280125617981e-05, 1.0878778994083405e-05, 1.1265277862548828e-05]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 1.0, 4.0, 2.0, 6.0, 932.0, 6.0, 3.0, 6.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7114422234953963e-07, -1.6711740613573056e-07, -1.6309057571106678e-07, -1.590637594972577e-07, -1.5503694328344864e-07, -1.5101011285878485e-07, -1.4698329664497578e-07, -1.429564804311667e-07, -1.3892965000650292e-07, -1.3490283379269385e-07, -1.3087600336803007e-07, -1.26849187154221e-07, -1.2282237094041193e-07, -1.1879554051574814e-07, -1.1476872430193907e-07, -1.1074190098270265e-07, -1.0671508476889358e-07, -1.0268826144965715e-07, -9.866144523584808e-08, -9.463462191661165e-08, -9.060779859737522e-08, -8.658098238356615e-08, -8.255415906432972e-08, -7.85273357450933e-08, -7.450051953128423e-08, -7.04736962120478e-08, -6.644687999823873e-08, -6.24200566790023e-08, -5.839323335976587e-08, -5.4366413593243124e-08, -5.0339593826720375e-08, -4.631277050748395e-08, -4.228594718824752e-08, -3.825912742172477e-08, -3.423230410248834e-08, -3.0205484335965593e-08, -2.6178662793086005e-08, -2.2151841250206417e-08, -1.8125021483683668e-08, -1.409819994080408e-08, -1.0071378397924491e-08, -6.044557299134112e-09, -2.017736200343734e-09, 2.009084454357435e-09, 6.035905997237023e-09, 1.0062727540116612e-08, 1.408954730663936e-08, 1.811636884951895e-08, 2.2143190392398537e-08, 2.6170011935278126e-08, 3.0196833478157714e-08, 3.422365324468046e-08, 3.825047656391689e-08, 4.227729633043964e-08, 4.630411609696239e-08, 5.0330939416198817e-08, 5.4357759182721566e-08, 5.8384578949244315e-08, 6.241140226848074e-08, 6.643821848228981e-08, 7.046504180152624e-08, 7.449186512076267e-08, 7.851868133457174e-08, 8.254550465380817e-08, 8.65723279730446e-08]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 934.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7881393432617188e-07, -1.7415732145309448e-07, -1.695007085800171e-07, -1.648440957069397e-07, -1.601874828338623e-07, -1.555308699607849e-07, -1.5087425708770752e-07, -1.4621764421463013e-07, -1.4156103134155273e-07, -1.3690441846847534e-07, -1.3224780559539795e-07, -1.2759119272232056e-07, -1.2293457984924316e-07, -1.1827796697616577e-07, -1.1362135410308838e-07, -1.0896474123001099e-07, -1.043081283569336e-07, -9.96515154838562e-08, -9.499490261077881e-08, -9.033828973770142e-08, -8.568167686462402e-08, -8.102506399154663e-08, -7.636845111846924e-08, -7.171183824539185e-08, -6.705522537231445e-08, -6.239861249923706e-08, -5.774199962615967e-08, -5.3085386753082275e-08, -4.842877388000488e-08, -4.377216100692749e-08, -3.91155481338501e-08, -3.4458935260772705e-08, -2.9802322387695312e-08, -2.514570951461792e-08, -2.0489096641540527e-08, -1.5832483768463135e-08, -1.1175870895385742e-08, -6.51925802230835e-09, -1.862645149230957e-09, 2.7939677238464355e-09, 7.450580596923828e-09, 1.210719347000122e-08, 1.6763806343078613e-08, 2.1420419216156006e-08, 2.60770320892334e-08, 3.073364496231079e-08, 3.5390257835388184e-08, 4.0046870708465576e-08, 4.470348358154297e-08, 4.936009645462036e-08, 5.4016709327697754e-08, 5.8673322200775146e-08, 6.332993507385254e-08, 6.798654794692993e-08, 7.264316082000732e-08, 7.729977369308472e-08, 8.195638656616211e-08, 8.66129994392395e-08, 9.12696123123169e-08, 9.592622518539429e-08, 1.0058283805847168e-07, 1.0523945093154907e-07, 1.0989606380462646e-07, 1.1455267667770386e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 5.0, 1.0, 5.0, 8.0, 9.0, 7.0, 10.0, 16.0, 16.0, 18.0, 17.0, 18.0, 15.0, 20.0, 24.0, 22.0, 30.0, 37.0, 41.0, 31.0, 34.0, 42.0, 45.0, 50.0, 41.0, 31.0, 36.0, 37.0, 32.0, 37.0, 37.0, 22.0, 30.0, 23.0, 20.0, 25.0, 16.0, 26.0, 10.0, 11.0, 12.0, 7.0, 11.0, 6.0, 3.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2446746826171875, -1.201263427734375, -1.1578521728515625, -1.11444091796875, -1.0710296630859375, -1.027618408203125, -0.9842071533203125, -0.9407958984375, -0.8973846435546875, -0.853973388671875, -0.8105621337890625, -0.76715087890625, -0.7237396240234375, -0.680328369140625, -0.6369171142578125, -0.593505859375, -0.5500946044921875, -0.506683349609375, -0.4632720947265625, -0.41986083984375, -0.3764495849609375, -0.333038330078125, -0.2896270751953125, -0.2462158203125, -0.2028045654296875, -0.159393310546875, -0.1159820556640625, -0.07257080078125, -0.0291595458984375, 0.014251708984375, 0.0576629638671875, 0.10107421875, 0.1444854736328125, 0.187896728515625, 0.2313079833984375, 0.27471923828125, 0.3181304931640625, 0.361541748046875, 0.4049530029296875, 0.4483642578125, 0.4917755126953125, 0.535186767578125, 0.5785980224609375, 0.62200927734375, 0.6654205322265625, 0.708831787109375, 0.7522430419921875, 0.795654296875, 0.8390655517578125, 0.882476806640625, 0.9258880615234375, 0.96929931640625, 1.0127105712890625, 1.056121826171875, 1.0995330810546875, 1.1429443359375, 1.1863555908203125, 1.229766845703125, 1.2731781005859375, 1.31658935546875, 1.3600006103515625, 1.403411865234375, 1.4468231201171875, 1.490234375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 7.0, 6.0, 14.0, 15.0, 24.0, 43.0, 69.0, 93.0, 146.0, 244.0, 358.0, 647.0, 1109.0, 1964.0, 3412.0, 6215.0, 12404.0, 25841.0, 64211.0, 194502.0, 476833.0, 159175.0, 54290.0, 22751.0, 11000.0, 5728.0, 3120.0, 1788.0, 1024.0, 574.0, 368.0, 204.0, 128.0, 89.0, 63.0, 39.0, 26.0, 9.0, 19.0, 8.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.53125, -2.45068359375, -2.3701171875, -2.28955078125, -2.208984375, -2.12841796875, -2.0478515625, -1.96728515625, -1.88671875, -1.80615234375, -1.7255859375, -1.64501953125, -1.564453125, -1.48388671875, -1.4033203125, -1.32275390625, -1.2421875, -1.16162109375, -1.0810546875, -1.00048828125, -0.919921875, -0.83935546875, -0.7587890625, -0.67822265625, -0.59765625, -0.51708984375, -0.4365234375, -0.35595703125, -0.275390625, -0.19482421875, -0.1142578125, -0.03369140625, 0.046875, 0.12744140625, 0.2080078125, 0.28857421875, 0.369140625, 0.44970703125, 0.5302734375, 0.61083984375, 0.69140625, 0.77197265625, 0.8525390625, 0.93310546875, 1.013671875, 1.09423828125, 1.1748046875, 1.25537109375, 1.3359375, 1.41650390625, 1.4970703125, 1.57763671875, 1.658203125, 1.73876953125, 1.8193359375, 1.89990234375, 1.98046875, 2.06103515625, 2.1416015625, 2.22216796875, 2.302734375, 2.38330078125, 2.4638671875, 2.54443359375, 2.625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 9.0, 9.0, 7.0, 5.0, 7.0, 21.0, 21.0, 36.0, 31.0, 32.0, 36.0, 34.0, 50.0, 62.0, 93.0, 181.0, 1555.0, 258.0, 116.0, 77.0, 59.0, 67.0, 42.0, 49.0, 40.0, 20.0, 21.0, 16.0, 22.0, 10.0, 18.0, 7.0, 11.0, 8.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.9095458984375, -5.729248046875, -5.5489501953125, -5.36865234375, -5.1883544921875, -5.008056640625, -4.8277587890625, -4.6474609375, -4.4671630859375, -4.286865234375, -4.1065673828125, -3.92626953125, -3.7459716796875, -3.565673828125, -3.3853759765625, -3.205078125, -3.0247802734375, -2.844482421875, -2.6641845703125, -2.48388671875, -2.3035888671875, -2.123291015625, -1.9429931640625, -1.7626953125, -1.5823974609375, -1.402099609375, -1.2218017578125, -1.04150390625, -0.8612060546875, -0.680908203125, -0.5006103515625, -0.3203125, -0.1400146484375, 0.040283203125, 0.2205810546875, 0.40087890625, 0.5811767578125, 0.761474609375, 0.9417724609375, 1.1220703125, 1.3023681640625, 1.482666015625, 1.6629638671875, 1.84326171875, 2.0235595703125, 2.203857421875, 2.3841552734375, 2.564453125, 2.7447509765625, 2.925048828125, 3.1053466796875, 3.28564453125, 3.4659423828125, 3.646240234375, 3.8265380859375, 4.0068359375, 4.1871337890625, 4.367431640625, 4.5477294921875, 4.72802734375, 4.9083251953125, 5.088623046875, 5.2689208984375, 5.44921875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 9.0, 6.0, 13.0, 16.0, 16.0, 29.0, 22.0, 45.0, 69.0, 89.0, 152.0, 329.0, 735.0, 2607.0, 18968.0, 462975.0, 2606537.0, 46316.0, 4714.0, 1088.0, 393.0, 195.0, 120.0, 68.0, 54.0, 35.0, 24.0, 17.0, 13.0, 13.0, 5.0, 4.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.296875, -8.978271484375, -8.65966796875, -8.341064453125, -8.0224609375, -7.703857421875, -7.38525390625, -7.066650390625, -6.748046875, -6.429443359375, -6.11083984375, -5.792236328125, -5.4736328125, -5.155029296875, -4.83642578125, -4.517822265625, -4.19921875, -3.880615234375, -3.56201171875, -3.243408203125, -2.9248046875, -2.606201171875, -2.28759765625, -1.968994140625, -1.650390625, -1.331787109375, -1.01318359375, -0.694580078125, -0.3759765625, -0.057373046875, 0.26123046875, 0.579833984375, 0.8984375, 1.217041015625, 1.53564453125, 1.854248046875, 2.1728515625, 2.491455078125, 2.81005859375, 3.128662109375, 3.447265625, 3.765869140625, 4.08447265625, 4.403076171875, 4.7216796875, 5.040283203125, 5.35888671875, 5.677490234375, 5.99609375, 6.314697265625, 6.63330078125, 6.951904296875, 7.2705078125, 7.589111328125, 7.90771484375, 8.226318359375, 8.544921875, 8.863525390625, 9.18212890625, 9.500732421875, 9.8193359375, 10.137939453125, 10.45654296875, 10.775146484375, 11.09375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 17.0, 102.0, 300.0, 348.0, 201.0, 38.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-54.88368606567383, -53.8116569519043, -52.739627838134766, -51.667598724365234, -50.5955696105957, -49.52354049682617, -48.45151138305664, -47.379478454589844, -46.30744934082031, -45.23542022705078, -44.16339111328125, -43.09136199951172, -42.01933288574219, -40.947303771972656, -39.875274658203125, -38.803245544433594, -37.73121643066406, -36.65918731689453, -35.587158203125, -34.51512908935547, -33.44309997558594, -32.371070861816406, -31.299039840698242, -30.22701072692871, -29.15498161315918, -28.08295249938965, -27.010923385620117, -25.938894271850586, -24.866863250732422, -23.79483413696289, -22.72280502319336, -21.650775909423828, -20.57874298095703, -19.5067138671875, -18.43468475341797, -17.362655639648438, -16.290626525878906, -15.218596458435059, -14.146566390991211, -13.07453727722168, -12.002509117126465, -10.930480003356934, -9.858449935913086, -8.786420822143555, -7.714391708374023, -6.642362594604492, -5.570333003997803, -4.498303413391113, -3.426274299621582, -2.3542449474334717, -1.2822155952453613, -0.21018624305725098, 0.8618431091308594, 1.9338722229003906, 3.00590181350708, 4.0779314041137695, 5.149960517883301, 6.221989631652832, 7.2940192222595215, 8.366048812866211, 9.438077926635742, 10.510107040405273, 11.582136154174805, 12.654166221618652, 13.726195335388184]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 5.0, 6.0, 4.0, 5.0, 11.0, 9.0, 14.0, 20.0, 27.0, 14.0, 25.0, 20.0, 22.0, 29.0, 26.0, 25.0, 34.0, 36.0, 38.0, 42.0, 47.0, 44.0, 38.0, 42.0, 33.0, 37.0, 36.0, 41.0, 38.0, 29.0, 26.0, 12.0, 23.0, 17.0, 26.0, 23.0, 16.0, 11.0, 12.0, 12.0, 7.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-17.735549926757812, -17.222135543823242, -16.708721160888672, -16.19530487060547, -15.681890487670898, -15.168476104736328, -14.655061721801758, -14.141646385192871, -13.628231048583984, -13.114816665649414, -12.601401329040527, -12.087986946105957, -11.57457160949707, -11.0611572265625, -10.54774284362793, -10.034327507019043, -9.520913124084473, -9.007498741149902, -8.494083404541016, -7.980669021606445, -7.467253684997559, -6.953839302062988, -6.44042444229126, -5.927009582519531, -5.413594722747803, -4.900179862976074, -4.386765003204346, -3.8733503818511963, -3.3599355220794678, -2.8465206623077393, -2.33310604095459, -1.8196911811828613, -1.3062763214111328, -0.7928615212440491, -0.27944672107696533, 0.23396801948547363, 0.7473828792572021, 1.2607977390289307, 1.77421236038208, 2.2876272201538086, 2.801042079925537, 3.3144569396972656, 3.827871799468994, 4.341286659240723, 4.854701042175293, 5.36811637878418, 5.88153076171875, 6.3949456214904785, 6.908360481262207, 7.4217753410339355, 7.935190200805664, 8.448604583740234, 8.962019920349121, 9.475434303283691, 9.988849639892578, 10.502264022827148, 11.015678405761719, 11.529092788696289, 12.042508125305176, 12.555922508239746, 13.069337844848633, 13.582752227783203, 14.096166610717773, 14.60958194732666, 15.122997283935547]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 6.0, 11.0, 11.0, 17.0, 16.0, 15.0, 18.0, 18.0, 16.0, 17.0, 24.0, 25.0, 29.0, 36.0, 35.0, 34.0, 33.0, 39.0, 46.0, 49.0, 47.0, 31.0, 43.0, 24.0, 30.0, 47.0, 27.0, 31.0, 33.0, 21.0, 17.0, 28.0, 25.0, 15.0, 18.0, 5.0, 12.0, 10.0, 9.0, 3.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.283203125, -1.2386016845703125, -1.194000244140625, -1.1493988037109375, -1.10479736328125, -1.0601959228515625, -1.015594482421875, -0.9709930419921875, -0.9263916015625, -0.8817901611328125, -0.837188720703125, -0.7925872802734375, -0.74798583984375, -0.7033843994140625, -0.658782958984375, -0.6141815185546875, -0.569580078125, -0.5249786376953125, -0.480377197265625, -0.4357757568359375, -0.39117431640625, -0.3465728759765625, -0.301971435546875, -0.2573699951171875, -0.2127685546875, -0.1681671142578125, -0.123565673828125, -0.0789642333984375, -0.03436279296875, 0.0102386474609375, 0.054840087890625, 0.0994415283203125, 0.14404296875, 0.1886444091796875, 0.233245849609375, 0.2778472900390625, 0.32244873046875, 0.3670501708984375, 0.411651611328125, 0.4562530517578125, 0.5008544921875, 0.5454559326171875, 0.590057373046875, 0.6346588134765625, 0.67926025390625, 0.7238616943359375, 0.768463134765625, 0.8130645751953125, 0.857666015625, 0.9022674560546875, 0.946868896484375, 0.9914703369140625, 1.03607177734375, 1.0806732177734375, 1.125274658203125, 1.1698760986328125, 1.2144775390625, 1.2590789794921875, 1.303680419921875, 1.3482818603515625, 1.39288330078125, 1.4374847412109375, 1.482086181640625, 1.5266876220703125, 1.5712890625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 5.0, 10.0, 11.0, 11.0, 18.0, 24.0, 28.0, 28.0, 41.0, 34.0, 55.0, 93.0, 105.0, 161.0, 325.0, 610.0, 1527.0, 4838.0, 21829.0, 138991.0, 1233791.0, 2429474.0, 307142.0, 42762.0, 8086.0, 2251.0, 836.0, 428.0, 230.0, 138.0, 95.0, 59.0, 50.0, 47.0, 36.0, 23.0, 27.0, 7.0, 18.0, 10.0, 10.0, 7.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.87890625, -5.7017822265625, -5.524658203125, -5.3475341796875, -5.17041015625, -4.9932861328125, -4.816162109375, -4.6390380859375, -4.4619140625, -4.2847900390625, -4.107666015625, -3.9305419921875, -3.75341796875, -3.5762939453125, -3.399169921875, -3.2220458984375, -3.044921875, -2.8677978515625, -2.690673828125, -2.5135498046875, -2.33642578125, -2.1593017578125, -1.982177734375, -1.8050537109375, -1.6279296875, -1.4508056640625, -1.273681640625, -1.0965576171875, -0.91943359375, -0.7423095703125, -0.565185546875, -0.3880615234375, -0.2109375, -0.0338134765625, 0.143310546875, 0.3204345703125, 0.49755859375, 0.6746826171875, 0.851806640625, 1.0289306640625, 1.2060546875, 1.3831787109375, 1.560302734375, 1.7374267578125, 1.91455078125, 2.0916748046875, 2.268798828125, 2.4459228515625, 2.623046875, 2.8001708984375, 2.977294921875, 3.1544189453125, 3.33154296875, 3.5086669921875, 3.685791015625, 3.8629150390625, 4.0400390625, 4.2171630859375, 4.394287109375, 4.5714111328125, 4.74853515625, 4.9256591796875, 5.102783203125, 5.2799072265625, 5.45703125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 6.0, 1.0, 3.0, 10.0, 6.0, 10.0, 12.0, 26.0, 35.0, 43.0, 62.0, 105.0, 160.0, 198.0, 285.0, 428.0, 515.0, 515.0, 490.0, 360.0, 258.0, 158.0, 123.0, 85.0, 56.0, 34.0, 28.0, 17.0, 14.0, 8.0, 9.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.0777587890625, -3.909423828125, -3.7410888671875, -3.57275390625, -3.4044189453125, -3.236083984375, -3.0677490234375, -2.8994140625, -2.7310791015625, -2.562744140625, -2.3944091796875, -2.22607421875, -2.0577392578125, -1.889404296875, -1.7210693359375, -1.552734375, -1.3843994140625, -1.216064453125, -1.0477294921875, -0.87939453125, -0.7110595703125, -0.542724609375, -0.3743896484375, -0.2060546875, -0.0377197265625, 0.130615234375, 0.2989501953125, 0.46728515625, 0.6356201171875, 0.803955078125, 0.9722900390625, 1.140625, 1.3089599609375, 1.477294921875, 1.6456298828125, 1.81396484375, 1.9822998046875, 2.150634765625, 2.3189697265625, 2.4873046875, 2.6556396484375, 2.823974609375, 2.9923095703125, 3.16064453125, 3.3289794921875, 3.497314453125, 3.6656494140625, 3.833984375, 4.0023193359375, 4.170654296875, 4.3389892578125, 4.50732421875, 4.6756591796875, 4.843994140625, 5.0123291015625, 5.1806640625, 5.3489990234375, 5.517333984375, 5.6856689453125, 5.85400390625, 6.0223388671875, 6.190673828125, 6.3590087890625, 6.52734375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 20.0, 14.0, 33.0, 59.0, 114.0, 187.0, 399.0, 874.0, 2260.0, 7340.0, 47402.0, 545901.0, 2930673.0, 595923.0, 51098.0, 7936.0, 2189.0, 929.0, 426.0, 197.0, 114.0, 71.0, 27.0, 25.0, 14.0, 13.0, 5.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.28125, -12.92724609375, -12.5732421875, -12.21923828125, -11.865234375, -11.51123046875, -11.1572265625, -10.80322265625, -10.44921875, -10.09521484375, -9.7412109375, -9.38720703125, -9.033203125, -8.67919921875, -8.3251953125, -7.97119140625, -7.6171875, -7.26318359375, -6.9091796875, -6.55517578125, -6.201171875, -5.84716796875, -5.4931640625, -5.13916015625, -4.78515625, -4.43115234375, -4.0771484375, -3.72314453125, -3.369140625, -3.01513671875, -2.6611328125, -2.30712890625, -1.953125, -1.59912109375, -1.2451171875, -0.89111328125, -0.537109375, -0.18310546875, 0.1708984375, 0.52490234375, 0.87890625, 1.23291015625, 1.5869140625, 1.94091796875, 2.294921875, 2.64892578125, 3.0029296875, 3.35693359375, 3.7109375, 4.06494140625, 4.4189453125, 4.77294921875, 5.126953125, 5.48095703125, 5.8349609375, 6.18896484375, 6.54296875, 6.89697265625, 7.2509765625, 7.60498046875, 7.958984375, 8.31298828125, 8.6669921875, 9.02099609375, 9.375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 29.0, 60.0, 116.0, 172.0, 195.0, 195.0, 127.0, 66.0, 35.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.501319885253906, -18.86980438232422, -17.23828887939453, -15.606772422790527, -13.97525691986084, -12.343741416931152, -10.712224960327148, -9.080709457397461, -7.449193954467773, -5.817678451538086, -4.18616247177124, -2.5546464920043945, -0.923130989074707, 0.7083845138549805, 2.3399009704589844, 3.971416473388672, 5.602931976318359, 7.234447479248047, 8.865962982177734, 10.497479438781738, 12.128994941711426, 13.760510444641113, 15.392026901245117, 17.023542404174805, 18.655057907104492, 20.28657341003418, 21.918088912963867, 23.549606323242188, 25.181121826171875, 26.812637329101562, 28.44415283203125, 30.075668334960938, 31.707183837890625, 33.33869934082031, 34.97021484375, 36.60173034667969, 38.233245849609375, 39.86476135253906, 41.49627685546875, 43.12779235839844, 44.759307861328125, 46.39082336425781, 48.0223388671875, 49.65385437011719, 51.285369873046875, 52.91688537597656, 54.54840087890625, 56.17991638183594, 57.81143569946289, 59.44295120239258, 61.074466705322266, 62.70598220825195, 64.3375015258789, 65.9690170288086, 67.60053253173828, 69.23204803466797, 70.86356353759766, 72.49507904052734, 74.12659454345703, 75.75811004638672, 77.3896255493164, 79.0211410522461, 80.65265655517578, 82.28417205810547, 83.91568756103516]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 5.0, 4.0, 6.0, 9.0, 12.0, 10.0, 18.0, 18.0, 15.0, 31.0, 33.0, 39.0, 32.0, 43.0, 34.0, 43.0, 36.0, 57.0, 51.0, 36.0, 43.0, 55.0, 46.0, 47.0, 42.0, 50.0, 33.0, 23.0, 25.0, 18.0, 19.0, 14.0, 14.0, 15.0, 5.0, 12.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.6761474609375, -19.113943099975586, -18.551738739013672, -17.98953628540039, -17.427331924438477, -16.865127563476562, -16.30292320251465, -15.74071979522705, -15.178516387939453, -14.616312026977539, -14.054108619689941, -13.491904258728027, -12.92970085144043, -12.367496490478516, -11.805292129516602, -11.243088722229004, -10.68088436126709, -10.118680000305176, -9.556476593017578, -8.994272232055664, -8.432068824768066, -7.869864463806152, -7.3076605796813965, -6.745456695556641, -6.183252811431885, -5.621048927307129, -5.058845043182373, -4.496641159057617, -3.9344370365142822, -3.3722331523895264, -2.8100290298461914, -2.2478251457214355, -1.6856212615966797, -1.1234173774719238, -0.5612133741378784, 0.0009906291961669922, 0.5631945133209229, 1.1253983974456787, 1.6876025199890137, 2.2498064041137695, 2.8120102882385254, 3.3742141723632812, 3.936418056488037, 4.498621940612793, 5.060826301574707, 5.623029708862305, 6.185234069824219, 6.747437953948975, 7.3096418380737305, 7.871845722198486, 8.434049606323242, 8.996253967285156, 9.558457374572754, 10.120661735534668, 10.682865142822266, 11.24506950378418, 11.807273864746094, 12.369478225708008, 12.931681632995605, 13.49388599395752, 14.056089401245117, 14.618293762207031, 15.180498123168945, 15.742701530456543, 16.30490493774414]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 6.0, 10.0, 12.0, 13.0, 10.0, 10.0, 8.0, 22.0, 21.0, 23.0, 23.0, 32.0, 19.0, 37.0, 27.0, 42.0, 42.0, 35.0, 49.0, 42.0, 34.0, 50.0, 32.0, 32.0, 45.0, 40.0, 32.0, 36.0, 25.0, 32.0, 27.0, 23.0, 19.0, 20.0, 12.0, 11.0, 9.0, 11.0, 6.0, 8.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4814453125, -1.43408203125, -1.38671875, -1.33935546875, -1.2919921875, -1.24462890625, -1.197265625, -1.14990234375, -1.1025390625, -1.05517578125, -1.0078125, -0.96044921875, -0.9130859375, -0.86572265625, -0.818359375, -0.77099609375, -0.7236328125, -0.67626953125, -0.62890625, -0.58154296875, -0.5341796875, -0.48681640625, -0.439453125, -0.39208984375, -0.3447265625, -0.29736328125, -0.25, -0.20263671875, -0.1552734375, -0.10791015625, -0.060546875, -0.01318359375, 0.0341796875, 0.08154296875, 0.12890625, 0.17626953125, 0.2236328125, 0.27099609375, 0.318359375, 0.36572265625, 0.4130859375, 0.46044921875, 0.5078125, 0.55517578125, 0.6025390625, 0.64990234375, 0.697265625, 0.74462890625, 0.7919921875, 0.83935546875, 0.88671875, 0.93408203125, 0.9814453125, 1.02880859375, 1.076171875, 1.12353515625, 1.1708984375, 1.21826171875, 1.265625, 1.31298828125, 1.3603515625, 1.40771484375, 1.455078125, 1.50244140625, 1.5498046875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 11.0, 21.0, 35.0, 44.0, 48.0, 106.0, 152.0, 182.0, 320.0, 429.0, 634.0, 903.0, 1419.0, 2168.0, 3210.0, 4762.0, 7137.0, 11067.0, 16886.0, 26647.0, 42740.0, 71202.0, 124937.0, 318715.0, 177901.0, 90630.0, 53568.0, 32721.0, 20625.0, 13295.0, 8719.0, 5739.0, 3736.0, 2652.0, 1711.0, 1153.0, 714.0, 507.0, 346.0, 220.0, 195.0, 109.0, 78.0, 47.0, 35.0, 15.0, 18.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.059967041015625, -0.05813455581665039, -0.05630207061767578, -0.05446958541870117, -0.05263710021972656, -0.05080461502075195, -0.048972129821777344, -0.047139644622802734, -0.045307159423828125, -0.043474674224853516, -0.041642189025878906, -0.0398097038269043, -0.03797721862792969, -0.03614473342895508, -0.03431224822998047, -0.03247976303100586, -0.03064727783203125, -0.02881479263305664, -0.02698230743408203, -0.025149822235107422, -0.023317337036132812, -0.021484851837158203, -0.019652366638183594, -0.017819881439208984, -0.015987396240234375, -0.014154911041259766, -0.012322425842285156, -0.010489940643310547, -0.008657455444335938, -0.006824970245361328, -0.004992485046386719, -0.0031599998474121094, -0.0013275146484375, 0.0005049705505371094, 0.0023374557495117188, 0.004169940948486328, 0.0060024261474609375, 0.007834911346435547, 0.009667396545410156, 0.011499881744384766, 0.013332366943359375, 0.015164852142333984, 0.016997337341308594, 0.018829822540283203, 0.020662307739257812, 0.022494792938232422, 0.02432727813720703, 0.02615976333618164, 0.02799224853515625, 0.02982473373413086, 0.03165721893310547, 0.03348970413208008, 0.03532218933105469, 0.0371546745300293, 0.038987159729003906, 0.040819644927978516, 0.042652130126953125, 0.044484615325927734, 0.046317100524902344, 0.04814958572387695, 0.04998207092285156, 0.05181455612182617, 0.05364704132080078, 0.05547952651977539, 0.05731201171875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 6.0, 13.0, 6.0, 15.0, 12.0, 12.0, 17.0, 18.0, 28.0, 25.0, 20.0, 29.0, 22.0, 22.0, 38.0, 45.0, 49.0, 43.0, 36.0, 1064.0, 41.0, 41.0, 34.0, 50.0, 32.0, 41.0, 30.0, 35.0, 28.0, 22.0, 17.0, 18.0, 10.0, 15.0, 13.0, 12.0, 16.0, 11.0, 12.0, 2.0, 7.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95947265625, -0.9250869750976562, -0.8907012939453125, -0.8563156127929688, -0.821929931640625, -0.7875442504882812, -0.7531585693359375, -0.7187728881835938, -0.68438720703125, -0.6500015258789062, -0.6156158447265625, -0.5812301635742188, -0.546844482421875, -0.5124588012695312, -0.4780731201171875, -0.44368743896484375, -0.4093017578125, -0.37491607666015625, -0.3405303955078125, -0.30614471435546875, -0.271759033203125, -0.23737335205078125, -0.2029876708984375, -0.16860198974609375, -0.13421630859375, -0.09983062744140625, -0.0654449462890625, -0.03105926513671875, 0.003326416015625, 0.03771209716796875, 0.0720977783203125, 0.10648345947265625, 0.140869140625, 0.17525482177734375, 0.2096405029296875, 0.24402618408203125, 0.278411865234375, 0.31279754638671875, 0.3471832275390625, 0.38156890869140625, 0.41595458984375, 0.45034027099609375, 0.4847259521484375, 0.5191116333007812, 0.553497314453125, 0.5878829956054688, 0.6222686767578125, 0.6566543579101562, 0.6910400390625, 0.7254257202148438, 0.7598114013671875, 0.7941970825195312, 0.828582763671875, 0.8629684448242188, 0.8973541259765625, 0.9317398071289062, 0.96612548828125, 1.0005111694335938, 1.0348968505859375, 1.0692825317382812, 1.103668212890625, 1.1380538940429688, 1.1724395751953125, 1.2068252563476562, 1.2412109375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 15.0, 24.0, 29.0, 45.0, 80.0, 121.0, 177.0, 266.0, 411.0, 638.0, 903.0, 1415.0, 2193.0, 3136.0, 4802.0, 7150.0, 10348.0, 15506.0, 23755.0, 37494.0, 63352.0, 117082.0, 1338607.0, 215182.0, 100321.0, 55855.0, 33641.0, 21484.0, 14361.0, 9456.0, 6399.0, 4297.0, 2902.0, 1870.0, 1309.0, 865.0, 556.0, 373.0, 240.0, 154.0, 92.0, 76.0, 43.0, 38.0, 18.0, 14.0, 14.0, 4.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0357666015625, -0.03467893600463867, -0.033591270446777344, -0.032503604888916016, -0.03141593933105469, -0.03032827377319336, -0.02924060821533203, -0.028152942657470703, -0.027065277099609375, -0.025977611541748047, -0.02488994598388672, -0.02380228042602539, -0.022714614868164062, -0.021626949310302734, -0.020539283752441406, -0.019451618194580078, -0.01836395263671875, -0.017276287078857422, -0.016188621520996094, -0.015100955963134766, -0.014013290405273438, -0.01292562484741211, -0.011837959289550781, -0.010750293731689453, -0.009662628173828125, -0.008574962615966797, -0.007487297058105469, -0.006399631500244141, -0.0053119659423828125, -0.004224300384521484, -0.0031366348266601562, -0.002048969268798828, -0.0009613037109375, 0.00012636184692382812, 0.0012140274047851562, 0.0023016929626464844, 0.0033893585205078125, 0.004477024078369141, 0.005564689636230469, 0.006652355194091797, 0.007740020751953125, 0.008827686309814453, 0.009915351867675781, 0.01100301742553711, 0.012090682983398438, 0.013178348541259766, 0.014266014099121094, 0.015353679656982422, 0.01644134521484375, 0.017529010772705078, 0.018616676330566406, 0.019704341888427734, 0.020792007446289062, 0.02187967300415039, 0.02296733856201172, 0.024055004119873047, 0.025142669677734375, 0.026230335235595703, 0.02731800079345703, 0.02840566635131836, 0.029493331909179688, 0.030580997467041016, 0.031668663024902344, 0.03275632858276367, 0.033843994140625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 8.0, 0.0, 14.0, 0.0, 0.0, 12.0, 0.0, 22.0, 0.0, 0.0, 39.0, 0.0, 93.0, 0.0, 660.0, 0.0, 0.0, 68.0, 0.0, 31.0, 0.0, 14.0, 0.0, 0.0, 11.0, 0.0, 9.0, 0.0, 0.0, 5.0, 0.0, 5.0, 0.0, 8.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.497146725654602e-07, -7.245689630508423e-07, -6.994232535362244e-07, -6.742775440216064e-07, -6.491318345069885e-07, -6.239861249923706e-07, -5.988404154777527e-07, -5.736947059631348e-07, -5.485489964485168e-07, -5.234032869338989e-07, -4.98257577419281e-07, -4.731118679046631e-07, -4.4796615839004517e-07, -4.2282044887542725e-07, -3.976747393608093e-07, -3.725290298461914e-07, -3.473833203315735e-07, -3.2223761081695557e-07, -2.9709190130233765e-07, -2.7194619178771973e-07, -2.468004822731018e-07, -2.2165477275848389e-07, -1.9650906324386597e-07, -1.7136335372924805e-07, -1.4621764421463013e-07, -1.210719347000122e-07, -9.592622518539429e-08, -7.078051567077637e-08, -4.563480615615845e-08, -2.0489096641540527e-08, 4.6566128730773926e-09, 2.9802322387695312e-08, 5.494803190231323e-08, 8.009374141693115e-08, 1.0523945093154907e-07, 1.30385160446167e-07, 1.555308699607849e-07, 1.8067657947540283e-07, 2.0582228899002075e-07, 2.3096799850463867e-07, 2.561137080192566e-07, 2.812594175338745e-07, 3.0640512704849243e-07, 3.3155083656311035e-07, 3.5669654607772827e-07, 3.818422555923462e-07, 4.069879651069641e-07, 4.3213367462158203e-07, 4.5727938413619995e-07, 4.824250936508179e-07, 5.075708031654358e-07, 5.327165126800537e-07, 5.578622221946716e-07, 5.830079317092896e-07, 6.081536412239075e-07, 6.332993507385254e-07, 6.584450602531433e-07, 6.835907697677612e-07, 7.087364792823792e-07, 7.338821887969971e-07, 7.59027898311615e-07, 7.841736078262329e-07, 8.093193173408508e-07, 8.344650268554688e-07]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 6.0, 6.0, 7.0, 4.0, 6.0, 4.0, 19.0, 9.0, 12.0, 24.0, 18.0, 20.0, 22.0, 27.0, 41.0, 70.0, 120.0, 265.0, 1235.0, 26455.0, 933804.0, 82270.0, 3215.0, 463.0, 83.0, 101.0, 43.0, 35.0, 21.0, 23.0, 23.0, 14.0, 16.0, 7.0, 5.0, 15.0, 11.0, 9.0, 7.0, 4.0, 5.0, 5.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.0907649993896484e-05, -1.0583549737930298e-05, -1.0259449481964111e-05, -9.935349225997925e-06, -9.611248970031738e-06, -9.287148714065552e-06, -8.963048458099365e-06, -8.638948202133179e-06, -8.314847946166992e-06, -7.990747690200806e-06, -7.666647434234619e-06, -7.342547178268433e-06, -7.018446922302246e-06, -6.6943466663360596e-06, -6.370246410369873e-06, -6.0461461544036865e-06, -5.7220458984375e-06, -5.3979456424713135e-06, -5.073845386505127e-06, -4.7497451305389404e-06, -4.425644874572754e-06, -4.101544618606567e-06, -3.777444362640381e-06, -3.4533441066741943e-06, -3.129243850708008e-06, -2.8051435947418213e-06, -2.4810433387756348e-06, -2.1569430828094482e-06, -1.8328428268432617e-06, -1.5087425708770752e-06, -1.1846423149108887e-06, -8.605420589447021e-07, -5.364418029785156e-07, -2.123415470123291e-07, 1.1175870895385742e-07, 4.3585896492004395e-07, 7.599592208862305e-07, 1.084059476852417e-06, 1.4081597328186035e-06, 1.73225998878479e-06, 2.0563602447509766e-06, 2.380460500717163e-06, 2.7045607566833496e-06, 3.028661012649536e-06, 3.3527612686157227e-06, 3.676861524581909e-06, 4.000961780548096e-06, 4.325062036514282e-06, 4.649162292480469e-06, 4.973262548446655e-06, 5.297362804412842e-06, 5.621463060379028e-06, 5.945563316345215e-06, 6.269663572311401e-06, 6.593763828277588e-06, 6.917864084243774e-06, 7.241964340209961e-06, 7.5660645961761475e-06, 7.890164852142334e-06, 8.21426510810852e-06, 8.538365364074707e-06, 8.862465620040894e-06, 9.18656587600708e-06, 9.510666131973267e-06, 9.834766387939453e-06]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 4.0, 0.0, 1.0, 3.0, 4.0, 960.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.201703128117515e-07, -1.1653239084807865e-07, -1.1289446177897844e-07, -1.0925653981530559e-07, -1.0561861785163273e-07, -1.0198068878253252e-07, -9.834276681885967e-08, -9.470484485518682e-08, -9.106691578608661e-08, -8.742899382241376e-08, -8.379106475331355e-08, -8.01531427896407e-08, -7.651522082596784e-08, -7.287729175686763e-08, -6.923936979319478e-08, -6.560144072409457e-08, -6.196351876042172e-08, -5.832559324403519e-08, -5.468767128036234e-08, -5.104974576397581e-08, -4.7411820247589276e-08, -4.3773894731202745e-08, -4.013597276752989e-08, -3.649804725114336e-08, -3.286012884018419e-08, -2.9222205100154497e-08, -2.5584279583767966e-08, -2.1946355843738274e-08, -1.8308430327351743e-08, -1.4670506587322052e-08, -1.103258284729236e-08, -7.3946573309058294e-09, -3.7567318145192985e-09, -1.1880740835579218e-10, 3.519116997807714e-09, 7.1570411819266155e-09, 1.0794965810134727e-08, 1.4432890438342838e-08, 1.807081417837253e-08, 2.170873969475906e-08, 2.5346663434788752e-08, 2.8984587174818444e-08, 3.2622512691204975e-08, 3.6260438207591505e-08, 3.989836017126436e-08, 4.353628568765089e-08, 4.717421120403742e-08, 5.081213316771027e-08, 5.44500586840968e-08, 5.8087984200483334e-08, 6.172590616415619e-08, 6.53638352332564e-08, 6.900175719692925e-08, 7.26396791606021e-08, 7.627760112427495e-08, 7.991553019337516e-08, 8.355345215704801e-08, 8.719137412072087e-08, 9.082930318982108e-08, 9.446722515349393e-08, 9.810514711716678e-08, 1.0174307618626699e-07, 1.0538099814993984e-07, 1.0901892721904005e-07, 1.126568491827129e-07]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 960.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 6.0, 10.0, 12.0, 13.0, 10.0, 10.0, 8.0, 22.0, 21.0, 23.0, 23.0, 32.0, 19.0, 37.0, 27.0, 42.0, 42.0, 35.0, 49.0, 42.0, 34.0, 50.0, 32.0, 32.0, 45.0, 40.0, 32.0, 36.0, 25.0, 32.0, 27.0, 23.0, 19.0, 20.0, 12.0, 11.0, 9.0, 11.0, 6.0, 8.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4814453125, -1.43408203125, -1.38671875, -1.33935546875, -1.2919921875, -1.24462890625, -1.197265625, -1.14990234375, -1.1025390625, -1.05517578125, -1.0078125, -0.96044921875, -0.9130859375, -0.86572265625, -0.818359375, -0.77099609375, -0.7236328125, -0.67626953125, -0.62890625, -0.58154296875, -0.5341796875, -0.48681640625, -0.439453125, -0.39208984375, -0.3447265625, -0.29736328125, -0.25, -0.20263671875, -0.1552734375, -0.10791015625, -0.060546875, -0.01318359375, 0.0341796875, 0.08154296875, 0.12890625, 0.17626953125, 0.2236328125, 0.27099609375, 0.318359375, 0.36572265625, 0.4130859375, 0.46044921875, 0.5078125, 0.55517578125, 0.6025390625, 0.64990234375, 0.697265625, 0.74462890625, 0.7919921875, 0.83935546875, 0.88671875, 0.93408203125, 0.9814453125, 1.02880859375, 1.076171875, 1.12353515625, 1.1708984375, 1.21826171875, 1.265625, 1.31298828125, 1.3603515625, 1.40771484375, 1.455078125, 1.50244140625, 1.5498046875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 7.0, 9.0, 15.0, 28.0, 30.0, 38.0, 49.0, 87.0, 145.0, 166.0, 262.0, 400.0, 607.0, 1061.0, 1541.0, 2446.0, 4109.0, 6926.0, 11650.0, 20730.0, 38468.0, 77977.0, 172716.0, 315083.0, 203008.0, 90613.0, 44450.0, 23185.0, 13077.0, 7461.0, 4490.0, 2779.0, 1708.0, 1064.0, 725.0, 477.0, 309.0, 207.0, 139.0, 94.0, 63.0, 43.0, 33.0, 15.0, 11.0, 17.0, 7.0, 7.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.8125, -1.7551422119140625, -1.697784423828125, -1.6404266357421875, -1.58306884765625, -1.5257110595703125, -1.468353271484375, -1.4109954833984375, -1.3536376953125, -1.2962799072265625, -1.238922119140625, -1.1815643310546875, -1.12420654296875, -1.0668487548828125, -1.009490966796875, -0.9521331787109375, -0.894775390625, -0.8374176025390625, -0.780059814453125, -0.7227020263671875, -0.66534423828125, -0.6079864501953125, -0.550628662109375, -0.4932708740234375, -0.4359130859375, -0.3785552978515625, -0.321197509765625, -0.2638397216796875, -0.20648193359375, -0.1491241455078125, -0.091766357421875, -0.0344085693359375, 0.02294921875, 0.0803070068359375, 0.137664794921875, 0.1950225830078125, 0.25238037109375, 0.3097381591796875, 0.367095947265625, 0.4244537353515625, 0.4818115234375, 0.5391693115234375, 0.596527099609375, 0.6538848876953125, 0.71124267578125, 0.7686004638671875, 0.825958251953125, 0.8833160400390625, 0.940673828125, 0.9980316162109375, 1.055389404296875, 1.1127471923828125, 1.17010498046875, 1.2274627685546875, 1.284820556640625, 1.3421783447265625, 1.3995361328125, 1.4568939208984375, 1.514251708984375, 1.5716094970703125, 1.62896728515625, 1.6863250732421875, 1.743682861328125, 1.8010406494140625, 1.8583984375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 6.0, 10.0, 11.0, 15.0, 28.0, 37.0, 37.0, 41.0, 54.0, 58.0, 74.0, 121.0, 288.0, 1618.0, 171.0, 88.0, 59.0, 73.0, 57.0, 54.0, 36.0, 30.0, 18.0, 14.0, 14.0, 7.0, 5.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.640625, -8.40240478515625, -8.1641845703125, -7.92596435546875, -7.687744140625, -7.44952392578125, -7.2113037109375, -6.97308349609375, -6.73486328125, -6.49664306640625, -6.2584228515625, -6.02020263671875, -5.781982421875, -5.54376220703125, -5.3055419921875, -5.06732177734375, -4.8291015625, -4.59088134765625, -4.3526611328125, -4.11444091796875, -3.876220703125, -3.63800048828125, -3.3997802734375, -3.16156005859375, -2.92333984375, -2.68511962890625, -2.4468994140625, -2.20867919921875, -1.970458984375, -1.73223876953125, -1.4940185546875, -1.25579833984375, -1.017578125, -0.77935791015625, -0.5411376953125, -0.30291748046875, -0.064697265625, 0.17352294921875, 0.4117431640625, 0.64996337890625, 0.88818359375, 1.12640380859375, 1.3646240234375, 1.60284423828125, 1.841064453125, 2.07928466796875, 2.3175048828125, 2.55572509765625, 2.7939453125, 3.03216552734375, 3.2703857421875, 3.50860595703125, 3.746826171875, 3.98504638671875, 4.2232666015625, 4.46148681640625, 4.69970703125, 4.93792724609375, 5.1761474609375, 5.41436767578125, 5.652587890625, 5.89080810546875, 6.1290283203125, 6.36724853515625, 6.60546875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 6.0, 2.0, 11.0, 9.0, 7.0, 22.0, 32.0, 35.0, 55.0, 80.0, 156.0, 364.0, 1128.0, 5759.0, 48052.0, 2373578.0, 685991.0, 25445.0, 3592.0, 722.0, 284.0, 132.0, 82.0, 49.0, 22.0, 32.0, 17.0, 12.0, 8.0, 8.0, 4.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390625, -8.0662841796875, -7.741943359375, -7.4176025390625, -7.09326171875, -6.7689208984375, -6.444580078125, -6.1202392578125, -5.7958984375, -5.4715576171875, -5.147216796875, -4.8228759765625, -4.49853515625, -4.1741943359375, -3.849853515625, -3.5255126953125, -3.201171875, -2.8768310546875, -2.552490234375, -2.2281494140625, -1.90380859375, -1.5794677734375, -1.255126953125, -0.9307861328125, -0.6064453125, -0.2821044921875, 0.042236328125, 0.3665771484375, 0.69091796875, 1.0152587890625, 1.339599609375, 1.6639404296875, 1.98828125, 2.3126220703125, 2.636962890625, 2.9613037109375, 3.28564453125, 3.6099853515625, 3.934326171875, 4.2586669921875, 4.5830078125, 4.9073486328125, 5.231689453125, 5.5560302734375, 5.88037109375, 6.2047119140625, 6.529052734375, 6.8533935546875, 7.177734375, 7.5020751953125, 7.826416015625, 8.1507568359375, 8.47509765625, 8.7994384765625, 9.123779296875, 9.4481201171875, 9.7724609375, 10.0968017578125, 10.421142578125, 10.7454833984375, 11.06982421875, 11.3941650390625, 11.718505859375, 12.0428466796875, 12.3671875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [5.0, 37.0, 331.0, 473.0, 151.0, 19.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.411599159240723, -4.450282096862793, -2.4889652729034424, -0.5276484489440918, 1.433668613433838, 3.3949851989746094, 5.356302261352539, 7.317619323730469, 9.278936386108398, 11.240253448486328, 13.201570510864258, 15.162887573242188, 17.124204635620117, 19.085521697998047, 21.046836853027344, 23.008155822753906, 24.969470977783203, 26.930788040161133, 28.892105102539062, 30.853422164916992, 32.81473922729492, 34.77605438232422, 36.73737335205078, 38.69868850708008, 40.66000747680664, 42.62132263183594, 44.5826416015625, 46.5439567565918, 48.50527572631836, 50.466590881347656, 52.42790985107422, 54.389225006103516, 56.35054397583008, 58.311859130859375, 60.27317810058594, 62.234493255615234, 64.19580841064453, 66.1571273803711, 68.11844635009766, 70.07976531982422, 72.04107666015625, 74.00239562988281, 75.96370697021484, 77.9250259399414, 79.88634490966797, 81.84766387939453, 83.80897521972656, 85.77029418945312, 87.73161315917969, 89.69293212890625, 91.65424346923828, 93.61556243896484, 95.5768814086914, 97.53820037841797, 99.49951171875, 101.46083068847656, 103.42214965820312, 105.38346862792969, 107.34477996826172, 109.30609893798828, 111.26741790771484, 113.2287368774414, 115.19004821777344, 117.1513671875, 119.11268615722656]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 6.0, 7.0, 10.0, 12.0, 11.0, 13.0, 20.0, 25.0, 14.0, 18.0, 22.0, 40.0, 37.0, 38.0, 44.0, 29.0, 53.0, 44.0, 58.0, 43.0, 43.0, 45.0, 36.0, 25.0, 36.0, 31.0, 31.0, 30.0, 25.0, 32.0, 14.0, 19.0, 19.0, 12.0, 15.0, 11.0, 7.0, 5.0, 4.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.878488540649414, -17.288463592529297, -16.698440551757812, -16.108415603637695, -15.518391609191895, -14.928367614746094, -14.338342666625977, -13.748318672180176, -13.158294677734375, -12.568270683288574, -11.978246688842773, -11.388221740722656, -10.798197746276855, -10.208173751831055, -9.618148803710938, -9.028124809265137, -8.438100814819336, -7.848076820373535, -7.258052349090576, -6.668027877807617, -6.078003883361816, -5.487979888916016, -4.897955417633057, -4.307930946350098, -3.717906951904297, -3.127882719039917, -2.537858486175537, -1.9478342533111572, -1.3578100204467773, -0.7677857875823975, -0.17776155471801758, 0.4122629165649414, 1.002288818359375, 1.5923130512237549, 2.1823372840881348, 2.7723615169525146, 3.3623857498168945, 3.9524099826812744, 4.542434215545654, 5.132458686828613, 5.722482681274414, 6.312506675720215, 6.902531147003174, 7.492555618286133, 8.082579612731934, 8.672603607177734, 9.262628555297852, 9.852652549743652, 10.442676544189453, 11.032700538635254, 11.622724533081055, 12.212749481201172, 12.802773475646973, 13.392797470092773, 13.98282241821289, 14.572846412658691, 15.162870407104492, 15.752894401550293, 16.342918395996094, 16.93294334411621, 17.522968292236328, 18.112991333007812, 18.70301628112793, 19.293041229248047, 19.88306427001953]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 11.0, 10.0, 12.0, 11.0, 8.0, 22.0, 21.0, 20.0, 27.0, 24.0, 27.0, 30.0, 31.0, 41.0, 51.0, 45.0, 34.0, 49.0, 41.0, 34.0, 37.0, 45.0, 37.0, 38.0, 34.0, 30.0, 29.0, 30.0, 24.0, 22.0, 20.0, 19.0, 13.0, 14.0, 9.0, 8.0, 5.0, 10.0, 2.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5283203125, -1.479248046875, -1.43017578125, -1.381103515625, -1.33203125, -1.282958984375, -1.23388671875, -1.184814453125, -1.1357421875, -1.086669921875, -1.03759765625, -0.988525390625, -0.939453125, -0.890380859375, -0.84130859375, -0.792236328125, -0.7431640625, -0.694091796875, -0.64501953125, -0.595947265625, -0.546875, -0.497802734375, -0.44873046875, -0.399658203125, -0.3505859375, -0.301513671875, -0.25244140625, -0.203369140625, -0.154296875, -0.105224609375, -0.05615234375, -0.007080078125, 0.0419921875, 0.091064453125, 0.14013671875, 0.189208984375, 0.23828125, 0.287353515625, 0.33642578125, 0.385498046875, 0.4345703125, 0.483642578125, 0.53271484375, 0.581787109375, 0.630859375, 0.679931640625, 0.72900390625, 0.778076171875, 0.8271484375, 0.876220703125, 0.92529296875, 0.974365234375, 1.0234375, 1.072509765625, 1.12158203125, 1.170654296875, 1.2197265625, 1.268798828125, 1.31787109375, 1.366943359375, 1.416015625, 1.465087890625, 1.51416015625, 1.563232421875, 1.6123046875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 5.0, 4.0, 15.0, 14.0, 20.0, 22.0, 43.0, 59.0, 89.0, 147.0, 213.0, 284.0, 647.0, 1194.0, 2726.0, 6595.0, 18126.0, 52425.0, 159298.0, 517650.0, 1582487.0, 1276113.0, 389440.0, 121719.0, 40566.0, 14326.0, 5406.0, 2214.0, 1058.0, 520.0, 287.0, 170.0, 101.0, 89.0, 52.0, 42.0, 23.0, 15.0, 14.0, 15.0, 8.0, 8.0, 10.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.3515625, -3.2496337890625, -3.147705078125, -3.0457763671875, -2.94384765625, -2.8419189453125, -2.739990234375, -2.6380615234375, -2.5361328125, -2.4342041015625, -2.332275390625, -2.2303466796875, -2.12841796875, -2.0264892578125, -1.924560546875, -1.8226318359375, -1.720703125, -1.6187744140625, -1.516845703125, -1.4149169921875, -1.31298828125, -1.2110595703125, -1.109130859375, -1.0072021484375, -0.9052734375, -0.8033447265625, -0.701416015625, -0.5994873046875, -0.49755859375, -0.3956298828125, -0.293701171875, -0.1917724609375, -0.08984375, 0.0120849609375, 0.114013671875, 0.2159423828125, 0.31787109375, 0.4197998046875, 0.521728515625, 0.6236572265625, 0.7255859375, 0.8275146484375, 0.929443359375, 1.0313720703125, 1.13330078125, 1.2352294921875, 1.337158203125, 1.4390869140625, 1.541015625, 1.6429443359375, 1.744873046875, 1.8468017578125, 1.94873046875, 2.0506591796875, 2.152587890625, 2.2545166015625, 2.3564453125, 2.4583740234375, 2.560302734375, 2.6622314453125, 2.76416015625, 2.8660888671875, 2.968017578125, 3.0699462890625, 3.171875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 3.0, 5.0, 7.0, 17.0, 28.0, 43.0, 53.0, 77.0, 137.0, 239.0, 311.0, 463.0, 631.0, 574.0, 510.0, 304.0, 201.0, 165.0, 114.0, 65.0, 61.0, 21.0, 15.0, 12.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.125, -8.91754150390625, -8.7100830078125, -8.50262451171875, -8.295166015625, -8.08770751953125, -7.8802490234375, -7.67279052734375, -7.46533203125, -7.25787353515625, -7.0504150390625, -6.84295654296875, -6.635498046875, -6.42803955078125, -6.2205810546875, -6.01312255859375, -5.8056640625, -5.59820556640625, -5.3907470703125, -5.18328857421875, -4.975830078125, -4.76837158203125, -4.5609130859375, -4.35345458984375, -4.14599609375, -3.93853759765625, -3.7310791015625, -3.52362060546875, -3.316162109375, -3.10870361328125, -2.9012451171875, -2.69378662109375, -2.486328125, -2.27886962890625, -2.0714111328125, -1.86395263671875, -1.656494140625, -1.44903564453125, -1.2415771484375, -1.03411865234375, -0.82666015625, -0.61920166015625, -0.4117431640625, -0.20428466796875, 0.003173828125, 0.21063232421875, 0.4180908203125, 0.62554931640625, 0.8330078125, 1.04046630859375, 1.2479248046875, 1.45538330078125, 1.662841796875, 1.87030029296875, 2.0777587890625, 2.28521728515625, 2.49267578125, 2.70013427734375, 2.9075927734375, 3.11505126953125, 3.322509765625, 3.52996826171875, 3.7374267578125, 3.94488525390625, 4.15234375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 2.0, 3.0, 8.0, 6.0, 18.0, 18.0, 39.0, 67.0, 83.0, 152.0, 275.0, 479.0, 966.0, 2158.0, 6373.0, 27254.0, 165921.0, 1086521.0, 2302544.0, 504634.0, 75638.0, 14087.0, 3915.0, 1467.0, 747.0, 385.0, 199.0, 121.0, 77.0, 60.0, 27.0, 15.0, 9.0, 4.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.27734375, -7.00054931640625, -6.7237548828125, -6.44696044921875, -6.170166015625, -5.89337158203125, -5.6165771484375, -5.33978271484375, -5.06298828125, -4.78619384765625, -4.5093994140625, -4.23260498046875, -3.955810546875, -3.67901611328125, -3.4022216796875, -3.12542724609375, -2.8486328125, -2.57183837890625, -2.2950439453125, -2.01824951171875, -1.741455078125, -1.46466064453125, -1.1878662109375, -0.91107177734375, -0.63427734375, -0.35748291015625, -0.0806884765625, 0.19610595703125, 0.472900390625, 0.74969482421875, 1.0264892578125, 1.30328369140625, 1.580078125, 1.85687255859375, 2.1336669921875, 2.41046142578125, 2.687255859375, 2.96405029296875, 3.2408447265625, 3.51763916015625, 3.79443359375, 4.07122802734375, 4.3480224609375, 4.62481689453125, 4.901611328125, 5.17840576171875, 5.4552001953125, 5.73199462890625, 6.0087890625, 6.28558349609375, 6.5623779296875, 6.83917236328125, 7.115966796875, 7.39276123046875, 7.6695556640625, 7.94635009765625, 8.22314453125, 8.49993896484375, 8.7767333984375, 9.05352783203125, 9.330322265625, 9.60711669921875, 9.8839111328125, 10.16070556640625, 10.4375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 15.0, 27.0, 41.0, 50.0, 85.0, 81.0, 109.0, 96.0, 115.0, 101.0, 76.0, 67.0, 51.0, 36.0, 24.0, 12.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.560035705566406, -31.597412109375, -30.634788513183594, -29.672164916992188, -28.70954132080078, -27.746917724609375, -26.78429412841797, -25.82166862487793, -24.859045028686523, -23.896421432495117, -22.93379783630371, -21.971174240112305, -21.0085506439209, -20.04592514038086, -19.083301544189453, -18.120677947998047, -17.15805435180664, -16.195430755615234, -15.232807159423828, -14.270183563232422, -13.3075590133667, -12.344935417175293, -11.382311820983887, -10.419687271118164, -9.45706558227539, -8.494441986083984, -7.53181791305542, -6.569194316864014, -5.606570243835449, -4.643946647644043, -3.6813230514526367, -2.7186989784240723, -1.7560749053955078, -0.7934511303901672, 0.16917264461517334, 1.1317963600158691, 2.0944201946258545, 3.05704402923584, 4.019667625427246, 4.9822916984558105, 5.944915294647217, 6.907538890838623, 7.8701629638671875, 8.832786560058594, 9.79541015625, 10.758033752441406, 11.720657348632812, 12.683281898498535, 13.645905494689941, 14.608529090881348, 15.571152687072754, 16.533777236938477, 17.496400833129883, 18.45902442932129, 19.421648025512695, 20.3842716217041, 21.346895217895508, 22.309518814086914, 23.27214241027832, 24.234766006469727, 25.197389602661133, 26.160015106201172, 27.122638702392578, 28.085262298583984, 29.04788589477539]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 9.0, 9.0, 9.0, 11.0, 6.0, 15.0, 17.0, 20.0, 25.0, 22.0, 42.0, 38.0, 41.0, 36.0, 25.0, 39.0, 53.0, 41.0, 45.0, 47.0, 40.0, 43.0, 36.0, 44.0, 34.0, 21.0, 33.0, 25.0, 22.0, 23.0, 11.0, 28.0, 12.0, 11.0, 10.0, 8.0, 10.0, 12.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.71459197998047, -16.211467742919922, -15.708341598510742, -15.205217361450195, -14.702092170715332, -14.198966979980469, -13.695842742919922, -13.192717552185059, -12.689592361450195, -12.186467170715332, -11.683341979980469, -11.180217742919922, -10.677092552185059, -10.173967361450195, -9.670843124389648, -9.167717933654785, -8.664592742919922, -8.161467552185059, -7.6583428382873535, -7.155218124389648, -6.652092933654785, -6.148967742919922, -5.645843029022217, -5.142718315124512, -4.639593124389648, -4.136467933654785, -3.63334321975708, -3.130218267440796, -2.6270933151245117, -2.1239683628082275, -1.6208434104919434, -1.1177184581756592, -0.614593505859375, -0.11146855354309082, 0.39165639877319336, 0.8947813510894775, 1.3979063034057617, 1.901031255722046, 2.40415620803833, 2.9072811603546143, 3.4104061126708984, 3.9135310649871826, 4.416656017303467, 4.919780731201172, 5.422905921936035, 5.926031112670898, 6.4291558265686035, 6.932280540466309, 7.435405731201172, 7.938530921936035, 8.441656112670898, 8.944780349731445, 9.447905540466309, 9.951030731201172, 10.454154968261719, 10.957280158996582, 11.460405349731445, 11.963530540466309, 12.466655731201172, 12.969779968261719, 13.472905158996582, 13.976030349731445, 14.479154586791992, 14.982279777526855, 15.485404968261719]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 3.0, 5.0, 8.0, 1.0, 11.0, 12.0, 12.0, 13.0, 12.0, 16.0, 17.0, 26.0, 23.0, 34.0, 22.0, 25.0, 40.0, 35.0, 44.0, 41.0, 42.0, 34.0, 35.0, 47.0, 39.0, 38.0, 37.0, 30.0, 34.0, 33.0, 25.0, 34.0, 27.0, 20.0, 22.0, 23.0, 15.0, 11.0, 16.0, 11.0, 11.0, 9.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4697265625, -1.4201812744140625, -1.370635986328125, -1.3210906982421875, -1.27154541015625, -1.2220001220703125, -1.172454833984375, -1.1229095458984375, -1.0733642578125, -1.0238189697265625, -0.974273681640625, -0.9247283935546875, -0.87518310546875, -0.8256378173828125, -0.776092529296875, -0.7265472412109375, -0.677001953125, -0.6274566650390625, -0.577911376953125, -0.5283660888671875, -0.47882080078125, -0.4292755126953125, -0.379730224609375, -0.3301849365234375, -0.2806396484375, -0.2310943603515625, -0.181549072265625, -0.1320037841796875, -0.08245849609375, -0.0329132080078125, 0.016632080078125, 0.0661773681640625, 0.11572265625, 0.1652679443359375, 0.214813232421875, 0.2643585205078125, 0.31390380859375, 0.3634490966796875, 0.412994384765625, 0.4625396728515625, 0.5120849609375, 0.5616302490234375, 0.611175537109375, 0.6607208251953125, 0.71026611328125, 0.7598114013671875, 0.809356689453125, 0.8589019775390625, 0.908447265625, 0.9579925537109375, 1.007537841796875, 1.0570831298828125, 1.10662841796875, 1.1561737060546875, 1.205718994140625, 1.2552642822265625, 1.3048095703125, 1.3543548583984375, 1.403900146484375, 1.4534454345703125, 1.50299072265625, 1.5525360107421875, 1.602081298828125, 1.6516265869140625, 1.701171875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 8.0, 6.0, 8.0, 12.0, 31.0, 26.0, 47.0, 105.0, 111.0, 188.0, 287.0, 375.0, 601.0, 861.0, 1337.0, 1859.0, 2885.0, 4318.0, 6399.0, 9824.0, 14743.0, 22472.0, 34840.0, 55677.0, 95570.0, 188884.0, 290990.0, 124324.0, 70098.0, 42476.0, 26887.0, 17550.0, 11531.0, 7609.0, 5129.0, 3418.0, 2289.0, 1540.0, 1052.0, 748.0, 468.0, 356.0, 190.0, 140.0, 124.0, 59.0, 35.0, 34.0, 18.0, 11.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061309814453125, -0.05934572219848633, -0.057381629943847656, -0.055417537689208984, -0.05345344543457031, -0.05148935317993164, -0.04952526092529297, -0.0475611686706543, -0.045597076416015625, -0.04363298416137695, -0.04166889190673828, -0.03970479965209961, -0.03774070739746094, -0.035776615142822266, -0.033812522888183594, -0.03184843063354492, -0.02988433837890625, -0.027920246124267578, -0.025956153869628906, -0.023992061614990234, -0.022027969360351562, -0.02006387710571289, -0.01809978485107422, -0.016135692596435547, -0.014171600341796875, -0.012207508087158203, -0.010243415832519531, -0.00827932357788086, -0.0063152313232421875, -0.004351139068603516, -0.0023870468139648438, -0.0004229545593261719, 0.0015411376953125, 0.003505229949951172, 0.005469322204589844, 0.007433414459228516, 0.009397506713867188, 0.01136159896850586, 0.013325691223144531, 0.015289783477783203, 0.017253875732421875, 0.019217967987060547, 0.02118206024169922, 0.02314615249633789, 0.025110244750976562, 0.027074337005615234, 0.029038429260253906, 0.031002521514892578, 0.03296661376953125, 0.03493070602416992, 0.036894798278808594, 0.038858890533447266, 0.04082298278808594, 0.04278707504272461, 0.04475116729736328, 0.04671525955200195, 0.048679351806640625, 0.0506434440612793, 0.05260753631591797, 0.05457162857055664, 0.05653572082519531, 0.058499813079833984, 0.060463905334472656, 0.06242799758911133, 0.06439208984375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 7.0, 11.0, 6.0, 17.0, 9.0, 22.0, 16.0, 21.0, 23.0, 23.0, 28.0, 27.0, 41.0, 33.0, 32.0, 41.0, 33.0, 40.0, 41.0, 1070.0, 37.0, 39.0, 45.0, 41.0, 33.0, 39.0, 28.0, 27.0, 28.0, 23.0, 19.0, 28.0, 17.0, 15.0, 9.0, 7.0, 5.0, 9.0, 8.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0869140625, -1.051025390625, -1.01513671875, -0.979248046875, -0.943359375, -0.907470703125, -0.87158203125, -0.835693359375, -0.7998046875, -0.763916015625, -0.72802734375, -0.692138671875, -0.65625, -0.620361328125, -0.58447265625, -0.548583984375, -0.5126953125, -0.476806640625, -0.44091796875, -0.405029296875, -0.369140625, -0.333251953125, -0.29736328125, -0.261474609375, -0.2255859375, -0.189697265625, -0.15380859375, -0.117919921875, -0.08203125, -0.046142578125, -0.01025390625, 0.025634765625, 0.0615234375, 0.097412109375, 0.13330078125, 0.169189453125, 0.205078125, 0.240966796875, 0.27685546875, 0.312744140625, 0.3486328125, 0.384521484375, 0.42041015625, 0.456298828125, 0.4921875, 0.528076171875, 0.56396484375, 0.599853515625, 0.6357421875, 0.671630859375, 0.70751953125, 0.743408203125, 0.779296875, 0.815185546875, 0.85107421875, 0.886962890625, 0.9228515625, 0.958740234375, 0.99462890625, 1.030517578125, 1.06640625, 1.102294921875, 1.13818359375, 1.174072265625, 1.2099609375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 9.0, 11.0, 14.0, 24.0, 43.0, 44.0, 90.0, 115.0, 150.0, 245.0, 358.0, 508.0, 738.0, 1147.0, 1622.0, 2384.0, 3600.0, 5143.0, 7538.0, 11223.0, 16888.0, 25581.0, 39511.0, 65200.0, 114417.0, 1320174.0, 210756.0, 102100.0, 59030.0, 36829.0, 23480.0, 15463.0, 10489.0, 7125.0, 4889.0, 3247.0, 2184.0, 1475.0, 1008.0, 746.0, 519.0, 319.0, 223.0, 165.0, 111.0, 70.0, 44.0, 33.0, 18.0, 20.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0], "bins": [-0.03485107421875, -0.03379201889038086, -0.03273296356201172, -0.03167390823364258, -0.030614852905273438, -0.029555797576904297, -0.028496742248535156, -0.027437686920166016, -0.026378631591796875, -0.025319576263427734, -0.024260520935058594, -0.023201465606689453, -0.022142410278320312, -0.021083354949951172, -0.02002429962158203, -0.01896524429321289, -0.01790618896484375, -0.01684713363647461, -0.01578807830810547, -0.014729022979736328, -0.013669967651367188, -0.012610912322998047, -0.011551856994628906, -0.010492801666259766, -0.009433746337890625, -0.008374691009521484, -0.007315635681152344, -0.006256580352783203, -0.0051975250244140625, -0.004138469696044922, -0.0030794143676757812, -0.0020203590393066406, -0.0009613037109375, 9.775161743164062e-05, 0.0011568069458007812, 0.002215862274169922, 0.0032749176025390625, 0.004333972930908203, 0.005393028259277344, 0.006452083587646484, 0.007511138916015625, 0.008570194244384766, 0.009629249572753906, 0.010688304901123047, 0.011747360229492188, 0.012806415557861328, 0.013865470886230469, 0.01492452621459961, 0.01598358154296875, 0.01704263687133789, 0.01810169219970703, 0.019160747528076172, 0.020219802856445312, 0.021278858184814453, 0.022337913513183594, 0.023396968841552734, 0.024456024169921875, 0.025515079498291016, 0.026574134826660156, 0.027633190155029297, 0.028692245483398438, 0.029751300811767578, 0.03081035614013672, 0.03186941146850586, 0.032928466796875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 0.0, 13.0, 11.0, 10.0, 0.0, 14.0, 22.0, 33.0, 0.0, 77.0, 625.0, 90.0, 0.0, 27.0, 21.0, 10.0, 10.0, 0.0, 8.0, 11.0, 5.0, 0.0, 2.0, 1.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2060627341270447e-06, -1.1604279279708862e-06, -1.1147931218147278e-06, -1.0691583156585693e-06, -1.0235235095024109e-06, -9.778887033462524e-07, -9.32253897190094e-07, -8.866190910339355e-07, -8.409842848777771e-07, -7.953494787216187e-07, -7.497146725654602e-07, -7.040798664093018e-07, -6.584450602531433e-07, -6.128102540969849e-07, -5.671754479408264e-07, -5.21540641784668e-07, -4.759058356285095e-07, -4.302710294723511e-07, -3.8463622331619263e-07, -3.390014171600342e-07, -2.9336661100387573e-07, -2.477318048477173e-07, -2.0209699869155884e-07, -1.564621925354004e-07, -1.1082738637924194e-07, -6.51925802230835e-08, -1.955777406692505e-08, 2.60770320892334e-08, 7.171183824539185e-08, 1.1734664440155029e-07, 1.6298145055770874e-07, 2.086162567138672e-07, 2.5425106287002563e-07, 2.998858690261841e-07, 3.4552067518234253e-07, 3.91155481338501e-07, 4.367902874946594e-07, 4.824250936508179e-07, 5.280598998069763e-07, 5.736947059631348e-07, 6.193295121192932e-07, 6.649643182754517e-07, 7.105991244316101e-07, 7.562339305877686e-07, 8.01868736743927e-07, 8.475035429000854e-07, 8.931383490562439e-07, 9.387731552124023e-07, 9.844079613685608e-07, 1.0300427675247192e-06, 1.0756775736808777e-06, 1.1213123798370361e-06, 1.1669471859931946e-06, 1.212581992149353e-06, 1.2582167983055115e-06, 1.30385160446167e-06, 1.3494864106178284e-06, 1.3951212167739868e-06, 1.4407560229301453e-06, 1.4863908290863037e-06, 1.5320256352424622e-06, 1.5776604413986206e-06, 1.623295247554779e-06, 1.6689300537109375e-06]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 7.0, 2.0, 2.0, 4.0, 6.0, 10.0, 26.0, 32.0, 43.0, 46.0, 96.0, 262.0, 2313.0, 983330.0, 61176.0, 795.0, 176.0, 63.0, 37.0, 29.0, 23.0, 31.0, 12.0, 8.0, 9.0, 5.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.6881694793701172e-05, -2.6131048798561096e-05, -2.538040280342102e-05, -2.4629756808280945e-05, -2.387911081314087e-05, -2.3128464818000793e-05, -2.2377818822860718e-05, -2.1627172827720642e-05, -2.0876526832580566e-05, -2.012588083744049e-05, -1.9375234842300415e-05, -1.862458884716034e-05, -1.7873942852020264e-05, -1.7123296856880188e-05, -1.6372650861740112e-05, -1.5622004866600037e-05, -1.4871358871459961e-05, -1.4120712876319885e-05, -1.337006688117981e-05, -1.2619420886039734e-05, -1.1868774890899658e-05, -1.1118128895759583e-05, -1.0367482900619507e-05, -9.616836905479431e-06, -8.866190910339355e-06, -8.11554491519928e-06, -7.364898920059204e-06, -6.614252924919128e-06, -5.863606929779053e-06, -5.112960934638977e-06, -4.362314939498901e-06, -3.6116689443588257e-06, -2.86102294921875e-06, -2.1103769540786743e-06, -1.3597309589385986e-06, -6.09084963798523e-07, 1.4156103134155273e-07, 8.922070264816284e-07, 1.642853021621704e-06, 2.3934990167617798e-06, 3.1441450119018555e-06, 3.894791007041931e-06, 4.645437002182007e-06, 5.3960829973220825e-06, 6.146728992462158e-06, 6.897374987602234e-06, 7.64802098274231e-06, 8.398666977882385e-06, 9.149312973022461e-06, 9.899958968162537e-06, 1.0650604963302612e-05, 1.1401250958442688e-05, 1.2151896953582764e-05, 1.290254294872284e-05, 1.3653188943862915e-05, 1.440383493900299e-05, 1.5154480934143066e-05, 1.5905126929283142e-05, 1.6655772924423218e-05, 1.7406418919563293e-05, 1.815706491470337e-05, 1.8907710909843445e-05, 1.965835690498352e-05, 2.0409002900123596e-05, 2.1159648895263672e-05]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 10.0, 8.0, 13.0, 901.0, 9.0, 11.0, 17.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.6425776645264705e-07, -4.544414764495741e-07, -4.446252148682106e-07, -4.3480892486513767e-07, -4.2499263486206473e-07, -4.1517637328070123e-07, -4.053600832776283e-07, -3.9554379327455536e-07, -3.8572753169319185e-07, -3.759112416901189e-07, -3.660949801087554e-07, -3.5627869010568247e-07, -3.4646240010260954e-07, -3.3664613852124603e-07, -3.268298485181731e-07, -3.170135869368096e-07, -3.0719729693373665e-07, -2.973810069306637e-07, -2.875647453493002e-07, -2.777484553462273e-07, -2.6793216534315434e-07, -2.5811590376179083e-07, -2.482996137587179e-07, -2.3848332375564496e-07, -2.2866703375257202e-07, -2.188507579603538e-07, -2.0903446795728087e-07, -1.9921819216506265e-07, -1.8940191637284443e-07, -1.795856405806262e-07, -1.6976935057755327e-07, -1.5995307478533505e-07, -1.501367847822621e-07, -1.403205089900439e-07, -1.3050421898697095e-07, -1.2068794319475273e-07, -1.1087166740253451e-07, -1.0105538450488893e-07, -9.123910160724336e-08, -8.142282581502513e-08, -7.160654291737956e-08, -6.179026001973398e-08, -5.197398422751576e-08, -4.215770132987018e-08, -3.234142198493828e-08, -2.252514264000638e-08, -1.27088597423608e-08, -2.89258395014258e-09, 6.923698947502999e-09, 1.6739978292434898e-08, 2.6556259413723637e-08, 3.6372540535012376e-08, 4.6188819879944276e-08, 5.6005099224876176e-08, 6.582138212252175e-08, 7.563765791473998e-08, 8.545394081238555e-08, 9.527022371003113e-08, 1.0508649950224935e-07, 1.1490278239989493e-07, 1.247190652975405e-07, 1.3453534108975873e-07, 1.4435161688197695e-07, 1.541679068850499e-07, 1.639841826772681e-07]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 903.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.384185791015625e-07, -2.3189932107925415e-07, -2.253800630569458e-07, -2.1886080503463745e-07, -2.123415470123291e-07, -2.0582228899002075e-07, -1.993030309677124e-07, -1.9278377294540405e-07, -1.862645149230957e-07, -1.7974525690078735e-07, -1.73225998878479e-07, -1.6670674085617065e-07, -1.601874828338623e-07, -1.5366822481155396e-07, -1.471489667892456e-07, -1.4062970876693726e-07, -1.341104507446289e-07, -1.2759119272232056e-07, -1.210719347000122e-07, -1.1455267667770386e-07, -1.0803341865539551e-07, -1.0151416063308716e-07, -9.499490261077881e-08, -8.847564458847046e-08, -8.195638656616211e-08, -7.543712854385376e-08, -6.891787052154541e-08, -6.239861249923706e-08, -5.587935447692871e-08, -4.936009645462036e-08, -4.284083843231201e-08, -3.632158041000366e-08, -2.9802322387695312e-08, -2.3283064365386963e-08, -1.6763806343078613e-08, -1.0244548320770264e-08, -3.725290298461914e-09, 2.7939677238464355e-09, 9.313225746154785e-09, 1.5832483768463135e-08, 2.2351741790771484e-08, 2.8870999813079834e-08, 3.5390257835388184e-08, 4.190951585769653e-08, 4.842877388000488e-08, 5.494803190231323e-08, 6.146728992462158e-08, 6.798654794692993e-08, 7.450580596923828e-08, 8.102506399154663e-08, 8.754432201385498e-08, 9.406358003616333e-08, 1.0058283805847168e-07, 1.0710209608078003e-07, 1.1362135410308838e-07, 1.2014061212539673e-07, 1.2665987014770508e-07, 1.3317912817001343e-07, 1.3969838619232178e-07, 1.4621764421463013e-07, 1.5273690223693848e-07, 1.5925616025924683e-07, 1.6577541828155518e-07, 1.7229467630386353e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 3.0, 5.0, 8.0, 1.0, 11.0, 12.0, 12.0, 13.0, 12.0, 16.0, 17.0, 26.0, 23.0, 34.0, 22.0, 25.0, 40.0, 35.0, 44.0, 41.0, 42.0, 34.0, 35.0, 47.0, 39.0, 38.0, 37.0, 30.0, 34.0, 33.0, 25.0, 34.0, 27.0, 20.0, 22.0, 23.0, 15.0, 11.0, 16.0, 11.0, 11.0, 9.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4697265625, -1.4201812744140625, -1.370635986328125, -1.3210906982421875, -1.27154541015625, -1.2220001220703125, -1.172454833984375, -1.1229095458984375, -1.0733642578125, -1.0238189697265625, -0.974273681640625, -0.9247283935546875, -0.87518310546875, -0.8256378173828125, -0.776092529296875, -0.7265472412109375, -0.677001953125, -0.6274566650390625, -0.577911376953125, -0.5283660888671875, -0.47882080078125, -0.4292755126953125, -0.379730224609375, -0.3301849365234375, -0.2806396484375, -0.2310943603515625, -0.181549072265625, -0.1320037841796875, -0.08245849609375, -0.0329132080078125, 0.016632080078125, 0.0661773681640625, 0.11572265625, 0.1652679443359375, 0.214813232421875, 0.2643585205078125, 0.31390380859375, 0.3634490966796875, 0.412994384765625, 0.4625396728515625, 0.5120849609375, 0.5616302490234375, 0.611175537109375, 0.6607208251953125, 0.71026611328125, 0.7598114013671875, 0.809356689453125, 0.8589019775390625, 0.908447265625, 0.9579925537109375, 1.007537841796875, 1.0570831298828125, 1.10662841796875, 1.1561737060546875, 1.205718994140625, 1.2552642822265625, 1.3048095703125, 1.3543548583984375, 1.403900146484375, 1.4534454345703125, 1.50299072265625, 1.5525360107421875, 1.602081298828125, 1.6516265869140625, 1.701171875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 10.0, 11.0, 16.0, 25.0, 45.0, 50.0, 93.0, 126.0, 189.0, 287.0, 383.0, 591.0, 952.0, 1298.0, 2015.0, 2914.0, 4289.0, 6479.0, 9412.0, 14203.0, 21864.0, 36065.0, 59967.0, 101513.0, 177500.0, 233361.0, 150016.0, 86313.0, 50560.0, 30486.0, 19313.0, 12335.0, 8432.0, 5690.0, 3752.0, 2630.0, 1754.0, 1192.0, 784.0, 547.0, 372.0, 246.0, 154.0, 100.0, 82.0, 55.0, 33.0, 22.0, 15.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.607421875, -1.5577239990234375, -1.508026123046875, -1.4583282470703125, -1.40863037109375, -1.3589324951171875, -1.309234619140625, -1.2595367431640625, -1.2098388671875, -1.1601409912109375, -1.110443115234375, -1.0607452392578125, -1.01104736328125, -0.9613494873046875, -0.911651611328125, -0.8619537353515625, -0.812255859375, -0.7625579833984375, -0.712860107421875, -0.6631622314453125, -0.61346435546875, -0.5637664794921875, -0.514068603515625, -0.4643707275390625, -0.4146728515625, -0.3649749755859375, -0.315277099609375, -0.2655792236328125, -0.21588134765625, -0.1661834716796875, -0.116485595703125, -0.0667877197265625, -0.01708984375, 0.0326080322265625, 0.082305908203125, 0.1320037841796875, 0.18170166015625, 0.2313995361328125, 0.281097412109375, 0.3307952880859375, 0.3804931640625, 0.4301910400390625, 0.479888916015625, 0.5295867919921875, 0.57928466796875, 0.6289825439453125, 0.678680419921875, 0.7283782958984375, 0.778076171875, 0.8277740478515625, 0.877471923828125, 0.9271697998046875, 0.97686767578125, 1.0265655517578125, 1.076263427734375, 1.1259613037109375, 1.1756591796875, 1.2253570556640625, 1.275054931640625, 1.3247528076171875, 1.37445068359375, 1.4241485595703125, 1.473846435546875, 1.5235443115234375, 1.5732421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 6.0, 6.0, 7.0, 15.0, 17.0, 17.0, 10.0, 19.0, 36.0, 41.0, 33.0, 42.0, 40.0, 49.0, 73.0, 99.0, 137.0, 230.0, 1318.0, 192.0, 119.0, 77.0, 61.0, 57.0, 48.0, 32.0, 36.0, 31.0, 35.0, 21.0, 19.0, 20.0, 24.0, 22.0, 9.0, 13.0, 8.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.16015625, -5.98114013671875, -5.8021240234375, -5.62310791015625, -5.444091796875, -5.26507568359375, -5.0860595703125, -4.90704345703125, -4.72802734375, -4.54901123046875, -4.3699951171875, -4.19097900390625, -4.011962890625, -3.83294677734375, -3.6539306640625, -3.47491455078125, -3.2958984375, -3.11688232421875, -2.9378662109375, -2.75885009765625, -2.579833984375, -2.40081787109375, -2.2218017578125, -2.04278564453125, -1.86376953125, -1.68475341796875, -1.5057373046875, -1.32672119140625, -1.147705078125, -0.96868896484375, -0.7896728515625, -0.61065673828125, -0.431640625, -0.25262451171875, -0.0736083984375, 0.10540771484375, 0.284423828125, 0.46343994140625, 0.6424560546875, 0.82147216796875, 1.00048828125, 1.17950439453125, 1.3585205078125, 1.53753662109375, 1.716552734375, 1.89556884765625, 2.0745849609375, 2.25360107421875, 2.4326171875, 2.61163330078125, 2.7906494140625, 2.96966552734375, 3.148681640625, 3.32769775390625, 3.5067138671875, 3.68572998046875, 3.86474609375, 4.04376220703125, 4.2227783203125, 4.40179443359375, 4.580810546875, 4.75982666015625, 4.9388427734375, 5.11785888671875, 5.296875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 7.0, 18.0, 20.0, 23.0, 29.0, 18.0, 38.0, 53.0, 71.0, 98.0, 187.0, 372.0, 653.0, 1567.0, 4095.0, 13337.0, 59596.0, 477497.0, 2285788.0, 248488.0, 38658.0, 9551.0, 2929.0, 1264.0, 523.0, 275.0, 162.0, 108.0, 60.0, 54.0, 27.0, 26.0, 18.0, 20.0, 8.0, 13.0, 7.0, 5.0, 5.0, 4.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.64453125, -7.40081787109375, -7.1571044921875, -6.91339111328125, -6.669677734375, -6.42596435546875, -6.1822509765625, -5.93853759765625, -5.69482421875, -5.45111083984375, -5.2073974609375, -4.96368408203125, -4.719970703125, -4.47625732421875, -4.2325439453125, -3.98883056640625, -3.7451171875, -3.50140380859375, -3.2576904296875, -3.01397705078125, -2.770263671875, -2.52655029296875, -2.2828369140625, -2.03912353515625, -1.79541015625, -1.55169677734375, -1.3079833984375, -1.06427001953125, -0.820556640625, -0.57684326171875, -0.3331298828125, -0.08941650390625, 0.154296875, 0.39801025390625, 0.6417236328125, 0.88543701171875, 1.129150390625, 1.37286376953125, 1.6165771484375, 1.86029052734375, 2.10400390625, 2.34771728515625, 2.5914306640625, 2.83514404296875, 3.078857421875, 3.32257080078125, 3.5662841796875, 3.80999755859375, 4.0537109375, 4.29742431640625, 4.5411376953125, 4.78485107421875, 5.028564453125, 5.27227783203125, 5.5159912109375, 5.75970458984375, 6.00341796875, 6.24713134765625, 6.4908447265625, 6.73455810546875, 6.978271484375, 7.22198486328125, 7.4656982421875, 7.70941162109375, 7.953125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 104.0, 733.0, 174.0], "bins": [-305.97344970703125, -301.0771484375, -296.1808776855469, -291.2845764160156, -286.3883056640625, -281.49200439453125, -276.595703125, -271.6994323730469, -266.8031311035156, -261.9068298339844, -257.01055908203125, -252.1142578125, -247.2179718017578, -242.32168579101562, -237.42538452148438, -232.5290985107422, -227.6328125, -222.7365264892578, -217.84024047851562, -212.94393920898438, -208.0476531982422, -203.1513671875, -198.25506591796875, -193.35877990722656, -188.46249389648438, -183.5662078857422, -178.669921875, -173.77362060546875, -168.87733459472656, -163.98104858398438, -159.08474731445312, -154.18846130371094, -149.29217529296875, -144.39588928222656, -139.49960327148438, -134.60330200195312, -129.70701599121094, -124.81072998046875, -119.91443634033203, -115.01814270019531, -110.12186431884766, -105.22557067871094, -100.32928466796875, -95.43299865722656, -90.53670501708984, -85.64041137695312, -80.74412536621094, -75.84783935546875, -70.95154571533203, -66.05525207519531, -61.158966064453125, -56.26267623901367, -51.36638641357422, -46.470096588134766, -41.57380676269531, -36.67751693725586, -31.781227111816406, -26.884937286376953, -21.9886474609375, -17.092357635498047, -12.196067810058594, -7.299777984619141, -2.4034881591796875, 2.4928016662597656, 7.389091491699219]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 5.0, 1.0, 3.0, 4.0, 9.0, 8.0, 6.0, 7.0, 8.0, 18.0, 9.0, 22.0, 18.0, 25.0, 27.0, 28.0, 18.0, 21.0, 26.0, 32.0, 46.0, 31.0, 31.0, 41.0, 35.0, 34.0, 33.0, 44.0, 38.0, 28.0, 28.0, 38.0, 47.0, 34.0, 26.0, 19.0, 20.0, 26.0, 19.0, 12.0, 11.0, 15.0, 17.0, 10.0, 4.0, 5.0, 4.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.080780029296875, -17.523303985595703, -16.96582794189453, -16.40835189819336, -15.850875854492188, -15.293399810791016, -14.73592472076416, -14.178448677062988, -13.620972633361816, -13.063496589660645, -12.506020545959473, -11.9485445022583, -11.391069412231445, -10.833593368530273, -10.276117324829102, -9.71864128112793, -9.161165237426758, -8.603689193725586, -8.046213150024414, -7.4887375831604, -6.9312615394592285, -6.373785495758057, -5.816309928894043, -5.258833885192871, -4.701357841491699, -4.143881797790527, -3.5864059925079346, -3.028930187225342, -2.47145414352417, -1.913978099822998, -1.3565022945404053, -0.7990264892578125, -0.24155235290527344, 0.3159235715866089, 0.8733994960784912, 1.4308754205703735, 1.9883513450622559, 2.5458273887634277, 3.1033031940460205, 3.6607789993286133, 4.218255043029785, 4.775731086730957, 5.333207130432129, 5.890682697296143, 6.4481587409973145, 7.005634784698486, 7.5631103515625, 8.120586395263672, 8.678062438964844, 9.235538482666016, 9.793014526367188, 10.35049057006836, 10.907966613769531, 11.465442657470703, 12.022917747497559, 12.58039379119873, 13.137869834899902, 13.695345878601074, 14.252821922302246, 14.810297966003418, 15.367773056030273, 15.925249099731445, 16.482725143432617, 17.04020118713379, 17.59767723083496]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 4.0, 6.0, 9.0, 12.0, 14.0, 17.0, 23.0, 15.0, 23.0, 21.0, 26.0, 31.0, 36.0, 39.0, 27.0, 35.0, 44.0, 35.0, 34.0, 44.0, 40.0, 50.0, 36.0, 41.0, 40.0, 27.0, 33.0, 35.0, 23.0, 35.0, 16.0, 18.0, 14.0, 16.0, 20.0, 14.0, 9.0, 5.0, 10.0, 7.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.564453125, -1.5117340087890625, -1.459014892578125, -1.4062957763671875, -1.35357666015625, -1.3008575439453125, -1.248138427734375, -1.1954193115234375, -1.1427001953125, -1.0899810791015625, -1.037261962890625, -0.9845428466796875, -0.93182373046875, -0.8791046142578125, -0.826385498046875, -0.7736663818359375, -0.720947265625, -0.6682281494140625, -0.615509033203125, -0.5627899169921875, -0.51007080078125, -0.4573516845703125, -0.404632568359375, -0.3519134521484375, -0.2991943359375, -0.2464752197265625, -0.193756103515625, -0.1410369873046875, -0.08831787109375, -0.0355987548828125, 0.017120361328125, 0.0698394775390625, 0.12255859375, 0.1752777099609375, 0.227996826171875, 0.2807159423828125, 0.33343505859375, 0.3861541748046875, 0.438873291015625, 0.4915924072265625, 0.5443115234375, 0.5970306396484375, 0.649749755859375, 0.7024688720703125, 0.75518798828125, 0.8079071044921875, 0.860626220703125, 0.9133453369140625, 0.966064453125, 1.0187835693359375, 1.071502685546875, 1.1242218017578125, 1.17694091796875, 1.2296600341796875, 1.282379150390625, 1.3350982666015625, 1.3878173828125, 1.4405364990234375, 1.493255615234375, 1.5459747314453125, 1.59869384765625, 1.6514129638671875, 1.704132080078125, 1.7568511962890625, 1.8095703125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 4.0, 5.0, 5.0, 9.0, 20.0, 23.0, 31.0, 26.0, 40.0, 69.0, 106.0, 158.0, 217.0, 397.0, 793.0, 1655.0, 4103.0, 11153.0, 32910.0, 104434.0, 350830.0, 1208165.0, 1671940.0, 565953.0, 163577.0, 50294.0, 16553.0, 6082.0, 2352.0, 1017.0, 477.0, 272.0, 159.0, 121.0, 98.0, 53.0, 46.0, 33.0, 30.0, 17.0, 15.0, 13.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.654296875, -3.544189453125, -3.43408203125, -3.323974609375, -3.2138671875, -3.103759765625, -2.99365234375, -2.883544921875, -2.7734375, -2.663330078125, -2.55322265625, -2.443115234375, -2.3330078125, -2.222900390625, -2.11279296875, -2.002685546875, -1.892578125, -1.782470703125, -1.67236328125, -1.562255859375, -1.4521484375, -1.342041015625, -1.23193359375, -1.121826171875, -1.01171875, -0.901611328125, -0.79150390625, -0.681396484375, -0.5712890625, -0.461181640625, -0.35107421875, -0.240966796875, -0.130859375, -0.020751953125, 0.08935546875, 0.199462890625, 0.3095703125, 0.419677734375, 0.52978515625, 0.639892578125, 0.75, 0.860107421875, 0.97021484375, 1.080322265625, 1.1904296875, 1.300537109375, 1.41064453125, 1.520751953125, 1.630859375, 1.740966796875, 1.85107421875, 1.961181640625, 2.0712890625, 2.181396484375, 2.29150390625, 2.401611328125, 2.51171875, 2.621826171875, 2.73193359375, 2.842041015625, 2.9521484375, 3.062255859375, 3.17236328125, 3.282470703125, 3.392578125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 11.0, 20.0, 33.0, 46.0, 89.0, 150.0, 303.0, 454.0, 738.0, 839.0, 562.0, 381.0, 207.0, 112.0, 63.0, 33.0, 18.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.109375, -13.81671142578125, -13.5240478515625, -13.23138427734375, -12.938720703125, -12.64605712890625, -12.3533935546875, -12.06072998046875, -11.76806640625, -11.47540283203125, -11.1827392578125, -10.89007568359375, -10.597412109375, -10.30474853515625, -10.0120849609375, -9.71942138671875, -9.4267578125, -9.13409423828125, -8.8414306640625, -8.54876708984375, -8.256103515625, -7.96343994140625, -7.6707763671875, -7.37811279296875, -7.08544921875, -6.79278564453125, -6.5001220703125, -6.20745849609375, -5.914794921875, -5.62213134765625, -5.3294677734375, -5.03680419921875, -4.744140625, -4.45147705078125, -4.1588134765625, -3.86614990234375, -3.573486328125, -3.28082275390625, -2.9881591796875, -2.69549560546875, -2.40283203125, -2.11016845703125, -1.8175048828125, -1.52484130859375, -1.232177734375, -0.93951416015625, -0.6468505859375, -0.35418701171875, -0.0615234375, 0.23114013671875, 0.5238037109375, 0.81646728515625, 1.109130859375, 1.40179443359375, 1.6944580078125, 1.98712158203125, 2.27978515625, 2.57244873046875, 2.8651123046875, 3.15777587890625, 3.450439453125, 3.74310302734375, 4.0357666015625, 4.32843017578125, 4.62109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 9.0, 10.0, 30.0, 27.0, 43.0, 81.0, 139.0, 269.0, 586.0, 1531.0, 5640.0, 45226.0, 790046.0, 3010448.0, 313928.0, 20708.0, 3538.0, 1071.0, 444.0, 229.0, 105.0, 61.0, 37.0, 25.0, 18.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2265625, -9.7884521484375, -9.350341796875, -8.9122314453125, -8.47412109375, -8.0360107421875, -7.597900390625, -7.1597900390625, -6.7216796875, -6.2835693359375, -5.845458984375, -5.4073486328125, -4.96923828125, -4.5311279296875, -4.093017578125, -3.6549072265625, -3.216796875, -2.7786865234375, -2.340576171875, -1.9024658203125, -1.46435546875, -1.0262451171875, -0.588134765625, -0.1500244140625, 0.2880859375, 0.7261962890625, 1.164306640625, 1.6024169921875, 2.04052734375, 2.4786376953125, 2.916748046875, 3.3548583984375, 3.79296875, 4.2310791015625, 4.669189453125, 5.1072998046875, 5.54541015625, 5.9835205078125, 6.421630859375, 6.8597412109375, 7.2978515625, 7.7359619140625, 8.174072265625, 8.6121826171875, 9.05029296875, 9.4884033203125, 9.926513671875, 10.3646240234375, 10.802734375, 11.2408447265625, 11.678955078125, 12.1170654296875, 12.55517578125, 12.9932861328125, 13.431396484375, 13.8695068359375, 14.3076171875, 14.7457275390625, 15.183837890625, 15.6219482421875, 16.06005859375, 16.4981689453125, 16.936279296875, 17.3743896484375, 17.8125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 8.0, 24.0, 35.0, 46.0, 66.0, 79.0, 92.0, 104.0, 122.0, 117.0, 98.0, 71.0, 57.0, 44.0, 22.0, 10.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.606205940246582, -12.44528865814209, -11.284372329711914, -10.123455047607422, -8.96253776550293, -7.801621437072754, -6.640704154968262, -5.479787826538086, -4.318870544433594, -3.1579537391662598, -1.9970366954803467, -0.8361196517944336, 0.3247971534729004, 1.4857139587402344, 2.6466312408447266, 3.8075475692749023, 4.9684648513793945, 6.1293816566467285, 7.2902984619140625, 8.451215744018555, 9.612133026123047, 10.773049354553223, 11.933966636657715, 13.09488296508789, 14.255800247192383, 15.416717529296875, 16.577634811401367, 17.73855209350586, 18.89946746826172, 20.06038475036621, 21.221302032470703, 22.382217407226562, 23.543132781982422, 24.704050064086914, 25.864967346191406, 27.025882720947266, 28.186800003051758, 29.34771728515625, 30.508634567260742, 31.669551849365234, 32.830467224121094, 33.99138259887695, 35.15230178833008, 36.31321716308594, 37.47413635253906, 38.63505172729492, 39.79596710205078, 40.956886291503906, 42.11780548095703, 43.27872085571289, 44.439640045166016, 45.600555419921875, 46.761474609375, 47.92238998413086, 49.08330535888672, 50.244224548339844, 51.4051399230957, 52.56605529785156, 53.72697448730469, 54.88788986206055, 56.04880905151367, 57.20972442626953, 58.370643615722656, 59.531558990478516, 60.692474365234375]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 7.0, 4.0, 10.0, 8.0, 12.0, 10.0, 16.0, 22.0, 15.0, 15.0, 14.0, 29.0, 33.0, 34.0, 29.0, 29.0, 33.0, 39.0, 42.0, 42.0, 42.0, 28.0, 53.0, 29.0, 47.0, 29.0, 38.0, 41.0, 30.0, 33.0, 31.0, 24.0, 15.0, 15.0, 24.0, 20.0, 12.0, 13.0, 8.0, 11.0, 7.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.288288116455078, -19.717477798461914, -19.14666748046875, -18.575857162475586, -18.005046844482422, -17.434236526489258, -16.863426208496094, -16.292617797851562, -15.721806526184082, -15.150996208190918, -14.580185890197754, -14.00937557220459, -13.438566207885742, -12.867755889892578, -12.296945571899414, -11.72613525390625, -11.155324935913086, -10.584514617919922, -10.013704299926758, -9.442893981933594, -8.87208366394043, -8.301273345947266, -7.730463981628418, -7.159653663635254, -6.58884334564209, -6.018033027648926, -5.447222709655762, -4.876412868499756, -4.305602550506592, -3.7347922325134277, -3.1639821529388428, -2.593172073364258, -2.022359848022461, -1.4515496492385864, -0.8807394504547119, -0.3099292516708374, 0.2608809471130371, 0.8316912651062012, 1.4025013446807861, 1.973311424255371, 2.544121742248535, 3.114932060241699, 3.685742139816284, 4.256552219390869, 4.827362537384033, 5.398172855377197, 5.968982696533203, 6.539793014526367, 7.110603332519531, 7.681413650512695, 8.25222396850586, 8.823034286499023, 9.393844604492188, 9.964654922485352, 10.5354642868042, 11.106274604797363, 11.677084922790527, 12.247895240783691, 12.818705558776855, 13.38951587677002, 13.960325241088867, 14.531135559082031, 15.101945877075195, 15.67275619506836, 16.243566513061523]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 5.0, 7.0, 6.0, 9.0, 11.0, 16.0, 13.0, 20.0, 15.0, 19.0, 20.0, 27.0, 30.0, 32.0, 35.0, 35.0, 39.0, 28.0, 36.0, 36.0, 38.0, 47.0, 36.0, 42.0, 38.0, 35.0, 35.0, 37.0, 41.0, 29.0, 25.0, 20.0, 19.0, 19.0, 19.0, 18.0, 19.0, 11.0, 6.0, 7.0, 8.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.564453125, -1.5109100341796875, -1.457366943359375, -1.4038238525390625, -1.35028076171875, -1.2967376708984375, -1.243194580078125, -1.1896514892578125, -1.1361083984375, -1.0825653076171875, -1.029022216796875, -0.9754791259765625, -0.92193603515625, -0.8683929443359375, -0.814849853515625, -0.7613067626953125, -0.707763671875, -0.6542205810546875, -0.600677490234375, -0.5471343994140625, -0.49359130859375, -0.4400482177734375, -0.386505126953125, -0.3329620361328125, -0.2794189453125, -0.2258758544921875, -0.172332763671875, -0.1187896728515625, -0.06524658203125, -0.0117034912109375, 0.041839599609375, 0.0953826904296875, 0.14892578125, 0.2024688720703125, 0.256011962890625, 0.3095550537109375, 0.36309814453125, 0.4166412353515625, 0.470184326171875, 0.5237274169921875, 0.5772705078125, 0.6308135986328125, 0.684356689453125, 0.7378997802734375, 0.79144287109375, 0.8449859619140625, 0.898529052734375, 0.9520721435546875, 1.005615234375, 1.0591583251953125, 1.112701416015625, 1.1662445068359375, 1.21978759765625, 1.2733306884765625, 1.326873779296875, 1.3804168701171875, 1.4339599609375, 1.4875030517578125, 1.541046142578125, 1.5945892333984375, 1.64813232421875, 1.7016754150390625, 1.755218505859375, 1.8087615966796875, 1.8623046875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 5.0, 7.0, 21.0, 40.0, 49.0, 82.0, 121.0, 159.0, 248.0, 380.0, 566.0, 829.0, 1263.0, 1942.0, 2813.0, 4250.0, 6156.0, 9181.0, 13057.0, 19126.0, 28905.0, 43510.0, 67465.0, 113367.0, 276722.0, 187533.0, 94989.0, 58593.0, 38069.0, 25442.0, 17209.0, 11710.0, 7952.0, 5531.0, 3651.0, 2564.0, 1678.0, 1154.0, 785.0, 501.0, 313.0, 206.0, 147.0, 97.0, 50.0, 38.0, 34.0, 15.0, 9.0, 10.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.062255859375, -0.06030082702636719, -0.058345794677734375, -0.05639076232910156, -0.05443572998046875, -0.05248069763183594, -0.050525665283203125, -0.04857063293457031, -0.0466156005859375, -0.04466056823730469, -0.042705535888671875, -0.04075050354003906, -0.03879547119140625, -0.03684043884277344, -0.034885406494140625, -0.03293037414550781, -0.030975341796875, -0.029020309448242188, -0.027065277099609375, -0.025110244750976562, -0.02315521240234375, -0.021200180053710938, -0.019245147705078125, -0.017290115356445312, -0.0153350830078125, -0.013380050659179688, -0.011425018310546875, -0.009469985961914062, -0.00751495361328125, -0.0055599212646484375, -0.003604888916015625, -0.0016498565673828125, 0.00030517578125, 0.0022602081298828125, 0.004215240478515625, 0.0061702728271484375, 0.00812530517578125, 0.010080337524414062, 0.012035369873046875, 0.013990402221679688, 0.0159454345703125, 0.017900466918945312, 0.019855499267578125, 0.021810531616210938, 0.02376556396484375, 0.025720596313476562, 0.027675628662109375, 0.029630661010742188, 0.031585693359375, 0.03354072570800781, 0.035495758056640625, 0.03745079040527344, 0.03940582275390625, 0.04136085510253906, 0.043315887451171875, 0.04527091979980469, 0.0472259521484375, 0.04918098449707031, 0.051136016845703125, 0.05309104919433594, 0.05504608154296875, 0.05700111389160156, 0.058956146240234375, 0.06091117858886719, 0.0628662109375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 4.0, 9.0, 11.0, 7.0, 18.0, 21.0, 31.0, 32.0, 29.0, 29.0, 23.0, 34.0, 35.0, 43.0, 40.0, 45.0, 32.0, 34.0, 1051.0, 42.0, 45.0, 45.0, 44.0, 40.0, 39.0, 34.0, 35.0, 31.0, 23.0, 14.0, 16.0, 12.0, 10.0, 12.0, 8.0, 12.0, 5.0, 10.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1787109375, -1.1368255615234375, -1.094940185546875, -1.0530548095703125, -1.01116943359375, -0.9692840576171875, -0.927398681640625, -0.8855133056640625, -0.8436279296875, -0.8017425537109375, -0.759857177734375, -0.7179718017578125, -0.67608642578125, -0.6342010498046875, -0.592315673828125, -0.5504302978515625, -0.508544921875, -0.4666595458984375, -0.424774169921875, -0.3828887939453125, -0.34100341796875, -0.2991180419921875, -0.257232666015625, -0.2153472900390625, -0.1734619140625, -0.1315765380859375, -0.089691162109375, -0.0478057861328125, -0.00592041015625, 0.0359649658203125, 0.077850341796875, 0.1197357177734375, 0.16162109375, 0.2035064697265625, 0.245391845703125, 0.2872772216796875, 0.32916259765625, 0.3710479736328125, 0.412933349609375, 0.4548187255859375, 0.4967041015625, 0.5385894775390625, 0.580474853515625, 0.6223602294921875, 0.66424560546875, 0.7061309814453125, 0.748016357421875, 0.7899017333984375, 0.831787109375, 0.8736724853515625, 0.915557861328125, 0.9574432373046875, 0.99932861328125, 1.0412139892578125, 1.083099365234375, 1.1249847412109375, 1.1668701171875, 1.2087554931640625, 1.250640869140625, 1.2925262451171875, 1.33441162109375, 1.3762969970703125, 1.418182373046875, 1.4600677490234375, 1.501953125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 4.0, 9.0, 11.0, 23.0, 29.0, 54.0, 75.0, 114.0, 181.0, 286.0, 429.0, 629.0, 1027.0, 1530.0, 2538.0, 3924.0, 5983.0, 9213.0, 14361.0, 23212.0, 37727.0, 63487.0, 117915.0, 1313134.0, 232604.0, 110295.0, 61028.0, 35987.0, 22170.0, 14305.0, 8912.0, 5676.0, 3580.0, 2363.0, 1520.0, 995.0, 646.0, 438.0, 251.0, 166.0, 93.0, 71.0, 44.0, 23.0, 21.0, 13.0, 12.0, 11.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.043182373046875, -0.04187202453613281, -0.040561676025390625, -0.03925132751464844, -0.03794097900390625, -0.03663063049316406, -0.035320281982421875, -0.03400993347167969, -0.0326995849609375, -0.03138923645019531, -0.030078887939453125, -0.028768539428710938, -0.02745819091796875, -0.026147842407226562, -0.024837493896484375, -0.023527145385742188, -0.022216796875, -0.020906448364257812, -0.019596099853515625, -0.018285751342773438, -0.01697540283203125, -0.015665054321289062, -0.014354705810546875, -0.013044357299804688, -0.0117340087890625, -0.010423660278320312, -0.009113311767578125, -0.0078029632568359375, -0.00649261474609375, -0.0051822662353515625, -0.003871917724609375, -0.0025615692138671875, -0.001251220703125, 5.91278076171875e-05, 0.001369476318359375, 0.0026798248291015625, 0.00399017333984375, 0.0053005218505859375, 0.006610870361328125, 0.007921218872070312, 0.0092315673828125, 0.010541915893554688, 0.011852264404296875, 0.013162612915039062, 0.01447296142578125, 0.015783309936523438, 0.017093658447265625, 0.018404006958007812, 0.01971435546875, 0.021024703979492188, 0.022335052490234375, 0.023645401000976562, 0.02495574951171875, 0.026266098022460938, 0.027576446533203125, 0.028886795043945312, 0.0301971435546875, 0.03150749206542969, 0.032817840576171875, 0.03412818908691406, 0.03543853759765625, 0.03674888610839844, 0.038059234619140625, 0.03936958312988281, 0.040679931640625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 0.0, 10.0, 6.0, 14.0, 13.0, 0.0, 13.0, 36.0, 52.0, 88.0, 0.0, 527.0, 102.0, 57.0, 0.0, 28.0, 10.0, 12.0, 6.0, 0.0, 6.0, 4.0, 3.0, 0.0, 7.0, 0.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.9203871488571167e-06, -1.8738210201263428e-06, -1.8272548913955688e-06, -1.780688762664795e-06, -1.734122633934021e-06, -1.687556505203247e-06, -1.6409903764724731e-06, -1.5944242477416992e-06, -1.5478581190109253e-06, -1.5012919902801514e-06, -1.4547258615493774e-06, -1.4081597328186035e-06, -1.3615936040878296e-06, -1.3150274753570557e-06, -1.2684613466262817e-06, -1.2218952178955078e-06, -1.1753290891647339e-06, -1.12876296043396e-06, -1.082196831703186e-06, -1.0356307029724121e-06, -9.890645742416382e-07, -9.424984455108643e-07, -8.959323167800903e-07, -8.493661880493164e-07, -8.028000593185425e-07, -7.562339305877686e-07, -7.096678018569946e-07, -6.631016731262207e-07, -6.165355443954468e-07, -5.699694156646729e-07, -5.234032869338989e-07, -4.76837158203125e-07, -4.302710294723511e-07, -3.8370490074157715e-07, -3.371387720108032e-07, -2.905726432800293e-07, -2.4400651454925537e-07, -1.9744038581848145e-07, -1.5087425708770752e-07, -1.043081283569336e-07, -5.774199962615967e-08, -1.1175870895385742e-08, 3.5390257835388184e-08, 8.195638656616211e-08, 1.2852251529693604e-07, 1.7508864402770996e-07, 2.2165477275848389e-07, 2.682209014892578e-07, 3.1478703022003174e-07, 3.6135315895080566e-07, 4.079192876815796e-07, 4.544854164123535e-07, 5.010515451431274e-07, 5.476176738739014e-07, 5.941838026046753e-07, 6.407499313354492e-07, 6.873160600662231e-07, 7.338821887969971e-07, 7.80448317527771e-07, 8.270144462585449e-07, 8.735805749893188e-07, 9.201467037200928e-07, 9.667128324508667e-07, 1.0132789611816406e-06]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 3.0, 4.0, 7.0, 7.0, 13.0, 9.0, 30.0, 44.0, 74.0, 129.0, 372.0, 15033.0, 1021847.0, 10387.0, 305.0, 93.0, 48.0, 46.0, 29.0, 24.0, 20.0, 17.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9550323486328125e-05, -1.8716789782047272e-05, -1.788325607776642e-05, -1.7049722373485565e-05, -1.6216188669204712e-05, -1.538265496492386e-05, -1.4549121260643005e-05, -1.3715587556362152e-05, -1.2882053852081299e-05, -1.2048520147800446e-05, -1.1214986443519592e-05, -1.0381452739238739e-05, -9.547919034957886e-06, -8.714385330677032e-06, -7.88085162639618e-06, -7.047317922115326e-06, -6.213784217834473e-06, -5.380250513553619e-06, -4.546716809272766e-06, -3.713183104991913e-06, -2.8796494007110596e-06, -2.0461156964302063e-06, -1.212581992149353e-06, -3.7904828786849976e-07, 4.544854164123535e-07, 1.2880191206932068e-06, 2.12155282497406e-06, 2.9550865292549133e-06, 3.7886202335357666e-06, 4.62215393781662e-06, 5.455687642097473e-06, 6.289221346378326e-06, 7.12275505065918e-06, 7.956288754940033e-06, 8.789822459220886e-06, 9.62335616350174e-06, 1.0456889867782593e-05, 1.1290423572063446e-05, 1.21239572763443e-05, 1.2957490980625153e-05, 1.3791024684906006e-05, 1.4624558389186859e-05, 1.5458092093467712e-05, 1.6291625797748566e-05, 1.712515950202942e-05, 1.7958693206310272e-05, 1.8792226910591125e-05, 1.962576061487198e-05, 2.0459294319152832e-05, 2.1292828023433685e-05, 2.212636172771454e-05, 2.2959895431995392e-05, 2.3793429136276245e-05, 2.46269628405571e-05, 2.546049654483795e-05, 2.6294030249118805e-05, 2.7127563953399658e-05, 2.796109765768051e-05, 2.8794631361961365e-05, 2.9628165066242218e-05, 3.046169877052307e-05, 3.1295232474803925e-05, 3.212876617908478e-05, 3.296229988336563e-05, 3.3795833587646484e-05]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 11.0, 16.0, 20.0, 31.0, 833.0, 31.0, 22.0, 21.0, 11.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.063435300049605e-07, -8.880516588760656e-07, -8.697597309037519e-07, -8.514678597748571e-07, -8.331759318025433e-07, -8.148840606736485e-07, -7.965921895447536e-07, -7.783002615724399e-07, -7.600083904435451e-07, -7.417165193146502e-07, -7.234245913423365e-07, -7.051327202134416e-07, -6.868407922411279e-07, -6.685489211122331e-07, -6.502569931399194e-07, -6.319651220110245e-07, -6.136732508821297e-07, -5.953813797532348e-07, -5.770894517809211e-07, -5.587975806520262e-07, -5.405056526797125e-07, -5.222137815508177e-07, -5.039219104219228e-07, -4.856299824496091e-07, -4.6733805447729537e-07, -4.490461549266911e-07, -4.307542553760868e-07, -4.1246238424719195e-07, -3.9417048469658766e-07, -3.758785851459834e-07, -3.575866855953791e-07, -3.392947860447748e-07, -3.210029433375894e-07, -3.027110437869851e-07, -2.844191442363808e-07, -2.6612724468577653e-07, -2.478353735568817e-07, -2.295434740062774e-07, -2.112515744556731e-07, -1.9295968911592354e-07, -1.7466778956531925e-07, -1.5637589001471497e-07, -1.380840046749654e-07, -1.1979210512436111e-07, -1.0150021267918419e-07, -8.320832023400726e-08, -6.491642068340298e-08, -4.6624535343653406e-08, -2.833263579304912e-08, -1.0040741571515355e-08, 8.251152650018412e-09, 2.6543048647909018e-08, 4.4834941093085945e-08, 6.312683353826287e-08, 8.141873308886716e-08, 9.971061842861673e-08, 1.1800251797922101e-07, 1.362944175298253e-07, 1.5458630286957487e-07, 1.7287820242017915e-07, 1.9117010197078343e-07, 2.09461987310533e-07, 2.277538868611373e-07, 2.4604577220088686e-07, 2.6433767175149114e-07]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 825.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0], "bins": [-1.7881393432617188e-07, -1.7415732145309448e-07, -1.695007085800171e-07, -1.648440957069397e-07, -1.601874828338623e-07, -1.555308699607849e-07, -1.5087425708770752e-07, -1.4621764421463013e-07, -1.4156103134155273e-07, -1.3690441846847534e-07, -1.3224780559539795e-07, -1.2759119272232056e-07, -1.2293457984924316e-07, -1.1827796697616577e-07, -1.1362135410308838e-07, -1.0896474123001099e-07, -1.043081283569336e-07, -9.96515154838562e-08, -9.499490261077881e-08, -9.033828973770142e-08, -8.568167686462402e-08, -8.102506399154663e-08, -7.636845111846924e-08, -7.171183824539185e-08, -6.705522537231445e-08, -6.239861249923706e-08, -5.774199962615967e-08, -5.3085386753082275e-08, -4.842877388000488e-08, -4.377216100692749e-08, -3.91155481338501e-08, -3.4458935260772705e-08, -2.9802322387695312e-08, -2.514570951461792e-08, -2.0489096641540527e-08, -1.5832483768463135e-08, -1.1175870895385742e-08, -6.51925802230835e-09, -1.862645149230957e-09, 2.7939677238464355e-09, 7.450580596923828e-09, 1.210719347000122e-08, 1.6763806343078613e-08, 2.1420419216156006e-08, 2.60770320892334e-08, 3.073364496231079e-08, 3.5390257835388184e-08, 4.0046870708465576e-08, 4.470348358154297e-08, 4.936009645462036e-08, 5.4016709327697754e-08, 5.8673322200775146e-08, 6.332993507385254e-08, 6.798654794692993e-08, 7.264316082000732e-08, 7.729977369308472e-08, 8.195638656616211e-08, 8.66129994392395e-08, 9.12696123123169e-08, 9.592622518539429e-08, 1.0058283805847168e-07, 1.0523945093154907e-07, 1.0989606380462646e-07, 1.1455267667770386e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 5.0, 7.0, 6.0, 9.0, 11.0, 16.0, 13.0, 20.0, 15.0, 19.0, 20.0, 27.0, 30.0, 32.0, 35.0, 35.0, 39.0, 28.0, 36.0, 36.0, 38.0, 47.0, 36.0, 42.0, 38.0, 35.0, 35.0, 37.0, 41.0, 29.0, 25.0, 20.0, 19.0, 19.0, 19.0, 18.0, 19.0, 11.0, 6.0, 7.0, 8.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.564453125, -1.5109100341796875, -1.457366943359375, -1.4038238525390625, -1.35028076171875, -1.2967376708984375, -1.243194580078125, -1.1896514892578125, -1.1361083984375, -1.0825653076171875, -1.029022216796875, -0.9754791259765625, -0.92193603515625, -0.8683929443359375, -0.814849853515625, -0.7613067626953125, -0.707763671875, -0.6542205810546875, -0.600677490234375, -0.5471343994140625, -0.49359130859375, -0.4400482177734375, -0.386505126953125, -0.3329620361328125, -0.2794189453125, -0.2258758544921875, -0.172332763671875, -0.1187896728515625, -0.06524658203125, -0.0117034912109375, 0.041839599609375, 0.0953826904296875, 0.14892578125, 0.2024688720703125, 0.256011962890625, 0.3095550537109375, 0.36309814453125, 0.4166412353515625, 0.470184326171875, 0.5237274169921875, 0.5772705078125, 0.6308135986328125, 0.684356689453125, 0.7378997802734375, 0.79144287109375, 0.8449859619140625, 0.898529052734375, 0.9520721435546875, 1.005615234375, 1.0591583251953125, 1.112701416015625, 1.1662445068359375, 1.21978759765625, 1.2733306884765625, 1.326873779296875, 1.3804168701171875, 1.4339599609375, 1.4875030517578125, 1.541046142578125, 1.5945892333984375, 1.64813232421875, 1.7016754150390625, 1.755218505859375, 1.8087615966796875, 1.8623046875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 13.0, 14.0, 17.0, 22.0, 34.0, 44.0, 68.0, 103.0, 153.0, 247.0, 364.0, 503.0, 840.0, 1266.0, 1894.0, 2788.0, 4445.0, 6991.0, 11094.0, 18522.0, 31781.0, 58669.0, 116746.0, 253323.0, 269789.0, 123177.0, 61579.0, 32891.0, 19021.0, 11456.0, 7303.0, 4625.0, 2956.0, 2011.0, 1236.0, 870.0, 584.0, 377.0, 272.0, 128.0, 116.0, 65.0, 52.0, 33.0, 26.0, 23.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.296875, -2.222869873046875, -2.14886474609375, -2.074859619140625, -2.0008544921875, -1.926849365234375, -1.85284423828125, -1.778839111328125, -1.704833984375, -1.630828857421875, -1.55682373046875, -1.482818603515625, -1.4088134765625, -1.334808349609375, -1.26080322265625, -1.186798095703125, -1.11279296875, -1.038787841796875, -0.96478271484375, -0.890777587890625, -0.8167724609375, -0.742767333984375, -0.66876220703125, -0.594757080078125, -0.520751953125, -0.446746826171875, -0.37274169921875, -0.298736572265625, -0.2247314453125, -0.150726318359375, -0.07672119140625, -0.002716064453125, 0.0712890625, 0.145294189453125, 0.21929931640625, 0.293304443359375, 0.3673095703125, 0.441314697265625, 0.51531982421875, 0.589324951171875, 0.663330078125, 0.737335205078125, 0.81134033203125, 0.885345458984375, 0.9593505859375, 1.033355712890625, 1.10736083984375, 1.181365966796875, 1.25537109375, 1.329376220703125, 1.40338134765625, 1.477386474609375, 1.5513916015625, 1.625396728515625, 1.69940185546875, 1.773406982421875, 1.847412109375, 1.921417236328125, 1.99542236328125, 2.069427490234375, 2.1434326171875, 2.217437744140625, 2.29144287109375, 2.365447998046875, 2.439453125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 15.0, 10.0, 17.0, 23.0, 28.0, 34.0, 33.0, 46.0, 53.0, 59.0, 91.0, 131.0, 202.0, 1456.0, 286.0, 128.0, 84.0, 67.0, 48.0, 42.0, 32.0, 30.0, 28.0, 21.0, 17.0, 23.0, 10.0, 7.0, 6.0, 5.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8203125, -9.5595703125, -9.298828125, -9.0380859375, -8.77734375, -8.5166015625, -8.255859375, -7.9951171875, -7.734375, -7.4736328125, -7.212890625, -6.9521484375, -6.69140625, -6.4306640625, -6.169921875, -5.9091796875, -5.6484375, -5.3876953125, -5.126953125, -4.8662109375, -4.60546875, -4.3447265625, -4.083984375, -3.8232421875, -3.5625, -3.3017578125, -3.041015625, -2.7802734375, -2.51953125, -2.2587890625, -1.998046875, -1.7373046875, -1.4765625, -1.2158203125, -0.955078125, -0.6943359375, -0.43359375, -0.1728515625, 0.087890625, 0.3486328125, 0.609375, 0.8701171875, 1.130859375, 1.3916015625, 1.65234375, 1.9130859375, 2.173828125, 2.4345703125, 2.6953125, 2.9560546875, 3.216796875, 3.4775390625, 3.73828125, 3.9990234375, 4.259765625, 4.5205078125, 4.78125, 5.0419921875, 5.302734375, 5.5634765625, 5.82421875, 6.0849609375, 6.345703125, 6.6064453125, 6.8671875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 6.0, 4.0, 17.0, 13.0, 11.0, 16.0, 21.0, 29.0, 37.0, 64.0, 85.0, 134.0, 199.0, 399.0, 1011.0, 3811.0, 20505.0, 203475.0, 2537584.0, 342049.0, 28859.0, 4915.0, 1247.0, 495.0, 237.0, 122.0, 101.0, 58.0, 56.0, 36.0, 28.0, 28.0, 14.0, 8.0, 8.0, 8.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.234375, -9.8997802734375, -9.565185546875, -9.2305908203125, -8.89599609375, -8.5614013671875, -8.226806640625, -7.8922119140625, -7.5576171875, -7.2230224609375, -6.888427734375, -6.5538330078125, -6.21923828125, -5.8846435546875, -5.550048828125, -5.2154541015625, -4.880859375, -4.5462646484375, -4.211669921875, -3.8770751953125, -3.54248046875, -3.2078857421875, -2.873291015625, -2.5386962890625, -2.2041015625, -1.8695068359375, -1.534912109375, -1.2003173828125, -0.86572265625, -0.5311279296875, -0.196533203125, 0.1380615234375, 0.47265625, 0.8072509765625, 1.141845703125, 1.4764404296875, 1.81103515625, 2.1456298828125, 2.480224609375, 2.8148193359375, 3.1494140625, 3.4840087890625, 3.818603515625, 4.1531982421875, 4.48779296875, 4.8223876953125, 5.156982421875, 5.4915771484375, 5.826171875, 6.1607666015625, 6.495361328125, 6.8299560546875, 7.16455078125, 7.4991455078125, 7.833740234375, 8.1683349609375, 8.5029296875, 8.8375244140625, 9.172119140625, 9.5067138671875, 9.84130859375, 10.1759033203125, 10.510498046875, 10.8450927734375, 11.1796875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [108.0, 871.0, 39.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.390555381774902, -2.889803886413574, 3.610947608947754, 10.111699104309082, 16.612449645996094, 23.113201141357422, 29.61395263671875, 36.11470413208008, 42.615455627441406, 49.116207122802734, 55.61695861816406, 62.11771011352539, 68.61846160888672, 75.11921691894531, 81.61996459960938, 88.12071228027344, 94.62146759033203, 101.12222290039062, 107.62297058105469, 114.12371826171875, 120.62447357177734, 127.12522888183594, 133.6259765625, 140.12672424316406, 146.6274871826172, 153.12823486328125, 159.62899780273438, 166.12974548339844, 172.6304931640625, 179.13124084472656, 185.63198852539062, 192.13275146484375, 198.63348388671875, 205.1342315673828, 211.63497924804688, 218.1357421875, 224.63648986816406, 231.13723754882812, 237.63800048828125, 244.1387481689453, 250.63949584960938, 257.1402587890625, 263.6409912109375, 270.1417541503906, 276.64251708984375, 283.14324951171875, 289.6440124511719, 296.1447448730469, 302.6455078125, 309.1462707519531, 315.6470031738281, 322.14776611328125, 328.64849853515625, 335.1492614746094, 341.6500244140625, 348.1507568359375, 354.6515197753906, 361.15228271484375, 367.65301513671875, 374.1537780761719, 380.654541015625, 387.1552734375, 393.6560363769531, 400.1567687988281, 406.65753173828125]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 5.0, 16.0, 9.0, 5.0, 9.0, 10.0, 17.0, 22.0, 22.0, 18.0, 27.0, 26.0, 31.0, 34.0, 39.0, 37.0, 30.0, 40.0, 33.0, 38.0, 40.0, 35.0, 48.0, 41.0, 43.0, 41.0, 26.0, 29.0, 26.0, 24.0, 26.0, 23.0, 14.0, 11.0, 20.0, 14.0, 11.0, 10.0, 12.0, 10.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0], "bins": [-22.254898071289062, -21.652996063232422, -21.05109405517578, -20.449193954467773, -19.847291946411133, -19.245389938354492, -18.643489837646484, -18.041587829589844, -17.439685821533203, -16.837783813476562, -16.235881805419922, -15.633981704711914, -15.032079696655273, -14.430177688598633, -13.828276634216309, -13.226375579833984, -12.624473571777344, -12.022571563720703, -11.420670509338379, -10.818769454956055, -10.216867446899414, -9.614965438842773, -9.01306438446045, -8.411163330078125, -7.809261322021484, -7.207359790802002, -6.6054582595825195, -6.003556728363037, -5.401655197143555, -4.799753665924072, -4.19785213470459, -3.5959506034851074, -2.994047164916992, -2.3921456336975098, -1.7902441024780273, -1.188342571258545, -0.5864410400390625, 0.015460491180419922, 0.6173620223999023, 1.2192635536193848, 1.8211650848388672, 2.4230666160583496, 3.024968147277832, 3.6268696784973145, 4.228771209716797, 4.830672740936279, 5.432574272155762, 6.034475803375244, 6.636377334594727, 7.238278865814209, 7.840180397033691, 8.442081451416016, 9.043983459472656, 9.645885467529297, 10.247786521911621, 10.849687576293945, 11.451589584350586, 12.053491592407227, 12.65539264678955, 13.257293701171875, 13.859195709228516, 14.461097717285156, 15.06299877166748, 15.664899826049805, 16.266801834106445]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 13.0, 10.0, 13.0, 14.0, 16.0, 18.0, 18.0, 17.0, 19.0, 23.0, 17.0, 27.0, 35.0, 34.0, 26.0, 30.0, 35.0, 39.0, 36.0, 36.0, 41.0, 29.0, 36.0, 44.0, 31.0, 28.0, 35.0, 34.0, 36.0, 31.0, 20.0, 15.0, 18.0, 18.0, 20.0, 15.0, 11.0, 8.0, 10.0, 7.0, 10.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5224609375, -1.469940185546875, -1.41741943359375, -1.364898681640625, -1.3123779296875, -1.259857177734375, -1.20733642578125, -1.154815673828125, -1.102294921875, -1.049774169921875, -0.99725341796875, -0.944732666015625, -0.8922119140625, -0.839691162109375, -0.78717041015625, -0.734649658203125, -0.68212890625, -0.629608154296875, -0.57708740234375, -0.524566650390625, -0.4720458984375, -0.419525146484375, -0.36700439453125, -0.314483642578125, -0.261962890625, -0.209442138671875, -0.15692138671875, -0.104400634765625, -0.0518798828125, 0.000640869140625, 0.05316162109375, 0.105682373046875, 0.158203125, 0.210723876953125, 0.26324462890625, 0.315765380859375, 0.3682861328125, 0.420806884765625, 0.47332763671875, 0.525848388671875, 0.578369140625, 0.630889892578125, 0.68341064453125, 0.735931396484375, 0.7884521484375, 0.840972900390625, 0.89349365234375, 0.946014404296875, 0.99853515625, 1.051055908203125, 1.10357666015625, 1.156097412109375, 1.2086181640625, 1.261138916015625, 1.31365966796875, 1.366180419921875, 1.418701171875, 1.471221923828125, 1.52374267578125, 1.576263427734375, 1.6287841796875, 1.681304931640625, 1.73382568359375, 1.786346435546875, 1.8388671875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 5.0, 12.0, 9.0, 11.0, 21.0, 24.0, 29.0, 62.0, 94.0, 130.0, 205.0, 326.0, 544.0, 952.0, 1785.0, 3436.0, 7031.0, 14621.0, 32495.0, 72687.0, 164995.0, 379036.0, 850934.0, 1282715.0, 772347.0, 340888.0, 147914.0, 64867.0, 29195.0, 13388.0, 6402.0, 3243.0, 1670.0, 861.0, 506.0, 286.0, 196.0, 126.0, 80.0, 47.0, 35.0, 25.0, 18.0, 8.0, 8.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.693359375, -2.615142822265625, -2.53692626953125, -2.458709716796875, -2.3804931640625, -2.302276611328125, -2.22406005859375, -2.145843505859375, -2.067626953125, -1.989410400390625, -1.91119384765625, -1.832977294921875, -1.7547607421875, -1.676544189453125, -1.59832763671875, -1.520111083984375, -1.44189453125, -1.363677978515625, -1.28546142578125, -1.207244873046875, -1.1290283203125, -1.050811767578125, -0.97259521484375, -0.894378662109375, -0.816162109375, -0.737945556640625, -0.65972900390625, -0.581512451171875, -0.5032958984375, -0.425079345703125, -0.34686279296875, -0.268646240234375, -0.1904296875, -0.112213134765625, -0.03399658203125, 0.044219970703125, 0.1224365234375, 0.200653076171875, 0.27886962890625, 0.357086181640625, 0.435302734375, 0.513519287109375, 0.59173583984375, 0.669952392578125, 0.7481689453125, 0.826385498046875, 0.90460205078125, 0.982818603515625, 1.06103515625, 1.139251708984375, 1.21746826171875, 1.295684814453125, 1.3739013671875, 1.452117919921875, 1.53033447265625, 1.608551025390625, 1.686767578125, 1.764984130859375, 1.84320068359375, 1.921417236328125, 1.9996337890625, 2.077850341796875, 2.15606689453125, 2.234283447265625, 2.3125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 7.0, 11.0, 15.0, 19.0, 36.0, 61.0, 99.0, 137.0, 202.0, 284.0, 414.0, 538.0, 579.0, 471.0, 371.0, 274.0, 173.0, 140.0, 81.0, 56.0, 38.0, 26.0, 14.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4375, -9.219970703125, -9.00244140625, -8.784912109375, -8.5673828125, -8.349853515625, -8.13232421875, -7.914794921875, -7.697265625, -7.479736328125, -7.26220703125, -7.044677734375, -6.8271484375, -6.609619140625, -6.39208984375, -6.174560546875, -5.95703125, -5.739501953125, -5.52197265625, -5.304443359375, -5.0869140625, -4.869384765625, -4.65185546875, -4.434326171875, -4.216796875, -3.999267578125, -3.78173828125, -3.564208984375, -3.3466796875, -3.129150390625, -2.91162109375, -2.694091796875, -2.4765625, -2.259033203125, -2.04150390625, -1.823974609375, -1.6064453125, -1.388916015625, -1.17138671875, -0.953857421875, -0.736328125, -0.518798828125, -0.30126953125, -0.083740234375, 0.1337890625, 0.351318359375, 0.56884765625, 0.786376953125, 1.00390625, 1.221435546875, 1.43896484375, 1.656494140625, 1.8740234375, 2.091552734375, 2.30908203125, 2.526611328125, 2.744140625, 2.961669921875, 3.17919921875, 3.396728515625, 3.6142578125, 3.831787109375, 4.04931640625, 4.266845703125, 4.484375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 14.0, 28.0, 35.0, 65.0, 114.0, 178.0, 312.0, 633.0, 1579.0, 4872.0, 20391.0, 111309.0, 653333.0, 2231565.0, 960686.0, 169209.0, 29809.0, 6654.0, 1947.0, 714.0, 336.0, 185.0, 116.0, 59.0, 38.0, 32.0, 22.0, 15.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.13671875, -6.86859130859375, -6.6004638671875, -6.33233642578125, -6.064208984375, -5.79608154296875, -5.5279541015625, -5.25982666015625, -4.99169921875, -4.72357177734375, -4.4554443359375, -4.18731689453125, -3.919189453125, -3.65106201171875, -3.3829345703125, -3.11480712890625, -2.8466796875, -2.57855224609375, -2.3104248046875, -2.04229736328125, -1.774169921875, -1.50604248046875, -1.2379150390625, -0.96978759765625, -0.70166015625, -0.43353271484375, -0.1654052734375, 0.10272216796875, 0.370849609375, 0.63897705078125, 0.9071044921875, 1.17523193359375, 1.443359375, 1.71148681640625, 1.9796142578125, 2.24774169921875, 2.515869140625, 2.78399658203125, 3.0521240234375, 3.32025146484375, 3.58837890625, 3.85650634765625, 4.1246337890625, 4.39276123046875, 4.660888671875, 4.92901611328125, 5.1971435546875, 5.46527099609375, 5.7333984375, 6.00152587890625, 6.2696533203125, 6.53778076171875, 6.805908203125, 7.07403564453125, 7.3421630859375, 7.61029052734375, 7.87841796875, 8.14654541015625, 8.4146728515625, 8.68280029296875, 8.950927734375, 9.21905517578125, 9.4871826171875, 9.75531005859375, 10.0234375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 10.0, 30.0, 46.0, 124.0, 171.0, 174.0, 192.0, 156.0, 62.0, 30.0, 16.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.161182403564453, -15.189746856689453, -13.218311309814453, -11.24687671661377, -9.27544116973877, -7.3040056228637695, -5.332571029663086, -3.361135482788086, -1.389699935913086, 0.581735372543335, 2.553170680999756, 4.524605751037598, 6.496041297912598, 8.467476844787598, 10.438911437988281, 12.410346984863281, 14.381782531738281, 16.35321807861328, 18.32465362548828, 20.29608917236328, 22.26752471923828, 24.23896026611328, 26.21039390563965, 28.18182945251465, 30.15326499938965, 32.124698638916016, 34.096134185791016, 36.067569732666016, 38.039005279541016, 40.010440826416016, 41.981876373291016, 43.953311920166016, 45.92474365234375, 47.89617919921875, 49.86761474609375, 51.83905029296875, 53.81048583984375, 55.78192138671875, 57.75335693359375, 59.72479248046875, 61.69622802734375, 63.66766357421875, 65.63909912109375, 67.61053466796875, 69.58197021484375, 71.55340576171875, 73.52484130859375, 75.49627685546875, 77.46771240234375, 79.43914794921875, 81.41058349609375, 83.38201904296875, 85.35345458984375, 87.32489013671875, 89.29632568359375, 91.26776123046875, 93.23918914794922, 95.21062469482422, 97.18206024169922, 99.15349578857422, 101.12493133544922, 103.09636688232422, 105.06780242919922, 107.03923797607422, 109.01067352294922]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 6.0, 10.0, 8.0, 10.0, 14.0, 8.0, 19.0, 19.0, 17.0, 28.0, 20.0, 19.0, 24.0, 37.0, 35.0, 34.0, 31.0, 44.0, 31.0, 39.0, 44.0, 36.0, 41.0, 49.0, 38.0, 38.0, 39.0, 24.0, 24.0, 29.0, 32.0, 21.0, 22.0, 22.0, 13.0, 12.0, 13.0, 6.0, 10.0, 11.0, 6.0, 5.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-20.3746337890625, -19.805919647216797, -19.237205505371094, -18.668493270874023, -18.09977912902832, -17.531064987182617, -16.962352752685547, -16.393638610839844, -15.82492446899414, -15.256210327148438, -14.68749713897705, -14.118783950805664, -13.550069808959961, -12.981355667114258, -12.412642478942871, -11.843929290771484, -11.275215148925781, -10.706501007080078, -10.137787818908691, -9.569074630737305, -9.000360488891602, -8.431646347045898, -7.862933158874512, -7.294219493865967, -6.725505828857422, -6.156792163848877, -5.588078498840332, -5.019364833831787, -4.450651168823242, -3.8819375038146973, -3.3132238388061523, -2.7445101737976074, -2.1757965087890625, -1.6070828437805176, -1.0383691787719727, -0.46965551376342773, 0.09905815124511719, 0.6677718162536621, 1.236485481262207, 1.805199146270752, 2.373912811279297, 2.942626476287842, 3.5113401412963867, 4.080053806304932, 4.648767471313477, 5.2174811363220215, 5.786194801330566, 6.354908466339111, 6.923622131347656, 7.492335796356201, 8.061049461364746, 8.629762649536133, 9.198476791381836, 9.767190933227539, 10.335904121398926, 10.904617309570312, 11.473331451416016, 12.042045593261719, 12.610758781433105, 13.179471969604492, 13.748186111450195, 14.316900253295898, 14.885613441467285, 15.454326629638672, 16.023040771484375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 7.0, 8.0, 9.0, 6.0, 14.0, 16.0, 10.0, 15.0, 23.0, 19.0, 19.0, 25.0, 26.0, 24.0, 34.0, 44.0, 29.0, 34.0, 35.0, 35.0, 35.0, 36.0, 36.0, 35.0, 33.0, 38.0, 30.0, 35.0, 25.0, 31.0, 28.0, 24.0, 21.0, 23.0, 25.0, 12.0, 15.0, 18.0, 7.0, 12.0, 7.0, 10.0, 3.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.685546875, -1.6317291259765625, -1.577911376953125, -1.5240936279296875, -1.47027587890625, -1.4164581298828125, -1.362640380859375, -1.3088226318359375, -1.2550048828125, -1.2011871337890625, -1.147369384765625, -1.0935516357421875, -1.03973388671875, -0.9859161376953125, -0.932098388671875, -0.8782806396484375, -0.824462890625, -0.7706451416015625, -0.716827392578125, -0.6630096435546875, -0.60919189453125, -0.5553741455078125, -0.501556396484375, -0.4477386474609375, -0.3939208984375, -0.3401031494140625, -0.286285400390625, -0.2324676513671875, -0.17864990234375, -0.1248321533203125, -0.071014404296875, -0.0171966552734375, 0.03662109375, 0.0904388427734375, 0.144256591796875, 0.1980743408203125, 0.25189208984375, 0.3057098388671875, 0.359527587890625, 0.4133453369140625, 0.4671630859375, 0.5209808349609375, 0.574798583984375, 0.6286163330078125, 0.68243408203125, 0.7362518310546875, 0.790069580078125, 0.8438873291015625, 0.897705078125, 0.9515228271484375, 1.005340576171875, 1.0591583251953125, 1.11297607421875, 1.1667938232421875, 1.220611572265625, 1.2744293212890625, 1.3282470703125, 1.3820648193359375, 1.435882568359375, 1.4897003173828125, 1.54351806640625, 1.5973358154296875, 1.651153564453125, 1.7049713134765625, 1.7587890625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 13.0, 25.0, 34.0, 45.0, 87.0, 106.0, 138.0, 192.0, 328.0, 449.0, 660.0, 904.0, 1332.0, 1824.0, 2832.0, 4111.0, 6173.0, 8938.0, 13152.0, 19413.0, 28986.0, 43838.0, 71135.0, 125008.0, 298872.0, 172042.0, 88530.0, 53570.0, 34381.0, 22907.0, 15482.0, 10401.0, 7138.0, 4823.0, 3368.0, 2207.0, 1551.0, 1083.0, 759.0, 499.0, 372.0, 231.0, 172.0, 127.0, 87.0, 63.0, 41.0, 41.0, 24.0, 17.0, 9.0, 5.0, 2.0, 5.0, 2.0, 6.0], "bins": [-0.07025146484375, -0.06810379028320312, -0.06595611572265625, -0.06380844116210938, -0.0616607666015625, -0.059513092041015625, -0.05736541748046875, -0.055217742919921875, -0.053070068359375, -0.050922393798828125, -0.04877471923828125, -0.046627044677734375, -0.0444793701171875, -0.042331695556640625, -0.04018402099609375, -0.038036346435546875, -0.035888671875, -0.033740997314453125, -0.03159332275390625, -0.029445648193359375, -0.0272979736328125, -0.025150299072265625, -0.02300262451171875, -0.020854949951171875, -0.018707275390625, -0.016559600830078125, -0.01441192626953125, -0.012264251708984375, -0.0101165771484375, -0.007968902587890625, -0.00582122802734375, -0.003673553466796875, -0.00152587890625, 0.000621795654296875, 0.00276947021484375, 0.004917144775390625, 0.0070648193359375, 0.009212493896484375, 0.01136016845703125, 0.013507843017578125, 0.015655517578125, 0.017803192138671875, 0.01995086669921875, 0.022098541259765625, 0.0242462158203125, 0.026393890380859375, 0.02854156494140625, 0.030689239501953125, 0.0328369140625, 0.034984588623046875, 0.03713226318359375, 0.039279937744140625, 0.0414276123046875, 0.043575286865234375, 0.04572296142578125, 0.047870635986328125, 0.050018310546875, 0.052165985107421875, 0.05431365966796875, 0.056461334228515625, 0.0586090087890625, 0.060756683349609375, 0.06290435791015625, 0.06505203247070312, 0.06719970703125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 2.0, 7.0, 7.0, 8.0, 14.0, 11.0, 11.0, 18.0, 19.0, 22.0, 17.0, 18.0, 27.0, 21.0, 27.0, 26.0, 34.0, 33.0, 37.0, 47.0, 43.0, 1066.0, 51.0, 32.0, 36.0, 31.0, 43.0, 27.0, 34.0, 26.0, 23.0, 33.0, 20.0, 18.0, 17.0, 15.0, 15.0, 13.0, 14.0, 14.0, 9.0, 4.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-1.271484375, -1.232635498046875, -1.19378662109375, -1.154937744140625, -1.1160888671875, -1.077239990234375, -1.03839111328125, -0.999542236328125, -0.960693359375, -0.921844482421875, -0.88299560546875, -0.844146728515625, -0.8052978515625, -0.766448974609375, -0.72760009765625, -0.688751220703125, -0.64990234375, -0.611053466796875, -0.57220458984375, -0.533355712890625, -0.4945068359375, -0.455657958984375, -0.41680908203125, -0.377960205078125, -0.339111328125, -0.300262451171875, -0.26141357421875, -0.222564697265625, -0.1837158203125, -0.144866943359375, -0.10601806640625, -0.067169189453125, -0.0283203125, 0.010528564453125, 0.04937744140625, 0.088226318359375, 0.1270751953125, 0.165924072265625, 0.20477294921875, 0.243621826171875, 0.282470703125, 0.321319580078125, 0.36016845703125, 0.399017333984375, 0.4378662109375, 0.476715087890625, 0.51556396484375, 0.554412841796875, 0.59326171875, 0.632110595703125, 0.67095947265625, 0.709808349609375, 0.7486572265625, 0.787506103515625, 0.82635498046875, 0.865203857421875, 0.904052734375, 0.942901611328125, 0.98175048828125, 1.020599365234375, 1.0594482421875, 1.098297119140625, 1.13714599609375, 1.175994873046875, 1.21484375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 8.0, 12.0, 12.0, 33.0, 41.0, 61.0, 95.0, 117.0, 174.0, 239.0, 375.0, 519.0, 729.0, 1049.0, 1428.0, 2022.0, 2994.0, 4170.0, 5702.0, 8087.0, 11346.0, 16262.0, 23434.0, 34496.0, 53662.0, 87596.0, 168414.0, 1343804.0, 121226.0, 69158.0, 43926.0, 28786.0, 19636.0, 13880.0, 9726.0, 7000.0, 4979.0, 3379.0, 2558.0, 1732.0, 1295.0, 889.0, 649.0, 433.0, 327.0, 192.0, 152.0, 106.0, 75.0, 56.0, 33.0, 25.0, 13.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.03497314453125, -0.03385496139526367, -0.032736778259277344, -0.031618595123291016, -0.030500411987304688, -0.02938222885131836, -0.02826404571533203, -0.027145862579345703, -0.026027679443359375, -0.024909496307373047, -0.02379131317138672, -0.02267313003540039, -0.021554946899414062, -0.020436763763427734, -0.019318580627441406, -0.018200397491455078, -0.01708221435546875, -0.015964031219482422, -0.014845848083496094, -0.013727664947509766, -0.012609481811523438, -0.01149129867553711, -0.010373115539550781, -0.009254932403564453, -0.008136749267578125, -0.007018566131591797, -0.005900382995605469, -0.004782199859619141, -0.0036640167236328125, -0.0025458335876464844, -0.0014276504516601562, -0.0003094673156738281, 0.0008087158203125, 0.0019268989562988281, 0.0030450820922851562, 0.004163265228271484, 0.0052814483642578125, 0.006399631500244141, 0.007517814636230469, 0.008635997772216797, 0.009754180908203125, 0.010872364044189453, 0.011990547180175781, 0.01310873031616211, 0.014226913452148438, 0.015345096588134766, 0.016463279724121094, 0.017581462860107422, 0.01869964599609375, 0.019817829132080078, 0.020936012268066406, 0.022054195404052734, 0.023172378540039062, 0.02429056167602539, 0.02540874481201172, 0.026526927947998047, 0.027645111083984375, 0.028763294219970703, 0.02988147735595703, 0.03099966049194336, 0.03211784362792969, 0.033236026763916016, 0.034354209899902344, 0.03547239303588867, 0.036590576171875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 11.0, 0.0, 13.0, 0.0, 18.0, 0.0, 21.0, 0.0, 39.0, 0.0, 51.0, 0.0, 79.0, 0.0, 497.0, 0.0, 96.0, 63.0, 0.0, 43.0, 0.0, 26.0, 0.0, 18.0, 0.0, 9.0, 0.0, 7.0, 0.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.5367431640625e-07, -9.220093488693237e-07, -8.903443813323975e-07, -8.586794137954712e-07, -8.270144462585449e-07, -7.953494787216187e-07, -7.636845111846924e-07, -7.320195436477661e-07, -7.003545761108398e-07, -6.686896085739136e-07, -6.370246410369873e-07, -6.05359673500061e-07, -5.736947059631348e-07, -5.420297384262085e-07, -5.103647708892822e-07, -4.78699803352356e-07, -4.470348358154297e-07, -4.153698682785034e-07, -3.8370490074157715e-07, -3.520399332046509e-07, -3.203749656677246e-07, -2.8870999813079834e-07, -2.5704503059387207e-07, -2.253800630569458e-07, -1.9371509552001953e-07, -1.6205012798309326e-07, -1.30385160446167e-07, -9.872019290924072e-08, -6.705522537231445e-08, -3.5390257835388184e-08, -3.725290298461914e-09, 2.7939677238464355e-08, 5.960464477539063e-08, 9.12696123123169e-08, 1.2293457984924316e-07, 1.5459954738616943e-07, 1.862645149230957e-07, 2.1792948246002197e-07, 2.4959444999694824e-07, 2.812594175338745e-07, 3.129243850708008e-07, 3.4458935260772705e-07, 3.762543201446533e-07, 4.079192876815796e-07, 4.3958425521850586e-07, 4.7124922275543213e-07, 5.029141902923584e-07, 5.345791578292847e-07, 5.662441253662109e-07, 5.979090929031372e-07, 6.295740604400635e-07, 6.612390279769897e-07, 6.92903995513916e-07, 7.245689630508423e-07, 7.562339305877686e-07, 7.878988981246948e-07, 8.195638656616211e-07, 8.512288331985474e-07, 8.828938007354736e-07, 9.145587682723999e-07, 9.462237358093262e-07, 9.778887033462524e-07, 1.0095536708831787e-06, 1.041218638420105e-06, 1.0728836059570312e-06]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 10.0, 6.0, 3.0, 14.0, 7.0, 23.0, 22.0, 54.0, 93.0, 125.0, 238.0, 1810.0, 26416.0, 928662.0, 85400.0, 4858.0, 397.0, 135.0, 66.0, 52.0, 27.0, 35.0, 18.0, 16.0, 16.0, 9.0, 9.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.704692840576172e-05, -1.6555190086364746e-05, -1.6063451766967773e-05, -1.55717134475708e-05, -1.5079975128173828e-05, -1.4588236808776855e-05, -1.4096498489379883e-05, -1.360476016998291e-05, -1.3113021850585938e-05, -1.2621283531188965e-05, -1.2129545211791992e-05, -1.163780689239502e-05, -1.1146068572998047e-05, -1.0654330253601074e-05, -1.0162591934204102e-05, -9.670853614807129e-06, -9.179115295410156e-06, -8.687376976013184e-06, -8.195638656616211e-06, -7.703900337219238e-06, -7.212162017822266e-06, -6.720423698425293e-06, -6.22868537902832e-06, -5.736947059631348e-06, -5.245208740234375e-06, -4.753470420837402e-06, -4.26173210144043e-06, -3.769993782043457e-06, -3.2782554626464844e-06, -2.7865171432495117e-06, -2.294778823852539e-06, -1.8030405044555664e-06, -1.3113021850585938e-06, -8.195638656616211e-07, -3.2782554626464844e-07, 1.6391277313232422e-07, 6.556510925292969e-07, 1.1473894119262695e-06, 1.6391277313232422e-06, 2.130866050720215e-06, 2.6226043701171875e-06, 3.11434268951416e-06, 3.606081008911133e-06, 4.0978193283081055e-06, 4.589557647705078e-06, 5.081295967102051e-06, 5.5730342864990234e-06, 6.064772605895996e-06, 6.556510925292969e-06, 7.048249244689941e-06, 7.539987564086914e-06, 8.031725883483887e-06, 8.52346420288086e-06, 9.015202522277832e-06, 9.506940841674805e-06, 9.998679161071777e-06, 1.049041748046875e-05, 1.0982155799865723e-05, 1.1473894119262695e-05, 1.1965632438659668e-05, 1.245737075805664e-05, 1.2949109077453613e-05, 1.3440847396850586e-05, 1.3932585716247559e-05, 1.4424324035644531e-05]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 9.0, 8.0, 22.0, 19.0, 29.0, 29.0, 37.0, 645.0, 38.0, 36.0, 33.0, 27.0, 22.0, 11.0, 9.0, 12.0, 5.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.801639642617374e-07, -6.659624887106474e-07, -6.517609563161386e-07, -6.375594807650486e-07, -6.233580052139587e-07, -6.091564728194498e-07, -5.949549972683599e-07, -5.807535217172699e-07, -5.665519893227611e-07, -5.523505137716711e-07, -5.381489813771623e-07, -5.239475058260723e-07, -5.097460302749823e-07, -4.955445547238924e-07, -4.813430223293835e-07, -4.6714154677829356e-07, -4.529400712272036e-07, -4.387385672544042e-07, -4.245370917033142e-07, -4.103355877305148e-07, -3.9613411217942485e-07, -3.8193260820662545e-07, -3.6773110423382604e-07, -3.535296286827361e-07, -3.393281247099367e-07, -3.2512662073713727e-07, -3.109251451860473e-07, -2.967236412132479e-07, -2.825221372404485e-07, -2.6832066168935853e-07, -2.5411915771655913e-07, -2.3991765374375973e-07, -2.2571616398181504e-07, -2.1151467421987036e-07, -1.9731317024707096e-07, -1.8311168048512627e-07, -1.6891019072318159e-07, -1.547087009612369e-07, -1.4050721119929221e-07, -1.2630570722649281e-07, -1.1210421746454813e-07, -9.790272770260344e-08, -8.37012308352314e-08, -6.949973396785936e-08, -5.529824420591467e-08, -4.1096754443969985e-08, -2.6895257576597942e-08, -1.2693760709225899e-08, 1.507729052718787e-09, 1.570922236737715e-08, 2.9910715682035516e-08, 4.411220899669388e-08, 5.8313702311352245e-08, 7.251519207329693e-08, 8.671668894066897e-08, 1.0091818580804102e-07, 1.151196755699857e-07, 1.293211653319304e-07, 1.435226693047298e-07, 1.5772415906667447e-07, 1.7192564882861916e-07, 1.8612713859056385e-07, 2.0032862835250853e-07, 2.1453013232530793e-07, 2.2873162208725262e-07]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 143.0, 0.0, 0.0, 0.0, 0.0, 0.0, 651.0, 0.0, 0.0, 0.0, 0.0, 0.0, 139.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4831464290618896e-07, -3.390014171600342e-07, -3.296881914138794e-07, -3.203749656677246e-07, -3.110617399215698e-07, -3.0174851417541504e-07, -2.9243528842926025e-07, -2.8312206268310547e-07, -2.738088369369507e-07, -2.644956111907959e-07, -2.551823854446411e-07, -2.4586915969848633e-07, -2.3655593395233154e-07, -2.2724270820617676e-07, -2.1792948246002197e-07, -2.086162567138672e-07, -1.993030309677124e-07, -1.8998980522155762e-07, -1.8067657947540283e-07, -1.7136335372924805e-07, -1.6205012798309326e-07, -1.5273690223693848e-07, -1.434236764907837e-07, -1.341104507446289e-07, -1.2479722499847412e-07, -1.1548399925231934e-07, -1.0617077350616455e-07, -9.685754776000977e-08, -8.754432201385498e-08, -7.82310962677002e-08, -6.891787052154541e-08, -5.960464477539063e-08, -5.029141902923584e-08, -4.0978193283081055e-08, -3.166496753692627e-08, -2.2351741790771484e-08, -1.30385160446167e-08, -3.725290298461914e-09, 5.587935447692871e-09, 1.4901161193847656e-08, 2.421438694000244e-08, 3.3527612686157227e-08, 4.284083843231201e-08, 5.21540641784668e-08, 6.146728992462158e-08, 7.078051567077637e-08, 8.009374141693115e-08, 8.940696716308594e-08, 9.872019290924072e-08, 1.0803341865539551e-07, 1.1734664440155029e-07, 1.2665987014770508e-07, 1.3597309589385986e-07, 1.4528632164001465e-07, 1.5459954738616943e-07, 1.6391277313232422e-07, 1.73225998878479e-07, 1.825392246246338e-07, 1.9185245037078857e-07, 2.0116567611694336e-07, 2.1047890186309814e-07, 2.1979212760925293e-07, 2.2910535335540771e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 7.0, 8.0, 9.0, 6.0, 14.0, 16.0, 10.0, 15.0, 23.0, 19.0, 19.0, 25.0, 26.0, 24.0, 34.0, 44.0, 29.0, 34.0, 35.0, 35.0, 35.0, 36.0, 36.0, 35.0, 33.0, 38.0, 30.0, 35.0, 25.0, 31.0, 28.0, 24.0, 21.0, 23.0, 25.0, 12.0, 15.0, 18.0, 7.0, 12.0, 7.0, 10.0, 3.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.685546875, -1.6317291259765625, -1.577911376953125, -1.5240936279296875, -1.47027587890625, -1.4164581298828125, -1.362640380859375, -1.3088226318359375, -1.2550048828125, -1.2011871337890625, -1.147369384765625, -1.0935516357421875, -1.03973388671875, -0.9859161376953125, -0.932098388671875, -0.8782806396484375, -0.824462890625, -0.7706451416015625, -0.716827392578125, -0.6630096435546875, -0.60919189453125, -0.5553741455078125, -0.501556396484375, -0.4477386474609375, -0.3939208984375, -0.3401031494140625, -0.286285400390625, -0.2324676513671875, -0.17864990234375, -0.1248321533203125, -0.071014404296875, -0.0171966552734375, 0.03662109375, 0.0904388427734375, 0.144256591796875, 0.1980743408203125, 0.25189208984375, 0.3057098388671875, 0.359527587890625, 0.4133453369140625, 0.4671630859375, 0.5209808349609375, 0.574798583984375, 0.6286163330078125, 0.68243408203125, 0.7362518310546875, 0.790069580078125, 0.8438873291015625, 0.897705078125, 0.9515228271484375, 1.005340576171875, 1.0591583251953125, 1.11297607421875, 1.1667938232421875, 1.220611572265625, 1.2744293212890625, 1.3282470703125, 1.3820648193359375, 1.435882568359375, 1.4897003173828125, 1.54351806640625, 1.5973358154296875, 1.651153564453125, 1.7049713134765625, 1.7587890625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 11.0, 6.0, 20.0, 29.0, 34.0, 54.0, 69.0, 130.0, 168.0, 279.0, 396.0, 646.0, 1080.0, 1540.0, 2288.0, 3517.0, 5708.0, 8925.0, 14612.0, 25808.0, 52119.0, 123215.0, 268916.0, 281640.0, 133187.0, 56087.0, 27093.0, 15150.0, 9197.0, 5854.0, 3706.0, 2451.0, 1616.0, 999.0, 690.0, 436.0, 285.0, 208.0, 129.0, 88.0, 55.0, 36.0, 19.0, 22.0, 10.0, 17.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.501953125, -2.421356201171875, -2.34075927734375, -2.260162353515625, -2.1795654296875, -2.098968505859375, -2.01837158203125, -1.937774658203125, -1.857177734375, -1.776580810546875, -1.69598388671875, -1.615386962890625, -1.5347900390625, -1.454193115234375, -1.37359619140625, -1.292999267578125, -1.21240234375, -1.131805419921875, -1.05120849609375, -0.970611572265625, -0.8900146484375, -0.809417724609375, -0.72882080078125, -0.648223876953125, -0.567626953125, -0.487030029296875, -0.40643310546875, -0.325836181640625, -0.2452392578125, -0.164642333984375, -0.08404541015625, -0.003448486328125, 0.0771484375, 0.157745361328125, 0.23834228515625, 0.318939208984375, 0.3995361328125, 0.480133056640625, 0.56072998046875, 0.641326904296875, 0.721923828125, 0.802520751953125, 0.88311767578125, 0.963714599609375, 1.0443115234375, 1.124908447265625, 1.20550537109375, 1.286102294921875, 1.36669921875, 1.447296142578125, 1.52789306640625, 1.608489990234375, 1.6890869140625, 1.769683837890625, 1.85028076171875, 1.930877685546875, 2.011474609375, 2.092071533203125, 2.17266845703125, 2.253265380859375, 2.3338623046875, 2.414459228515625, 2.49505615234375, 2.575653076171875, 2.65625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 7.0, 8.0, 7.0, 11.0, 18.0, 16.0, 20.0, 25.0, 25.0, 29.0, 38.0, 32.0, 61.0, 57.0, 79.0, 112.0, 178.0, 1358.0, 289.0, 146.0, 95.0, 74.0, 54.0, 50.0, 38.0, 42.0, 36.0, 24.0, 16.0, 14.0, 15.0, 16.0, 9.0, 8.0, 10.0, 8.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.6484375, -7.42242431640625, -7.1964111328125, -6.97039794921875, -6.744384765625, -6.51837158203125, -6.2923583984375, -6.06634521484375, -5.84033203125, -5.61431884765625, -5.3883056640625, -5.16229248046875, -4.936279296875, -4.71026611328125, -4.4842529296875, -4.25823974609375, -4.0322265625, -3.80621337890625, -3.5802001953125, -3.35418701171875, -3.128173828125, -2.90216064453125, -2.6761474609375, -2.45013427734375, -2.22412109375, -1.99810791015625, -1.7720947265625, -1.54608154296875, -1.320068359375, -1.09405517578125, -0.8680419921875, -0.64202880859375, -0.416015625, -0.19000244140625, 0.0360107421875, 0.26202392578125, 0.488037109375, 0.71405029296875, 0.9400634765625, 1.16607666015625, 1.39208984375, 1.61810302734375, 1.8441162109375, 2.07012939453125, 2.296142578125, 2.52215576171875, 2.7481689453125, 2.97418212890625, 3.2001953125, 3.42620849609375, 3.6522216796875, 3.87823486328125, 4.104248046875, 4.33026123046875, 4.5562744140625, 4.78228759765625, 5.00830078125, 5.23431396484375, 5.4603271484375, 5.68634033203125, 5.912353515625, 6.13836669921875, 6.3643798828125, 6.59039306640625, 6.81640625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 10.0, 14.0, 14.0, 18.0, 14.0, 19.0, 31.0, 47.0, 64.0, 84.0, 133.0, 221.0, 356.0, 959.0, 4322.0, 30467.0, 716660.0, 2314853.0, 67022.0, 7705.0, 1476.0, 460.0, 230.0, 147.0, 105.0, 66.0, 49.0, 25.0, 25.0, 23.0, 15.0, 15.0, 7.0, 10.0, 7.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5390625, -12.123291015625, -11.70751953125, -11.291748046875, -10.8759765625, -10.460205078125, -10.04443359375, -9.628662109375, -9.212890625, -8.797119140625, -8.38134765625, -7.965576171875, -7.5498046875, -7.134033203125, -6.71826171875, -6.302490234375, -5.88671875, -5.470947265625, -5.05517578125, -4.639404296875, -4.2236328125, -3.807861328125, -3.39208984375, -2.976318359375, -2.560546875, -2.144775390625, -1.72900390625, -1.313232421875, -0.8974609375, -0.481689453125, -0.06591796875, 0.349853515625, 0.765625, 1.181396484375, 1.59716796875, 2.012939453125, 2.4287109375, 2.844482421875, 3.26025390625, 3.676025390625, 4.091796875, 4.507568359375, 4.92333984375, 5.339111328125, 5.7548828125, 6.170654296875, 6.58642578125, 7.002197265625, 7.41796875, 7.833740234375, 8.24951171875, 8.665283203125, 9.0810546875, 9.496826171875, 9.91259765625, 10.328369140625, 10.744140625, 11.159912109375, 11.57568359375, 11.991455078125, 12.4072265625, 12.822998046875, 13.23876953125, 13.654541015625, 14.0703125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 20.0, 67.0, 150.0, 261.0, 254.0, 166.0, 70.0, 14.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-78.20335388183594, -76.7536849975586, -75.30401611328125, -73.8543472290039, -72.40467834472656, -70.95500183105469, -69.50533294677734, -68.0556640625, -66.60599517822266, -65.15632629394531, -63.70665740966797, -62.25698471069336, -60.807315826416016, -59.35764694213867, -57.90797424316406, -56.45830535888672, -55.008636474609375, -53.55896759033203, -52.10929870605469, -50.65962600708008, -49.209957122802734, -47.76028823852539, -46.31061553955078, -44.86094665527344, -43.411277770996094, -41.96160888671875, -40.511940002441406, -39.0622673034668, -37.61259841918945, -36.16292953491211, -34.7132568359375, -33.263587951660156, -31.813915252685547, -30.364246368408203, -28.914575576782227, -27.46490478515625, -26.015235900878906, -24.565567016601562, -23.115896224975586, -21.66622543334961, -20.216556549072266, -18.766887664794922, -17.317216873168945, -15.867547035217285, -14.417877197265625, -12.968207359313965, -11.518537521362305, -10.068867683410645, -8.619197845458984, -7.169528007507324, -5.719858169555664, -4.270188331604004, -2.8205184936523438, -1.3708486557006836, 0.07882118225097656, 1.5284910202026367, 2.978160858154297, 4.427830696105957, 5.877500534057617, 7.327170372009277, 8.776840209960938, 10.226510047912598, 11.676179885864258, 13.125849723815918, 14.575519561767578]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 7.0, 5.0, 7.0, 13.0, 15.0, 10.0, 16.0, 30.0, 13.0, 14.0, 26.0, 32.0, 26.0, 26.0, 34.0, 28.0, 33.0, 45.0, 41.0, 41.0, 33.0, 39.0, 39.0, 41.0, 38.0, 35.0, 45.0, 45.0, 26.0, 36.0, 30.0, 23.0, 17.0, 21.0, 10.0, 11.0, 5.0, 4.0, 10.0, 4.0, 11.0, 6.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.197187423706055, -16.65139389038086, -16.10559844970703, -15.559804916381836, -15.01401138305664, -14.468217849731445, -13.922423362731934, -13.376628875732422, -12.830835342407227, -12.285041809082031, -11.73924732208252, -11.193452835083008, -10.647659301757812, -10.101865768432617, -9.556071281433105, -9.010276794433594, -8.464483261108398, -7.918689250946045, -7.372895240783691, -6.827101230621338, -6.281307220458984, -5.735513210296631, -5.189719200134277, -4.643925189971924, -4.09813117980957, -3.552337169647217, -3.0065431594848633, -2.4607491493225098, -1.9149551391601562, -1.3691611289978027, -0.8233671188354492, -0.2775731086730957, 0.2682209014892578, 0.8140149116516113, 1.3598089218139648, 1.9056029319763184, 2.451396942138672, 2.9971909523010254, 3.542984962463379, 4.088778972625732, 4.634572982788086, 5.1803669929504395, 5.726161003112793, 6.2719550132751465, 6.8177490234375, 7.3635430335998535, 7.909337043762207, 8.455131530761719, 9.000925064086914, 9.54671859741211, 10.092513084411621, 10.638307571411133, 11.184101104736328, 11.729894638061523, 12.275689125061035, 12.821483612060547, 13.367277145385742, 13.913070678710938, 14.45886516571045, 15.004659652709961, 15.550453186035156, 16.09624671936035, 16.642040252685547, 17.187835693359375, 17.73362922668457]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 6.0, 5.0, 7.0, 8.0, 9.0, 10.0, 5.0, 17.0, 13.0, 14.0, 17.0, 16.0, 19.0, 29.0, 20.0, 29.0, 31.0, 32.0, 36.0, 31.0, 36.0, 32.0, 28.0, 42.0, 41.0, 33.0, 35.0, 32.0, 31.0, 36.0, 35.0, 28.0, 21.0, 31.0, 35.0, 24.0, 16.0, 17.0, 7.0, 20.0, 11.0, 10.0, 13.0, 11.0, 8.0, 4.0, 7.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.8583984375, -1.802276611328125, -1.74615478515625, -1.690032958984375, -1.6339111328125, -1.577789306640625, -1.52166748046875, -1.465545654296875, -1.409423828125, -1.353302001953125, -1.29718017578125, -1.241058349609375, -1.1849365234375, -1.128814697265625, -1.07269287109375, -1.016571044921875, -0.96044921875, -0.904327392578125, -0.84820556640625, -0.792083740234375, -0.7359619140625, -0.679840087890625, -0.62371826171875, -0.567596435546875, -0.511474609375, -0.455352783203125, -0.39923095703125, -0.343109130859375, -0.2869873046875, -0.230865478515625, -0.17474365234375, -0.118621826171875, -0.0625, -0.006378173828125, 0.04974365234375, 0.105865478515625, 0.1619873046875, 0.218109130859375, 0.27423095703125, 0.330352783203125, 0.386474609375, 0.442596435546875, 0.49871826171875, 0.554840087890625, 0.6109619140625, 0.667083740234375, 0.72320556640625, 0.779327392578125, 0.83544921875, 0.891571044921875, 0.94769287109375, 1.003814697265625, 1.0599365234375, 1.116058349609375, 1.17218017578125, 1.228302001953125, 1.284423828125, 1.340545654296875, 1.39666748046875, 1.452789306640625, 1.5089111328125, 1.565032958984375, 1.62115478515625, 1.677276611328125, 1.7333984375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 8.0, 10.0, 15.0, 7.0, 16.0, 14.0, 15.0, 24.0, 29.0, 54.0, 68.0, 85.0, 166.0, 280.0, 517.0, 1137.0, 3217.0, 10713.0, 40671.0, 167915.0, 708375.0, 1974642.0, 975722.0, 233447.0, 55778.0, 14308.0, 4163.0, 1422.0, 605.0, 282.0, 196.0, 100.0, 76.0, 48.0, 35.0, 34.0, 16.0, 17.0, 13.0, 13.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.04296875, -4.89727783203125, -4.7515869140625, -4.60589599609375, -4.460205078125, -4.31451416015625, -4.1688232421875, -4.02313232421875, -3.87744140625, -3.73175048828125, -3.5860595703125, -3.44036865234375, -3.294677734375, -3.14898681640625, -3.0032958984375, -2.85760498046875, -2.7119140625, -2.56622314453125, -2.4205322265625, -2.27484130859375, -2.129150390625, -1.98345947265625, -1.8377685546875, -1.69207763671875, -1.54638671875, -1.40069580078125, -1.2550048828125, -1.10931396484375, -0.963623046875, -0.81793212890625, -0.6722412109375, -0.52655029296875, -0.380859375, -0.23516845703125, -0.0894775390625, 0.05621337890625, 0.201904296875, 0.34759521484375, 0.4932861328125, 0.63897705078125, 0.78466796875, 0.93035888671875, 1.0760498046875, 1.22174072265625, 1.367431640625, 1.51312255859375, 1.6588134765625, 1.80450439453125, 1.9501953125, 2.09588623046875, 2.2415771484375, 2.38726806640625, 2.532958984375, 2.67864990234375, 2.8243408203125, 2.97003173828125, 3.11572265625, 3.26141357421875, 3.4071044921875, 3.55279541015625, 3.698486328125, 3.84417724609375, 3.9898681640625, 4.13555908203125, 4.28125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 10.0, 7.0, 18.0, 26.0, 36.0, 35.0, 61.0, 99.0, 170.0, 221.0, 292.0, 385.0, 490.0, 546.0, 447.0, 353.0, 265.0, 175.0, 152.0, 75.0, 72.0, 44.0, 31.0, 25.0, 14.0, 6.0, 9.0, 3.0, 1.0, 5.0, 5.0, 2.0, 1.0, 3.0], "bins": [-9.3515625, -9.135986328125, -8.92041015625, -8.704833984375, -8.4892578125, -8.273681640625, -8.05810546875, -7.842529296875, -7.626953125, -7.411376953125, -7.19580078125, -6.980224609375, -6.7646484375, -6.549072265625, -6.33349609375, -6.117919921875, -5.90234375, -5.686767578125, -5.47119140625, -5.255615234375, -5.0400390625, -4.824462890625, -4.60888671875, -4.393310546875, -4.177734375, -3.962158203125, -3.74658203125, -3.531005859375, -3.3154296875, -3.099853515625, -2.88427734375, -2.668701171875, -2.453125, -2.237548828125, -2.02197265625, -1.806396484375, -1.5908203125, -1.375244140625, -1.15966796875, -0.944091796875, -0.728515625, -0.512939453125, -0.29736328125, -0.081787109375, 0.1337890625, 0.349365234375, 0.56494140625, 0.780517578125, 0.99609375, 1.211669921875, 1.42724609375, 1.642822265625, 1.8583984375, 2.073974609375, 2.28955078125, 2.505126953125, 2.720703125, 2.936279296875, 3.15185546875, 3.367431640625, 3.5830078125, 3.798583984375, 4.01416015625, 4.229736328125, 4.4453125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 6.0, 6.0, 2.0, 3.0, 8.0, 12.0, 24.0, 38.0, 42.0, 74.0, 148.0, 291.0, 568.0, 2380.0, 25047.0, 719506.0, 3206773.0, 226929.0, 10115.0, 1422.0, 422.0, 200.0, 105.0, 62.0, 47.0, 31.0, 13.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4765625, -9.9346923828125, -9.392822265625, -8.8509521484375, -8.30908203125, -7.7672119140625, -7.225341796875, -6.6834716796875, -6.1416015625, -5.5997314453125, -5.057861328125, -4.5159912109375, -3.97412109375, -3.4322509765625, -2.890380859375, -2.3485107421875, -1.806640625, -1.2647705078125, -0.722900390625, -0.1810302734375, 0.36083984375, 0.9027099609375, 1.444580078125, 1.9864501953125, 2.5283203125, 3.0701904296875, 3.612060546875, 4.1539306640625, 4.69580078125, 5.2376708984375, 5.779541015625, 6.3214111328125, 6.86328125, 7.4051513671875, 7.947021484375, 8.4888916015625, 9.03076171875, 9.5726318359375, 10.114501953125, 10.6563720703125, 11.1982421875, 11.7401123046875, 12.281982421875, 12.8238525390625, 13.36572265625, 13.9075927734375, 14.449462890625, 14.9913330078125, 15.533203125, 16.0750732421875, 16.616943359375, 17.1588134765625, 17.70068359375, 18.2425537109375, 18.784423828125, 19.3262939453125, 19.8681640625, 20.4100341796875, 20.951904296875, 21.4937744140625, 22.03564453125, 22.5775146484375, 23.119384765625, 23.6612548828125, 24.203125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 13.0, 15.0, 29.0, 49.0, 63.0, 68.0, 96.0, 87.0, 117.0, 108.0, 96.0, 86.0, 67.0, 45.0, 35.0, 13.0, 7.0, 4.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.028179168701172, -24.881858825683594, -23.735536575317383, -22.589214324951172, -21.442893981933594, -20.296573638916016, -19.150251388549805, -18.003929138183594, -16.857608795166016, -15.711287498474121, -14.564966201782227, -13.418644905090332, -12.272323608398438, -11.126002311706543, -9.979681015014648, -8.833359718322754, -7.687038421630859, -6.540717124938965, -5.39439582824707, -4.248074531555176, -3.1017532348632812, -1.9554319381713867, -0.8091106414794922, 0.33721065521240234, 1.4835319519042969, 2.6298532485961914, 3.776174545288086, 4.9224958419799805, 6.068817138671875, 7.2151384353637695, 8.361459732055664, 9.507781028747559, 10.654098510742188, 11.800419807434082, 12.946741104125977, 14.093062400817871, 15.239383697509766, 16.385704040527344, 17.532026290893555, 18.678348541259766, 19.824668884277344, 20.970989227294922, 22.117311477661133, 23.263633728027344, 24.409954071044922, 25.5562744140625, 26.70259666442871, 27.848918914794922, 28.9952392578125, 30.141559600830078, 31.28788185119629, 32.4342041015625, 33.58052444458008, 34.726844787597656, 35.8731689453125, 37.01948928833008, 38.165809631347656, 39.312129974365234, 40.45845031738281, 41.604774475097656, 42.751094818115234, 43.89741516113281, 45.043739318847656, 46.190059661865234, 47.33638000488281]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 6.0, 12.0, 10.0, 13.0, 18.0, 20.0, 14.0, 21.0, 18.0, 23.0, 28.0, 34.0, 26.0, 33.0, 42.0, 34.0, 36.0, 32.0, 52.0, 42.0, 49.0, 44.0, 39.0, 49.0, 32.0, 33.0, 23.0, 25.0, 26.0, 24.0, 27.0, 13.0, 13.0, 18.0, 18.0, 14.0, 9.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-21.775001525878906, -21.15688705444336, -20.538774490356445, -19.9206600189209, -19.302547454833984, -18.684432983398438, -18.066320419311523, -17.448205947875977, -16.830093383789062, -16.211978912353516, -15.593866348266602, -14.975752830505371, -14.35763931274414, -13.739524841308594, -13.121411323547363, -12.503297805786133, -11.885183334350586, -11.267069816589355, -10.648956298828125, -10.030842781066895, -9.412729263305664, -8.794614791870117, -8.176501274108887, -7.558387756347656, -6.940274238586426, -6.322160720825195, -5.704047203063965, -5.085933208465576, -4.467819690704346, -3.8497061729431152, -3.2315924167633057, -2.613478660583496, -1.9953651428222656, -1.3772515058517456, -0.7591378688812256, -0.14102423191070557, 0.47708940505981445, 1.095202922821045, 1.7133166790008545, 2.331430435180664, 2.9495439529418945, 3.567657470703125, 4.1857709884643555, 4.803884983062744, 5.421998500823975, 6.040112018585205, 6.658226013183594, 7.276339530944824, 7.894453048706055, 8.512566566467285, 9.130680084228516, 9.748793601989746, 10.366907119750977, 10.985021591186523, 11.603135108947754, 12.221248626708984, 12.839362144470215, 13.457475662231445, 14.075589179992676, 14.693702697753906, 15.311817169189453, 15.929929733276367, 16.548044204711914, 17.166156768798828, 17.784271240234375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 11.0, 8.0, 10.0, 8.0, 8.0, 14.0, 15.0, 11.0, 18.0, 24.0, 29.0, 21.0, 31.0, 25.0, 29.0, 26.0, 31.0, 40.0, 33.0, 39.0, 32.0, 36.0, 36.0, 37.0, 39.0, 35.0, 42.0, 24.0, 33.0, 41.0, 27.0, 22.0, 21.0, 18.0, 22.0, 16.0, 13.0, 13.0, 12.0, 9.0, 6.0, 4.0, 8.0, 9.0, 4.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.8173828125, -1.7596282958984375, -1.701873779296875, -1.6441192626953125, -1.58636474609375, -1.5286102294921875, -1.470855712890625, -1.4131011962890625, -1.3553466796875, -1.2975921630859375, -1.239837646484375, -1.1820831298828125, -1.12432861328125, -1.0665740966796875, -1.008819580078125, -0.9510650634765625, -0.893310546875, -0.8355560302734375, -0.777801513671875, -0.7200469970703125, -0.66229248046875, -0.6045379638671875, -0.546783447265625, -0.4890289306640625, -0.4312744140625, -0.3735198974609375, -0.315765380859375, -0.2580108642578125, -0.20025634765625, -0.1425018310546875, -0.084747314453125, -0.0269927978515625, 0.03076171875, 0.0885162353515625, 0.146270751953125, 0.2040252685546875, 0.26177978515625, 0.3195343017578125, 0.377288818359375, 0.4350433349609375, 0.4927978515625, 0.5505523681640625, 0.608306884765625, 0.6660614013671875, 0.72381591796875, 0.7815704345703125, 0.839324951171875, 0.8970794677734375, 0.954833984375, 1.0125885009765625, 1.070343017578125, 1.1280975341796875, 1.18585205078125, 1.2436065673828125, 1.301361083984375, 1.3591156005859375, 1.4168701171875, 1.4746246337890625, 1.532379150390625, 1.5901336669921875, 1.64788818359375, 1.7056427001953125, 1.763397216796875, 1.8211517333984375, 1.87890625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 8.0, 8.0, 11.0, 14.0, 14.0, 28.0, 53.0, 75.0, 115.0, 183.0, 230.0, 290.0, 490.0, 725.0, 1103.0, 1463.0, 2072.0, 3017.0, 4341.0, 6356.0, 9373.0, 13587.0, 20342.0, 30490.0, 47931.0, 77663.0, 143831.0, 313786.0, 147528.0, 78888.0, 48554.0, 31030.0, 20913.0, 13800.0, 9374.0, 6422.0, 4530.0, 2986.0, 2124.0, 1481.0, 1074.0, 722.0, 473.0, 344.0, 247.0, 145.0, 129.0, 62.0, 44.0, 36.0, 25.0, 15.0, 6.0, 10.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.07568359375, -0.07328224182128906, -0.07088088989257812, -0.06847953796386719, -0.06607818603515625, -0.06367683410644531, -0.061275482177734375, -0.05887413024902344, -0.0564727783203125, -0.05407142639160156, -0.051670074462890625, -0.04926872253417969, -0.04686737060546875, -0.04446601867675781, -0.042064666748046875, -0.03966331481933594, -0.037261962890625, -0.03486061096191406, -0.032459259033203125, -0.030057907104492188, -0.02765655517578125, -0.025255203247070312, -0.022853851318359375, -0.020452499389648438, -0.0180511474609375, -0.015649795532226562, -0.013248443603515625, -0.010847091674804688, -0.00844573974609375, -0.0060443878173828125, -0.003643035888671875, -0.0012416839599609375, 0.00115966796875, 0.0035610198974609375, 0.005962371826171875, 0.008363723754882812, 0.01076507568359375, 0.013166427612304688, 0.015567779541015625, 0.017969131469726562, 0.0203704833984375, 0.022771835327148438, 0.025173187255859375, 0.027574539184570312, 0.02997589111328125, 0.03237724304199219, 0.034778594970703125, 0.03717994689941406, 0.039581298828125, 0.04198265075683594, 0.044384002685546875, 0.04678535461425781, 0.04918670654296875, 0.05158805847167969, 0.053989410400390625, 0.05639076232910156, 0.0587921142578125, 0.06119346618652344, 0.06359481811523438, 0.06599617004394531, 0.06839752197265625, 0.07079887390136719, 0.07320022583007812, 0.07560157775878906, 0.0780029296875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 9.0, 5.0, 7.0, 8.0, 15.0, 11.0, 14.0, 20.0, 19.0, 22.0, 26.0, 29.0, 34.0, 22.0, 34.0, 32.0, 29.0, 29.0, 47.0, 41.0, 1067.0, 43.0, 38.0, 46.0, 41.0, 35.0, 43.0, 35.0, 26.0, 27.0, 22.0, 22.0, 17.0, 17.0, 22.0, 15.0, 7.0, 7.0, 5.0, 6.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.29296875, -1.2514190673828125, -1.209869384765625, -1.1683197021484375, -1.12677001953125, -1.0852203369140625, -1.043670654296875, -1.0021209716796875, -0.9605712890625, -0.9190216064453125, -0.877471923828125, -0.8359222412109375, -0.79437255859375, -0.7528228759765625, -0.711273193359375, -0.6697235107421875, -0.628173828125, -0.5866241455078125, -0.545074462890625, -0.5035247802734375, -0.46197509765625, -0.4204254150390625, -0.378875732421875, -0.3373260498046875, -0.2957763671875, -0.2542266845703125, -0.212677001953125, -0.1711273193359375, -0.12957763671875, -0.0880279541015625, -0.046478271484375, -0.0049285888671875, 0.03662109375, 0.0781707763671875, 0.119720458984375, 0.1612701416015625, 0.20281982421875, 0.2443695068359375, 0.285919189453125, 0.3274688720703125, 0.3690185546875, 0.4105682373046875, 0.452117919921875, 0.4936676025390625, 0.53521728515625, 0.5767669677734375, 0.618316650390625, 0.6598663330078125, 0.701416015625, 0.7429656982421875, 0.784515380859375, 0.8260650634765625, 0.86761474609375, 0.9091644287109375, 0.950714111328125, 0.9922637939453125, 1.0338134765625, 1.0753631591796875, 1.116912841796875, 1.1584625244140625, 1.20001220703125, 1.2415618896484375, 1.283111572265625, 1.3246612548828125, 1.3662109375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 12.0, 13.0, 22.0, 27.0, 46.0, 58.0, 75.0, 129.0, 152.0, 220.0, 363.0, 473.0, 665.0, 895.0, 1292.0, 1976.0, 2694.0, 3913.0, 5638.0, 8338.0, 11982.0, 17870.0, 26685.0, 41625.0, 66261.0, 115370.0, 1323913.0, 198616.0, 97651.0, 57947.0, 36645.0, 23976.0, 16097.0, 10858.0, 7499.0, 5085.0, 3662.0, 2593.0, 1675.0, 1231.0, 898.0, 588.0, 440.0, 310.0, 200.0, 126.0, 107.0, 66.0, 49.0, 39.0, 24.0, 16.0, 11.0, 11.0, 6.0, 2.0, 2.0, 4.0], "bins": [-0.03936767578125, -0.03816986083984375, -0.0369720458984375, -0.03577423095703125, -0.034576416015625, -0.03337860107421875, -0.0321807861328125, -0.03098297119140625, -0.02978515625, -0.02858734130859375, -0.0273895263671875, -0.02619171142578125, -0.024993896484375, -0.02379608154296875, -0.0225982666015625, -0.02140045166015625, -0.02020263671875, -0.01900482177734375, -0.0178070068359375, -0.01660919189453125, -0.015411376953125, -0.01421356201171875, -0.0130157470703125, -0.01181793212890625, -0.0106201171875, -0.00942230224609375, -0.0082244873046875, -0.00702667236328125, -0.005828857421875, -0.00463104248046875, -0.0034332275390625, -0.00223541259765625, -0.00103759765625, 0.00016021728515625, 0.0013580322265625, 0.00255584716796875, 0.003753662109375, 0.00495147705078125, 0.0061492919921875, 0.00734710693359375, 0.008544921875, 0.00974273681640625, 0.0109405517578125, 0.01213836669921875, 0.013336181640625, 0.01453399658203125, 0.0157318115234375, 0.01692962646484375, 0.01812744140625, 0.01932525634765625, 0.0205230712890625, 0.02172088623046875, 0.022918701171875, 0.02411651611328125, 0.0253143310546875, 0.02651214599609375, 0.0277099609375, 0.02890777587890625, 0.0301055908203125, 0.03130340576171875, 0.032501220703125, 0.03369903564453125, 0.0348968505859375, 0.03609466552734375, 0.03729248046875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 0.0, 13.0, 19.0, 0.0, 23.0, 26.0, 33.0, 0.0, 39.0, 56.0, 0.0, 74.0, 431.0, 83.0, 0.0, 67.0, 37.0, 24.0, 0.0, 15.0, 14.0, 0.0, 16.0, 11.0, 10.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.387670636177063e-06, -1.344829797744751e-06, -1.301988959312439e-06, -1.259148120880127e-06, -1.216307282447815e-06, -1.173466444015503e-06, -1.130625605583191e-06, -1.087784767150879e-06, -1.044943928718567e-06, -1.0021030902862549e-06, -9.592622518539429e-07, -9.164214134216309e-07, -8.735805749893188e-07, -8.307397365570068e-07, -7.878988981246948e-07, -7.450580596923828e-07, -7.022172212600708e-07, -6.593763828277588e-07, -6.165355443954468e-07, -5.736947059631348e-07, -5.308538675308228e-07, -4.880130290985107e-07, -4.4517219066619873e-07, -4.023313522338867e-07, -3.594905138015747e-07, -3.166496753692627e-07, -2.738088369369507e-07, -2.3096799850463867e-07, -1.8812716007232666e-07, -1.4528632164001465e-07, -1.0244548320770264e-07, -5.960464477539063e-08, -1.6763806343078613e-08, 2.60770320892334e-08, 6.891787052154541e-08, 1.1175870895385742e-07, 1.5459954738616943e-07, 1.9744038581848145e-07, 2.4028122425079346e-07, 2.8312206268310547e-07, 3.259629011154175e-07, 3.688037395477295e-07, 4.116445779800415e-07, 4.544854164123535e-07, 4.973262548446655e-07, 5.401670932769775e-07, 5.830079317092896e-07, 6.258487701416016e-07, 6.686896085739136e-07, 7.115304470062256e-07, 7.543712854385376e-07, 7.972121238708496e-07, 8.400529623031616e-07, 8.828938007354736e-07, 9.257346391677856e-07, 9.685754776000977e-07, 1.0114163160324097e-06, 1.0542571544647217e-06, 1.0970979928970337e-06, 1.1399388313293457e-06, 1.1827796697616577e-06, 1.2256205081939697e-06, 1.2684613466262817e-06, 1.3113021850585938e-06]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 17.0, 12.0, 14.0, 23.0, 36.0, 63.0, 158.0, 519.0, 7513.0, 849605.0, 186500.0, 3480.0, 307.0, 128.0, 60.0, 33.0, 20.0, 16.0, 11.0, 10.0, 5.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.282857894897461e-05, -2.2009946405887604e-05, -2.1191313862800598e-05, -2.0372681319713593e-05, -1.9554048776626587e-05, -1.873541623353958e-05, -1.7916783690452576e-05, -1.709815114736557e-05, -1.6279518604278564e-05, -1.546088606119156e-05, -1.4642253518104553e-05, -1.3823620975017548e-05, -1.3004988431930542e-05, -1.2186355888843536e-05, -1.136772334575653e-05, -1.0549090802669525e-05, -9.73045825958252e-06, -8.911825716495514e-06, -8.093193173408508e-06, -7.274560630321503e-06, -6.455928087234497e-06, -5.6372955441474915e-06, -4.818663001060486e-06, -4.00003045797348e-06, -3.1813979148864746e-06, -2.362765371799469e-06, -1.5441328287124634e-06, -7.255002856254578e-07, 9.313225746154785e-08, 9.117648005485535e-07, 1.730397343635559e-06, 2.5490298867225647e-06, 3.3676624298095703e-06, 4.186294972896576e-06, 5.0049275159835815e-06, 5.823560059070587e-06, 6.642192602157593e-06, 7.460825145244598e-06, 8.279457688331604e-06, 9.09809023141861e-06, 9.916722774505615e-06, 1.0735355317592621e-05, 1.1553987860679626e-05, 1.2372620403766632e-05, 1.3191252946853638e-05, 1.4009885489940643e-05, 1.4828518033027649e-05, 1.5647150576114655e-05, 1.646578311920166e-05, 1.7284415662288666e-05, 1.810304820537567e-05, 1.8921680748462677e-05, 1.9740313291549683e-05, 2.0558945834636688e-05, 2.1377578377723694e-05, 2.21962109208107e-05, 2.3014843463897705e-05, 2.383347600698471e-05, 2.4652108550071716e-05, 2.5470741093158722e-05, 2.6289373636245728e-05, 2.7108006179332733e-05, 2.792663872241974e-05, 2.8745271265506744e-05, 2.956390380859375e-05]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 13.0, 24.0, 144.0, 653.0, 131.0, 39.0, 6.0, 5.0], "bins": [-4.811475719179725e-06, -4.730711225420237e-06, -4.649946276913397e-06, -4.569181783153908e-06, -4.488416834647069e-06, -4.40765234088758e-06, -4.326887847128091e-06, -4.246122898621252e-06, -4.165358404861763e-06, -4.0845939111022744e-06, -4.003828962595435e-06, -3.923064468835946e-06, -3.842299520329107e-06, -3.761535026569618e-06, -3.6807703054364538e-06, -3.6000055843032897e-06, -3.519241090543801e-06, -3.438476369410637e-06, -3.3577116482774727e-06, -3.276947154517984e-06, -3.19618243338482e-06, -3.1154177122516558e-06, -3.0346529911184916e-06, -2.9538882699853275e-06, -2.8731235488521634e-06, -2.7923588277189992e-06, -2.711594106585835e-06, -2.6308296128263464e-06, -2.5500648916931823e-06, -2.469300170560018e-06, -2.388535449426854e-06, -2.3077709556673653e-06, -2.2270064619078767e-06, -2.1462417407747125e-06, -2.0654770196415484e-06, -1.9847125258820597e-06, -1.9039478047488956e-06, -1.8231830836157314e-06, -1.7424183624825673e-06, -1.661653755036241e-06, -1.5808890339030768e-06, -1.5001243127699126e-06, -1.4193597053235862e-06, -1.3385949841904221e-06, -1.2578303767440957e-06, -1.1770656556109316e-06, -1.0963010481646052e-06, -1.015536327031441e-06, -9.347716627416958e-07, -8.540069984519505e-07, -7.732423341622052e-07, -6.9247766987246e-07, -6.117129487392958e-07, -5.309483412929694e-07, -4.501836201598053e-07, -3.6941895587006e-07, -2.8865429158031475e-07, -2.0788962729056948e-07, -1.271249487899695e-07, -4.636027028936951e-08, 3.440439400037576e-08, 1.1516905829012103e-07, 1.9593375100157573e-07, 2.76698415291321e-07, 3.5746307958106627e-07]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 60.0, 0.0, 0.0, 0.0, 168.0, 0.0, 0.0, 0.0, 440.0, 0.0, 0.0, 0.0, 154.0, 0.0, 0.0, 0.0, 57.0, 0.0, 0.0, 0.0, 33.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.6193599700927734e-07, -4.470348358154297e-07, -4.3213367462158203e-07, -4.172325134277344e-07, -4.023313522338867e-07, -3.8743019104003906e-07, -3.725290298461914e-07, -3.5762786865234375e-07, -3.427267074584961e-07, -3.2782554626464844e-07, -3.129243850708008e-07, -2.980232238769531e-07, -2.8312206268310547e-07, -2.682209014892578e-07, -2.5331974029541016e-07, -2.384185791015625e-07, -2.2351741790771484e-07, -2.086162567138672e-07, -1.9371509552001953e-07, -1.7881393432617188e-07, -1.6391277313232422e-07, -1.4901161193847656e-07, -1.341104507446289e-07, -1.1920928955078125e-07, -1.043081283569336e-07, -8.940696716308594e-08, -7.450580596923828e-08, -5.960464477539063e-08, -4.470348358154297e-08, -2.9802322387695312e-08, -1.4901161193847656e-08, 0.0, 1.4901161193847656e-08, 2.9802322387695312e-08, 4.470348358154297e-08, 5.960464477539063e-08, 7.450580596923828e-08, 8.940696716308594e-08, 1.043081283569336e-07, 1.1920928955078125e-07, 1.341104507446289e-07, 1.4901161193847656e-07, 1.6391277313232422e-07, 1.7881393432617188e-07, 1.9371509552001953e-07, 2.086162567138672e-07, 2.2351741790771484e-07, 2.384185791015625e-07, 2.5331974029541016e-07, 2.682209014892578e-07, 2.8312206268310547e-07, 2.980232238769531e-07, 3.129243850708008e-07, 3.2782554626464844e-07, 3.427267074584961e-07, 3.5762786865234375e-07, 3.725290298461914e-07, 3.8743019104003906e-07, 4.023313522338867e-07, 4.172325134277344e-07, 4.3213367462158203e-07, 4.470348358154297e-07, 4.6193599700927734e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 11.0, 8.0, 10.0, 8.0, 8.0, 14.0, 15.0, 11.0, 18.0, 24.0, 29.0, 21.0, 31.0, 25.0, 29.0, 26.0, 31.0, 40.0, 33.0, 39.0, 32.0, 36.0, 36.0, 37.0, 39.0, 35.0, 42.0, 24.0, 33.0, 41.0, 27.0, 22.0, 21.0, 18.0, 22.0, 16.0, 13.0, 13.0, 12.0, 9.0, 6.0, 4.0, 8.0, 9.0, 4.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.8173828125, -1.7596282958984375, -1.701873779296875, -1.6441192626953125, -1.58636474609375, -1.5286102294921875, -1.470855712890625, -1.4131011962890625, -1.3553466796875, -1.2975921630859375, -1.239837646484375, -1.1820831298828125, -1.12432861328125, -1.0665740966796875, -1.008819580078125, -0.9510650634765625, -0.893310546875, -0.8355560302734375, -0.777801513671875, -0.7200469970703125, -0.66229248046875, -0.6045379638671875, -0.546783447265625, -0.4890289306640625, -0.4312744140625, -0.3735198974609375, -0.315765380859375, -0.2580108642578125, -0.20025634765625, -0.1425018310546875, -0.084747314453125, -0.0269927978515625, 0.03076171875, 0.0885162353515625, 0.146270751953125, 0.2040252685546875, 0.26177978515625, 0.3195343017578125, 0.377288818359375, 0.4350433349609375, 0.4927978515625, 0.5505523681640625, 0.608306884765625, 0.6660614013671875, 0.72381591796875, 0.7815704345703125, 0.839324951171875, 0.8970794677734375, 0.954833984375, 1.0125885009765625, 1.070343017578125, 1.1280975341796875, 1.18585205078125, 1.2436065673828125, 1.301361083984375, 1.3591156005859375, 1.4168701171875, 1.4746246337890625, 1.532379150390625, 1.5901336669921875, 1.64788818359375, 1.7056427001953125, 1.763397216796875, 1.8211517333984375, 1.87890625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 8.0, 14.0, 20.0, 48.0, 79.0, 74.0, 142.0, 218.0, 341.0, 507.0, 785.0, 1213.0, 1755.0, 2639.0, 3932.0, 5562.0, 8218.0, 11854.0, 17133.0, 24847.0, 37919.0, 62379.0, 116096.0, 228205.0, 228663.0, 115949.0, 62585.0, 37992.0, 24805.0, 17097.0, 11841.0, 8150.0, 5708.0, 3908.0, 2595.0, 1840.0, 1148.0, 773.0, 499.0, 327.0, 236.0, 152.0, 115.0, 71.0, 28.0, 28.0, 19.0, 13.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0], "bins": [-2.32421875, -2.255859375, -2.1875, -2.119140625, -2.05078125, -1.982421875, -1.9140625, -1.845703125, -1.77734375, -1.708984375, -1.640625, -1.572265625, -1.50390625, -1.435546875, -1.3671875, -1.298828125, -1.23046875, -1.162109375, -1.09375, -1.025390625, -0.95703125, -0.888671875, -0.8203125, -0.751953125, -0.68359375, -0.615234375, -0.546875, -0.478515625, -0.41015625, -0.341796875, -0.2734375, -0.205078125, -0.13671875, -0.068359375, 0.0, 0.068359375, 0.13671875, 0.205078125, 0.2734375, 0.341796875, 0.41015625, 0.478515625, 0.546875, 0.615234375, 0.68359375, 0.751953125, 0.8203125, 0.888671875, 0.95703125, 1.025390625, 1.09375, 1.162109375, 1.23046875, 1.298828125, 1.3671875, 1.435546875, 1.50390625, 1.572265625, 1.640625, 1.708984375, 1.77734375, 1.845703125, 1.9140625, 1.982421875, 2.05078125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 8.0, 9.0, 3.0, 6.0, 13.0, 11.0, 14.0, 14.0, 13.0, 18.0, 22.0, 22.0, 36.0, 29.0, 37.0, 31.0, 39.0, 65.0, 76.0, 111.0, 182.0, 1367.0, 246.0, 137.0, 116.0, 64.0, 42.0, 45.0, 36.0, 33.0, 31.0, 30.0, 16.0, 20.0, 20.0, 19.0, 15.0, 12.0, 2.0, 7.0, 4.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-7.33984375, -7.11541748046875, -6.8909912109375, -6.66656494140625, -6.442138671875, -6.21771240234375, -5.9932861328125, -5.76885986328125, -5.54443359375, -5.32000732421875, -5.0955810546875, -4.87115478515625, -4.646728515625, -4.42230224609375, -4.1978759765625, -3.97344970703125, -3.7490234375, -3.52459716796875, -3.3001708984375, -3.07574462890625, -2.851318359375, -2.62689208984375, -2.4024658203125, -2.17803955078125, -1.95361328125, -1.72918701171875, -1.5047607421875, -1.28033447265625, -1.055908203125, -0.83148193359375, -0.6070556640625, -0.38262939453125, -0.158203125, 0.06622314453125, 0.2906494140625, 0.51507568359375, 0.739501953125, 0.96392822265625, 1.1883544921875, 1.41278076171875, 1.63720703125, 1.86163330078125, 2.0860595703125, 2.31048583984375, 2.534912109375, 2.75933837890625, 2.9837646484375, 3.20819091796875, 3.4326171875, 3.65704345703125, 3.8814697265625, 4.10589599609375, 4.330322265625, 4.55474853515625, 4.7791748046875, 5.00360107421875, 5.22802734375, 5.45245361328125, 5.6768798828125, 5.90130615234375, 6.125732421875, 6.35015869140625, 6.5745849609375, 6.79901123046875, 7.0234375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 9.0, 8.0, 4.0, 9.0, 12.0, 10.0, 14.0, 24.0, 24.0, 43.0, 44.0, 40.0, 89.0, 94.0, 137.0, 223.0, 377.0, 890.0, 3605.0, 20878.0, 199097.0, 2510886.0, 368389.0, 33140.0, 5130.0, 1192.0, 435.0, 227.0, 167.0, 137.0, 65.0, 73.0, 50.0, 35.0, 28.0, 21.0, 23.0, 14.0, 18.0, 8.0, 12.0, 6.0, 6.0, 8.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-12.6953125, -12.3060302734375, -11.916748046875, -11.5274658203125, -11.13818359375, -10.7489013671875, -10.359619140625, -9.9703369140625, -9.5810546875, -9.1917724609375, -8.802490234375, -8.4132080078125, -8.02392578125, -7.6346435546875, -7.245361328125, -6.8560791015625, -6.466796875, -6.0775146484375, -5.688232421875, -5.2989501953125, -4.90966796875, -4.5203857421875, -4.131103515625, -3.7418212890625, -3.3525390625, -2.9632568359375, -2.573974609375, -2.1846923828125, -1.79541015625, -1.4061279296875, -1.016845703125, -0.6275634765625, -0.23828125, 0.1510009765625, 0.540283203125, 0.9295654296875, 1.31884765625, 1.7081298828125, 2.097412109375, 2.4866943359375, 2.8759765625, 3.2652587890625, 3.654541015625, 4.0438232421875, 4.43310546875, 4.8223876953125, 5.211669921875, 5.6009521484375, 5.990234375, 6.3795166015625, 6.768798828125, 7.1580810546875, 7.54736328125, 7.9366455078125, 8.325927734375, 8.7152099609375, 9.1044921875, 9.4937744140625, 9.883056640625, 10.2723388671875, 10.66162109375, 11.0509033203125, 11.440185546875, 11.8294677734375, 12.21875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [169.0, 724.0, 126.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.981283664703369, -2.498626708984375, 2.984030246734619, 8.46668815612793, 13.949344635009766, 19.4320011138916, 24.91465950012207, 30.397314071655273, 35.87997055053711, 41.36262893676758, 46.84528350830078, 52.32794189453125, 57.81060028076172, 63.29325485229492, 68.77590942382812, 74.2585678100586, 79.74122619628906, 85.22388458251953, 90.70654296875, 96.18919372558594, 101.6718521118164, 107.15451049804688, 112.63716888427734, 118.11982727050781, 123.60248565673828, 129.08514404296875, 134.5677947998047, 140.0504608154297, 145.53311157226562, 151.01577758789062, 156.49842834472656, 161.9810791015625, 167.46372985839844, 172.94638061523438, 178.42904663085938, 183.9116973876953, 189.3943634033203, 194.87701416015625, 200.35968017578125, 205.8423309326172, 211.32498168945312, 216.80763244628906, 222.29029846191406, 227.77294921875, 233.255615234375, 238.73826599121094, 244.22091674804688, 249.70358276367188, 255.18624877929688, 260.6689147949219, 266.15155029296875, 271.63421630859375, 277.11688232421875, 282.59954833984375, 288.0821838378906, 293.5648498535156, 299.0474853515625, 304.5301513671875, 310.0127868652344, 315.4954528808594, 320.9781188964844, 326.46075439453125, 331.94342041015625, 337.42608642578125, 342.90875244140625]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 11.0, 7.0, 7.0, 11.0, 13.0, 16.0, 16.0, 23.0, 23.0, 24.0, 34.0, 33.0, 35.0, 30.0, 38.0, 43.0, 32.0, 40.0, 47.0, 40.0, 31.0, 37.0, 37.0, 37.0, 34.0, 33.0, 35.0, 20.0, 30.0, 25.0, 15.0, 28.0, 17.0, 20.0, 15.0, 15.0, 10.0, 9.0, 5.0, 6.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-25.10976791381836, -24.4102840423584, -23.710800170898438, -23.01131820678711, -22.31183433532715, -21.612350463867188, -20.912866592407227, -20.213382720947266, -19.513898849487305, -18.814414978027344, -18.114931106567383, -17.415447235107422, -16.715965270996094, -16.016481399536133, -15.316997528076172, -14.617513656616211, -13.918030738830566, -13.218546867370605, -12.519063949584961, -11.819580078125, -11.120096206665039, -10.420612335205078, -9.721129417419434, -9.021645545959473, -8.322162628173828, -7.622679233551025, -6.9231953620910645, -6.223711967468262, -5.524228096008301, -4.824744701385498, -4.125261306762695, -3.4257774353027344, -2.7262935638427734, -2.0268099308013916, -1.3273264169692993, -0.627842903137207, 0.0716407299041748, 0.7711243629455566, 1.4706077575683594, 2.1700916290283203, 2.869575023651123, 3.569058656692505, 4.268542289733887, 4.9680256843566895, 5.667509078979492, 6.366992950439453, 7.066476345062256, 7.765960216522217, 8.46544361114502, 9.16492748260498, 9.864410400390625, 10.563894271850586, 11.263378143310547, 11.962862014770508, 12.662344932556152, 13.361828804016113, 14.061311721801758, 14.760795593261719, 15.460278511047363, 16.15976333618164, 16.85924530029297, 17.55872917175293, 18.25821304321289, 18.95769691467285, 19.657180786132812]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 3.0, 4.0, 10.0, 10.0, 8.0, 9.0, 12.0, 14.0, 11.0, 26.0, 19.0, 26.0, 28.0, 23.0, 33.0, 29.0, 24.0, 28.0, 35.0, 31.0, 37.0, 32.0, 41.0, 38.0, 39.0, 36.0, 30.0, 35.0, 28.0, 33.0, 31.0, 28.0, 25.0, 16.0, 27.0, 15.0, 18.0, 16.0, 18.0, 10.0, 10.0, 11.0, 7.0, 7.0, 4.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8974609375, -1.8375091552734375, -1.777557373046875, -1.7176055908203125, -1.65765380859375, -1.5977020263671875, -1.537750244140625, -1.4777984619140625, -1.4178466796875, -1.3578948974609375, -1.297943115234375, -1.2379913330078125, -1.17803955078125, -1.1180877685546875, -1.058135986328125, -0.9981842041015625, -0.938232421875, -0.8782806396484375, -0.818328857421875, -0.7583770751953125, -0.69842529296875, -0.6384735107421875, -0.578521728515625, -0.5185699462890625, -0.4586181640625, -0.3986663818359375, -0.338714599609375, -0.2787628173828125, -0.21881103515625, -0.1588592529296875, -0.098907470703125, -0.0389556884765625, 0.02099609375, 0.0809478759765625, 0.140899658203125, 0.2008514404296875, 0.26080322265625, 0.3207550048828125, 0.380706787109375, 0.4406585693359375, 0.5006103515625, 0.5605621337890625, 0.620513916015625, 0.6804656982421875, 0.74041748046875, 0.8003692626953125, 0.860321044921875, 0.9202728271484375, 0.980224609375, 1.0401763916015625, 1.100128173828125, 1.1600799560546875, 1.22003173828125, 1.2799835205078125, 1.339935302734375, 1.3998870849609375, 1.4598388671875, 1.5197906494140625, 1.579742431640625, 1.6396942138671875, 1.69964599609375, 1.7595977783203125, 1.819549560546875, 1.8795013427734375, 1.939453125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 9.0, 10.0, 17.0, 21.0, 27.0, 37.0, 67.0, 89.0, 145.0, 229.0, 360.0, 661.0, 1015.0, 2018.0, 3998.0, 7737.0, 15886.0, 33125.0, 70958.0, 154516.0, 335830.0, 702827.0, 1143913.0, 886512.0, 447023.0, 206821.0, 94881.0, 43345.0, 20875.0, 10163.0, 5136.0, 2672.0, 1398.0, 753.0, 431.0, 278.0, 168.0, 120.0, 71.0, 40.0, 31.0, 33.0, 17.0, 12.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.76171875, -2.682098388671875, -2.60247802734375, -2.522857666015625, -2.4432373046875, -2.363616943359375, -2.28399658203125, -2.204376220703125, -2.124755859375, -2.045135498046875, -1.96551513671875, -1.885894775390625, -1.8062744140625, -1.726654052734375, -1.64703369140625, -1.567413330078125, -1.48779296875, -1.408172607421875, -1.32855224609375, -1.248931884765625, -1.1693115234375, -1.089691162109375, -1.01007080078125, -0.930450439453125, -0.850830078125, -0.771209716796875, -0.69158935546875, -0.611968994140625, -0.5323486328125, -0.452728271484375, -0.37310791015625, -0.293487548828125, -0.2138671875, -0.134246826171875, -0.05462646484375, 0.024993896484375, 0.1046142578125, 0.184234619140625, 0.26385498046875, 0.343475341796875, 0.423095703125, 0.502716064453125, 0.58233642578125, 0.661956787109375, 0.7415771484375, 0.821197509765625, 0.90081787109375, 0.980438232421875, 1.06005859375, 1.139678955078125, 1.21929931640625, 1.298919677734375, 1.3785400390625, 1.458160400390625, 1.53778076171875, 1.617401123046875, 1.697021484375, 1.776641845703125, 1.85626220703125, 1.935882568359375, 2.0155029296875, 2.095123291015625, 2.17474365234375, 2.254364013671875, 2.333984375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 15.0, 13.0, 18.0, 25.0, 38.0, 58.0, 74.0, 118.0, 203.0, 261.0, 380.0, 457.0, 540.0, 505.0, 387.0, 290.0, 217.0, 150.0, 110.0, 57.0, 56.0, 35.0, 24.0, 12.0, 15.0, 7.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.55078125, -7.33355712890625, -7.1163330078125, -6.89910888671875, -6.681884765625, -6.46466064453125, -6.2474365234375, -6.03021240234375, -5.81298828125, -5.59576416015625, -5.3785400390625, -5.16131591796875, -4.944091796875, -4.72686767578125, -4.5096435546875, -4.29241943359375, -4.0751953125, -3.85797119140625, -3.6407470703125, -3.42352294921875, -3.206298828125, -2.98907470703125, -2.7718505859375, -2.55462646484375, -2.33740234375, -2.12017822265625, -1.9029541015625, -1.68572998046875, -1.468505859375, -1.25128173828125, -1.0340576171875, -0.81683349609375, -0.599609375, -0.38238525390625, -0.1651611328125, 0.05206298828125, 0.269287109375, 0.48651123046875, 0.7037353515625, 0.92095947265625, 1.13818359375, 1.35540771484375, 1.5726318359375, 1.78985595703125, 2.007080078125, 2.22430419921875, 2.4415283203125, 2.65875244140625, 2.8759765625, 3.09320068359375, 3.3104248046875, 3.52764892578125, 3.744873046875, 3.96209716796875, 4.1793212890625, 4.39654541015625, 4.61376953125, 4.83099365234375, 5.0482177734375, 5.26544189453125, 5.482666015625, 5.69989013671875, 5.9171142578125, 6.13433837890625, 6.3515625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 6.0, 8.0, 29.0, 34.0, 54.0, 100.0, 137.0, 241.0, 510.0, 1479.0, 6751.0, 47447.0, 435092.0, 2453832.0, 1104208.0, 124735.0, 15322.0, 2772.0, 756.0, 324.0, 172.0, 95.0, 65.0, 35.0, 27.0, 21.0, 12.0, 7.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9296875, -9.5955810546875, -9.261474609375, -8.9273681640625, -8.59326171875, -8.2591552734375, -7.925048828125, -7.5909423828125, -7.2568359375, -6.9227294921875, -6.588623046875, -6.2545166015625, -5.92041015625, -5.5863037109375, -5.252197265625, -4.9180908203125, -4.583984375, -4.2498779296875, -3.915771484375, -3.5816650390625, -3.24755859375, -2.9134521484375, -2.579345703125, -2.2452392578125, -1.9111328125, -1.5770263671875, -1.242919921875, -0.9088134765625, -0.57470703125, -0.2406005859375, 0.093505859375, 0.4276123046875, 0.76171875, 1.0958251953125, 1.429931640625, 1.7640380859375, 2.09814453125, 2.4322509765625, 2.766357421875, 3.1004638671875, 3.4345703125, 3.7686767578125, 4.102783203125, 4.4368896484375, 4.77099609375, 5.1051025390625, 5.439208984375, 5.7733154296875, 6.107421875, 6.4415283203125, 6.775634765625, 7.1097412109375, 7.44384765625, 7.7779541015625, 8.112060546875, 8.4461669921875, 8.7802734375, 9.1143798828125, 9.448486328125, 9.7825927734375, 10.11669921875, 10.4508056640625, 10.784912109375, 11.1190185546875, 11.453125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 24.0, 60.0, 136.0, 204.0, 239.0, 174.0, 112.0, 49.0, 12.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.100248336791992, -26.759870529174805, -24.419490814208984, -22.079113006591797, -19.73873519897461, -17.398357391357422, -15.057978630065918, -12.717599868774414, -10.377222061157227, -8.036844253540039, -5.696465492248535, -3.3560872077941895, -1.0157089233398438, 1.3246688842773438, 3.6650476455688477, 6.005426406860352, 8.345804214477539, 10.686182022094727, 13.02656078338623, 15.366939544677734, 17.707317352294922, 20.04769515991211, 22.388072967529297, 24.728452682495117, 27.068830490112305, 29.409208297729492, 31.749588012695312, 34.0899658203125, 36.43034362792969, 38.770721435546875, 41.11109924316406, 43.45147705078125, 45.79186248779297, 48.132240295410156, 50.472618103027344, 52.81299591064453, 55.15337371826172, 57.493751525878906, 59.83413314819336, 62.17451095581055, 64.514892578125, 66.85527038574219, 69.19564819335938, 71.53602600097656, 73.87640380859375, 76.21678161621094, 78.55715942382812, 80.89753723144531, 83.2379150390625, 85.57829284667969, 87.91867065429688, 90.25904846191406, 92.59942626953125, 94.93980407714844, 97.28018188476562, 99.62055969238281, 101.9609375, 104.30131530761719, 106.64169311523438, 108.98207092285156, 111.32244873046875, 113.66282653808594, 116.00320434570312, 118.34358215332031, 120.68396759033203]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 3.0, 4.0, 5.0, 4.0, 7.0, 5.0, 15.0, 17.0, 16.0, 27.0, 23.0, 19.0, 23.0, 20.0, 26.0, 36.0, 37.0, 32.0, 39.0, 36.0, 35.0, 33.0, 38.0, 50.0, 57.0, 37.0, 34.0, 37.0, 30.0, 27.0, 32.0, 23.0, 19.0, 29.0, 25.0, 19.0, 10.0, 13.0, 9.0, 12.0, 8.0, 4.0, 8.0, 3.0, 3.0, 3.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.26940155029297, -16.721149444580078, -16.172897338867188, -15.62464714050293, -15.076395034790039, -14.528142929077148, -13.979891777038574, -13.431640625, -12.88338851928711, -12.335136413574219, -11.786885261535645, -11.23863410949707, -10.69038200378418, -10.142129898071289, -9.593878746032715, -9.04562759399414, -8.49737548828125, -7.949123859405518, -7.400872230529785, -6.852620601654053, -6.30436897277832, -5.756117343902588, -5.2078657150268555, -4.659614086151123, -4.111362457275391, -3.563110828399658, -3.014859199523926, -2.4666075706481934, -1.918355941772461, -1.3701043128967285, -0.8218526840209961, -0.27360105514526367, 0.27465057373046875, 0.8229022026062012, 1.3711538314819336, 1.919405460357666, 2.4676570892333984, 3.015908718109131, 3.5641603469848633, 4.112411975860596, 4.660663604736328, 5.2089152336120605, 5.757166862487793, 6.305418491363525, 6.853670120239258, 7.40192174911499, 7.950173377990723, 8.498424530029297, 9.046676635742188, 9.594928741455078, 10.143179893493652, 10.691431045532227, 11.239683151245117, 11.787935256958008, 12.336186408996582, 12.884437561035156, 13.432689666748047, 13.980941772460938, 14.529192924499512, 15.077444076538086, 15.625696182250977, 16.173948287963867, 16.722198486328125, 17.270450592041016, 17.818702697753906]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 11.0, 7.0, 11.0, 14.0, 12.0, 15.0, 16.0, 21.0, 18.0, 23.0, 25.0, 34.0, 27.0, 31.0, 33.0, 40.0, 42.0, 30.0, 49.0, 54.0, 30.0, 40.0, 40.0, 35.0, 26.0, 28.0, 32.0, 38.0, 25.0, 22.0, 24.0, 16.0, 24.0, 9.0, 17.0, 20.0, 12.0, 11.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.072265625, -2.00634765625, -1.9404296875, -1.87451171875, -1.80859375, -1.74267578125, -1.6767578125, -1.61083984375, -1.544921875, -1.47900390625, -1.4130859375, -1.34716796875, -1.28125, -1.21533203125, -1.1494140625, -1.08349609375, -1.017578125, -0.95166015625, -0.8857421875, -0.81982421875, -0.75390625, -0.68798828125, -0.6220703125, -0.55615234375, -0.490234375, -0.42431640625, -0.3583984375, -0.29248046875, -0.2265625, -0.16064453125, -0.0947265625, -0.02880859375, 0.037109375, 0.10302734375, 0.1689453125, 0.23486328125, 0.30078125, 0.36669921875, 0.4326171875, 0.49853515625, 0.564453125, 0.63037109375, 0.6962890625, 0.76220703125, 0.828125, 0.89404296875, 0.9599609375, 1.02587890625, 1.091796875, 1.15771484375, 1.2236328125, 1.28955078125, 1.35546875, 1.42138671875, 1.4873046875, 1.55322265625, 1.619140625, 1.68505859375, 1.7509765625, 1.81689453125, 1.8828125, 1.94873046875, 2.0146484375, 2.08056640625, 2.146484375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 7.0, 9.0, 14.0, 21.0, 23.0, 47.0, 54.0, 77.0, 137.0, 198.0, 299.0, 438.0, 745.0, 1102.0, 1668.0, 2617.0, 3993.0, 6076.0, 9705.0, 15772.0, 25883.0, 43908.0, 76297.0, 148867.0, 370524.0, 149874.0, 76786.0, 43931.0, 26185.0, 15853.0, 9816.0, 6272.0, 4066.0, 2568.0, 1598.0, 1096.0, 685.0, 451.0, 288.0, 226.0, 134.0, 84.0, 55.0, 30.0, 27.0, 18.0, 11.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.093017578125, -0.09006500244140625, -0.0871124267578125, -0.08415985107421875, -0.081207275390625, -0.07825469970703125, -0.0753021240234375, -0.07234954833984375, -0.06939697265625, -0.06644439697265625, -0.0634918212890625, -0.06053924560546875, -0.057586669921875, -0.05463409423828125, -0.0516815185546875, -0.04872894287109375, -0.0457763671875, -0.04282379150390625, -0.0398712158203125, -0.03691864013671875, -0.033966064453125, -0.03101348876953125, -0.0280609130859375, -0.02510833740234375, -0.02215576171875, -0.01920318603515625, -0.0162506103515625, -0.01329803466796875, -0.010345458984375, -0.00739288330078125, -0.0044403076171875, -0.00148773193359375, 0.00146484375, 0.00441741943359375, 0.0073699951171875, 0.01032257080078125, 0.013275146484375, 0.01622772216796875, 0.0191802978515625, 0.02213287353515625, 0.02508544921875, 0.02803802490234375, 0.0309906005859375, 0.03394317626953125, 0.036895751953125, 0.03984832763671875, 0.0428009033203125, 0.04575347900390625, 0.0487060546875, 0.05165863037109375, 0.0546112060546875, 0.05756378173828125, 0.060516357421875, 0.06346893310546875, 0.0664215087890625, 0.06937408447265625, 0.07232666015625, 0.07527923583984375, 0.0782318115234375, 0.08118438720703125, 0.084136962890625, 0.08708953857421875, 0.0900421142578125, 0.09299468994140625, 0.095947265625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 11.0, 14.0, 7.0, 6.0, 12.0, 31.0, 22.0, 22.0, 27.0, 26.0, 28.0, 26.0, 42.0, 35.0, 47.0, 47.0, 48.0, 1060.0, 43.0, 42.0, 33.0, 36.0, 37.0, 44.0, 28.0, 31.0, 28.0, 33.0, 23.0, 19.0, 18.0, 27.0, 8.0, 7.0, 8.0, 11.0, 9.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5654296875, -1.5162811279296875, -1.467132568359375, -1.4179840087890625, -1.36883544921875, -1.3196868896484375, -1.270538330078125, -1.2213897705078125, -1.1722412109375, -1.1230926513671875, -1.073944091796875, -1.0247955322265625, -0.97564697265625, -0.9264984130859375, -0.877349853515625, -0.8282012939453125, -0.779052734375, -0.7299041748046875, -0.680755615234375, -0.6316070556640625, -0.58245849609375, -0.5333099365234375, -0.484161376953125, -0.4350128173828125, -0.3858642578125, -0.3367156982421875, -0.287567138671875, -0.2384185791015625, -0.18927001953125, -0.1401214599609375, -0.090972900390625, -0.0418243408203125, 0.00732421875, 0.0564727783203125, 0.105621337890625, 0.1547698974609375, 0.20391845703125, 0.2530670166015625, 0.302215576171875, 0.3513641357421875, 0.4005126953125, 0.4496612548828125, 0.498809814453125, 0.5479583740234375, 0.59710693359375, 0.6462554931640625, 0.695404052734375, 0.7445526123046875, 0.793701171875, 0.8428497314453125, 0.891998291015625, 0.9411468505859375, 0.99029541015625, 1.0394439697265625, 1.088592529296875, 1.1377410888671875, 1.1868896484375, 1.2360382080078125, 1.285186767578125, 1.3343353271484375, 1.38348388671875, 1.4326324462890625, 1.481781005859375, 1.5309295654296875, 1.580078125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 10.0, 8.0, 23.0, 24.0, 40.0, 60.0, 80.0, 144.0, 173.0, 296.0, 448.0, 670.0, 953.0, 1395.0, 2103.0, 3056.0, 4670.0, 6718.0, 10288.0, 14993.0, 22845.0, 35240.0, 57156.0, 97527.0, 198989.0, 1333253.0, 119656.0, 66931.0, 40643.0, 26151.0, 17263.0, 11603.0, 7632.0, 5217.0, 3594.0, 2398.0, 1553.0, 1082.0, 773.0, 458.0, 343.0, 239.0, 144.0, 96.0, 60.0, 61.0, 18.0, 22.0, 13.0, 9.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.045562744140625, -0.044146060943603516, -0.04272937774658203, -0.04131269454956055, -0.03989601135253906, -0.03847932815551758, -0.037062644958496094, -0.03564596176147461, -0.034229278564453125, -0.03281259536743164, -0.031395912170410156, -0.029979228973388672, -0.028562545776367188, -0.027145862579345703, -0.02572917938232422, -0.024312496185302734, -0.02289581298828125, -0.021479129791259766, -0.02006244659423828, -0.018645763397216797, -0.017229080200195312, -0.015812397003173828, -0.014395713806152344, -0.01297903060913086, -0.011562347412109375, -0.01014566421508789, -0.008728981018066406, -0.007312297821044922, -0.0058956146240234375, -0.004478931427001953, -0.0030622482299804688, -0.0016455650329589844, -0.0002288818359375, 0.0011878013610839844, 0.0026044845581054688, 0.004021167755126953, 0.0054378509521484375, 0.006854534149169922, 0.008271217346191406, 0.00968790054321289, 0.011104583740234375, 0.01252126693725586, 0.013937950134277344, 0.015354633331298828, 0.016771316528320312, 0.018187999725341797, 0.01960468292236328, 0.021021366119384766, 0.02243804931640625, 0.023854732513427734, 0.02527141571044922, 0.026688098907470703, 0.028104782104492188, 0.029521465301513672, 0.030938148498535156, 0.03235483169555664, 0.033771514892578125, 0.03518819808959961, 0.036604881286621094, 0.03802156448364258, 0.03943824768066406, 0.04085493087768555, 0.04227161407470703, 0.043688297271728516, 0.04510498046875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 18.0, 0.0, 21.0, 0.0, 27.0, 0.0, 32.0, 0.0, 50.0, 89.0, 0.0, 500.0, 0.0, 87.0, 0.0, 53.0, 0.0, 45.0, 0.0, 28.0, 0.0, 13.0, 0.0, 14.0, 0.0, 9.0, 0.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0], "bins": [-1.0728836059570312e-06, -1.0421499609947205e-06, -1.0114163160324097e-06, -9.806826710700989e-07, -9.499490261077881e-07, -9.192153811454773e-07, -8.884817361831665e-07, -8.577480912208557e-07, -8.270144462585449e-07, -7.962808012962341e-07, -7.655471563339233e-07, -7.348135113716125e-07, -7.040798664093018e-07, -6.73346221446991e-07, -6.426125764846802e-07, -6.118789315223694e-07, -5.811452865600586e-07, -5.504116415977478e-07, -5.19677996635437e-07, -4.889443516731262e-07, -4.5821070671081543e-07, -4.2747706174850464e-07, -3.9674341678619385e-07, -3.6600977182388306e-07, -3.3527612686157227e-07, -3.045424818992615e-07, -2.738088369369507e-07, -2.430751919746399e-07, -2.123415470123291e-07, -1.816079020500183e-07, -1.5087425708770752e-07, -1.2014061212539673e-07, -8.940696716308594e-08, -5.8673322200775146e-08, -2.7939677238464355e-08, 2.7939677238464355e-09, 3.3527612686157227e-08, 6.426125764846802e-08, 9.499490261077881e-08, 1.257285475730896e-07, 1.564621925354004e-07, 1.8719583749771118e-07, 2.1792948246002197e-07, 2.4866312742233276e-07, 2.7939677238464355e-07, 3.1013041734695435e-07, 3.4086406230926514e-07, 3.7159770727157593e-07, 4.023313522338867e-07, 4.330649971961975e-07, 4.637986421585083e-07, 4.945322871208191e-07, 5.252659320831299e-07, 5.559995770454407e-07, 5.867332220077515e-07, 6.174668669700623e-07, 6.48200511932373e-07, 6.789341568946838e-07, 7.096678018569946e-07, 7.404014468193054e-07, 7.711350917816162e-07, 8.01868736743927e-07, 8.326023817062378e-07, 8.633360266685486e-07, 8.940696716308594e-07]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 3.0, 3.0, 6.0, 11.0, 7.0, 28.0, 42.0, 47.0, 68.0, 157.0, 1164.0, 35665.0, 959153.0, 50288.0, 1510.0, 160.0, 77.0, 49.0, 27.0, 24.0, 16.0, 8.0, 5.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.895427703857422e-05, -1.8312595784664154e-05, -1.767091453075409e-05, -1.7029233276844025e-05, -1.638755202293396e-05, -1.5745870769023895e-05, -1.510418951511383e-05, -1.4462508261203766e-05, -1.3820827007293701e-05, -1.3179145753383636e-05, -1.2537464499473572e-05, -1.1895783245563507e-05, -1.1254101991653442e-05, -1.0612420737743378e-05, -9.970739483833313e-06, -9.329058229923248e-06, -8.687376976013184e-06, -8.045695722103119e-06, -7.404014468193054e-06, -6.7623332142829895e-06, -6.120651960372925e-06, -5.47897070646286e-06, -4.837289452552795e-06, -4.195608198642731e-06, -3.553926944732666e-06, -2.9122456908226013e-06, -2.2705644369125366e-06, -1.628883183002472e-06, -9.872019290924072e-07, -3.4552067518234253e-07, 2.9616057872772217e-07, 9.378418326377869e-07, 1.5795230865478516e-06, 2.2212043404579163e-06, 2.862885594367981e-06, 3.5045668482780457e-06, 4.14624810218811e-06, 4.787929356098175e-06, 5.42961061000824e-06, 6.0712918639183044e-06, 6.712973117828369e-06, 7.354654371738434e-06, 7.996335625648499e-06, 8.638016879558563e-06, 9.279698133468628e-06, 9.921379387378693e-06, 1.0563060641288757e-05, 1.1204741895198822e-05, 1.1846423149108887e-05, 1.2488104403018951e-05, 1.3129785656929016e-05, 1.377146691083908e-05, 1.4413148164749146e-05, 1.505482941865921e-05, 1.5696510672569275e-05, 1.633819192647934e-05, 1.6979873180389404e-05, 1.762155443429947e-05, 1.8263235688209534e-05, 1.89049169421196e-05, 1.9546598196029663e-05, 2.0188279449939728e-05, 2.0829960703849792e-05, 2.1471641957759857e-05, 2.2113323211669922e-05]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 8.0, 10.0, 17.0, 24.0, 20.0, 15.0, 11.0, 17.0, 26.0, 647.0, 30.0, 22.0, 24.0, 16.0, 25.0, 16.0, 13.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.0980652354628546e-07, -3.018973870894115e-07, -2.939882222108281e-07, -2.860790573322447e-07, -2.7816992087537074e-07, -2.7026078441849677e-07, -2.6235161953991337e-07, -2.5444245466133e-07, -2.46533318204456e-07, -2.3862418174758204e-07, -2.3071501686899865e-07, -2.2280586620126996e-07, -2.1489671553354128e-07, -2.069875648658126e-07, -1.9907841419808392e-07, -1.9116926353035524e-07, -1.8326011286262656e-07, -1.7535096219489787e-07, -1.674418115271692e-07, -1.595326608594405e-07, -1.5162351019171183e-07, -1.4371435952398315e-07, -1.3580520885625447e-07, -1.2789605818852579e-07, -1.199869075207971e-07, -1.1207775685306842e-07, -1.0416860618533974e-07, -9.625945551761106e-08, -8.835030484988238e-08, -8.04411541821537e-08, -7.253200351442501e-08, -6.462285284669633e-08, -5.6713716389822366e-08, -4.8804565722093685e-08, -4.0895415054365e-08, -3.298626438663632e-08, -2.507711371890764e-08, -1.7167963051178958e-08, -9.258812383450277e-09, -1.349661715721595e-09, 6.5594889520070865e-09, 1.4468639619735768e-08, 2.237779028746445e-08, 3.028694095519313e-08, 3.819609162292181e-08, 4.6105242290650494e-08, 5.4014392958379176e-08, 6.192354362610786e-08, 6.983269429383654e-08, 7.774184496156522e-08, 8.56509956292939e-08, 9.356014629702258e-08, 1.0146929696475127e-07, 1.0937844763247995e-07, 1.1728759830020863e-07, 1.251967489679373e-07, 1.33105899635666e-07, 1.4101505030339467e-07, 1.4892420097112335e-07, 1.5683335163885204e-07, 1.6474250230658072e-07, 1.726516529743094e-07, 1.8056080364203808e-07, 1.8846995430976676e-07, 1.9637910497749544e-07]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 133.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 685.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 130.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 11.0, 7.0, 11.0, 14.0, 12.0, 15.0, 16.0, 21.0, 18.0, 23.0, 25.0, 34.0, 27.0, 31.0, 33.0, 40.0, 42.0, 30.0, 49.0, 54.0, 30.0, 40.0, 40.0, 35.0, 26.0, 28.0, 32.0, 38.0, 25.0, 22.0, 24.0, 16.0, 24.0, 9.0, 17.0, 20.0, 12.0, 11.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.072265625, -2.00634765625, -1.9404296875, -1.87451171875, -1.80859375, -1.74267578125, -1.6767578125, -1.61083984375, -1.544921875, -1.47900390625, -1.4130859375, -1.34716796875, -1.28125, -1.21533203125, -1.1494140625, -1.08349609375, -1.017578125, -0.95166015625, -0.8857421875, -0.81982421875, -0.75390625, -0.68798828125, -0.6220703125, -0.55615234375, -0.490234375, -0.42431640625, -0.3583984375, -0.29248046875, -0.2265625, -0.16064453125, -0.0947265625, -0.02880859375, 0.037109375, 0.10302734375, 0.1689453125, 0.23486328125, 0.30078125, 0.36669921875, 0.4326171875, 0.49853515625, 0.564453125, 0.63037109375, 0.6962890625, 0.76220703125, 0.828125, 0.89404296875, 0.9599609375, 1.02587890625, 1.091796875, 1.15771484375, 1.2236328125, 1.28955078125, 1.35546875, 1.42138671875, 1.4873046875, 1.55322265625, 1.619140625, 1.68505859375, 1.7509765625, 1.81689453125, 1.8828125, 1.94873046875, 2.0146484375, 2.08056640625, 2.146484375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 6.0, 23.0, 26.0, 40.0, 79.0, 159.0, 277.0, 484.0, 769.0, 1367.0, 2345.0, 4448.0, 8347.0, 16427.0, 34289.0, 74063.0, 185627.0, 376803.0, 195074.0, 76658.0, 35538.0, 17005.0, 8513.0, 4488.0, 2431.0, 1343.0, 802.0, 467.0, 277.0, 184.0, 78.0, 38.0, 29.0, 25.0, 8.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.015625, -3.89215087890625, -3.7686767578125, -3.64520263671875, -3.521728515625, -3.39825439453125, -3.2747802734375, -3.15130615234375, -3.02783203125, -2.90435791015625, -2.7808837890625, -2.65740966796875, -2.533935546875, -2.41046142578125, -2.2869873046875, -2.16351318359375, -2.0400390625, -1.91656494140625, -1.7930908203125, -1.66961669921875, -1.546142578125, -1.42266845703125, -1.2991943359375, -1.17572021484375, -1.05224609375, -0.92877197265625, -0.8052978515625, -0.68182373046875, -0.558349609375, -0.43487548828125, -0.3114013671875, -0.18792724609375, -0.064453125, 0.05902099609375, 0.1824951171875, 0.30596923828125, 0.429443359375, 0.55291748046875, 0.6763916015625, 0.79986572265625, 0.92333984375, 1.04681396484375, 1.1702880859375, 1.29376220703125, 1.417236328125, 1.54071044921875, 1.6641845703125, 1.78765869140625, 1.9111328125, 2.03460693359375, 2.1580810546875, 2.28155517578125, 2.405029296875, 2.52850341796875, 2.6519775390625, 2.77545166015625, 2.89892578125, 3.02239990234375, 3.1458740234375, 3.26934814453125, 3.392822265625, 3.51629638671875, 3.6397705078125, 3.76324462890625, 3.88671875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 5.0, 9.0, 8.0, 6.0, 10.0, 10.0, 10.0, 12.0, 7.0, 20.0, 24.0, 22.0, 36.0, 33.0, 39.0, 34.0, 72.0, 55.0, 91.0, 110.0, 220.0, 1321.0, 237.0, 147.0, 86.0, 66.0, 59.0, 43.0, 28.0, 41.0, 28.0, 30.0, 28.0, 29.0, 14.0, 11.0, 15.0, 10.0, 6.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.1171875, -7.84228515625, -7.5673828125, -7.29248046875, -7.017578125, -6.74267578125, -6.4677734375, -6.19287109375, -5.91796875, -5.64306640625, -5.3681640625, -5.09326171875, -4.818359375, -4.54345703125, -4.2685546875, -3.99365234375, -3.71875, -3.44384765625, -3.1689453125, -2.89404296875, -2.619140625, -2.34423828125, -2.0693359375, -1.79443359375, -1.51953125, -1.24462890625, -0.9697265625, -0.69482421875, -0.419921875, -0.14501953125, 0.1298828125, 0.40478515625, 0.6796875, 0.95458984375, 1.2294921875, 1.50439453125, 1.779296875, 2.05419921875, 2.3291015625, 2.60400390625, 2.87890625, 3.15380859375, 3.4287109375, 3.70361328125, 3.978515625, 4.25341796875, 4.5283203125, 4.80322265625, 5.078125, 5.35302734375, 5.6279296875, 5.90283203125, 6.177734375, 6.45263671875, 6.7275390625, 7.00244140625, 7.27734375, 7.55224609375, 7.8271484375, 8.10205078125, 8.376953125, 8.65185546875, 8.9267578125, 9.20166015625, 9.4765625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 8.0, 7.0, 10.0, 10.0, 29.0, 30.0, 44.0, 72.0, 89.0, 123.0, 163.0, 249.0, 579.0, 1799.0, 11116.0, 170299.0, 2767685.0, 178652.0, 11487.0, 1731.0, 612.0, 296.0, 149.0, 126.0, 81.0, 54.0, 43.0, 36.0, 34.0, 20.0, 16.0, 19.0, 9.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.875, -17.2890625, -16.703125, -16.1171875, -15.53125, -14.9453125, -14.359375, -13.7734375, -13.1875, -12.6015625, -12.015625, -11.4296875, -10.84375, -10.2578125, -9.671875, -9.0859375, -8.5, -7.9140625, -7.328125, -6.7421875, -6.15625, -5.5703125, -4.984375, -4.3984375, -3.8125, -3.2265625, -2.640625, -2.0546875, -1.46875, -0.8828125, -0.296875, 0.2890625, 0.875, 1.4609375, 2.046875, 2.6328125, 3.21875, 3.8046875, 4.390625, 4.9765625, 5.5625, 6.1484375, 6.734375, 7.3203125, 7.90625, 8.4921875, 9.078125, 9.6640625, 10.25, 10.8359375, 11.421875, 12.0078125, 12.59375, 13.1796875, 13.765625, 14.3515625, 14.9375, 15.5234375, 16.109375, 16.6953125, 17.28125, 17.8671875, 18.453125, 19.0390625, 19.625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 151.0, 649.0, 196.0, 20.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.149761199951172, -18.923728942871094, -13.697694778442383, -8.471661567687988, -3.2456283569335938, 1.9804039001464844, 7.206438064575195, 12.432472229003906, 17.658504486083984, 22.884536743164062, 28.110570907592773, 33.336605072021484, 38.56263732910156, 43.78866958618164, 49.01470184326172, 54.24073791503906, 59.46677017211914, 64.69280242919922, 69.91883850097656, 75.14486694335938, 80.37090301513672, 85.59693908691406, 90.82296752929688, 96.04900360107422, 101.27503967285156, 106.5010757446289, 111.72710418701172, 116.95314025878906, 122.17916870117188, 127.40520477294922, 132.63124084472656, 137.85726928710938, 143.08331298828125, 148.30934143066406, 153.53538513183594, 158.76141357421875, 163.98744201660156, 169.21347045898438, 174.43951416015625, 179.66554260253906, 184.89157104492188, 190.1175994873047, 195.34364318847656, 200.56967163085938, 205.7957000732422, 211.021728515625, 216.24777221679688, 221.4738006591797, 226.69984436035156, 231.92587280273438, 237.15191650390625, 242.37794494628906, 247.60397338867188, 252.83001708984375, 258.0560302734375, 263.2820739746094, 268.50811767578125, 273.7341613769531, 278.9601745605469, 284.18621826171875, 289.4122619628906, 294.6382751464844, 299.86431884765625, 305.0903625488281, 310.3163757324219]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 3.0, 4.0, 3.0, 8.0, 16.0, 13.0, 12.0, 19.0, 19.0, 23.0, 28.0, 30.0, 37.0, 35.0, 43.0, 37.0, 37.0, 45.0, 42.0, 57.0, 48.0, 45.0, 39.0, 38.0, 36.0, 39.0, 28.0, 42.0, 34.0, 18.0, 17.0, 23.0, 9.0, 22.0, 9.0, 13.0, 11.0, 3.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.152633666992188, -25.332061767578125, -24.511489868164062, -23.69091796875, -22.870344161987305, -22.049772262573242, -21.22920036315918, -20.408628463745117, -19.588054656982422, -18.76748275756836, -17.946910858154297, -17.126338958740234, -16.30576515197754, -15.485193252563477, -14.664621353149414, -13.844049453735352, -13.023477554321289, -12.202905654907227, -11.382332801818848, -10.561760902404785, -9.741188049316406, -8.920616149902344, -8.100044250488281, -7.2794718742370605, -6.45889949798584, -5.638327121734619, -4.817754745483398, -3.997182846069336, -3.1766104698181152, -2.3560380935668945, -1.535466194152832, -0.7148938179016113, 0.10568046569824219, 0.9262527227401733, 1.7468249797821045, 2.567397117614746, 3.387969493865967, 4.2085418701171875, 5.02911376953125, 5.849686145782471, 6.670258522033691, 7.490830898284912, 8.311403274536133, 9.131975173950195, 9.952547073364258, 10.773119926452637, 11.5936918258667, 12.414264678955078, 13.23483657836914, 14.055408477783203, 14.875981330871582, 15.696553230285645, 16.517126083374023, 17.337697982788086, 18.15826988220215, 18.97884178161621, 19.799415588378906, 20.61998748779297, 21.44055938720703, 22.261131286621094, 23.08170509338379, 23.90227699279785, 24.722848892211914, 25.543420791625977, 26.36399269104004]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 12.0, 2.0, 5.0, 6.0, 5.0, 6.0, 6.0, 9.0, 9.0, 11.0, 18.0, 23.0, 19.0, 21.0, 23.0, 23.0, 33.0, 26.0, 27.0, 37.0, 22.0, 34.0, 38.0, 32.0, 39.0, 34.0, 42.0, 44.0, 34.0, 29.0, 40.0, 27.0, 24.0, 33.0, 30.0, 30.0, 20.0, 21.0, 22.0, 11.0, 11.0, 15.0, 10.0, 11.0, 5.0, 8.0, 5.0, 8.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-2.349609375, -2.278961181640625, -2.20831298828125, -2.137664794921875, -2.0670166015625, -1.996368408203125, -1.92572021484375, -1.855072021484375, -1.784423828125, -1.713775634765625, -1.64312744140625, -1.572479248046875, -1.5018310546875, -1.431182861328125, -1.36053466796875, -1.289886474609375, -1.21923828125, -1.148590087890625, -1.07794189453125, -1.007293701171875, -0.9366455078125, -0.865997314453125, -0.79534912109375, -0.724700927734375, -0.654052734375, -0.583404541015625, -0.51275634765625, -0.442108154296875, -0.3714599609375, -0.300811767578125, -0.23016357421875, -0.159515380859375, -0.0888671875, -0.018218994140625, 0.05242919921875, 0.123077392578125, 0.1937255859375, 0.264373779296875, 0.33502197265625, 0.405670166015625, 0.476318359375, 0.546966552734375, 0.61761474609375, 0.688262939453125, 0.7589111328125, 0.829559326171875, 0.90020751953125, 0.970855712890625, 1.04150390625, 1.112152099609375, 1.18280029296875, 1.253448486328125, 1.3240966796875, 1.394744873046875, 1.46539306640625, 1.536041259765625, 1.606689453125, 1.677337646484375, 1.74798583984375, 1.818634033203125, 1.8892822265625, 1.959930419921875, 2.03057861328125, 2.101226806640625, 2.171875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 4.0, 4.0, 9.0, 13.0, 15.0, 16.0, 30.0, 36.0, 32.0, 57.0, 123.0, 225.0, 440.0, 1431.0, 5812.0, 33569.0, 239599.0, 1616195.0, 1928951.0, 313863.0, 43641.0, 7374.0, 1704.0, 507.0, 233.0, 120.0, 62.0, 54.0, 27.0, 30.0, 16.0, 16.0, 8.0, 7.0, 12.0, 10.0, 7.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.859375, -7.6473388671875, -7.435302734375, -7.2232666015625, -7.01123046875, -6.7991943359375, -6.587158203125, -6.3751220703125, -6.1630859375, -5.9510498046875, -5.739013671875, -5.5269775390625, -5.31494140625, -5.1029052734375, -4.890869140625, -4.6788330078125, -4.466796875, -4.2547607421875, -4.042724609375, -3.8306884765625, -3.61865234375, -3.4066162109375, -3.194580078125, -2.9825439453125, -2.7705078125, -2.5584716796875, -2.346435546875, -2.1343994140625, -1.92236328125, -1.7103271484375, -1.498291015625, -1.2862548828125, -1.07421875, -0.8621826171875, -0.650146484375, -0.4381103515625, -0.22607421875, -0.0140380859375, 0.197998046875, 0.4100341796875, 0.6220703125, 0.8341064453125, 1.046142578125, 1.2581787109375, 1.47021484375, 1.6822509765625, 1.894287109375, 2.1063232421875, 2.318359375, 2.5303955078125, 2.742431640625, 2.9544677734375, 3.16650390625, 3.3785400390625, 3.590576171875, 3.8026123046875, 4.0146484375, 4.2266845703125, 4.438720703125, 4.6507568359375, 4.86279296875, 5.0748291015625, 5.286865234375, 5.4989013671875, 5.7109375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 16.0, 16.0, 22.0, 16.0, 45.0, 57.0, 59.0, 98.0, 137.0, 169.0, 239.0, 284.0, 406.0, 439.0, 440.0, 386.0, 321.0, 263.0, 194.0, 142.0, 91.0, 54.0, 41.0, 46.0, 22.0, 19.0, 16.0, 11.0, 12.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.409423828125, -4.21728515625, -4.025146484375, -3.8330078125, -3.640869140625, -3.44873046875, -3.256591796875, -3.064453125, -2.872314453125, -2.68017578125, -2.488037109375, -2.2958984375, -2.103759765625, -1.91162109375, -1.719482421875, -1.52734375, -1.335205078125, -1.14306640625, -0.950927734375, -0.7587890625, -0.566650390625, -0.37451171875, -0.182373046875, 0.009765625, 0.201904296875, 0.39404296875, 0.586181640625, 0.7783203125, 0.970458984375, 1.16259765625, 1.354736328125, 1.546875, 1.739013671875, 1.93115234375, 2.123291015625, 2.3154296875, 2.507568359375, 2.69970703125, 2.891845703125, 3.083984375, 3.276123046875, 3.46826171875, 3.660400390625, 3.8525390625, 4.044677734375, 4.23681640625, 4.428955078125, 4.62109375, 4.813232421875, 5.00537109375, 5.197509765625, 5.3896484375, 5.581787109375, 5.77392578125, 5.966064453125, 6.158203125, 6.350341796875, 6.54248046875, 6.734619140625, 6.9267578125, 7.118896484375, 7.31103515625, 7.503173828125, 7.6953125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 15.0, 11.0, 25.0, 32.0, 36.0, 52.0, 82.0, 145.0, 171.0, 297.0, 686.0, 2326.0, 13596.0, 142809.0, 1486894.0, 2252146.0, 265348.0, 24467.0, 3318.0, 830.0, 378.0, 216.0, 118.0, 87.0, 70.0, 33.0, 30.0, 16.0, 19.0, 11.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-14.5625, -14.1995849609375, -13.836669921875, -13.4737548828125, -13.11083984375, -12.7479248046875, -12.385009765625, -12.0220947265625, -11.6591796875, -11.2962646484375, -10.933349609375, -10.5704345703125, -10.20751953125, -9.8446044921875, -9.481689453125, -9.1187744140625, -8.755859375, -8.3929443359375, -8.030029296875, -7.6671142578125, -7.30419921875, -6.9412841796875, -6.578369140625, -6.2154541015625, -5.8525390625, -5.4896240234375, -5.126708984375, -4.7637939453125, -4.40087890625, -4.0379638671875, -3.675048828125, -3.3121337890625, -2.94921875, -2.5863037109375, -2.223388671875, -1.8604736328125, -1.49755859375, -1.1346435546875, -0.771728515625, -0.4088134765625, -0.0458984375, 0.3170166015625, 0.679931640625, 1.0428466796875, 1.40576171875, 1.7686767578125, 2.131591796875, 2.4945068359375, 2.857421875, 3.2203369140625, 3.583251953125, 3.9461669921875, 4.30908203125, 4.6719970703125, 5.034912109375, 5.3978271484375, 5.7607421875, 6.1236572265625, 6.486572265625, 6.8494873046875, 7.21240234375, 7.5753173828125, 7.938232421875, 8.3011474609375, 8.6640625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 22.0, 65.0, 125.0, 196.0, 211.0, 194.0, 129.0, 52.0, 19.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.29646873474121, -26.009565353393555, -23.72266387939453, -21.435760498046875, -19.14885711669922, -16.861953735351562, -14.575051307678223, -12.288148880004883, -10.001245498657227, -7.7143425941467285, -5.4274396896362305, -3.1405367851257324, -0.8536338806152344, 1.4332695007324219, 3.7201719284057617, 6.007074356079102, 8.293977737426758, 10.580881118774414, 12.867783546447754, 15.154685974121094, 17.44158935546875, 19.728492736816406, 22.015396118164062, 24.302297592163086, 26.589200973510742, 28.8761043548584, 31.163005828857422, 33.44990921020508, 35.736812591552734, 38.02371597290039, 40.31061935424805, 42.59751892089844, 44.884429931640625, 47.17133331298828, 49.45823669433594, 51.745140075683594, 54.03204345703125, 56.318946838378906, 58.6058464050293, 60.89274978637695, 63.17965316772461, 65.466552734375, 67.75345611572266, 70.04035949707031, 72.32726287841797, 74.61416625976562, 76.90106964111328, 79.18797302246094, 81.4748764038086, 83.76177978515625, 86.0486831665039, 88.33558654785156, 90.62248992919922, 92.90939331054688, 95.19629669189453, 97.48320007324219, 99.77009582519531, 102.05699920654297, 104.34390258789062, 106.63080596923828, 108.91770935058594, 111.2046127319336, 113.49151611328125, 115.77841186523438, 118.06532287597656]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 7.0, 6.0, 9.0, 14.0, 7.0, 16.0, 19.0, 16.0, 27.0, 28.0, 22.0, 23.0, 39.0, 41.0, 31.0, 41.0, 50.0, 38.0, 49.0, 51.0, 43.0, 42.0, 47.0, 40.0, 37.0, 35.0, 33.0, 35.0, 23.0, 18.0, 27.0, 19.0, 14.0, 15.0, 14.0, 8.0, 2.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.35489273071289, -18.71091651916504, -18.066940307617188, -17.422964096069336, -16.778987884521484, -16.135011672973633, -15.491035461425781, -14.84705924987793, -14.203083038330078, -13.559106826782227, -12.915130615234375, -12.271154403686523, -11.627178192138672, -10.98320198059082, -10.339225769042969, -9.695249557495117, -9.051274299621582, -8.40729808807373, -7.763321876525879, -7.119345664978027, -6.475369453430176, -5.831393241882324, -5.187417507171631, -4.543441295623779, -3.8994650840759277, -3.255488872528076, -2.6115126609802246, -1.9675366878509521, -1.3235604763031006, -0.679584264755249, -0.03560829162597656, 0.608367919921875, 1.2523441314697266, 1.8963203430175781, 2.5402965545654297, 3.184272527694702, 3.8282487392425537, 4.472225189208984, 5.116200923919678, 5.760177135467529, 6.404153347015381, 7.048129558563232, 7.692105770111084, 8.336081504821777, 8.980057716369629, 9.62403392791748, 10.268010139465332, 10.911986351013184, 11.555962562561035, 12.199938774108887, 12.843914985656738, 13.48789119720459, 14.131867408752441, 14.775843620300293, 15.419818878173828, 16.06379508972168, 16.70777130126953, 17.351747512817383, 17.995723724365234, 18.639699935913086, 19.283676147460938, 19.92765235900879, 20.57162857055664, 21.215604782104492, 21.859580993652344]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 4.0, 10.0, 7.0, 9.0, 12.0, 15.0, 19.0, 18.0, 17.0, 24.0, 24.0, 25.0, 37.0, 37.0, 29.0, 36.0, 41.0, 38.0, 43.0, 37.0, 49.0, 48.0, 41.0, 30.0, 41.0, 42.0, 32.0, 34.0, 27.0, 29.0, 21.0, 17.0, 13.0, 17.0, 12.0, 12.0, 11.0, 11.0, 3.0, 6.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.52734375, -2.4481201171875, -2.368896484375, -2.2896728515625, -2.21044921875, -2.1312255859375, -2.052001953125, -1.9727783203125, -1.8935546875, -1.8143310546875, -1.735107421875, -1.6558837890625, -1.57666015625, -1.4974365234375, -1.418212890625, -1.3389892578125, -1.259765625, -1.1805419921875, -1.101318359375, -1.0220947265625, -0.94287109375, -0.8636474609375, -0.784423828125, -0.7052001953125, -0.6259765625, -0.5467529296875, -0.467529296875, -0.3883056640625, -0.30908203125, -0.2298583984375, -0.150634765625, -0.0714111328125, 0.0078125, 0.0870361328125, 0.166259765625, 0.2454833984375, 0.32470703125, 0.4039306640625, 0.483154296875, 0.5623779296875, 0.6416015625, 0.7208251953125, 0.800048828125, 0.8792724609375, 0.95849609375, 1.0377197265625, 1.116943359375, 1.1961669921875, 1.275390625, 1.3546142578125, 1.433837890625, 1.5130615234375, 1.59228515625, 1.6715087890625, 1.750732421875, 1.8299560546875, 1.9091796875, 1.9884033203125, 2.067626953125, 2.1468505859375, 2.22607421875, 2.3052978515625, 2.384521484375, 2.4637451171875, 2.54296875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 7.0, 0.0, 3.0, 6.0, 11.0, 21.0, 24.0, 41.0, 57.0, 88.0, 107.0, 162.0, 202.0, 353.0, 470.0, 734.0, 1048.0, 1551.0, 2156.0, 3194.0, 4771.0, 7029.0, 10483.0, 15759.0, 24475.0, 38780.0, 64419.0, 113587.0, 296862.0, 208680.0, 97159.0, 56496.0, 34607.0, 21584.0, 14302.0, 9379.0, 6228.0, 4340.0, 2991.0, 2029.0, 1359.0, 911.0, 634.0, 458.0, 335.0, 223.0, 150.0, 94.0, 66.0, 45.0, 30.0, 23.0, 19.0, 13.0, 5.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0], "bins": [-0.09991455078125, -0.09677982330322266, -0.09364509582519531, -0.09051036834716797, -0.08737564086914062, -0.08424091339111328, -0.08110618591308594, -0.0779714584350586, -0.07483673095703125, -0.0717020034790039, -0.06856727600097656, -0.06543254852294922, -0.062297821044921875, -0.05916309356689453, -0.05602836608886719, -0.052893638610839844, -0.0497589111328125, -0.046624183654785156, -0.04348945617675781, -0.04035472869873047, -0.037220001220703125, -0.03408527374267578, -0.030950546264648438, -0.027815818786621094, -0.02468109130859375, -0.021546363830566406, -0.018411636352539062, -0.015276908874511719, -0.012142181396484375, -0.009007453918457031, -0.0058727264404296875, -0.0027379989624023438, 0.000396728515625, 0.0035314559936523438, 0.0066661834716796875, 0.009800910949707031, 0.012935638427734375, 0.01607036590576172, 0.019205093383789062, 0.022339820861816406, 0.02547454833984375, 0.028609275817871094, 0.03174400329589844, 0.03487873077392578, 0.038013458251953125, 0.04114818572998047, 0.04428291320800781, 0.047417640686035156, 0.0505523681640625, 0.053687095642089844, 0.05682182312011719, 0.05995655059814453, 0.06309127807617188, 0.06622600555419922, 0.06936073303222656, 0.0724954605102539, 0.07563018798828125, 0.0787649154663086, 0.08189964294433594, 0.08503437042236328, 0.08816909790039062, 0.09130382537841797, 0.09443855285644531, 0.09757328033447266, 0.1007080078125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 5.0, 7.0, 11.0, 8.0, 7.0, 13.0, 18.0, 16.0, 25.0, 21.0, 19.0, 28.0, 29.0, 26.0, 33.0, 30.0, 31.0, 34.0, 22.0, 40.0, 39.0, 31.0, 1062.0, 33.0, 31.0, 27.0, 25.0, 35.0, 33.0, 33.0, 28.0, 34.0, 25.0, 16.0, 20.0, 23.0, 15.0, 17.0, 9.0, 3.0, 7.0, 4.0, 6.0, 5.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.59375, -1.5457000732421875, -1.497650146484375, -1.4496002197265625, -1.40155029296875, -1.3535003662109375, -1.305450439453125, -1.2574005126953125, -1.2093505859375, -1.1613006591796875, -1.113250732421875, -1.0652008056640625, -1.01715087890625, -0.9691009521484375, -0.921051025390625, -0.8730010986328125, -0.824951171875, -0.7769012451171875, -0.728851318359375, -0.6808013916015625, -0.63275146484375, -0.5847015380859375, -0.536651611328125, -0.4886016845703125, -0.4405517578125, -0.3925018310546875, -0.344451904296875, -0.2964019775390625, -0.24835205078125, -0.2003021240234375, -0.152252197265625, -0.1042022705078125, -0.05615234375, -0.0081024169921875, 0.039947509765625, 0.0879974365234375, 0.13604736328125, 0.1840972900390625, 0.232147216796875, 0.2801971435546875, 0.3282470703125, 0.3762969970703125, 0.424346923828125, 0.4723968505859375, 0.52044677734375, 0.5684967041015625, 0.616546630859375, 0.6645965576171875, 0.712646484375, 0.7606964111328125, 0.808746337890625, 0.8567962646484375, 0.90484619140625, 0.9528961181640625, 1.000946044921875, 1.0489959716796875, 1.0970458984375, 1.1450958251953125, 1.193145751953125, 1.2411956787109375, 1.28924560546875, 1.3372955322265625, 1.385345458984375, 1.4333953857421875, 1.4814453125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 9.0, 17.0, 19.0, 36.0, 50.0, 93.0, 90.0, 135.0, 202.0, 274.0, 382.0, 507.0, 690.0, 1000.0, 1371.0, 1775.0, 2535.0, 3539.0, 4763.0, 6620.0, 9456.0, 13451.0, 19368.0, 28519.0, 41963.0, 64137.0, 102609.0, 203636.0, 1275199.0, 106690.0, 66196.0, 43408.0, 29470.0, 20184.0, 13918.0, 9846.0, 6958.0, 5050.0, 3555.0, 2616.0, 1843.0, 1357.0, 995.0, 749.0, 560.0, 377.0, 277.0, 203.0, 153.0, 83.0, 78.0, 45.0, 29.0, 22.0, 14.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.043212890625, -0.041820526123046875, -0.04042816162109375, -0.039035797119140625, -0.0376434326171875, -0.036251068115234375, -0.03485870361328125, -0.033466339111328125, -0.032073974609375, -0.030681610107421875, -0.02928924560546875, -0.027896881103515625, -0.0265045166015625, -0.025112152099609375, -0.02371978759765625, -0.022327423095703125, -0.02093505859375, -0.019542694091796875, -0.01815032958984375, -0.016757965087890625, -0.0153656005859375, -0.013973236083984375, -0.01258087158203125, -0.011188507080078125, -0.009796142578125, -0.008403778076171875, -0.00701141357421875, -0.005619049072265625, -0.0042266845703125, -0.002834320068359375, -0.00144195556640625, -4.9591064453125e-05, 0.0013427734375, 0.002735137939453125, 0.00412750244140625, 0.005519866943359375, 0.0069122314453125, 0.008304595947265625, 0.00969696044921875, 0.011089324951171875, 0.012481689453125, 0.013874053955078125, 0.01526641845703125, 0.016658782958984375, 0.0180511474609375, 0.019443511962890625, 0.02083587646484375, 0.022228240966796875, 0.02362060546875, 0.025012969970703125, 0.02640533447265625, 0.027797698974609375, 0.0291900634765625, 0.030582427978515625, 0.03197479248046875, 0.033367156982421875, 0.034759521484375, 0.036151885986328125, 0.03754425048828125, 0.038936614990234375, 0.0403289794921875, 0.041721343994140625, 0.04311370849609375, 0.044506072998046875, 0.0458984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 0.0, 6.0, 5.0, 0.0, 8.0, 13.0, 0.0, 7.0, 13.0, 0.0, 14.0, 18.0, 0.0, 33.0, 42.0, 0.0, 58.0, 74.0, 0.0, 407.0, 96.0, 0.0, 70.0, 41.0, 0.0, 20.0, 21.0, 0.0, 8.0, 8.0, 0.0, 12.0, 9.0, 0.0, 6.0, 6.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 0.0, 4.0, 0.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4500692486763e-06, -1.4100223779678345e-06, -1.369975507259369e-06, -1.3299286365509033e-06, -1.2898817658424377e-06, -1.2498348951339722e-06, -1.2097880244255066e-06, -1.169741153717041e-06, -1.1296942830085754e-06, -1.0896474123001099e-06, -1.0496005415916443e-06, -1.0095536708831787e-06, -9.695068001747131e-07, -9.294599294662476e-07, -8.89413058757782e-07, -8.493661880493164e-07, -8.093193173408508e-07, -7.692724466323853e-07, -7.292255759239197e-07, -6.891787052154541e-07, -6.491318345069885e-07, -6.09084963798523e-07, -5.690380930900574e-07, -5.289912223815918e-07, -4.889443516731262e-07, -4.4889748096466064e-07, -4.0885061025619507e-07, -3.688037395477295e-07, -3.287568688392639e-07, -2.8870999813079834e-07, -2.4866312742233276e-07, -2.086162567138672e-07, -1.685693860054016e-07, -1.2852251529693604e-07, -8.847564458847046e-08, -4.842877388000488e-08, -8.381903171539307e-09, 3.166496753692627e-08, 7.171183824539185e-08, 1.1175870895385742e-07, 1.51805579662323e-07, 1.9185245037078857e-07, 2.3189932107925415e-07, 2.7194619178771973e-07, 3.119930624961853e-07, 3.520399332046509e-07, 3.9208680391311646e-07, 4.3213367462158203e-07, 4.721805453300476e-07, 5.122274160385132e-07, 5.522742867469788e-07, 5.923211574554443e-07, 6.323680281639099e-07, 6.724148988723755e-07, 7.124617695808411e-07, 7.525086402893066e-07, 7.925555109977722e-07, 8.326023817062378e-07, 8.726492524147034e-07, 9.126961231231689e-07, 9.527429938316345e-07, 9.927898645401e-07, 1.0328367352485657e-06, 1.0728836059570312e-06]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 1.0, 6.0, 5.0, 4.0, 4.0, 13.0, 25.0, 39.0, 67.0, 70.0, 134.0, 464.0, 9927.0, 899641.0, 134032.0, 3501.0, 280.0, 123.0, 65.0, 43.0, 26.0, 21.0, 12.0, 8.0, 11.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2590160369873047e-05, -2.1778978407382965e-05, -2.0967796444892883e-05, -2.01566144824028e-05, -1.934543251991272e-05, -1.8534250557422638e-05, -1.7723068594932556e-05, -1.6911886632442474e-05, -1.6100704669952393e-05, -1.528952270746231e-05, -1.4478340744972229e-05, -1.3667158782482147e-05, -1.2855976819992065e-05, -1.2044794857501984e-05, -1.1233612895011902e-05, -1.042243093252182e-05, -9.611248970031738e-06, -8.800067007541656e-06, -7.988885045051575e-06, -7.177703082561493e-06, -6.366521120071411e-06, -5.555339157581329e-06, -4.7441571950912476e-06, -3.932975232601166e-06, -3.121793270111084e-06, -2.310611307621002e-06, -1.4994293451309204e-06, -6.882473826408386e-07, 1.2293457984924316e-07, 9.34116542339325e-07, 1.7452985048294067e-06, 2.5564804673194885e-06, 3.3676624298095703e-06, 4.178844392299652e-06, 4.990026354789734e-06, 5.801208317279816e-06, 6.6123902797698975e-06, 7.423572242259979e-06, 8.234754204750061e-06, 9.045936167240143e-06, 9.857118129730225e-06, 1.0668300092220306e-05, 1.1479482054710388e-05, 1.229066401720047e-05, 1.3101845979690552e-05, 1.3913027942180634e-05, 1.4724209904670715e-05, 1.5535391867160797e-05, 1.634657382965088e-05, 1.715775579214096e-05, 1.7968937754631042e-05, 1.8780119717121124e-05, 1.9591301679611206e-05, 2.0402483642101288e-05, 2.121366560459137e-05, 2.202484756708145e-05, 2.2836029529571533e-05, 2.3647211492061615e-05, 2.4458393454551697e-05, 2.526957541704178e-05, 2.608075737953186e-05, 2.6891939342021942e-05, 2.7703121304512024e-05, 2.8514303267002106e-05, 2.9325485229492188e-05]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 13.0, 26.0, 48.0, 88.0, 607.0, 97.0, 58.0, 33.0, 25.0, 9.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.8092907794198254e-06, -1.7743664102454204e-06, -1.7394421547578531e-06, -1.7045177855834481e-06, -1.6695935300958809e-06, -1.6346691609214759e-06, -1.5997447917470708e-06, -1.5648205362595036e-06, -1.5298961670850986e-06, -1.4949717979106936e-06, -1.4600475424231263e-06, -1.4251231732487213e-06, -1.390198917761154e-06, -1.355274548586749e-06, -1.3203502930991817e-06, -1.2854259239247767e-06, -1.2505015547503717e-06, -1.2155771855759667e-06, -1.1806529300883994e-06, -1.1457285609139944e-06, -1.1108043054264272e-06, -1.0758799362520222e-06, -1.0409555670776172e-06, -1.0060313115900499e-06, -9.711070561024826e-07, -9.361827437714965e-07, -9.012584314405103e-07, -8.663340622661053e-07, -8.314097499351192e-07, -7.96485437604133e-07, -7.615611252731469e-07, -7.266368129421608e-07, -6.917125574545935e-07, -6.567882451236073e-07, -6.218639327926212e-07, -5.869395636182162e-07, -5.520152512872301e-07, -5.170909389562439e-07, -4.821666266252578e-07, -4.472422858725622e-07, -4.1231794511986664e-07, -3.773936327888805e-07, -3.424692920361849e-07, -3.075449797051988e-07, -2.726206389525032e-07, -2.3769632662151707e-07, -2.0277201429053093e-07, -1.6784767353783536e-07, -1.3292336120684922e-07, -9.799903466500837e-08, -6.307471522859487e-08, -2.815039579218137e-08, 6.773930749659485e-09, 4.169825729150034e-08, 7.662256962248648e-08, 1.1154691037518205e-07, 1.464712227061682e-07, 1.8139554924800905e-07, 2.163198757898499e-07, 2.5124418812083604e-07, 2.861685288735316e-07, 3.2109284120451775e-07, 3.560171535355039e-07, 3.9094149428819946e-07, 4.258658066191856e-07]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 56.0, 0.0, 0.0, 0.0, 0.0, 147.0, 0.0, 0.0, 0.0, 0.0, 539.0, 0.0, 0.0, 0.0, 155.0, 0.0, 0.0, 0.0, 0.0, 47.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 4.0, 10.0, 7.0, 9.0, 12.0, 15.0, 19.0, 18.0, 17.0, 24.0, 24.0, 25.0, 37.0, 37.0, 29.0, 36.0, 41.0, 38.0, 43.0, 37.0, 49.0, 48.0, 41.0, 30.0, 41.0, 42.0, 32.0, 34.0, 27.0, 29.0, 21.0, 17.0, 13.0, 17.0, 12.0, 12.0, 11.0, 11.0, 3.0, 6.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.52734375, -2.4481201171875, -2.368896484375, -2.2896728515625, -2.21044921875, -2.1312255859375, -2.052001953125, -1.9727783203125, -1.8935546875, -1.8143310546875, -1.735107421875, -1.6558837890625, -1.57666015625, -1.4974365234375, -1.418212890625, -1.3389892578125, -1.259765625, -1.1805419921875, -1.101318359375, -1.0220947265625, -0.94287109375, -0.8636474609375, -0.784423828125, -0.7052001953125, -0.6259765625, -0.5467529296875, -0.467529296875, -0.3883056640625, -0.30908203125, -0.2298583984375, -0.150634765625, -0.0714111328125, 0.0078125, 0.0870361328125, 0.166259765625, 0.2454833984375, 0.32470703125, 0.4039306640625, 0.483154296875, 0.5623779296875, 0.6416015625, 0.7208251953125, 0.800048828125, 0.8792724609375, 0.95849609375, 1.0377197265625, 1.116943359375, 1.1961669921875, 1.275390625, 1.3546142578125, 1.433837890625, 1.5130615234375, 1.59228515625, 1.6715087890625, 1.750732421875, 1.8299560546875, 1.9091796875, 1.9884033203125, 2.067626953125, 2.1468505859375, 2.22607421875, 2.3052978515625, 2.384521484375, 2.4637451171875, 2.54296875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 3.0, 10.0, 16.0, 33.0, 47.0, 82.0, 138.0, 224.0, 352.0, 651.0, 1088.0, 1836.0, 3035.0, 5169.0, 8514.0, 13632.0, 23054.0, 38508.0, 65543.0, 116250.0, 230909.0, 246919.0, 122996.0, 68780.0, 40215.0, 23873.0, 14776.0, 8855.0, 5193.0, 3132.0, 1861.0, 1179.0, 684.0, 375.0, 251.0, 131.0, 73.0, 53.0, 34.0, 33.0, 13.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.505859375, -2.41650390625, -2.3271484375, -2.23779296875, -2.1484375, -2.05908203125, -1.9697265625, -1.88037109375, -1.791015625, -1.70166015625, -1.6123046875, -1.52294921875, -1.43359375, -1.34423828125, -1.2548828125, -1.16552734375, -1.076171875, -0.98681640625, -0.8974609375, -0.80810546875, -0.71875, -0.62939453125, -0.5400390625, -0.45068359375, -0.361328125, -0.27197265625, -0.1826171875, -0.09326171875, -0.00390625, 0.08544921875, 0.1748046875, 0.26416015625, 0.353515625, 0.44287109375, 0.5322265625, 0.62158203125, 0.7109375, 0.80029296875, 0.8896484375, 0.97900390625, 1.068359375, 1.15771484375, 1.2470703125, 1.33642578125, 1.42578125, 1.51513671875, 1.6044921875, 1.69384765625, 1.783203125, 1.87255859375, 1.9619140625, 2.05126953125, 2.140625, 2.22998046875, 2.3193359375, 2.40869140625, 2.498046875, 2.58740234375, 2.6767578125, 2.76611328125, 2.85546875, 2.94482421875, 3.0341796875, 3.12353515625, 3.212890625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 8.0, 13.0, 11.0, 13.0, 9.0, 32.0, 16.0, 23.0, 31.0, 31.0, 36.0, 41.0, 58.0, 63.0, 92.0, 154.0, 278.0, 1394.0, 195.0, 115.0, 83.0, 67.0, 40.0, 38.0, 24.0, 31.0, 24.0, 23.0, 21.0, 16.0, 11.0, 13.0, 9.0, 3.0, 11.0, 1.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.679931640625, -8.38330078125, -8.086669921875, -7.7900390625, -7.493408203125, -7.19677734375, -6.900146484375, -6.603515625, -6.306884765625, -6.01025390625, -5.713623046875, -5.4169921875, -5.120361328125, -4.82373046875, -4.527099609375, -4.23046875, -3.933837890625, -3.63720703125, -3.340576171875, -3.0439453125, -2.747314453125, -2.45068359375, -2.154052734375, -1.857421875, -1.560791015625, -1.26416015625, -0.967529296875, -0.6708984375, -0.374267578125, -0.07763671875, 0.218994140625, 0.515625, 0.812255859375, 1.10888671875, 1.405517578125, 1.7021484375, 1.998779296875, 2.29541015625, 2.592041015625, 2.888671875, 3.185302734375, 3.48193359375, 3.778564453125, 4.0751953125, 4.371826171875, 4.66845703125, 4.965087890625, 5.26171875, 5.558349609375, 5.85498046875, 6.151611328125, 6.4482421875, 6.744873046875, 7.04150390625, 7.338134765625, 7.634765625, 7.931396484375, 8.22802734375, 8.524658203125, 8.8212890625, 9.117919921875, 9.41455078125, 9.711181640625, 10.0078125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 10.0, 9.0, 9.0, 12.0, 16.0, 14.0, 35.0, 30.0, 57.0, 69.0, 95.0, 132.0, 194.0, 389.0, 1014.0, 7393.0, 201694.0, 2805734.0, 121446.0, 5386.0, 888.0, 326.0, 205.0, 136.0, 102.0, 81.0, 60.0, 33.0, 38.0, 20.0, 19.0, 13.0, 11.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.109375, -20.513671875, -19.91796875, -19.322265625, -18.7265625, -18.130859375, -17.53515625, -16.939453125, -16.34375, -15.748046875, -15.15234375, -14.556640625, -13.9609375, -13.365234375, -12.76953125, -12.173828125, -11.578125, -10.982421875, -10.38671875, -9.791015625, -9.1953125, -8.599609375, -8.00390625, -7.408203125, -6.8125, -6.216796875, -5.62109375, -5.025390625, -4.4296875, -3.833984375, -3.23828125, -2.642578125, -2.046875, -1.451171875, -0.85546875, -0.259765625, 0.3359375, 0.931640625, 1.52734375, 2.123046875, 2.71875, 3.314453125, 3.91015625, 4.505859375, 5.1015625, 5.697265625, 6.29296875, 6.888671875, 7.484375, 8.080078125, 8.67578125, 9.271484375, 9.8671875, 10.462890625, 11.05859375, 11.654296875, 12.25, 12.845703125, 13.44140625, 14.037109375, 14.6328125, 15.228515625, 15.82421875, 16.419921875, 17.015625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 12.0, 52.0, 125.0, 225.0, 278.0, 195.0, 81.0, 35.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.813081741333008, -16.073143005371094, -14.333202362060547, -12.593262672424316, -10.853322982788086, -9.113383293151855, -7.373443603515625, -5.6335039138793945, -3.893564224243164, -2.1536245346069336, -0.4136848449707031, 1.3262548446655273, 3.066194534301758, 4.806134223937988, 6.546073913574219, 8.28601360321045, 10.02595329284668, 11.76589298248291, 13.50583267211914, 15.245772361755371, 16.9857120513916, 18.725650787353516, 20.465591430664062, 22.20553207397461, 23.945470809936523, 25.685409545898438, 27.425350189208984, 29.16529083251953, 30.905229568481445, 32.64516830444336, 34.385108947753906, 36.12504959106445, 37.864990234375, 39.60493087768555, 41.344871520996094, 43.084808349609375, 44.82474899291992, 46.56468963623047, 48.30462646484375, 50.0445671081543, 51.784507751464844, 53.52444839477539, 55.26438903808594, 57.00432586669922, 58.744266510009766, 60.48420715332031, 62.224143981933594, 63.96408462524414, 65.70402526855469, 67.44396209716797, 69.18390655517578, 70.92384338378906, 72.66378784179688, 74.40372467041016, 76.14366149902344, 77.88360595703125, 79.62354278564453, 81.36347961425781, 83.10342407226562, 84.8433609008789, 86.58329772949219, 88.3232421875, 90.06317901611328, 91.8031234741211, 93.54306030273438]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 12.0, 14.0, 13.0, 7.0, 13.0, 24.0, 17.0, 21.0, 37.0, 33.0, 46.0, 44.0, 48.0, 48.0, 46.0, 44.0, 52.0, 44.0, 53.0, 40.0, 47.0, 44.0, 40.0, 32.0, 35.0, 30.0, 30.0, 22.0, 16.0, 8.0, 9.0, 13.0, 6.0, 1.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.407669067382812, -28.35000991821289, -27.29235076904297, -26.23469352722168, -25.177034378051758, -24.119375228881836, -23.061717987060547, -22.004058837890625, -20.946399688720703, -19.88874053955078, -18.83108139038086, -17.77342414855957, -16.71576499938965, -15.658105850219727, -14.600447654724121, -13.542789459228516, -12.485130310058594, -11.427471160888672, -10.369812965393066, -9.312154769897461, -8.254495620727539, -7.196836948394775, -6.139178276062012, -5.081519603729248, -4.023860931396484, -2.9662022590637207, -1.908543586730957, -0.8508849143981934, 0.2067737579345703, 1.264432430267334, 2.3220911026000977, 3.3797497749328613, 4.437412261962891, 5.495070934295654, 6.552729606628418, 7.610388278961182, 8.668046951293945, 9.725706100463867, 10.783364295959473, 11.841022491455078, 12.898681640625, 13.956340789794922, 15.013998985290527, 16.071657180786133, 17.129316329956055, 18.186975479125977, 19.244632720947266, 20.302291870117188, 21.35995101928711, 22.41761016845703, 23.475269317626953, 24.532926559448242, 25.590585708618164, 26.648244857788086, 27.705902099609375, 28.763561248779297, 29.82122039794922, 30.87887954711914, 31.936538696289062, 32.994197845458984, 34.051856994628906, 35.10951232910156, 36.167171478271484, 37.224830627441406, 38.28248977661133]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 6.0, 7.0, 10.0, 11.0, 18.0, 23.0, 11.0, 14.0, 17.0, 16.0, 38.0, 37.0, 30.0, 40.0, 34.0, 51.0, 38.0, 43.0, 36.0, 44.0, 50.0, 38.0, 43.0, 36.0, 34.0, 45.0, 30.0, 28.0, 23.0, 20.0, 13.0, 23.0, 13.0, 17.0, 12.0, 7.0, 7.0, 10.0, 4.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.923828125, -2.8353271484375, -2.746826171875, -2.6583251953125, -2.56982421875, -2.4813232421875, -2.392822265625, -2.3043212890625, -2.2158203125, -2.1273193359375, -2.038818359375, -1.9503173828125, -1.86181640625, -1.7733154296875, -1.684814453125, -1.5963134765625, -1.5078125, -1.4193115234375, -1.330810546875, -1.2423095703125, -1.15380859375, -1.0653076171875, -0.976806640625, -0.8883056640625, -0.7998046875, -0.7113037109375, -0.622802734375, -0.5343017578125, -0.44580078125, -0.3572998046875, -0.268798828125, -0.1802978515625, -0.091796875, -0.0032958984375, 0.085205078125, 0.1737060546875, 0.26220703125, 0.3507080078125, 0.439208984375, 0.5277099609375, 0.6162109375, 0.7047119140625, 0.793212890625, 0.8817138671875, 0.97021484375, 1.0587158203125, 1.147216796875, 1.2357177734375, 1.32421875, 1.4127197265625, 1.501220703125, 1.5897216796875, 1.67822265625, 1.7667236328125, 1.855224609375, 1.9437255859375, 2.0322265625, 2.1207275390625, 2.209228515625, 2.2977294921875, 2.38623046875, 2.4747314453125, 2.563232421875, 2.6517333984375, 2.740234375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 8.0, 19.0, 13.0, 14.0, 32.0, 25.0, 26.0, 39.0, 76.0, 112.0, 250.0, 651.0, 2075.0, 8952.0, 50167.0, 359580.0, 2010171.0, 1494789.0, 225136.0, 32996.0, 6388.0, 1593.0, 571.0, 218.0, 108.0, 72.0, 41.0, 36.0, 20.0, 15.0, 15.0, 5.0, 9.0, 9.0, 5.0, 12.0, 3.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80859375, -6.588134765625, -6.36767578125, -6.147216796875, -5.9267578125, -5.706298828125, -5.48583984375, -5.265380859375, -5.044921875, -4.824462890625, -4.60400390625, -4.383544921875, -4.1630859375, -3.942626953125, -3.72216796875, -3.501708984375, -3.28125, -3.060791015625, -2.84033203125, -2.619873046875, -2.3994140625, -2.178955078125, -1.95849609375, -1.738037109375, -1.517578125, -1.297119140625, -1.07666015625, -0.856201171875, -0.6357421875, -0.415283203125, -0.19482421875, 0.025634765625, 0.24609375, 0.466552734375, 0.68701171875, 0.907470703125, 1.1279296875, 1.348388671875, 1.56884765625, 1.789306640625, 2.009765625, 2.230224609375, 2.45068359375, 2.671142578125, 2.8916015625, 3.112060546875, 3.33251953125, 3.552978515625, 3.7734375, 3.993896484375, 4.21435546875, 4.434814453125, 4.6552734375, 4.875732421875, 5.09619140625, 5.316650390625, 5.537109375, 5.757568359375, 5.97802734375, 6.198486328125, 6.4189453125, 6.639404296875, 6.85986328125, 7.080322265625, 7.30078125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 6.0, 11.0, 15.0, 16.0, 36.0, 44.0, 72.0, 70.0, 138.0, 184.0, 236.0, 305.0, 409.0, 439.0, 494.0, 421.0, 298.0, 242.0, 174.0, 119.0, 104.0, 62.0, 47.0, 47.0, 29.0, 16.0, 12.0, 9.0, 8.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.85516357421875, -4.6439208984375, -4.43267822265625, -4.221435546875, -4.01019287109375, -3.7989501953125, -3.58770751953125, -3.37646484375, -3.16522216796875, -2.9539794921875, -2.74273681640625, -2.531494140625, -2.32025146484375, -2.1090087890625, -1.89776611328125, -1.6865234375, -1.47528076171875, -1.2640380859375, -1.05279541015625, -0.841552734375, -0.63031005859375, -0.4190673828125, -0.20782470703125, 0.00341796875, 0.21466064453125, 0.4259033203125, 0.63714599609375, 0.848388671875, 1.05963134765625, 1.2708740234375, 1.48211669921875, 1.693359375, 1.90460205078125, 2.1158447265625, 2.32708740234375, 2.538330078125, 2.74957275390625, 2.9608154296875, 3.17205810546875, 3.38330078125, 3.59454345703125, 3.8057861328125, 4.01702880859375, 4.228271484375, 4.43951416015625, 4.6507568359375, 4.86199951171875, 5.0732421875, 5.28448486328125, 5.4957275390625, 5.70697021484375, 5.918212890625, 6.12945556640625, 6.3406982421875, 6.55194091796875, 6.76318359375, 6.97442626953125, 7.1856689453125, 7.39691162109375, 7.608154296875, 7.81939697265625, 8.0306396484375, 8.24188232421875, 8.453125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 9.0, 9.0, 25.0, 26.0, 50.0, 59.0, 82.0, 121.0, 193.0, 324.0, 642.0, 4233.0, 254229.0, 3727098.0, 201952.0, 3774.0, 637.0, 321.0, 182.0, 98.0, 73.0, 51.0, 33.0, 17.0, 15.0, 11.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.15625, -26.450439453125, -25.74462890625, -25.038818359375, -24.3330078125, -23.627197265625, -22.92138671875, -22.215576171875, -21.509765625, -20.803955078125, -20.09814453125, -19.392333984375, -18.6865234375, -17.980712890625, -17.27490234375, -16.569091796875, -15.86328125, -15.157470703125, -14.45166015625, -13.745849609375, -13.0400390625, -12.334228515625, -11.62841796875, -10.922607421875, -10.216796875, -9.510986328125, -8.80517578125, -8.099365234375, -7.3935546875, -6.687744140625, -5.98193359375, -5.276123046875, -4.5703125, -3.864501953125, -3.15869140625, -2.452880859375, -1.7470703125, -1.041259765625, -0.33544921875, 0.370361328125, 1.076171875, 1.781982421875, 2.48779296875, 3.193603515625, 3.8994140625, 4.605224609375, 5.31103515625, 6.016845703125, 6.72265625, 7.428466796875, 8.13427734375, 8.840087890625, 9.5458984375, 10.251708984375, 10.95751953125, 11.663330078125, 12.369140625, 13.074951171875, 13.78076171875, 14.486572265625, 15.1923828125, 15.898193359375, 16.60400390625, 17.309814453125, 18.015625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 14.0, 68.0, 147.0, 227.0, 275.0, 171.0, 80.0, 24.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.93401336669922, -86.46440887451172, -83.99480438232422, -81.52519989013672, -79.05558776855469, -76.58598327636719, -74.11637878417969, -71.64677429199219, -69.17716979980469, -66.70756530761719, -64.23796081542969, -61.76835250854492, -59.29874801635742, -56.82914352416992, -54.359535217285156, -51.889930725097656, -49.420326232910156, -46.950721740722656, -44.481117248535156, -42.01150894165039, -39.54190444946289, -37.07229995727539, -34.602691650390625, -32.133087158203125, -29.663482666015625, -27.193878173828125, -24.724271774291992, -22.25466537475586, -19.78506088256836, -17.31545639038086, -14.845849990844727, -12.376243591308594, -9.906646728515625, -7.437041282653809, -4.967435836791992, -2.497830390930176, -0.028224945068359375, 2.441380500793457, 4.910985946655273, 7.380592346191406, 9.850196838378906, 12.319802284240723, 14.789407730102539, 17.259014129638672, 19.728618621826172, 22.198223114013672, 24.667829513549805, 27.137435913085938, 29.607040405273438, 32.07664489746094, 34.54624938964844, 37.0158576965332, 39.4854621887207, 41.9550666809082, 44.42467498779297, 46.89427947998047, 49.36388397216797, 51.83348846435547, 54.30309295654297, 56.772701263427734, 59.242305755615234, 61.711910247802734, 64.1815185546875, 66.651123046875, 69.1207275390625]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 11.0, 5.0, 5.0, 6.0, 20.0, 17.0, 18.0, 13.0, 25.0, 36.0, 29.0, 29.0, 35.0, 27.0, 29.0, 38.0, 48.0, 29.0, 41.0, 37.0, 48.0, 37.0, 42.0, 41.0, 39.0, 36.0, 37.0, 37.0, 16.0, 29.0, 8.0, 22.0, 22.0, 14.0, 14.0, 12.0, 16.0, 8.0, 8.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-22.92513656616211, -22.26451301574707, -21.6038875579834, -20.94326400756836, -20.28264045715332, -19.62201499938965, -18.96139144897461, -18.300765991210938, -17.6401424407959, -16.97951889038086, -16.318893432617188, -15.658269882202148, -14.997645378112793, -14.337020874023438, -13.676397323608398, -13.015772819519043, -12.355149269104004, -11.694524765014648, -11.03390121459961, -10.373276710510254, -9.712652206420898, -9.05202865600586, -8.391404151916504, -7.730779647827148, -7.070155620574951, -6.409531593322754, -5.748907089233398, -5.088283061981201, -4.427659034729004, -3.7670345306396484, -3.106410503387451, -2.4457859992980957, -1.7851619720458984, -1.124537706375122, -0.46391355991363525, 0.19671058654785156, 0.8573348522186279, 1.5179591178894043, 2.1785831451416016, 2.839207649230957, 3.4998316764831543, 4.160455703735352, 4.821080207824707, 5.481704235076904, 6.142328262329102, 6.802952766418457, 7.463576793670654, 8.124200820922852, 8.784825325012207, 9.445449829101562, 10.106073379516602, 10.766697883605957, 11.427322387695312, 12.087945938110352, 12.748570442199707, 13.409194946289062, 14.069818496704102, 14.730443000793457, 15.391066551208496, 16.05169105529785, 16.71231460571289, 17.372940063476562, 18.0335636138916, 18.69418716430664, 19.354812622070312]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 11.0, 8.0, 4.0, 12.0, 9.0, 10.0, 9.0, 18.0, 22.0, 18.0, 28.0, 28.0, 38.0, 37.0, 30.0, 32.0, 35.0, 43.0, 46.0, 47.0, 45.0, 42.0, 32.0, 43.0, 48.0, 43.0, 32.0, 31.0, 22.0, 24.0, 13.0, 31.0, 9.0, 18.0, 19.0, 19.0, 7.0, 8.0, 8.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.87890625, -2.792877197265625, -2.70684814453125, -2.620819091796875, -2.5347900390625, -2.448760986328125, -2.36273193359375, -2.276702880859375, -2.190673828125, -2.104644775390625, -2.01861572265625, -1.932586669921875, -1.8465576171875, -1.760528564453125, -1.67449951171875, -1.588470458984375, -1.50244140625, -1.416412353515625, -1.33038330078125, -1.244354248046875, -1.1583251953125, -1.072296142578125, -0.98626708984375, -0.900238037109375, -0.814208984375, -0.728179931640625, -0.64215087890625, -0.556121826171875, -0.4700927734375, -0.384063720703125, -0.29803466796875, -0.212005615234375, -0.1259765625, -0.039947509765625, 0.04608154296875, 0.132110595703125, 0.2181396484375, 0.304168701171875, 0.39019775390625, 0.476226806640625, 0.562255859375, 0.648284912109375, 0.73431396484375, 0.820343017578125, 0.9063720703125, 0.992401123046875, 1.07843017578125, 1.164459228515625, 1.25048828125, 1.336517333984375, 1.42254638671875, 1.508575439453125, 1.5946044921875, 1.680633544921875, 1.76666259765625, 1.852691650390625, 1.938720703125, 2.024749755859375, 2.11077880859375, 2.196807861328125, 2.2828369140625, 2.368865966796875, 2.45489501953125, 2.540924072265625, 2.626953125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 5.0, 6.0, 6.0, 6.0, 21.0, 23.0, 46.0, 50.0, 71.0, 120.0, 166.0, 225.0, 360.0, 475.0, 709.0, 963.0, 1454.0, 2035.0, 2816.0, 3928.0, 5860.0, 8089.0, 11934.0, 17284.0, 26051.0, 39701.0, 64555.0, 115776.0, 296585.0, 193705.0, 93628.0, 55043.0, 34104.0, 22847.0, 15279.0, 10433.0, 7150.0, 4966.0, 3624.0, 2547.0, 1699.0, 1281.0, 904.0, 656.0, 408.0, 294.0, 215.0, 149.0, 114.0, 54.0, 58.0, 25.0, 20.0, 15.0, 12.0, 4.0, 6.0, 5.0, 5.0, 1.0], "bins": [-0.1070556640625, -0.10379505157470703, -0.10053443908691406, -0.0972738265991211, -0.09401321411132812, -0.09075260162353516, -0.08749198913574219, -0.08423137664794922, -0.08097076416015625, -0.07771015167236328, -0.07444953918457031, -0.07118892669677734, -0.06792831420898438, -0.0646677017211914, -0.06140708923339844, -0.05814647674560547, -0.0548858642578125, -0.05162525177001953, -0.04836463928222656, -0.045104026794433594, -0.041843414306640625, -0.038582801818847656, -0.03532218933105469, -0.03206157684326172, -0.02880096435546875, -0.02554035186767578, -0.022279739379882812, -0.019019126892089844, -0.015758514404296875, -0.012497901916503906, -0.009237289428710938, -0.005976676940917969, -0.002716064453125, 0.0005445480346679688, 0.0038051605224609375, 0.007065773010253906, 0.010326385498046875, 0.013586997985839844, 0.016847610473632812, 0.02010822296142578, 0.02336883544921875, 0.02662944793701172, 0.029890060424804688, 0.033150672912597656, 0.036411285400390625, 0.039671897888183594, 0.04293251037597656, 0.04619312286376953, 0.0494537353515625, 0.05271434783935547, 0.05597496032714844, 0.059235572814941406, 0.062496185302734375, 0.06575679779052734, 0.06901741027832031, 0.07227802276611328, 0.07553863525390625, 0.07879924774169922, 0.08205986022949219, 0.08532047271728516, 0.08858108520507812, 0.0918416976928711, 0.09510231018066406, 0.09836292266845703, 0.10162353515625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 6.0, 6.0, 6.0, 10.0, 6.0, 14.0, 13.0, 24.0, 23.0, 26.0, 23.0, 29.0, 37.0, 27.0, 36.0, 24.0, 35.0, 48.0, 43.0, 39.0, 1059.0, 32.0, 38.0, 31.0, 35.0, 27.0, 34.0, 21.0, 34.0, 34.0, 21.0, 33.0, 26.0, 25.0, 12.0, 10.0, 18.0, 9.0, 10.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.658203125, -1.60418701171875, -1.5501708984375, -1.49615478515625, -1.442138671875, -1.38812255859375, -1.3341064453125, -1.28009033203125, -1.22607421875, -1.17205810546875, -1.1180419921875, -1.06402587890625, -1.010009765625, -0.95599365234375, -0.9019775390625, -0.84796142578125, -0.7939453125, -0.73992919921875, -0.6859130859375, -0.63189697265625, -0.577880859375, -0.52386474609375, -0.4698486328125, -0.41583251953125, -0.36181640625, -0.30780029296875, -0.2537841796875, -0.19976806640625, -0.145751953125, -0.09173583984375, -0.0377197265625, 0.01629638671875, 0.0703125, 0.12432861328125, 0.1783447265625, 0.23236083984375, 0.286376953125, 0.34039306640625, 0.3944091796875, 0.44842529296875, 0.50244140625, 0.55645751953125, 0.6104736328125, 0.66448974609375, 0.718505859375, 0.77252197265625, 0.8265380859375, 0.88055419921875, 0.9345703125, 0.98858642578125, 1.0426025390625, 1.09661865234375, 1.150634765625, 1.20465087890625, 1.2586669921875, 1.31268310546875, 1.36669921875, 1.42071533203125, 1.4747314453125, 1.52874755859375, 1.582763671875, 1.63677978515625, 1.6907958984375, 1.74481201171875, 1.798828125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 17.0, 27.0, 38.0, 63.0, 78.0, 117.0, 179.0, 249.0, 353.0, 509.0, 721.0, 977.0, 1345.0, 1956.0, 2816.0, 4213.0, 5916.0, 8628.0, 12929.0, 19168.0, 28353.0, 42380.0, 66980.0, 113855.0, 1300745.0, 200822.0, 102220.0, 60510.0, 39323.0, 26096.0, 17580.0, 11866.0, 7999.0, 5475.0, 3807.0, 2656.0, 1789.0, 1318.0, 919.0, 597.0, 461.0, 300.0, 223.0, 156.0, 112.0, 95.0, 52.0, 53.0, 28.0, 21.0, 15.0, 7.0, 8.0, 2.0, 1.0, 2.0], "bins": [-0.05181884765625, -0.05024385452270508, -0.048668861389160156, -0.047093868255615234, -0.04551887512207031, -0.04394388198852539, -0.04236888885498047, -0.04079389572143555, -0.039218902587890625, -0.0376439094543457, -0.03606891632080078, -0.03449392318725586, -0.03291893005371094, -0.031343936920166016, -0.029768943786621094, -0.028193950653076172, -0.02661895751953125, -0.025043964385986328, -0.023468971252441406, -0.021893978118896484, -0.020318984985351562, -0.01874399185180664, -0.01716899871826172, -0.015594005584716797, -0.014019012451171875, -0.012444019317626953, -0.010869026184082031, -0.00929403305053711, -0.0077190399169921875, -0.006144046783447266, -0.004569053649902344, -0.002994060516357422, -0.0014190673828125, 0.00015592575073242188, 0.0017309188842773438, 0.0033059120178222656, 0.0048809051513671875, 0.006455898284912109, 0.008030891418457031, 0.009605884552001953, 0.011180877685546875, 0.012755870819091797, 0.014330863952636719, 0.01590585708618164, 0.017480850219726562, 0.019055843353271484, 0.020630836486816406, 0.022205829620361328, 0.02378082275390625, 0.025355815887451172, 0.026930809020996094, 0.028505802154541016, 0.030080795288085938, 0.03165578842163086, 0.03323078155517578, 0.0348057746887207, 0.036380767822265625, 0.03795576095581055, 0.03953075408935547, 0.04110574722290039, 0.04268074035644531, 0.044255733489990234, 0.045830726623535156, 0.04740571975708008, 0.048980712890625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 0.0, 5.0, 8.0, 7.0, 5.0, 5.0, 6.0, 13.0, 15.0, 13.0, 0.0, 22.0, 43.0, 62.0, 116.0, 353.0, 107.0, 67.0, 39.0, 15.0, 23.0, 0.0, 10.0, 9.0, 10.0, 14.0, 3.0, 2.0, 3.0, 1.0, 5.0, 3.0, 0.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.912936568260193e-06, -1.8589198589324951e-06, -1.8049031496047974e-06, -1.7508864402770996e-06, -1.6968697309494019e-06, -1.642853021621704e-06, -1.5888363122940063e-06, -1.5348196029663086e-06, -1.4808028936386108e-06, -1.426786184310913e-06, -1.3727694749832153e-06, -1.3187527656555176e-06, -1.2647360563278198e-06, -1.210719347000122e-06, -1.1567026376724243e-06, -1.1026859283447266e-06, -1.0486692190170288e-06, -9.94652509689331e-07, -9.406358003616333e-07, -8.866190910339355e-07, -8.326023817062378e-07, -7.7858567237854e-07, -7.245689630508423e-07, -6.705522537231445e-07, -6.165355443954468e-07, -5.62518835067749e-07, -5.085021257400513e-07, -4.544854164123535e-07, -4.0046870708465576e-07, -3.46451997756958e-07, -2.9243528842926025e-07, -2.384185791015625e-07, -1.8440186977386475e-07, -1.30385160446167e-07, -7.636845111846924e-08, -2.2351741790771484e-08, 3.166496753692627e-08, 8.568167686462402e-08, 1.3969838619232178e-07, 1.9371509552001953e-07, 2.477318048477173e-07, 3.0174851417541504e-07, 3.557652235031128e-07, 4.0978193283081055e-07, 4.637986421585083e-07, 5.178153514862061e-07, 5.718320608139038e-07, 6.258487701416016e-07, 6.798654794692993e-07, 7.338821887969971e-07, 7.878988981246948e-07, 8.419156074523926e-07, 8.959323167800903e-07, 9.499490261077881e-07, 1.0039657354354858e-06, 1.0579824447631836e-06, 1.1119991540908813e-06, 1.166015863418579e-06, 1.2200325727462769e-06, 1.2740492820739746e-06, 1.3280659914016724e-06, 1.3820827007293701e-06, 1.4360994100570679e-06, 1.4901161193847656e-06]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 6.0, 4.0, 6.0, 7.0, 16.0, 29.0, 49.0, 74.0, 177.0, 470.0, 23198.0, 1000592.0, 23045.0, 505.0, 137.0, 90.0, 48.0, 23.0, 8.0, 9.0, 4.0, 8.0, 5.0, 4.0, 4.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.147125244140625e-05, -3.0326656997203827e-05, -2.9182061553001404e-05, -2.803746610879898e-05, -2.6892870664596558e-05, -2.5748275220394135e-05, -2.460367977619171e-05, -2.345908433198929e-05, -2.2314488887786865e-05, -2.1169893443584442e-05, -2.002529799938202e-05, -1.8880702555179596e-05, -1.7736107110977173e-05, -1.659151166677475e-05, -1.5446916222572327e-05, -1.4302320778369904e-05, -1.315772533416748e-05, -1.2013129889965057e-05, -1.0868534445762634e-05, -9.723939001560211e-06, -8.579343557357788e-06, -7.434748113155365e-06, -6.290152668952942e-06, -5.145557224750519e-06, -4.000961780548096e-06, -2.8563663363456726e-06, -1.7117708921432495e-06, -5.671754479408264e-07, 5.774199962615967e-07, 1.7220154404640198e-06, 2.866610884666443e-06, 4.011206328868866e-06, 5.155801773071289e-06, 6.300397217273712e-06, 7.444992661476135e-06, 8.589588105678558e-06, 9.734183549880981e-06, 1.0878778994083405e-05, 1.2023374438285828e-05, 1.316796988248825e-05, 1.4312565326690674e-05, 1.5457160770893097e-05, 1.660175621509552e-05, 1.7746351659297943e-05, 1.8890947103500366e-05, 2.003554254770279e-05, 2.1180137991905212e-05, 2.2324733436107635e-05, 2.346932888031006e-05, 2.461392432451248e-05, 2.5758519768714905e-05, 2.6903115212917328e-05, 2.804771065711975e-05, 2.9192306101322174e-05, 3.0336901545524597e-05, 3.148149698972702e-05, 3.262609243392944e-05, 3.3770687878131866e-05, 3.491528332233429e-05, 3.605987876653671e-05, 3.7204474210739136e-05, 3.834906965494156e-05, 3.949366509914398e-05, 4.0638260543346405e-05, 4.178285598754883e-05]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 15.0, 36.0, 70.0, 103.0, 413.0, 153.0, 114.0, 47.0, 18.0, 16.0, 9.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2349764801911078e-06, -1.1975039342360105e-06, -1.1600313882809132e-06, -1.122558842325816e-06, -1.0850864100575563e-06, -1.047613864102459e-06, -1.0101413181473617e-06, -9.726687721922644e-07, -9.351962262371671e-07, -8.977236802820698e-07, -8.602511911703914e-07, -8.227786452152941e-07, -7.853060992601968e-07, -7.478336101485183e-07, -7.10361064193421e-07, -6.728885182383237e-07, -6.354160291266453e-07, -5.97943483171548e-07, -5.604709940598696e-07, -5.229984481047723e-07, -4.85525902149675e-07, -4.480533846162871e-07, -4.105808670828992e-07, -3.731083211278019e-07, -3.3563580359441403e-07, -2.9816328606102616e-07, -2.6069074010592885e-07, -2.2321822257254098e-07, -1.857456908282984e-07, -1.482731590840558e-07, -1.1080064155066793e-07, -7.332809559557063e-08, -3.585557806218276e-08, 1.6169501293461508e-09, 3.908947832087506e-08, 7.656200295969029e-08, 1.1403453470393288e-07, 1.5150706644817546e-07, 1.8897958398156334e-07, 2.2645212993666064e-07, 2.639246474700485e-07, 3.013971650034364e-07, 3.388697109585337e-07, 3.7634222849192156e-07, 4.1381474602530943e-07, 4.5128729198040674e-07, 4.88759837935504e-07, 5.262323838906013e-07, 5.637048730022798e-07, 6.011774189573771e-07, 6.386499080690555e-07, 6.761224540241528e-07, 7.135949999792501e-07, 7.510675459343474e-07, 7.885400350460259e-07, 8.260125810011232e-07, 8.634850701128016e-07, 9.009576160678989e-07, 9.384301051795774e-07, 9.759025942912558e-07, 1.0133751402463531e-06, 1.0508476862014504e-06, 1.0883202321565477e-06, 1.125792778111645e-06, 1.1632653240667423e-06]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 28.0, 0.0, 0.0, 0.0, 0.0, 66.0, 0.0, 0.0, 0.0, 210.0, 0.0, 0.0, 0.0, 0.0, 392.0, 0.0, 0.0, 0.0, 0.0, 183.0, 0.0, 0.0, 0.0, 79.0, 0.0, 0.0, 0.0, 0.0, 28.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4458935260772705e-07, -3.3155083656311035e-07, -3.1851232051849365e-07, -3.0547380447387695e-07, -2.9243528842926025e-07, -2.7939677238464355e-07, -2.6635825634002686e-07, -2.5331974029541016e-07, -2.4028122425079346e-07, -2.2724270820617676e-07, -2.1420419216156006e-07, -2.0116567611694336e-07, -1.8812716007232666e-07, -1.7508864402770996e-07, -1.6205012798309326e-07, -1.4901161193847656e-07, -1.3597309589385986e-07, -1.2293457984924316e-07, -1.0989606380462646e-07, -9.685754776000977e-08, -8.381903171539307e-08, -7.078051567077637e-08, -5.774199962615967e-08, -4.470348358154297e-08, -3.166496753692627e-08, -1.862645149230957e-08, -5.587935447692871e-09, 7.450580596923828e-09, 2.0489096641540527e-08, 3.3527612686157227e-08, 4.6566128730773926e-08, 5.960464477539063e-08, 7.264316082000732e-08, 8.568167686462402e-08, 9.872019290924072e-08, 1.1175870895385742e-07, 1.2479722499847412e-07, 1.3783574104309082e-07, 1.5087425708770752e-07, 1.6391277313232422e-07, 1.7695128917694092e-07, 1.8998980522155762e-07, 2.0302832126617432e-07, 2.1606683731079102e-07, 2.2910535335540771e-07, 2.421438694000244e-07, 2.551823854446411e-07, 2.682209014892578e-07, 2.812594175338745e-07, 2.942979335784912e-07, 3.073364496231079e-07, 3.203749656677246e-07, 3.334134817123413e-07, 3.46451997756958e-07, 3.594905138015747e-07, 3.725290298461914e-07, 3.855675458908081e-07, 3.986060619354248e-07, 4.116445779800415e-07, 4.246830940246582e-07, 4.377216100692749e-07, 4.507601261138916e-07, 4.637986421585083e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 11.0, 8.0, 4.0, 12.0, 9.0, 10.0, 9.0, 18.0, 22.0, 18.0, 28.0, 28.0, 38.0, 37.0, 30.0, 32.0, 35.0, 43.0, 46.0, 47.0, 45.0, 42.0, 32.0, 43.0, 48.0, 43.0, 32.0, 31.0, 22.0, 24.0, 13.0, 31.0, 9.0, 18.0, 19.0, 19.0, 7.0, 8.0, 8.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.87890625, -2.792877197265625, -2.70684814453125, -2.620819091796875, -2.5347900390625, -2.448760986328125, -2.36273193359375, -2.276702880859375, -2.190673828125, -2.104644775390625, -2.01861572265625, -1.932586669921875, -1.8465576171875, -1.760528564453125, -1.67449951171875, -1.588470458984375, -1.50244140625, -1.416412353515625, -1.33038330078125, -1.244354248046875, -1.1583251953125, -1.072296142578125, -0.98626708984375, -0.900238037109375, -0.814208984375, -0.728179931640625, -0.64215087890625, -0.556121826171875, -0.4700927734375, -0.384063720703125, -0.29803466796875, -0.212005615234375, -0.1259765625, -0.039947509765625, 0.04608154296875, 0.132110595703125, 0.2181396484375, 0.304168701171875, 0.39019775390625, 0.476226806640625, 0.562255859375, 0.648284912109375, 0.73431396484375, 0.820343017578125, 0.9063720703125, 0.992401123046875, 1.07843017578125, 1.164459228515625, 1.25048828125, 1.336517333984375, 1.42254638671875, 1.508575439453125, 1.5946044921875, 1.680633544921875, 1.76666259765625, 1.852691650390625, 1.938720703125, 2.024749755859375, 2.11077880859375, 2.196807861328125, 2.2828369140625, 2.368865966796875, 2.45489501953125, 2.540924072265625, 2.626953125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 7.0, 12.0, 17.0, 31.0, 43.0, 66.0, 108.0, 180.0, 287.0, 496.0, 879.0, 1389.0, 2297.0, 3850.0, 6529.0, 11177.0, 19051.0, 32704.0, 54841.0, 89988.0, 158137.0, 278440.0, 160794.0, 91846.0, 55448.0, 33136.0, 19273.0, 11353.0, 6640.0, 3856.0, 2263.0, 1327.0, 810.0, 508.0, 326.0, 167.0, 104.0, 83.0, 41.0, 17.0, 12.0, 14.0, 8.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94140625, -2.845001220703125, -2.74859619140625, -2.652191162109375, -2.5557861328125, -2.459381103515625, -2.36297607421875, -2.266571044921875, -2.170166015625, -2.073760986328125, -1.97735595703125, -1.880950927734375, -1.7845458984375, -1.688140869140625, -1.59173583984375, -1.495330810546875, -1.39892578125, -1.302520751953125, -1.20611572265625, -1.109710693359375, -1.0133056640625, -0.916900634765625, -0.82049560546875, -0.724090576171875, -0.627685546875, -0.531280517578125, -0.43487548828125, -0.338470458984375, -0.2420654296875, -0.145660400390625, -0.04925537109375, 0.047149658203125, 0.1435546875, 0.239959716796875, 0.33636474609375, 0.432769775390625, 0.5291748046875, 0.625579833984375, 0.72198486328125, 0.818389892578125, 0.914794921875, 1.011199951171875, 1.10760498046875, 1.204010009765625, 1.3004150390625, 1.396820068359375, 1.49322509765625, 1.589630126953125, 1.68603515625, 1.782440185546875, 1.87884521484375, 1.975250244140625, 2.0716552734375, 2.168060302734375, 2.26446533203125, 2.360870361328125, 2.457275390625, 2.553680419921875, 2.65008544921875, 2.746490478515625, 2.8428955078125, 2.939300537109375, 3.03570556640625, 3.132110595703125, 3.228515625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 14.0, 5.0, 13.0, 12.0, 16.0, 21.0, 16.0, 29.0, 27.0, 28.0, 30.0, 27.0, 43.0, 46.0, 66.0, 76.0, 120.0, 155.0, 1363.0, 259.0, 153.0, 91.0, 64.0, 45.0, 38.0, 41.0, 36.0, 31.0, 26.0, 19.0, 26.0, 11.0, 16.0, 8.0, 15.0, 9.0, 11.0, 3.0, 5.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 5.0], "bins": [-9.59375, -9.32568359375, -9.0576171875, -8.78955078125, -8.521484375, -8.25341796875, -7.9853515625, -7.71728515625, -7.44921875, -7.18115234375, -6.9130859375, -6.64501953125, -6.376953125, -6.10888671875, -5.8408203125, -5.57275390625, -5.3046875, -5.03662109375, -4.7685546875, -4.50048828125, -4.232421875, -3.96435546875, -3.6962890625, -3.42822265625, -3.16015625, -2.89208984375, -2.6240234375, -2.35595703125, -2.087890625, -1.81982421875, -1.5517578125, -1.28369140625, -1.015625, -0.74755859375, -0.4794921875, -0.21142578125, 0.056640625, 0.32470703125, 0.5927734375, 0.86083984375, 1.12890625, 1.39697265625, 1.6650390625, 1.93310546875, 2.201171875, 2.46923828125, 2.7373046875, 3.00537109375, 3.2734375, 3.54150390625, 3.8095703125, 4.07763671875, 4.345703125, 4.61376953125, 4.8818359375, 5.14990234375, 5.41796875, 5.68603515625, 5.9541015625, 6.22216796875, 6.490234375, 6.75830078125, 7.0263671875, 7.29443359375, 7.5625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 16.0, 17.0, 21.0, 33.0, 28.0, 51.0, 69.0, 73.0, 100.0, 120.0, 175.0, 242.0, 329.0, 782.0, 4538.0, 77112.0, 2629836.0, 415981.0, 13172.0, 1490.0, 447.0, 255.0, 197.0, 145.0, 123.0, 86.0, 62.0, 42.0, 44.0, 34.0, 19.0, 23.0, 8.0, 6.0, 6.0, 3.0, 7.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.359375, -16.794189453125, -16.22900390625, -15.663818359375, -15.0986328125, -14.533447265625, -13.96826171875, -13.403076171875, -12.837890625, -12.272705078125, -11.70751953125, -11.142333984375, -10.5771484375, -10.011962890625, -9.44677734375, -8.881591796875, -8.31640625, -7.751220703125, -7.18603515625, -6.620849609375, -6.0556640625, -5.490478515625, -4.92529296875, -4.360107421875, -3.794921875, -3.229736328125, -2.66455078125, -2.099365234375, -1.5341796875, -0.968994140625, -0.40380859375, 0.161376953125, 0.7265625, 1.291748046875, 1.85693359375, 2.422119140625, 2.9873046875, 3.552490234375, 4.11767578125, 4.682861328125, 5.248046875, 5.813232421875, 6.37841796875, 6.943603515625, 7.5087890625, 8.073974609375, 8.63916015625, 9.204345703125, 9.76953125, 10.334716796875, 10.89990234375, 11.465087890625, 12.0302734375, 12.595458984375, 13.16064453125, 13.725830078125, 14.291015625, 14.856201171875, 15.42138671875, 15.986572265625, 16.5517578125, 17.116943359375, 17.68212890625, 18.247314453125, 18.8125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 9.0, 47.0, 137.0, 250.0, 263.0, 180.0, 89.0, 30.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.159503936767578, -10.49328899383545, -8.82707405090332, -7.160858154296875, -5.494643211364746, -3.828428268432617, -2.162212371826172, -0.49599742889404297, 1.170217514038086, 2.836432695388794, 4.502647876739502, 6.168863296508789, 7.835078239440918, 9.501293182373047, 11.167509078979492, 12.833724021911621, 14.49993896484375, 16.166154861450195, 17.832368850708008, 19.498584747314453, 21.164798736572266, 22.83101463317871, 24.497230529785156, 26.16344451904297, 27.829660415649414, 29.49587631225586, 31.162090301513672, 32.82830810546875, 34.49452209472656, 36.160736083984375, 37.82695007324219, 39.493167877197266, 41.159385681152344, 42.825599670410156, 44.491817474365234, 46.15803146362305, 47.82424545288086, 49.49046325683594, 51.15667724609375, 52.82289123535156, 54.489105224609375, 56.15531921386719, 57.821537017822266, 59.48775100708008, 61.15396499633789, 62.82018280029297, 64.48639678955078, 66.1526107788086, 67.81883239746094, 69.48504638671875, 71.15126037597656, 72.81747436523438, 74.48369598388672, 76.14990997314453, 77.81612396240234, 79.48233795166016, 81.14855194091797, 82.81476593017578, 84.4809799194336, 86.14720153808594, 87.81341552734375, 89.47962951660156, 91.14584350585938, 92.81205749511719, 94.478271484375]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 7.0, 8.0, 8.0, 12.0, 13.0, 18.0, 8.0, 26.0, 24.0, 27.0, 28.0, 34.0, 36.0, 37.0, 32.0, 49.0, 49.0, 58.0, 40.0, 40.0, 46.0, 44.0, 37.0, 26.0, 38.0, 32.0, 26.0, 25.0, 26.0, 10.0, 27.0, 19.0, 12.0, 16.0, 14.0, 9.0, 7.0, 1.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-26.554752349853516, -25.73130226135254, -24.907854080200195, -24.08440399169922, -23.260953903198242, -22.437503814697266, -21.614055633544922, -20.790605545043945, -19.96715545654297, -19.143705368041992, -18.32025718688965, -17.496807098388672, -16.673357009887695, -15.849907875061035, -15.026458740234375, -14.203008651733398, -13.379559516906738, -12.556110382080078, -11.732660293579102, -10.909211158752441, -10.085761070251465, -9.262311935424805, -8.438861846923828, -7.615412712097168, -6.79196310043335, -5.968513488769531, -5.145063877105713, -4.3216142654418945, -3.4981648921966553, -2.674715518951416, -1.8512659072875977, -1.0278162956237793, -0.20436668395996094, 0.6190828680992126, 1.4425324201583862, 2.265981912612915, 3.0894315242767334, 3.9128808975219727, 4.736330509185791, 5.559780120849609, 6.383229732513428, 7.206679344177246, 8.030128479003906, 8.853578567504883, 9.677027702331543, 10.500476837158203, 11.32392692565918, 12.147377014160156, 12.970826148986816, 13.794275283813477, 14.617725372314453, 15.441174507141113, 16.264623641967773, 17.08807373046875, 17.911523818969727, 18.734973907470703, 19.558422088623047, 20.381872177124023, 21.205320358276367, 22.028770446777344, 22.85222053527832, 23.675670623779297, 24.49911880493164, 25.322568893432617, 26.146018981933594]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 11.0, 8.0, 15.0, 9.0, 14.0, 9.0, 16.0, 21.0, 31.0, 27.0, 30.0, 25.0, 39.0, 23.0, 50.0, 49.0, 41.0, 39.0, 36.0, 45.0, 40.0, 55.0, 35.0, 42.0, 32.0, 24.0, 29.0, 32.0, 26.0, 15.0, 17.0, 13.0, 25.0, 14.0, 8.0, 14.0, 8.0, 7.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0703125, -2.97705078125, -2.8837890625, -2.79052734375, -2.697265625, -2.60400390625, -2.5107421875, -2.41748046875, -2.32421875, -2.23095703125, -2.1376953125, -2.04443359375, -1.951171875, -1.85791015625, -1.7646484375, -1.67138671875, -1.578125, -1.48486328125, -1.3916015625, -1.29833984375, -1.205078125, -1.11181640625, -1.0185546875, -0.92529296875, -0.83203125, -0.73876953125, -0.6455078125, -0.55224609375, -0.458984375, -0.36572265625, -0.2724609375, -0.17919921875, -0.0859375, 0.00732421875, 0.1005859375, 0.19384765625, 0.287109375, 0.38037109375, 0.4736328125, 0.56689453125, 0.66015625, 0.75341796875, 0.8466796875, 0.93994140625, 1.033203125, 1.12646484375, 1.2197265625, 1.31298828125, 1.40625, 1.49951171875, 1.5927734375, 1.68603515625, 1.779296875, 1.87255859375, 1.9658203125, 2.05908203125, 2.15234375, 2.24560546875, 2.3388671875, 2.43212890625, 2.525390625, 2.61865234375, 2.7119140625, 2.80517578125, 2.8984375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 3.0, 8.0, 8.0, 14.0, 14.0, 29.0, 27.0, 35.0, 69.0, 111.0, 197.0, 409.0, 772.0, 1686.0, 4020.0, 11029.0, 31872.0, 100163.0, 325676.0, 978535.0, 1598475.0, 776152.0, 247982.0, 76750.0, 25023.0, 8715.0, 3480.0, 1424.0, 724.0, 355.0, 184.0, 118.0, 77.0, 35.0, 33.0, 25.0, 16.0, 13.0, 6.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.96331787109375, -3.8328857421875, -3.70245361328125, -3.572021484375, -3.44158935546875, -3.3111572265625, -3.18072509765625, -3.05029296875, -2.91986083984375, -2.7894287109375, -2.65899658203125, -2.528564453125, -2.39813232421875, -2.2677001953125, -2.13726806640625, -2.0068359375, -1.87640380859375, -1.7459716796875, -1.61553955078125, -1.485107421875, -1.35467529296875, -1.2242431640625, -1.09381103515625, -0.96337890625, -0.83294677734375, -0.7025146484375, -0.57208251953125, -0.441650390625, -0.31121826171875, -0.1807861328125, -0.05035400390625, 0.080078125, 0.21051025390625, 0.3409423828125, 0.47137451171875, 0.601806640625, 0.73223876953125, 0.8626708984375, 0.99310302734375, 1.12353515625, 1.25396728515625, 1.3843994140625, 1.51483154296875, 1.645263671875, 1.77569580078125, 1.9061279296875, 2.03656005859375, 2.1669921875, 2.29742431640625, 2.4278564453125, 2.55828857421875, 2.688720703125, 2.81915283203125, 2.9495849609375, 3.08001708984375, 3.21044921875, 3.34088134765625, 3.4713134765625, 3.60174560546875, 3.732177734375, 3.86260986328125, 3.9930419921875, 4.12347412109375, 4.25390625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 4.0, 8.0, 6.0, 10.0, 13.0, 13.0, 18.0, 36.0, 41.0, 64.0, 108.0, 117.0, 136.0, 192.0, 250.0, 303.0, 405.0, 398.0, 395.0, 368.0, 302.0, 231.0, 153.0, 119.0, 89.0, 79.0, 66.0, 44.0, 38.0, 25.0, 10.0, 14.0, 4.0, 9.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.90234375, -5.7318115234375, -5.561279296875, -5.3907470703125, -5.22021484375, -5.0496826171875, -4.879150390625, -4.7086181640625, -4.5380859375, -4.3675537109375, -4.197021484375, -4.0264892578125, -3.85595703125, -3.6854248046875, -3.514892578125, -3.3443603515625, -3.173828125, -3.0032958984375, -2.832763671875, -2.6622314453125, -2.49169921875, -2.3211669921875, -2.150634765625, -1.9801025390625, -1.8095703125, -1.6390380859375, -1.468505859375, -1.2979736328125, -1.12744140625, -0.9569091796875, -0.786376953125, -0.6158447265625, -0.4453125, -0.2747802734375, -0.104248046875, 0.0662841796875, 0.23681640625, 0.4073486328125, 0.577880859375, 0.7484130859375, 0.9189453125, 1.0894775390625, 1.260009765625, 1.4305419921875, 1.60107421875, 1.7716064453125, 1.942138671875, 2.1126708984375, 2.283203125, 2.4537353515625, 2.624267578125, 2.7947998046875, 2.96533203125, 3.1358642578125, 3.306396484375, 3.4769287109375, 3.6474609375, 3.8179931640625, 3.988525390625, 4.1590576171875, 4.32958984375, 4.5001220703125, 4.670654296875, 4.8411865234375, 5.01171875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 9.0, 5.0, 6.0, 12.0, 21.0, 26.0, 32.0, 61.0, 68.0, 116.0, 140.0, 181.0, 288.0, 534.0, 2111.0, 38822.0, 1345474.0, 2700141.0, 100544.0, 4095.0, 637.0, 290.0, 221.0, 137.0, 104.0, 56.0, 53.0, 28.0, 24.0, 15.0, 9.0, 9.0, 6.0, 9.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.65625, -15.118896484375, -14.58154296875, -14.044189453125, -13.5068359375, -12.969482421875, -12.43212890625, -11.894775390625, -11.357421875, -10.820068359375, -10.28271484375, -9.745361328125, -9.2080078125, -8.670654296875, -8.13330078125, -7.595947265625, -7.05859375, -6.521240234375, -5.98388671875, -5.446533203125, -4.9091796875, -4.371826171875, -3.83447265625, -3.297119140625, -2.759765625, -2.222412109375, -1.68505859375, -1.147705078125, -0.6103515625, -0.072998046875, 0.46435546875, 1.001708984375, 1.5390625, 2.076416015625, 2.61376953125, 3.151123046875, 3.6884765625, 4.225830078125, 4.76318359375, 5.300537109375, 5.837890625, 6.375244140625, 6.91259765625, 7.449951171875, 7.9873046875, 8.524658203125, 9.06201171875, 9.599365234375, 10.13671875, 10.674072265625, 11.21142578125, 11.748779296875, 12.2861328125, 12.823486328125, 13.36083984375, 13.898193359375, 14.435546875, 14.972900390625, 15.51025390625, 16.047607421875, 16.5849609375, 17.122314453125, 17.65966796875, 18.197021484375, 18.734375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 9.0, 8.0, 19.0, 29.0, 37.0, 47.0, 73.0, 95.0, 106.0, 106.0, 127.0, 109.0, 65.0, 64.0, 49.0, 31.0, 19.0, 13.0, 4.0, 6.0, 1.0], "bins": [-53.673614501953125, -52.65141677856445, -51.62921905517578, -50.60702133178711, -49.58482360839844, -48.562625885009766, -47.540428161621094, -46.51823043823242, -45.49603271484375, -44.47383499145508, -43.451637268066406, -42.429439544677734, -41.40724182128906, -40.38504409790039, -39.36284637451172, -38.34064865112305, -37.318450927734375, -36.2962532043457, -35.27405548095703, -34.25185775756836, -33.22966003417969, -32.207462310791016, -31.185264587402344, -30.163066864013672, -29.140872955322266, -28.118675231933594, -27.096477508544922, -26.07427978515625, -25.052082061767578, -24.029884338378906, -23.007686614990234, -21.985488891601562, -20.96329116821289, -19.94109344482422, -18.918895721435547, -17.896697998046875, -16.874500274658203, -15.852302551269531, -14.830105781555176, -13.807908058166504, -12.785710334777832, -11.76351261138916, -10.741314888000488, -9.719118118286133, -8.696920394897461, -7.674722194671631, -6.652524948120117, -5.630327224731445, -4.608129501342773, -3.5859317779541016, -2.563734292984009, -1.541536808013916, -0.5193390846252441, 0.5028586387634277, 1.5250558853149414, 2.5472536087036133, 3.569451332092285, 4.591649055480957, 5.613846778869629, 6.636044025421143, 7.6582417488098145, 8.680438995361328, 9.70263671875, 10.724834442138672, 11.747032165527344]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 6.0, 5.0, 11.0, 9.0, 15.0, 17.0, 20.0, 17.0, 27.0, 20.0, 28.0, 26.0, 33.0, 44.0, 49.0, 37.0, 60.0, 46.0, 41.0, 38.0, 39.0, 37.0, 33.0, 44.0, 38.0, 32.0, 47.0, 21.0, 25.0, 25.0, 23.0, 12.0, 13.0, 8.0, 15.0, 12.0, 5.0, 5.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.15804672241211, -20.55150032043457, -19.94495391845703, -19.33840560913086, -18.73185920715332, -18.12531280517578, -17.518766403198242, -16.912220001220703, -16.30567169189453, -15.699125289916992, -15.092577934265137, -14.486031532287598, -13.879484176635742, -13.272937774658203, -12.666391372680664, -12.059844017028809, -11.45329761505127, -10.84675121307373, -10.240203857421875, -9.633657455444336, -9.02711009979248, -8.420563697814941, -7.814016819000244, -7.207469940185547, -6.60092306137085, -5.994376182556152, -5.387829303741455, -4.781282424926758, -4.174736022949219, -3.5681889057159424, -2.961642265319824, -2.355095386505127, -1.7485485076904297, -1.1420016288757324, -0.5354548692703247, 0.07109189033508301, 0.6776387691497803, 1.2841856479644775, 1.8907322883605957, 2.497279167175293, 3.1038260459899902, 3.7103729248046875, 4.316919803619385, 4.923466682434082, 5.530013084411621, 6.136560440063477, 6.743106842041016, 7.349653720855713, 7.95620059967041, 8.56274700164795, 9.169294357299805, 9.775840759277344, 10.3823881149292, 10.988934516906738, 11.595481872558594, 12.202028274536133, 12.808574676513672, 13.415121078491211, 14.021668434143066, 14.628214836120605, 15.234762191772461, 15.84130859375, 16.44785499572754, 17.054401397705078, 17.66094970703125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 8.0, 9.0, 11.0, 11.0, 8.0, 18.0, 15.0, 31.0, 23.0, 32.0, 27.0, 26.0, 26.0, 43.0, 40.0, 48.0, 49.0, 35.0, 45.0, 37.0, 57.0, 22.0, 49.0, 41.0, 29.0, 37.0, 27.0, 24.0, 12.0, 13.0, 20.0, 15.0, 17.0, 15.0, 11.0, 16.0, 7.0, 7.0, 9.0, 4.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.033203125, -2.945037841796875, -2.85687255859375, -2.768707275390625, -2.6805419921875, -2.592376708984375, -2.50421142578125, -2.416046142578125, -2.327880859375, -2.239715576171875, -2.15155029296875, -2.063385009765625, -1.9752197265625, -1.887054443359375, -1.79888916015625, -1.710723876953125, -1.62255859375, -1.534393310546875, -1.44622802734375, -1.358062744140625, -1.2698974609375, -1.181732177734375, -1.09356689453125, -1.005401611328125, -0.917236328125, -0.829071044921875, -0.74090576171875, -0.652740478515625, -0.5645751953125, -0.476409912109375, -0.38824462890625, -0.300079345703125, -0.2119140625, -0.123748779296875, -0.03558349609375, 0.052581787109375, 0.1407470703125, 0.228912353515625, 0.31707763671875, 0.405242919921875, 0.493408203125, 0.581573486328125, 0.66973876953125, 0.757904052734375, 0.8460693359375, 0.934234619140625, 1.02239990234375, 1.110565185546875, 1.19873046875, 1.286895751953125, 1.37506103515625, 1.463226318359375, 1.5513916015625, 1.639556884765625, 1.72772216796875, 1.815887451171875, 1.904052734375, 1.992218017578125, 2.08038330078125, 2.168548583984375, 2.2567138671875, 2.344879150390625, 2.43304443359375, 2.521209716796875, 2.609375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 12.0, 8.0, 20.0, 28.0, 37.0, 57.0, 71.0, 118.0, 162.0, 246.0, 370.0, 465.0, 758.0, 1101.0, 1571.0, 2305.0, 3412.0, 5034.0, 7469.0, 11218.0, 17085.0, 26087.0, 41259.0, 72301.0, 139848.0, 350329.0, 160111.0, 78857.0, 45293.0, 28134.0, 17826.0, 11918.0, 8003.0, 5513.0, 3620.0, 2570.0, 1696.0, 1139.0, 796.0, 541.0, 364.0, 277.0, 161.0, 111.0, 90.0, 51.0, 37.0, 30.0, 15.0, 18.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.12322998046875, -0.11944770812988281, -0.11566543579101562, -0.11188316345214844, -0.10810089111328125, -0.10431861877441406, -0.10053634643554688, -0.09675407409667969, -0.0929718017578125, -0.08918952941894531, -0.08540725708007812, -0.08162498474121094, -0.07784271240234375, -0.07406044006347656, -0.07027816772460938, -0.06649589538574219, -0.062713623046875, -0.05893135070800781, -0.055149078369140625, -0.05136680603027344, -0.04758453369140625, -0.04380226135253906, -0.040019989013671875, -0.03623771667480469, -0.0324554443359375, -0.028673171997070312, -0.024890899658203125, -0.021108627319335938, -0.01732635498046875, -0.013544082641601562, -0.009761810302734375, -0.0059795379638671875, -0.002197265625, 0.0015850067138671875, 0.005367279052734375, 0.009149551391601562, 0.01293182373046875, 0.016714096069335938, 0.020496368408203125, 0.024278640747070312, 0.0280609130859375, 0.03184318542480469, 0.035625457763671875, 0.03940773010253906, 0.04319000244140625, 0.04697227478027344, 0.050754547119140625, 0.05453681945800781, 0.058319091796875, 0.06210136413574219, 0.06588363647460938, 0.06966590881347656, 0.07344818115234375, 0.07723045349121094, 0.08101272583007812, 0.08479499816894531, 0.0885772705078125, 0.09235954284667969, 0.09614181518554688, 0.09992408752441406, 0.10370635986328125, 0.10748863220214844, 0.11127090454101562, 0.11505317687988281, 0.11883544921875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 13.0, 9.0, 7.0, 8.0, 23.0, 22.0, 26.0, 22.0, 33.0, 38.0, 39.0, 27.0, 47.0, 34.0, 45.0, 42.0, 42.0, 1068.0, 48.0, 40.0, 37.0, 50.0, 43.0, 28.0, 28.0, 42.0, 22.0, 38.0, 14.0, 14.0, 25.0, 13.0, 15.0, 4.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.288116455078125, -2.21685791015625, -2.145599365234375, -2.0743408203125, -2.003082275390625, -1.93182373046875, -1.860565185546875, -1.789306640625, -1.718048095703125, -1.64678955078125, -1.575531005859375, -1.5042724609375, -1.433013916015625, -1.36175537109375, -1.290496826171875, -1.21923828125, -1.147979736328125, -1.07672119140625, -1.005462646484375, -0.9342041015625, -0.862945556640625, -0.79168701171875, -0.720428466796875, -0.649169921875, -0.577911376953125, -0.50665283203125, -0.435394287109375, -0.3641357421875, -0.292877197265625, -0.22161865234375, -0.150360107421875, -0.0791015625, -0.007843017578125, 0.06341552734375, 0.134674072265625, 0.2059326171875, 0.277191162109375, 0.34844970703125, 0.419708251953125, 0.490966796875, 0.562225341796875, 0.63348388671875, 0.704742431640625, 0.7760009765625, 0.847259521484375, 0.91851806640625, 0.989776611328125, 1.06103515625, 1.132293701171875, 1.20355224609375, 1.274810791015625, 1.3460693359375, 1.417327880859375, 1.48858642578125, 1.559844970703125, 1.631103515625, 1.702362060546875, 1.77362060546875, 1.844879150390625, 1.9161376953125, 1.987396240234375, 2.05865478515625, 2.129913330078125, 2.201171875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 11.0, 9.0, 9.0, 18.0, 31.0, 41.0, 62.0, 85.0, 158.0, 275.0, 346.0, 573.0, 960.0, 1464.0, 2338.0, 3605.0, 5698.0, 9294.0, 14173.0, 22523.0, 35957.0, 59899.0, 105374.0, 225419.0, 1325909.0, 114844.0, 64186.0, 38353.0, 24097.0, 15105.0, 9581.0, 6013.0, 3914.0, 2441.0, 1641.0, 924.0, 645.0, 431.0, 228.0, 169.0, 129.0, 73.0, 36.0, 32.0, 20.0, 14.0, 8.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06414794921875, -0.06208324432373047, -0.06001853942871094, -0.057953834533691406, -0.055889129638671875, -0.053824424743652344, -0.05175971984863281, -0.04969501495361328, -0.04763031005859375, -0.04556560516357422, -0.04350090026855469, -0.041436195373535156, -0.039371490478515625, -0.037306785583496094, -0.03524208068847656, -0.03317737579345703, -0.0311126708984375, -0.02904796600341797, -0.026983261108398438, -0.024918556213378906, -0.022853851318359375, -0.020789146423339844, -0.018724441528320312, -0.01665973663330078, -0.01459503173828125, -0.012530326843261719, -0.010465621948242188, -0.008400917053222656, -0.006336212158203125, -0.004271507263183594, -0.0022068023681640625, -0.00014209747314453125, 0.001922607421875, 0.003987312316894531, 0.0060520172119140625, 0.008116722106933594, 0.010181427001953125, 0.012246131896972656, 0.014310836791992188, 0.01637554168701172, 0.01844024658203125, 0.02050495147705078, 0.022569656372070312, 0.024634361267089844, 0.026699066162109375, 0.028763771057128906, 0.030828475952148438, 0.03289318084716797, 0.0349578857421875, 0.03702259063720703, 0.03908729553222656, 0.041152000427246094, 0.043216705322265625, 0.045281410217285156, 0.04734611511230469, 0.04941082000732422, 0.05147552490234375, 0.05354022979736328, 0.05560493469238281, 0.057669639587402344, 0.059734344482421875, 0.061799049377441406, 0.06386375427246094, 0.06592845916748047, 0.0679931640625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 1.0, 7.0, 3.0, 4.0, 6.0, 8.0, 7.0, 13.0, 6.0, 41.0, 17.0, 37.0, 29.0, 153.0, 352.0, 83.0, 84.0, 23.0, 40.0, 6.0, 15.0, 8.0, 13.0, 2.0, 10.0, 3.0, 4.0, 3.0, 12.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.682209014892578e-06, -2.594664692878723e-06, -2.507120370864868e-06, -2.419576048851013e-06, -2.332031726837158e-06, -2.2444874048233032e-06, -2.1569430828094482e-06, -2.0693987607955933e-06, -1.9818544387817383e-06, -1.8943101167678833e-06, -1.8067657947540283e-06, -1.7192214727401733e-06, -1.6316771507263184e-06, -1.5441328287124634e-06, -1.4565885066986084e-06, -1.3690441846847534e-06, -1.2814998626708984e-06, -1.1939555406570435e-06, -1.1064112186431885e-06, -1.0188668966293335e-06, -9.313225746154785e-07, -8.437782526016235e-07, -7.562339305877686e-07, -6.686896085739136e-07, -5.811452865600586e-07, -4.936009645462036e-07, -4.0605664253234863e-07, -3.1851232051849365e-07, -2.3096799850463867e-07, -1.434236764907837e-07, -5.587935447692871e-08, 3.166496753692627e-08, 1.1920928955078125e-07, 2.0675361156463623e-07, 2.942979335784912e-07, 3.818422555923462e-07, 4.6938657760620117e-07, 5.569308996200562e-07, 6.444752216339111e-07, 7.320195436477661e-07, 8.195638656616211e-07, 9.071081876754761e-07, 9.94652509689331e-07, 1.082196831703186e-06, 1.169741153717041e-06, 1.257285475730896e-06, 1.344829797744751e-06, 1.432374119758606e-06, 1.519918441772461e-06, 1.607462763786316e-06, 1.695007085800171e-06, 1.7825514078140259e-06, 1.8700957298278809e-06, 1.957640051841736e-06, 2.045184373855591e-06, 2.132728695869446e-06, 2.2202730178833008e-06, 2.3078173398971558e-06, 2.3953616619110107e-06, 2.4829059839248657e-06, 2.5704503059387207e-06, 2.6579946279525757e-06, 2.7455389499664307e-06, 2.8330832719802856e-06, 2.9206275939941406e-06]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 8.0, 5.0, 3.0, 8.0, 3.0, 10.0, 12.0, 10.0, 11.0, 33.0, 57.0, 117.0, 350.0, 11821.0, 1029994.0, 5530.0, 290.0, 107.0, 54.0, 35.0, 24.0, 13.0, 10.0, 6.0, 6.0, 9.0, 6.0, 0.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.109476089477539e-05, -5.926750600337982e-05, -5.744025111198425e-05, -5.5612996220588684e-05, -5.3785741329193115e-05, -5.1958486437797546e-05, -5.013123154640198e-05, -4.830397665500641e-05, -4.647672176361084e-05, -4.464946687221527e-05, -4.28222119808197e-05, -4.099495708942413e-05, -3.9167702198028564e-05, -3.7340447306632996e-05, -3.551319241523743e-05, -3.368593752384186e-05, -3.185868263244629e-05, -3.003142774105072e-05, -2.820417284965515e-05, -2.6376917958259583e-05, -2.4549663066864014e-05, -2.2722408175468445e-05, -2.0895153284072876e-05, -1.9067898392677307e-05, -1.7240643501281738e-05, -1.541338860988617e-05, -1.35861337184906e-05, -1.1758878827095032e-05, -9.931623935699463e-06, -8.104369044303894e-06, -6.277114152908325e-06, -4.449859261512756e-06, -2.6226043701171875e-06, -7.953494787216187e-07, 1.0319054126739502e-06, 2.859160304069519e-06, 4.686415195465088e-06, 6.513670086860657e-06, 8.340924978256226e-06, 1.0168179869651794e-05, 1.1995434761047363e-05, 1.3822689652442932e-05, 1.56499445438385e-05, 1.747719943523407e-05, 1.930445432662964e-05, 2.1131709218025208e-05, 2.2958964109420776e-05, 2.4786219000816345e-05, 2.6613473892211914e-05, 2.8440728783607483e-05, 3.0267983675003052e-05, 3.209523856639862e-05, 3.392249345779419e-05, 3.574974834918976e-05, 3.757700324058533e-05, 3.9404258131980896e-05, 4.1231513023376465e-05, 4.3058767914772034e-05, 4.48860228061676e-05, 4.671327769756317e-05, 4.854053258895874e-05, 5.036778748035431e-05, 5.219504237174988e-05, 5.402229726314545e-05, 5.5849552154541016e-05]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 29.0, 81.0, 486.0, 291.0, 80.0, 24.0, 14.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0188667804177385e-06, -1.9268757114332402e-06, -1.834884642448742e-06, -1.7428935734642437e-06, -1.6509025044797454e-06, -1.5589114354952471e-06, -1.4669204801975866e-06, -1.3749294112130883e-06, -1.28293834222859e-06, -1.1909472732440918e-06, -1.0989562042595935e-06, -1.006965248961933e-06, -9.149741231340158e-07, -8.229830541495176e-07, -7.309920420084381e-07, -6.390009730239399e-07, -5.470099040394416e-07, -4.5501883505494334e-07, -3.630277944921545e-07, -2.7103675392936566e-07, -1.790456849448674e-07, -8.705461596036912e-08, 4.93639618071029e-09, 9.692746516520856e-08, 1.8891853414970683e-07, 2.809096031342051e-07, 3.7290064369699394e-07, 4.648916842597828e-07, 5.56882753244281e-07, 6.488738222287793e-07, 7.408648343698587e-07, 8.32855903354357e-07, 9.248469723388553e-07, 1.0168380413233535e-06, 1.1088291103078518e-06, 1.20082017929235e-06, 1.2928112482768483e-06, 1.3848023172613466e-06, 1.4767932725590072e-06, 1.5687843415435054e-06, 1.6607754105280037e-06, 1.752766479512502e-06, 1.8447575484970002e-06, 1.936748503794661e-06, 2.028739572779159e-06, 2.1207306417636573e-06, 2.2127217107481556e-06, 2.304712779732654e-06, 2.396703848717152e-06, 2.4886949177016504e-06, 2.5806859866861487e-06, 2.672677055670647e-06, 2.7646681246551452e-06, 2.8566591936396435e-06, 2.9486500352504663e-06, 3.04064133160864e-06, 3.132632173219463e-06, 3.224623242203961e-06, 3.3166143111884594e-06, 3.4086053801729577e-06, 3.500596449157456e-06, 3.592587518141954e-06, 3.6845785871264525e-06, 3.7765694287372753e-06, 3.868560725095449e-06]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 5.0, 0.0, 6.0, 0.0, 8.0, 0.0, 0.0, 20.0, 0.0, 52.0, 0.0, 0.0, 87.0, 0.0, 160.0, 0.0, 315.0, 0.0, 0.0, 176.0, 0.0, 101.0, 0.0, 33.0, 0.0, 0.0, 22.0, 0.0, 17.0, 0.0, 0.0, 4.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.497146725654602e-07, -7.245689630508423e-07, -6.994232535362244e-07, -6.742775440216064e-07, -6.491318345069885e-07, -6.239861249923706e-07, -5.988404154777527e-07, -5.736947059631348e-07, -5.485489964485168e-07, -5.234032869338989e-07, -4.98257577419281e-07, -4.731118679046631e-07, -4.4796615839004517e-07, -4.2282044887542725e-07, -3.976747393608093e-07, -3.725290298461914e-07, -3.473833203315735e-07, -3.2223761081695557e-07, -2.9709190130233765e-07, -2.7194619178771973e-07, -2.468004822731018e-07, -2.2165477275848389e-07, -1.9650906324386597e-07, -1.7136335372924805e-07, -1.4621764421463013e-07, -1.210719347000122e-07, -9.592622518539429e-08, -7.078051567077637e-08, -4.563480615615845e-08, -2.0489096641540527e-08, 4.6566128730773926e-09, 2.9802322387695312e-08, 5.494803190231323e-08, 8.009374141693115e-08, 1.0523945093154907e-07, 1.30385160446167e-07, 1.555308699607849e-07, 1.8067657947540283e-07, 2.0582228899002075e-07, 2.3096799850463867e-07, 2.561137080192566e-07, 2.812594175338745e-07, 3.0640512704849243e-07, 3.3155083656311035e-07, 3.5669654607772827e-07, 3.818422555923462e-07, 4.069879651069641e-07, 4.3213367462158203e-07, 4.5727938413619995e-07, 4.824250936508179e-07, 5.075708031654358e-07, 5.327165126800537e-07, 5.578622221946716e-07, 5.830079317092896e-07, 6.081536412239075e-07, 6.332993507385254e-07, 6.584450602531433e-07, 6.835907697677612e-07, 7.087364792823792e-07, 7.338821887969971e-07, 7.59027898311615e-07, 7.841736078262329e-07, 8.093193173408508e-07, 8.344650268554688e-07]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 8.0, 9.0, 11.0, 11.0, 8.0, 18.0, 15.0, 31.0, 23.0, 32.0, 27.0, 26.0, 26.0, 43.0, 40.0, 48.0, 49.0, 35.0, 45.0, 37.0, 57.0, 22.0, 49.0, 41.0, 29.0, 37.0, 27.0, 24.0, 12.0, 13.0, 20.0, 15.0, 17.0, 15.0, 11.0, 16.0, 7.0, 7.0, 9.0, 4.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.033203125, -2.945037841796875, -2.85687255859375, -2.768707275390625, -2.6805419921875, -2.592376708984375, -2.50421142578125, -2.416046142578125, -2.327880859375, -2.239715576171875, -2.15155029296875, -2.063385009765625, -1.9752197265625, -1.887054443359375, -1.79888916015625, -1.710723876953125, -1.62255859375, -1.534393310546875, -1.44622802734375, -1.358062744140625, -1.2698974609375, -1.181732177734375, -1.09356689453125, -1.005401611328125, -0.917236328125, -0.829071044921875, -0.74090576171875, -0.652740478515625, -0.5645751953125, -0.476409912109375, -0.38824462890625, -0.300079345703125, -0.2119140625, -0.123748779296875, -0.03558349609375, 0.052581787109375, 0.1407470703125, 0.228912353515625, 0.31707763671875, 0.405242919921875, 0.493408203125, 0.581573486328125, 0.66973876953125, 0.757904052734375, 0.8460693359375, 0.934234619140625, 1.02239990234375, 1.110565185546875, 1.19873046875, 1.286895751953125, 1.37506103515625, 1.463226318359375, 1.5513916015625, 1.639556884765625, 1.72772216796875, 1.815887451171875, 1.904052734375, 1.992218017578125, 2.08038330078125, 2.168548583984375, 2.2567138671875, 2.344879150390625, 2.43304443359375, 2.521209716796875, 2.609375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 21.0, 17.0, 36.0, 54.0, 90.0, 157.0, 259.0, 453.0, 777.0, 1269.0, 2157.0, 3822.0, 6515.0, 11647.0, 21046.0, 40760.0, 82649.0, 175994.0, 330836.0, 187719.0, 88158.0, 43259.0, 22321.0, 12118.0, 6770.0, 4005.0, 2306.0, 1304.0, 798.0, 473.0, 290.0, 154.0, 115.0, 67.0, 47.0, 28.0, 15.0, 15.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.353515625, -3.2535400390625, -3.153564453125, -3.0535888671875, -2.95361328125, -2.8536376953125, -2.753662109375, -2.6536865234375, -2.5537109375, -2.4537353515625, -2.353759765625, -2.2537841796875, -2.15380859375, -2.0538330078125, -1.953857421875, -1.8538818359375, -1.75390625, -1.6539306640625, -1.553955078125, -1.4539794921875, -1.35400390625, -1.2540283203125, -1.154052734375, -1.0540771484375, -0.9541015625, -0.8541259765625, -0.754150390625, -0.6541748046875, -0.55419921875, -0.4542236328125, -0.354248046875, -0.2542724609375, -0.154296875, -0.0543212890625, 0.045654296875, 0.1456298828125, 0.24560546875, 0.3455810546875, 0.445556640625, 0.5455322265625, 0.6455078125, 0.7454833984375, 0.845458984375, 0.9454345703125, 1.04541015625, 1.1453857421875, 1.245361328125, 1.3453369140625, 1.4453125, 1.5452880859375, 1.645263671875, 1.7452392578125, 1.84521484375, 1.9451904296875, 2.045166015625, 2.1451416015625, 2.2451171875, 2.3450927734375, 2.445068359375, 2.5450439453125, 2.64501953125, 2.7449951171875, 2.844970703125, 2.9449462890625, 3.044921875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 8.0, 6.0, 9.0, 12.0, 17.0, 20.0, 16.0, 26.0, 22.0, 27.0, 35.0, 35.0, 37.0, 41.0, 41.0, 63.0, 112.0, 195.0, 1387.0, 259.0, 163.0, 98.0, 58.0, 51.0, 32.0, 28.0, 33.0, 30.0, 26.0, 16.0, 22.0, 18.0, 12.0, 15.0, 7.0, 12.0, 9.0, 7.0, 8.0, 4.0, 3.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.6015625, -9.30029296875, -8.9990234375, -8.69775390625, -8.396484375, -8.09521484375, -7.7939453125, -7.49267578125, -7.19140625, -6.89013671875, -6.5888671875, -6.28759765625, -5.986328125, -5.68505859375, -5.3837890625, -5.08251953125, -4.78125, -4.47998046875, -4.1787109375, -3.87744140625, -3.576171875, -3.27490234375, -2.9736328125, -2.67236328125, -2.37109375, -2.06982421875, -1.7685546875, -1.46728515625, -1.166015625, -0.86474609375, -0.5634765625, -0.26220703125, 0.0390625, 0.34033203125, 0.6416015625, 0.94287109375, 1.244140625, 1.54541015625, 1.8466796875, 2.14794921875, 2.44921875, 2.75048828125, 3.0517578125, 3.35302734375, 3.654296875, 3.95556640625, 4.2568359375, 4.55810546875, 4.859375, 5.16064453125, 5.4619140625, 5.76318359375, 6.064453125, 6.36572265625, 6.6669921875, 6.96826171875, 7.26953125, 7.57080078125, 7.8720703125, 8.17333984375, 8.474609375, 8.77587890625, 9.0771484375, 9.37841796875, 9.6796875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 5.0, 12.0, 12.0, 11.0, 23.0, 23.0, 35.0, 33.0, 44.0, 81.0, 95.0, 173.0, 229.0, 386.0, 803.0, 2377.0, 28051.0, 2202367.0, 892385.0, 14929.0, 1793.0, 714.0, 368.0, 218.0, 134.0, 87.0, 80.0, 59.0, 48.0, 23.0, 19.0, 19.0, 15.0, 7.0, 11.0, 4.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.875, -20.240478515625, -19.60595703125, -18.971435546875, -18.3369140625, -17.702392578125, -17.06787109375, -16.433349609375, -15.798828125, -15.164306640625, -14.52978515625, -13.895263671875, -13.2607421875, -12.626220703125, -11.99169921875, -11.357177734375, -10.72265625, -10.088134765625, -9.45361328125, -8.819091796875, -8.1845703125, -7.550048828125, -6.91552734375, -6.281005859375, -5.646484375, -5.011962890625, -4.37744140625, -3.742919921875, -3.1083984375, -2.473876953125, -1.83935546875, -1.204833984375, -0.5703125, 0.064208984375, 0.69873046875, 1.333251953125, 1.9677734375, 2.602294921875, 3.23681640625, 3.871337890625, 4.505859375, 5.140380859375, 5.77490234375, 6.409423828125, 7.0439453125, 7.678466796875, 8.31298828125, 8.947509765625, 9.58203125, 10.216552734375, 10.85107421875, 11.485595703125, 12.1201171875, 12.754638671875, 13.38916015625, 14.023681640625, 14.658203125, 15.292724609375, 15.92724609375, 16.561767578125, 17.1962890625, 17.830810546875, 18.46533203125, 19.099853515625, 19.734375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 12.0, 29.0, 64.0, 126.0, 170.0, 216.0, 152.0, 131.0, 75.0, 27.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.57356071472168, -22.415613174438477, -21.25766372680664, -20.099716186523438, -18.941768646240234, -17.7838191986084, -16.625871658325195, -15.467923164367676, -14.309974670410156, -13.152026176452637, -11.994077682495117, -10.836130142211914, -9.678181648254395, -8.520233154296875, -7.362285137176514, -6.204337120056152, -5.046388626098633, -3.8884403705596924, -2.730492115020752, -1.5725438594818115, -0.4145956039428711, 0.7433528900146484, 1.9013009071350098, 3.059248924255371, 4.217197418212891, 5.37514591217041, 6.5330939292907715, 7.691041946411133, 8.848990440368652, 10.006938934326172, 11.164886474609375, 12.322834968566895, 13.480781555175781, 14.6387300491333, 15.79667854309082, 16.954626083374023, 18.11257553100586, 19.270523071289062, 20.428470611572266, 21.58641815185547, 22.744367599487305, 23.902315139770508, 25.060264587402344, 26.218212127685547, 27.37615966796875, 28.534109115600586, 29.69205665588379, 30.850006103515625, 32.00795364379883, 33.16590118408203, 34.323848724365234, 35.4818000793457, 36.639747619628906, 37.79769515991211, 38.95564270019531, 40.113590240478516, 41.27153778076172, 42.42948532104492, 43.587432861328125, 44.745384216308594, 45.9033317565918, 47.061279296875, 48.2192268371582, 49.377174377441406, 50.535125732421875]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 9.0, 8.0, 10.0, 10.0, 13.0, 17.0, 20.0, 21.0, 19.0, 30.0, 30.0, 23.0, 20.0, 34.0, 47.0, 46.0, 40.0, 32.0, 47.0, 47.0, 51.0, 44.0, 48.0, 28.0, 41.0, 32.0, 45.0, 34.0, 28.0, 19.0, 18.0, 23.0, 8.0, 23.0, 13.0, 6.0, 12.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.353559494018555, -28.451400756835938, -27.549240112304688, -26.64708137512207, -25.744922637939453, -24.842763900756836, -23.94060516357422, -23.03844451904297, -22.13628578186035, -21.234127044677734, -20.331966400146484, -19.429807662963867, -18.52764892578125, -17.625490188598633, -16.723331451416016, -15.821170806884766, -14.919012069702148, -14.016853332519531, -13.114693641662598, -12.212533950805664, -11.310375213623047, -10.40821647644043, -9.506056785583496, -8.603897094726562, -7.701738357543945, -6.79957914352417, -5.8974199295043945, -4.995260715484619, -4.093101501464844, -3.1909422874450684, -2.288783073425293, -1.3866238594055176, -0.4844646453857422, 0.4176945686340332, 1.3198537826538086, 2.222012996673584, 3.1241722106933594, 4.026331424713135, 4.92849063873291, 5.8306498527526855, 6.732809066772461, 7.634968280792236, 8.537127494812012, 9.439287185668945, 10.341445922851562, 11.24360466003418, 12.145764350891113, 13.047924041748047, 13.950082778930664, 14.852241516113281, 15.754401206970215, 16.65656089782715, 17.558719635009766, 18.460878372192383, 19.363037109375, 20.26519775390625, 21.167356491088867, 22.069515228271484, 22.971675872802734, 23.87383460998535, 24.77599334716797, 25.678152084350586, 26.580310821533203, 27.482471466064453, 28.38463020324707]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 7.0, 8.0, 13.0, 12.0, 11.0, 18.0, 21.0, 21.0, 26.0, 31.0, 17.0, 24.0, 32.0, 36.0, 47.0, 39.0, 44.0, 63.0, 52.0, 42.0, 36.0, 38.0, 44.0, 48.0, 34.0, 36.0, 23.0, 15.0, 21.0, 29.0, 11.0, 15.0, 15.0, 13.0, 11.0, 12.0, 10.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.10546875, -3.00701904296875, -2.9085693359375, -2.81011962890625, -2.711669921875, -2.61322021484375, -2.5147705078125, -2.41632080078125, -2.31787109375, -2.21942138671875, -2.1209716796875, -2.02252197265625, -1.924072265625, -1.82562255859375, -1.7271728515625, -1.62872314453125, -1.5302734375, -1.43182373046875, -1.3333740234375, -1.23492431640625, -1.136474609375, -1.03802490234375, -0.9395751953125, -0.84112548828125, -0.74267578125, -0.64422607421875, -0.5457763671875, -0.44732666015625, -0.348876953125, -0.25042724609375, -0.1519775390625, -0.05352783203125, 0.044921875, 0.14337158203125, 0.2418212890625, 0.34027099609375, 0.438720703125, 0.53717041015625, 0.6356201171875, 0.73406982421875, 0.83251953125, 0.93096923828125, 1.0294189453125, 1.12786865234375, 1.226318359375, 1.32476806640625, 1.4232177734375, 1.52166748046875, 1.6201171875, 1.71856689453125, 1.8170166015625, 1.91546630859375, 2.013916015625, 2.11236572265625, 2.2108154296875, 2.30926513671875, 2.40771484375, 2.50616455078125, 2.6046142578125, 2.70306396484375, 2.801513671875, 2.89996337890625, 2.9984130859375, 3.09686279296875, 3.1953125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 8.0, 3.0, 14.0, 16.0, 16.0, 25.0, 47.0, 67.0, 112.0, 131.0, 230.0, 388.0, 662.0, 1211.0, 2189.0, 4294.0, 8731.0, 18511.0, 40893.0, 94883.0, 226362.0, 529672.0, 1065270.0, 1146336.0, 599137.0, 258908.0, 108450.0, 46675.0, 20921.0, 9790.0, 4760.0, 2371.0, 1287.0, 743.0, 442.0, 282.0, 174.0, 78.0, 63.0, 44.0, 31.0, 13.0, 17.0, 11.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.484375, -3.385040283203125, -3.28570556640625, -3.186370849609375, -3.0870361328125, -2.987701416015625, -2.88836669921875, -2.789031982421875, -2.689697265625, -2.590362548828125, -2.49102783203125, -2.391693115234375, -2.2923583984375, -2.193023681640625, -2.09368896484375, -1.994354248046875, -1.89501953125, -1.795684814453125, -1.69635009765625, -1.597015380859375, -1.4976806640625, -1.398345947265625, -1.29901123046875, -1.199676513671875, -1.100341796875, -1.001007080078125, -0.90167236328125, -0.802337646484375, -0.7030029296875, -0.603668212890625, -0.50433349609375, -0.404998779296875, -0.3056640625, -0.206329345703125, -0.10699462890625, -0.007659912109375, 0.0916748046875, 0.191009521484375, 0.29034423828125, 0.389678955078125, 0.489013671875, 0.588348388671875, 0.68768310546875, 0.787017822265625, 0.8863525390625, 0.985687255859375, 1.08502197265625, 1.184356689453125, 1.28369140625, 1.383026123046875, 1.48236083984375, 1.581695556640625, 1.6810302734375, 1.780364990234375, 1.87969970703125, 1.979034423828125, 2.078369140625, 2.177703857421875, 2.27703857421875, 2.376373291015625, 2.4757080078125, 2.575042724609375, 2.67437744140625, 2.773712158203125, 2.873046875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 8.0, 6.0, 8.0, 6.0, 8.0, 14.0, 12.0, 31.0, 44.0, 44.0, 72.0, 88.0, 122.0, 136.0, 193.0, 243.0, 291.0, 397.0, 391.0, 385.0, 381.0, 286.0, 226.0, 178.0, 119.0, 84.0, 78.0, 64.0, 41.0, 29.0, 22.0, 15.0, 19.0, 6.0, 4.0, 6.0, 10.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0], "bins": [-6.33984375, -6.17205810546875, -6.0042724609375, -5.83648681640625, -5.668701171875, -5.50091552734375, -5.3331298828125, -5.16534423828125, -4.99755859375, -4.82977294921875, -4.6619873046875, -4.49420166015625, -4.326416015625, -4.15863037109375, -3.9908447265625, -3.82305908203125, -3.6552734375, -3.48748779296875, -3.3197021484375, -3.15191650390625, -2.984130859375, -2.81634521484375, -2.6485595703125, -2.48077392578125, -2.31298828125, -2.14520263671875, -1.9774169921875, -1.80963134765625, -1.641845703125, -1.47406005859375, -1.3062744140625, -1.13848876953125, -0.970703125, -0.80291748046875, -0.6351318359375, -0.46734619140625, -0.299560546875, -0.13177490234375, 0.0360107421875, 0.20379638671875, 0.37158203125, 0.53936767578125, 0.7071533203125, 0.87493896484375, 1.042724609375, 1.21051025390625, 1.3782958984375, 1.54608154296875, 1.7138671875, 1.88165283203125, 2.0494384765625, 2.21722412109375, 2.385009765625, 2.55279541015625, 2.7205810546875, 2.88836669921875, 3.05615234375, 3.22393798828125, 3.3917236328125, 3.55950927734375, 3.727294921875, 3.89508056640625, 4.0628662109375, 4.23065185546875, 4.3984375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 8.0, 10.0, 6.0, 13.0, 16.0, 22.0, 34.0, 44.0, 65.0, 81.0, 108.0, 170.0, 228.0, 445.0, 1501.0, 45567.0, 3338150.0, 797831.0, 8169.0, 757.0, 310.0, 198.0, 134.0, 120.0, 84.0, 58.0, 44.0, 29.0, 20.0, 11.0, 8.0, 8.0, 8.0, 7.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.421875, -19.65966796875, -18.8974609375, -18.13525390625, -17.373046875, -16.61083984375, -15.8486328125, -15.08642578125, -14.32421875, -13.56201171875, -12.7998046875, -12.03759765625, -11.275390625, -10.51318359375, -9.7509765625, -8.98876953125, -8.2265625, -7.46435546875, -6.7021484375, -5.93994140625, -5.177734375, -4.41552734375, -3.6533203125, -2.89111328125, -2.12890625, -1.36669921875, -0.6044921875, 0.15771484375, 0.919921875, 1.68212890625, 2.4443359375, 3.20654296875, 3.96875, 4.73095703125, 5.4931640625, 6.25537109375, 7.017578125, 7.77978515625, 8.5419921875, 9.30419921875, 10.06640625, 10.82861328125, 11.5908203125, 12.35302734375, 13.115234375, 13.87744140625, 14.6396484375, 15.40185546875, 16.1640625, 16.92626953125, 17.6884765625, 18.45068359375, 19.212890625, 19.97509765625, 20.7373046875, 21.49951171875, 22.26171875, 23.02392578125, 23.7861328125, 24.54833984375, 25.310546875, 26.07275390625, 26.8349609375, 27.59716796875, 28.359375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 14.0, 26.0, 37.0, 69.0, 108.0, 157.0, 155.0, 170.0, 128.0, 80.0, 37.0, 18.0, 9.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.42382049560547, -26.81435203552246, -25.20488166809082, -23.595413208007812, -21.985942840576172, -20.376474380493164, -18.767005920410156, -17.157535552978516, -15.548067092895508, -13.938597679138184, -12.32912826538086, -10.719659805297852, -9.110190391540527, -7.500720977783203, -5.891252517700195, -4.281783103942871, -2.672313690185547, -1.0628445148468018, 0.5466246604919434, 2.1560935974121094, 3.7655630111694336, 5.375032424926758, 6.984500885009766, 8.59397029876709, 10.203439712524414, 11.812909126281738, 13.422378540039062, 15.03184700012207, 16.641315460205078, 18.25078582763672, 19.860254287719727, 21.469722747802734, 23.079193115234375, 24.688661575317383, 26.298131942749023, 27.90760040283203, 29.517070770263672, 31.12653923034668, 32.73600769042969, 34.34547805786133, 35.95494842529297, 37.56441879272461, 39.173885345458984, 40.783355712890625, 42.392826080322266, 44.002296447753906, 45.61176300048828, 47.22123336791992, 48.8306999206543, 50.44017028808594, 52.04963684082031, 53.65910720825195, 55.268577575683594, 56.87804412841797, 58.48751449584961, 60.09698486328125, 61.706451416015625, 63.315921783447266, 64.9253921508789, 66.53485870361328, 68.14432525634766, 69.75379943847656, 71.36326599121094, 72.97273254394531, 74.58220672607422]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 14.0, 5.0, 9.0, 9.0, 7.0, 9.0, 10.0, 11.0, 20.0, 13.0, 19.0, 24.0, 25.0, 27.0, 16.0, 32.0, 29.0, 23.0, 33.0, 36.0, 33.0, 38.0, 28.0, 37.0, 36.0, 26.0, 43.0, 29.0, 41.0, 25.0, 39.0, 25.0, 26.0, 27.0, 19.0, 23.0, 27.0, 17.0, 9.0, 11.0, 14.0, 9.0, 8.0, 8.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-15.946121215820312, -15.441732406616211, -14.937342643737793, -14.432952880859375, -13.928564071655273, -13.424175262451172, -12.919785499572754, -12.415395736694336, -11.911006927490234, -11.406618118286133, -10.902228355407715, -10.397838592529297, -9.893449783325195, -9.389060974121094, -8.884671211242676, -8.380281448364258, -7.875892639160156, -7.3715033531188965, -6.867114067077637, -6.362724781036377, -5.858335494995117, -5.353946208953857, -4.849556922912598, -4.345167636871338, -3.840778350830078, -3.3363890647888184, -2.8319997787475586, -2.327610492706299, -1.823221206665039, -1.3188319206237793, -0.8144426345825195, -0.31005334854125977, 0.1943359375, 0.6987252235412598, 1.2031145095825195, 1.7075037956237793, 2.211893081665039, 2.716282367706299, 3.2206716537475586, 3.7250609397888184, 4.229450225830078, 4.733839511871338, 5.238228797912598, 5.742618083953857, 6.247007369995117, 6.751396656036377, 7.255785942077637, 7.7601752281188965, 8.264564514160156, 8.768953323364258, 9.273343086242676, 9.777732849121094, 10.282121658325195, 10.786510467529297, 11.290900230407715, 11.795289993286133, 12.299678802490234, 12.804067611694336, 13.308457374572754, 13.812847137451172, 14.317235946655273, 14.821624755859375, 15.326014518737793, 15.830404281616211, 16.334793090820312]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 10.0, 9.0, 9.0, 18.0, 18.0, 14.0, 19.0, 20.0, 28.0, 26.0, 26.0, 44.0, 30.0, 29.0, 45.0, 44.0, 54.0, 45.0, 39.0, 52.0, 32.0, 36.0, 38.0, 42.0, 32.0, 33.0, 17.0, 19.0, 18.0, 26.0, 9.0, 8.0, 20.0, 19.0, 17.0, 8.0, 4.0, 7.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.099609375, -3.008575439453125, -2.91754150390625, -2.826507568359375, -2.7354736328125, -2.644439697265625, -2.55340576171875, -2.462371826171875, -2.371337890625, -2.280303955078125, -2.18927001953125, -2.098236083984375, -2.0072021484375, -1.916168212890625, -1.82513427734375, -1.734100341796875, -1.64306640625, -1.552032470703125, -1.46099853515625, -1.369964599609375, -1.2789306640625, -1.187896728515625, -1.09686279296875, -1.005828857421875, -0.914794921875, -0.823760986328125, -0.73272705078125, -0.641693115234375, -0.5506591796875, -0.459625244140625, -0.36859130859375, -0.277557373046875, -0.1865234375, -0.095489501953125, -0.00445556640625, 0.086578369140625, 0.1776123046875, 0.268646240234375, 0.35968017578125, 0.450714111328125, 0.541748046875, 0.632781982421875, 0.72381591796875, 0.814849853515625, 0.9058837890625, 0.996917724609375, 1.08795166015625, 1.178985595703125, 1.27001953125, 1.361053466796875, 1.45208740234375, 1.543121337890625, 1.6341552734375, 1.725189208984375, 1.81622314453125, 1.907257080078125, 1.998291015625, 2.089324951171875, 2.18035888671875, 2.271392822265625, 2.3624267578125, 2.453460693359375, 2.54449462890625, 2.635528564453125, 2.7265625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 12.0, 15.0, 20.0, 29.0, 55.0, 61.0, 100.0, 149.0, 177.0, 286.0, 342.0, 540.0, 720.0, 1046.0, 1438.0, 1983.0, 2729.0, 3849.0, 5423.0, 7639.0, 11142.0, 16322.0, 24012.0, 37108.0, 59080.0, 104783.0, 275079.0, 230047.0, 97705.0, 56091.0, 35252.0, 22967.0, 15834.0, 10788.0, 7486.0, 5280.0, 3714.0, 2637.0, 1898.0, 1338.0, 994.0, 678.0, 520.0, 322.0, 256.0, 172.0, 120.0, 116.0, 56.0, 39.0, 46.0, 23.0, 19.0, 12.0, 4.0, 2.0, 2.0, 5.0], "bins": [-0.118896484375, -0.11528778076171875, -0.1116790771484375, -0.10807037353515625, -0.104461669921875, -0.10085296630859375, -0.0972442626953125, -0.09363555908203125, -0.09002685546875, -0.08641815185546875, -0.0828094482421875, -0.07920074462890625, -0.075592041015625, -0.07198333740234375, -0.0683746337890625, -0.06476593017578125, -0.0611572265625, -0.05754852294921875, -0.0539398193359375, -0.05033111572265625, -0.046722412109375, -0.04311370849609375, -0.0395050048828125, -0.03589630126953125, -0.03228759765625, -0.02867889404296875, -0.0250701904296875, -0.02146148681640625, -0.017852783203125, -0.01424407958984375, -0.0106353759765625, -0.00702667236328125, -0.00341796875, 0.00019073486328125, 0.0037994384765625, 0.00740814208984375, 0.011016845703125, 0.01462554931640625, 0.0182342529296875, 0.02184295654296875, 0.02545166015625, 0.02906036376953125, 0.0326690673828125, 0.03627777099609375, 0.039886474609375, 0.04349517822265625, 0.0471038818359375, 0.05071258544921875, 0.0543212890625, 0.05792999267578125, 0.0615386962890625, 0.06514739990234375, 0.068756103515625, 0.07236480712890625, 0.0759735107421875, 0.07958221435546875, 0.08319091796875, 0.08679962158203125, 0.0904083251953125, 0.09401702880859375, 0.097625732421875, 0.10123443603515625, 0.1048431396484375, 0.10845184326171875, 0.112060546875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 6.0, 5.0, 10.0, 13.0, 16.0, 12.0, 13.0, 20.0, 20.0, 19.0, 22.0, 29.0, 34.0, 30.0, 37.0, 41.0, 46.0, 43.0, 35.0, 1050.0, 36.0, 28.0, 52.0, 34.0, 32.0, 41.0, 32.0, 25.0, 42.0, 28.0, 28.0, 24.0, 12.0, 10.0, 18.0, 11.0, 14.0, 12.0, 3.0, 12.0, 6.0, 3.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.056640625, -1.993927001953125, -1.93121337890625, -1.868499755859375, -1.8057861328125, -1.743072509765625, -1.68035888671875, -1.617645263671875, -1.554931640625, -1.492218017578125, -1.42950439453125, -1.366790771484375, -1.3040771484375, -1.241363525390625, -1.17864990234375, -1.115936279296875, -1.05322265625, -0.990509033203125, -0.92779541015625, -0.865081787109375, -0.8023681640625, -0.739654541015625, -0.67694091796875, -0.614227294921875, -0.551513671875, -0.488800048828125, -0.42608642578125, -0.363372802734375, -0.3006591796875, -0.237945556640625, -0.17523193359375, -0.112518310546875, -0.0498046875, 0.012908935546875, 0.07562255859375, 0.138336181640625, 0.2010498046875, 0.263763427734375, 0.32647705078125, 0.389190673828125, 0.451904296875, 0.514617919921875, 0.57733154296875, 0.640045166015625, 0.7027587890625, 0.765472412109375, 0.82818603515625, 0.890899658203125, 0.95361328125, 1.016326904296875, 1.07904052734375, 1.141754150390625, 1.2044677734375, 1.267181396484375, 1.32989501953125, 1.392608642578125, 1.455322265625, 1.518035888671875, 1.58074951171875, 1.643463134765625, 1.7061767578125, 1.768890380859375, 1.83160400390625, 1.894317626953125, 1.95703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 7.0, 12.0, 14.0, 21.0, 30.0, 37.0, 78.0, 98.0, 130.0, 200.0, 293.0, 424.0, 633.0, 871.0, 1340.0, 1835.0, 2620.0, 3663.0, 5370.0, 7477.0, 11049.0, 16329.0, 24141.0, 36563.0, 58421.0, 98813.0, 188288.0, 1312407.0, 124517.0, 70127.0, 43275.0, 27891.0, 18523.0, 12679.0, 8855.0, 6051.0, 4193.0, 2990.0, 2063.0, 1473.0, 975.0, 738.0, 511.0, 342.0, 244.0, 163.0, 126.0, 81.0, 59.0, 38.0, 22.0, 19.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.056365966796875, -0.054558753967285156, -0.05275154113769531, -0.05094432830810547, -0.049137115478515625, -0.04732990264892578, -0.04552268981933594, -0.043715476989746094, -0.04190826416015625, -0.040101051330566406, -0.03829383850097656, -0.03648662567138672, -0.034679412841796875, -0.03287220001220703, -0.031064987182617188, -0.029257774353027344, -0.0274505615234375, -0.025643348693847656, -0.023836135864257812, -0.02202892303466797, -0.020221710205078125, -0.01841449737548828, -0.016607284545898438, -0.014800071716308594, -0.01299285888671875, -0.011185646057128906, -0.009378433227539062, -0.007571220397949219, -0.005764007568359375, -0.003956794738769531, -0.0021495819091796875, -0.00034236907958984375, 0.00146484375, 0.0032720565795898438, 0.0050792694091796875, 0.006886482238769531, 0.008693695068359375, 0.010500907897949219, 0.012308120727539062, 0.014115333557128906, 0.01592254638671875, 0.017729759216308594, 0.019536972045898438, 0.02134418487548828, 0.023151397705078125, 0.02495861053466797, 0.026765823364257812, 0.028573036193847656, 0.0303802490234375, 0.032187461853027344, 0.03399467468261719, 0.03580188751220703, 0.037609100341796875, 0.03941631317138672, 0.04122352600097656, 0.043030738830566406, 0.04483795166015625, 0.046645164489746094, 0.04845237731933594, 0.05025959014892578, 0.052066802978515625, 0.05387401580810547, 0.05568122863769531, 0.057488441467285156, 0.059295654296875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 0.0, 5.0, 4.0, 4.0, 2.0, 4.0, 12.0, 10.0, 10.0, 11.0, 23.0, 24.0, 71.0, 54.0, 89.0, 427.0, 57.0, 48.0, 26.0, 46.0, 15.0, 13.0, 7.0, 13.0, 4.0, 5.0, 10.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-06, -1.7713755369186401e-06, -1.695007085800171e-06, -1.6186386346817017e-06, -1.5422701835632324e-06, -1.4659017324447632e-06, -1.389533281326294e-06, -1.3131648302078247e-06, -1.2367963790893555e-06, -1.1604279279708862e-06, -1.084059476852417e-06, -1.0076910257339478e-06, -9.313225746154785e-07, -8.549541234970093e-07, -7.7858567237854e-07, -7.022172212600708e-07, -6.258487701416016e-07, -5.494803190231323e-07, -4.731118679046631e-07, -3.9674341678619385e-07, -3.203749656677246e-07, -2.4400651454925537e-07, -1.6763806343078613e-07, -9.12696123123169e-08, -1.4901161193847656e-08, 6.146728992462158e-08, 1.3783574104309082e-07, 2.1420419216156006e-07, 2.905726432800293e-07, 3.6694109439849854e-07, 4.4330954551696777e-07, 5.19677996635437e-07, 5.960464477539062e-07, 6.724148988723755e-07, 7.487833499908447e-07, 8.25151801109314e-07, 9.015202522277832e-07, 9.778887033462524e-07, 1.0542571544647217e-06, 1.130625605583191e-06, 1.2069940567016602e-06, 1.2833625078201294e-06, 1.3597309589385986e-06, 1.4360994100570679e-06, 1.5124678611755371e-06, 1.5888363122940063e-06, 1.6652047634124756e-06, 1.7415732145309448e-06, 1.817941665649414e-06, 1.8943101167678833e-06, 1.9706785678863525e-06, 2.0470470190048218e-06, 2.123415470123291e-06, 2.1997839212417603e-06, 2.2761523723602295e-06, 2.3525208234786987e-06, 2.428889274597168e-06, 2.505257725715637e-06, 2.5816261768341064e-06, 2.6579946279525757e-06, 2.734363079071045e-06, 2.810731530189514e-06, 2.8870999813079834e-06, 2.9634684324264526e-06, 3.039836883544922e-06]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 6.0, 13.0, 7.0, 14.0, 28.0, 51.0, 78.0, 165.0, 1487.0, 865858.0, 179633.0, 841.0, 170.0, 75.0, 34.0, 22.0, 17.0, 8.0, 12.0, 8.0, 2.0, 1.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-6.872415542602539e-05, -6.700213998556137e-05, -6.528012454509735e-05, -6.355810910463333e-05, -6.183609366416931e-05, -6.011407822370529e-05, -5.839206278324127e-05, -5.667004734277725e-05, -5.494803190231323e-05, -5.322601646184921e-05, -5.150400102138519e-05, -4.978198558092117e-05, -4.805997014045715e-05, -4.6337954699993134e-05, -4.4615939259529114e-05, -4.2893923819065094e-05, -4.1171908378601074e-05, -3.9449892938137054e-05, -3.7727877497673035e-05, -3.6005862057209015e-05, -3.4283846616744995e-05, -3.2561831176280975e-05, -3.0839815735816956e-05, -2.9117800295352936e-05, -2.7395784854888916e-05, -2.5673769414424896e-05, -2.3951753973960876e-05, -2.2229738533496857e-05, -2.0507723093032837e-05, -1.8785707652568817e-05, -1.7063692212104797e-05, -1.5341676771640778e-05, -1.3619661331176758e-05, -1.1897645890712738e-05, -1.0175630450248718e-05, -8.453615009784698e-06, -6.731599569320679e-06, -5.009584128856659e-06, -3.287568688392639e-06, -1.5655532479286194e-06, 1.564621925354004e-07, 1.8784776329994202e-06, 3.60049307346344e-06, 5.32250851392746e-06, 7.0445239543914795e-06, 8.7665393948555e-06, 1.0488554835319519e-05, 1.2210570275783539e-05, 1.3932585716247559e-05, 1.565460115671158e-05, 1.7376616597175598e-05, 1.9098632037639618e-05, 2.0820647478103638e-05, 2.2542662918567657e-05, 2.4264678359031677e-05, 2.5986693799495697e-05, 2.7708709239959717e-05, 2.9430724680423737e-05, 3.1152740120887756e-05, 3.2874755561351776e-05, 3.4596771001815796e-05, 3.6318786442279816e-05, 3.8040801882743835e-05, 3.9762817323207855e-05, 4.1484832763671875e-05]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 8.0, 21.0, 27.0, 27.0, 41.0, 52.0, 62.0, 77.0, 95.0, 224.0, 91.0, 49.0, 54.0, 34.0, 32.0, 28.0, 12.0, 10.0, 11.0, 7.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.328449219632603e-07, -5.116322654430405e-07, -4.904196089228208e-07, -4.692069239808916e-07, -4.4799426746067184e-07, -4.267816109404521e-07, -4.055689259985229e-07, -3.8435626947830315e-07, -3.631436129580834e-07, -3.4193095643786364e-07, -3.207182999176439e-07, -2.995056149757147e-07, -2.7829295845549495e-07, -2.570803019352752e-07, -2.3586763120420073e-07, -2.1465496047312627e-07, -1.9344230395290651e-07, -1.7222964743268676e-07, -1.510169767016123e-07, -1.2980430597053783e-07, -1.0859164945031807e-07, -8.737898582467096e-08, -6.616632219902385e-08, -4.4953651467949385e-08, -2.3740994947729632e-08, -2.528331322082522e-09, 1.8684332303564588e-08, 3.98969959292117e-08, 6.110965955485881e-08, 8.232232318050592e-08, 1.0353498680615303e-07, 1.247476575372275e-07, 1.459603709008661e-07, 1.6717302742108586e-07, 1.8838569815216033e-07, 2.095983688832348e-07, 2.3081102540345455e-07, 2.520236819236743e-07, 2.732363668656035e-07, 2.9444902338582324e-07, 3.15661679906043e-07, 3.3687433642626274e-07, 3.580869929464825e-07, 3.792996778884117e-07, 4.0051233440863143e-07, 4.217249909288512e-07, 4.4293767587078037e-07, 4.641503323910001e-07, 4.853629889112199e-07, 5.065756454314396e-07, 5.277883019516594e-07, 5.490009584718791e-07, 5.702136149920989e-07, 5.914263283557375e-07, 6.126389848759572e-07, 6.33851641396177e-07, 6.550642979163968e-07, 6.762769544366165e-07, 6.974896109568363e-07, 7.18702267477056e-07, 7.399149808406946e-07, 7.611276373609144e-07, 7.823402938811341e-07, 8.035529504013539e-07, 8.247656069215736e-07]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 15.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 103.0, 0.0, 0.0, 155.0, 0.0, 0.0, 0.0, 242.0, 0.0, 0.0, 198.0, 0.0, 0.0, 0.0, 108.0, 0.0, 0.0, 58.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-07, -5.187466740608215e-07, -5.010515451431274e-07, -4.833564162254333e-07, -4.6566128730773926e-07, -4.4796615839004517e-07, -4.302710294723511e-07, -4.12575900554657e-07, -3.948807716369629e-07, -3.771856427192688e-07, -3.594905138015747e-07, -3.417953848838806e-07, -3.241002559661865e-07, -3.0640512704849243e-07, -2.8870999813079834e-07, -2.7101486921310425e-07, -2.5331974029541016e-07, -2.3562461137771606e-07, -2.1792948246002197e-07, -2.0023435354232788e-07, -1.825392246246338e-07, -1.648440957069397e-07, -1.471489667892456e-07, -1.2945383787155151e-07, -1.1175870895385742e-07, -9.406358003616333e-08, -7.636845111846924e-08, -5.8673322200775146e-08, -4.0978193283081055e-08, -2.3283064365386963e-08, -5.587935447692871e-09, 1.210719347000122e-08, 2.9802322387695312e-08, 4.7497451305389404e-08, 6.51925802230835e-08, 8.288770914077759e-08, 1.0058283805847168e-07, 1.1827796697616577e-07, 1.3597309589385986e-07, 1.5366822481155396e-07, 1.7136335372924805e-07, 1.8905848264694214e-07, 2.0675361156463623e-07, 2.2444874048233032e-07, 2.421438694000244e-07, 2.598389983177185e-07, 2.775341272354126e-07, 2.952292561531067e-07, 3.129243850708008e-07, 3.3061951398849487e-07, 3.4831464290618896e-07, 3.6600977182388306e-07, 3.8370490074157715e-07, 4.0140002965927124e-07, 4.1909515857696533e-07, 4.367902874946594e-07, 4.544854164123535e-07, 4.721805453300476e-07, 4.898756742477417e-07, 5.075708031654358e-07, 5.252659320831299e-07, 5.42961061000824e-07, 5.606561899185181e-07, 5.783513188362122e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 10.0, 9.0, 9.0, 18.0, 18.0, 14.0, 19.0, 20.0, 28.0, 26.0, 26.0, 44.0, 30.0, 29.0, 45.0, 44.0, 54.0, 45.0, 39.0, 52.0, 32.0, 36.0, 38.0, 42.0, 32.0, 33.0, 17.0, 19.0, 18.0, 26.0, 9.0, 8.0, 20.0, 19.0, 17.0, 8.0, 4.0, 7.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.099609375, -3.008575439453125, -2.91754150390625, -2.826507568359375, -2.7354736328125, -2.644439697265625, -2.55340576171875, -2.462371826171875, -2.371337890625, -2.280303955078125, -2.18927001953125, -2.098236083984375, -2.0072021484375, -1.916168212890625, -1.82513427734375, -1.734100341796875, -1.64306640625, -1.552032470703125, -1.46099853515625, -1.369964599609375, -1.2789306640625, -1.187896728515625, -1.09686279296875, -1.005828857421875, -0.914794921875, -0.823760986328125, -0.73272705078125, -0.641693115234375, -0.5506591796875, -0.459625244140625, -0.36859130859375, -0.277557373046875, -0.1865234375, -0.095489501953125, -0.00445556640625, 0.086578369140625, 0.1776123046875, 0.268646240234375, 0.35968017578125, 0.450714111328125, 0.541748046875, 0.632781982421875, 0.72381591796875, 0.814849853515625, 0.9058837890625, 0.996917724609375, 1.08795166015625, 1.178985595703125, 1.27001953125, 1.361053466796875, 1.45208740234375, 1.543121337890625, 1.6341552734375, 1.725189208984375, 1.81622314453125, 1.907257080078125, 1.998291015625, 2.089324951171875, 2.18035888671875, 2.271392822265625, 2.3624267578125, 2.453460693359375, 2.54449462890625, 2.635528564453125, 2.7265625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 11.0, 10.0, 16.0, 13.0, 37.0, 61.0, 104.0, 147.0, 257.0, 452.0, 722.0, 1252.0, 2019.0, 3418.0, 5677.0, 9520.0, 15660.0, 26898.0, 49979.0, 101519.0, 216342.0, 286241.0, 160830.0, 75009.0, 38592.0, 21762.0, 12745.0, 7596.0, 4635.0, 2860.0, 1728.0, 963.0, 592.0, 369.0, 198.0, 105.0, 68.0, 55.0, 36.0, 18.0, 11.0, 11.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.62890625, -3.523101806640625, -3.41729736328125, -3.311492919921875, -3.2056884765625, -3.099884033203125, -2.99407958984375, -2.888275146484375, -2.782470703125, -2.676666259765625, -2.57086181640625, -2.465057373046875, -2.3592529296875, -2.253448486328125, -2.14764404296875, -2.041839599609375, -1.93603515625, -1.830230712890625, -1.72442626953125, -1.618621826171875, -1.5128173828125, -1.407012939453125, -1.30120849609375, -1.195404052734375, -1.089599609375, -0.983795166015625, -0.87799072265625, -0.772186279296875, -0.6663818359375, -0.560577392578125, -0.45477294921875, -0.348968505859375, -0.2431640625, -0.137359619140625, -0.03155517578125, 0.074249267578125, 0.1800537109375, 0.285858154296875, 0.39166259765625, 0.497467041015625, 0.603271484375, 0.709075927734375, 0.81488037109375, 0.920684814453125, 1.0264892578125, 1.132293701171875, 1.23809814453125, 1.343902587890625, 1.44970703125, 1.555511474609375, 1.66131591796875, 1.767120361328125, 1.8729248046875, 1.978729248046875, 2.08453369140625, 2.190338134765625, 2.296142578125, 2.401947021484375, 2.50775146484375, 2.613555908203125, 2.7193603515625, 2.825164794921875, 2.93096923828125, 3.036773681640625, 3.142578125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 4.0, 8.0, 6.0, 11.0, 18.0, 19.0, 24.0, 18.0, 20.0, 29.0, 41.0, 37.0, 39.0, 22.0, 58.0, 67.0, 77.0, 128.0, 243.0, 1398.0, 197.0, 100.0, 75.0, 63.0, 59.0, 35.0, 36.0, 28.0, 21.0, 17.0, 23.0, 16.0, 19.0, 16.0, 10.0, 12.0, 7.0, 8.0, 3.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-9.890625, -9.5843505859375, -9.278076171875, -8.9718017578125, -8.66552734375, -8.3592529296875, -8.052978515625, -7.7467041015625, -7.4404296875, -7.1341552734375, -6.827880859375, -6.5216064453125, -6.21533203125, -5.9090576171875, -5.602783203125, -5.2965087890625, -4.990234375, -4.6839599609375, -4.377685546875, -4.0714111328125, -3.76513671875, -3.4588623046875, -3.152587890625, -2.8463134765625, -2.5400390625, -2.2337646484375, -1.927490234375, -1.6212158203125, -1.31494140625, -1.0086669921875, -0.702392578125, -0.3961181640625, -0.08984375, 0.2164306640625, 0.522705078125, 0.8289794921875, 1.13525390625, 1.4415283203125, 1.747802734375, 2.0540771484375, 2.3603515625, 2.6666259765625, 2.972900390625, 3.2791748046875, 3.58544921875, 3.8917236328125, 4.197998046875, 4.5042724609375, 4.810546875, 5.1168212890625, 5.423095703125, 5.7293701171875, 6.03564453125, 6.3419189453125, 6.648193359375, 6.9544677734375, 7.2607421875, 7.5670166015625, 7.873291015625, 8.1795654296875, 8.48583984375, 8.7921142578125, 9.098388671875, 9.4046630859375, 9.7109375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 9.0, 6.0, 8.0, 8.0, 19.0, 22.0, 28.0, 25.0, 40.0, 39.0, 66.0, 76.0, 108.0, 128.0, 212.0, 360.0, 1123.0, 11329.0, 475158.0, 2604916.0, 47794.0, 2628.0, 556.0, 283.0, 192.0, 131.0, 98.0, 91.0, 57.0, 31.0, 26.0, 27.0, 27.0, 19.0, 14.0, 8.0, 7.0, 8.0, 2.0, 9.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.078125, -19.43505859375, -18.7919921875, -18.14892578125, -17.505859375, -16.86279296875, -16.2197265625, -15.57666015625, -14.93359375, -14.29052734375, -13.6474609375, -13.00439453125, -12.361328125, -11.71826171875, -11.0751953125, -10.43212890625, -9.7890625, -9.14599609375, -8.5029296875, -7.85986328125, -7.216796875, -6.57373046875, -5.9306640625, -5.28759765625, -4.64453125, -4.00146484375, -3.3583984375, -2.71533203125, -2.072265625, -1.42919921875, -0.7861328125, -0.14306640625, 0.5, 1.14306640625, 1.7861328125, 2.42919921875, 3.072265625, 3.71533203125, 4.3583984375, 5.00146484375, 5.64453125, 6.28759765625, 6.9306640625, 7.57373046875, 8.216796875, 8.85986328125, 9.5029296875, 10.14599609375, 10.7890625, 11.43212890625, 12.0751953125, 12.71826171875, 13.361328125, 14.00439453125, 14.6474609375, 15.29052734375, 15.93359375, 16.57666015625, 17.2197265625, 17.86279296875, 18.505859375, 19.14892578125, 19.7919921875, 20.43505859375, 21.078125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 200.0, 817.0], "bins": [-514.3544921875, -506.2168273925781, -498.0791320800781, -489.94146728515625, -481.8038024902344, -473.6661376953125, -465.5284423828125, -457.3907775878906, -449.25311279296875, -441.1154479980469, -432.9777526855469, -424.840087890625, -416.7024230957031, -408.56475830078125, -400.42706298828125, -392.2893981933594, -384.1517028808594, -376.0140380859375, -367.8763427734375, -359.7386779785156, -351.60101318359375, -343.46331787109375, -335.3256530761719, -327.18798828125, -319.05029296875, -310.9126281738281, -302.7749328613281, -294.63726806640625, -286.4996032714844, -278.3619384765625, -270.2242431640625, -262.0865783691406, -253.9488983154297, -245.81121826171875, -237.67355346679688, -229.53587341308594, -221.398193359375, -213.26052856445312, -205.1228485107422, -196.98516845703125, -188.84750366210938, -180.70982360839844, -172.57215881347656, -164.43447875976562, -156.29681396484375, -148.1591339111328, -140.02145385742188, -131.8837890625, -123.7461166381836, -115.60844421386719, -107.47076416015625, -99.33309173583984, -91.19541931152344, -83.05774688720703, -74.92007446289062, -66.78239440917969, -58.644718170166016, -50.507041931152344, -42.36936950683594, -34.23169708251953, -26.09402084350586, -17.956348419189453, -9.818672180175781, -1.6809959411621094, 6.4566755294799805]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 13.0, 4.0, 12.0, 8.0, 20.0, 26.0, 10.0, 17.0, 16.0, 23.0, 30.0, 26.0, 22.0, 16.0, 26.0, 35.0, 41.0, 47.0, 55.0, 54.0, 45.0, 31.0, 40.0, 34.0, 41.0, 26.0, 37.0, 25.0, 23.0, 28.0, 25.0, 26.0, 18.0, 12.0, 12.0, 7.0, 13.0, 13.0, 8.0, 8.0, 6.0, 3.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.11357879638672, -24.307601928710938, -23.501625061035156, -22.695648193359375, -21.889673233032227, -21.083696365356445, -20.277719497680664, -19.471742630004883, -18.665767669677734, -17.859790802001953, -17.053813934326172, -16.24783706665039, -15.441862106323242, -14.635885238647461, -13.82990837097168, -13.023931503295898, -12.217954635620117, -11.411977767944336, -10.606001853942871, -9.80002498626709, -8.994049072265625, -8.188072204589844, -7.3820953369140625, -6.5761189460754395, -5.770142555236816, -4.964166164398193, -4.15818977355957, -3.352212905883789, -2.546236515045166, -1.740260124206543, -0.9342832565307617, -0.12830686569213867, 0.6776695251464844, 1.483646035194397, 2.2896225452423096, 3.0955991744995117, 3.9015755653381348, 4.707551956176758, 5.513528823852539, 6.319505214691162, 7.125481605529785, 7.931457996368408, 8.737434387207031, 9.543411254882812, 10.349388122558594, 11.155364036560059, 11.96134090423584, 12.767316818237305, 13.573293685913086, 14.379270553588867, 15.185246467590332, 15.991223335266113, 16.797199249267578, 17.60317611694336, 18.40915298461914, 19.215129852294922, 20.021106719970703, 20.827083587646484, 21.633060455322266, 22.439037322998047, 23.245012283325195, 24.050989151000977, 24.856966018676758, 25.66294288635254, 26.468917846679688]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 2.0, 9.0, 3.0, 11.0, 8.0, 14.0, 10.0, 15.0, 15.0, 23.0, 17.0, 26.0, 36.0, 31.0, 22.0, 41.0, 26.0, 38.0, 48.0, 48.0, 51.0, 37.0, 43.0, 45.0, 35.0, 32.0, 33.0, 39.0, 28.0, 26.0, 26.0, 19.0, 15.0, 19.0, 18.0, 16.0, 18.0, 10.0, 5.0, 8.0, 6.0, 6.0, 10.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.25, -3.155059814453125, -3.06011962890625, -2.965179443359375, -2.8702392578125, -2.775299072265625, -2.68035888671875, -2.585418701171875, -2.490478515625, -2.395538330078125, -2.30059814453125, -2.205657958984375, -2.1107177734375, -2.015777587890625, -1.92083740234375, -1.825897216796875, -1.73095703125, -1.636016845703125, -1.54107666015625, -1.446136474609375, -1.3511962890625, -1.256256103515625, -1.16131591796875, -1.066375732421875, -0.971435546875, -0.876495361328125, -0.78155517578125, -0.686614990234375, -0.5916748046875, -0.496734619140625, -0.40179443359375, -0.306854248046875, -0.2119140625, -0.116973876953125, -0.02203369140625, 0.072906494140625, 0.1678466796875, 0.262786865234375, 0.35772705078125, 0.452667236328125, 0.547607421875, 0.642547607421875, 0.73748779296875, 0.832427978515625, 0.9273681640625, 1.022308349609375, 1.11724853515625, 1.212188720703125, 1.30712890625, 1.402069091796875, 1.49700927734375, 1.591949462890625, 1.6868896484375, 1.781829833984375, 1.87677001953125, 1.971710205078125, 2.066650390625, 2.161590576171875, 2.25653076171875, 2.351470947265625, 2.4464111328125, 2.541351318359375, 2.63629150390625, 2.731231689453125, 2.826171875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 8.0, 10.0, 13.0, 5.0, 12.0, 22.0, 15.0, 16.0, 33.0, 35.0, 52.0, 74.0, 159.0, 406.0, 1027.0, 3178.0, 11297.0, 44860.0, 199892.0, 910458.0, 2057057.0, 751278.0, 163011.0, 37261.0, 9571.0, 2776.0, 970.0, 312.0, 166.0, 65.0, 38.0, 31.0, 22.0, 16.0, 15.0, 16.0, 12.0, 13.0, 17.0, 7.0, 8.0, 9.0, 4.0, 4.0, 8.0, 2.0, 1.0, 5.0, 1.0, 3.0], "bins": [-6.35546875, -6.1708984375, -5.986328125, -5.8017578125, -5.6171875, -5.4326171875, -5.248046875, -5.0634765625, -4.87890625, -4.6943359375, -4.509765625, -4.3251953125, -4.140625, -3.9560546875, -3.771484375, -3.5869140625, -3.40234375, -3.2177734375, -3.033203125, -2.8486328125, -2.6640625, -2.4794921875, -2.294921875, -2.1103515625, -1.92578125, -1.7412109375, -1.556640625, -1.3720703125, -1.1875, -1.0029296875, -0.818359375, -0.6337890625, -0.44921875, -0.2646484375, -0.080078125, 0.1044921875, 0.2890625, 0.4736328125, 0.658203125, 0.8427734375, 1.02734375, 1.2119140625, 1.396484375, 1.5810546875, 1.765625, 1.9501953125, 2.134765625, 2.3193359375, 2.50390625, 2.6884765625, 2.873046875, 3.0576171875, 3.2421875, 3.4267578125, 3.611328125, 3.7958984375, 3.98046875, 4.1650390625, 4.349609375, 4.5341796875, 4.71875, 4.9033203125, 5.087890625, 5.2724609375, 5.45703125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 9.0, 8.0, 10.0, 11.0, 17.0, 16.0, 17.0, 26.0, 36.0, 47.0, 61.0, 62.0, 106.0, 83.0, 119.0, 165.0, 181.0, 221.0, 290.0, 302.0, 337.0, 336.0, 297.0, 226.0, 210.0, 176.0, 136.0, 132.0, 93.0, 79.0, 50.0, 46.0, 34.0, 25.0, 22.0, 20.0, 10.0, 14.0, 8.0, 4.0, 8.0, 6.0, 5.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.09765625, -3.95989990234375, -3.8221435546875, -3.68438720703125, -3.546630859375, -3.40887451171875, -3.2711181640625, -3.13336181640625, -2.99560546875, -2.85784912109375, -2.7200927734375, -2.58233642578125, -2.444580078125, -2.30682373046875, -2.1690673828125, -2.03131103515625, -1.8935546875, -1.75579833984375, -1.6180419921875, -1.48028564453125, -1.342529296875, -1.20477294921875, -1.0670166015625, -0.92926025390625, -0.79150390625, -0.65374755859375, -0.5159912109375, -0.37823486328125, -0.240478515625, -0.10272216796875, 0.0350341796875, 0.17279052734375, 0.310546875, 0.44830322265625, 0.5860595703125, 0.72381591796875, 0.861572265625, 0.99932861328125, 1.1370849609375, 1.27484130859375, 1.41259765625, 1.55035400390625, 1.6881103515625, 1.82586669921875, 1.963623046875, 2.10137939453125, 2.2391357421875, 2.37689208984375, 2.5146484375, 2.65240478515625, 2.7901611328125, 2.92791748046875, 3.065673828125, 3.20343017578125, 3.3411865234375, 3.47894287109375, 3.61669921875, 3.75445556640625, 3.8922119140625, 4.02996826171875, 4.167724609375, 4.30548095703125, 4.4432373046875, 4.58099365234375, 4.71875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 3.0, 4.0, 4.0, 5.0, 9.0, 6.0, 12.0, 17.0, 9.0, 20.0, 23.0, 30.0, 42.0, 53.0, 67.0, 81.0, 106.0, 180.0, 190.0, 269.0, 479.0, 2127.0, 48822.0, 2063734.0, 2026478.0, 47790.0, 2118.0, 448.0, 275.0, 205.0, 136.0, 100.0, 106.0, 66.0, 62.0, 49.0, 34.0, 17.0, 28.0, 10.0, 13.0, 16.0, 10.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-20.890625, -20.293701171875, -19.69677734375, -19.099853515625, -18.5029296875, -17.906005859375, -17.30908203125, -16.712158203125, -16.115234375, -15.518310546875, -14.92138671875, -14.324462890625, -13.7275390625, -13.130615234375, -12.53369140625, -11.936767578125, -11.33984375, -10.742919921875, -10.14599609375, -9.549072265625, -8.9521484375, -8.355224609375, -7.75830078125, -7.161376953125, -6.564453125, -5.967529296875, -5.37060546875, -4.773681640625, -4.1767578125, -3.579833984375, -2.98291015625, -2.385986328125, -1.7890625, -1.192138671875, -0.59521484375, 0.001708984375, 0.5986328125, 1.195556640625, 1.79248046875, 2.389404296875, 2.986328125, 3.583251953125, 4.18017578125, 4.777099609375, 5.3740234375, 5.970947265625, 6.56787109375, 7.164794921875, 7.76171875, 8.358642578125, 8.95556640625, 9.552490234375, 10.1494140625, 10.746337890625, 11.34326171875, 11.940185546875, 12.537109375, 13.134033203125, 13.73095703125, 14.327880859375, 14.9248046875, 15.521728515625, 16.11865234375, 16.715576171875, 17.3125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 11.0, 12.0, 19.0, 29.0, 50.0, 52.0, 76.0, 95.0, 97.0, 97.0, 101.0, 81.0, 86.0, 58.0, 43.0, 41.0, 18.0, 19.0, 9.0, 8.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.57284927368164, -13.711023330688477, -12.849196434020996, -11.987370491027832, -11.125543594360352, -10.263717651367188, -9.401891708374023, -8.54006576538086, -7.678238868713379, -6.816412448883057, -5.954586029052734, -5.09276008605957, -4.230933666229248, -3.369107246398926, -2.5072813034057617, -1.6454548835754395, -0.7836284637451172, 0.07819783687591553, 0.9400241374969482, 1.8018503189086914, 2.6636767387390137, 3.525503158569336, 4.3873291015625, 5.249155521392822, 6.1109819412231445, 6.972808361053467, 7.834634780883789, 8.696460723876953, 9.558286666870117, 10.420113563537598, 11.281939506530762, 12.143766403198242, 13.005592346191406, 13.86741828918457, 14.72924518585205, 15.591071128845215, 16.452898025512695, 17.31472396850586, 18.176549911499023, 19.038375854492188, 19.900203704833984, 20.76202964782715, 21.623855590820312, 22.48568344116211, 23.347509384155273, 24.209335327148438, 25.0711612701416, 25.932987213134766, 26.79481315612793, 27.656639099121094, 28.518465042114258, 29.380290985107422, 30.24211883544922, 31.103944778442383, 31.965770721435547, 32.827598571777344, 33.689422607421875, 34.55125045776367, 35.4130744934082, 36.27490234375, 37.13672637939453, 37.99855422973633, 38.860382080078125, 39.722206115722656, 40.58403396606445]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 8.0, 13.0, 11.0, 13.0, 19.0, 16.0, 24.0, 31.0, 39.0, 28.0, 40.0, 34.0, 40.0, 29.0, 35.0, 39.0, 41.0, 45.0, 43.0, 36.0, 36.0, 36.0, 32.0, 37.0, 29.0, 30.0, 18.0, 26.0, 21.0, 23.0, 19.0, 19.0, 17.0, 13.0, 14.0, 11.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.84534454345703, -16.25760269165039, -15.669862747192383, -15.082121849060059, -14.494380950927734, -13.906639099121094, -13.31889820098877, -12.731157302856445, -12.143416404724121, -11.555675506591797, -10.967934608459473, -10.380193710327148, -9.792451858520508, -9.2047119140625, -8.61697006225586, -8.029229164123535, -7.441488265991211, -6.853747367858887, -6.2660064697265625, -5.67826509475708, -5.090524196624756, -4.502783298492432, -3.9150421619415283, -3.327301025390625, -2.739560127258301, -2.1518192291259766, -1.5640780925750732, -0.9763370752334595, -0.3885960578918457, 0.19914484024047852, 0.7868859767913818, 1.3746271133422852, 1.9623680114746094, 2.5501089096069336, 3.137850046157837, 3.7255911827087402, 4.3133320808410645, 4.901072978973389, 5.488814353942871, 6.076555252075195, 6.6642961502075195, 7.252037048339844, 7.839777946472168, 8.427518844604492, 9.015260696411133, 9.60300064086914, 10.190742492675781, 10.778483390808105, 11.36622428894043, 11.953965187072754, 12.541706085205078, 13.129446983337402, 13.717187881469727, 14.304929733276367, 14.892670631408691, 15.480411529541016, 16.068153381347656, 16.655895233154297, 17.243635177612305, 17.831377029418945, 18.419116973876953, 19.006858825683594, 19.5945987701416, 20.182340621948242, 20.77008056640625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 5.0, 5.0, 4.0, 6.0, 4.0, 15.0, 13.0, 9.0, 13.0, 21.0, 19.0, 21.0, 22.0, 28.0, 28.0, 29.0, 40.0, 41.0, 39.0, 34.0, 38.0, 36.0, 40.0, 52.0, 49.0, 30.0, 34.0, 41.0, 23.0, 43.0, 24.0, 27.0, 27.0, 20.0, 21.0, 21.0, 7.0, 15.0, 11.0, 11.0, 11.0, 4.0, 5.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.009765625, -2.917327880859375, -2.82489013671875, -2.732452392578125, -2.6400146484375, -2.547576904296875, -2.45513916015625, -2.362701416015625, -2.270263671875, -2.177825927734375, -2.08538818359375, -1.992950439453125, -1.9005126953125, -1.808074951171875, -1.71563720703125, -1.623199462890625, -1.53076171875, -1.438323974609375, -1.34588623046875, -1.253448486328125, -1.1610107421875, -1.068572998046875, -0.97613525390625, -0.883697509765625, -0.791259765625, -0.698822021484375, -0.60638427734375, -0.513946533203125, -0.4215087890625, -0.329071044921875, -0.23663330078125, -0.144195556640625, -0.0517578125, 0.040679931640625, 0.13311767578125, 0.225555419921875, 0.3179931640625, 0.410430908203125, 0.50286865234375, 0.595306396484375, 0.687744140625, 0.780181884765625, 0.87261962890625, 0.965057373046875, 1.0574951171875, 1.149932861328125, 1.24237060546875, 1.334808349609375, 1.42724609375, 1.519683837890625, 1.61212158203125, 1.704559326171875, 1.7969970703125, 1.889434814453125, 1.98187255859375, 2.074310302734375, 2.166748046875, 2.259185791015625, 2.35162353515625, 2.444061279296875, 2.5364990234375, 2.628936767578125, 2.72137451171875, 2.813812255859375, 2.90625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 8.0, 9.0, 15.0, 18.0, 28.0, 35.0, 46.0, 82.0, 100.0, 135.0, 169.0, 257.0, 367.0, 521.0, 711.0, 1027.0, 1399.0, 2039.0, 2880.0, 4206.0, 6170.0, 9056.0, 13300.0, 19858.0, 29832.0, 46297.0, 76004.0, 140500.0, 318096.0, 151202.0, 80029.0, 48319.0, 31165.0, 20645.0, 13750.0, 9312.0, 6396.0, 4379.0, 2987.0, 2135.0, 1449.0, 1062.0, 671.0, 566.0, 376.0, 258.0, 196.0, 139.0, 96.0, 80.0, 60.0, 42.0, 30.0, 16.0, 14.0, 11.0, 6.0, 3.0, 4.0, 2.0], "bins": [-0.1270751953125, -0.12317085266113281, -0.11926651000976562, -0.11536216735839844, -0.11145782470703125, -0.10755348205566406, -0.10364913940429688, -0.09974479675292969, -0.0958404541015625, -0.09193611145019531, -0.08803176879882812, -0.08412742614746094, -0.08022308349609375, -0.07631874084472656, -0.07241439819335938, -0.06851005554199219, -0.064605712890625, -0.06070137023925781, -0.056797027587890625, -0.05289268493652344, -0.04898834228515625, -0.04508399963378906, -0.041179656982421875, -0.03727531433105469, -0.0333709716796875, -0.029466629028320312, -0.025562286376953125, -0.021657943725585938, -0.01775360107421875, -0.013849258422851562, -0.009944915771484375, -0.0060405731201171875, -0.00213623046875, 0.0017681121826171875, 0.005672454833984375, 0.009576797485351562, 0.01348114013671875, 0.017385482788085938, 0.021289825439453125, 0.025194168090820312, 0.0290985107421875, 0.03300285339355469, 0.036907196044921875, 0.04081153869628906, 0.04471588134765625, 0.04862022399902344, 0.052524566650390625, 0.05642890930175781, 0.060333251953125, 0.06423759460449219, 0.06814193725585938, 0.07204627990722656, 0.07595062255859375, 0.07985496520996094, 0.08375930786132812, 0.08766365051269531, 0.0915679931640625, 0.09547233581542969, 0.09937667846679688, 0.10328102111816406, 0.10718536376953125, 0.11108970642089844, 0.11499404907226562, 0.11889839172363281, 0.122802734375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 8.0, 7.0, 11.0, 9.0, 17.0, 13.0, 6.0, 15.0, 29.0, 20.0, 20.0, 29.0, 39.0, 24.0, 29.0, 40.0, 35.0, 38.0, 43.0, 1067.0, 43.0, 44.0, 45.0, 41.0, 31.0, 43.0, 36.0, 31.0, 28.0, 30.0, 19.0, 21.0, 13.0, 16.0, 20.0, 10.0, 9.0, 9.0, 10.0, 9.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.15234375, -2.077606201171875, -2.00286865234375, -1.928131103515625, -1.8533935546875, -1.778656005859375, -1.70391845703125, -1.629180908203125, -1.554443359375, -1.479705810546875, -1.40496826171875, -1.330230712890625, -1.2554931640625, -1.180755615234375, -1.10601806640625, -1.031280517578125, -0.95654296875, -0.881805419921875, -0.80706787109375, -0.732330322265625, -0.6575927734375, -0.582855224609375, -0.50811767578125, -0.433380126953125, -0.358642578125, -0.283905029296875, -0.20916748046875, -0.134429931640625, -0.0596923828125, 0.015045166015625, 0.08978271484375, 0.164520263671875, 0.2392578125, 0.313995361328125, 0.38873291015625, 0.463470458984375, 0.5382080078125, 0.612945556640625, 0.68768310546875, 0.762420654296875, 0.837158203125, 0.911895751953125, 0.98663330078125, 1.061370849609375, 1.1361083984375, 1.210845947265625, 1.28558349609375, 1.360321044921875, 1.43505859375, 1.509796142578125, 1.58453369140625, 1.659271240234375, 1.7340087890625, 1.808746337890625, 1.88348388671875, 1.958221435546875, 2.032958984375, 2.107696533203125, 2.18243408203125, 2.257171630859375, 2.3319091796875, 2.406646728515625, 2.48138427734375, 2.556121826171875, 2.630859375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 18.0, 22.0, 45.0, 59.0, 123.0, 139.0, 274.0, 419.0, 586.0, 901.0, 1442.0, 2070.0, 3182.0, 4654.0, 6924.0, 10418.0, 15501.0, 24006.0, 38193.0, 62585.0, 112654.0, 1327267.0, 223824.0, 102073.0, 57916.0, 35462.0, 22266.0, 14770.0, 9567.0, 6591.0, 4403.0, 2931.0, 2032.0, 1295.0, 864.0, 601.0, 388.0, 237.0, 153.0, 103.0, 53.0, 29.0, 32.0, 15.0, 11.0, 10.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.07586669921875, -0.0735626220703125, -0.071258544921875, -0.0689544677734375, -0.066650390625, -0.0643463134765625, -0.062042236328125, -0.0597381591796875, -0.05743408203125, -0.0551300048828125, -0.052825927734375, -0.0505218505859375, -0.0482177734375, -0.0459136962890625, -0.043609619140625, -0.0413055419921875, -0.03900146484375, -0.0366973876953125, -0.034393310546875, -0.0320892333984375, -0.02978515625, -0.0274810791015625, -0.025177001953125, -0.0228729248046875, -0.02056884765625, -0.0182647705078125, -0.015960693359375, -0.0136566162109375, -0.0113525390625, -0.0090484619140625, -0.006744384765625, -0.0044403076171875, -0.00213623046875, 0.0001678466796875, 0.002471923828125, 0.0047760009765625, 0.007080078125, 0.0093841552734375, 0.011688232421875, 0.0139923095703125, 0.01629638671875, 0.0186004638671875, 0.020904541015625, 0.0232086181640625, 0.0255126953125, 0.0278167724609375, 0.030120849609375, 0.0324249267578125, 0.03472900390625, 0.0370330810546875, 0.039337158203125, 0.0416412353515625, 0.0439453125, 0.0462493896484375, 0.048553466796875, 0.0508575439453125, 0.05316162109375, 0.0554656982421875, 0.057769775390625, 0.0600738525390625, 0.0623779296875, 0.0646820068359375, 0.066986083984375, 0.0692901611328125, 0.07159423828125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 4.0, 7.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 19.0, 19.0, 0.0, 18.0, 27.0, 24.0, 46.0, 0.0, 56.0, 99.0, 303.0, 95.0, 80.0, 0.0, 41.0, 41.0, 23.0, 18.0, 0.0, 16.0, 10.0, 9.0, 6.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 0.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6689300537109375e-06, -1.6205012798309326e-06, -1.5720725059509277e-06, -1.5236437320709229e-06, -1.475214958190918e-06, -1.426786184310913e-06, -1.3783574104309082e-06, -1.3299286365509033e-06, -1.2814998626708984e-06, -1.2330710887908936e-06, -1.1846423149108887e-06, -1.1362135410308838e-06, -1.087784767150879e-06, -1.039355993270874e-06, -9.909272193908691e-07, -9.424984455108643e-07, -8.940696716308594e-07, -8.456408977508545e-07, -7.972121238708496e-07, -7.487833499908447e-07, -7.003545761108398e-07, -6.51925802230835e-07, -6.034970283508301e-07, -5.550682544708252e-07, -5.066394805908203e-07, -4.5821070671081543e-07, -4.0978193283081055e-07, -3.6135315895080566e-07, -3.129243850708008e-07, -2.644956111907959e-07, -2.1606683731079102e-07, -1.6763806343078613e-07, -1.1920928955078125e-07, -7.078051567077637e-08, -2.2351741790771484e-08, 2.60770320892334e-08, 7.450580596923828e-08, 1.2293457984924316e-07, 1.7136335372924805e-07, 2.1979212760925293e-07, 2.682209014892578e-07, 3.166496753692627e-07, 3.650784492492676e-07, 4.1350722312927246e-07, 4.6193599700927734e-07, 5.103647708892822e-07, 5.587935447692871e-07, 6.07222318649292e-07, 6.556510925292969e-07, 7.040798664093018e-07, 7.525086402893066e-07, 8.009374141693115e-07, 8.493661880493164e-07, 8.977949619293213e-07, 9.462237358093262e-07, 9.94652509689331e-07, 1.043081283569336e-06, 1.0915100574493408e-06, 1.1399388313293457e-06, 1.1883676052093506e-06, 1.2367963790893555e-06, 1.2852251529693604e-06, 1.3336539268493652e-06, 1.3820827007293701e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 2.0, 9.0, 11.0, 17.0, 19.0, 36.0, 42.0, 65.0, 117.0, 325.0, 2947.0, 173053.0, 864384.0, 6677.0, 420.0, 149.0, 83.0, 43.0, 21.0, 28.0, 24.0, 17.0, 13.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.962350845336914e-05, -2.8570182621479034e-05, -2.7516856789588928e-05, -2.6463530957698822e-05, -2.5410205125808716e-05, -2.435687929391861e-05, -2.3303553462028503e-05, -2.2250227630138397e-05, -2.119690179824829e-05, -2.0143575966358185e-05, -1.909025013446808e-05, -1.8036924302577972e-05, -1.6983598470687866e-05, -1.593027263879776e-05, -1.4876946806907654e-05, -1.3823620975017548e-05, -1.2770295143127441e-05, -1.1716969311237335e-05, -1.0663643479347229e-05, -9.610317647457123e-06, -8.556991815567017e-06, -7.50366598367691e-06, -6.450340151786804e-06, -5.397014319896698e-06, -4.343688488006592e-06, -3.2903626561164856e-06, -2.2370368242263794e-06, -1.1837109923362732e-06, -1.30385160446167e-07, 9.229406714439392e-07, 1.9762665033340454e-06, 3.0295923352241516e-06, 4.082918167114258e-06, 5.136243999004364e-06, 6.18956983089447e-06, 7.242895662784576e-06, 8.296221494674683e-06, 9.349547326564789e-06, 1.0402873158454895e-05, 1.1456198990345001e-05, 1.2509524822235107e-05, 1.3562850654125214e-05, 1.461617648601532e-05, 1.5669502317905426e-05, 1.6722828149795532e-05, 1.777615398168564e-05, 1.8829479813575745e-05, 1.988280564546585e-05, 2.0936131477355957e-05, 2.1989457309246063e-05, 2.304278314113617e-05, 2.4096108973026276e-05, 2.5149434804916382e-05, 2.6202760636806488e-05, 2.7256086468696594e-05, 2.83094123005867e-05, 2.9362738132476807e-05, 3.0416063964366913e-05, 3.146938979625702e-05, 3.2522715628147125e-05, 3.357604146003723e-05, 3.462936729192734e-05, 3.5682693123817444e-05, 3.673601895570755e-05, 3.7789344787597656e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 13.0, 14.0, 25.0, 30.0, 44.0, 79.0, 89.0, 139.0, 246.0, 124.0, 66.0, 44.0, 28.0, 21.0, 19.0, 5.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.845655775578052e-07, -6.534622798426426e-07, -6.223590389708988e-07, -5.912557412557362e-07, -5.601524435405736e-07, -5.29049145825411e-07, -4.979458481102483e-07, -4.6684260723850457e-07, -4.3573930952334194e-07, -4.046360118081793e-07, -3.735327425147261e-07, -3.4242947322127293e-07, -3.113261755061103e-07, -2.802228777909477e-07, -2.491196084974945e-07, -2.1801632499318657e-07, -1.8691304148887866e-07, -1.5580975798457075e-07, -1.2470647448026284e-07, -9.360319097595493e-08, -6.249990747164702e-08, -3.139662396733911e-08, -2.9334046303119976e-10, 3.080994304127671e-08, 6.191322654558462e-08, 9.301651004989253e-08, 1.2411979355420044e-07, 1.5522307705850835e-07, 1.8632636056281626e-07, 2.1742964406712417e-07, 2.485329275714321e-07, 2.796361968648853e-07, 3.1073955142346676e-07, 3.418428491386294e-07, 3.729461184320826e-07, 4.040493877255358e-07, 4.351526854406984e-07, 4.6625598315586103e-07, 4.973592240276048e-07, 5.284625217427674e-07, 5.5956581945793e-07, 5.906691171730927e-07, 6.217724148882553e-07, 6.528756557599991e-07, 6.839789534751617e-07, 7.150822511903243e-07, 7.461854920620681e-07, 7.772887897772307e-07, 8.083920874923933e-07, 8.39495385207556e-07, 8.705986829227186e-07, 9.017019237944623e-07, 9.32805221509625e-07, 9.639085192247876e-07, 9.950117600965314e-07, 1.0261151146551128e-06, 1.0572183555268566e-06, 1.0883215963986004e-06, 1.1194249509571819e-06, 1.1505281918289256e-06, 1.1816314327006694e-06, 1.2127347872592509e-06, 1.2438380281309946e-06, 1.2749413826895761e-06, 1.30604462356132e-06]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 43.0, 0.0, 0.0, 86.0, 0.0, 0.0, 0.0, 201.0, 0.0, 0.0, 256.0, 0.0, 0.0, 0.0, 188.0, 0.0, 0.0, 107.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 11.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.783513188362122e-07, -5.606561899185181e-07, -5.42961061000824e-07, -5.252659320831299e-07, -5.075708031654358e-07, -4.898756742477417e-07, -4.721805453300476e-07, -4.544854164123535e-07, -4.367902874946594e-07, -4.1909515857696533e-07, -4.0140002965927124e-07, -3.8370490074157715e-07, -3.6600977182388306e-07, -3.4831464290618896e-07, -3.3061951398849487e-07, -3.129243850708008e-07, -2.952292561531067e-07, -2.775341272354126e-07, -2.598389983177185e-07, -2.421438694000244e-07, -2.2444874048233032e-07, -2.0675361156463623e-07, -1.8905848264694214e-07, -1.7136335372924805e-07, -1.5366822481155396e-07, -1.3597309589385986e-07, -1.1827796697616577e-07, -1.0058283805847168e-07, -8.288770914077759e-08, -6.51925802230835e-08, -4.7497451305389404e-08, -2.9802322387695312e-08, -1.210719347000122e-08, 5.587935447692871e-09, 2.3283064365386963e-08, 4.0978193283081055e-08, 5.8673322200775146e-08, 7.636845111846924e-08, 9.406358003616333e-08, 1.1175870895385742e-07, 1.2945383787155151e-07, 1.471489667892456e-07, 1.648440957069397e-07, 1.825392246246338e-07, 2.0023435354232788e-07, 2.1792948246002197e-07, 2.3562461137771606e-07, 2.5331974029541016e-07, 2.7101486921310425e-07, 2.8870999813079834e-07, 3.0640512704849243e-07, 3.241002559661865e-07, 3.417953848838806e-07, 3.594905138015747e-07, 3.771856427192688e-07, 3.948807716369629e-07, 4.12575900554657e-07, 4.302710294723511e-07, 4.4796615839004517e-07, 4.6566128730773926e-07, 4.833564162254333e-07, 5.010515451431274e-07, 5.187466740608215e-07, 5.364418029785156e-07]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 5.0, 5.0, 4.0, 6.0, 4.0, 15.0, 13.0, 9.0, 13.0, 21.0, 19.0, 21.0, 22.0, 28.0, 28.0, 29.0, 40.0, 41.0, 39.0, 34.0, 38.0, 36.0, 40.0, 52.0, 49.0, 30.0, 34.0, 41.0, 23.0, 43.0, 24.0, 27.0, 27.0, 20.0, 21.0, 21.0, 7.0, 15.0, 11.0, 11.0, 11.0, 4.0, 5.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.009765625, -2.917327880859375, -2.82489013671875, -2.732452392578125, -2.6400146484375, -2.547576904296875, -2.45513916015625, -2.362701416015625, -2.270263671875, -2.177825927734375, -2.08538818359375, -1.992950439453125, -1.9005126953125, -1.808074951171875, -1.71563720703125, -1.623199462890625, -1.53076171875, -1.438323974609375, -1.34588623046875, -1.253448486328125, -1.1610107421875, -1.068572998046875, -0.97613525390625, -0.883697509765625, -0.791259765625, -0.698822021484375, -0.60638427734375, -0.513946533203125, -0.4215087890625, -0.329071044921875, -0.23663330078125, -0.144195556640625, -0.0517578125, 0.040679931640625, 0.13311767578125, 0.225555419921875, 0.3179931640625, 0.410430908203125, 0.50286865234375, 0.595306396484375, 0.687744140625, 0.780181884765625, 0.87261962890625, 0.965057373046875, 1.0574951171875, 1.149932861328125, 1.24237060546875, 1.334808349609375, 1.42724609375, 1.519683837890625, 1.61212158203125, 1.704559326171875, 1.7969970703125, 1.889434814453125, 1.98187255859375, 2.074310302734375, 2.166748046875, 2.259185791015625, 2.35162353515625, 2.444061279296875, 2.5364990234375, 2.628936767578125, 2.72137451171875, 2.813812255859375, 2.90625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 8.0, 15.0, 25.0, 41.0, 59.0, 78.0, 126.0, 204.0, 340.0, 516.0, 828.0, 1292.0, 2141.0, 3601.0, 5906.0, 9613.0, 17116.0, 31220.0, 59654.0, 118967.0, 242658.0, 271054.0, 134600.0, 67641.0, 34968.0, 18884.0, 10583.0, 6364.0, 3883.0, 2289.0, 1416.0, 947.0, 576.0, 353.0, 207.0, 142.0, 70.0, 58.0, 43.0, 25.0, 15.0, 9.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.66796875, -3.56036376953125, -3.4527587890625, -3.34515380859375, -3.237548828125, -3.12994384765625, -3.0223388671875, -2.91473388671875, -2.80712890625, -2.69952392578125, -2.5919189453125, -2.48431396484375, -2.376708984375, -2.26910400390625, -2.1614990234375, -2.05389404296875, -1.9462890625, -1.83868408203125, -1.7310791015625, -1.62347412109375, -1.515869140625, -1.40826416015625, -1.3006591796875, -1.19305419921875, -1.08544921875, -0.97784423828125, -0.8702392578125, -0.76263427734375, -0.655029296875, -0.54742431640625, -0.4398193359375, -0.33221435546875, -0.224609375, -0.11700439453125, -0.0093994140625, 0.09820556640625, 0.205810546875, 0.31341552734375, 0.4210205078125, 0.52862548828125, 0.63623046875, 0.74383544921875, 0.8514404296875, 0.95904541015625, 1.066650390625, 1.17425537109375, 1.2818603515625, 1.38946533203125, 1.4970703125, 1.60467529296875, 1.7122802734375, 1.81988525390625, 1.927490234375, 2.03509521484375, 2.1427001953125, 2.25030517578125, 2.35791015625, 2.46551513671875, 2.5731201171875, 2.68072509765625, 2.788330078125, 2.89593505859375, 3.0035400390625, 3.11114501953125, 3.21875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 7.0, 9.0, 9.0, 11.0, 20.0, 28.0, 16.0, 18.0, 26.0, 33.0, 35.0, 37.0, 33.0, 57.0, 64.0, 100.0, 102.0, 247.0, 1459.0, 236.0, 94.0, 69.0, 42.0, 62.0, 34.0, 30.0, 33.0, 28.0, 26.0, 16.0, 12.0, 8.0, 5.0, 5.0, 8.0, 10.0, 6.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.3515625, -10.031982421875, -9.71240234375, -9.392822265625, -9.0732421875, -8.753662109375, -8.43408203125, -8.114501953125, -7.794921875, -7.475341796875, -7.15576171875, -6.836181640625, -6.5166015625, -6.197021484375, -5.87744140625, -5.557861328125, -5.23828125, -4.918701171875, -4.59912109375, -4.279541015625, -3.9599609375, -3.640380859375, -3.32080078125, -3.001220703125, -2.681640625, -2.362060546875, -2.04248046875, -1.722900390625, -1.4033203125, -1.083740234375, -0.76416015625, -0.444580078125, -0.125, 0.194580078125, 0.51416015625, 0.833740234375, 1.1533203125, 1.472900390625, 1.79248046875, 2.112060546875, 2.431640625, 2.751220703125, 3.07080078125, 3.390380859375, 3.7099609375, 4.029541015625, 4.34912109375, 4.668701171875, 4.98828125, 5.307861328125, 5.62744140625, 5.947021484375, 6.2666015625, 6.586181640625, 6.90576171875, 7.225341796875, 7.544921875, 7.864501953125, 8.18408203125, 8.503662109375, 8.8232421875, 9.142822265625, 9.46240234375, 9.781982421875, 10.1015625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 12.0, 15.0, 16.0, 11.0, 23.0, 33.0, 55.0, 48.0, 78.0, 92.0, 151.0, 180.0, 339.0, 567.0, 1580.0, 9590.0, 176585.0, 2814374.0, 130781.0, 7943.0, 1446.0, 575.0, 336.0, 207.0, 149.0, 107.0, 80.0, 70.0, 52.0, 44.0, 25.0, 28.0, 23.0, 19.0, 10.0, 10.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-18.171875, -17.612060546875, -17.05224609375, -16.492431640625, -15.9326171875, -15.372802734375, -14.81298828125, -14.253173828125, -13.693359375, -13.133544921875, -12.57373046875, -12.013916015625, -11.4541015625, -10.894287109375, -10.33447265625, -9.774658203125, -9.21484375, -8.655029296875, -8.09521484375, -7.535400390625, -6.9755859375, -6.415771484375, -5.85595703125, -5.296142578125, -4.736328125, -4.176513671875, -3.61669921875, -3.056884765625, -2.4970703125, -1.937255859375, -1.37744140625, -0.817626953125, -0.2578125, 0.302001953125, 0.86181640625, 1.421630859375, 1.9814453125, 2.541259765625, 3.10107421875, 3.660888671875, 4.220703125, 4.780517578125, 5.34033203125, 5.900146484375, 6.4599609375, 7.019775390625, 7.57958984375, 8.139404296875, 8.69921875, 9.259033203125, 9.81884765625, 10.378662109375, 10.9384765625, 11.498291015625, 12.05810546875, 12.617919921875, 13.177734375, 13.737548828125, 14.29736328125, 14.857177734375, 15.4169921875, 15.976806640625, 16.53662109375, 17.096435546875, 17.65625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 26.0, 135.0, 303.0, 347.0, 159.0, 40.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.669567108154297, -15.727313995361328, -13.78506088256836, -11.84280776977539, -9.900554656982422, -7.958301544189453, -6.016048431396484, -4.073795318603516, -2.131542205810547, -0.18928909301757812, 1.7529640197753906, 3.6952171325683594, 5.637470245361328, 7.579723358154297, 9.521976470947266, 11.464229583740234, 13.406482696533203, 15.348735809326172, 17.29098892211914, 19.23324203491211, 21.175495147705078, 23.117748260498047, 25.060001373291016, 27.002254486083984, 28.944507598876953, 30.886760711669922, 32.82901382446289, 34.77126693725586, 36.71352005004883, 38.6557731628418, 40.598026275634766, 42.540279388427734, 44.48252868652344, 46.424781799316406, 48.367034912109375, 50.309288024902344, 52.25154113769531, 54.19379425048828, 56.13604736328125, 58.07830047607422, 60.02055358886719, 61.962806701660156, 63.905059814453125, 65.8473129272461, 67.78956604003906, 69.73181915283203, 71.674072265625, 73.61632537841797, 75.55857849121094, 77.5008316040039, 79.44308471679688, 81.38533782958984, 83.32759094238281, 85.26984405517578, 87.21209716796875, 89.15435028076172, 91.09660339355469, 93.03885650634766, 94.98110961914062, 96.9233627319336, 98.86561584472656, 100.80786895751953, 102.7501220703125, 104.69237518310547, 106.63462829589844]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 8.0, 3.0, 9.0, 11.0, 4.0, 10.0, 7.0, 12.0, 7.0, 19.0, 17.0, 19.0, 26.0, 18.0, 23.0, 19.0, 32.0, 32.0, 34.0, 32.0, 34.0, 28.0, 42.0, 31.0, 43.0, 33.0, 47.0, 37.0, 34.0, 41.0, 37.0, 28.0, 23.0, 27.0, 26.0, 21.0, 21.0, 20.0, 12.0, 8.0, 10.0, 9.0, 11.0, 8.0, 5.0, 8.0, 3.0, 7.0, 2.0, 1.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-23.31140899658203, -22.597003936767578, -21.882598876953125, -21.168193817138672, -20.45378875732422, -19.7393856048584, -19.024980545043945, -18.310575485229492, -17.59617042541504, -16.881765365600586, -16.167360305786133, -15.452956199645996, -14.738551139831543, -14.02414608001709, -13.309741973876953, -12.5953369140625, -11.880931854248047, -11.166526794433594, -10.45212173461914, -9.737717628479004, -9.02331256866455, -8.308907508850098, -7.594502925872803, -6.880098342895508, -6.165693283081055, -5.451288223266602, -4.736883640289307, -4.022479057312012, -3.3080739974975586, -2.5936691761016846, -1.8792643547058105, -1.1648597717285156, -0.4504566192626953, 0.2639482021331787, 0.9783530235290527, 1.6927578449249268, 2.407162666320801, 3.121567487716675, 3.835972309112549, 4.550376892089844, 5.264781951904297, 5.97918701171875, 6.693591594696045, 7.40799617767334, 8.122401237487793, 8.836806297302246, 9.551210403442383, 10.265615463256836, 10.980020523071289, 11.694425582885742, 12.408830642700195, 13.123234748840332, 13.837639808654785, 14.552044868469238, 15.266448974609375, 15.980854034423828, 16.69525909423828, 17.409664154052734, 18.124069213867188, 18.83847427368164, 19.552879333496094, 20.267282485961914, 20.981687545776367, 21.69609260559082, 22.410497665405273]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 2.0, 11.0, 10.0, 23.0, 15.0, 9.0, 19.0, 14.0, 25.0, 25.0, 28.0, 33.0, 30.0, 44.0, 28.0, 32.0, 42.0, 40.0, 40.0, 44.0, 39.0, 50.0, 45.0, 26.0, 33.0, 26.0, 31.0, 37.0, 28.0, 16.0, 25.0, 21.0, 17.0, 18.0, 7.0, 9.0, 9.0, 12.0, 6.0, 6.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.263671875, -3.16558837890625, -3.0675048828125, -2.96942138671875, -2.871337890625, -2.77325439453125, -2.6751708984375, -2.57708740234375, -2.47900390625, -2.38092041015625, -2.2828369140625, -2.18475341796875, -2.086669921875, -1.98858642578125, -1.8905029296875, -1.79241943359375, -1.6943359375, -1.59625244140625, -1.4981689453125, -1.40008544921875, -1.302001953125, -1.20391845703125, -1.1058349609375, -1.00775146484375, -0.90966796875, -0.81158447265625, -0.7135009765625, -0.61541748046875, -0.517333984375, -0.41925048828125, -0.3211669921875, -0.22308349609375, -0.125, -0.02691650390625, 0.0711669921875, 0.16925048828125, 0.267333984375, 0.36541748046875, 0.4635009765625, 0.56158447265625, 0.65966796875, 0.75775146484375, 0.8558349609375, 0.95391845703125, 1.052001953125, 1.15008544921875, 1.2481689453125, 1.34625244140625, 1.4443359375, 1.54241943359375, 1.6405029296875, 1.73858642578125, 1.836669921875, 1.93475341796875, 2.0328369140625, 2.13092041015625, 2.22900390625, 2.32708740234375, 2.4251708984375, 2.52325439453125, 2.621337890625, 2.71942138671875, 2.8175048828125, 2.91558837890625, 3.013671875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 1.0, 4.0, 4.0, 5.0, 6.0, 10.0, 15.0, 11.0, 18.0, 15.0, 21.0, 28.0, 32.0, 35.0, 69.0, 93.0, 219.0, 444.0, 1266.0, 4296.0, 17284.0, 75232.0, 357340.0, 1558397.0, 1678654.0, 392805.0, 81916.0, 18776.0, 4755.0, 1464.0, 469.0, 206.0, 121.0, 64.0, 31.0, 30.0, 27.0, 22.0, 16.0, 16.0, 12.0, 11.0, 9.0, 6.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.05859375, -5.86944580078125, -5.6802978515625, -5.49114990234375, -5.302001953125, -5.11285400390625, -4.9237060546875, -4.73455810546875, -4.54541015625, -4.35626220703125, -4.1671142578125, -3.97796630859375, -3.788818359375, -3.59967041015625, -3.4105224609375, -3.22137451171875, -3.0322265625, -2.84307861328125, -2.6539306640625, -2.46478271484375, -2.275634765625, -2.08648681640625, -1.8973388671875, -1.70819091796875, -1.51904296875, -1.32989501953125, -1.1407470703125, -0.95159912109375, -0.762451171875, -0.57330322265625, -0.3841552734375, -0.19500732421875, -0.005859375, 0.18328857421875, 0.3724365234375, 0.56158447265625, 0.750732421875, 0.93988037109375, 1.1290283203125, 1.31817626953125, 1.50732421875, 1.69647216796875, 1.8856201171875, 2.07476806640625, 2.263916015625, 2.45306396484375, 2.6422119140625, 2.83135986328125, 3.0205078125, 3.20965576171875, 3.3988037109375, 3.58795166015625, 3.777099609375, 3.96624755859375, 4.1553955078125, 4.34454345703125, 4.53369140625, 4.72283935546875, 4.9119873046875, 5.10113525390625, 5.290283203125, 5.47943115234375, 5.6685791015625, 5.85772705078125, 6.046875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 8.0, 3.0, 5.0, 8.0, 11.0, 16.0, 17.0, 35.0, 38.0, 52.0, 95.0, 94.0, 136.0, 162.0, 228.0, 309.0, 366.0, 435.0, 433.0, 353.0, 307.0, 222.0, 180.0, 134.0, 106.0, 83.0, 60.0, 51.0, 34.0, 18.0, 16.0, 14.0, 7.0, 9.0, 9.0, 10.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.256591796875, -5.08740234375, -4.918212890625, -4.7490234375, -4.579833984375, -4.41064453125, -4.241455078125, -4.072265625, -3.903076171875, -3.73388671875, -3.564697265625, -3.3955078125, -3.226318359375, -3.05712890625, -2.887939453125, -2.71875, -2.549560546875, -2.38037109375, -2.211181640625, -2.0419921875, -1.872802734375, -1.70361328125, -1.534423828125, -1.365234375, -1.196044921875, -1.02685546875, -0.857666015625, -0.6884765625, -0.519287109375, -0.35009765625, -0.180908203125, -0.01171875, 0.157470703125, 0.32666015625, 0.495849609375, 0.6650390625, 0.834228515625, 1.00341796875, 1.172607421875, 1.341796875, 1.510986328125, 1.68017578125, 1.849365234375, 2.0185546875, 2.187744140625, 2.35693359375, 2.526123046875, 2.6953125, 2.864501953125, 3.03369140625, 3.202880859375, 3.3720703125, 3.541259765625, 3.71044921875, 3.879638671875, 4.048828125, 4.218017578125, 4.38720703125, 4.556396484375, 4.7255859375, 4.894775390625, 5.06396484375, 5.233154296875, 5.40234375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 1.0, 11.0, 6.0, 10.0, 9.0, 14.0, 18.0, 18.0, 34.0, 46.0, 63.0, 98.0, 107.0, 149.0, 223.0, 379.0, 990.0, 27900.0, 3748230.0, 411894.0, 2638.0, 512.0, 277.0, 176.0, 117.0, 107.0, 78.0, 47.0, 30.0, 28.0, 19.0, 15.0, 10.0, 5.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.515625, -27.556396484375, -26.59716796875, -25.637939453125, -24.6787109375, -23.719482421875, -22.76025390625, -21.801025390625, -20.841796875, -19.882568359375, -18.92333984375, -17.964111328125, -17.0048828125, -16.045654296875, -15.08642578125, -14.127197265625, -13.16796875, -12.208740234375, -11.24951171875, -10.290283203125, -9.3310546875, -8.371826171875, -7.41259765625, -6.453369140625, -5.494140625, -4.534912109375, -3.57568359375, -2.616455078125, -1.6572265625, -0.697998046875, 0.26123046875, 1.220458984375, 2.1796875, 3.138916015625, 4.09814453125, 5.057373046875, 6.0166015625, 6.975830078125, 7.93505859375, 8.894287109375, 9.853515625, 10.812744140625, 11.77197265625, 12.731201171875, 13.6904296875, 14.649658203125, 15.60888671875, 16.568115234375, 17.52734375, 18.486572265625, 19.44580078125, 20.405029296875, 21.3642578125, 22.323486328125, 23.28271484375, 24.241943359375, 25.201171875, 26.160400390625, 27.11962890625, 28.078857421875, 29.0380859375, 29.997314453125, 30.95654296875, 31.915771484375, 32.875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 10.0, 29.0, 26.0, 50.0, 65.0, 98.0, 135.0, 123.0, 111.0, 104.0, 90.0, 59.0, 42.0, 28.0, 19.0, 9.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.44246482849121, -15.464035034179688, -14.485605239868164, -13.50717544555664, -12.528745651245117, -11.550315856933594, -10.571885108947754, -9.59345531463623, -8.615025520324707, -7.636595726013184, -6.65816593170166, -5.6797356605529785, -4.701305866241455, -3.7228760719299316, -2.74444580078125, -1.7660160064697266, -0.7875862121582031, 0.19084370136260986, 1.1692736148834229, 2.1477036476135254, 3.126133441925049, 4.104563236236572, 5.082993507385254, 6.061423301696777, 7.039853096008301, 8.018282890319824, 8.996712684631348, 9.975143432617188, 10.953573226928711, 11.932003021240234, 12.910432815551758, 13.888862609863281, 14.867294311523438, 15.845724105834961, 16.824153900146484, 17.802583694458008, 18.78101348876953, 19.759443283081055, 20.737873077392578, 21.716304779052734, 22.694732666015625, 23.67316246032715, 24.651592254638672, 25.630022048950195, 26.60845184326172, 27.586881637573242, 28.565311431884766, 29.543743133544922, 30.522172927856445, 31.50060272216797, 32.479034423828125, 33.457462310791016, 34.43589401245117, 35.41432189941406, 36.39275360107422, 37.37118148803711, 38.349613189697266, 39.32804489135742, 40.30647277832031, 41.28490447998047, 42.26333236694336, 43.241764068603516, 44.220191955566406, 45.19862365722656, 46.17705154418945]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 7.0, 7.0, 9.0, 16.0, 7.0, 8.0, 11.0, 17.0, 21.0, 25.0, 28.0, 36.0, 41.0, 39.0, 37.0, 51.0, 36.0, 43.0, 46.0, 40.0, 33.0, 34.0, 37.0, 43.0, 39.0, 41.0, 35.0, 29.0, 27.0, 29.0, 16.0, 19.0, 8.0, 17.0, 14.0, 15.0, 5.0, 9.0, 5.0, 3.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.608158111572266, -17.004281997680664, -16.400405883789062, -15.796528816223145, -15.192652702331543, -14.588775634765625, -13.984899520874023, -13.381023406982422, -12.77714729309082, -12.173271179199219, -11.5693941116333, -10.9655179977417, -10.361641883850098, -9.75776481628418, -9.153888702392578, -8.550012588500977, -7.946135520935059, -7.342258930206299, -6.738382816314697, -6.1345062255859375, -5.530630111694336, -4.926753520965576, -4.322876930236816, -3.719000816345215, -3.115124225616455, -2.5112478733062744, -1.9073714017868042, -1.303494930267334, -0.6996185779571533, -0.09574222564697266, 0.5081343650817871, 1.1120104789733887, 1.7158870697021484, 2.319763422012329, 2.9236397743225098, 3.5275163650512695, 4.131392478942871, 4.735269069671631, 5.339145660400391, 5.943021774291992, 6.546898365020752, 7.150774955749512, 7.754651069641113, 8.358528137207031, 8.962404251098633, 9.566280364990234, 10.170156478881836, 10.774032592773438, 11.377909660339355, 11.981785774230957, 12.585662841796875, 13.189538955688477, 13.793415069580078, 14.39729118347168, 15.001168251037598, 15.6050443649292, 16.208921432495117, 16.81279754638672, 17.41667366027832, 18.020549774169922, 18.624427795410156, 19.228303909301758, 19.83218002319336, 20.43605613708496, 21.039932250976562]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 12.0, 9.0, 6.0, 6.0, 14.0, 11.0, 17.0, 19.0, 22.0, 21.0, 29.0, 33.0, 37.0, 29.0, 46.0, 41.0, 36.0, 44.0, 41.0, 41.0, 44.0, 44.0, 36.0, 51.0, 46.0, 33.0, 28.0, 26.0, 29.0, 20.0, 27.0, 19.0, 16.0, 12.0, 12.0, 6.0, 13.0, 6.0, 2.0, 5.0, 3.0, 5.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.423828125, -3.318603515625, -3.21337890625, -3.108154296875, -3.0029296875, -2.897705078125, -2.79248046875, -2.687255859375, -2.58203125, -2.476806640625, -2.37158203125, -2.266357421875, -2.1611328125, -2.055908203125, -1.95068359375, -1.845458984375, -1.740234375, -1.635009765625, -1.52978515625, -1.424560546875, -1.3193359375, -1.214111328125, -1.10888671875, -1.003662109375, -0.8984375, -0.793212890625, -0.68798828125, -0.582763671875, -0.4775390625, -0.372314453125, -0.26708984375, -0.161865234375, -0.056640625, 0.048583984375, 0.15380859375, 0.259033203125, 0.3642578125, 0.469482421875, 0.57470703125, 0.679931640625, 0.78515625, 0.890380859375, 0.99560546875, 1.100830078125, 1.2060546875, 1.311279296875, 1.41650390625, 1.521728515625, 1.626953125, 1.732177734375, 1.83740234375, 1.942626953125, 2.0478515625, 2.153076171875, 2.25830078125, 2.363525390625, 2.46875, 2.573974609375, 2.67919921875, 2.784423828125, 2.8896484375, 2.994873046875, 3.10009765625, 3.205322265625, 3.310546875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 11.0, 13.0, 17.0, 34.0, 57.0, 80.0, 146.0, 217.0, 297.0, 492.0, 797.0, 1174.0, 1895.0, 3025.0, 4953.0, 8079.0, 13380.0, 23175.0, 41180.0, 77318.0, 162425.0, 390521.0, 151478.0, 72925.0, 39234.0, 22178.0, 13057.0, 7747.0, 4714.0, 2881.0, 1865.0, 1123.0, 702.0, 491.0, 323.0, 192.0, 128.0, 78.0, 55.0, 36.0, 30.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1668701171875, -0.16156578063964844, -0.15626144409179688, -0.1509571075439453, -0.14565277099609375, -0.1403484344482422, -0.13504409790039062, -0.12973976135253906, -0.1244354248046875, -0.11913108825683594, -0.11382675170898438, -0.10852241516113281, -0.10321807861328125, -0.09791374206542969, -0.09260940551757812, -0.08730506896972656, -0.082000732421875, -0.07669639587402344, -0.07139205932617188, -0.06608772277832031, -0.06078338623046875, -0.05547904968261719, -0.050174713134765625, -0.04487037658691406, -0.0395660400390625, -0.03426170349121094, -0.028957366943359375, -0.023653030395507812, -0.01834869384765625, -0.013044357299804688, -0.007740020751953125, -0.0024356842041015625, 0.00286865234375, 0.008172988891601562, 0.013477325439453125, 0.018781661987304688, 0.02408599853515625, 0.029390335083007812, 0.034694671630859375, 0.03999900817871094, 0.0453033447265625, 0.05060768127441406, 0.055912017822265625, 0.06121635437011719, 0.06652069091796875, 0.07182502746582031, 0.07712936401367188, 0.08243370056152344, 0.087738037109375, 0.09304237365722656, 0.09834671020507812, 0.10365104675292969, 0.10895538330078125, 0.11425971984863281, 0.11956405639648438, 0.12486839294433594, 0.1301727294921875, 0.13547706604003906, 0.14078140258789062, 0.1460857391357422, 0.15139007568359375, 0.1566944122314453, 0.16199874877929688, 0.16730308532714844, 0.172607421875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 10.0, 5.0, 14.0, 16.0, 20.0, 16.0, 16.0, 24.0, 26.0, 41.0, 24.0, 35.0, 25.0, 39.0, 43.0, 32.0, 35.0, 38.0, 1071.0, 58.0, 39.0, 30.0, 37.0, 35.0, 39.0, 33.0, 30.0, 21.0, 27.0, 21.0, 15.0, 24.0, 17.0, 13.0, 15.0, 11.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.321868896484375, -2.24530029296875, -2.168731689453125, -2.0921630859375, -2.015594482421875, -1.93902587890625, -1.862457275390625, -1.785888671875, -1.709320068359375, -1.63275146484375, -1.556182861328125, -1.4796142578125, -1.403045654296875, -1.32647705078125, -1.249908447265625, -1.17333984375, -1.096771240234375, -1.02020263671875, -0.943634033203125, -0.8670654296875, -0.790496826171875, -0.71392822265625, -0.637359619140625, -0.560791015625, -0.484222412109375, -0.40765380859375, -0.331085205078125, -0.2545166015625, -0.177947998046875, -0.10137939453125, -0.024810791015625, 0.0517578125, 0.128326416015625, 0.20489501953125, 0.281463623046875, 0.3580322265625, 0.434600830078125, 0.51116943359375, 0.587738037109375, 0.664306640625, 0.740875244140625, 0.81744384765625, 0.894012451171875, 0.9705810546875, 1.047149658203125, 1.12371826171875, 1.200286865234375, 1.27685546875, 1.353424072265625, 1.42999267578125, 1.506561279296875, 1.5831298828125, 1.659698486328125, 1.73626708984375, 1.812835693359375, 1.889404296875, 1.965972900390625, 2.04254150390625, 2.119110107421875, 2.1956787109375, 2.272247314453125, 2.34881591796875, 2.425384521484375, 2.501953125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 15.0, 11.0, 21.0, 29.0, 43.0, 82.0, 96.0, 162.0, 214.0, 316.0, 505.0, 757.0, 1124.0, 1721.0, 2512.0, 3885.0, 5842.0, 8522.0, 12767.0, 18938.0, 28907.0, 45055.0, 73164.0, 129309.0, 1355284.0, 166100.0, 88485.0, 53353.0, 33271.0, 22203.0, 14596.0, 9932.0, 6622.0, 4352.0, 2973.0, 1974.0, 1351.0, 935.0, 569.0, 395.0, 240.0, 165.0, 109.0, 80.0, 47.0, 35.0, 15.0, 22.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0721435546875, -0.06993579864501953, -0.06772804260253906, -0.0655202865600586, -0.06331253051757812, -0.061104774475097656, -0.05889701843261719, -0.05668926239013672, -0.05448150634765625, -0.05227375030517578, -0.05006599426269531, -0.047858238220214844, -0.045650482177734375, -0.043442726135253906, -0.04123497009277344, -0.03902721405029297, -0.0368194580078125, -0.03461170196533203, -0.03240394592285156, -0.030196189880371094, -0.027988433837890625, -0.025780677795410156, -0.023572921752929688, -0.02136516571044922, -0.01915740966796875, -0.01694965362548828, -0.014741897583007812, -0.012534141540527344, -0.010326385498046875, -0.008118629455566406, -0.0059108734130859375, -0.0037031173706054688, -0.001495361328125, 0.0007123947143554688, 0.0029201507568359375, 0.005127906799316406, 0.007335662841796875, 0.009543418884277344, 0.011751174926757812, 0.013958930969238281, 0.01616668701171875, 0.01837444305419922, 0.020582199096679688, 0.022789955139160156, 0.024997711181640625, 0.027205467224121094, 0.029413223266601562, 0.03162097930908203, 0.0338287353515625, 0.03603649139404297, 0.03824424743652344, 0.040452003479003906, 0.042659759521484375, 0.044867515563964844, 0.04707527160644531, 0.04928302764892578, 0.05149078369140625, 0.05369853973388672, 0.05590629577636719, 0.058114051818847656, 0.060321807861328125, 0.0625295639038086, 0.06473731994628906, 0.06694507598876953, 0.06915283203125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 4.0, 4.0, 9.0, 13.0, 14.0, 19.0, 19.0, 20.0, 19.0, 42.0, 38.0, 54.0, 104.0, 288.0, 0.0, 97.0, 61.0, 42.0, 26.0, 12.0, 19.0, 20.0, 14.0, 11.0, 8.0, 12.0, 10.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7881393432617188e-06, -1.730397343635559e-06, -1.6726553440093994e-06, -1.6149133443832397e-06, -1.55717134475708e-06, -1.4994293451309204e-06, -1.4416873455047607e-06, -1.383945345878601e-06, -1.3262033462524414e-06, -1.2684613466262817e-06, -1.210719347000122e-06, -1.1529773473739624e-06, -1.0952353477478027e-06, -1.037493348121643e-06, -9.797513484954834e-07, -9.220093488693237e-07, -8.642673492431641e-07, -8.065253496170044e-07, -7.487833499908447e-07, -6.910413503646851e-07, -6.332993507385254e-07, -5.755573511123657e-07, -5.178153514862061e-07, -4.600733518600464e-07, -4.023313522338867e-07, -3.4458935260772705e-07, -2.868473529815674e-07, -2.2910535335540771e-07, -1.7136335372924805e-07, -1.1362135410308838e-07, -5.587935447692871e-08, 1.862645149230957e-09, 5.960464477539063e-08, 1.1734664440155029e-07, 1.7508864402770996e-07, 2.3283064365386963e-07, 2.905726432800293e-07, 3.4831464290618896e-07, 4.0605664253234863e-07, 4.637986421585083e-07, 5.21540641784668e-07, 5.792826414108276e-07, 6.370246410369873e-07, 6.94766640663147e-07, 7.525086402893066e-07, 8.102506399154663e-07, 8.67992639541626e-07, 9.257346391677856e-07, 9.834766387939453e-07, 1.041218638420105e-06, 1.0989606380462646e-06, 1.1567026376724243e-06, 1.214444637298584e-06, 1.2721866369247437e-06, 1.3299286365509033e-06, 1.387670636177063e-06, 1.4454126358032227e-06, 1.5031546354293823e-06, 1.560896635055542e-06, 1.6186386346817017e-06, 1.6763806343078613e-06, 1.734122633934021e-06, 1.7918646335601807e-06, 1.8496066331863403e-06, 1.9073486328125e-06]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 11.0, 11.0, 7.0, 12.0, 25.0, 25.0, 26.0, 42.0, 107.0, 198.0, 915.0, 95491.0, 946601.0, 4428.0, 283.0, 128.0, 66.0, 38.0, 27.0, 26.0, 20.0, 13.0, 13.0, 11.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.309415817260742e-05, -4.1795894503593445e-05, -4.049763083457947e-05, -3.919936716556549e-05, -3.7901103496551514e-05, -3.660283982753754e-05, -3.530457615852356e-05, -3.400631248950958e-05, -3.2708048820495605e-05, -3.140978515148163e-05, -3.011152148246765e-05, -2.8813257813453674e-05, -2.7514994144439697e-05, -2.621673047542572e-05, -2.4918466806411743e-05, -2.3620203137397766e-05, -2.232193946838379e-05, -2.1023675799369812e-05, -1.9725412130355835e-05, -1.8427148461341858e-05, -1.712888479232788e-05, -1.5830621123313904e-05, -1.4532357454299927e-05, -1.323409378528595e-05, -1.1935830116271973e-05, -1.0637566447257996e-05, -9.339302778244019e-06, -8.041039109230042e-06, -6.7427754402160645e-06, -5.444511771202087e-06, -4.14624810218811e-06, -2.8479844331741333e-06, -1.5497207641601562e-06, -2.514570951461792e-07, 1.0468065738677979e-06, 2.345070242881775e-06, 3.643333911895752e-06, 4.941597580909729e-06, 6.239861249923706e-06, 7.538124918937683e-06, 8.83638858795166e-06, 1.0134652256965637e-05, 1.1432915925979614e-05, 1.2731179594993591e-05, 1.4029443264007568e-05, 1.5327706933021545e-05, 1.6625970602035522e-05, 1.79242342710495e-05, 1.9222497940063477e-05, 2.0520761609077454e-05, 2.181902527809143e-05, 2.3117288947105408e-05, 2.4415552616119385e-05, 2.5713816285133362e-05, 2.701207995414734e-05, 2.8310343623161316e-05, 2.9608607292175293e-05, 3.090687096118927e-05, 3.220513463020325e-05, 3.3503398299217224e-05, 3.48016619682312e-05, 3.609992563724518e-05, 3.7398189306259155e-05, 3.869645297527313e-05, 3.999471664428711e-05]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 25.0, 84.0, 299.0, 450.0, 101.0, 26.0, 16.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.428028998721857e-06, -5.329571649781428e-06, -5.231113846093649e-06, -5.132656497153221e-06, -5.0341986934654415e-06, -4.935741344525013e-06, -4.837283995584585e-06, -4.7388261918968055e-06, -4.640368842956377e-06, -4.541911494015949e-06, -4.44345369032817e-06, -4.344996341387741e-06, -4.246538992447313e-06, -4.148081188759534e-06, -4.049623839819105e-06, -3.951166036131326e-06, -3.852708687190898e-06, -3.754251110876794e-06, -3.65579353456269e-06, -3.557336185622262e-06, -3.458878609308158e-06, -3.3604210329940543e-06, -3.261963684053626e-06, -3.163506107739522e-06, -3.0650485314254183e-06, -2.9665909551113145e-06, -2.8681333787972108e-06, -2.7696760298567824e-06, -2.6712184535426786e-06, -2.572760877228575e-06, -2.4743035282881465e-06, -2.3758459519740427e-06, -2.277388375659939e-06, -2.178930799345835e-06, -2.0804732230317313e-06, -1.982015874091303e-06, -1.8835582977771992e-06, -1.7851007214630954e-06, -1.6866432588358293e-06, -1.5881857962085633e-06, -1.4897282198944595e-06, -1.3912706435803557e-06, -1.2928131809530896e-06, -1.1943557183258235e-06, -1.0958981420117198e-06, -9.97440565697616e-07, -8.989831030703499e-07, -8.00525583599665e-07, -7.0206806412898e-07, -6.036105446582951e-07, -5.051530251876102e-07, -4.0669550571692525e-07, -3.082379862462403e-07, -2.097804667755554e-07, -1.1132294730487047e-07, -1.2865427834185539e-08, 8.559209163649939e-08, 1.8404961110718432e-07, 2.8250713057786925e-07, 3.809646500485542e-07, 4.794221695192391e-07, 5.77879688989924e-07, 6.76337208460609e-07, 7.747947279312939e-07, 8.732522474019788e-07]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 10.0, 0.0, 0.0, 17.0, 0.0, 31.0, 0.0, 0.0, 63.0, 0.0, 0.0, 87.0, 0.0, 151.0, 0.0, 0.0, 249.0, 0.0, 172.0, 0.0, 0.0, 116.0, 0.0, 59.0, 0.0, 0.0, 31.0, 0.0, 16.0, 0.0, 0.0, 7.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.323680281639099e-07, -6.09084963798523e-07, -5.85801899433136e-07, -5.62518835067749e-07, -5.392357707023621e-07, -5.159527063369751e-07, -4.926696419715881e-07, -4.6938657760620117e-07, -4.461035132408142e-07, -4.2282044887542725e-07, -3.995373845100403e-07, -3.762543201446533e-07, -3.5297125577926636e-07, -3.296881914138794e-07, -3.0640512704849243e-07, -2.8312206268310547e-07, -2.598389983177185e-07, -2.3655593395233154e-07, -2.1327286958694458e-07, -1.8998980522155762e-07, -1.6670674085617065e-07, -1.434236764907837e-07, -1.2014061212539673e-07, -9.685754776000977e-08, -7.35744833946228e-08, -5.029141902923584e-08, -2.7008354663848877e-08, -3.725290298461914e-09, 1.955777406692505e-08, 4.284083843231201e-08, 6.612390279769897e-08, 8.940696716308594e-08, 1.126900315284729e-07, 1.3597309589385986e-07, 1.5925616025924683e-07, 1.825392246246338e-07, 2.0582228899002075e-07, 2.2910535335540771e-07, 2.523884177207947e-07, 2.7567148208618164e-07, 2.989545464515686e-07, 3.2223761081695557e-07, 3.4552067518234253e-07, 3.688037395477295e-07, 3.9208680391311646e-07, 4.153698682785034e-07, 4.386529326438904e-07, 4.6193599700927734e-07, 4.852190613746643e-07, 5.085021257400513e-07, 5.317851901054382e-07, 5.550682544708252e-07, 5.783513188362122e-07, 6.016343832015991e-07, 6.249174475669861e-07, 6.48200511932373e-07, 6.7148357629776e-07, 6.94766640663147e-07, 7.180497050285339e-07, 7.413327693939209e-07, 7.646158337593079e-07, 7.878988981246948e-07, 8.111819624900818e-07, 8.344650268554688e-07]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 12.0, 9.0, 6.0, 6.0, 14.0, 11.0, 17.0, 19.0, 22.0, 21.0, 29.0, 33.0, 37.0, 29.0, 46.0, 41.0, 36.0, 44.0, 41.0, 41.0, 44.0, 44.0, 36.0, 51.0, 46.0, 33.0, 28.0, 26.0, 29.0, 20.0, 27.0, 19.0, 16.0, 12.0, 12.0, 6.0, 13.0, 6.0, 2.0, 5.0, 3.0, 5.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.423828125, -3.318603515625, -3.21337890625, -3.108154296875, -3.0029296875, -2.897705078125, -2.79248046875, -2.687255859375, -2.58203125, -2.476806640625, -2.37158203125, -2.266357421875, -2.1611328125, -2.055908203125, -1.95068359375, -1.845458984375, -1.740234375, -1.635009765625, -1.52978515625, -1.424560546875, -1.3193359375, -1.214111328125, -1.10888671875, -1.003662109375, -0.8984375, -0.793212890625, -0.68798828125, -0.582763671875, -0.4775390625, -0.372314453125, -0.26708984375, -0.161865234375, -0.056640625, 0.048583984375, 0.15380859375, 0.259033203125, 0.3642578125, 0.469482421875, 0.57470703125, 0.679931640625, 0.78515625, 0.890380859375, 0.99560546875, 1.100830078125, 1.2060546875, 1.311279296875, 1.41650390625, 1.521728515625, 1.626953125, 1.732177734375, 1.83740234375, 1.942626953125, 2.0478515625, 2.153076171875, 2.25830078125, 2.363525390625, 2.46875, 2.573974609375, 2.67919921875, 2.784423828125, 2.8896484375, 2.994873046875, 3.10009765625, 3.205322265625, 3.310546875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 12.0, 11.0, 23.0, 29.0, 39.0, 89.0, 141.0, 250.0, 483.0, 892.0, 1678.0, 3225.0, 5868.0, 10711.0, 19818.0, 37530.0, 76320.0, 187263.0, 424203.0, 146922.0, 63672.0, 31860.0, 17197.0, 9187.0, 5142.0, 2787.0, 1472.0, 766.0, 425.0, 193.0, 120.0, 80.0, 47.0, 32.0, 13.0, 19.0, 7.0, 3.0, 2.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.62890625, -4.490234375, -4.3515625, -4.212890625, -4.07421875, -3.935546875, -3.796875, -3.658203125, -3.51953125, -3.380859375, -3.2421875, -3.103515625, -2.96484375, -2.826171875, -2.6875, -2.548828125, -2.41015625, -2.271484375, -2.1328125, -1.994140625, -1.85546875, -1.716796875, -1.578125, -1.439453125, -1.30078125, -1.162109375, -1.0234375, -0.884765625, -0.74609375, -0.607421875, -0.46875, -0.330078125, -0.19140625, -0.052734375, 0.0859375, 0.224609375, 0.36328125, 0.501953125, 0.640625, 0.779296875, 0.91796875, 1.056640625, 1.1953125, 1.333984375, 1.47265625, 1.611328125, 1.75, 1.888671875, 2.02734375, 2.166015625, 2.3046875, 2.443359375, 2.58203125, 2.720703125, 2.859375, 2.998046875, 3.13671875, 3.275390625, 3.4140625, 3.552734375, 3.69140625, 3.830078125, 3.96875, 4.107421875, 4.24609375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 14.0, 15.0, 15.0, 14.0, 27.0, 20.0, 27.0, 34.0, 42.0, 43.0, 58.0, 50.0, 82.0, 130.0, 231.0, 1528.0, 174.0, 103.0, 68.0, 59.0, 50.0, 34.0, 35.0, 32.0, 20.0, 21.0, 26.0, 19.0, 17.0, 10.0, 5.0, 8.0, 8.0, 2.0, 6.0, 3.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.4375, -10.06884765625, -9.7001953125, -9.33154296875, -8.962890625, -8.59423828125, -8.2255859375, -7.85693359375, -7.48828125, -7.11962890625, -6.7509765625, -6.38232421875, -6.013671875, -5.64501953125, -5.2763671875, -4.90771484375, -4.5390625, -4.17041015625, -3.8017578125, -3.43310546875, -3.064453125, -2.69580078125, -2.3271484375, -1.95849609375, -1.58984375, -1.22119140625, -0.8525390625, -0.48388671875, -0.115234375, 0.25341796875, 0.6220703125, 0.99072265625, 1.359375, 1.72802734375, 2.0966796875, 2.46533203125, 2.833984375, 3.20263671875, 3.5712890625, 3.93994140625, 4.30859375, 4.67724609375, 5.0458984375, 5.41455078125, 5.783203125, 6.15185546875, 6.5205078125, 6.88916015625, 7.2578125, 7.62646484375, 7.9951171875, 8.36376953125, 8.732421875, 9.10107421875, 9.4697265625, 9.83837890625, 10.20703125, 10.57568359375, 10.9443359375, 11.31298828125, 11.681640625, 12.05029296875, 12.4189453125, 12.78759765625, 13.15625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 12.0, 9.0, 11.0, 20.0, 21.0, 24.0, 39.0, 43.0, 54.0, 51.0, 104.0, 152.0, 244.0, 622.0, 3428.0, 81391.0, 2859049.0, 192283.0, 6425.0, 812.0, 281.0, 180.0, 114.0, 71.0, 55.0, 44.0, 25.0, 37.0, 21.0, 22.0, 21.0, 10.0, 4.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.203125, -27.4111328125, -26.619140625, -25.8271484375, -25.03515625, -24.2431640625, -23.451171875, -22.6591796875, -21.8671875, -21.0751953125, -20.283203125, -19.4912109375, -18.69921875, -17.9072265625, -17.115234375, -16.3232421875, -15.53125, -14.7392578125, -13.947265625, -13.1552734375, -12.36328125, -11.5712890625, -10.779296875, -9.9873046875, -9.1953125, -8.4033203125, -7.611328125, -6.8193359375, -6.02734375, -5.2353515625, -4.443359375, -3.6513671875, -2.859375, -2.0673828125, -1.275390625, -0.4833984375, 0.30859375, 1.1005859375, 1.892578125, 2.6845703125, 3.4765625, 4.2685546875, 5.060546875, 5.8525390625, 6.64453125, 7.4365234375, 8.228515625, 9.0205078125, 9.8125, 10.6044921875, 11.396484375, 12.1884765625, 12.98046875, 13.7724609375, 14.564453125, 15.3564453125, 16.1484375, 16.9404296875, 17.732421875, 18.5244140625, 19.31640625, 20.1083984375, 20.900390625, 21.6923828125, 22.484375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [2.0, 20.0, 63.0, 241.0, 362.0, 236.0, 83.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.559069633483887, -7.432194709777832, -5.305319309234619, -3.1784439086914062, -1.0515689849853516, 1.0753059387207031, 3.202181816101074, 5.329056739807129, 7.455931663513184, 9.582806587219238, 11.70968246459961, 13.836557388305664, 15.963432312011719, 18.090307235717773, 20.217182159423828, 22.344058990478516, 24.470932006835938, 26.597806930541992, 28.724681854248047, 30.851558685302734, 32.978431701660156, 35.105308532714844, 37.23218536376953, 39.35905838012695, 41.48593521118164, 43.61281204223633, 45.73968505859375, 47.86656188964844, 49.99343490600586, 52.12031173706055, 54.24718475341797, 56.374061584472656, 58.500938415527344, 60.62781524658203, 62.75468826293945, 64.88156127929688, 67.00843811035156, 69.13531494140625, 71.26219177246094, 73.38906860351562, 75.51593780517578, 77.64281463623047, 79.76969146728516, 81.89656066894531, 84.0234375, 86.15031433105469, 88.27719116210938, 90.40406799316406, 92.53094482421875, 94.65782165527344, 96.78469848632812, 98.91156768798828, 101.03844451904297, 103.16532135009766, 105.29219818115234, 107.4190673828125, 109.54594421386719, 111.67282104492188, 113.79969787597656, 115.92656707763672, 118.0534439086914, 120.1803207397461, 122.30719757080078, 124.43406677246094, 126.56094360351562]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 6.0, 13.0, 8.0, 8.0, 11.0, 25.0, 19.0, 33.0, 40.0, 31.0, 45.0, 42.0, 51.0, 50.0, 47.0, 47.0, 42.0, 54.0, 41.0, 49.0, 39.0, 58.0, 42.0, 41.0, 35.0, 14.0, 20.0, 20.0, 14.0, 9.0, 15.0, 11.0, 5.0, 4.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.96651077270508, -31.773164749145508, -30.579818725585938, -29.386472702026367, -28.193126678466797, -26.99978256225586, -25.80643653869629, -24.61309051513672, -23.41974449157715, -22.226398468017578, -21.033052444458008, -19.839706420898438, -18.6463623046875, -17.453014373779297, -16.25967025756836, -15.066324234008789, -13.872978210449219, -12.679632186889648, -11.486286163330078, -10.292941093444824, -9.099595069885254, -7.906249046325684, -6.7129034996032715, -5.519557952880859, -4.326211929321289, -3.132866144180298, -1.9395203590393066, -0.7461745738983154, 0.4471712112426758, 1.640517234802246, 2.833862781524658, 4.02720832824707, 5.220558166503906, 6.413904190063477, 7.607249736785889, 8.8005952835083, 9.993941307067871, 11.187287330627441, 12.380632400512695, 13.573978424072266, 14.767324447631836, 15.960670471191406, 17.154016494750977, 18.347362518310547, 19.540706634521484, 20.734054565429688, 21.927398681640625, 23.120744705200195, 24.314090728759766, 25.507436752319336, 26.700782775878906, 27.894128799438477, 29.087474822998047, 30.280818939208984, 31.474164962768555, 32.667510986328125, 33.86085510253906, 35.05419921875, 36.2475471496582, 37.44089126586914, 38.634239196777344, 39.82758331298828, 41.020931243896484, 42.21427536010742, 43.407623291015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 13.0, 6.0, 11.0, 9.0, 15.0, 19.0, 22.0, 16.0, 27.0, 20.0, 35.0, 28.0, 40.0, 32.0, 51.0, 34.0, 46.0, 46.0, 37.0, 44.0, 54.0, 42.0, 39.0, 40.0, 39.0, 20.0, 33.0, 25.0, 22.0, 19.0, 21.0, 13.0, 21.0, 8.0, 5.0, 10.0, 8.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.80859375, -3.694366455078125, -3.58013916015625, -3.465911865234375, -3.3516845703125, -3.237457275390625, -3.12322998046875, -3.009002685546875, -2.894775390625, -2.780548095703125, -2.66632080078125, -2.552093505859375, -2.4378662109375, -2.323638916015625, -2.20941162109375, -2.095184326171875, -1.98095703125, -1.866729736328125, -1.75250244140625, -1.638275146484375, -1.5240478515625, -1.409820556640625, -1.29559326171875, -1.181365966796875, -1.067138671875, -0.952911376953125, -0.83868408203125, -0.724456787109375, -0.6102294921875, -0.496002197265625, -0.38177490234375, -0.267547607421875, -0.1533203125, -0.039093017578125, 0.07513427734375, 0.189361572265625, 0.3035888671875, 0.417816162109375, 0.53204345703125, 0.646270751953125, 0.760498046875, 0.874725341796875, 0.98895263671875, 1.103179931640625, 1.2174072265625, 1.331634521484375, 1.44586181640625, 1.560089111328125, 1.67431640625, 1.788543701171875, 1.90277099609375, 2.016998291015625, 2.1312255859375, 2.245452880859375, 2.35968017578125, 2.473907470703125, 2.588134765625, 2.702362060546875, 2.81658935546875, 2.930816650390625, 3.0450439453125, 3.159271240234375, 3.27349853515625, 3.387725830078125, 3.501953125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 1.0, 2.0, 3.0, 5.0, 12.0, 24.0, 33.0, 46.0, 63.0, 107.0, 176.0, 262.0, 437.0, 712.0, 1151.0, 2016.0, 3609.0, 6309.0, 11640.0, 22134.0, 42380.0, 84015.0, 165869.0, 319769.0, 580139.0, 896443.0, 874474.0, 554312.0, 304811.0, 157052.0, 79355.0, 40402.0, 21117.0, 11306.0, 6004.0, 3351.0, 1881.0, 1142.0, 660.0, 390.0, 236.0, 169.0, 90.0, 61.0, 32.0, 25.0, 19.0, 16.0, 15.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.884765625, -2.7972412109375, -2.709716796875, -2.6221923828125, -2.53466796875, -2.4471435546875, -2.359619140625, -2.2720947265625, -2.1845703125, -2.0970458984375, -2.009521484375, -1.9219970703125, -1.83447265625, -1.7469482421875, -1.659423828125, -1.5718994140625, -1.484375, -1.3968505859375, -1.309326171875, -1.2218017578125, -1.13427734375, -1.0467529296875, -0.959228515625, -0.8717041015625, -0.7841796875, -0.6966552734375, -0.609130859375, -0.5216064453125, -0.43408203125, -0.3465576171875, -0.259033203125, -0.1715087890625, -0.083984375, 0.0035400390625, 0.091064453125, 0.1785888671875, 0.26611328125, 0.3536376953125, 0.441162109375, 0.5286865234375, 0.6162109375, 0.7037353515625, 0.791259765625, 0.8787841796875, 0.96630859375, 1.0538330078125, 1.141357421875, 1.2288818359375, 1.31640625, 1.4039306640625, 1.491455078125, 1.5789794921875, 1.66650390625, 1.7540283203125, 1.841552734375, 1.9290771484375, 2.0166015625, 2.1041259765625, 2.191650390625, 2.2791748046875, 2.36669921875, 2.4542236328125, 2.541748046875, 2.6292724609375, 2.716796875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 7.0, 7.0, 22.0, 16.0, 24.0, 36.0, 63.0, 77.0, 86.0, 128.0, 152.0, 228.0, 268.0, 341.0, 420.0, 464.0, 388.0, 316.0, 255.0, 172.0, 147.0, 101.0, 88.0, 74.0, 55.0, 29.0, 22.0, 24.0, 16.0, 5.0, 8.0, 6.0, 4.0, 5.0, 1.0, 6.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.79296875, -6.60552978515625, -6.4180908203125, -6.23065185546875, -6.043212890625, -5.85577392578125, -5.6683349609375, -5.48089599609375, -5.29345703125, -5.10601806640625, -4.9185791015625, -4.73114013671875, -4.543701171875, -4.35626220703125, -4.1688232421875, -3.98138427734375, -3.7939453125, -3.60650634765625, -3.4190673828125, -3.23162841796875, -3.044189453125, -2.85675048828125, -2.6693115234375, -2.48187255859375, -2.29443359375, -2.10699462890625, -1.9195556640625, -1.73211669921875, -1.544677734375, -1.35723876953125, -1.1697998046875, -0.98236083984375, -0.794921875, -0.60748291015625, -0.4200439453125, -0.23260498046875, -0.045166015625, 0.14227294921875, 0.3297119140625, 0.51715087890625, 0.70458984375, 0.89202880859375, 1.0794677734375, 1.26690673828125, 1.454345703125, 1.64178466796875, 1.8292236328125, 2.01666259765625, 2.2041015625, 2.39154052734375, 2.5789794921875, 2.76641845703125, 2.953857421875, 3.14129638671875, 3.3287353515625, 3.51617431640625, 3.70361328125, 3.89105224609375, 4.0784912109375, 4.26593017578125, 4.453369140625, 4.64080810546875, 4.8282470703125, 5.01568603515625, 5.203125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 7.0, 6.0, 5.0, 7.0, 19.0, 24.0, 18.0, 41.0, 75.0, 64.0, 94.0, 151.0, 210.0, 339.0, 657.0, 2930.0, 119523.0, 3659400.0, 402562.0, 6139.0, 807.0, 413.0, 232.0, 153.0, 109.0, 79.0, 71.0, 37.0, 28.0, 23.0, 16.0, 12.0, 3.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.095458984375, -18.37841796875, -17.661376953125, -16.9443359375, -16.227294921875, -15.51025390625, -14.793212890625, -14.076171875, -13.359130859375, -12.64208984375, -11.925048828125, -11.2080078125, -10.490966796875, -9.77392578125, -9.056884765625, -8.33984375, -7.622802734375, -6.90576171875, -6.188720703125, -5.4716796875, -4.754638671875, -4.03759765625, -3.320556640625, -2.603515625, -1.886474609375, -1.16943359375, -0.452392578125, 0.2646484375, 0.981689453125, 1.69873046875, 2.415771484375, 3.1328125, 3.849853515625, 4.56689453125, 5.283935546875, 6.0009765625, 6.718017578125, 7.43505859375, 8.152099609375, 8.869140625, 9.586181640625, 10.30322265625, 11.020263671875, 11.7373046875, 12.454345703125, 13.17138671875, 13.888427734375, 14.60546875, 15.322509765625, 16.03955078125, 16.756591796875, 17.4736328125, 18.190673828125, 18.90771484375, 19.624755859375, 20.341796875, 21.058837890625, 21.77587890625, 22.492919921875, 23.2099609375, 23.927001953125, 24.64404296875, 25.361083984375, 26.078125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 59.0, 275.0, 453.0, 194.0, 28.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.2837677001953, -136.19705200195312, -132.11033630371094, -128.02362060546875, -123.9369125366211, -119.8501968383789, -115.76348876953125, -111.67677307128906, -107.59005737304688, -103.50334167480469, -99.4166259765625, -95.32991790771484, -91.24320220947266, -87.15648651123047, -83.06977844238281, -78.98306274414062, -74.89634704589844, -70.80963134765625, -66.72291564941406, -62.636207580566406, -58.54949188232422, -54.46277618408203, -50.37606430053711, -46.28935241699219, -42.20263671875, -38.11592102050781, -34.02920913696289, -29.942495346069336, -25.85578155517578, -21.769067764282227, -17.682353973388672, -13.595640182495117, -9.508941650390625, -5.42222785949707, -1.3355140686035156, 2.751199722290039, 6.837913513183594, 10.924627304077148, 15.011341094970703, 19.098054885864258, 23.184768676757812, 27.271482467651367, 31.358196258544922, 35.444908142089844, 39.53162384033203, 43.61833953857422, 47.70505142211914, 51.79176330566406, 55.87847900390625, 59.96519470214844, 64.05191040039062, 68.13861846923828, 72.22533416748047, 76.31204986572266, 80.39875793457031, 84.4854736328125, 88.57218933105469, 92.65890502929688, 96.74562072753906, 100.83232879638672, 104.9190444946289, 109.0057601928711, 113.09246826171875, 117.17918395996094, 121.26589965820312]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 9.0, 6.0, 4.0, 9.0, 13.0, 5.0, 13.0, 20.0, 15.0, 33.0, 34.0, 34.0, 43.0, 42.0, 42.0, 37.0, 34.0, 51.0, 43.0, 48.0, 41.0, 44.0, 43.0, 42.0, 32.0, 52.0, 26.0, 24.0, 24.0, 19.0, 18.0, 24.0, 18.0, 18.0, 10.0, 13.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.325834274291992, -20.60890007019043, -19.891965866088867, -19.175031661987305, -18.458099365234375, -17.741165161132812, -17.02423095703125, -16.307296752929688, -15.590362548828125, -14.873428344726562, -14.156494140625, -13.439560890197754, -12.722626686096191, -12.005692481994629, -11.288759231567383, -10.57182502746582, -9.854890823364258, -9.137956619262695, -8.421022415161133, -7.704089164733887, -6.987154960632324, -6.270220756530762, -5.553287029266357, -4.836353302001953, -4.119419097900391, -3.4024851322174072, -2.685551166534424, -1.9686172008514404, -1.251683235168457, -0.5347492694854736, 0.18218469619750977, 0.8991184234619141, 1.6160507202148438, 2.332984685897827, 3.0499186515808105, 3.766852617263794, 4.483786582946777, 5.20072078704834, 5.917654514312744, 6.634588241577148, 7.351522445678711, 8.068456649780273, 8.785390853881836, 9.502324104309082, 10.219258308410645, 10.936192512512207, 11.653125762939453, 12.370059967041016, 13.086994171142578, 13.80392837524414, 14.520862579345703, 15.23779582977295, 15.954730033874512, 16.671663284301758, 17.38859748840332, 18.105531692504883, 18.822465896606445, 19.539400100708008, 20.25633430480957, 20.973268508911133, 21.690200805664062, 22.407135009765625, 23.124069213867188, 23.84100341796875, 24.557937622070312]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 15.0, 14.0, 14.0, 13.0, 17.0, 21.0, 17.0, 25.0, 36.0, 27.0, 24.0, 38.0, 38.0, 45.0, 44.0, 35.0, 40.0, 54.0, 40.0, 51.0, 46.0, 34.0, 35.0, 30.0, 26.0, 27.0, 20.0, 28.0, 21.0, 16.0, 12.0, 19.0, 7.0, 11.0, 10.0, 8.0, 1.0, 3.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.34906005859375, -3.2410888671875, -3.13311767578125, -3.025146484375, -2.91717529296875, -2.8092041015625, -2.70123291015625, -2.59326171875, -2.48529052734375, -2.3773193359375, -2.26934814453125, -2.161376953125, -2.05340576171875, -1.9454345703125, -1.83746337890625, -1.7294921875, -1.62152099609375, -1.5135498046875, -1.40557861328125, -1.297607421875, -1.18963623046875, -1.0816650390625, -0.97369384765625, -0.86572265625, -0.75775146484375, -0.6497802734375, -0.54180908203125, -0.433837890625, -0.32586669921875, -0.2178955078125, -0.10992431640625, -0.001953125, 0.10601806640625, 0.2139892578125, 0.32196044921875, 0.429931640625, 0.53790283203125, 0.6458740234375, 0.75384521484375, 0.86181640625, 0.96978759765625, 1.0777587890625, 1.18572998046875, 1.293701171875, 1.40167236328125, 1.5096435546875, 1.61761474609375, 1.7255859375, 1.83355712890625, 1.9415283203125, 2.04949951171875, 2.157470703125, 2.26544189453125, 2.3734130859375, 2.48138427734375, 2.58935546875, 2.69732666015625, 2.8052978515625, 2.91326904296875, 3.021240234375, 3.12921142578125, 3.2371826171875, 3.34515380859375, 3.453125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 9.0, 18.0, 27.0, 47.0, 69.0, 82.0, 146.0, 194.0, 301.0, 454.0, 622.0, 895.0, 1391.0, 2149.0, 3179.0, 4641.0, 6934.0, 10051.0, 15300.0, 23174.0, 35539.0, 58210.0, 105677.0, 288698.0, 237250.0, 97974.0, 55045.0, 33941.0, 21931.0, 14701.0, 9669.0, 6624.0, 4442.0, 2913.0, 2027.0, 1421.0, 911.0, 629.0, 427.0, 267.0, 217.0, 126.0, 92.0, 53.0, 30.0, 21.0, 13.0, 9.0, 11.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.141357421875, -0.136932373046875, -0.13250732421875, -0.128082275390625, -0.1236572265625, -0.119232177734375, -0.11480712890625, -0.110382080078125, -0.10595703125, -0.101531982421875, -0.09710693359375, -0.092681884765625, -0.0882568359375, -0.083831787109375, -0.07940673828125, -0.074981689453125, -0.070556640625, -0.066131591796875, -0.06170654296875, -0.057281494140625, -0.0528564453125, -0.048431396484375, -0.04400634765625, -0.039581298828125, -0.03515625, -0.030731201171875, -0.02630615234375, -0.021881103515625, -0.0174560546875, -0.013031005859375, -0.00860595703125, -0.004180908203125, 0.000244140625, 0.004669189453125, 0.00909423828125, 0.013519287109375, 0.0179443359375, 0.022369384765625, 0.02679443359375, 0.031219482421875, 0.03564453125, 0.040069580078125, 0.04449462890625, 0.048919677734375, 0.0533447265625, 0.057769775390625, 0.06219482421875, 0.066619873046875, 0.071044921875, 0.075469970703125, 0.07989501953125, 0.084320068359375, 0.0887451171875, 0.093170166015625, 0.09759521484375, 0.102020263671875, 0.1064453125, 0.110870361328125, 0.11529541015625, 0.119720458984375, 0.1241455078125, 0.128570556640625, 0.13299560546875, 0.137420654296875, 0.141845703125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 7.0, 5.0, 6.0, 7.0, 12.0, 12.0, 8.0, 17.0, 16.0, 25.0, 20.0, 30.0, 24.0, 30.0, 41.0, 37.0, 30.0, 35.0, 39.0, 35.0, 37.0, 39.0, 1066.0, 31.0, 37.0, 37.0, 30.0, 45.0, 32.0, 35.0, 25.0, 17.0, 17.0, 25.0, 21.0, 14.0, 15.0, 16.0, 12.0, 8.0, 4.0, 6.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.48828125, -2.41070556640625, -2.3331298828125, -2.25555419921875, -2.177978515625, -2.10040283203125, -2.0228271484375, -1.94525146484375, -1.86767578125, -1.79010009765625, -1.7125244140625, -1.63494873046875, -1.557373046875, -1.47979736328125, -1.4022216796875, -1.32464599609375, -1.2470703125, -1.16949462890625, -1.0919189453125, -1.01434326171875, -0.936767578125, -0.85919189453125, -0.7816162109375, -0.70404052734375, -0.62646484375, -0.54888916015625, -0.4713134765625, -0.39373779296875, -0.316162109375, -0.23858642578125, -0.1610107421875, -0.08343505859375, -0.005859375, 0.07171630859375, 0.1492919921875, 0.22686767578125, 0.304443359375, 0.38201904296875, 0.4595947265625, 0.53717041015625, 0.61474609375, 0.69232177734375, 0.7698974609375, 0.84747314453125, 0.925048828125, 1.00262451171875, 1.0802001953125, 1.15777587890625, 1.2353515625, 1.31292724609375, 1.3905029296875, 1.46807861328125, 1.545654296875, 1.62322998046875, 1.7008056640625, 1.77838134765625, 1.85595703125, 1.93353271484375, 2.0111083984375, 2.08868408203125, 2.166259765625, 2.24383544921875, 2.3214111328125, 2.39898681640625, 2.4765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 15.0, 13.0, 25.0, 38.0, 50.0, 83.0, 111.0, 187.0, 194.0, 369.0, 493.0, 675.0, 966.0, 1392.0, 1963.0, 2834.0, 4092.0, 5792.0, 8561.0, 12084.0, 18039.0, 26606.0, 41156.0, 65828.0, 111791.0, 1296079.0, 208871.0, 104925.0, 62922.0, 39422.0, 25770.0, 17186.0, 11915.0, 8081.0, 5618.0, 3856.0, 2804.0, 1932.0, 1305.0, 953.0, 625.0, 462.0, 332.0, 225.0, 148.0, 117.0, 70.0, 52.0, 43.0, 23.0, 16.0, 9.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.0714111328125, -0.06917572021484375, -0.0669403076171875, -0.06470489501953125, -0.062469482421875, -0.06023406982421875, -0.0579986572265625, -0.05576324462890625, -0.05352783203125, -0.05129241943359375, -0.0490570068359375, -0.04682159423828125, -0.044586181640625, -0.04235076904296875, -0.0401153564453125, -0.03787994384765625, -0.03564453125, -0.03340911865234375, -0.0311737060546875, -0.02893829345703125, -0.026702880859375, -0.02446746826171875, -0.0222320556640625, -0.01999664306640625, -0.01776123046875, -0.01552581787109375, -0.0132904052734375, -0.01105499267578125, -0.008819580078125, -0.00658416748046875, -0.0043487548828125, -0.00211334228515625, 0.0001220703125, 0.00235748291015625, 0.0045928955078125, 0.00682830810546875, 0.009063720703125, 0.01129913330078125, 0.0135345458984375, 0.01576995849609375, 0.01800537109375, 0.02024078369140625, 0.0224761962890625, 0.02471160888671875, 0.026947021484375, 0.02918243408203125, 0.0314178466796875, 0.03365325927734375, 0.035888671875, 0.03812408447265625, 0.0403594970703125, 0.04259490966796875, 0.044830322265625, 0.04706573486328125, 0.0493011474609375, 0.05153656005859375, 0.05377197265625, 0.05600738525390625, 0.0582427978515625, 0.06047821044921875, 0.062713623046875, 0.06494903564453125, 0.0671844482421875, 0.06941986083984375, 0.0716552734375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 0.0, 7.0, 14.0, 9.0, 13.0, 16.0, 21.0, 19.0, 41.0, 36.0, 0.0, 28.0, 60.0, 72.0, 302.0, 84.0, 64.0, 37.0, 33.0, 30.0, 15.0, 0.0, 21.0, 10.0, 11.0, 13.0, 2.0, 3.0, 5.0, 7.0, 10.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9073486328125e-06, -1.8533319234848022e-06, -1.7993152141571045e-06, -1.7452985048294067e-06, -1.691281795501709e-06, -1.6372650861740112e-06, -1.5832483768463135e-06, -1.5292316675186157e-06, -1.475214958190918e-06, -1.4211982488632202e-06, -1.3671815395355225e-06, -1.3131648302078247e-06, -1.259148120880127e-06, -1.2051314115524292e-06, -1.1511147022247314e-06, -1.0970979928970337e-06, -1.043081283569336e-06, -9.890645742416382e-07, -9.350478649139404e-07, -8.810311555862427e-07, -8.270144462585449e-07, -7.729977369308472e-07, -7.189810276031494e-07, -6.649643182754517e-07, -6.109476089477539e-07, -5.569308996200562e-07, -5.029141902923584e-07, -4.4889748096466064e-07, -3.948807716369629e-07, -3.4086406230926514e-07, -2.868473529815674e-07, -2.3283064365386963e-07, -1.7881393432617188e-07, -1.2479722499847412e-07, -7.078051567077637e-08, -1.6763806343078613e-08, 3.725290298461914e-08, 9.12696123123169e-08, 1.4528632164001465e-07, 1.993030309677124e-07, 2.5331974029541016e-07, 3.073364496231079e-07, 3.6135315895080566e-07, 4.153698682785034e-07, 4.6938657760620117e-07, 5.234032869338989e-07, 5.774199962615967e-07, 6.314367055892944e-07, 6.854534149169922e-07, 7.394701242446899e-07, 7.934868335723877e-07, 8.475035429000854e-07, 9.015202522277832e-07, 9.55536961555481e-07, 1.0095536708831787e-06, 1.0635703802108765e-06, 1.1175870895385742e-06, 1.171603798866272e-06, 1.2256205081939697e-06, 1.2796372175216675e-06, 1.3336539268493652e-06, 1.387670636177063e-06, 1.4416873455047607e-06, 1.4957040548324585e-06, 1.5497207641601562e-06]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 5.0, 4.0, 2.0, 4.0, 4.0, 8.0, 8.0, 6.0, 13.0, 18.0, 20.0, 17.0, 37.0, 56.0, 93.0, 196.0, 762.0, 42307.0, 988610.0, 15447.0, 455.0, 149.0, 88.0, 56.0, 48.0, 30.0, 18.0, 14.0, 12.0, 14.0, 10.0, 7.0, 7.0, 8.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.403425216674805e-05, -3.287661820650101e-05, -3.171898424625397e-05, -3.056135028600693e-05, -2.9403716325759888e-05, -2.8246082365512848e-05, -2.7088448405265808e-05, -2.593081444501877e-05, -2.477318048477173e-05, -2.361554652452469e-05, -2.245791256427765e-05, -2.130027860403061e-05, -2.014264464378357e-05, -1.898501068353653e-05, -1.782737672328949e-05, -1.666974276304245e-05, -1.551210880279541e-05, -1.435447484254837e-05, -1.319684088230133e-05, -1.203920692205429e-05, -1.0881572961807251e-05, -9.723939001560211e-06, -8.566305041313171e-06, -7.408671081066132e-06, -6.251037120819092e-06, -5.093403160572052e-06, -3.935769200325012e-06, -2.7781352400779724e-06, -1.6205012798309326e-06, -4.628673195838928e-07, 6.94766640663147e-07, 1.8524006009101868e-06, 3.0100345611572266e-06, 4.167668521404266e-06, 5.325302481651306e-06, 6.482936441898346e-06, 7.640570402145386e-06, 8.798204362392426e-06, 9.955838322639465e-06, 1.1113472282886505e-05, 1.2271106243133545e-05, 1.3428740203380585e-05, 1.4586374163627625e-05, 1.5744008123874664e-05, 1.6901642084121704e-05, 1.8059276044368744e-05, 1.9216910004615784e-05, 2.0374543964862823e-05, 2.1532177925109863e-05, 2.2689811885356903e-05, 2.3847445845603943e-05, 2.5005079805850983e-05, 2.6162713766098022e-05, 2.7320347726345062e-05, 2.8477981686592102e-05, 2.9635615646839142e-05, 3.079324960708618e-05, 3.195088356733322e-05, 3.310851752758026e-05, 3.42661514878273e-05, 3.542378544807434e-05, 3.658141940832138e-05, 3.773905336856842e-05, 3.889668732881546e-05, 4.00543212890625e-05]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 27.0, 173.0, 648.0, 140.0, 24.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.361460459127557e-06, -8.202021490433253e-06, -8.04258252173895e-06, -7.883144462539349e-06, -7.723705493845046e-06, -7.564266525150742e-06, -7.404827556456439e-06, -7.245389042509487e-06, -7.085950073815184e-06, -6.9265111051208805e-06, -6.767072591173928e-06, -6.607633622479625e-06, -6.448195108532673e-06, -6.2887561398383696e-06, -6.129317625891417e-06, -5.969878657197114e-06, -5.810439688502811e-06, -5.651000719808508e-06, -5.491562205861555e-06, -5.332123237167252e-06, -5.1726847232203e-06, -5.013245754525997e-06, -4.8538067858316936e-06, -4.694368271884741e-06, -4.534929757937789e-06, -4.375490789243486e-06, -4.2160522752965335e-06, -4.05661330660223e-06, -3.897174792655278e-06, -3.737735823960975e-06, -3.578297082640347e-06, -3.4188583413197193e-06, -3.259419827372767e-06, -3.0999810860521393e-06, -2.9405423447315115e-06, -2.7811033760372084e-06, -2.6216646347165806e-06, -2.462225893395953e-06, -2.302787152075325e-06, -2.1433484107546974e-06, -1.9839094420603942e-06, -1.8244707007397665e-06, -1.665031845732301e-06, -1.5055931044116733e-06, -1.3461542494042078e-06, -1.18671550808358e-06, -1.0272767667629523e-06, -8.678379117554869e-07, -7.083991704348591e-07, -5.489603722708125e-07, -3.8952160252847534e-07, -2.3008283278613817e-07, -7.064403462209157e-08, 8.879476354195504e-08, 2.482335048625828e-07, 4.0767235987004824e-07, 5.67111101190676e-07, 7.265498993547226e-07, 8.859886975187692e-07, 1.045427438839397e-06, 1.2048662938468624e-06, 1.3643050351674901e-06, 1.5237437764881179e-06, 1.6831826314955833e-06, 1.842621372816211e-06]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 8.0, 0.0, 23.0, 0.0, 0.0, 35.0, 0.0, 0.0, 37.0, 0.0, 58.0, 0.0, 0.0, 100.0, 0.0, 0.0, 133.0, 0.0, 213.0, 0.0, 0.0, 141.0, 0.0, 0.0, 100.0, 0.0, 59.0, 0.0, 0.0, 45.0, 0.0, 0.0, 25.0, 0.0, 19.0, 0.0, 0.0, 9.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.736947059631348e-07, -5.513429641723633e-07, -5.289912223815918e-07, -5.066394805908203e-07, -4.842877388000488e-07, -4.6193599700927734e-07, -4.3958425521850586e-07, -4.172325134277344e-07, -3.948807716369629e-07, -3.725290298461914e-07, -3.501772880554199e-07, -3.2782554626464844e-07, -3.0547380447387695e-07, -2.8312206268310547e-07, -2.60770320892334e-07, -2.384185791015625e-07, -2.1606683731079102e-07, -1.9371509552001953e-07, -1.7136335372924805e-07, -1.4901161193847656e-07, -1.2665987014770508e-07, -1.043081283569336e-07, -8.195638656616211e-08, -5.960464477539063e-08, -3.725290298461914e-08, -1.4901161193847656e-08, 7.450580596923828e-09, 2.9802322387695312e-08, 5.21540641784668e-08, 7.450580596923828e-08, 9.685754776000977e-08, 1.1920928955078125e-07, 1.4156103134155273e-07, 1.6391277313232422e-07, 1.862645149230957e-07, 2.086162567138672e-07, 2.3096799850463867e-07, 2.5331974029541016e-07, 2.7567148208618164e-07, 2.980232238769531e-07, 3.203749656677246e-07, 3.427267074584961e-07, 3.650784492492676e-07, 3.8743019104003906e-07, 4.0978193283081055e-07, 4.3213367462158203e-07, 4.544854164123535e-07, 4.76837158203125e-07, 4.991888999938965e-07, 5.21540641784668e-07, 5.438923835754395e-07, 5.662441253662109e-07, 5.885958671569824e-07, 6.109476089477539e-07, 6.332993507385254e-07, 6.556510925292969e-07, 6.780028343200684e-07, 7.003545761108398e-07, 7.227063179016113e-07, 7.450580596923828e-07, 7.674098014831543e-07, 7.897615432739258e-07, 8.121132850646973e-07, 8.344650268554688e-07]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 15.0, 14.0, 14.0, 13.0, 17.0, 21.0, 17.0, 25.0, 36.0, 27.0, 24.0, 38.0, 38.0, 45.0, 44.0, 35.0, 40.0, 54.0, 40.0, 51.0, 46.0, 34.0, 35.0, 30.0, 26.0, 27.0, 20.0, 28.0, 21.0, 16.0, 12.0, 19.0, 7.0, 11.0, 10.0, 8.0, 1.0, 3.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.34906005859375, -3.2410888671875, -3.13311767578125, -3.025146484375, -2.91717529296875, -2.8092041015625, -2.70123291015625, -2.59326171875, -2.48529052734375, -2.3773193359375, -2.26934814453125, -2.161376953125, -2.05340576171875, -1.9454345703125, -1.83746337890625, -1.7294921875, -1.62152099609375, -1.5135498046875, -1.40557861328125, -1.297607421875, -1.18963623046875, -1.0816650390625, -0.97369384765625, -0.86572265625, -0.75775146484375, -0.6497802734375, -0.54180908203125, -0.433837890625, -0.32586669921875, -0.2178955078125, -0.10992431640625, -0.001953125, 0.10601806640625, 0.2139892578125, 0.32196044921875, 0.429931640625, 0.53790283203125, 0.6458740234375, 0.75384521484375, 0.86181640625, 0.96978759765625, 1.0777587890625, 1.18572998046875, 1.293701171875, 1.40167236328125, 1.5096435546875, 1.61761474609375, 1.7255859375, 1.83355712890625, 1.9415283203125, 2.04949951171875, 2.157470703125, 2.26544189453125, 2.3734130859375, 2.48138427734375, 2.58935546875, 2.69732666015625, 2.8052978515625, 2.91326904296875, 3.021240234375, 3.12921142578125, 3.2371826171875, 3.34515380859375, 3.453125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 1.0, 16.0, 21.0, 38.0, 57.0, 78.0, 139.0, 221.0, 379.0, 564.0, 900.0, 1397.0, 2229.0, 3318.0, 5267.0, 8345.0, 13267.0, 20919.0, 32738.0, 51572.0, 83765.0, 145224.0, 222967.0, 180989.0, 103525.0, 62437.0, 39167.0, 25178.0, 15868.0, 10160.0, 6524.0, 4057.0, 2593.0, 1669.0, 1075.0, 705.0, 426.0, 275.0, 205.0, 107.0, 71.0, 42.0, 21.0, 15.0, 10.0, 1.0, 9.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.984375, -2.887176513671875, -2.78997802734375, -2.692779541015625, -2.5955810546875, -2.498382568359375, -2.40118408203125, -2.303985595703125, -2.206787109375, -2.109588623046875, -2.01239013671875, -1.915191650390625, -1.8179931640625, -1.720794677734375, -1.62359619140625, -1.526397705078125, -1.42919921875, -1.332000732421875, -1.23480224609375, -1.137603759765625, -1.0404052734375, -0.943206787109375, -0.84600830078125, -0.748809814453125, -0.651611328125, -0.554412841796875, -0.45721435546875, -0.360015869140625, -0.2628173828125, -0.165618896484375, -0.06842041015625, 0.028778076171875, 0.1259765625, 0.223175048828125, 0.32037353515625, 0.417572021484375, 0.5147705078125, 0.611968994140625, 0.70916748046875, 0.806365966796875, 0.903564453125, 1.000762939453125, 1.09796142578125, 1.195159912109375, 1.2923583984375, 1.389556884765625, 1.48675537109375, 1.583953857421875, 1.68115234375, 1.778350830078125, 1.87554931640625, 1.972747802734375, 2.0699462890625, 2.167144775390625, 2.26434326171875, 2.361541748046875, 2.458740234375, 2.555938720703125, 2.65313720703125, 2.750335693359375, 2.8475341796875, 2.944732666015625, 3.04193115234375, 3.139129638671875, 3.236328125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 7.0, 4.0, 5.0, 6.0, 13.0, 10.0, 5.0, 16.0, 16.0, 20.0, 26.0, 23.0, 23.0, 30.0, 31.0, 39.0, 41.0, 64.0, 82.0, 134.0, 271.0, 1349.0, 227.0, 138.0, 75.0, 58.0, 45.0, 41.0, 38.0, 32.0, 32.0, 23.0, 24.0, 18.0, 10.0, 7.0, 13.0, 12.0, 10.0, 10.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.8125, -10.46728515625, -10.1220703125, -9.77685546875, -9.431640625, -9.08642578125, -8.7412109375, -8.39599609375, -8.05078125, -7.70556640625, -7.3603515625, -7.01513671875, -6.669921875, -6.32470703125, -5.9794921875, -5.63427734375, -5.2890625, -4.94384765625, -4.5986328125, -4.25341796875, -3.908203125, -3.56298828125, -3.2177734375, -2.87255859375, -2.52734375, -2.18212890625, -1.8369140625, -1.49169921875, -1.146484375, -0.80126953125, -0.4560546875, -0.11083984375, 0.234375, 0.57958984375, 0.9248046875, 1.27001953125, 1.615234375, 1.96044921875, 2.3056640625, 2.65087890625, 2.99609375, 3.34130859375, 3.6865234375, 4.03173828125, 4.376953125, 4.72216796875, 5.0673828125, 5.41259765625, 5.7578125, 6.10302734375, 6.4482421875, 6.79345703125, 7.138671875, 7.48388671875, 7.8291015625, 8.17431640625, 8.51953125, 8.86474609375, 9.2099609375, 9.55517578125, 9.900390625, 10.24560546875, 10.5908203125, 10.93603515625, 11.28125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 10.0, 9.0, 7.0, 12.0, 14.0, 14.0, 24.0, 37.0, 38.0, 56.0, 95.0, 96.0, 143.0, 214.0, 390.0, 1042.0, 5791.0, 61980.0, 1303586.0, 1686120.0, 76706.0, 7012.0, 1103.0, 371.0, 238.0, 154.0, 91.0, 93.0, 58.0, 41.0, 35.0, 30.0, 21.0, 14.0, 6.0, 16.0, 10.0, 6.0, 5.0, 4.0, 8.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.625, -15.166015625, -14.70703125, -14.248046875, -13.7890625, -13.330078125, -12.87109375, -12.412109375, -11.953125, -11.494140625, -11.03515625, -10.576171875, -10.1171875, -9.658203125, -9.19921875, -8.740234375, -8.28125, -7.822265625, -7.36328125, -6.904296875, -6.4453125, -5.986328125, -5.52734375, -5.068359375, -4.609375, -4.150390625, -3.69140625, -3.232421875, -2.7734375, -2.314453125, -1.85546875, -1.396484375, -0.9375, -0.478515625, -0.01953125, 0.439453125, 0.8984375, 1.357421875, 1.81640625, 2.275390625, 2.734375, 3.193359375, 3.65234375, 4.111328125, 4.5703125, 5.029296875, 5.48828125, 5.947265625, 6.40625, 6.865234375, 7.32421875, 7.783203125, 8.2421875, 8.701171875, 9.16015625, 9.619140625, 10.078125, 10.537109375, 10.99609375, 11.455078125, 11.9140625, 12.373046875, 12.83203125, 13.291015625, 13.75]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 16.0, 132.0, 470.0, 334.0, 59.0, 7.0], "bins": [-198.3383331298828, -195.07504272460938, -191.81173706054688, -188.54844665527344, -185.28514099121094, -182.0218505859375, -178.758544921875, -175.49525451660156, -172.23194885253906, -168.96865844726562, -165.70535278320312, -162.4420623779297, -159.1787567138672, -155.91546630859375, -152.65216064453125, -149.3888702392578, -146.12557983398438, -142.86228942871094, -139.59898376464844, -136.335693359375, -133.0723876953125, -129.80909729003906, -126.54579162597656, -123.28250122070312, -120.01919555664062, -116.75589752197266, -113.49259948730469, -110.22930145263672, -106.96600341796875, -103.70270538330078, -100.43940734863281, -97.17611694335938, -93.91280364990234, -90.64950561523438, -87.3862075805664, -84.12290954589844, -80.85961151123047, -77.5963134765625, -74.33302307128906, -71.06971740722656, -67.80642700195312, -64.54312896728516, -61.27983093261719, -58.01653289794922, -54.75323486328125, -51.48993682861328, -48.22664260864258, -44.96334457397461, -41.700042724609375, -38.436744689941406, -35.17344665527344, -31.9101505279541, -28.646852493286133, -25.383554458618164, -22.120258331298828, -18.85696029663086, -15.593664169311523, -12.330366134643555, -9.067069053649902, -5.80377197265625, -2.5404739379882812, 0.7228240966796875, 3.9861202239990234, 7.249418258666992, 10.512716293334961]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 4.0, 9.0, 5.0, 6.0, 17.0, 14.0, 13.0, 17.0, 27.0, 15.0, 25.0, 36.0, 26.0, 33.0, 25.0, 29.0, 34.0, 42.0, 32.0, 50.0, 37.0, 35.0, 43.0, 40.0, 35.0, 40.0, 43.0, 30.0, 36.0, 28.0, 27.0, 21.0, 19.0, 18.0, 13.0, 8.0, 11.0, 10.0, 10.0, 9.0, 10.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-31.950580596923828, -31.040042877197266, -30.129507064819336, -29.218969345092773, -28.308433532714844, -27.39789581298828, -26.48736000061035, -25.57682228088379, -24.66628646850586, -23.755748748779297, -22.845212936401367, -21.934675216674805, -21.024139404296875, -20.113601684570312, -19.203065872192383, -18.29252815246582, -17.38199234008789, -16.471454620361328, -15.560918807983398, -14.650382041931152, -13.739845275878906, -12.829307556152344, -11.918771743774414, -11.008234024047852, -10.097696304321289, -9.187159538269043, -8.276622772216797, -7.366086006164551, -6.455549240112305, -5.5450119972229, -4.634475231170654, -3.723938465118408, -2.8134021759033203, -1.9028654098510742, -0.9923285245895386, -0.08179163932800293, 0.8287451267242432, 1.7392821311950684, 2.6498188972473145, 3.5603556632995605, 4.470892429351807, 5.381429195404053, 6.291965961456299, 7.202503204345703, 8.11303997039795, 9.023576736450195, 9.934113502502441, 10.844650268554688, 11.755187034606934, 12.66572380065918, 13.576260566711426, 14.486797332763672, 15.397334098815918, 16.307870864868164, 17.218408584594727, 18.128944396972656, 19.03948211669922, 19.95001983642578, 20.86055564880371, 21.771093368530273, 22.681629180908203, 23.592166900634766, 24.502702713012695, 25.413240432739258, 26.323776245117188]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 10.0, 4.0, 8.0, 8.0, 9.0, 14.0, 19.0, 17.0, 18.0, 19.0, 24.0, 31.0, 35.0, 34.0, 46.0, 33.0, 45.0, 52.0, 37.0, 39.0, 50.0, 47.0, 37.0, 36.0, 32.0, 45.0, 33.0, 31.0, 29.0, 21.0, 29.0, 14.0, 15.0, 12.0, 16.0, 7.0, 12.0, 6.0, 4.0, 3.0, 3.0, 4.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-4.01953125, -3.90399169921875, -3.7884521484375, -3.67291259765625, -3.557373046875, -3.44183349609375, -3.3262939453125, -3.21075439453125, -3.09521484375, -2.97967529296875, -2.8641357421875, -2.74859619140625, -2.633056640625, -2.51751708984375, -2.4019775390625, -2.28643798828125, -2.1708984375, -2.05535888671875, -1.9398193359375, -1.82427978515625, -1.708740234375, -1.59320068359375, -1.4776611328125, -1.36212158203125, -1.24658203125, -1.13104248046875, -1.0155029296875, -0.89996337890625, -0.784423828125, -0.66888427734375, -0.5533447265625, -0.43780517578125, -0.322265625, -0.20672607421875, -0.0911865234375, 0.02435302734375, 0.139892578125, 0.25543212890625, 0.3709716796875, 0.48651123046875, 0.60205078125, 0.71759033203125, 0.8331298828125, 0.94866943359375, 1.064208984375, 1.17974853515625, 1.2952880859375, 1.41082763671875, 1.5263671875, 1.64190673828125, 1.7574462890625, 1.87298583984375, 1.988525390625, 2.10406494140625, 2.2196044921875, 2.33514404296875, 2.45068359375, 2.56622314453125, 2.6817626953125, 2.79730224609375, 2.912841796875, 3.02838134765625, 3.1439208984375, 3.25946044921875, 3.375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 8.0, 10.0, 10.0, 18.0, 11.0, 26.0, 15.0, 19.0, 25.0, 33.0, 46.0, 65.0, 171.0, 463.0, 2523.0, 15123.0, 116813.0, 1012029.0, 2530272.0, 454288.0, 53052.0, 7344.0, 1260.0, 293.0, 93.0, 51.0, 28.0, 32.0, 28.0, 26.0, 13.0, 13.0, 9.0, 13.0, 14.0, 8.0, 10.0, 8.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-10.4765625, -10.18804931640625, -9.8995361328125, -9.61102294921875, -9.322509765625, -9.03399658203125, -8.7454833984375, -8.45697021484375, -8.16845703125, -7.87994384765625, -7.5914306640625, -7.30291748046875, -7.014404296875, -6.72589111328125, -6.4373779296875, -6.14886474609375, -5.8603515625, -5.57183837890625, -5.2833251953125, -4.99481201171875, -4.706298828125, -4.41778564453125, -4.1292724609375, -3.84075927734375, -3.55224609375, -3.26373291015625, -2.9752197265625, -2.68670654296875, -2.398193359375, -2.10968017578125, -1.8211669921875, -1.53265380859375, -1.244140625, -0.95562744140625, -0.6671142578125, -0.37860107421875, -0.090087890625, 0.19842529296875, 0.4869384765625, 0.77545166015625, 1.06396484375, 1.35247802734375, 1.6409912109375, 1.92950439453125, 2.218017578125, 2.50653076171875, 2.7950439453125, 3.08355712890625, 3.3720703125, 3.66058349609375, 3.9490966796875, 4.23760986328125, 4.526123046875, 4.81463623046875, 5.1031494140625, 5.39166259765625, 5.68017578125, 5.96868896484375, 6.2572021484375, 6.54571533203125, 6.834228515625, 7.12274169921875, 7.4112548828125, 7.69976806640625, 7.98828125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 4.0, 11.0, 10.0, 16.0, 19.0, 26.0, 39.0, 34.0, 58.0, 75.0, 102.0, 122.0, 153.0, 212.0, 256.0, 356.0, 442.0, 404.0, 380.0, 302.0, 219.0, 205.0, 148.0, 115.0, 94.0, 71.0, 50.0, 31.0, 36.0, 24.0, 17.0, 11.0, 8.0, 5.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.98828125, -5.8135986328125, -5.638916015625, -5.4642333984375, -5.28955078125, -5.1148681640625, -4.940185546875, -4.7655029296875, -4.5908203125, -4.4161376953125, -4.241455078125, -4.0667724609375, -3.89208984375, -3.7174072265625, -3.542724609375, -3.3680419921875, -3.193359375, -3.0186767578125, -2.843994140625, -2.6693115234375, -2.49462890625, -2.3199462890625, -2.145263671875, -1.9705810546875, -1.7958984375, -1.6212158203125, -1.446533203125, -1.2718505859375, -1.09716796875, -0.9224853515625, -0.747802734375, -0.5731201171875, -0.3984375, -0.2237548828125, -0.049072265625, 0.1256103515625, 0.30029296875, 0.4749755859375, 0.649658203125, 0.8243408203125, 0.9990234375, 1.1737060546875, 1.348388671875, 1.5230712890625, 1.69775390625, 1.8724365234375, 2.047119140625, 2.2218017578125, 2.396484375, 2.5711669921875, 2.745849609375, 2.9205322265625, 3.09521484375, 3.2698974609375, 3.444580078125, 3.6192626953125, 3.7939453125, 3.9686279296875, 4.143310546875, 4.3179931640625, 4.49267578125, 4.6673583984375, 4.842041015625, 5.0167236328125, 5.19140625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 4.0, 7.0, 12.0, 16.0, 25.0, 26.0, 41.0, 55.0, 87.0, 105.0, 163.0, 224.0, 370.0, 696.0, 3412.0, 81409.0, 2751343.0, 1319863.0, 32870.0, 1981.0, 571.0, 303.0, 182.0, 142.0, 115.0, 63.0, 48.0, 42.0, 21.0, 22.0, 17.0, 14.0, 9.0, 6.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.348876953125, -17.71337890625, -17.077880859375, -16.4423828125, -15.806884765625, -15.17138671875, -14.535888671875, -13.900390625, -13.264892578125, -12.62939453125, -11.993896484375, -11.3583984375, -10.722900390625, -10.08740234375, -9.451904296875, -8.81640625, -8.180908203125, -7.54541015625, -6.909912109375, -6.2744140625, -5.638916015625, -5.00341796875, -4.367919921875, -3.732421875, -3.096923828125, -2.46142578125, -1.825927734375, -1.1904296875, -0.554931640625, 0.08056640625, 0.716064453125, 1.3515625, 1.987060546875, 2.62255859375, 3.258056640625, 3.8935546875, 4.529052734375, 5.16455078125, 5.800048828125, 6.435546875, 7.071044921875, 7.70654296875, 8.342041015625, 8.9775390625, 9.613037109375, 10.24853515625, 10.884033203125, 11.51953125, 12.155029296875, 12.79052734375, 13.426025390625, 14.0615234375, 14.697021484375, 15.33251953125, 15.968017578125, 16.603515625, 17.239013671875, 17.87451171875, 18.510009765625, 19.1455078125, 19.781005859375, 20.41650390625, 21.052001953125, 21.6875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 12.0, 76.0, 175.0, 360.0, 260.0, 108.0, 26.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.68100357055664, -15.911445617675781, -13.141887664794922, -10.372329711914062, -7.602771759033203, -4.833213806152344, -2.0636558532714844, 0.705902099609375, 3.4754600524902344, 6.245018005371094, 9.014575958251953, 11.784133911132812, 14.553691864013672, 17.32324981689453, 20.09280776977539, 22.86236572265625, 25.63192367553711, 28.40148162841797, 31.171039581298828, 33.94059753417969, 36.71015548706055, 39.479713439941406, 42.249271392822266, 45.018829345703125, 47.788387298583984, 50.557945251464844, 53.3275032043457, 56.09706115722656, 58.86661911010742, 61.63617706298828, 64.40573120117188, 67.17529296875, 69.94485473632812, 72.71441650390625, 75.48397064208984, 78.25352478027344, 81.02308654785156, 83.79264831542969, 86.56220245361328, 89.33175659179688, 92.101318359375, 94.87088012695312, 97.64043426513672, 100.40998840332031, 103.17955017089844, 105.94911193847656, 108.71866607666016, 111.48822021484375, 114.25778198242188, 117.02734375, 119.7968978881836, 122.56645202636719, 125.33601379394531, 128.10557556152344, 130.8751220703125, 133.64468383789062, 136.41424560546875, 139.18380737304688, 141.953369140625, 144.72291564941406, 147.4924774169922, 150.2620391845703, 153.03158569335938, 155.8011474609375, 158.57070922851562]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 12.0, 6.0, 7.0, 6.0, 12.0, 17.0, 19.0, 21.0, 18.0, 21.0, 24.0, 28.0, 25.0, 33.0, 41.0, 44.0, 40.0, 54.0, 52.0, 46.0, 31.0, 46.0, 48.0, 29.0, 42.0, 33.0, 41.0, 40.0, 29.0, 20.0, 23.0, 24.0, 13.0, 13.0, 11.0, 9.0, 10.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.800262451171875, -19.150474548339844, -18.50068473815918, -17.85089683532715, -17.201108932495117, -16.551321029663086, -15.901531219482422, -15.25174331665039, -14.60195541381836, -13.952166557312012, -13.30237865447998, -12.652589797973633, -12.002801895141602, -11.353013038635254, -10.703224182128906, -10.053436279296875, -9.403647422790527, -8.75385856628418, -8.104070663452148, -7.454281806945801, -6.8044939041137695, -6.154705047607422, -5.504916667938232, -4.855128288269043, -4.2053399085998535, -3.555551528930664, -2.9057631492614746, -2.255974531173706, -1.6061861515045166, -0.9563977718353271, -0.3066091537475586, 0.34317922592163086, 0.9929676055908203, 1.6427559852600098, 2.292544364929199, 2.9423329830169678, 3.5921213626861572, 4.241909980773926, 4.891698360443115, 5.541486740112305, 6.191275119781494, 6.841063499450684, 7.490851879119873, 8.140640258789062, 8.79042911529541, 9.440217018127441, 10.090005874633789, 10.73979377746582, 11.389582633972168, 12.039371490478516, 12.689159393310547, 13.338948249816895, 13.988736152648926, 14.638525009155273, 15.288312911987305, 15.938101768493652, 16.587890625, 17.23767852783203, 17.887468338012695, 18.537256240844727, 19.187044143676758, 19.83683204650879, 20.486621856689453, 21.136409759521484, 21.786197662353516]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 4.0, 10.0, 5.0, 12.0, 13.0, 11.0, 11.0, 16.0, 19.0, 27.0, 33.0, 27.0, 35.0, 37.0, 37.0, 34.0, 30.0, 36.0, 45.0, 54.0, 48.0, 40.0, 32.0, 36.0, 27.0, 39.0, 34.0, 22.0, 35.0, 31.0, 17.0, 21.0, 22.0, 15.0, 9.0, 16.0, 4.0, 7.0, 6.0, 8.0, 7.0, 7.0, 3.0, 5.0, 2.0, 1.0, 4.0, 4.0], "bins": [-4.0234375, -3.911712646484375, -3.79998779296875, -3.688262939453125, -3.5765380859375, -3.464813232421875, -3.35308837890625, -3.241363525390625, -3.129638671875, -3.017913818359375, -2.90618896484375, -2.794464111328125, -2.6827392578125, -2.571014404296875, -2.45928955078125, -2.347564697265625, -2.23583984375, -2.124114990234375, -2.01239013671875, -1.900665283203125, -1.7889404296875, -1.677215576171875, -1.56549072265625, -1.453765869140625, -1.342041015625, -1.230316162109375, -1.11859130859375, -1.006866455078125, -0.8951416015625, -0.783416748046875, -0.67169189453125, -0.559967041015625, -0.4482421875, -0.336517333984375, -0.22479248046875, -0.113067626953125, -0.0013427734375, 0.110382080078125, 0.22210693359375, 0.333831787109375, 0.445556640625, 0.557281494140625, 0.66900634765625, 0.780731201171875, 0.8924560546875, 1.004180908203125, 1.11590576171875, 1.227630615234375, 1.33935546875, 1.451080322265625, 1.56280517578125, 1.674530029296875, 1.7862548828125, 1.897979736328125, 2.00970458984375, 2.121429443359375, 2.233154296875, 2.344879150390625, 2.45660400390625, 2.568328857421875, 2.6800537109375, 2.791778564453125, 2.90350341796875, 3.015228271484375, 3.126953125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 5.0, 10.0, 19.0, 22.0, 32.0, 64.0, 80.0, 140.0, 183.0, 308.0, 525.0, 741.0, 1095.0, 1738.0, 2632.0, 3877.0, 6229.0, 9739.0, 15858.0, 26695.0, 45513.0, 81189.0, 155089.0, 356711.0, 148802.0, 78270.0, 44492.0, 26026.0, 15806.0, 9452.0, 6052.0, 3834.0, 2561.0, 1624.0, 1043.0, 697.0, 490.0, 278.0, 214.0, 126.0, 99.0, 62.0, 40.0, 32.0, 15.0, 12.0, 15.0, 5.0, 1.0, 3.0, 5.0, 2.0], "bins": [-0.195068359375, -0.18956947326660156, -0.18407058715820312, -0.1785717010498047, -0.17307281494140625, -0.1675739288330078, -0.16207504272460938, -0.15657615661621094, -0.1510772705078125, -0.14557838439941406, -0.14007949829101562, -0.1345806121826172, -0.12908172607421875, -0.12358283996582031, -0.11808395385742188, -0.11258506774902344, -0.107086181640625, -0.10158729553222656, -0.09608840942382812, -0.09058952331542969, -0.08509063720703125, -0.07959175109863281, -0.07409286499023438, -0.06859397888183594, -0.0630950927734375, -0.05759620666503906, -0.052097320556640625, -0.04659843444824219, -0.04109954833984375, -0.03560066223144531, -0.030101776123046875, -0.024602890014648438, -0.01910400390625, -0.013605117797851562, -0.008106231689453125, -0.0026073455810546875, 0.00289154052734375, 0.008390426635742188, 0.013889312744140625, 0.019388198852539062, 0.0248870849609375, 0.030385971069335938, 0.035884857177734375, 0.04138374328613281, 0.04688262939453125, 0.05238151550292969, 0.057880401611328125, 0.06337928771972656, 0.068878173828125, 0.07437705993652344, 0.07987594604492188, 0.08537483215332031, 0.09087371826171875, 0.09637260437011719, 0.10187149047851562, 0.10737037658691406, 0.1128692626953125, 0.11836814880371094, 0.12386703491210938, 0.1293659210205078, 0.13486480712890625, 0.1403636932373047, 0.14586257934570312, 0.15136146545410156, 0.1568603515625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 3.0, 2.0, 13.0, 13.0, 8.0, 10.0, 10.0, 7.0, 16.0, 14.0, 21.0, 20.0, 19.0, 30.0, 26.0, 32.0, 28.0, 37.0, 31.0, 37.0, 39.0, 48.0, 1059.0, 31.0, 49.0, 43.0, 40.0, 44.0, 21.0, 29.0, 38.0, 27.0, 23.0, 16.0, 22.0, 14.0, 17.0, 18.0, 14.0, 11.0, 4.0, 7.0, 9.0, 4.0, 3.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.4375, -2.3553466796875, -2.273193359375, -2.1910400390625, -2.10888671875, -2.0267333984375, -1.944580078125, -1.8624267578125, -1.7802734375, -1.6981201171875, -1.615966796875, -1.5338134765625, -1.45166015625, -1.3695068359375, -1.287353515625, -1.2052001953125, -1.123046875, -1.0408935546875, -0.958740234375, -0.8765869140625, -0.79443359375, -0.7122802734375, -0.630126953125, -0.5479736328125, -0.4658203125, -0.3836669921875, -0.301513671875, -0.2193603515625, -0.13720703125, -0.0550537109375, 0.027099609375, 0.1092529296875, 0.19140625, 0.2735595703125, 0.355712890625, 0.4378662109375, 0.52001953125, 0.6021728515625, 0.684326171875, 0.7664794921875, 0.8486328125, 0.9307861328125, 1.012939453125, 1.0950927734375, 1.17724609375, 1.2593994140625, 1.341552734375, 1.4237060546875, 1.505859375, 1.5880126953125, 1.670166015625, 1.7523193359375, 1.83447265625, 1.9166259765625, 1.998779296875, 2.0809326171875, 2.1630859375, 2.2452392578125, 2.327392578125, 2.4095458984375, 2.49169921875, 2.5738525390625, 2.656005859375, 2.7381591796875, 2.8203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 11.0, 17.0, 29.0, 33.0, 63.0, 99.0, 147.0, 226.0, 317.0, 526.0, 652.0, 1015.0, 1362.0, 2023.0, 2812.0, 4026.0, 5773.0, 8434.0, 11640.0, 17348.0, 25645.0, 39817.0, 63868.0, 112640.0, 1317746.0, 210712.0, 99598.0, 57886.0, 36423.0, 23782.0, 16019.0, 11127.0, 7396.0, 5399.0, 3875.0, 2602.0, 1928.0, 1261.0, 901.0, 619.0, 409.0, 290.0, 207.0, 153.0, 88.0, 65.0, 41.0, 30.0, 16.0, 14.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.08123779296875, -0.07876873016357422, -0.07629966735839844, -0.07383060455322266, -0.07136154174804688, -0.0688924789428711, -0.06642341613769531, -0.06395435333251953, -0.06148529052734375, -0.05901622772216797, -0.05654716491699219, -0.054078102111816406, -0.051609039306640625, -0.049139976501464844, -0.04667091369628906, -0.04420185089111328, -0.0417327880859375, -0.03926372528076172, -0.03679466247558594, -0.034325599670410156, -0.031856536865234375, -0.029387474060058594, -0.026918411254882812, -0.02444934844970703, -0.02198028564453125, -0.01951122283935547, -0.017042160034179688, -0.014573097229003906, -0.012104034423828125, -0.009634971618652344, -0.0071659088134765625, -0.004696846008300781, -0.002227783203125, 0.00024127960205078125, 0.0027103424072265625, 0.005179405212402344, 0.007648468017578125, 0.010117530822753906, 0.012586593627929688, 0.015055656433105469, 0.01752471923828125, 0.01999378204345703, 0.022462844848632812, 0.024931907653808594, 0.027400970458984375, 0.029870033264160156, 0.03233909606933594, 0.03480815887451172, 0.0372772216796875, 0.03974628448486328, 0.04221534729003906, 0.044684410095214844, 0.047153472900390625, 0.049622535705566406, 0.05209159851074219, 0.05456066131591797, 0.05702972412109375, 0.05949878692626953, 0.06196784973144531, 0.0644369125366211, 0.06690597534179688, 0.06937503814697266, 0.07184410095214844, 0.07431316375732422, 0.0767822265625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 9.0, 5.0, 11.0, 9.0, 18.0, 10.0, 7.0, 24.0, 39.0, 23.0, 54.0, 101.0, 73.0, 279.0, 49.0, 81.0, 56.0, 26.0, 43.0, 20.0, 9.0, 12.0, 13.0, 2.0, 8.0, 10.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-06, -3.538094460964203e-06, -3.4403055906295776e-06, -3.3425167202949524e-06, -3.244727849960327e-06, -3.146938979625702e-06, -3.0491501092910767e-06, -2.9513612389564514e-06, -2.853572368621826e-06, -2.755783498287201e-06, -2.6579946279525757e-06, -2.5602057576179504e-06, -2.462416887283325e-06, -2.3646280169487e-06, -2.2668391466140747e-06, -2.1690502762794495e-06, -2.0712614059448242e-06, -1.973472535610199e-06, -1.8756836652755737e-06, -1.7778947949409485e-06, -1.6801059246063232e-06, -1.582317054271698e-06, -1.4845281839370728e-06, -1.3867393136024475e-06, -1.2889504432678223e-06, -1.191161572933197e-06, -1.0933727025985718e-06, -9.955838322639465e-07, -8.977949619293213e-07, -8.00006091594696e-07, -7.022172212600708e-07, -6.044283509254456e-07, -5.066394805908203e-07, -4.0885061025619507e-07, -3.110617399215698e-07, -2.1327286958694458e-07, -1.1548399925231934e-07, -1.7695128917694092e-08, 8.009374141693115e-08, 1.778826117515564e-07, 2.7567148208618164e-07, 3.734603524208069e-07, 4.7124922275543213e-07, 5.690380930900574e-07, 6.668269634246826e-07, 7.646158337593079e-07, 8.624047040939331e-07, 9.601935744285583e-07, 1.0579824447631836e-06, 1.1557713150978088e-06, 1.253560185432434e-06, 1.3513490557670593e-06, 1.4491379261016846e-06, 1.5469267964363098e-06, 1.644715666770935e-06, 1.7425045371055603e-06, 1.8402934074401855e-06, 1.938082277774811e-06, 2.035871148109436e-06, 2.1336600184440613e-06, 2.2314488887786865e-06, 2.3292377591133118e-06, 2.427026629447937e-06, 2.5248154997825623e-06, 2.6226043701171875e-06]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 7.0, 6.0, 6.0, 13.0, 12.0, 20.0, 29.0, 49.0, 96.0, 122.0, 269.0, 1234.0, 943055.0, 102459.0, 646.0, 215.0, 106.0, 63.0, 39.0, 19.0, 15.0, 12.0, 19.0, 9.0, 9.0, 6.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6803226470947266e-05, -5.46872615814209e-05, -5.257129669189453e-05, -5.0455331802368164e-05, -4.83393669128418e-05, -4.622340202331543e-05, -4.410743713378906e-05, -4.1991472244262695e-05, -3.987550735473633e-05, -3.775954246520996e-05, -3.5643577575683594e-05, -3.3527612686157227e-05, -3.141164779663086e-05, -2.9295682907104492e-05, -2.7179718017578125e-05, -2.5063753128051758e-05, -2.294778823852539e-05, -2.0831823348999023e-05, -1.8715858459472656e-05, -1.659989356994629e-05, -1.4483928680419922e-05, -1.2367963790893555e-05, -1.0251998901367188e-05, -8.13603401184082e-06, -6.020069122314453e-06, -3.904104232788086e-06, -1.7881393432617188e-06, 3.2782554626464844e-07, 2.4437904357910156e-06, 4.559755325317383e-06, 6.67572021484375e-06, 8.791685104370117e-06, 1.0907649993896484e-05, 1.3023614883422852e-05, 1.5139579772949219e-05, 1.7255544662475586e-05, 1.9371509552001953e-05, 2.148747444152832e-05, 2.3603439331054688e-05, 2.5719404220581055e-05, 2.7835369110107422e-05, 2.995133399963379e-05, 3.2067298889160156e-05, 3.4183263778686523e-05, 3.629922866821289e-05, 3.841519355773926e-05, 4.0531158447265625e-05, 4.264712333679199e-05, 4.476308822631836e-05, 4.6879053115844727e-05, 4.8995018005371094e-05, 5.111098289489746e-05, 5.322694778442383e-05, 5.5342912673950195e-05, 5.745887756347656e-05, 5.957484245300293e-05, 6.16908073425293e-05, 6.380677223205566e-05, 6.592273712158203e-05, 6.80387020111084e-05, 7.015466690063477e-05, 7.227063179016113e-05, 7.43865966796875e-05, 7.650256156921387e-05, 7.861852645874023e-05]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 19.0, 66.0, 217.0, 396.0, 217.0, 57.0, 23.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2027502281125635e-06, -6.07735819357913e-06, -5.951965704298345e-06, -5.826573669764912e-06, -5.701181180484127e-06, -5.575789145950694e-06, -5.450396656669909e-06, -5.3250046221364755e-06, -5.199612132855691e-06, -5.074220098322257e-06, -4.948827609041473e-06, -4.823435574508039e-06, -4.698043085227255e-06, -4.572651050693821e-06, -4.447258561413037e-06, -4.321866526879603e-06, -4.1964740375988185e-06, -4.071082003065385e-06, -3.9456895137846e-06, -3.820297479251167e-06, -3.6949049899703823e-06, -3.5695127280632732e-06, -3.444120466156164e-06, -3.3187284316227306e-06, -3.193336397089297e-06, -3.067944135182188e-06, -2.942551873275079e-06, -2.8171596113679698e-06, -2.6917673494608607e-06, -2.5663750875537517e-06, -2.4409828256466426e-06, -2.315590791113209e-06, -2.1901987565797754e-06, -2.0648064946726663e-06, -1.9394142327655572e-06, -1.8140219708584482e-06, -1.6886297089513391e-06, -1.56323744704423e-06, -1.4378452988239587e-06, -1.3124530369168497e-06, -1.1870606613229029e-06, -1.0616683994157938e-06, -9.362761375086848e-07, -8.108839324449946e-07, -6.854916705378855e-07, -5.600994086307765e-07, -4.3470720356708625e-07, -3.093149416599772e-07, -1.8392267975286813e-07, -5.853043205661379e-08, 6.686181563964055e-08, 1.9225404912504018e-07, 3.1764631103214924e-07, 4.430385729392583e-07, 5.684307780029485e-07, 6.938230399100576e-07, 8.192153018171666e-07, 9.446075637242757e-07, 1.0699998256313847e-06, 1.1953920875384938e-06, 1.3207843494456029e-06, 1.446176611352712e-06, 1.5715687595729833e-06, 1.6969610214800923e-06, 1.8223532833872014e-06]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 0.0, 6.0, 7.0, 0.0, 8.0, 8.0, 0.0, 12.0, 18.0, 0.0, 23.0, 22.0, 0.0, 28.0, 42.0, 0.0, 60.0, 59.0, 0.0, 73.0, 83.0, 0.0, 97.0, 80.0, 0.0, 67.0, 54.0, 0.0, 54.0, 47.0, 0.0, 32.0, 16.0, 0.0, 29.0, 23.0, 0.0, 18.0, 11.0, 0.0, 14.0, 3.0, 0.0, 4.0, 3.0, 0.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2116506695747375e-06, -1.171603798866272e-06, -1.1315569281578064e-06, -1.0915100574493408e-06, -1.0514631867408752e-06, -1.0114163160324097e-06, -9.71369445323944e-07, -9.313225746154785e-07, -8.912757039070129e-07, -8.512288331985474e-07, -8.111819624900818e-07, -7.711350917816162e-07, -7.310882210731506e-07, -6.910413503646851e-07, -6.509944796562195e-07, -6.109476089477539e-07, -5.709007382392883e-07, -5.308538675308228e-07, -4.908069968223572e-07, -4.507601261138916e-07, -4.10713255405426e-07, -3.7066638469696045e-07, -3.3061951398849487e-07, -2.905726432800293e-07, -2.505257725715637e-07, -2.1047890186309814e-07, -1.7043203115463257e-07, -1.30385160446167e-07, -9.033828973770142e-08, -5.029141902923584e-08, -1.0244548320770264e-08, 2.9802322387695312e-08, 6.984919309616089e-08, 1.0989606380462646e-07, 1.4994293451309204e-07, 1.8998980522155762e-07, 2.300366759300232e-07, 2.7008354663848877e-07, 3.1013041734695435e-07, 3.501772880554199e-07, 3.902241587638855e-07, 4.302710294723511e-07, 4.7031790018081665e-07, 5.103647708892822e-07, 5.504116415977478e-07, 5.904585123062134e-07, 6.30505383014679e-07, 6.705522537231445e-07, 7.105991244316101e-07, 7.506459951400757e-07, 7.906928658485413e-07, 8.307397365570068e-07, 8.707866072654724e-07, 9.10833477973938e-07, 9.508803486824036e-07, 9.909272193908691e-07, 1.0309740900993347e-06, 1.0710209608078003e-06, 1.1110678315162659e-06, 1.1511147022247314e-06, 1.191161572933197e-06, 1.2312084436416626e-06, 1.2712553143501282e-06, 1.3113021850585938e-06]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 4.0, 10.0, 5.0, 12.0, 13.0, 11.0, 11.0, 16.0, 19.0, 27.0, 33.0, 27.0, 35.0, 37.0, 37.0, 34.0, 30.0, 36.0, 45.0, 54.0, 48.0, 40.0, 32.0, 36.0, 27.0, 39.0, 34.0, 22.0, 35.0, 31.0, 17.0, 21.0, 22.0, 15.0, 9.0, 16.0, 4.0, 7.0, 6.0, 8.0, 7.0, 7.0, 3.0, 5.0, 2.0, 1.0, 4.0, 4.0], "bins": [-4.0234375, -3.911712646484375, -3.79998779296875, -3.688262939453125, -3.5765380859375, -3.464813232421875, -3.35308837890625, -3.241363525390625, -3.129638671875, -3.017913818359375, -2.90618896484375, -2.794464111328125, -2.6827392578125, -2.571014404296875, -2.45928955078125, -2.347564697265625, -2.23583984375, -2.124114990234375, -2.01239013671875, -1.900665283203125, -1.7889404296875, -1.677215576171875, -1.56549072265625, -1.453765869140625, -1.342041015625, -1.230316162109375, -1.11859130859375, -1.006866455078125, -0.8951416015625, -0.783416748046875, -0.67169189453125, -0.559967041015625, -0.4482421875, -0.336517333984375, -0.22479248046875, -0.113067626953125, -0.0013427734375, 0.110382080078125, 0.22210693359375, 0.333831787109375, 0.445556640625, 0.557281494140625, 0.66900634765625, 0.780731201171875, 0.8924560546875, 1.004180908203125, 1.11590576171875, 1.227630615234375, 1.33935546875, 1.451080322265625, 1.56280517578125, 1.674530029296875, 1.7862548828125, 1.897979736328125, 2.00970458984375, 2.121429443359375, 2.233154296875, 2.344879150390625, 2.45660400390625, 2.568328857421875, 2.6800537109375, 2.791778564453125, 2.90350341796875, 3.015228271484375, 3.126953125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 3.0, 7.0, 9.0, 6.0, 9.0, 12.0, 21.0, 19.0, 29.0, 43.0, 57.0, 99.0, 165.0, 234.0, 532.0, 935.0, 1763.0, 3297.0, 6138.0, 11366.0, 23861.0, 54550.0, 132031.0, 280638.0, 288268.0, 137476.0, 56802.0, 24658.0, 11951.0, 6273.0, 3355.0, 1708.0, 926.0, 535.0, 288.0, 167.0, 77.0, 52.0, 40.0, 29.0, 30.0, 21.0, 15.0, 14.0, 11.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-5.11328125, -4.95843505859375, -4.8035888671875, -4.64874267578125, -4.493896484375, -4.33905029296875, -4.1842041015625, -4.02935791015625, -3.87451171875, -3.71966552734375, -3.5648193359375, -3.40997314453125, -3.255126953125, -3.10028076171875, -2.9454345703125, -2.79058837890625, -2.6357421875, -2.48089599609375, -2.3260498046875, -2.17120361328125, -2.016357421875, -1.86151123046875, -1.7066650390625, -1.55181884765625, -1.39697265625, -1.24212646484375, -1.0872802734375, -0.93243408203125, -0.777587890625, -0.62274169921875, -0.4678955078125, -0.31304931640625, -0.158203125, -0.00335693359375, 0.1514892578125, 0.30633544921875, 0.461181640625, 0.61602783203125, 0.7708740234375, 0.92572021484375, 1.08056640625, 1.23541259765625, 1.3902587890625, 1.54510498046875, 1.699951171875, 1.85479736328125, 2.0096435546875, 2.16448974609375, 2.3193359375, 2.47418212890625, 2.6290283203125, 2.78387451171875, 2.938720703125, 3.09356689453125, 3.2484130859375, 3.40325927734375, 3.55810546875, 3.71295166015625, 3.8677978515625, 4.02264404296875, 4.177490234375, 4.33233642578125, 4.4871826171875, 4.64202880859375, 4.796875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 4.0, 3.0, 7.0, 13.0, 8.0, 7.0, 15.0, 16.0, 15.0, 20.0, 24.0, 18.0, 24.0, 35.0, 39.0, 39.0, 31.0, 60.0, 80.0, 160.0, 243.0, 1391.0, 229.0, 114.0, 73.0, 55.0, 44.0, 38.0, 42.0, 33.0, 27.0, 25.0, 15.0, 27.0, 11.0, 11.0, 10.0, 5.0, 8.0, 5.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.28125, -11.8912353515625, -11.501220703125, -11.1112060546875, -10.72119140625, -10.3311767578125, -9.941162109375, -9.5511474609375, -9.1611328125, -8.7711181640625, -8.381103515625, -7.9910888671875, -7.60107421875, -7.2110595703125, -6.821044921875, -6.4310302734375, -6.041015625, -5.6510009765625, -5.260986328125, -4.8709716796875, -4.48095703125, -4.0909423828125, -3.700927734375, -3.3109130859375, -2.9208984375, -2.5308837890625, -2.140869140625, -1.7508544921875, -1.36083984375, -0.9708251953125, -0.580810546875, -0.1907958984375, 0.19921875, 0.5892333984375, 0.979248046875, 1.3692626953125, 1.75927734375, 2.1492919921875, 2.539306640625, 2.9293212890625, 3.3193359375, 3.7093505859375, 4.099365234375, 4.4893798828125, 4.87939453125, 5.2694091796875, 5.659423828125, 6.0494384765625, 6.439453125, 6.8294677734375, 7.219482421875, 7.6094970703125, 7.99951171875, 8.3895263671875, 8.779541015625, 9.1695556640625, 9.5595703125, 9.9495849609375, 10.339599609375, 10.7296142578125, 11.11962890625, 11.5096435546875, 11.899658203125, 12.2896728515625, 12.6796875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 10.0, 9.0, 7.0, 12.0, 13.0, 22.0, 25.0, 28.0, 46.0, 53.0, 55.0, 75.0, 123.0, 166.0, 319.0, 605.0, 1951.0, 10109.0, 98246.0, 2349596.0, 645430.0, 31861.0, 4540.0, 1104.0, 424.0, 227.0, 155.0, 107.0, 82.0, 55.0, 42.0, 28.0, 35.0, 18.0, 22.0, 17.0, 19.0, 6.0, 5.0, 13.0, 11.0, 5.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-16.5625, -16.041259765625, -15.52001953125, -14.998779296875, -14.4775390625, -13.956298828125, -13.43505859375, -12.913818359375, -12.392578125, -11.871337890625, -11.35009765625, -10.828857421875, -10.3076171875, -9.786376953125, -9.26513671875, -8.743896484375, -8.22265625, -7.701416015625, -7.18017578125, -6.658935546875, -6.1376953125, -5.616455078125, -5.09521484375, -4.573974609375, -4.052734375, -3.531494140625, -3.01025390625, -2.489013671875, -1.9677734375, -1.446533203125, -0.92529296875, -0.404052734375, 0.1171875, 0.638427734375, 1.15966796875, 1.680908203125, 2.2021484375, 2.723388671875, 3.24462890625, 3.765869140625, 4.287109375, 4.808349609375, 5.32958984375, 5.850830078125, 6.3720703125, 6.893310546875, 7.41455078125, 7.935791015625, 8.45703125, 8.978271484375, 9.49951171875, 10.020751953125, 10.5419921875, 11.063232421875, 11.58447265625, 12.105712890625, 12.626953125, 13.148193359375, 13.66943359375, 14.190673828125, 14.7119140625, 15.233154296875, 15.75439453125, 16.275634765625, 16.796875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [11.0, 98.0, 421.0, 387.0, 84.0, 16.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.581006050109863, -6.396378517150879, -3.2117505073547363, -0.02712249755859375, 3.1575050354003906, 6.342132568359375, 9.526761054992676, 12.71138858795166, 15.896016120910645, 19.080644607543945, 22.26527214050293, 25.449899673461914, 28.6345272064209, 31.819154739379883, 35.0037841796875, 38.188411712646484, 41.37303924560547, 44.55766677856445, 47.74229431152344, 50.92692184448242, 54.111549377441406, 57.29617691040039, 60.480804443359375, 63.665435791015625, 66.85005950927734, 70.0346908569336, 73.21931457519531, 76.40394592285156, 79.58856964111328, 82.77320098876953, 85.95782470703125, 89.1424560546875, 92.32707977294922, 95.51171112060547, 98.69633483886719, 101.88096618652344, 105.06558990478516, 108.2502212524414, 111.43484497070312, 114.61947631835938, 117.8041000366211, 120.98873138427734, 124.17335510253906, 127.35798645019531, 130.54261779785156, 133.72723388671875, 136.911865234375, 140.09649658203125, 143.2811279296875, 146.46575927734375, 149.650390625, 152.8350067138672, 156.01963806152344, 159.2042694091797, 162.38890075683594, 165.57351684570312, 168.75814819335938, 171.94277954101562, 175.12741088867188, 178.31202697753906, 181.4966583251953, 184.68128967285156, 187.8659210205078, 191.050537109375, 194.23516845703125]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 4.0, 7.0, 9.0, 13.0, 23.0, 22.0, 23.0, 19.0, 23.0, 27.0, 30.0, 39.0, 39.0, 24.0, 49.0, 37.0, 42.0, 44.0, 51.0, 43.0, 35.0, 47.0, 33.0, 30.0, 31.0, 29.0, 33.0, 29.0, 17.0, 32.0, 18.0, 20.0, 12.0, 11.0, 11.0, 8.0, 8.0, 2.0, 4.0, 3.0, 5.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-35.528907775878906, -34.39859390258789, -33.268280029296875, -32.137962341308594, -31.00765037536621, -29.877334594726562, -28.747020721435547, -27.61670684814453, -26.486392974853516, -25.3560791015625, -24.22576332092285, -23.095449447631836, -21.96513557434082, -20.834819793701172, -19.704505920410156, -18.57419204711914, -17.443876266479492, -16.313562393188477, -15.183247566223145, -14.052932739257812, -12.922618865966797, -11.792304039001465, -10.661989212036133, -9.531675338745117, -8.401360511779785, -7.271046161651611, -6.1407318115234375, -5.0104169845581055, -3.8801026344299316, -2.749788284301758, -1.6194734573364258, -0.48915910720825195, 0.6411552429199219, 1.7714697122573853, 2.9017841815948486, 4.032098770141602, 5.162413120269775, 6.292727470397949, 7.423042297363281, 8.553356170654297, 9.683670997619629, 10.813985824584961, 11.944299697875977, 13.074614524841309, 14.20492935180664, 15.335243225097656, 16.465557098388672, 17.59587287902832, 18.726186752319336, 19.85650062561035, 20.98681640625, 22.117130279541016, 23.24744415283203, 24.377758026123047, 25.508073806762695, 26.63838768005371, 27.76870346069336, 28.899017333984375, 30.029333114624023, 31.15964698791504, 32.28996276855469, 33.4202766418457, 34.55059051513672, 35.680904388427734, 36.81121826171875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 10.0, 12.0, 8.0, 15.0, 21.0, 15.0, 11.0, 34.0, 33.0, 37.0, 32.0, 22.0, 41.0, 27.0, 41.0, 41.0, 42.0, 45.0, 43.0, 53.0, 28.0, 38.0, 35.0, 37.0, 26.0, 30.0, 31.0, 22.0, 13.0, 33.0, 13.0, 17.0, 18.0, 4.0, 9.0, 13.0, 6.0, 5.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-4.265625, -4.14398193359375, -4.0223388671875, -3.90069580078125, -3.779052734375, -3.65740966796875, -3.5357666015625, -3.41412353515625, -3.29248046875, -3.17083740234375, -3.0491943359375, -2.92755126953125, -2.805908203125, -2.68426513671875, -2.5626220703125, -2.44097900390625, -2.3193359375, -2.19769287109375, -2.0760498046875, -1.95440673828125, -1.832763671875, -1.71112060546875, -1.5894775390625, -1.46783447265625, -1.34619140625, -1.22454833984375, -1.1029052734375, -0.98126220703125, -0.859619140625, -0.73797607421875, -0.6163330078125, -0.49468994140625, -0.373046875, -0.25140380859375, -0.1297607421875, -0.00811767578125, 0.113525390625, 0.23516845703125, 0.3568115234375, 0.47845458984375, 0.60009765625, 0.72174072265625, 0.8433837890625, 0.96502685546875, 1.086669921875, 1.20831298828125, 1.3299560546875, 1.45159912109375, 1.5732421875, 1.69488525390625, 1.8165283203125, 1.93817138671875, 2.059814453125, 2.18145751953125, 2.3031005859375, 2.42474365234375, 2.54638671875, 2.66802978515625, 2.7896728515625, 2.91131591796875, 3.032958984375, 3.15460205078125, 3.2762451171875, 3.39788818359375, 3.51953125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 9.0, 9.0, 7.0, 10.0, 6.0, 14.0, 15.0, 17.0, 26.0, 35.0, 66.0, 128.0, 282.0, 610.0, 1627.0, 4679.0, 14376.0, 48346.0, 182278.0, 702769.0, 1847594.0, 1018841.0, 270377.0, 71259.0, 20539.0, 6536.0, 2183.0, 856.0, 343.0, 169.0, 88.0, 45.0, 29.0, 22.0, 26.0, 18.0, 7.0, 13.0, 9.0, 4.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.10546875, -5.92401123046875, -5.7425537109375, -5.56109619140625, -5.379638671875, -5.19818115234375, -5.0167236328125, -4.83526611328125, -4.65380859375, -4.47235107421875, -4.2908935546875, -4.10943603515625, -3.927978515625, -3.74652099609375, -3.5650634765625, -3.38360595703125, -3.2021484375, -3.02069091796875, -2.8392333984375, -2.65777587890625, -2.476318359375, -2.29486083984375, -2.1134033203125, -1.93194580078125, -1.75048828125, -1.56903076171875, -1.3875732421875, -1.20611572265625, -1.024658203125, -0.84320068359375, -0.6617431640625, -0.48028564453125, -0.298828125, -0.11737060546875, 0.0640869140625, 0.24554443359375, 0.427001953125, 0.60845947265625, 0.7899169921875, 0.97137451171875, 1.15283203125, 1.33428955078125, 1.5157470703125, 1.69720458984375, 1.878662109375, 2.06011962890625, 2.2415771484375, 2.42303466796875, 2.6044921875, 2.78594970703125, 2.9674072265625, 3.14886474609375, 3.330322265625, 3.51177978515625, 3.6932373046875, 3.87469482421875, 4.05615234375, 4.23760986328125, 4.4190673828125, 4.60052490234375, 4.781982421875, 4.96343994140625, 5.1448974609375, 5.32635498046875, 5.5078125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 4.0, 7.0, 6.0, 16.0, 19.0, 36.0, 39.0, 71.0, 87.0, 150.0, 207.0, 293.0, 414.0, 541.0, 560.0, 486.0, 351.0, 294.0, 156.0, 97.0, 82.0, 49.0, 30.0, 24.0, 16.0, 13.0, 5.0, 9.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3203125, -6.0789794921875, -5.837646484375, -5.5963134765625, -5.35498046875, -5.1136474609375, -4.872314453125, -4.6309814453125, -4.3896484375, -4.1483154296875, -3.906982421875, -3.6656494140625, -3.42431640625, -3.1829833984375, -2.941650390625, -2.7003173828125, -2.458984375, -2.2176513671875, -1.976318359375, -1.7349853515625, -1.49365234375, -1.2523193359375, -1.010986328125, -0.7696533203125, -0.5283203125, -0.2869873046875, -0.045654296875, 0.1956787109375, 0.43701171875, 0.6783447265625, 0.919677734375, 1.1610107421875, 1.40234375, 1.6436767578125, 1.885009765625, 2.1263427734375, 2.36767578125, 2.6090087890625, 2.850341796875, 3.0916748046875, 3.3330078125, 3.5743408203125, 3.815673828125, 4.0570068359375, 4.29833984375, 4.5396728515625, 4.781005859375, 5.0223388671875, 5.263671875, 5.5050048828125, 5.746337890625, 5.9876708984375, 6.22900390625, 6.4703369140625, 6.711669921875, 6.9530029296875, 7.1943359375, 7.4356689453125, 7.677001953125, 7.9183349609375, 8.15966796875, 8.4010009765625, 8.642333984375, 8.8836669921875, 9.125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 8.0, 8.0, 21.0, 25.0, 34.0, 50.0, 93.0, 133.0, 220.0, 414.0, 905.0, 3533.0, 44253.0, 1317846.0, 2713932.0, 104273.0, 6188.0, 1153.0, 500.0, 243.0, 158.0, 102.0, 62.0, 40.0, 27.0, 16.0, 17.0, 9.0, 1.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.46875, -21.8795166015625, -21.290283203125, -20.7010498046875, -20.11181640625, -19.5225830078125, -18.933349609375, -18.3441162109375, -17.7548828125, -17.1656494140625, -16.576416015625, -15.9871826171875, -15.39794921875, -14.8087158203125, -14.219482421875, -13.6302490234375, -13.041015625, -12.4517822265625, -11.862548828125, -11.2733154296875, -10.68408203125, -10.0948486328125, -9.505615234375, -8.9163818359375, -8.3271484375, -7.7379150390625, -7.148681640625, -6.5594482421875, -5.97021484375, -5.3809814453125, -4.791748046875, -4.2025146484375, -3.61328125, -3.0240478515625, -2.434814453125, -1.8455810546875, -1.25634765625, -0.6671142578125, -0.077880859375, 0.5113525390625, 1.1005859375, 1.6898193359375, 2.279052734375, 2.8682861328125, 3.45751953125, 4.0467529296875, 4.635986328125, 5.2252197265625, 5.814453125, 6.4036865234375, 6.992919921875, 7.5821533203125, 8.17138671875, 8.7606201171875, 9.349853515625, 9.9390869140625, 10.5283203125, 11.1175537109375, 11.706787109375, 12.2960205078125, 12.88525390625, 13.4744873046875, 14.063720703125, 14.6529541015625, 15.2421875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 25.0, 96.0, 238.0, 276.0, 224.0, 109.0, 30.0, 10.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.45670700073242, -43.01179504394531, -40.5668830871582, -38.121971130371094, -35.67705535888672, -33.23214340209961, -30.7872314453125, -28.342317581176758, -25.89740562438965, -23.45249366760254, -21.007579803466797, -18.562667846679688, -16.117755889892578, -13.672842025756836, -11.227930068969727, -8.783016204833984, -6.338104248046875, -3.8931915760040283, -1.4482789039611816, 0.9966335296630859, 3.4415464401245117, 5.8864593505859375, 8.331371307373047, 10.776285171508789, 13.221197128295898, 15.666110038757324, 18.11102294921875, 20.55593490600586, 23.00084686279297, 25.44576072692871, 27.89067268371582, 30.335586547851562, 32.780494689941406, 35.225406646728516, 37.670318603515625, 40.115234375, 42.56014633178711, 45.00505828857422, 47.44997024536133, 49.89488220214844, 52.33979797363281, 54.78470993041992, 57.22962188720703, 59.674537658691406, 62.119449615478516, 64.56436157226562, 67.00927734375, 69.45418548583984, 71.89909362792969, 74.34400939941406, 76.7889175415039, 79.23383331298828, 81.67874145507812, 84.1236572265625, 86.56857299804688, 89.01348114013672, 91.4583969116211, 93.90331268310547, 96.34822082519531, 98.79313659667969, 101.23804473876953, 103.6829605102539, 106.12786865234375, 108.57278442382812, 111.0177001953125]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 1.0, 2.0, 4.0, 9.0, 9.0, 8.0, 10.0, 10.0, 9.0, 14.0, 9.0, 17.0, 14.0, 22.0, 30.0, 35.0, 28.0, 30.0, 32.0, 33.0, 36.0, 37.0, 38.0, 34.0, 33.0, 38.0, 45.0, 37.0, 40.0, 30.0, 36.0, 27.0, 20.0, 25.0, 21.0, 13.0, 27.0, 26.0, 21.0, 12.0, 15.0, 10.0, 10.0, 7.0, 11.0, 7.0, 6.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.797183990478516, -19.18671226501465, -18.576242446899414, -17.965770721435547, -17.35529899597168, -16.744827270507812, -16.134357452392578, -15.523885726928711, -14.913414001464844, -14.302943229675293, -13.692471504211426, -13.082000732421875, -12.471529006958008, -11.861058235168457, -11.250587463378906, -10.640115737915039, -10.029644966125488, -9.419174194335938, -8.80870246887207, -8.19823169708252, -7.587759971618652, -6.977289199829102, -6.366817951202393, -5.756346702575684, -5.145875453948975, -4.535404205322266, -3.9249329566955566, -3.3144619464874268, -2.7039906978607178, -2.093519449234009, -1.483048439025879, -0.8725771903991699, -0.26210594177246094, 0.34836524724960327, 0.9588364362716675, 1.569307565689087, 2.179778814315796, 2.790250062942505, 3.4007210731506348, 4.011192321777344, 4.621663570404053, 5.232134819030762, 5.842606067657471, 6.45307731628418, 7.0635480880737305, 7.674019813537598, 8.284490585327148, 8.894962310791016, 9.505433082580566, 10.115903854370117, 10.726375579833984, 11.336846351623535, 11.947318077087402, 12.557788848876953, 13.16826057434082, 13.778731346130371, 14.389202117919922, 14.999672889709473, 15.61014461517334, 16.22061538696289, 16.831087112426758, 17.441558837890625, 18.05202865600586, 18.662500381469727, 19.272972106933594]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 10.0, 11.0, 16.0, 16.0, 19.0, 22.0, 26.0, 32.0, 22.0, 38.0, 41.0, 39.0, 36.0, 31.0, 42.0, 51.0, 49.0, 43.0, 37.0, 30.0, 37.0, 33.0, 33.0, 35.0, 31.0, 33.0, 19.0, 22.0, 17.0, 15.0, 21.0, 15.0, 9.0, 8.0, 7.0, 6.0, 6.0, 4.0, 7.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.33203125, -4.207550048828125, -4.08306884765625, -3.958587646484375, -3.8341064453125, -3.709625244140625, -3.58514404296875, -3.460662841796875, -3.336181640625, -3.211700439453125, -3.08721923828125, -2.962738037109375, -2.8382568359375, -2.713775634765625, -2.58929443359375, -2.464813232421875, -2.34033203125, -2.215850830078125, -2.09136962890625, -1.966888427734375, -1.8424072265625, -1.717926025390625, -1.59344482421875, -1.468963623046875, -1.344482421875, -1.220001220703125, -1.09552001953125, -0.971038818359375, -0.8465576171875, -0.722076416015625, -0.59759521484375, -0.473114013671875, -0.3486328125, -0.224151611328125, -0.09967041015625, 0.024810791015625, 0.1492919921875, 0.273773193359375, 0.39825439453125, 0.522735595703125, 0.647216796875, 0.771697998046875, 0.89617919921875, 1.020660400390625, 1.1451416015625, 1.269622802734375, 1.39410400390625, 1.518585205078125, 1.64306640625, 1.767547607421875, 1.89202880859375, 2.016510009765625, 2.1409912109375, 2.265472412109375, 2.38995361328125, 2.514434814453125, 2.638916015625, 2.763397216796875, 2.88787841796875, 3.012359619140625, 3.1368408203125, 3.261322021484375, 3.38580322265625, 3.510284423828125, 3.634765625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 9.0, 7.0, 25.0, 35.0, 48.0, 92.0, 130.0, 216.0, 327.0, 511.0, 791.0, 1243.0, 1880.0, 3014.0, 4808.0, 7724.0, 12604.0, 21007.0, 35911.0, 64294.0, 123078.0, 349525.0, 204421.0, 92718.0, 50606.0, 28680.0, 17037.0, 10355.0, 6394.0, 4090.0, 2545.0, 1606.0, 1036.0, 656.0, 383.0, 262.0, 165.0, 109.0, 62.0, 53.0, 35.0, 18.0, 11.0, 14.0, 8.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.20654296875, -0.2006072998046875, -0.194671630859375, -0.1887359619140625, -0.18280029296875, -0.1768646240234375, -0.170928955078125, -0.1649932861328125, -0.1590576171875, -0.1531219482421875, -0.147186279296875, -0.1412506103515625, -0.13531494140625, -0.1293792724609375, -0.123443603515625, -0.1175079345703125, -0.111572265625, -0.1056365966796875, -0.099700927734375, -0.0937652587890625, -0.08782958984375, -0.0818939208984375, -0.075958251953125, -0.0700225830078125, -0.0640869140625, -0.0581512451171875, -0.052215576171875, -0.0462799072265625, -0.04034423828125, -0.0344085693359375, -0.028472900390625, -0.0225372314453125, -0.0166015625, -0.0106658935546875, -0.004730224609375, 0.0012054443359375, 0.00714111328125, 0.0130767822265625, 0.019012451171875, 0.0249481201171875, 0.0308837890625, 0.0368194580078125, 0.042755126953125, 0.0486907958984375, 0.05462646484375, 0.0605621337890625, 0.066497802734375, 0.0724334716796875, 0.078369140625, 0.0843048095703125, 0.090240478515625, 0.0961761474609375, 0.10211181640625, 0.1080474853515625, 0.113983154296875, 0.1199188232421875, 0.1258544921875, 0.1317901611328125, 0.137725830078125, 0.1436614990234375, 0.14959716796875, 0.1555328369140625, 0.161468505859375, 0.1674041748046875, 0.17333984375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 4.0, 14.0, 16.0, 15.0, 16.0, 19.0, 17.0, 28.0, 26.0, 21.0, 46.0, 28.0, 36.0, 30.0, 39.0, 42.0, 43.0, 42.0, 1065.0, 40.0, 53.0, 34.0, 37.0, 33.0, 31.0, 27.0, 26.0, 27.0, 23.0, 18.0, 24.0, 11.0, 15.0, 12.0, 9.0, 12.0, 9.0, 7.0, 4.0, 9.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.78125, -2.6929931640625, -2.604736328125, -2.5164794921875, -2.42822265625, -2.3399658203125, -2.251708984375, -2.1634521484375, -2.0751953125, -1.9869384765625, -1.898681640625, -1.8104248046875, -1.72216796875, -1.6339111328125, -1.545654296875, -1.4573974609375, -1.369140625, -1.2808837890625, -1.192626953125, -1.1043701171875, -1.01611328125, -0.9278564453125, -0.839599609375, -0.7513427734375, -0.6630859375, -0.5748291015625, -0.486572265625, -0.3983154296875, -0.31005859375, -0.2218017578125, -0.133544921875, -0.0452880859375, 0.04296875, 0.1312255859375, 0.219482421875, 0.3077392578125, 0.39599609375, 0.4842529296875, 0.572509765625, 0.6607666015625, 0.7490234375, 0.8372802734375, 0.925537109375, 1.0137939453125, 1.10205078125, 1.1903076171875, 1.278564453125, 1.3668212890625, 1.455078125, 1.5433349609375, 1.631591796875, 1.7198486328125, 1.80810546875, 1.8963623046875, 1.984619140625, 2.0728759765625, 2.1611328125, 2.2493896484375, 2.337646484375, 2.4259033203125, 2.51416015625, 2.6024169921875, 2.690673828125, 2.7789306640625, 2.8671875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 19.0, 23.0, 33.0, 47.0, 64.0, 97.0, 146.0, 201.0, 308.0, 472.0, 642.0, 955.0, 1507.0, 2073.0, 3018.0, 4486.0, 6296.0, 9379.0, 13904.0, 20435.0, 30686.0, 48242.0, 79338.0, 148734.0, 1357225.0, 147138.0, 79005.0, 48144.0, 30937.0, 20473.0, 13607.0, 9257.0, 6540.0, 4262.0, 2943.0, 2036.0, 1369.0, 988.0, 622.0, 491.0, 292.0, 229.0, 153.0, 88.0, 71.0, 52.0, 32.0, 23.0, 18.0, 11.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.0826416015625, -0.08009815216064453, -0.07755470275878906, -0.0750112533569336, -0.07246780395507812, -0.06992435455322266, -0.06738090515136719, -0.06483745574951172, -0.06229400634765625, -0.05975055694580078, -0.05720710754394531, -0.054663658142089844, -0.052120208740234375, -0.049576759338378906, -0.04703330993652344, -0.04448986053466797, -0.0419464111328125, -0.03940296173095703, -0.03685951232910156, -0.034316062927246094, -0.031772613525390625, -0.029229164123535156, -0.026685714721679688, -0.02414226531982422, -0.02159881591796875, -0.01905536651611328, -0.016511917114257812, -0.013968467712402344, -0.011425018310546875, -0.008881568908691406, -0.0063381195068359375, -0.0037946701049804688, -0.001251220703125, 0.0012922286987304688, 0.0038356781005859375, 0.006379127502441406, 0.008922576904296875, 0.011466026306152344, 0.014009475708007812, 0.01655292510986328, 0.01909637451171875, 0.02163982391357422, 0.024183273315429688, 0.026726722717285156, 0.029270172119140625, 0.031813621520996094, 0.03435707092285156, 0.03690052032470703, 0.0394439697265625, 0.04198741912841797, 0.04453086853027344, 0.047074317932128906, 0.049617767333984375, 0.052161216735839844, 0.05470466613769531, 0.05724811553955078, 0.05979156494140625, 0.06233501434326172, 0.06487846374511719, 0.06742191314697266, 0.06996536254882812, 0.0725088119506836, 0.07505226135253906, 0.07759571075439453, 0.08013916015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 1.0, 8.0, 7.0, 20.0, 8.0, 10.0, 13.0, 33.0, 20.0, 25.0, 20.0, 51.0, 38.0, 56.0, 62.0, 271.0, 37.0, 41.0, 35.0, 27.0, 34.0, 20.0, 17.0, 12.0, 26.0, 13.0, 11.0, 11.0, 8.0, 5.0, 6.0, 7.0, 8.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1457672119140625e-06, -2.0721927285194397e-06, -1.998618245124817e-06, -1.925043761730194e-06, -1.8514692783355713e-06, -1.7778947949409485e-06, -1.7043203115463257e-06, -1.6307458281517029e-06, -1.55717134475708e-06, -1.4835968613624573e-06, -1.4100223779678345e-06, -1.3364478945732117e-06, -1.2628734111785889e-06, -1.189298927783966e-06, -1.1157244443893433e-06, -1.0421499609947205e-06, -9.685754776000977e-07, -8.950009942054749e-07, -8.21426510810852e-07, -7.478520274162292e-07, -6.742775440216064e-07, -6.007030606269836e-07, -5.271285772323608e-07, -4.5355409383773804e-07, -3.7997961044311523e-07, -3.0640512704849243e-07, -2.3283064365386963e-07, -1.5925616025924683e-07, -8.568167686462402e-08, -1.210719347000122e-08, 6.146728992462158e-08, 1.3504177331924438e-07, 2.086162567138672e-07, 2.8219074010849e-07, 3.557652235031128e-07, 4.293397068977356e-07, 5.029141902923584e-07, 5.764886736869812e-07, 6.50063157081604e-07, 7.236376404762268e-07, 7.972121238708496e-07, 8.707866072654724e-07, 9.443610906600952e-07, 1.017935574054718e-06, 1.0915100574493408e-06, 1.1650845408439636e-06, 1.2386590242385864e-06, 1.3122335076332092e-06, 1.385807991027832e-06, 1.4593824744224548e-06, 1.5329569578170776e-06, 1.6065314412117004e-06, 1.6801059246063232e-06, 1.753680408000946e-06, 1.8272548913955688e-06, 1.9008293747901917e-06, 1.9744038581848145e-06, 2.0479783415794373e-06, 2.12155282497406e-06, 2.195127308368683e-06, 2.2687017917633057e-06, 2.3422762751579285e-06, 2.4158507585525513e-06, 2.489425241947174e-06, 2.562999725341797e-06]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 2.0, 9.0, 7.0, 7.0, 6.0, 21.0, 27.0, 18.0, 25.0, 39.0, 43.0, 73.0, 95.0, 191.0, 280.0, 865.0, 185019.0, 859306.0, 1621.0, 303.0, 163.0, 131.0, 54.0, 47.0, 38.0, 35.0, 18.0, 25.0, 13.0, 18.0, 7.0, 4.0, 1.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.716085433959961e-05, -5.553197115659714e-05, -5.3903087973594666e-05, -5.2274204790592194e-05, -5.064532160758972e-05, -4.901643842458725e-05, -4.738755524158478e-05, -4.5758672058582306e-05, -4.4129788875579834e-05, -4.250090569257736e-05, -4.087202250957489e-05, -3.924313932657242e-05, -3.7614256143569946e-05, -3.5985372960567474e-05, -3.4356489777565e-05, -3.272760659456253e-05, -3.109872341156006e-05, -2.9469840228557587e-05, -2.7840957045555115e-05, -2.6212073862552643e-05, -2.458319067955017e-05, -2.29543074965477e-05, -2.1325424313545227e-05, -1.9696541130542755e-05, -1.8067657947540283e-05, -1.643877476453781e-05, -1.480989158153534e-05, -1.3181008398532867e-05, -1.1552125215530396e-05, -9.923242032527924e-06, -8.294358849525452e-06, -6.66547566652298e-06, -5.036592483520508e-06, -3.407709300518036e-06, -1.778826117515564e-06, -1.4994293451309204e-07, 1.4789402484893799e-06, 3.107823431491852e-06, 4.736706614494324e-06, 6.365589797496796e-06, 7.994472980499268e-06, 9.62335616350174e-06, 1.1252239346504211e-05, 1.2881122529506683e-05, 1.4510005712509155e-05, 1.6138888895511627e-05, 1.77677720785141e-05, 1.939665526151657e-05, 2.1025538444519043e-05, 2.2654421627521515e-05, 2.4283304810523987e-05, 2.591218799352646e-05, 2.754107117652893e-05, 2.9169954359531403e-05, 3.0798837542533875e-05, 3.2427720725536346e-05, 3.405660390853882e-05, 3.568548709154129e-05, 3.731437027454376e-05, 3.8943253457546234e-05, 4.0572136640548706e-05, 4.220101982355118e-05, 4.382990300655365e-05, 4.545878618955612e-05, 4.7087669372558594e-05]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 25.0, 429.0, 537.0, 29.0], "bins": [-1.535175761091523e-05, -1.5104257727216464e-05, -1.4856757843517698e-05, -1.4609257959818933e-05, -1.4361758076120168e-05, -1.4114258192421403e-05, -1.3866758308722638e-05, -1.3619258425023872e-05, -1.3371758541325107e-05, -1.3124258657626342e-05, -1.2876758773927577e-05, -1.2629258890228812e-05, -1.2381759006530046e-05, -1.2134259122831281e-05, -1.1886759239132516e-05, -1.1639259355433751e-05, -1.1391759471734986e-05, -1.114425958803622e-05, -1.0896759704337455e-05, -1.064925982063869e-05, -1.0401759936939925e-05, -1.015426005324116e-05, -9.906760169542395e-06, -9.65926028584363e-06, -9.411759492650162e-06, -9.164259608951397e-06, -8.916759725252632e-06, -8.669259841553867e-06, -8.421759957855102e-06, -8.174260074156336e-06, -7.926760190457571e-06, -7.679260306758806e-06, -7.431760877807392e-06, -7.184260994108627e-06, -6.9367611104098614e-06, -6.689261226711096e-06, -6.441761343012331e-06, -6.194261459313566e-06, -5.94676112086745e-06, -5.699261237168685e-06, -5.45176180821727e-06, -5.204261924518505e-06, -4.95676204081974e-06, -4.709262157120975e-06, -4.4617622734222095e-06, -4.214262389723444e-06, -3.966762051277328e-06, -3.7192623949522385e-06, -3.471762283879798e-06, -3.2242624001810327e-06, -2.9767625164822675e-06, -2.7292626327835023e-06, -2.481762749084737e-06, -2.234262865385972e-06, -1.9867627543135313e-06, -1.7392628706147661e-06, -1.4917631006028387e-06, -1.2442632169040735e-06, -9.967632195184706e-07, -7.492633358197054e-07, -5.017634521209402e-07, -2.54263568422175e-07, -6.7635710365721025e-09, 2.407363126621931e-07, 4.882361963609583e-07]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 0.0, 9.0, 0.0, 11.0, 13.0, 0.0, 23.0, 24.0, 0.0, 38.0, 0.0, 52.0, 58.0, 0.0, 89.0, 0.0, 105.0, 130.0, 0.0, 118.0, 0.0, 79.0, 85.0, 0.0, 46.0, 0.0, 34.0, 23.0, 0.0, 29.0, 13.0, 0.0, 6.0, 0.0, 7.0, 10.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1557713150978088e-06, -1.1194497346878052e-06, -1.0831281542778015e-06, -1.0468065738677979e-06, -1.0104849934577942e-06, -9.741634130477905e-07, -9.378418326377869e-07, -9.015202522277832e-07, -8.651986718177795e-07, -8.288770914077759e-07, -7.925555109977722e-07, -7.562339305877686e-07, -7.199123501777649e-07, -6.835907697677612e-07, -6.472691893577576e-07, -6.109476089477539e-07, -5.746260285377502e-07, -5.383044481277466e-07, -5.019828677177429e-07, -4.6566128730773926e-07, -4.293397068977356e-07, -3.9301812648773193e-07, -3.5669654607772827e-07, -3.203749656677246e-07, -2.8405338525772095e-07, -2.477318048477173e-07, -2.1141022443771362e-07, -1.7508864402770996e-07, -1.387670636177063e-07, -1.0244548320770264e-07, -6.612390279769897e-08, -2.9802322387695312e-08, 6.51925802230835e-09, 4.284083843231201e-08, 7.916241884231567e-08, 1.1548399925231934e-07, 1.51805579662323e-07, 1.8812716007232666e-07, 2.2444874048233032e-07, 2.60770320892334e-07, 2.9709190130233765e-07, 3.334134817123413e-07, 3.6973506212234497e-07, 4.0605664253234863e-07, 4.423782229423523e-07, 4.78699803352356e-07, 5.150213837623596e-07, 5.513429641723633e-07, 5.876645445823669e-07, 6.239861249923706e-07, 6.603077054023743e-07, 6.966292858123779e-07, 7.329508662223816e-07, 7.692724466323853e-07, 8.055940270423889e-07, 8.419156074523926e-07, 8.782371878623962e-07, 9.145587682723999e-07, 9.508803486824036e-07, 9.872019290924072e-07, 1.0235235095024109e-06, 1.0598450899124146e-06, 1.0961666703224182e-06, 1.1324882507324219e-06]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 10.0, 11.0, 16.0, 16.0, 19.0, 22.0, 26.0, 32.0, 22.0, 38.0, 41.0, 39.0, 36.0, 31.0, 42.0, 51.0, 49.0, 43.0, 37.0, 30.0, 37.0, 33.0, 33.0, 35.0, 31.0, 33.0, 19.0, 22.0, 17.0, 15.0, 21.0, 15.0, 9.0, 8.0, 7.0, 6.0, 6.0, 4.0, 7.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.33203125, -4.207550048828125, -4.08306884765625, -3.958587646484375, -3.8341064453125, -3.709625244140625, -3.58514404296875, -3.460662841796875, -3.336181640625, -3.211700439453125, -3.08721923828125, -2.962738037109375, -2.8382568359375, -2.713775634765625, -2.58929443359375, -2.464813232421875, -2.34033203125, -2.215850830078125, -2.09136962890625, -1.966888427734375, -1.8424072265625, -1.717926025390625, -1.59344482421875, -1.468963623046875, -1.344482421875, -1.220001220703125, -1.09552001953125, -0.971038818359375, -0.8465576171875, -0.722076416015625, -0.59759521484375, -0.473114013671875, -0.3486328125, -0.224151611328125, -0.09967041015625, 0.024810791015625, 0.1492919921875, 0.273773193359375, 0.39825439453125, 0.522735595703125, 0.647216796875, 0.771697998046875, 0.89617919921875, 1.020660400390625, 1.1451416015625, 1.269622802734375, 1.39410400390625, 1.518585205078125, 1.64306640625, 1.767547607421875, 1.89202880859375, 2.016510009765625, 2.1409912109375, 2.265472412109375, 2.38995361328125, 2.514434814453125, 2.638916015625, 2.763397216796875, 2.88787841796875, 3.012359619140625, 3.1368408203125, 3.261322021484375, 3.38580322265625, 3.510284423828125, 3.634765625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 5.0, 5.0, 9.0, 10.0, 16.0, 17.0, 21.0, 26.0, 37.0, 44.0, 59.0, 75.0, 120.0, 170.0, 307.0, 520.0, 1005.0, 1831.0, 3382.0, 6454.0, 12499.0, 26664.0, 65702.0, 252236.0, 486996.0, 113482.0, 40210.0, 17767.0, 8760.0, 4580.0, 2442.0, 1300.0, 723.0, 359.0, 187.0, 112.0, 88.0, 68.0, 60.0, 31.0, 40.0, 28.0, 22.0, 12.0, 17.0, 12.0, 12.0, 13.0, 8.0, 3.0, 6.0, 4.0, 1.0, 2.0], "bins": [-6.90234375, -6.70074462890625, -6.4991455078125, -6.29754638671875, -6.095947265625, -5.89434814453125, -5.6927490234375, -5.49114990234375, -5.28955078125, -5.08795166015625, -4.8863525390625, -4.68475341796875, -4.483154296875, -4.28155517578125, -4.0799560546875, -3.87835693359375, -3.6767578125, -3.47515869140625, -3.2735595703125, -3.07196044921875, -2.870361328125, -2.66876220703125, -2.4671630859375, -2.26556396484375, -2.06396484375, -1.86236572265625, -1.6607666015625, -1.45916748046875, -1.257568359375, -1.05596923828125, -0.8543701171875, -0.65277099609375, -0.451171875, -0.24957275390625, -0.0479736328125, 0.15362548828125, 0.355224609375, 0.55682373046875, 0.7584228515625, 0.96002197265625, 1.16162109375, 1.36322021484375, 1.5648193359375, 1.76641845703125, 1.968017578125, 2.16961669921875, 2.3712158203125, 2.57281494140625, 2.7744140625, 2.97601318359375, 3.1776123046875, 3.37921142578125, 3.580810546875, 3.78240966796875, 3.9840087890625, 4.18560791015625, 4.38720703125, 4.58880615234375, 4.7904052734375, 4.99200439453125, 5.193603515625, 5.39520263671875, 5.5968017578125, 5.79840087890625, 6.0]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 3.0, 3.0, 6.0, 6.0, 12.0, 12.0, 14.0, 11.0, 17.0, 13.0, 18.0, 16.0, 25.0, 24.0, 36.0, 37.0, 37.0, 42.0, 60.0, 65.0, 87.0, 203.0, 1413.0, 261.0, 128.0, 72.0, 64.0, 43.0, 44.0, 37.0, 26.0, 26.0, 32.0, 20.0, 17.0, 27.0, 9.0, 21.0, 6.0, 14.0, 10.0, 8.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2578125, -9.9127197265625, -9.567626953125, -9.2225341796875, -8.87744140625, -8.5323486328125, -8.187255859375, -7.8421630859375, -7.4970703125, -7.1519775390625, -6.806884765625, -6.4617919921875, -6.11669921875, -5.7716064453125, -5.426513671875, -5.0814208984375, -4.736328125, -4.3912353515625, -4.046142578125, -3.7010498046875, -3.35595703125, -3.0108642578125, -2.665771484375, -2.3206787109375, -1.9755859375, -1.6304931640625, -1.285400390625, -0.9403076171875, -0.59521484375, -0.2501220703125, 0.094970703125, 0.4400634765625, 0.78515625, 1.1302490234375, 1.475341796875, 1.8204345703125, 2.16552734375, 2.5106201171875, 2.855712890625, 3.2008056640625, 3.5458984375, 3.8909912109375, 4.236083984375, 4.5811767578125, 4.92626953125, 5.2713623046875, 5.616455078125, 5.9615478515625, 6.306640625, 6.6517333984375, 6.996826171875, 7.3419189453125, 7.68701171875, 8.0321044921875, 8.377197265625, 8.7222900390625, 9.0673828125, 9.4124755859375, 9.757568359375, 10.1026611328125, 10.44775390625, 10.7928466796875, 11.137939453125, 11.4830322265625, 11.828125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 7.0, 7.0, 9.0, 14.0, 14.0, 16.0, 22.0, 25.0, 28.0, 27.0, 38.0, 48.0, 72.0, 97.0, 161.0, 193.0, 301.0, 642.0, 2076.0, 9735.0, 66844.0, 2120473.0, 894012.0, 40770.0, 6914.0, 1635.0, 531.0, 268.0, 171.0, 116.0, 100.0, 69.0, 52.0, 43.0, 23.0, 15.0, 18.0, 21.0, 17.0, 19.0, 14.0, 9.0, 3.0, 8.0, 3.0, 4.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.8125, -16.3013916015625, -15.790283203125, -15.2791748046875, -14.76806640625, -14.2569580078125, -13.745849609375, -13.2347412109375, -12.7236328125, -12.2125244140625, -11.701416015625, -11.1903076171875, -10.67919921875, -10.1680908203125, -9.656982421875, -9.1458740234375, -8.634765625, -8.1236572265625, -7.612548828125, -7.1014404296875, -6.59033203125, -6.0792236328125, -5.568115234375, -5.0570068359375, -4.5458984375, -4.0347900390625, -3.523681640625, -3.0125732421875, -2.50146484375, -1.9903564453125, -1.479248046875, -0.9681396484375, -0.45703125, 0.0540771484375, 0.565185546875, 1.0762939453125, 1.58740234375, 2.0985107421875, 2.609619140625, 3.1207275390625, 3.6318359375, 4.1429443359375, 4.654052734375, 5.1651611328125, 5.67626953125, 6.1873779296875, 6.698486328125, 7.2095947265625, 7.720703125, 8.2318115234375, 8.742919921875, 9.2540283203125, 9.76513671875, 10.2762451171875, 10.787353515625, 11.2984619140625, 11.8095703125, 12.3206787109375, 12.831787109375, 13.3428955078125, 13.85400390625, 14.3651123046875, 14.876220703125, 15.3873291015625, 15.8984375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 14.0, 132.0, 414.0, 359.0, 88.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.984806060791016, -14.138572692871094, -11.292338371276855, -8.446104049682617, -5.599870681762695, -2.7536373138427734, 0.09259796142578125, 2.938831329345703, 5.785064697265625, 8.631298065185547, 11.477532386779785, 14.323766708374023, 17.170000076293945, 20.016233444213867, 22.862468719482422, 25.708702087402344, 28.554935455322266, 31.401168823242188, 34.24740219116211, 37.09363555908203, 39.93987274169922, 42.786102294921875, 45.63233947753906, 48.478572845458984, 51.324806213378906, 54.17103958129883, 57.01727294921875, 59.86351013183594, 62.709739685058594, 65.55597686767578, 68.40220642089844, 71.24844360351562, 74.09468078613281, 76.94091796875, 79.78714752197266, 82.63338470458984, 85.4796142578125, 88.32585144042969, 91.17208862304688, 94.01831817626953, 96.86454772949219, 99.71078491210938, 102.55701446533203, 105.40325164794922, 108.24948120117188, 111.09571838378906, 113.94195556640625, 116.7881851196289, 119.6344223022461, 122.48065948486328, 125.32688903808594, 128.17312622070312, 131.0193634033203, 133.86558532714844, 136.71182250976562, 139.5580596923828, 142.404296875, 145.2505340576172, 148.09677124023438, 150.9429931640625, 153.7892303466797, 156.63546752929688, 159.48170471191406, 162.32794189453125, 165.17416381835938]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 1.0, 2.0, 9.0, 7.0, 10.0, 10.0, 15.0, 13.0, 12.0, 17.0, 16.0, 22.0, 15.0, 24.0, 27.0, 42.0, 29.0, 35.0, 28.0, 40.0, 32.0, 49.0, 36.0, 46.0, 44.0, 57.0, 41.0, 30.0, 38.0, 33.0, 27.0, 26.0, 26.0, 21.0, 20.0, 20.0, 26.0, 17.0, 14.0, 1.0, 10.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.67845916748047, -34.64162063598633, -33.60478210449219, -32.56794357299805, -31.531105041503906, -30.494266510009766, -29.457429885864258, -28.420591354370117, -27.383752822875977, -26.346914291381836, -25.310075759887695, -24.273237228393555, -23.236400604248047, -22.199562072753906, -21.162723541259766, -20.125885009765625, -19.089046478271484, -18.052207946777344, -17.015369415283203, -15.978531837463379, -14.941693305969238, -13.904854774475098, -12.868017196655273, -11.831178665161133, -10.794340133666992, -9.757501602172852, -8.720663070678711, -7.683825492858887, -6.646986961364746, -5.6101484298706055, -4.573310375213623, -3.5364723205566406, -2.4996376037597656, -1.462799310684204, -0.4259610176086426, 0.610877275466919, 1.6477155685424805, 2.684554100036621, 3.7213921546936035, 4.758230209350586, 5.795068740844727, 6.831907272338867, 7.86874532699585, 8.905583381652832, 9.942421913146973, 10.979260444641113, 12.016098022460938, 13.052936553955078, 14.089775085449219, 15.12661361694336, 16.1634521484375, 17.20029067993164, 18.23712921142578, 19.273967742919922, 20.31080436706543, 21.34764289855957, 22.38448143005371, 23.42131996154785, 24.458158493041992, 25.494997024536133, 26.53183364868164, 27.56867218017578, 28.605510711669922, 29.642349243164062, 30.679187774658203]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 3.0, 5.0, 7.0, 10.0, 5.0, 13.0, 18.0, 15.0, 25.0, 15.0, 31.0, 20.0, 23.0, 33.0, 32.0, 32.0, 38.0, 43.0, 47.0, 41.0, 33.0, 32.0, 45.0, 36.0, 34.0, 26.0, 39.0, 36.0, 27.0, 27.0, 22.0, 22.0, 19.0, 18.0, 19.0, 16.0, 10.0, 15.0, 15.0, 9.0, 7.0, 9.0, 10.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 4.0], "bins": [-4.26171875, -4.137939453125, -4.01416015625, -3.890380859375, -3.7666015625, -3.642822265625, -3.51904296875, -3.395263671875, -3.271484375, -3.147705078125, -3.02392578125, -2.900146484375, -2.7763671875, -2.652587890625, -2.52880859375, -2.405029296875, -2.28125, -2.157470703125, -2.03369140625, -1.909912109375, -1.7861328125, -1.662353515625, -1.53857421875, -1.414794921875, -1.291015625, -1.167236328125, -1.04345703125, -0.919677734375, -0.7958984375, -0.672119140625, -0.54833984375, -0.424560546875, -0.30078125, -0.177001953125, -0.05322265625, 0.070556640625, 0.1943359375, 0.318115234375, 0.44189453125, 0.565673828125, 0.689453125, 0.813232421875, 0.93701171875, 1.060791015625, 1.1845703125, 1.308349609375, 1.43212890625, 1.555908203125, 1.6796875, 1.803466796875, 1.92724609375, 2.051025390625, 2.1748046875, 2.298583984375, 2.42236328125, 2.546142578125, 2.669921875, 2.793701171875, 2.91748046875, 3.041259765625, 3.1650390625, 3.288818359375, 3.41259765625, 3.536376953125, 3.66015625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 7.0, 14.0, 17.0, 20.0, 38.0, 53.0, 80.0, 154.0, 293.0, 688.0, 1453.0, 3631.0, 9231.0, 25157.0, 72570.0, 220079.0, 689725.0, 1631903.0, 1032633.0, 337620.0, 108799.0, 37463.0, 13474.0, 5151.0, 2079.0, 901.0, 486.0, 232.0, 116.0, 64.0, 46.0, 30.0, 19.0, 18.0, 12.0, 6.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.74609375, -5.5804443359375, -5.414794921875, -5.2491455078125, -5.08349609375, -4.9178466796875, -4.752197265625, -4.5865478515625, -4.4208984375, -4.2552490234375, -4.089599609375, -3.9239501953125, -3.75830078125, -3.5926513671875, -3.427001953125, -3.2613525390625, -3.095703125, -2.9300537109375, -2.764404296875, -2.5987548828125, -2.43310546875, -2.2674560546875, -2.101806640625, -1.9361572265625, -1.7705078125, -1.6048583984375, -1.439208984375, -1.2735595703125, -1.10791015625, -0.9422607421875, -0.776611328125, -0.6109619140625, -0.4453125, -0.2796630859375, -0.114013671875, 0.0516357421875, 0.21728515625, 0.3829345703125, 0.548583984375, 0.7142333984375, 0.8798828125, 1.0455322265625, 1.211181640625, 1.3768310546875, 1.54248046875, 1.7081298828125, 1.873779296875, 2.0394287109375, 2.205078125, 2.3707275390625, 2.536376953125, 2.7020263671875, 2.86767578125, 3.0333251953125, 3.198974609375, 3.3646240234375, 3.5302734375, 3.6959228515625, 3.861572265625, 4.0272216796875, 4.19287109375, 4.3585205078125, 4.524169921875, 4.6898193359375, 4.85546875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 12.0, 11.0, 14.0, 22.0, 11.0, 24.0, 47.0, 54.0, 52.0, 87.0, 101.0, 129.0, 197.0, 233.0, 326.0, 360.0, 401.0, 409.0, 359.0, 230.0, 222.0, 158.0, 152.0, 119.0, 76.0, 54.0, 52.0, 28.0, 28.0, 18.0, 21.0, 16.0, 11.0, 8.0, 8.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.4140625, -6.234375, -6.0546875, -5.875, -5.6953125, -5.515625, -5.3359375, -5.15625, -4.9765625, -4.796875, -4.6171875, -4.4375, -4.2578125, -4.078125, -3.8984375, -3.71875, -3.5390625, -3.359375, -3.1796875, -3.0, -2.8203125, -2.640625, -2.4609375, -2.28125, -2.1015625, -1.921875, -1.7421875, -1.5625, -1.3828125, -1.203125, -1.0234375, -0.84375, -0.6640625, -0.484375, -0.3046875, -0.125, 0.0546875, 0.234375, 0.4140625, 0.59375, 0.7734375, 0.953125, 1.1328125, 1.3125, 1.4921875, 1.671875, 1.8515625, 2.03125, 2.2109375, 2.390625, 2.5703125, 2.75, 2.9296875, 3.109375, 3.2890625, 3.46875, 3.6484375, 3.828125, 4.0078125, 4.1875, 4.3671875, 4.546875, 4.7265625, 4.90625, 5.0859375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 12.0, 12.0, 18.0, 30.0, 27.0, 41.0, 52.0, 69.0, 102.0, 156.0, 220.0, 329.0, 599.0, 1644.0, 8828.0, 89223.0, 1336119.0, 2544215.0, 191486.0, 16694.0, 2446.0, 751.0, 396.0, 221.0, 171.0, 117.0, 93.0, 59.0, 32.0, 27.0, 23.0, 20.0, 13.0, 10.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.984375, -14.4873046875, -13.990234375, -13.4931640625, -12.99609375, -12.4990234375, -12.001953125, -11.5048828125, -11.0078125, -10.5107421875, -10.013671875, -9.5166015625, -9.01953125, -8.5224609375, -8.025390625, -7.5283203125, -7.03125, -6.5341796875, -6.037109375, -5.5400390625, -5.04296875, -4.5458984375, -4.048828125, -3.5517578125, -3.0546875, -2.5576171875, -2.060546875, -1.5634765625, -1.06640625, -0.5693359375, -0.072265625, 0.4248046875, 0.921875, 1.4189453125, 1.916015625, 2.4130859375, 2.91015625, 3.4072265625, 3.904296875, 4.4013671875, 4.8984375, 5.3955078125, 5.892578125, 6.3896484375, 6.88671875, 7.3837890625, 7.880859375, 8.3779296875, 8.875, 9.3720703125, 9.869140625, 10.3662109375, 10.86328125, 11.3603515625, 11.857421875, 12.3544921875, 12.8515625, 13.3486328125, 13.845703125, 14.3427734375, 14.83984375, 15.3369140625, 15.833984375, 16.3310546875, 16.828125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 10.0, 10.0, 38.0, 47.0, 77.0, 105.0, 133.0, 153.0, 121.0, 120.0, 79.0, 59.0, 33.0, 21.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.97929382324219, -36.68626022338867, -35.393226623535156, -34.100189208984375, -32.80715560913086, -31.514122009277344, -30.221086502075195, -28.928050994873047, -27.63501739501953, -26.341983795166016, -25.048948287963867, -23.75591278076172, -22.462879180908203, -21.169845581054688, -19.87681007385254, -18.58377456665039, -17.290740966796875, -15.997706413269043, -14.704671859741211, -13.411637306213379, -12.118602752685547, -10.825568199157715, -9.532533645629883, -8.23949909210205, -6.946464538574219, -5.653429985046387, -4.360395431518555, -3.0673608779907227, -1.7743263244628906, -0.4812917709350586, 0.8117427825927734, 2.1047773361206055, 3.3978118896484375, 4.6908464431762695, 5.983880996704102, 7.276915550231934, 8.569950103759766, 9.862984657287598, 11.15601921081543, 12.449053764343262, 13.742088317871094, 15.035122871398926, 16.328157424926758, 17.621192932128906, 18.914226531982422, 20.207260131835938, 21.500295639038086, 22.793331146240234, 24.08636474609375, 25.379398345947266, 26.672433853149414, 27.965469360351562, 29.258502960205078, 30.551536560058594, 31.844572067260742, 33.13760757446289, 34.430641174316406, 35.72367477416992, 37.01670837402344, 38.30974578857422, 39.602779388427734, 40.89581298828125, 42.18885040283203, 43.48188400268555, 44.77491760253906]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 2.0, 8.0, 5.0, 9.0, 11.0, 17.0, 22.0, 19.0, 10.0, 29.0, 28.0, 20.0, 18.0, 22.0, 34.0, 32.0, 28.0, 41.0, 41.0, 38.0, 46.0, 34.0, 45.0, 41.0, 39.0, 35.0, 30.0, 35.0, 38.0, 32.0, 23.0, 18.0, 19.0, 16.0, 18.0, 15.0, 15.0, 8.0, 14.0, 4.0, 8.0, 5.0, 1.0, 3.0, 2.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.344802856445312, -19.695880889892578, -19.046960830688477, -18.398040771484375, -17.74911880493164, -17.100196838378906, -16.451276779174805, -15.802355766296387, -15.153434753417969, -14.50451374053955, -13.855592727661133, -13.206671714782715, -12.557750701904297, -11.908829689025879, -11.259908676147461, -10.610987663269043, -9.962066650390625, -9.313145637512207, -8.664224624633789, -8.015303611755371, -7.366382598876953, -6.717461585998535, -6.068540573120117, -5.419619560241699, -4.770698547363281, -4.121777534484863, -3.4728565216064453, -2.8239355087280273, -2.1750144958496094, -1.5260934829711914, -0.8771724700927734, -0.22825145721435547, 0.4206695556640625, 1.0695905685424805, 1.7185115814208984, 2.3674325942993164, 3.0163536071777344, 3.6652746200561523, 4.31419563293457, 4.963116645812988, 5.612037658691406, 6.260958671569824, 6.909879684448242, 7.55880069732666, 8.207721710205078, 8.856642723083496, 9.505563735961914, 10.154484748840332, 10.80340576171875, 11.452326774597168, 12.101247787475586, 12.750168800354004, 13.399089813232422, 14.04801082611084, 14.696931838989258, 15.345852851867676, 15.994773864746094, 16.643695831298828, 17.29261589050293, 17.94153594970703, 18.590457916259766, 19.2393798828125, 19.8882999420166, 20.537220001220703, 21.186141967773438]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 6.0, 12.0, 10.0, 13.0, 10.0, 16.0, 22.0, 24.0, 28.0, 28.0, 18.0, 40.0, 36.0, 30.0, 40.0, 34.0, 43.0, 43.0, 40.0, 43.0, 34.0, 35.0, 35.0, 30.0, 30.0, 27.0, 27.0, 23.0, 24.0, 22.0, 19.0, 23.0, 16.0, 21.0, 12.0, 16.0, 14.0, 10.0, 11.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.783203125, -3.661895751953125, -3.54058837890625, -3.419281005859375, -3.2979736328125, -3.176666259765625, -3.05535888671875, -2.934051513671875, -2.812744140625, -2.691436767578125, -2.57012939453125, -2.448822021484375, -2.3275146484375, -2.206207275390625, -2.08489990234375, -1.963592529296875, -1.84228515625, -1.720977783203125, -1.59967041015625, -1.478363037109375, -1.3570556640625, -1.235748291015625, -1.11444091796875, -0.993133544921875, -0.871826171875, -0.750518798828125, -0.62921142578125, -0.507904052734375, -0.3865966796875, -0.265289306640625, -0.14398193359375, -0.022674560546875, 0.0986328125, 0.219940185546875, 0.34124755859375, 0.462554931640625, 0.5838623046875, 0.705169677734375, 0.82647705078125, 0.947784423828125, 1.069091796875, 1.190399169921875, 1.31170654296875, 1.433013916015625, 1.5543212890625, 1.675628662109375, 1.79693603515625, 1.918243408203125, 2.03955078125, 2.160858154296875, 2.28216552734375, 2.403472900390625, 2.5247802734375, 2.646087646484375, 2.76739501953125, 2.888702392578125, 3.010009765625, 3.131317138671875, 3.25262451171875, 3.373931884765625, 3.4952392578125, 3.616546630859375, 3.73785400390625, 3.859161376953125, 3.98046875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 6.0, 7.0, 17.0, 26.0, 18.0, 45.0, 46.0, 74.0, 104.0, 133.0, 182.0, 258.0, 359.0, 490.0, 680.0, 948.0, 1349.0, 1891.0, 2601.0, 3517.0, 5228.0, 7441.0, 10979.0, 16035.0, 24126.0, 36938.0, 58071.0, 97313.0, 209561.0, 274511.0, 108944.0, 63652.0, 40408.0, 26065.0, 17617.0, 11761.0, 8053.0, 5593.0, 3897.0, 2794.0, 1891.0, 1379.0, 995.0, 732.0, 532.0, 343.0, 247.0, 189.0, 156.0, 104.0, 80.0, 53.0, 39.0, 24.0, 20.0, 21.0, 7.0, 7.0, 7.0, 2.0, 1.0], "bins": [-0.1422119140625, -0.13778114318847656, -0.13335037231445312, -0.1289196014404297, -0.12448883056640625, -0.12005805969238281, -0.11562728881835938, -0.11119651794433594, -0.1067657470703125, -0.10233497619628906, -0.09790420532226562, -0.09347343444824219, -0.08904266357421875, -0.08461189270019531, -0.08018112182617188, -0.07575035095214844, -0.071319580078125, -0.06688880920410156, -0.062458038330078125, -0.05802726745605469, -0.05359649658203125, -0.04916572570800781, -0.044734954833984375, -0.04030418395996094, -0.0358734130859375, -0.03144264221191406, -0.027011871337890625, -0.022581100463867188, -0.01815032958984375, -0.013719558715820312, -0.009288787841796875, -0.0048580169677734375, -0.00042724609375, 0.0040035247802734375, 0.008434295654296875, 0.012865066528320312, 0.01729583740234375, 0.021726608276367188, 0.026157379150390625, 0.030588150024414062, 0.0350189208984375, 0.03944969177246094, 0.043880462646484375, 0.04831123352050781, 0.05274200439453125, 0.05717277526855469, 0.061603546142578125, 0.06603431701660156, 0.070465087890625, 0.07489585876464844, 0.07932662963867188, 0.08375740051269531, 0.08818817138671875, 0.09261894226074219, 0.09704971313476562, 0.10148048400878906, 0.1059112548828125, 0.11034202575683594, 0.11477279663085938, 0.11920356750488281, 0.12363433837890625, 0.1280651092529297, 0.13249588012695312, 0.13692665100097656, 0.141357421875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 9.0, 8.0, 15.0, 20.0, 13.0, 10.0, 26.0, 14.0, 24.0, 29.0, 29.0, 37.0, 40.0, 26.0, 35.0, 49.0, 45.0, 1068.0, 38.0, 47.0, 35.0, 38.0, 43.0, 31.0, 38.0, 25.0, 26.0, 31.0, 29.0, 19.0, 21.0, 20.0, 14.0, 12.0, 7.0, 10.0, 11.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.822265625, -2.726593017578125, -2.63092041015625, -2.535247802734375, -2.4395751953125, -2.343902587890625, -2.24822998046875, -2.152557373046875, -2.056884765625, -1.961212158203125, -1.86553955078125, -1.769866943359375, -1.6741943359375, -1.578521728515625, -1.48284912109375, -1.387176513671875, -1.29150390625, -1.195831298828125, -1.10015869140625, -1.004486083984375, -0.9088134765625, -0.813140869140625, -0.71746826171875, -0.621795654296875, -0.526123046875, -0.430450439453125, -0.33477783203125, -0.239105224609375, -0.1434326171875, -0.047760009765625, 0.04791259765625, 0.143585205078125, 0.2392578125, 0.334930419921875, 0.43060302734375, 0.526275634765625, 0.6219482421875, 0.717620849609375, 0.81329345703125, 0.908966064453125, 1.004638671875, 1.100311279296875, 1.19598388671875, 1.291656494140625, 1.3873291015625, 1.483001708984375, 1.57867431640625, 1.674346923828125, 1.77001953125, 1.865692138671875, 1.96136474609375, 2.057037353515625, 2.1527099609375, 2.248382568359375, 2.34405517578125, 2.439727783203125, 2.535400390625, 2.631072998046875, 2.72674560546875, 2.822418212890625, 2.9180908203125, 3.013763427734375, 3.10943603515625, 3.205108642578125, 3.30078125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 14.0, 21.0, 25.0, 42.0, 70.0, 87.0, 133.0, 210.0, 269.0, 459.0, 640.0, 954.0, 1501.0, 2249.0, 3316.0, 4838.0, 7131.0, 10932.0, 16323.0, 24824.0, 38885.0, 63645.0, 112157.0, 1326286.0, 219127.0, 101159.0, 58154.0, 35687.0, 22535.0, 14929.0, 9946.0, 6810.0, 4409.0, 3068.0, 2004.0, 1351.0, 932.0, 664.0, 474.0, 278.0, 211.0, 133.0, 78.0, 54.0, 38.0, 29.0, 13.0, 18.0, 2.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.09515380859375, -0.09226322174072266, -0.08937263488769531, -0.08648204803466797, -0.08359146118164062, -0.08070087432861328, -0.07781028747558594, -0.0749197006225586, -0.07202911376953125, -0.0691385269165039, -0.06624794006347656, -0.06335735321044922, -0.060466766357421875, -0.05757617950439453, -0.05468559265136719, -0.051795005798339844, -0.0489044189453125, -0.046013832092285156, -0.04312324523925781, -0.04023265838623047, -0.037342071533203125, -0.03445148468017578, -0.03156089782714844, -0.028670310974121094, -0.02577972412109375, -0.022889137268066406, -0.019998550415039062, -0.01710796356201172, -0.014217376708984375, -0.011326789855957031, -0.008436203002929688, -0.005545616149902344, -0.002655029296875, 0.00023555755615234375, 0.0031261444091796875, 0.006016731262207031, 0.008907318115234375, 0.011797904968261719, 0.014688491821289062, 0.017579078674316406, 0.02046966552734375, 0.023360252380371094, 0.026250839233398438, 0.02914142608642578, 0.032032012939453125, 0.03492259979248047, 0.03781318664550781, 0.040703773498535156, 0.0435943603515625, 0.046484947204589844, 0.04937553405761719, 0.05226612091064453, 0.055156707763671875, 0.05804729461669922, 0.06093788146972656, 0.0638284683227539, 0.06671905517578125, 0.0696096420288086, 0.07250022888183594, 0.07539081573486328, 0.07828140258789062, 0.08117198944091797, 0.08406257629394531, 0.08695316314697266, 0.08984375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 16.0, 2.0, 3.0, 6.0, 14.0, 14.0, 13.0, 54.0, 29.0, 37.0, 48.0, 50.0, 83.0, 244.0, 130.0, 39.0, 23.0, 31.0, 18.0, 15.0, 19.0, 33.0, 5.0, 8.0, 1.0, 5.0, 4.0, 7.0, 15.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-2.3245811462402344e-06, -2.2565945982933044e-06, -2.1886080503463745e-06, -2.1206215023994446e-06, -2.0526349544525146e-06, -1.9846484065055847e-06, -1.9166618585586548e-06, -1.8486753106117249e-06, -1.780688762664795e-06, -1.712702214717865e-06, -1.644715666770935e-06, -1.5767291188240051e-06, -1.5087425708770752e-06, -1.4407560229301453e-06, -1.3727694749832153e-06, -1.3047829270362854e-06, -1.2367963790893555e-06, -1.1688098311424255e-06, -1.1008232831954956e-06, -1.0328367352485657e-06, -9.648501873016357e-07, -8.968636393547058e-07, -8.288770914077759e-07, -7.60890543460846e-07, -6.92903995513916e-07, -6.249174475669861e-07, -5.569308996200562e-07, -4.889443516731262e-07, -4.209578037261963e-07, -3.5297125577926636e-07, -2.849847078323364e-07, -2.169981598854065e-07, -1.4901161193847656e-07, -8.102506399154663e-08, -1.30385160446167e-08, 5.494803190231323e-08, 1.2293457984924316e-07, 1.909211277961731e-07, 2.5890767574310303e-07, 3.2689422369003296e-07, 3.948807716369629e-07, 4.628673195838928e-07, 5.308538675308228e-07, 5.988404154777527e-07, 6.668269634246826e-07, 7.348135113716125e-07, 8.028000593185425e-07, 8.707866072654724e-07, 9.387731552124023e-07, 1.0067597031593323e-06, 1.0747462511062622e-06, 1.1427327990531921e-06, 1.210719347000122e-06, 1.278705894947052e-06, 1.346692442893982e-06, 1.4146789908409119e-06, 1.4826655387878418e-06, 1.5506520867347717e-06, 1.6186386346817017e-06, 1.6866251826286316e-06, 1.7546117305755615e-06, 1.8225982785224915e-06, 1.8905848264694214e-06, 1.9585713744163513e-06, 2.0265579223632812e-06]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 5.0, 9.0, 8.0, 14.0, 16.0, 14.0, 14.0, 39.0, 41.0, 63.0, 85.0, 166.0, 271.0, 1062.0, 350210.0, 694749.0, 1027.0, 268.0, 152.0, 92.0, 67.0, 44.0, 37.0, 10.0, 19.0, 13.0, 17.0, 3.0, 7.0, 4.0, 0.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5239925384521484e-05, -4.3732114136219025e-05, -4.2224302887916565e-05, -4.0716491639614105e-05, -3.9208680391311646e-05, -3.7700869143009186e-05, -3.6193057894706726e-05, -3.4685246646404266e-05, -3.317743539810181e-05, -3.166962414979935e-05, -3.0161812901496887e-05, -2.8654001653194427e-05, -2.7146190404891968e-05, -2.5638379156589508e-05, -2.413056790828705e-05, -2.262275665998459e-05, -2.111494541168213e-05, -1.960713416337967e-05, -1.809932291507721e-05, -1.659151166677475e-05, -1.508370041847229e-05, -1.357588917016983e-05, -1.206807792186737e-05, -1.0560266673564911e-05, -9.052455425262451e-06, -7.5446441769599915e-06, -6.036832928657532e-06, -4.529021680355072e-06, -3.0212104320526123e-06, -1.5133991837501526e-06, -5.587935447692871e-09, 1.5022233128547668e-06, 3.0100345611572266e-06, 4.517845809459686e-06, 6.025657057762146e-06, 7.533468306064606e-06, 9.041279554367065e-06, 1.0549090802669525e-05, 1.2056902050971985e-05, 1.3564713299274445e-05, 1.5072524547576904e-05, 1.6580335795879364e-05, 1.8088147044181824e-05, 1.9595958292484283e-05, 2.1103769540786743e-05, 2.2611580789089203e-05, 2.4119392037391663e-05, 2.5627203285694122e-05, 2.7135014533996582e-05, 2.8642825782299042e-05, 3.01506370306015e-05, 3.165844827890396e-05, 3.316625952720642e-05, 3.467407077550888e-05, 3.618188202381134e-05, 3.76896932721138e-05, 3.919750452041626e-05, 4.070531576871872e-05, 4.221312701702118e-05, 4.372093826532364e-05, 4.52287495136261e-05, 4.673656076192856e-05, 4.824437201023102e-05, 4.975218325853348e-05, 5.125999450683594e-05]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 12.0, 40.0, 214.0, 507.0, 181.0, 41.0, 12.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3205189942673314e-06, -5.214945304032881e-06, -5.10937161379843e-06, -5.0037979235639796e-06, -4.89822468807688e-06, -4.792650997842429e-06, -4.687077307607979e-06, -4.581503617373528e-06, -4.475929927139077e-06, -4.370356236904627e-06, -4.264782546670176e-06, -4.159209311183076e-06, -4.053635620948626e-06, -3.948061930714175e-06, -3.8424882404797245e-06, -3.736914550245274e-06, -3.6313410873844987e-06, -3.525767397150048e-06, -3.420193934289273e-06, -3.3146202440548223e-06, -3.2090465538203716e-06, -3.103472863585921e-06, -2.997899400725146e-06, -2.892325710490695e-06, -2.78675224762992e-06, -2.6811785573954694e-06, -2.5756050945346942e-06, -2.4700314043002436e-06, -2.364457714065793e-06, -2.258884251205018e-06, -2.153310560970567e-06, -2.0477368707361165e-06, -1.942163180501666e-06, -1.836589603954053e-06, -1.7310159137196024e-06, -1.6254423371719895e-06, -1.5198686469375389e-06, -1.414295070389926e-06, -1.308721493842313e-06, -1.2031478036078624e-06, -1.0975741133734118e-06, -9.92000536825799e-07, -8.864268465913483e-07, -7.808532700437354e-07, -6.752796366527036e-07, -5.697060032616719e-07, -4.6413242671405897e-07, -3.585587933230272e-07, -2.5298515993199544e-07, -1.474115407518184e-07, -4.1837921571641346e-08, 6.373568339768099e-08, 1.6930931678871275e-07, 2.748829501797445e-07, 3.804565267273574e-07, 4.860301601183892e-07, 5.916037935094209e-07, 6.971774269004527e-07, 8.027510602914845e-07, 9.083246368390974e-07, 1.013898327073548e-06, 1.1194719036211609e-06, 1.2250454801687738e-06, 1.3306191704032244e-06, 1.4361927469508373e-06]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 11.0, 0.0, 7.0, 0.0, 15.0, 0.0, 20.0, 0.0, 0.0, 39.0, 0.0, 50.0, 0.0, 57.0, 0.0, 101.0, 0.0, 122.0, 0.0, 0.0, 158.0, 0.0, 134.0, 0.0, 90.0, 0.0, 71.0, 0.0, 44.0, 0.0, 0.0, 28.0, 0.0, 24.0, 0.0, 19.0, 0.0, 6.0, 0.0, 7.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.940696716308594e-07, -8.670613169670105e-07, -8.400529623031616e-07, -8.130446076393127e-07, -7.860362529754639e-07, -7.59027898311615e-07, -7.320195436477661e-07, -7.050111889839172e-07, -6.780028343200684e-07, -6.509944796562195e-07, -6.239861249923706e-07, -5.969777703285217e-07, -5.699694156646729e-07, -5.42961061000824e-07, -5.159527063369751e-07, -4.889443516731262e-07, -4.6193599700927734e-07, -4.3492764234542847e-07, -4.079192876815796e-07, -3.809109330177307e-07, -3.5390257835388184e-07, -3.2689422369003296e-07, -2.998858690261841e-07, -2.728775143623352e-07, -2.4586915969848633e-07, -2.1886080503463745e-07, -1.9185245037078857e-07, -1.648440957069397e-07, -1.3783574104309082e-07, -1.1082738637924194e-07, -8.381903171539307e-08, -5.681067705154419e-08, -2.9802322387695312e-08, -2.7939677238464355e-09, 2.421438694000244e-08, 5.122274160385132e-08, 7.82310962677002e-08, 1.0523945093154907e-07, 1.3224780559539795e-07, 1.5925616025924683e-07, 1.862645149230957e-07, 2.1327286958694458e-07, 2.4028122425079346e-07, 2.6728957891464233e-07, 2.942979335784912e-07, 3.213062882423401e-07, 3.4831464290618896e-07, 3.7532299757003784e-07, 4.023313522338867e-07, 4.293397068977356e-07, 4.5634806156158447e-07, 4.833564162254333e-07, 5.103647708892822e-07, 5.373731255531311e-07, 5.6438148021698e-07, 5.913898348808289e-07, 6.183981895446777e-07, 6.454065442085266e-07, 6.724148988723755e-07, 6.994232535362244e-07, 7.264316082000732e-07, 7.534399628639221e-07, 7.80448317527771e-07, 8.074566721916199e-07, 8.344650268554688e-07]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 6.0, 12.0, 10.0, 13.0, 10.0, 16.0, 22.0, 24.0, 28.0, 28.0, 18.0, 40.0, 36.0, 30.0, 40.0, 34.0, 43.0, 43.0, 40.0, 43.0, 34.0, 35.0, 35.0, 30.0, 30.0, 27.0, 27.0, 23.0, 24.0, 22.0, 19.0, 23.0, 16.0, 21.0, 12.0, 16.0, 14.0, 10.0, 11.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.783203125, -3.661895751953125, -3.54058837890625, -3.419281005859375, -3.2979736328125, -3.176666259765625, -3.05535888671875, -2.934051513671875, -2.812744140625, -2.691436767578125, -2.57012939453125, -2.448822021484375, -2.3275146484375, -2.206207275390625, -2.08489990234375, -1.963592529296875, -1.84228515625, -1.720977783203125, -1.59967041015625, -1.478363037109375, -1.3570556640625, -1.235748291015625, -1.11444091796875, -0.993133544921875, -0.871826171875, -0.750518798828125, -0.62921142578125, -0.507904052734375, -0.3865966796875, -0.265289306640625, -0.14398193359375, -0.022674560546875, 0.0986328125, 0.219940185546875, 0.34124755859375, 0.462554931640625, 0.5838623046875, 0.705169677734375, 0.82647705078125, 0.947784423828125, 1.069091796875, 1.190399169921875, 1.31170654296875, 1.433013916015625, 1.5543212890625, 1.675628662109375, 1.79693603515625, 1.918243408203125, 2.03955078125, 2.160858154296875, 2.28216552734375, 2.403472900390625, 2.5247802734375, 2.646087646484375, 2.76739501953125, 2.888702392578125, 3.010009765625, 3.131317138671875, 3.25262451171875, 3.373931884765625, 3.4952392578125, 3.616546630859375, 3.73785400390625, 3.859161376953125, 3.98046875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 10.0, 13.0, 21.0, 20.0, 33.0, 44.0, 53.0, 118.0, 161.0, 221.0, 437.0, 664.0, 1088.0, 1922.0, 3086.0, 4955.0, 8026.0, 12703.0, 20410.0, 32092.0, 50573.0, 81437.0, 146583.0, 251974.0, 179190.0, 95748.0, 58212.0, 36850.0, 23370.0, 14655.0, 9175.0, 5747.0, 3374.0, 2164.0, 1307.0, 813.0, 464.0, 282.0, 196.0, 120.0, 75.0, 62.0, 36.0, 24.0, 14.0, 9.0, 7.0, 2.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-4.421875, -4.28643798828125, -4.1510009765625, -4.01556396484375, -3.880126953125, -3.74468994140625, -3.6092529296875, -3.47381591796875, -3.33837890625, -3.20294189453125, -3.0675048828125, -2.93206787109375, -2.796630859375, -2.66119384765625, -2.5257568359375, -2.39031982421875, -2.2548828125, -2.11944580078125, -1.9840087890625, -1.84857177734375, -1.713134765625, -1.57769775390625, -1.4422607421875, -1.30682373046875, -1.17138671875, -1.03594970703125, -0.9005126953125, -0.76507568359375, -0.629638671875, -0.49420166015625, -0.3587646484375, -0.22332763671875, -0.087890625, 0.04754638671875, 0.1829833984375, 0.31842041015625, 0.453857421875, 0.58929443359375, 0.7247314453125, 0.86016845703125, 0.99560546875, 1.13104248046875, 1.2664794921875, 1.40191650390625, 1.537353515625, 1.67279052734375, 1.8082275390625, 1.94366455078125, 2.0791015625, 2.21453857421875, 2.3499755859375, 2.48541259765625, 2.620849609375, 2.75628662109375, 2.8917236328125, 3.02716064453125, 3.16259765625, 3.29803466796875, 3.4334716796875, 3.56890869140625, 3.704345703125, 3.83978271484375, 3.9752197265625, 4.11065673828125, 4.24609375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 6.0, 6.0, 8.0, 15.0, 20.0, 16.0, 24.0, 31.0, 35.0, 37.0, 46.0, 71.0, 81.0, 114.0, 197.0, 1373.0, 280.0, 145.0, 92.0, 87.0, 57.0, 57.0, 44.0, 19.0, 26.0, 29.0, 29.0, 11.0, 16.0, 16.0, 11.0, 12.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.1953125, -12.76708984375, -12.3388671875, -11.91064453125, -11.482421875, -11.05419921875, -10.6259765625, -10.19775390625, -9.76953125, -9.34130859375, -8.9130859375, -8.48486328125, -8.056640625, -7.62841796875, -7.2001953125, -6.77197265625, -6.34375, -5.91552734375, -5.4873046875, -5.05908203125, -4.630859375, -4.20263671875, -3.7744140625, -3.34619140625, -2.91796875, -2.48974609375, -2.0615234375, -1.63330078125, -1.205078125, -0.77685546875, -0.3486328125, 0.07958984375, 0.5078125, 0.93603515625, 1.3642578125, 1.79248046875, 2.220703125, 2.64892578125, 3.0771484375, 3.50537109375, 3.93359375, 4.36181640625, 4.7900390625, 5.21826171875, 5.646484375, 6.07470703125, 6.5029296875, 6.93115234375, 7.359375, 7.78759765625, 8.2158203125, 8.64404296875, 9.072265625, 9.50048828125, 9.9287109375, 10.35693359375, 10.78515625, 11.21337890625, 11.6416015625, 12.06982421875, 12.498046875, 12.92626953125, 13.3544921875, 13.78271484375, 14.2109375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 10.0, 15.0, 18.0, 23.0, 38.0, 50.0, 60.0, 83.0, 137.0, 220.0, 400.0, 872.0, 3666.0, 21627.0, 156123.0, 1889978.0, 964374.0, 90399.0, 13567.0, 2474.0, 653.0, 343.0, 184.0, 127.0, 89.0, 52.0, 40.0, 29.0, 21.0, 8.0, 9.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.78125, -15.3153076171875, -14.849365234375, -14.3834228515625, -13.91748046875, -13.4515380859375, -12.985595703125, -12.5196533203125, -12.0537109375, -11.5877685546875, -11.121826171875, -10.6558837890625, -10.18994140625, -9.7239990234375, -9.258056640625, -8.7921142578125, -8.326171875, -7.8602294921875, -7.394287109375, -6.9283447265625, -6.46240234375, -5.9964599609375, -5.530517578125, -5.0645751953125, -4.5986328125, -4.1326904296875, -3.666748046875, -3.2008056640625, -2.73486328125, -2.2689208984375, -1.802978515625, -1.3370361328125, -0.87109375, -0.4051513671875, 0.060791015625, 0.5267333984375, 0.99267578125, 1.4586181640625, 1.924560546875, 2.3905029296875, 2.8564453125, 3.3223876953125, 3.788330078125, 4.2542724609375, 4.72021484375, 5.1861572265625, 5.652099609375, 6.1180419921875, 6.583984375, 7.0499267578125, 7.515869140625, 7.9818115234375, 8.44775390625, 8.9136962890625, 9.379638671875, 9.8455810546875, 10.3115234375, 10.7774658203125, 11.243408203125, 11.7093505859375, 12.17529296875, 12.6412353515625, 13.107177734375, 13.5731201171875, 14.0390625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 31.0, 89.0, 230.0, 359.0, 217.0, 70.0, 17.0, 3.0, 1.0, 1.0], "bins": [-161.70558166503906, -158.8855743408203, -156.06558227539062, -153.24557495117188, -150.42556762695312, -147.60556030273438, -144.7855682373047, -141.96556091308594, -139.1455535888672, -136.32554626464844, -133.50555419921875, -130.685546875, -127.86553955078125, -125.04553985595703, -122.22554016113281, -119.40553283691406, -116.58554077148438, -113.76554107666016, -110.9455337524414, -108.12553405761719, -105.30552673339844, -102.48552703857422, -99.66552734375, -96.84552001953125, -94.0255126953125, -91.20551300048828, -88.38550567626953, -85.56550598144531, -82.74549865722656, -79.92549896240234, -77.10549926757812, -74.28549194335938, -71.46549224853516, -68.64549255371094, -65.82548522949219, -63.00548553466797, -60.185482025146484, -57.365478515625, -54.545475006103516, -51.72547149658203, -48.90546798706055, -46.08546447753906, -43.26546096801758, -40.445457458496094, -37.625457763671875, -34.80545425415039, -31.985450744628906, -29.165449142456055, -26.34544563293457, -23.525442123413086, -20.705440521240234, -17.88543701171875, -15.065434455871582, -12.245431900024414, -9.42542839050293, -6.605426788330078, -3.7854232788085938, -0.9654204845428467, 1.8545823097229004, 4.674585342407227, 7.4945878982543945, 10.314590454101562, 13.134593963623047, 15.954595565795898, 18.774599075317383]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 7.0, 8.0, 7.0, 13.0, 9.0, 14.0, 13.0, 15.0, 21.0, 16.0, 19.0, 25.0, 28.0, 26.0, 29.0, 34.0, 34.0, 35.0, 36.0, 44.0, 38.0, 45.0, 46.0, 33.0, 32.0, 36.0, 40.0, 41.0, 33.0, 30.0, 32.0, 21.0, 18.0, 21.0, 20.0, 13.0, 13.0, 12.0, 9.0, 10.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0], "bins": [-32.12983703613281, -31.19971466064453, -30.26959228515625, -29.33946990966797, -28.409347534179688, -27.479225158691406, -26.549102783203125, -25.618980407714844, -24.688858032226562, -23.75873565673828, -22.82861328125, -21.89849090576172, -20.968368530273438, -20.038246154785156, -19.108123779296875, -18.178001403808594, -17.247879028320312, -16.31775665283203, -15.38763427734375, -14.457511901855469, -13.527389526367188, -12.597267150878906, -11.667144775390625, -10.737022399902344, -9.806901931762695, -8.876779556274414, -7.946657180786133, -7.016534805297852, -6.08641242980957, -5.156290531158447, -4.226168155670166, -3.2960457801818848, -2.3659229278564453, -1.435800552368164, -0.5056782960891724, 0.42444396018981934, 1.3545663356781006, 2.2846884727478027, 3.214810848236084, 4.144933223724365, 5.0750555992126465, 6.005177974700928, 6.935300350189209, 7.865422248840332, 8.795544624328613, 9.725666999816895, 10.655789375305176, 11.585911750793457, 12.516034126281738, 13.44615650177002, 14.3762788772583, 15.306401252746582, 16.236522674560547, 17.166645050048828, 18.09676742553711, 19.02688980102539, 19.957012176513672, 20.887134552001953, 21.817256927490234, 22.747379302978516, 23.677501678466797, 24.607624053955078, 25.53774642944336, 26.46786880493164, 27.397991180419922]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 4.0, 3.0, 4.0, 13.0, 6.0, 5.0, 10.0, 13.0, 23.0, 17.0, 23.0, 14.0, 20.0, 22.0, 37.0, 24.0, 37.0, 36.0, 34.0, 42.0, 34.0, 34.0, 36.0, 38.0, 33.0, 41.0, 30.0, 39.0, 40.0, 31.0, 18.0, 19.0, 31.0, 17.0, 26.0, 23.0, 18.0, 11.0, 13.0, 20.0, 8.0, 9.0, 14.0, 11.0, 4.0, 2.0, 6.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.1484375, -4.0234375, -3.8984375, -3.7734375, -3.6484375, -3.5234375, -3.3984375, -3.2734375, -3.1484375, -3.0234375, -2.8984375, -2.7734375, -2.6484375, -2.5234375, -2.3984375, -2.2734375, -2.1484375, -2.0234375, -1.8984375, -1.7734375, -1.6484375, -1.5234375, -1.3984375, -1.2734375, -1.1484375, -1.0234375, -0.8984375, -0.7734375, -0.6484375, -0.5234375, -0.3984375, -0.2734375, -0.1484375, -0.0234375, 0.1015625, 0.2265625, 0.3515625, 0.4765625, 0.6015625, 0.7265625, 0.8515625, 0.9765625, 1.1015625, 1.2265625, 1.3515625, 1.4765625, 1.6015625, 1.7265625, 1.8515625, 1.9765625, 2.1015625, 2.2265625, 2.3515625, 2.4765625, 2.6015625, 2.7265625, 2.8515625, 2.9765625, 3.1015625, 3.2265625, 3.3515625, 3.4765625, 3.6015625, 3.7265625, 3.8515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 9.0, 8.0, 10.0, 12.0, 15.0, 27.0, 31.0, 56.0, 69.0, 105.0, 176.0, 270.0, 484.0, 877.0, 1765.0, 3776.0, 8605.0, 20398.0, 51788.0, 142085.0, 425659.0, 1279978.0, 1476426.0, 509274.0, 169275.0, 60762.0, 23780.0, 9764.0, 4292.0, 2025.0, 1023.0, 532.0, 318.0, 207.0, 119.0, 76.0, 41.0, 61.0, 29.0, 12.0, 11.0, 11.0, 16.0, 11.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.38671875, -5.21881103515625, -5.0509033203125, -4.88299560546875, -4.715087890625, -4.54718017578125, -4.3792724609375, -4.21136474609375, -4.04345703125, -3.87554931640625, -3.7076416015625, -3.53973388671875, -3.371826171875, -3.20391845703125, -3.0360107421875, -2.86810302734375, -2.7001953125, -2.53228759765625, -2.3643798828125, -2.19647216796875, -2.028564453125, -1.86065673828125, -1.6927490234375, -1.52484130859375, -1.35693359375, -1.18902587890625, -1.0211181640625, -0.85321044921875, -0.685302734375, -0.51739501953125, -0.3494873046875, -0.18157958984375, -0.013671875, 0.15423583984375, 0.3221435546875, 0.49005126953125, 0.657958984375, 0.82586669921875, 0.9937744140625, 1.16168212890625, 1.32958984375, 1.49749755859375, 1.6654052734375, 1.83331298828125, 2.001220703125, 2.16912841796875, 2.3370361328125, 2.50494384765625, 2.6728515625, 2.84075927734375, 3.0086669921875, 3.17657470703125, 3.344482421875, 3.51239013671875, 3.6802978515625, 3.84820556640625, 4.01611328125, 4.18402099609375, 4.3519287109375, 4.51983642578125, 4.687744140625, 4.85565185546875, 5.0235595703125, 5.19146728515625, 5.359375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 6.0, 8.0, 10.0, 10.0, 10.0, 17.0, 38.0, 25.0, 53.0, 47.0, 79.0, 105.0, 153.0, 193.0, 248.0, 348.0, 442.0, 474.0, 435.0, 346.0, 287.0, 178.0, 131.0, 130.0, 69.0, 66.0, 49.0, 29.0, 18.0, 13.0, 10.0, 13.0, 10.0, 7.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.3116455078125, -5.119384765625, -4.9271240234375, -4.73486328125, -4.5426025390625, -4.350341796875, -4.1580810546875, -3.9658203125, -3.7735595703125, -3.581298828125, -3.3890380859375, -3.19677734375, -3.0045166015625, -2.812255859375, -2.6199951171875, -2.427734375, -2.2354736328125, -2.043212890625, -1.8509521484375, -1.65869140625, -1.4664306640625, -1.274169921875, -1.0819091796875, -0.8896484375, -0.6973876953125, -0.505126953125, -0.3128662109375, -0.12060546875, 0.0716552734375, 0.263916015625, 0.4561767578125, 0.6484375, 0.8406982421875, 1.032958984375, 1.2252197265625, 1.41748046875, 1.6097412109375, 1.802001953125, 1.9942626953125, 2.1865234375, 2.3787841796875, 2.571044921875, 2.7633056640625, 2.95556640625, 3.1478271484375, 3.340087890625, 3.5323486328125, 3.724609375, 3.9168701171875, 4.109130859375, 4.3013916015625, 4.49365234375, 4.6859130859375, 4.878173828125, 5.0704345703125, 5.2626953125, 5.4549560546875, 5.647216796875, 5.8394775390625, 6.03173828125, 6.2239990234375, 6.416259765625, 6.6085205078125, 6.80078125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 11.0, 12.0, 16.0, 23.0, 26.0, 46.0, 58.0, 81.0, 125.0, 193.0, 362.0, 790.0, 1895.0, 5336.0, 19329.0, 86639.0, 464767.0, 2308076.0, 1068743.0, 185048.0, 37741.0, 9479.0, 2999.0, 1140.0, 536.0, 239.0, 168.0, 131.0, 59.0, 52.0, 44.0, 22.0, 16.0, 15.0, 13.0, 8.0, 5.0, 6.0, 4.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.84375, -9.5234375, -9.203125, -8.8828125, -8.5625, -8.2421875, -7.921875, -7.6015625, -7.28125, -6.9609375, -6.640625, -6.3203125, -6.0, -5.6796875, -5.359375, -5.0390625, -4.71875, -4.3984375, -4.078125, -3.7578125, -3.4375, -3.1171875, -2.796875, -2.4765625, -2.15625, -1.8359375, -1.515625, -1.1953125, -0.875, -0.5546875, -0.234375, 0.0859375, 0.40625, 0.7265625, 1.046875, 1.3671875, 1.6875, 2.0078125, 2.328125, 2.6484375, 2.96875, 3.2890625, 3.609375, 3.9296875, 4.25, 4.5703125, 4.890625, 5.2109375, 5.53125, 5.8515625, 6.171875, 6.4921875, 6.8125, 7.1328125, 7.453125, 7.7734375, 8.09375, 8.4140625, 8.734375, 9.0546875, 9.375, 9.6953125, 10.015625, 10.3359375, 10.65625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 50.0, 316.0, 463.0, 170.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.245723724365234, -27.861465454101562, -23.477209091186523, -19.092952728271484, -14.708694458007812, -10.32443618774414, -5.940179824829102, -1.5559234619140625, 2.8283348083496094, 7.212592124938965, 11.59684944152832, 15.981106758117676, 20.36536407470703, 24.749622344970703, 29.133878707885742, 33.51813507080078, 37.90239334106445, 42.286651611328125, 46.67090606689453, 51.0551643371582, 55.439422607421875, 59.82368087768555, 64.20793914794922, 68.59219360351562, 72.97645568847656, 77.36071014404297, 81.7449722290039, 86.12922668457031, 90.51348876953125, 94.89774322509766, 99.28199768066406, 103.666259765625, 108.05050659179688, 112.43476104736328, 116.81902313232422, 121.20327758789062, 125.58753967285156, 129.9718017578125, 134.35604858398438, 138.7403106689453, 143.12457275390625, 147.5088348388672, 151.89308166503906, 156.27734375, 160.66160583496094, 165.04586791992188, 169.43011474609375, 173.8143768310547, 178.19862365722656, 182.5828857421875, 186.96713256835938, 191.3513946533203, 195.73565673828125, 200.11990356445312, 204.50416564941406, 208.888427734375, 213.27267456054688, 217.6569366455078, 222.0411834716797, 226.42544555664062, 230.80970764160156, 235.1939697265625, 239.57821655273438, 243.9624786376953, 248.34674072265625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 4.0, 9.0, 12.0, 8.0, 9.0, 13.0, 15.0, 14.0, 19.0, 18.0, 18.0, 36.0, 33.0, 23.0, 33.0, 25.0, 38.0, 39.0, 35.0, 35.0, 41.0, 35.0, 31.0, 35.0, 51.0, 28.0, 43.0, 31.0, 27.0, 31.0, 30.0, 22.0, 20.0, 22.0, 14.0, 13.0, 9.0, 15.0, 12.0, 10.0, 5.0, 13.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0], "bins": [-19.534732818603516, -18.914165496826172, -18.293596267700195, -17.67302703857422, -17.052459716796875, -16.43189239501953, -15.811323165893555, -15.190754890441895, -14.570186614990234, -13.949618339538574, -13.329050064086914, -12.708481788635254, -12.087913513183594, -11.467345237731934, -10.846776962280273, -10.226208686828613, -9.605640411376953, -8.985072135925293, -8.364503860473633, -7.743935585021973, -7.1233673095703125, -6.502799034118652, -5.882230758666992, -5.261662483215332, -4.641094207763672, -4.020525932312012, -3.3999576568603516, -2.7793893814086914, -2.1588211059570312, -1.538252830505371, -0.9176845550537109, -0.2971162796020508, 0.3234519958496094, 0.9440202713012695, 1.5645885467529297, 2.18515682220459, 2.80572509765625, 3.42629337310791, 4.04686164855957, 4.6674299240112305, 5.287998199462891, 5.908566474914551, 6.529134750366211, 7.149703025817871, 7.770271301269531, 8.390839576721191, 9.011407852172852, 9.631976127624512, 10.252544403076172, 10.873112678527832, 11.493680953979492, 12.114249229431152, 12.734817504882812, 13.355385780334473, 13.975954055786133, 14.596522331237793, 15.217090606689453, 15.837658882141113, 16.458227157592773, 17.07879638671875, 17.699363708496094, 18.319931030273438, 18.940500259399414, 19.56106948852539, 20.181636810302734]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 6.0, 7.0, 6.0, 6.0, 5.0, 12.0, 13.0, 15.0, 18.0, 27.0, 19.0, 20.0, 27.0, 40.0, 31.0, 20.0, 32.0, 43.0, 59.0, 41.0, 43.0, 40.0, 28.0, 32.0, 45.0, 36.0, 30.0, 28.0, 32.0, 29.0, 29.0, 27.0, 23.0, 18.0, 15.0, 20.0, 12.0, 19.0, 9.0, 8.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.22265625, -4.0892333984375, -3.955810546875, -3.8223876953125, -3.68896484375, -3.5555419921875, -3.422119140625, -3.2886962890625, -3.1552734375, -3.0218505859375, -2.888427734375, -2.7550048828125, -2.62158203125, -2.4881591796875, -2.354736328125, -2.2213134765625, -2.087890625, -1.9544677734375, -1.821044921875, -1.6876220703125, -1.55419921875, -1.4207763671875, -1.287353515625, -1.1539306640625, -1.0205078125, -0.8870849609375, -0.753662109375, -0.6202392578125, -0.48681640625, -0.3533935546875, -0.219970703125, -0.0865478515625, 0.046875, 0.1802978515625, 0.313720703125, 0.4471435546875, 0.58056640625, 0.7139892578125, 0.847412109375, 0.9808349609375, 1.1142578125, 1.2476806640625, 1.381103515625, 1.5145263671875, 1.64794921875, 1.7813720703125, 1.914794921875, 2.0482177734375, 2.181640625, 2.3150634765625, 2.448486328125, 2.5819091796875, 2.71533203125, 2.8487548828125, 2.982177734375, 3.1156005859375, 3.2490234375, 3.3824462890625, 3.515869140625, 3.6492919921875, 3.78271484375, 3.9161376953125, 4.049560546875, 4.1829833984375, 4.31640625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 11.0, 14.0, 13.0, 28.0, 36.0, 50.0, 79.0, 103.0, 145.0, 209.0, 358.0, 483.0, 683.0, 1069.0, 1635.0, 2368.0, 3666.0, 5521.0, 8568.0, 13270.0, 20704.0, 32312.0, 51785.0, 89360.0, 180592.0, 319713.0, 129328.0, 69367.0, 41997.0, 26570.0, 16804.0, 10932.0, 7068.0, 4578.0, 3013.0, 2006.0, 1325.0, 931.0, 581.0, 402.0, 261.0, 194.0, 129.0, 83.0, 59.0, 50.0, 26.0, 22.0, 23.0, 9.0, 11.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.1617431640625, -0.15673255920410156, -0.15172195434570312, -0.1467113494873047, -0.14170074462890625, -0.1366901397705078, -0.13167953491210938, -0.12666893005371094, -0.1216583251953125, -0.11664772033691406, -0.11163711547851562, -0.10662651062011719, -0.10161590576171875, -0.09660530090332031, -0.09159469604492188, -0.08658409118652344, -0.081573486328125, -0.07656288146972656, -0.07155227661132812, -0.06654167175292969, -0.06153106689453125, -0.05652046203613281, -0.051509857177734375, -0.04649925231933594, -0.0414886474609375, -0.03647804260253906, -0.031467437744140625, -0.026456832885742188, -0.02144622802734375, -0.016435623168945312, -0.011425018310546875, -0.0064144134521484375, -0.00140380859375, 0.0036067962646484375, 0.008617401123046875, 0.013628005981445312, 0.01863861083984375, 0.023649215698242188, 0.028659820556640625, 0.03367042541503906, 0.0386810302734375, 0.04369163513183594, 0.048702239990234375, 0.05371284484863281, 0.05872344970703125, 0.06373405456542969, 0.06874465942382812, 0.07375526428222656, 0.078765869140625, 0.08377647399902344, 0.08878707885742188, 0.09379768371582031, 0.09880828857421875, 0.10381889343261719, 0.10882949829101562, 0.11384010314941406, 0.1188507080078125, 0.12386131286621094, 0.12887191772460938, 0.1338825225830078, 0.13889312744140625, 0.1439037322998047, 0.14891433715820312, 0.15392494201660156, 0.158935546875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 3.0, 5.0, 6.0, 9.0, 10.0, 6.0, 10.0, 15.0, 13.0, 18.0, 17.0, 24.0, 26.0, 35.0, 39.0, 38.0, 37.0, 40.0, 32.0, 42.0, 32.0, 44.0, 1055.0, 41.0, 46.0, 39.0, 33.0, 37.0, 32.0, 32.0, 26.0, 33.0, 18.0, 21.0, 13.0, 18.0, 12.0, 13.0, 10.0, 7.0, 11.0, 5.0, 2.0, 8.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.00390625, -2.910064697265625, -2.81622314453125, -2.722381591796875, -2.6285400390625, -2.534698486328125, -2.44085693359375, -2.347015380859375, -2.253173828125, -2.159332275390625, -2.06549072265625, -1.971649169921875, -1.8778076171875, -1.783966064453125, -1.69012451171875, -1.596282958984375, -1.50244140625, -1.408599853515625, -1.31475830078125, -1.220916748046875, -1.1270751953125, -1.033233642578125, -0.93939208984375, -0.845550537109375, -0.751708984375, -0.657867431640625, -0.56402587890625, -0.470184326171875, -0.3763427734375, -0.282501220703125, -0.18865966796875, -0.094818115234375, -0.0009765625, 0.092864990234375, 0.18670654296875, 0.280548095703125, 0.3743896484375, 0.468231201171875, 0.56207275390625, 0.655914306640625, 0.749755859375, 0.843597412109375, 0.93743896484375, 1.031280517578125, 1.1251220703125, 1.218963623046875, 1.31280517578125, 1.406646728515625, 1.50048828125, 1.594329833984375, 1.68817138671875, 1.782012939453125, 1.8758544921875, 1.969696044921875, 2.06353759765625, 2.157379150390625, 2.251220703125, 2.345062255859375, 2.43890380859375, 2.532745361328125, 2.6265869140625, 2.720428466796875, 2.81427001953125, 2.908111572265625, 3.001953125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 18.0, 27.0, 42.0, 45.0, 73.0, 109.0, 151.0, 241.0, 331.0, 471.0, 679.0, 930.0, 1349.0, 1860.0, 2660.0, 3797.0, 5377.0, 7760.0, 11322.0, 16654.0, 25384.0, 39499.0, 63351.0, 109781.0, 1286668.0, 229544.0, 108409.0, 62973.0, 39184.0, 25119.0, 16508.0, 11167.0, 7642.0, 5241.0, 3849.0, 2583.0, 1890.0, 1336.0, 933.0, 622.0, 513.0, 297.0, 238.0, 158.0, 109.0, 74.0, 56.0, 32.0, 30.0, 20.0, 9.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.0865478515625, -0.08384227752685547, -0.08113670349121094, -0.0784311294555664, -0.07572555541992188, -0.07301998138427734, -0.07031440734863281, -0.06760883331298828, -0.06490325927734375, -0.06219768524169922, -0.05949211120605469, -0.056786537170410156, -0.054080963134765625, -0.051375389099121094, -0.04866981506347656, -0.04596424102783203, -0.0432586669921875, -0.04055309295654297, -0.03784751892089844, -0.035141944885253906, -0.032436370849609375, -0.029730796813964844, -0.027025222778320312, -0.02431964874267578, -0.02161407470703125, -0.01890850067138672, -0.016202926635742188, -0.013497352600097656, -0.010791778564453125, -0.008086204528808594, -0.0053806304931640625, -0.0026750564575195312, 3.0517578125e-05, 0.0027360916137695312, 0.0054416656494140625, 0.008147239685058594, 0.010852813720703125, 0.013558387756347656, 0.016263961791992188, 0.01896953582763672, 0.02167510986328125, 0.02438068389892578, 0.027086257934570312, 0.029791831970214844, 0.032497406005859375, 0.035202980041503906, 0.03790855407714844, 0.04061412811279297, 0.0433197021484375, 0.04602527618408203, 0.04873085021972656, 0.051436424255371094, 0.054141998291015625, 0.056847572326660156, 0.05955314636230469, 0.06225872039794922, 0.06496429443359375, 0.06766986846923828, 0.07037544250488281, 0.07308101654052734, 0.07578659057617188, 0.0784921646118164, 0.08119773864746094, 0.08390331268310547, 0.08660888671875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 5.0, 6.0, 9.0, 0.0, 7.0, 10.0, 8.0, 0.0, 18.0, 11.0, 26.0, 25.0, 0.0, 46.0, 50.0, 73.0, 0.0, 105.0, 224.0, 97.0, 69.0, 0.0, 58.0, 29.0, 32.0, 27.0, 0.0, 6.0, 14.0, 8.0, 0.0, 9.0, 9.0, 5.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5031546354293823e-06, -1.4565885066986084e-06, -1.4100223779678345e-06, -1.3634562492370605e-06, -1.3168901205062866e-06, -1.2703239917755127e-06, -1.2237578630447388e-06, -1.1771917343139648e-06, -1.130625605583191e-06, -1.084059476852417e-06, -1.037493348121643e-06, -9.909272193908691e-07, -9.443610906600952e-07, -8.977949619293213e-07, -8.512288331985474e-07, -8.046627044677734e-07, -7.580965757369995e-07, -7.115304470062256e-07, -6.649643182754517e-07, -6.183981895446777e-07, -5.718320608139038e-07, -5.252659320831299e-07, -4.78699803352356e-07, -4.3213367462158203e-07, -3.855675458908081e-07, -3.390014171600342e-07, -2.9243528842926025e-07, -2.4586915969848633e-07, -1.993030309677124e-07, -1.5273690223693848e-07, -1.0617077350616455e-07, -5.960464477539063e-08, -1.30385160446167e-08, 3.3527612686157227e-08, 8.009374141693115e-08, 1.2665987014770508e-07, 1.73225998878479e-07, 2.1979212760925293e-07, 2.6635825634002686e-07, 3.129243850708008e-07, 3.594905138015747e-07, 4.0605664253234863e-07, 4.5262277126312256e-07, 4.991888999938965e-07, 5.457550287246704e-07, 5.923211574554443e-07, 6.388872861862183e-07, 6.854534149169922e-07, 7.320195436477661e-07, 7.7858567237854e-07, 8.25151801109314e-07, 8.717179298400879e-07, 9.182840585708618e-07, 9.648501873016357e-07, 1.0114163160324097e-06, 1.0579824447631836e-06, 1.1045485734939575e-06, 1.1511147022247314e-06, 1.1976808309555054e-06, 1.2442469596862793e-06, 1.2908130884170532e-06, 1.3373792171478271e-06, 1.383945345878601e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 7.0, 10.0, 11.0, 10.0, 10.0, 19.0, 23.0, 16.0, 48.0, 59.0, 63.0, 114.0, 236.0, 612.0, 13989.0, 970979.0, 60445.0, 1099.0, 273.0, 163.0, 86.0, 61.0, 56.0, 39.0, 18.0, 19.0, 16.0, 12.0, 7.0, 8.0, 11.0, 9.0, 2.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.0159950256347656e-05, -2.9175542294979095e-05, -2.8191134333610535e-05, -2.7206726372241974e-05, -2.6222318410873413e-05, -2.5237910449504852e-05, -2.425350248813629e-05, -2.326909452676773e-05, -2.228468656539917e-05, -2.130027860403061e-05, -2.031587064266205e-05, -1.9331462681293488e-05, -1.8347054719924927e-05, -1.7362646758556366e-05, -1.6378238797187805e-05, -1.5393830835819244e-05, -1.4409422874450684e-05, -1.3425014913082123e-05, -1.2440606951713562e-05, -1.1456198990345001e-05, -1.047179102897644e-05, -9.48738306760788e-06, -8.502975106239319e-06, -7.518567144870758e-06, -6.534159183502197e-06, -5.5497512221336365e-06, -4.565343260765076e-06, -3.580935299396515e-06, -2.596527338027954e-06, -1.6121193766593933e-06, -6.277114152908325e-07, 3.5669654607772827e-07, 1.341104507446289e-06, 2.32551246881485e-06, 3.3099204301834106e-06, 4.2943283915519714e-06, 5.278736352920532e-06, 6.263144314289093e-06, 7.247552275657654e-06, 8.231960237026215e-06, 9.216368198394775e-06, 1.0200776159763336e-05, 1.1185184121131897e-05, 1.2169592082500458e-05, 1.3154000043869019e-05, 1.413840800523758e-05, 1.512281596660614e-05, 1.61072239279747e-05, 1.7091631889343262e-05, 1.8076039850711823e-05, 1.9060447812080383e-05, 2.0044855773448944e-05, 2.1029263734817505e-05, 2.2013671696186066e-05, 2.2998079657554626e-05, 2.3982487618923187e-05, 2.4966895580291748e-05, 2.595130354166031e-05, 2.693571150302887e-05, 2.792011946439743e-05, 2.890452742576599e-05, 2.9888935387134552e-05, 3.087334334850311e-05, 3.1857751309871674e-05, 3.2842159271240234e-05]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 14.0, 38.0, 96.0, 333.0, 366.0, 123.0, 33.0, 11.0], "bins": [-5.794078333565267e-06, -5.697569577023387e-06, -5.601061275228858e-06, -5.504552518686978e-06, -5.408043762145098e-06, -5.311535460350569e-06, -5.2150267038086895e-06, -5.11851794726681e-06, -5.022009645472281e-06, -4.925500888930401e-06, -4.828992587135872e-06, -4.732483830593992e-06, -4.635975074052112e-06, -4.539466772257583e-06, -4.442958015715703e-06, -4.3464492591738235e-06, -4.249940502631944e-06, -4.153431746090064e-06, -4.056923444295535e-06, -3.960414687753655e-06, -3.863905931211775e-06, -3.767397629417246e-06, -3.6708888728753664e-06, -3.574380343707162e-06, -3.4778718145389576e-06, -3.381363285370753e-06, -3.2848545288288733e-06, -3.188345999660669e-06, -3.0918374704924645e-06, -2.99532894132426e-06, -2.8988201847823802e-06, -2.802311655614176e-06, -2.7058031264459714e-06, -2.609294597277767e-06, -2.512785840735887e-06, -2.4162773115676828e-06, -2.3197687823994784e-06, -2.223260253231274e-06, -2.126751496689394e-06, -2.0302429675211897e-06, -1.9337344383529853e-06, -1.8372257954979432e-06, -1.7407172663297388e-06, -1.6442086234746967e-06, -1.5477000943064922e-06, -1.4511914514514501e-06, -1.354682808596408e-06, -1.2581742794282036e-06, -1.1616656365731615e-06, -1.0651569937181193e-06, -9.68648464549915e-07, -8.721398216948728e-07, -7.756312356832495e-07, -6.791226496716263e-07, -5.826140068165842e-07, -4.861054208049609e-07, -3.895968347933376e-07, -2.9308824878171436e-07, -1.9657963434838166e-07, -1.0007101991504896e-07, -3.562433903425699e-09, 9.294615210819757e-08, 1.894547949632397e-07, 2.8596338097486296e-07, 3.824719669864862e-07]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 11.0, 0.0, 0.0, 25.0, 0.0, 43.0, 0.0, 0.0, 50.0, 0.0, 0.0, 82.0, 0.0, 102.0, 0.0, 0.0, 105.0, 0.0, 129.0, 0.0, 0.0, 123.0, 0.0, 111.0, 0.0, 0.0, 70.0, 0.0, 60.0, 0.0, 0.0, 34.0, 0.0, 0.0, 32.0, 0.0, 20.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.919726729393005e-07, -6.686896085739136e-07, -6.454065442085266e-07, -6.221234798431396e-07, -5.988404154777527e-07, -5.755573511123657e-07, -5.522742867469788e-07, -5.289912223815918e-07, -5.057081580162048e-07, -4.824250936508179e-07, -4.591420292854309e-07, -4.3585896492004395e-07, -4.12575900554657e-07, -3.8929283618927e-07, -3.6600977182388306e-07, -3.427267074584961e-07, -3.1944364309310913e-07, -2.9616057872772217e-07, -2.728775143623352e-07, -2.4959444999694824e-07, -2.2631138563156128e-07, -2.0302832126617432e-07, -1.7974525690078735e-07, -1.564621925354004e-07, -1.3317912817001343e-07, -1.0989606380462646e-07, -8.66129994392395e-08, -6.332993507385254e-08, -4.0046870708465576e-08, -1.6763806343078613e-08, 6.51925802230835e-09, 2.9802322387695312e-08, 5.3085386753082275e-08, 7.636845111846924e-08, 9.96515154838562e-08, 1.2293457984924316e-07, 1.4621764421463013e-07, 1.695007085800171e-07, 1.9278377294540405e-07, 2.1606683731079102e-07, 2.39349901676178e-07, 2.6263296604156494e-07, 2.859160304069519e-07, 3.0919909477233887e-07, 3.3248215913772583e-07, 3.557652235031128e-07, 3.7904828786849976e-07, 4.023313522338867e-07, 4.256144165992737e-07, 4.4889748096466064e-07, 4.721805453300476e-07, 4.954636096954346e-07, 5.187466740608215e-07, 5.420297384262085e-07, 5.653128027915955e-07, 5.885958671569824e-07, 6.118789315223694e-07, 6.351619958877563e-07, 6.584450602531433e-07, 6.817281246185303e-07, 7.050111889839172e-07, 7.282942533493042e-07, 7.515773177146912e-07, 7.748603820800781e-07]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 6.0, 7.0, 6.0, 6.0, 5.0, 12.0, 13.0, 15.0, 18.0, 27.0, 19.0, 20.0, 27.0, 40.0, 31.0, 20.0, 32.0, 43.0, 59.0, 41.0, 43.0, 40.0, 28.0, 32.0, 45.0, 36.0, 30.0, 28.0, 32.0, 29.0, 29.0, 27.0, 23.0, 18.0, 15.0, 20.0, 12.0, 19.0, 9.0, 8.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.22265625, -4.0892333984375, -3.955810546875, -3.8223876953125, -3.68896484375, -3.5555419921875, -3.422119140625, -3.2886962890625, -3.1552734375, -3.0218505859375, -2.888427734375, -2.7550048828125, -2.62158203125, -2.4881591796875, -2.354736328125, -2.2213134765625, -2.087890625, -1.9544677734375, -1.821044921875, -1.6876220703125, -1.55419921875, -1.4207763671875, -1.287353515625, -1.1539306640625, -1.0205078125, -0.8870849609375, -0.753662109375, -0.6202392578125, -0.48681640625, -0.3533935546875, -0.219970703125, -0.0865478515625, 0.046875, 0.1802978515625, 0.313720703125, 0.4471435546875, 0.58056640625, 0.7139892578125, 0.847412109375, 0.9808349609375, 1.1142578125, 1.2476806640625, 1.381103515625, 1.5145263671875, 1.64794921875, 1.7813720703125, 1.914794921875, 2.0482177734375, 2.181640625, 2.3150634765625, 2.448486328125, 2.5819091796875, 2.71533203125, 2.8487548828125, 2.982177734375, 3.1156005859375, 3.2490234375, 3.3824462890625, 3.515869140625, 3.6492919921875, 3.78271484375, 3.9161376953125, 4.049560546875, 4.1829833984375, 4.31640625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 13.0, 11.0, 21.0, 23.0, 38.0, 65.0, 86.0, 189.0, 263.0, 453.0, 894.0, 1492.0, 2650.0, 4720.0, 7926.0, 13092.0, 21233.0, 33767.0, 52910.0, 83317.0, 151240.0, 288023.0, 157131.0, 85789.0, 54096.0, 34384.0, 21909.0, 13444.0, 8049.0, 4782.0, 2736.0, 1634.0, 883.0, 516.0, 305.0, 179.0, 102.0, 67.0, 34.0, 20.0, 18.0, 16.0, 10.0, 11.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4921875, -5.328369140625, -5.16455078125, -5.000732421875, -4.8369140625, -4.673095703125, -4.50927734375, -4.345458984375, -4.181640625, -4.017822265625, -3.85400390625, -3.690185546875, -3.5263671875, -3.362548828125, -3.19873046875, -3.034912109375, -2.87109375, -2.707275390625, -2.54345703125, -2.379638671875, -2.2158203125, -2.052001953125, -1.88818359375, -1.724365234375, -1.560546875, -1.396728515625, -1.23291015625, -1.069091796875, -0.9052734375, -0.741455078125, -0.57763671875, -0.413818359375, -0.25, -0.086181640625, 0.07763671875, 0.241455078125, 0.4052734375, 0.569091796875, 0.73291015625, 0.896728515625, 1.060546875, 1.224365234375, 1.38818359375, 1.552001953125, 1.7158203125, 1.879638671875, 2.04345703125, 2.207275390625, 2.37109375, 2.534912109375, 2.69873046875, 2.862548828125, 3.0263671875, 3.190185546875, 3.35400390625, 3.517822265625, 3.681640625, 3.845458984375, 4.00927734375, 4.173095703125, 4.3369140625, 4.500732421875, 4.66455078125, 4.828369140625, 4.9921875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 16.0, 17.0, 9.0, 12.0, 21.0, 29.0, 27.0, 31.0, 30.0, 47.0, 58.0, 65.0, 93.0, 138.0, 232.0, 1397.0, 216.0, 149.0, 110.0, 77.0, 43.0, 49.0, 31.0, 28.0, 30.0, 26.0, 19.0, 15.0, 10.0, 12.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6015625, -15.1505126953125, -14.699462890625, -14.2484130859375, -13.79736328125, -13.3463134765625, -12.895263671875, -12.4442138671875, -11.9931640625, -11.5421142578125, -11.091064453125, -10.6400146484375, -10.18896484375, -9.7379150390625, -9.286865234375, -8.8358154296875, -8.384765625, -7.9337158203125, -7.482666015625, -7.0316162109375, -6.58056640625, -6.1295166015625, -5.678466796875, -5.2274169921875, -4.7763671875, -4.3253173828125, -3.874267578125, -3.4232177734375, -2.97216796875, -2.5211181640625, -2.070068359375, -1.6190185546875, -1.16796875, -0.7169189453125, -0.265869140625, 0.1851806640625, 0.63623046875, 1.0872802734375, 1.538330078125, 1.9893798828125, 2.4404296875, 2.8914794921875, 3.342529296875, 3.7935791015625, 4.24462890625, 4.6956787109375, 5.146728515625, 5.5977783203125, 6.048828125, 6.4998779296875, 6.950927734375, 7.4019775390625, 7.85302734375, 8.3040771484375, 8.755126953125, 9.2061767578125, 9.6572265625, 10.1082763671875, 10.559326171875, 11.0103759765625, 11.46142578125, 11.9124755859375, 12.363525390625, 12.8145751953125, 13.265625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 7.0, 9.0, 17.0, 24.0, 29.0, 24.0, 48.0, 65.0, 88.0, 134.0, 208.0, 300.0, 495.0, 1149.0, 4606.0, 24348.0, 157044.0, 1916928.0, 928284.0, 91607.0, 15126.0, 2955.0, 888.0, 423.0, 244.0, 164.0, 138.0, 86.0, 62.0, 54.0, 43.0, 27.0, 20.0, 11.0, 12.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.125, -13.6673583984375, -13.209716796875, -12.7520751953125, -12.29443359375, -11.8367919921875, -11.379150390625, -10.9215087890625, -10.4638671875, -10.0062255859375, -9.548583984375, -9.0909423828125, -8.63330078125, -8.1756591796875, -7.718017578125, -7.2603759765625, -6.802734375, -6.3450927734375, -5.887451171875, -5.4298095703125, -4.97216796875, -4.5145263671875, -4.056884765625, -3.5992431640625, -3.1416015625, -2.6839599609375, -2.226318359375, -1.7686767578125, -1.31103515625, -0.8533935546875, -0.395751953125, 0.0618896484375, 0.51953125, 0.9771728515625, 1.434814453125, 1.8924560546875, 2.35009765625, 2.8077392578125, 3.265380859375, 3.7230224609375, 4.1806640625, 4.6383056640625, 5.095947265625, 5.5535888671875, 6.01123046875, 6.4688720703125, 6.926513671875, 7.3841552734375, 7.841796875, 8.2994384765625, 8.757080078125, 9.2147216796875, 9.67236328125, 10.1300048828125, 10.587646484375, 11.0452880859375, 11.5029296875, 11.9605712890625, 12.418212890625, 12.8758544921875, 13.33349609375, 13.7911376953125, 14.248779296875, 14.7064208984375, 15.1640625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 45.0, 178.0, 308.0, 298.0, 158.0, 16.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.47114562988281, -65.18412780761719, -61.89710998535156, -58.6100959777832, -55.32307815551758, -52.03606033325195, -48.749046325683594, -45.46202850341797, -42.175010681152344, -38.88799285888672, -35.600975036621094, -32.313961029052734, -29.02694320678711, -25.739925384521484, -22.452909469604492, -19.1658935546875, -15.878875732421875, -12.591858863830566, -9.304841995239258, -6.017825126647949, -2.7308082580566406, 0.5562095642089844, 3.8432254791259766, 7.130241394042969, 10.417259216308594, 13.704276084899902, 16.99129295349121, 20.278308868408203, 23.565326690673828, 26.852344512939453, 30.139360427856445, 33.42637634277344, 36.71339416503906, 40.00041198730469, 43.28742980957031, 46.57444381713867, 49.8614616394043, 53.14847946166992, 56.43549346923828, 59.722511291503906, 63.00952911376953, 66.29654693603516, 69.58356475830078, 72.8705825805664, 76.1575927734375, 79.44461059570312, 82.73162841796875, 86.01864624023438, 89.3056640625, 92.59268188476562, 95.87969970703125, 99.16671752929688, 102.4537353515625, 105.74075317382812, 109.02776336669922, 112.31478118896484, 115.60179901123047, 118.8888168334961, 122.17583465576172, 125.46285247802734, 128.74986267089844, 132.03688049316406, 135.3238983154297, 138.6109161376953, 141.89793395996094]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 10.0, 9.0, 12.0, 17.0, 20.0, 22.0, 16.0, 19.0, 25.0, 25.0, 28.0, 37.0, 33.0, 38.0, 35.0, 36.0, 44.0, 44.0, 41.0, 46.0, 46.0, 41.0, 28.0, 37.0, 40.0, 34.0, 28.0, 33.0, 23.0, 23.0, 14.0, 12.0, 14.0, 17.0, 11.0, 12.0, 7.0, 9.0, 3.0, 2.0, 2.0, 7.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.44413375854492, -34.48119354248047, -33.51824951171875, -32.5553092956543, -31.592369079589844, -30.629426956176758, -29.666484832763672, -28.70354461669922, -27.740602493286133, -26.777660369873047, -25.814720153808594, -24.851778030395508, -23.888837814331055, -22.92589569091797, -21.962955474853516, -21.00001335144043, -20.037071228027344, -19.074129104614258, -18.111188888549805, -17.14824676513672, -16.185306549072266, -15.22236442565918, -14.25942325592041, -13.29648208618164, -12.333541870117188, -11.370600700378418, -10.407659530639648, -9.444717407226562, -8.481776237487793, -7.518835067749023, -6.555893898010254, -5.592952251434326, -4.630010604858398, -3.66706919670105, -2.704127788543701, -1.7411866188049316, -0.778245210647583, 0.18469619750976562, 1.1476373672485352, 2.110579013824463, 3.0735201835632324, 4.036461353302002, 4.99940299987793, 5.962344169616699, 6.925285339355469, 7.8882269859313965, 8.851167678833008, 9.814109802246094, 10.777050971984863, 11.739992141723633, 12.702933311462402, 13.665874481201172, 14.628816604614258, 15.591757774353027, 16.554698944091797, 17.517641067504883, 18.480581283569336, 19.443523406982422, 20.406463623046875, 21.36940574645996, 22.332345962524414, 23.2952880859375, 24.258228302001953, 25.22117042541504, 26.184112548828125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 3.0, 7.0, 11.0, 13.0, 10.0, 17.0, 15.0, 17.0, 18.0, 28.0, 28.0, 29.0, 28.0, 29.0, 33.0, 33.0, 36.0, 40.0, 35.0, 57.0, 36.0, 38.0, 37.0, 26.0, 37.0, 35.0, 42.0, 37.0, 26.0, 31.0, 23.0, 20.0, 12.0, 20.0, 16.0, 14.0, 21.0, 9.0, 3.0, 6.0, 7.0, 3.0, 7.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.8125, -3.67413330078125, -3.5357666015625, -3.39739990234375, -3.259033203125, -3.12066650390625, -2.9822998046875, -2.84393310546875, -2.70556640625, -2.56719970703125, -2.4288330078125, -2.29046630859375, -2.152099609375, -2.01373291015625, -1.8753662109375, -1.73699951171875, -1.5986328125, -1.46026611328125, -1.3218994140625, -1.18353271484375, -1.045166015625, -0.90679931640625, -0.7684326171875, -0.63006591796875, -0.49169921875, -0.35333251953125, -0.2149658203125, -0.07659912109375, 0.061767578125, 0.20013427734375, 0.3385009765625, 0.47686767578125, 0.615234375, 0.75360107421875, 0.8919677734375, 1.03033447265625, 1.168701171875, 1.30706787109375, 1.4454345703125, 1.58380126953125, 1.72216796875, 1.86053466796875, 1.9989013671875, 2.13726806640625, 2.275634765625, 2.41400146484375, 2.5523681640625, 2.69073486328125, 2.8291015625, 2.96746826171875, 3.1058349609375, 3.24420166015625, 3.382568359375, 3.52093505859375, 3.6593017578125, 3.79766845703125, 3.93603515625, 4.07440185546875, 4.2127685546875, 4.35113525390625, 4.489501953125, 4.62786865234375, 4.7662353515625, 4.90460205078125, 5.04296875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 11.0, 15.0, 22.0, 26.0, 30.0, 35.0, 43.0, 57.0, 76.0, 105.0, 142.0, 207.0, 389.0, 822.0, 16796.0, 3973194.0, 199106.0, 1763.0, 464.0, 283.0, 159.0, 129.0, 93.0, 50.0, 47.0, 43.0, 26.0, 30.0, 20.0, 16.0, 16.0, 12.0, 8.0, 4.0, 4.0, 4.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.75, -39.4228515625, -38.095703125, -36.7685546875, -35.44140625, -34.1142578125, -32.787109375, -31.4599609375, -30.1328125, -28.8056640625, -27.478515625, -26.1513671875, -24.82421875, -23.4970703125, -22.169921875, -20.8427734375, -19.515625, -18.1884765625, -16.861328125, -15.5341796875, -14.20703125, -12.8798828125, -11.552734375, -10.2255859375, -8.8984375, -7.5712890625, -6.244140625, -4.9169921875, -3.58984375, -2.2626953125, -0.935546875, 0.3916015625, 1.71875, 3.0458984375, 4.373046875, 5.7001953125, 7.02734375, 8.3544921875, 9.681640625, 11.0087890625, 12.3359375, 13.6630859375, 14.990234375, 16.3173828125, 17.64453125, 18.9716796875, 20.298828125, 21.6259765625, 22.953125, 24.2802734375, 25.607421875, 26.9345703125, 28.26171875, 29.5888671875, 30.916015625, 32.2431640625, 33.5703125, 34.8974609375, 36.224609375, 37.5517578125, 38.87890625, 40.2060546875, 41.533203125, 42.8603515625, 44.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 8.0, 12.0, 14.0, 18.0, 14.0, 28.0, 51.0, 72.0, 90.0, 130.0, 187.0, 256.0, 389.0, 547.0, 655.0, 454.0, 329.0, 237.0, 155.0, 136.0, 68.0, 53.0, 42.0, 29.0, 25.0, 13.0, 16.0, 8.0, 11.0, 4.0, 2.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.828125, -7.59918212890625, -7.3702392578125, -7.14129638671875, -6.912353515625, -6.68341064453125, -6.4544677734375, -6.22552490234375, -5.99658203125, -5.76763916015625, -5.5386962890625, -5.30975341796875, -5.080810546875, -4.85186767578125, -4.6229248046875, -4.39398193359375, -4.1650390625, -3.93609619140625, -3.7071533203125, -3.47821044921875, -3.249267578125, -3.02032470703125, -2.7913818359375, -2.56243896484375, -2.33349609375, -2.10455322265625, -1.8756103515625, -1.64666748046875, -1.417724609375, -1.18878173828125, -0.9598388671875, -0.73089599609375, -0.501953125, -0.27301025390625, -0.0440673828125, 0.18487548828125, 0.413818359375, 0.64276123046875, 0.8717041015625, 1.10064697265625, 1.32958984375, 1.55853271484375, 1.7874755859375, 2.01641845703125, 2.245361328125, 2.47430419921875, 2.7032470703125, 2.93218994140625, 3.1611328125, 3.39007568359375, 3.6190185546875, 3.84796142578125, 4.076904296875, 4.30584716796875, 4.5347900390625, 4.76373291015625, 4.99267578125, 5.22161865234375, 5.4505615234375, 5.67950439453125, 5.908447265625, 6.13739013671875, 6.3663330078125, 6.59527587890625, 6.82421875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 8.0, 18.0, 13.0, 14.0, 22.0, 47.0, 44.0, 58.0, 80.0, 147.0, 247.0, 413.0, 1185.0, 3991.0, 21577.0, 199882.0, 2917172.0, 964462.0, 71279.0, 9792.0, 2205.0, 748.0, 307.0, 169.0, 105.0, 78.0, 43.0, 46.0, 26.0, 24.0, 15.0, 18.0, 12.0, 10.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.90625, -17.376220703125, -16.84619140625, -16.316162109375, -15.7861328125, -15.256103515625, -14.72607421875, -14.196044921875, -13.666015625, -13.135986328125, -12.60595703125, -12.075927734375, -11.5458984375, -11.015869140625, -10.48583984375, -9.955810546875, -9.42578125, -8.895751953125, -8.36572265625, -7.835693359375, -7.3056640625, -6.775634765625, -6.24560546875, -5.715576171875, -5.185546875, -4.655517578125, -4.12548828125, -3.595458984375, -3.0654296875, -2.535400390625, -2.00537109375, -1.475341796875, -0.9453125, -0.415283203125, 0.11474609375, 0.644775390625, 1.1748046875, 1.704833984375, 2.23486328125, 2.764892578125, 3.294921875, 3.824951171875, 4.35498046875, 4.885009765625, 5.4150390625, 5.945068359375, 6.47509765625, 7.005126953125, 7.53515625, 8.065185546875, 8.59521484375, 9.125244140625, 9.6552734375, 10.185302734375, 10.71533203125, 11.245361328125, 11.775390625, 12.305419921875, 12.83544921875, 13.365478515625, 13.8955078125, 14.425537109375, 14.95556640625, 15.485595703125, 16.015625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 37.0, 179.0, 302.0, 296.0, 129.0, 55.0, 7.0, 1.0, 2.0], "bins": [-172.10218811035156, -169.1282501220703, -166.15431213378906, -163.1803741455078, -160.20643615722656, -157.23251342773438, -154.25857543945312, -151.28463745117188, -148.31069946289062, -145.33676147460938, -142.36282348632812, -139.38888549804688, -136.41494750976562, -133.44100952148438, -130.46707153320312, -127.4931411743164, -124.51920318603516, -121.5452651977539, -118.57132720947266, -115.59739685058594, -112.62345886230469, -109.64952087402344, -106.67558288574219, -103.70164489746094, -100.72770690917969, -97.75376892089844, -94.77983093261719, -91.80589294433594, -88.83196258544922, -85.85802459716797, -82.88408660888672, -79.91014862060547, -76.93622589111328, -73.96228790283203, -70.98834991455078, -68.01441955566406, -65.04048156738281, -62.06654357910156, -59.09260559082031, -56.11866760253906, -53.14472961425781, -50.17079162597656, -47.19685745239258, -44.22291946411133, -41.248985290527344, -38.275047302246094, -35.301109313964844, -32.327171325683594, -29.353239059448242, -26.379302978515625, -23.405364990234375, -20.431428909301758, -17.45749282836914, -14.483556747436523, -11.509618759155273, -8.535682678222656, -5.561746597290039, -2.5878100395202637, 0.3861265182495117, 3.3600635528564453, 6.3339996337890625, 9.30793571472168, 12.28187370300293, 15.255809783935547, 18.229745864868164]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 9.0, 7.0, 12.0, 13.0, 14.0, 12.0, 20.0, 17.0, 23.0, 28.0, 33.0, 32.0, 51.0, 38.0, 35.0, 33.0, 47.0, 43.0, 39.0, 45.0, 35.0, 42.0, 36.0, 34.0, 34.0, 27.0, 23.0, 36.0, 26.0, 22.0, 22.0, 15.0, 17.0, 13.0, 10.0, 14.0, 6.0, 6.0, 8.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.676143646240234, -21.95744514465332, -21.238746643066406, -20.520048141479492, -19.801349639892578, -19.082651138305664, -18.36395263671875, -17.645254135131836, -16.926555633544922, -16.207857131958008, -15.489158630371094, -14.77046012878418, -14.051761627197266, -13.333063125610352, -12.614364624023438, -11.895666122436523, -11.176968574523926, -10.458270072937012, -9.739571571350098, -9.020873069763184, -8.30217456817627, -7.5834760665893555, -6.8647780418396, -6.1460795402526855, -5.4273810386657715, -4.708682537078857, -3.9899840354919434, -3.2712857723236084, -2.5525872707366943, -1.8338887691497803, -1.1151905059814453, -0.39649200439453125, 0.3222064971923828, 1.0409049987792969, 1.7596033811569214, 2.478301763534546, 3.19700026512146, 3.915698766708374, 4.634397029876709, 5.353095531463623, 6.071794033050537, 6.790492534637451, 7.509191036224365, 8.227889060974121, 8.946587562561035, 9.66528606414795, 10.383984565734863, 11.102683067321777, 11.821381568908691, 12.540080070495605, 13.25877857208252, 13.977477073669434, 14.696175575256348, 15.414874076843262, 16.13357162475586, 16.852270126342773, 17.570968627929688, 18.2896671295166, 19.008365631103516, 19.72706413269043, 20.445762634277344, 21.164461135864258, 21.883159637451172, 22.601858139038086, 23.320556640625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 7.0, 4.0, 7.0, 10.0, 15.0, 14.0, 14.0, 23.0, 25.0, 27.0, 21.0, 34.0, 32.0, 29.0, 38.0, 41.0, 43.0, 51.0, 50.0, 36.0, 38.0, 34.0, 33.0, 31.0, 36.0, 36.0, 29.0, 28.0, 28.0, 32.0, 16.0, 18.0, 19.0, 16.0, 15.0, 14.0, 5.0, 12.0, 4.0, 6.0, 4.0, 11.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.1484375, -4.00909423828125, -3.8697509765625, -3.73040771484375, -3.591064453125, -3.45172119140625, -3.3123779296875, -3.17303466796875, -3.03369140625, -2.89434814453125, -2.7550048828125, -2.61566162109375, -2.476318359375, -2.33697509765625, -2.1976318359375, -2.05828857421875, -1.9189453125, -1.77960205078125, -1.6402587890625, -1.50091552734375, -1.361572265625, -1.22222900390625, -1.0828857421875, -0.94354248046875, -0.80419921875, -0.66485595703125, -0.5255126953125, -0.38616943359375, -0.246826171875, -0.10748291015625, 0.0318603515625, 0.17120361328125, 0.310546875, 0.44989013671875, 0.5892333984375, 0.72857666015625, 0.867919921875, 1.00726318359375, 1.1466064453125, 1.28594970703125, 1.42529296875, 1.56463623046875, 1.7039794921875, 1.84332275390625, 1.982666015625, 2.12200927734375, 2.2613525390625, 2.40069580078125, 2.5400390625, 2.67938232421875, 2.8187255859375, 2.95806884765625, 3.097412109375, 3.23675537109375, 3.3760986328125, 3.51544189453125, 3.65478515625, 3.79412841796875, 3.9334716796875, 4.07281494140625, 4.212158203125, 4.35150146484375, 4.4908447265625, 4.63018798828125, 4.76953125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 8.0, 10.0, 33.0, 21.0, 31.0, 57.0, 93.0, 143.0, 220.0, 306.0, 463.0, 759.0, 1198.0, 1901.0, 2732.0, 4030.0, 6488.0, 9976.0, 15393.0, 24398.0, 38855.0, 64982.0, 120141.0, 317284.0, 201134.0, 93519.0, 53667.0, 32691.0, 20325.0, 13120.0, 8580.0, 5492.0, 3568.0, 2426.0, 1577.0, 1044.0, 626.0, 425.0, 299.0, 200.0, 119.0, 69.0, 48.0, 35.0, 23.0, 13.0, 15.0, 9.0, 10.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.1920166015625, -0.1863384246826172, -0.18066024780273438, -0.17498207092285156, -0.16930389404296875, -0.16362571716308594, -0.15794754028320312, -0.1522693634033203, -0.1465911865234375, -0.1409130096435547, -0.13523483276367188, -0.12955665588378906, -0.12387847900390625, -0.11820030212402344, -0.11252212524414062, -0.10684394836425781, -0.101165771484375, -0.09548759460449219, -0.08980941772460938, -0.08413124084472656, -0.07845306396484375, -0.07277488708496094, -0.06709671020507812, -0.06141853332519531, -0.0557403564453125, -0.05006217956542969, -0.044384002685546875, -0.03870582580566406, -0.03302764892578125, -0.027349472045898438, -0.021671295166015625, -0.015993118286132812, -0.01031494140625, -0.0046367645263671875, 0.001041412353515625, 0.0067195892333984375, 0.01239776611328125, 0.018075942993164062, 0.023754119873046875, 0.029432296752929688, 0.0351104736328125, 0.04078865051269531, 0.046466827392578125, 0.05214500427246094, 0.05782318115234375, 0.06350135803222656, 0.06917953491210938, 0.07485771179199219, 0.080535888671875, 0.08621406555175781, 0.09189224243164062, 0.09757041931152344, 0.10324859619140625, 0.10892677307128906, 0.11460494995117188, 0.12028312683105469, 0.1259613037109375, 0.1316394805908203, 0.13731765747070312, 0.14299583435058594, 0.14867401123046875, 0.15435218811035156, 0.16003036499023438, 0.1657085418701172, 0.17138671875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 3.0, 4.0, 10.0, 13.0, 15.0, 12.0, 17.0, 13.0, 27.0, 21.0, 26.0, 40.0, 28.0, 36.0, 47.0, 47.0, 41.0, 47.0, 46.0, 1066.0, 39.0, 35.0, 31.0, 39.0, 44.0, 26.0, 28.0, 37.0, 27.0, 18.0, 24.0, 15.0, 18.0, 19.0, 16.0, 7.0, 12.0, 10.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.369140625, -3.26409912109375, -3.1590576171875, -3.05401611328125, -2.948974609375, -2.84393310546875, -2.7388916015625, -2.63385009765625, -2.52880859375, -2.42376708984375, -2.3187255859375, -2.21368408203125, -2.108642578125, -2.00360107421875, -1.8985595703125, -1.79351806640625, -1.6884765625, -1.58343505859375, -1.4783935546875, -1.37335205078125, -1.268310546875, -1.16326904296875, -1.0582275390625, -0.95318603515625, -0.84814453125, -0.74310302734375, -0.6380615234375, -0.53302001953125, -0.427978515625, -0.32293701171875, -0.2178955078125, -0.11285400390625, -0.0078125, 0.09722900390625, 0.2022705078125, 0.30731201171875, 0.412353515625, 0.51739501953125, 0.6224365234375, 0.72747802734375, 0.83251953125, 0.93756103515625, 1.0426025390625, 1.14764404296875, 1.252685546875, 1.35772705078125, 1.4627685546875, 1.56781005859375, 1.6728515625, 1.77789306640625, 1.8829345703125, 1.98797607421875, 2.093017578125, 2.19805908203125, 2.3031005859375, 2.40814208984375, 2.51318359375, 2.61822509765625, 2.7232666015625, 2.82830810546875, 2.933349609375, 3.03839111328125, 3.1434326171875, 3.24847412109375, 3.353515625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 20.0, 19.0, 34.0, 44.0, 72.0, 99.0, 156.0, 197.0, 334.0, 454.0, 672.0, 983.0, 1572.0, 2237.0, 3381.0, 4945.0, 7392.0, 10949.0, 16328.0, 25086.0, 39127.0, 64457.0, 112763.0, 1319746.0, 218223.0, 102641.0, 59360.0, 36160.0, 22992.0, 15250.0, 10132.0, 6976.0, 4547.0, 3088.0, 2221.0, 1442.0, 981.0, 664.0, 460.0, 289.0, 231.0, 127.0, 80.0, 61.0, 43.0, 27.0, 26.0, 10.0, 12.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0965576171875, -0.09353256225585938, -0.09050750732421875, -0.08748245239257812, -0.0844573974609375, -0.08143234252929688, -0.07840728759765625, -0.07538223266601562, -0.072357177734375, -0.06933212280273438, -0.06630706787109375, -0.06328201293945312, -0.0602569580078125, -0.057231903076171875, -0.05420684814453125, -0.051181793212890625, -0.04815673828125, -0.045131683349609375, -0.04210662841796875, -0.039081573486328125, -0.0360565185546875, -0.033031463623046875, -0.03000640869140625, -0.026981353759765625, -0.023956298828125, -0.020931243896484375, -0.01790618896484375, -0.014881134033203125, -0.0118560791015625, -0.008831024169921875, -0.00580596923828125, -0.002780914306640625, 0.000244140625, 0.003269195556640625, 0.00629425048828125, 0.009319305419921875, 0.0123443603515625, 0.015369415283203125, 0.01839447021484375, 0.021419525146484375, 0.024444580078125, 0.027469635009765625, 0.03049468994140625, 0.033519744873046875, 0.0365447998046875, 0.039569854736328125, 0.04259490966796875, 0.045619964599609375, 0.04864501953125, 0.051670074462890625, 0.05469512939453125, 0.057720184326171875, 0.0607452392578125, 0.06377029418945312, 0.06679534912109375, 0.06982040405273438, 0.072845458984375, 0.07587051391601562, 0.07889556884765625, 0.08192062377929688, 0.0849456787109375, 0.08797073364257812, 0.09099578857421875, 0.09402084350585938, 0.0970458984375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 6.0, 4.0, 3.0, 5.0, 8.0, 8.0, 8.0, 10.0, 6.0, 9.0, 9.0, 13.0, 11.0, 17.0, 13.0, 20.0, 22.0, 17.0, 72.0, 57.0, 104.0, 219.0, 92.0, 55.0, 46.0, 18.0, 19.0, 18.0, 19.0, 22.0, 5.0, 8.0, 9.0, 6.0, 12.0, 5.0, 5.0, 4.0, 3.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5441328287124634e-06, -1.4789402484893799e-06, -1.4137476682662964e-06, -1.3485550880432129e-06, -1.2833625078201294e-06, -1.218169927597046e-06, -1.1529773473739624e-06, -1.087784767150879e-06, -1.0225921869277954e-06, -9.57399606704712e-07, -8.922070264816284e-07, -8.270144462585449e-07, -7.618218660354614e-07, -6.966292858123779e-07, -6.314367055892944e-07, -5.662441253662109e-07, -5.010515451431274e-07, -4.3585896492004395e-07, -3.7066638469696045e-07, -3.0547380447387695e-07, -2.4028122425079346e-07, -1.7508864402770996e-07, -1.0989606380462646e-07, -4.470348358154297e-08, 2.0489096641540527e-08, 8.568167686462402e-08, 1.5087425708770752e-07, 2.1606683731079102e-07, 2.812594175338745e-07, 3.46451997756958e-07, 4.116445779800415e-07, 4.76837158203125e-07, 5.420297384262085e-07, 6.07222318649292e-07, 6.724148988723755e-07, 7.37607479095459e-07, 8.028000593185425e-07, 8.67992639541626e-07, 9.331852197647095e-07, 9.98377799987793e-07, 1.0635703802108765e-06, 1.12876296043396e-06, 1.1939555406570435e-06, 1.259148120880127e-06, 1.3243407011032104e-06, 1.389533281326294e-06, 1.4547258615493774e-06, 1.519918441772461e-06, 1.5851110219955444e-06, 1.650303602218628e-06, 1.7154961824417114e-06, 1.780688762664795e-06, 1.8458813428878784e-06, 1.911073923110962e-06, 1.9762665033340454e-06, 2.041459083557129e-06, 2.1066516637802124e-06, 2.171844244003296e-06, 2.2370368242263794e-06, 2.302229404449463e-06, 2.3674219846725464e-06, 2.43261456489563e-06, 2.4978071451187134e-06, 2.562999725341797e-06]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 6.0, 5.0, 5.0, 5.0, 5.0, 13.0, 14.0, 19.0, 28.0, 43.0, 45.0, 45.0, 84.0, 136.0, 214.0, 469.0, 10905.0, 1007587.0, 27412.0, 689.0, 258.0, 144.0, 105.0, 69.0, 42.0, 40.0, 31.0, 25.0, 22.0, 12.0, 10.0, 4.0, 5.0, 7.0, 12.0, 5.0, 4.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0], "bins": [-5.352497100830078e-05, -5.2138231694698334e-05, -5.0751492381095886e-05, -4.936475306749344e-05, -4.797801375389099e-05, -4.6591274440288544e-05, -4.5204535126686096e-05, -4.381779581308365e-05, -4.24310564994812e-05, -4.1044317185878754e-05, -3.9657577872276306e-05, -3.827083855867386e-05, -3.688409924507141e-05, -3.5497359931468964e-05, -3.4110620617866516e-05, -3.272388130426407e-05, -3.133714199066162e-05, -2.9950402677059174e-05, -2.8563663363456726e-05, -2.717692404985428e-05, -2.579018473625183e-05, -2.4403445422649384e-05, -2.3016706109046936e-05, -2.162996679544449e-05, -2.024322748184204e-05, -1.8856488168239594e-05, -1.7469748854637146e-05, -1.60830095410347e-05, -1.4696270227432251e-05, -1.3309530913829803e-05, -1.1922791600227356e-05, -1.0536052286624908e-05, -9.149312973022461e-06, -7.762573659420013e-06, -6.375834345817566e-06, -4.989095032215118e-06, -3.602355718612671e-06, -2.2156164050102234e-06, -8.288770914077759e-07, 5.578622221946716e-07, 1.944601535797119e-06, 3.3313408493995667e-06, 4.718080163002014e-06, 6.104819476604462e-06, 7.491558790206909e-06, 8.878298103809357e-06, 1.0265037417411804e-05, 1.1651776731014252e-05, 1.30385160446167e-05, 1.4425255358219147e-05, 1.5811994671821594e-05, 1.7198733985424042e-05, 1.858547329902649e-05, 1.9972212612628937e-05, 2.1358951926231384e-05, 2.2745691239833832e-05, 2.413243055343628e-05, 2.5519169867038727e-05, 2.6905909180641174e-05, 2.8292648494243622e-05, 2.967938780784607e-05, 3.106612712144852e-05, 3.2452866435050964e-05, 3.383960574865341e-05, 3.522634506225586e-05]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 16.0, 60.0, 224.0, 462.0, 205.0, 39.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.366380595565715e-07, -7.908117822807981e-07, -6.449855618484435e-07, -4.9915928457267e-07, -3.5333300729689654e-07, -2.0750673002112308e-07, -6.168050958876847e-08, 8.414582453042385e-08, 2.2997204496277845e-07, 3.757983222385519e-07, 5.216245426709065e-07, 6.6745081994668e-07, 8.132770972224534e-07, 9.59103317654808e-07, 1.1049296517740004e-06, 1.2507559858931927e-06, 1.3965820926387096e-06, 1.5424083130710642e-06, 1.6882346471902565e-06, 1.8340608676226111e-06, 1.9798872017418034e-06, 2.1257133084873203e-06, 2.2715396426065126e-06, 2.417365976725705e-06, 2.5631923108448973e-06, 2.7090186449640896e-06, 2.8548447517096065e-06, 3.000671085828799e-06, 3.146497419947991e-06, 3.292323526693508e-06, 3.4381498608127004e-06, 3.5839761949318927e-06, 3.7298027564247604e-06, 3.875628863170277e-06, 4.021455424663145e-06, 4.167281531408662e-06, 4.313107638154179e-06, 4.458934199647047e-06, 4.6047603063925635e-06, 4.75058641313808e-06, 4.896412974630948e-06, 5.042239081376465e-06, 5.188065642869333e-06, 5.33389174961485e-06, 5.4797178563603666e-06, 5.625544417853234e-06, 5.771370524598751e-06, 5.917197086091619e-06, 6.063022738089785e-06, 6.208848844835302e-06, 6.35467540632817e-06, 6.5005015130736865e-06, 6.646327619819203e-06, 6.792154181312071e-06, 6.937980288057588e-06, 7.083806849550456e-06, 7.229632956295973e-06, 7.3754590630414896e-06, 7.521285624534357e-06, 7.667111276532523e-06, 7.812937838025391e-06, 7.958764399518259e-06, 8.104590961011127e-06, 8.250416613009293e-06, 8.39624317450216e-06]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 0.0, 5.0, 15.0, 0.0, 23.0, 0.0, 25.0, 0.0, 43.0, 72.0, 0.0, 118.0, 0.0, 132.0, 0.0, 131.0, 0.0, 106.0, 108.0, 0.0, 92.0, 0.0, 47.0, 0.0, 44.0, 17.0, 0.0, 10.0, 0.0, 12.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.797513484954834e-07, -9.462237358093262e-07, -9.126961231231689e-07, -8.791685104370117e-07, -8.456408977508545e-07, -8.121132850646973e-07, -7.7858567237854e-07, -7.450580596923828e-07, -7.115304470062256e-07, -6.780028343200684e-07, -6.444752216339111e-07, -6.109476089477539e-07, -5.774199962615967e-07, -5.438923835754395e-07, -5.103647708892822e-07, -4.76837158203125e-07, -4.4330954551696777e-07, -4.0978193283081055e-07, -3.762543201446533e-07, -3.427267074584961e-07, -3.0919909477233887e-07, -2.7567148208618164e-07, -2.421438694000244e-07, -2.086162567138672e-07, -1.7508864402770996e-07, -1.4156103134155273e-07, -1.0803341865539551e-07, -7.450580596923828e-08, -4.0978193283081055e-08, -7.450580596923828e-09, 2.60770320892334e-08, 5.960464477539063e-08, 9.313225746154785e-08, 1.2665987014770508e-07, 1.601874828338623e-07, 1.9371509552001953e-07, 2.2724270820617676e-07, 2.60770320892334e-07, 2.942979335784912e-07, 3.2782554626464844e-07, 3.6135315895080566e-07, 3.948807716369629e-07, 4.284083843231201e-07, 4.6193599700927734e-07, 4.954636096954346e-07, 5.289912223815918e-07, 5.62518835067749e-07, 5.960464477539062e-07, 6.295740604400635e-07, 6.631016731262207e-07, 6.966292858123779e-07, 7.301568984985352e-07, 7.636845111846924e-07, 7.972121238708496e-07, 8.307397365570068e-07, 8.642673492431641e-07, 8.977949619293213e-07, 9.313225746154785e-07, 9.648501873016357e-07, 9.98377799987793e-07, 1.0319054126739502e-06, 1.0654330253601074e-06, 1.0989606380462646e-06, 1.1324882507324219e-06]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 7.0, 4.0, 7.0, 10.0, 15.0, 14.0, 14.0, 23.0, 25.0, 27.0, 21.0, 34.0, 32.0, 29.0, 38.0, 41.0, 43.0, 51.0, 50.0, 36.0, 38.0, 34.0, 33.0, 31.0, 36.0, 36.0, 29.0, 28.0, 28.0, 32.0, 16.0, 18.0, 19.0, 16.0, 15.0, 14.0, 5.0, 12.0, 4.0, 6.0, 4.0, 11.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.1484375, -4.00909423828125, -3.8697509765625, -3.73040771484375, -3.591064453125, -3.45172119140625, -3.3123779296875, -3.17303466796875, -3.03369140625, -2.89434814453125, -2.7550048828125, -2.61566162109375, -2.476318359375, -2.33697509765625, -2.1976318359375, -2.05828857421875, -1.9189453125, -1.77960205078125, -1.6402587890625, -1.50091552734375, -1.361572265625, -1.22222900390625, -1.0828857421875, -0.94354248046875, -0.80419921875, -0.66485595703125, -0.5255126953125, -0.38616943359375, -0.246826171875, -0.10748291015625, 0.0318603515625, 0.17120361328125, 0.310546875, 0.44989013671875, 0.5892333984375, 0.72857666015625, 0.867919921875, 1.00726318359375, 1.1466064453125, 1.28594970703125, 1.42529296875, 1.56463623046875, 1.7039794921875, 1.84332275390625, 1.982666015625, 2.12200927734375, 2.2613525390625, 2.40069580078125, 2.5400390625, 2.67938232421875, 2.8187255859375, 2.95806884765625, 3.097412109375, 3.23675537109375, 3.3760986328125, 3.51544189453125, 3.65478515625, 3.79412841796875, 3.9334716796875, 4.07281494140625, 4.212158203125, 4.35150146484375, 4.4908447265625, 4.63018798828125, 4.76953125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 2.0, 9.0, 9.0, 7.0, 11.0, 18.0, 27.0, 38.0, 63.0, 92.0, 102.0, 187.0, 291.0, 477.0, 868.0, 1560.0, 3051.0, 6201.0, 11730.0, 22796.0, 45198.0, 87821.0, 165870.0, 264947.0, 206847.0, 111424.0, 58280.0, 29391.0, 14987.0, 7736.0, 3817.0, 2024.0, 1061.0, 615.0, 328.0, 217.0, 137.0, 102.0, 68.0, 40.0, 36.0, 15.0, 13.0, 16.0, 6.0, 12.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.33203125, -6.12567138671875, -5.9193115234375, -5.71295166015625, -5.506591796875, -5.30023193359375, -5.0938720703125, -4.88751220703125, -4.68115234375, -4.47479248046875, -4.2684326171875, -4.06207275390625, -3.855712890625, -3.64935302734375, -3.4429931640625, -3.23663330078125, -3.0302734375, -2.82391357421875, -2.6175537109375, -2.41119384765625, -2.204833984375, -1.99847412109375, -1.7921142578125, -1.58575439453125, -1.37939453125, -1.17303466796875, -0.9666748046875, -0.76031494140625, -0.553955078125, -0.34759521484375, -0.1412353515625, 0.06512451171875, 0.271484375, 0.47784423828125, 0.6842041015625, 0.89056396484375, 1.096923828125, 1.30328369140625, 1.5096435546875, 1.71600341796875, 1.92236328125, 2.12872314453125, 2.3350830078125, 2.54144287109375, 2.747802734375, 2.95416259765625, 3.1605224609375, 3.36688232421875, 3.5732421875, 3.77960205078125, 3.9859619140625, 4.19232177734375, 4.398681640625, 4.60504150390625, 4.8114013671875, 5.01776123046875, 5.22412109375, 5.43048095703125, 5.6368408203125, 5.84320068359375, 6.049560546875, 6.25592041015625, 6.4622802734375, 6.66864013671875, 6.875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 6.0, 9.0, 14.0, 14.0, 21.0, 19.0, 27.0, 43.0, 39.0, 38.0, 65.0, 78.0, 135.0, 228.0, 1341.0, 265.0, 199.0, 110.0, 86.0, 56.0, 36.0, 31.0, 35.0, 21.0, 27.0, 16.0, 23.0, 15.0, 9.0, 12.0, 4.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.875, -10.454833984375, -10.03466796875, -9.614501953125, -9.1943359375, -8.774169921875, -8.35400390625, -7.933837890625, -7.513671875, -7.093505859375, -6.67333984375, -6.253173828125, -5.8330078125, -5.412841796875, -4.99267578125, -4.572509765625, -4.15234375, -3.732177734375, -3.31201171875, -2.891845703125, -2.4716796875, -2.051513671875, -1.63134765625, -1.211181640625, -0.791015625, -0.370849609375, 0.04931640625, 0.469482421875, 0.8896484375, 1.309814453125, 1.72998046875, 2.150146484375, 2.5703125, 2.990478515625, 3.41064453125, 3.830810546875, 4.2509765625, 4.671142578125, 5.09130859375, 5.511474609375, 5.931640625, 6.351806640625, 6.77197265625, 7.192138671875, 7.6123046875, 8.032470703125, 8.45263671875, 8.872802734375, 9.29296875, 9.713134765625, 10.13330078125, 10.553466796875, 10.9736328125, 11.393798828125, 11.81396484375, 12.234130859375, 12.654296875, 13.074462890625, 13.49462890625, 13.914794921875, 14.3349609375, 14.755126953125, 15.17529296875, 15.595458984375, 16.015625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 11.0, 8.0, 9.0, 20.0, 22.0, 27.0, 41.0, 69.0, 88.0, 128.0, 195.0, 406.0, 669.0, 1815.0, 75357.0, 3049194.0, 14881.0, 1316.0, 560.0, 292.0, 213.0, 133.0, 77.0, 46.0, 40.0, 27.0, 19.0, 15.0, 7.0, 4.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.84375, -51.46630859375, -50.0888671875, -48.71142578125, -47.333984375, -45.95654296875, -44.5791015625, -43.20166015625, -41.82421875, -40.44677734375, -39.0693359375, -37.69189453125, -36.314453125, -34.93701171875, -33.5595703125, -32.18212890625, -30.8046875, -29.42724609375, -28.0498046875, -26.67236328125, -25.294921875, -23.91748046875, -22.5400390625, -21.16259765625, -19.78515625, -18.40771484375, -17.0302734375, -15.65283203125, -14.275390625, -12.89794921875, -11.5205078125, -10.14306640625, -8.765625, -7.38818359375, -6.0107421875, -4.63330078125, -3.255859375, -1.87841796875, -0.5009765625, 0.87646484375, 2.25390625, 3.63134765625, 5.0087890625, 6.38623046875, 7.763671875, 9.14111328125, 10.5185546875, 11.89599609375, 13.2734375, 14.65087890625, 16.0283203125, 17.40576171875, 18.783203125, 20.16064453125, 21.5380859375, 22.91552734375, 24.29296875, 25.67041015625, 27.0478515625, 28.42529296875, 29.802734375, 31.18017578125, 32.5576171875, 33.93505859375, 35.3125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 27.0, 73.0, 178.0, 244.0, 248.0, 143.0, 75.0, 15.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.38157653808594, -36.541175842285156, -33.700775146484375, -30.860374450683594, -28.019973754882812, -25.17957305908203, -22.339170455932617, -19.498769760131836, -16.658369064331055, -13.817968368530273, -10.977567672729492, -8.137166023254395, -5.296765327453613, -2.456364631652832, 0.3840370178222656, 3.224437713623047, 6.064838409423828, 8.90523910522461, 11.74563980102539, 14.586041450500488, 17.426441192626953, 20.266841888427734, 23.10724449157715, 25.94764518737793, 28.78804588317871, 31.628446578979492, 34.468849182128906, 37.30924987792969, 40.14965057373047, 42.99005126953125, 45.83045196533203, 48.67085266113281, 51.511253356933594, 54.351654052734375, 57.192054748535156, 60.03245544433594, 62.87285614013672, 65.7132568359375, 68.55365753173828, 71.39405822753906, 74.23445892333984, 77.07485961914062, 79.9152603149414, 82.75566101074219, 85.59606170654297, 88.43646240234375, 91.27686309814453, 94.11726379394531, 96.95767211914062, 99.7980728149414, 102.63847351074219, 105.47887420654297, 108.31927490234375, 111.15967559814453, 114.00007629394531, 116.8404769897461, 119.68087768554688, 122.52127838134766, 125.36167907714844, 128.20208740234375, 131.04248046875, 133.8828887939453, 136.72328186035156, 139.56369018554688, 142.40408325195312]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 13.0, 8.0, 15.0, 18.0, 13.0, 23.0, 16.0, 16.0, 24.0, 29.0, 35.0, 41.0, 43.0, 44.0, 46.0, 49.0, 50.0, 46.0, 37.0, 60.0, 43.0, 38.0, 30.0, 28.0, 31.0, 28.0, 18.0, 21.0, 16.0, 12.0, 19.0, 16.0, 20.0, 13.0, 6.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.38334655761719, -36.24794006347656, -35.1125373840332, -33.97713088989258, -32.84172821044922, -31.706321716308594, -30.5709171295166, -29.43551254272461, -28.300107955932617, -27.164703369140625, -26.029298782348633, -24.89389419555664, -23.758487701416016, -22.623085021972656, -21.48767852783203, -20.35227394104004, -19.216869354248047, -18.081464767456055, -16.946060180664062, -15.810654640197754, -14.675250053405762, -13.53984546661377, -12.404439926147461, -11.269035339355469, -10.133630752563477, -8.998226165771484, -7.862821102142334, -6.727416038513184, -5.592011451721191, -4.456606864929199, -3.321201801300049, -2.1857967376708984, -1.0503921508789062, 0.08501267433166504, 1.2204174995422363, 2.3558223247528076, 3.491227149963379, 4.626631736755371, 5.7620368003845215, 6.897441864013672, 8.032846450805664, 9.168251037597656, 10.303655624389648, 11.439061164855957, 12.57446575164795, 13.709870338439941, 14.84527587890625, 15.980680465698242, 17.116085052490234, 18.251489639282227, 19.38689422607422, 20.52229881286621, 21.657703399658203, 22.793109893798828, 23.92851448059082, 25.063919067382812, 26.199323654174805, 27.334728240966797, 28.47013282775879, 29.60553741455078, 30.740943908691406, 31.876346588134766, 33.01175308227539, 34.14715576171875, 35.282562255859375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 10.0, 7.0, 10.0, 11.0, 17.0, 18.0, 11.0, 17.0, 22.0, 32.0, 34.0, 22.0, 28.0, 38.0, 42.0, 45.0, 51.0, 49.0, 41.0, 28.0, 39.0, 39.0, 32.0, 44.0, 24.0, 20.0, 39.0, 32.0, 23.0, 33.0, 16.0, 15.0, 17.0, 12.0, 12.0, 15.0, 8.0, 17.0, 7.0, 2.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.12109375, -3.98046875, -3.83984375, -3.69921875, -3.55859375, -3.41796875, -3.27734375, -3.13671875, -2.99609375, -2.85546875, -2.71484375, -2.57421875, -2.43359375, -2.29296875, -2.15234375, -2.01171875, -1.87109375, -1.73046875, -1.58984375, -1.44921875, -1.30859375, -1.16796875, -1.02734375, -0.88671875, -0.74609375, -0.60546875, -0.46484375, -0.32421875, -0.18359375, -0.04296875, 0.09765625, 0.23828125, 0.37890625, 0.51953125, 0.66015625, 0.80078125, 0.94140625, 1.08203125, 1.22265625, 1.36328125, 1.50390625, 1.64453125, 1.78515625, 1.92578125, 2.06640625, 2.20703125, 2.34765625, 2.48828125, 2.62890625, 2.76953125, 2.91015625, 3.05078125, 3.19140625, 3.33203125, 3.47265625, 3.61328125, 3.75390625, 3.89453125, 4.03515625, 4.17578125, 4.31640625, 4.45703125, 4.59765625, 4.73828125, 4.87890625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 5.0, 8.0, 13.0, 23.0, 53.0, 116.0, 387.0, 1482.0, 7013.0, 54494.0, 1591454.0, 2447779.0, 79336.0, 9422.0, 1903.0, 470.0, 169.0, 75.0, 31.0, 9.0, 10.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.75, -16.173828125, -15.59765625, -15.021484375, -14.4453125, -13.869140625, -13.29296875, -12.716796875, -12.140625, -11.564453125, -10.98828125, -10.412109375, -9.8359375, -9.259765625, -8.68359375, -8.107421875, -7.53125, -6.955078125, -6.37890625, -5.802734375, -5.2265625, -4.650390625, -4.07421875, -3.498046875, -2.921875, -2.345703125, -1.76953125, -1.193359375, -0.6171875, -0.041015625, 0.53515625, 1.111328125, 1.6875, 2.263671875, 2.83984375, 3.416015625, 3.9921875, 4.568359375, 5.14453125, 5.720703125, 6.296875, 6.873046875, 7.44921875, 8.025390625, 8.6015625, 9.177734375, 9.75390625, 10.330078125, 10.90625, 11.482421875, 12.05859375, 12.634765625, 13.2109375, 13.787109375, 14.36328125, 14.939453125, 15.515625, 16.091796875, 16.66796875, 17.244140625, 17.8203125, 18.396484375, 18.97265625, 19.548828125, 20.125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 13.0, 16.0, 27.0, 42.0, 71.0, 89.0, 146.0, 224.0, 348.0, 426.0, 655.0, 702.0, 429.0, 294.0, 189.0, 131.0, 82.0, 69.0, 46.0, 22.0, 18.0, 12.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.953125, -11.6607666015625, -11.368408203125, -11.0760498046875, -10.78369140625, -10.4913330078125, -10.198974609375, -9.9066162109375, -9.6142578125, -9.3218994140625, -9.029541015625, -8.7371826171875, -8.44482421875, -8.1524658203125, -7.860107421875, -7.5677490234375, -7.275390625, -6.9830322265625, -6.690673828125, -6.3983154296875, -6.10595703125, -5.8135986328125, -5.521240234375, -5.2288818359375, -4.9365234375, -4.6441650390625, -4.351806640625, -4.0594482421875, -3.76708984375, -3.4747314453125, -3.182373046875, -2.8900146484375, -2.59765625, -2.3052978515625, -2.012939453125, -1.7205810546875, -1.42822265625, -1.1358642578125, -0.843505859375, -0.5511474609375, -0.2587890625, 0.0335693359375, 0.325927734375, 0.6182861328125, 0.91064453125, 1.2030029296875, 1.495361328125, 1.7877197265625, 2.080078125, 2.3724365234375, 2.664794921875, 2.9571533203125, 3.24951171875, 3.5418701171875, 3.834228515625, 4.1265869140625, 4.4189453125, 4.7113037109375, 5.003662109375, 5.2960205078125, 5.58837890625, 5.8807373046875, 6.173095703125, 6.4654541015625, 6.7578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 9.0, 16.0, 34.0, 56.0, 78.0, 185.0, 387.0, 840.0, 2393.0, 11184.0, 147860.0, 3128461.0, 858170.0, 37377.0, 4794.0, 1350.0, 586.0, 224.0, 114.0, 63.0, 38.0, 25.0, 13.0, 9.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.90625, -19.36474609375, -18.8232421875, -18.28173828125, -17.740234375, -17.19873046875, -16.6572265625, -16.11572265625, -15.57421875, -15.03271484375, -14.4912109375, -13.94970703125, -13.408203125, -12.86669921875, -12.3251953125, -11.78369140625, -11.2421875, -10.70068359375, -10.1591796875, -9.61767578125, -9.076171875, -8.53466796875, -7.9931640625, -7.45166015625, -6.91015625, -6.36865234375, -5.8271484375, -5.28564453125, -4.744140625, -4.20263671875, -3.6611328125, -3.11962890625, -2.578125, -2.03662109375, -1.4951171875, -0.95361328125, -0.412109375, 0.12939453125, 0.6708984375, 1.21240234375, 1.75390625, 2.29541015625, 2.8369140625, 3.37841796875, 3.919921875, 4.46142578125, 5.0029296875, 5.54443359375, 6.0859375, 6.62744140625, 7.1689453125, 7.71044921875, 8.251953125, 8.79345703125, 9.3349609375, 9.87646484375, 10.41796875, 10.95947265625, 11.5009765625, 12.04248046875, 12.583984375, 13.12548828125, 13.6669921875, 14.20849609375, 14.75]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 30.0, 116.0, 280.0, 339.0, 176.0, 45.0, 17.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.49299621582031, -88.46482849121094, -85.43665313720703, -82.40848541259766, -79.38031768798828, -76.3521499633789, -73.323974609375, -70.29580688476562, -67.26763916015625, -64.23947143554688, -61.211299896240234, -58.183128356933594, -55.15496063232422, -52.12678909301758, -49.09861755371094, -46.07044982910156, -43.04227828979492, -40.01410675048828, -36.985939025878906, -33.957767486572266, -30.92959976196289, -27.90142822265625, -24.873258590698242, -21.845088958740234, -18.816919326782227, -15.788749694824219, -12.760580062866211, -9.732409477233887, -6.704239845275879, -3.676070213317871, -0.6478996276855469, 2.380270004272461, 5.408439636230469, 8.436609268188477, 11.464778900146484, 14.492949485778809, 17.5211181640625, 20.54928970336914, 23.57745933532715, 26.605628967285156, 29.633798599243164, 32.66196823120117, 35.69013977050781, 38.71830749511719, 41.74647903442383, 44.7746467590332, 47.802818298339844, 50.83098602294922, 53.85915756225586, 56.8873291015625, 59.915496826171875, 62.943668365478516, 65.97183990478516, 69.00000762939453, 72.0281753540039, 75.05635070800781, 78.08451843261719, 81.11268615722656, 84.14086151123047, 87.16902923583984, 90.19719696044922, 93.2253646850586, 96.2535400390625, 99.28170776367188, 102.30987548828125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 6.0, 11.0, 11.0, 14.0, 14.0, 16.0, 18.0, 12.0, 25.0, 31.0, 28.0, 32.0, 32.0, 41.0, 41.0, 44.0, 51.0, 31.0, 48.0, 33.0, 35.0, 47.0, 46.0, 29.0, 30.0, 31.0, 29.0, 27.0, 20.0, 24.0, 23.0, 15.0, 15.0, 11.0, 11.0, 15.0, 6.0, 11.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-24.68231964111328, -23.925870895385742, -23.169422149658203, -22.412975311279297, -21.656526565551758, -20.90007781982422, -20.14362907409668, -19.38718032836914, -18.630733489990234, -17.874284744262695, -17.117835998535156, -16.36138916015625, -15.604940414428711, -14.848491668701172, -14.092042922973633, -13.335594177246094, -12.579145431518555, -11.822696685791016, -11.066248893737793, -10.309800148010254, -9.553352355957031, -8.796903610229492, -8.040454864501953, -7.284006595611572, -6.527558326721191, -5.7711100578308105, -5.01466178894043, -4.258213043212891, -3.5017647743225098, -2.745316505432129, -1.9888677597045898, -1.232419490814209, -0.4759712219238281, 0.2804771661758423, 1.0369255542755127, 1.7933740615844727, 2.5498223304748535, 3.3062705993652344, 4.062719345092773, 4.819167613983154, 5.575615882873535, 6.332064151763916, 7.088512420654297, 7.844961166381836, 8.601409912109375, 9.357857704162598, 10.114306449890137, 10.87075424194336, 11.627202987670898, 12.383651733398438, 13.14009952545166, 13.8965482711792, 14.652996063232422, 15.409444808959961, 16.1658935546875, 16.92234230041504, 17.678791046142578, 18.435239791870117, 19.191688537597656, 19.948135375976562, 20.7045841217041, 21.46103286743164, 22.21748161315918, 22.97393035888672, 23.730377197265625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 8.0, 5.0, 9.0, 9.0, 8.0, 14.0, 12.0, 17.0, 10.0, 17.0, 23.0, 27.0, 32.0, 25.0, 34.0, 43.0, 37.0, 56.0, 39.0, 37.0, 43.0, 44.0, 40.0, 56.0, 26.0, 23.0, 18.0, 32.0, 28.0, 29.0, 31.0, 23.0, 22.0, 22.0, 18.0, 12.0, 16.0, 11.0, 7.0, 6.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.654296875, -3.528656005859375, -3.40301513671875, -3.277374267578125, -3.1517333984375, -3.026092529296875, -2.90045166015625, -2.774810791015625, -2.649169921875, -2.523529052734375, -2.39788818359375, -2.272247314453125, -2.1466064453125, -2.020965576171875, -1.89532470703125, -1.769683837890625, -1.64404296875, -1.518402099609375, -1.39276123046875, -1.267120361328125, -1.1414794921875, -1.015838623046875, -0.89019775390625, -0.764556884765625, -0.638916015625, -0.513275146484375, -0.38763427734375, -0.261993408203125, -0.1363525390625, -0.010711669921875, 0.11492919921875, 0.240570068359375, 0.3662109375, 0.491851806640625, 0.61749267578125, 0.743133544921875, 0.8687744140625, 0.994415283203125, 1.12005615234375, 1.245697021484375, 1.371337890625, 1.496978759765625, 1.62261962890625, 1.748260498046875, 1.8739013671875, 1.999542236328125, 2.12518310546875, 2.250823974609375, 2.37646484375, 2.502105712890625, 2.62774658203125, 2.753387451171875, 2.8790283203125, 3.004669189453125, 3.13031005859375, 3.255950927734375, 3.381591796875, 3.507232666015625, 3.63287353515625, 3.758514404296875, 3.8841552734375, 4.009796142578125, 4.13543701171875, 4.261077880859375, 4.38671875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 10.0, 10.0, 20.0, 36.0, 37.0, 65.0, 86.0, 140.0, 197.0, 295.0, 478.0, 660.0, 1059.0, 1548.0, 2227.0, 3275.0, 4860.0, 7208.0, 10906.0, 16493.0, 25493.0, 40611.0, 67468.0, 127368.0, 332440.0, 180472.0, 85907.0, 49801.0, 30735.0, 19746.0, 12722.0, 8498.0, 5729.0, 3858.0, 2669.0, 1779.0, 1258.0, 778.0, 543.0, 362.0, 240.0, 148.0, 108.0, 75.0, 50.0, 30.0, 16.0, 17.0, 9.0, 8.0, 8.0, 4.0, 1.0, 2.0], "bins": [-0.1800537109375, -0.17486572265625, -0.169677734375, -0.16448974609375, -0.1593017578125, -0.15411376953125, -0.14892578125, -0.14373779296875, -0.1385498046875, -0.13336181640625, -0.128173828125, -0.12298583984375, -0.1177978515625, -0.11260986328125, -0.107421875, -0.10223388671875, -0.0970458984375, -0.09185791015625, -0.086669921875, -0.08148193359375, -0.0762939453125, -0.07110595703125, -0.06591796875, -0.06072998046875, -0.0555419921875, -0.05035400390625, -0.045166015625, -0.03997802734375, -0.0347900390625, -0.02960205078125, -0.0244140625, -0.01922607421875, -0.0140380859375, -0.00885009765625, -0.003662109375, 0.00152587890625, 0.0067138671875, 0.01190185546875, 0.01708984375, 0.02227783203125, 0.0274658203125, 0.03265380859375, 0.037841796875, 0.04302978515625, 0.0482177734375, 0.05340576171875, 0.05859375, 0.06378173828125, 0.0689697265625, 0.07415771484375, 0.079345703125, 0.08453369140625, 0.0897216796875, 0.09490966796875, 0.10009765625, 0.10528564453125, 0.1104736328125, 0.11566162109375, 0.120849609375, 0.12603759765625, 0.1312255859375, 0.13641357421875, 0.1416015625, 0.14678955078125, 0.1519775390625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 4.0, 0.0, 7.0, 3.0, 4.0, 10.0, 8.0, 10.0, 14.0, 11.0, 14.0, 16.0, 23.0, 21.0, 30.0, 33.0, 29.0, 34.0, 42.0, 28.0, 38.0, 27.0, 42.0, 36.0, 1061.0, 39.0, 46.0, 40.0, 25.0, 35.0, 32.0, 42.0, 30.0, 28.0, 31.0, 27.0, 22.0, 11.0, 13.0, 14.0, 6.0, 5.0, 6.0, 7.0, 13.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.673828125, -2.587646484375, -2.50146484375, -2.415283203125, -2.3291015625, -2.242919921875, -2.15673828125, -2.070556640625, -1.984375, -1.898193359375, -1.81201171875, -1.725830078125, -1.6396484375, -1.553466796875, -1.46728515625, -1.381103515625, -1.294921875, -1.208740234375, -1.12255859375, -1.036376953125, -0.9501953125, -0.864013671875, -0.77783203125, -0.691650390625, -0.60546875, -0.519287109375, -0.43310546875, -0.346923828125, -0.2607421875, -0.174560546875, -0.08837890625, -0.002197265625, 0.083984375, 0.170166015625, 0.25634765625, 0.342529296875, 0.4287109375, 0.514892578125, 0.60107421875, 0.687255859375, 0.7734375, 0.859619140625, 0.94580078125, 1.031982421875, 1.1181640625, 1.204345703125, 1.29052734375, 1.376708984375, 1.462890625, 1.549072265625, 1.63525390625, 1.721435546875, 1.8076171875, 1.893798828125, 1.97998046875, 2.066162109375, 2.15234375, 2.238525390625, 2.32470703125, 2.410888671875, 2.4970703125, 2.583251953125, 2.66943359375, 2.755615234375, 2.841796875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 14.0, 14.0, 23.0, 38.0, 55.0, 88.0, 123.0, 175.0, 208.0, 344.0, 485.0, 605.0, 967.0, 1285.0, 1957.0, 2737.0, 3855.0, 5402.0, 8110.0, 11887.0, 17847.0, 26842.0, 41386.0, 65001.0, 111009.0, 1292457.0, 216208.0, 105453.0, 62251.0, 39749.0, 25969.0, 17151.0, 11516.0, 7762.0, 5559.0, 3762.0, 2567.0, 1854.0, 1315.0, 951.0, 701.0, 446.0, 329.0, 221.0, 161.0, 103.0, 68.0, 40.0, 28.0, 20.0, 13.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.0819091796875, -0.07942390441894531, -0.07693862915039062, -0.07445335388183594, -0.07196807861328125, -0.06948280334472656, -0.06699752807617188, -0.06451225280761719, -0.0620269775390625, -0.05954170227050781, -0.057056427001953125, -0.05457115173339844, -0.05208587646484375, -0.04960060119628906, -0.047115325927734375, -0.04463005065917969, -0.042144775390625, -0.03965950012207031, -0.037174224853515625, -0.03468894958496094, -0.03220367431640625, -0.029718399047851562, -0.027233123779296875, -0.024747848510742188, -0.0222625732421875, -0.019777297973632812, -0.017292022705078125, -0.014806747436523438, -0.01232147216796875, -0.009836196899414062, -0.007350921630859375, -0.0048656463623046875, -0.00238037109375, 0.0001049041748046875, 0.002590179443359375, 0.0050754547119140625, 0.00756072998046875, 0.010046005249023438, 0.012531280517578125, 0.015016555786132812, 0.0175018310546875, 0.019987106323242188, 0.022472381591796875, 0.024957656860351562, 0.02744293212890625, 0.029928207397460938, 0.032413482666015625, 0.03489875793457031, 0.037384033203125, 0.03986930847167969, 0.042354583740234375, 0.04483985900878906, 0.04732513427734375, 0.04981040954589844, 0.052295684814453125, 0.05478096008300781, 0.0572662353515625, 0.05975151062011719, 0.062236785888671875, 0.06472206115722656, 0.06720733642578125, 0.06969261169433594, 0.07217788696289062, 0.07466316223144531, 0.0771484375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 13.0, 11.0, 16.0, 6.0, 12.0, 31.0, 20.0, 21.0, 59.0, 46.0, 167.0, 198.0, 85.0, 90.0, 41.0, 27.0, 47.0, 17.0, 18.0, 15.0, 12.0, 18.0, 7.0, 4.0, 6.0, 2.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5273690223693848e-06, -1.4454126358032227e-06, -1.3634562492370605e-06, -1.2814998626708984e-06, -1.1995434761047363e-06, -1.1175870895385742e-06, -1.0356307029724121e-06, -9.5367431640625e-07, -8.717179298400879e-07, -7.897615432739258e-07, -7.078051567077637e-07, -6.258487701416016e-07, -5.438923835754395e-07, -4.6193599700927734e-07, -3.7997961044311523e-07, -2.980232238769531e-07, -2.1606683731079102e-07, -1.341104507446289e-07, -5.21540641784668e-08, 2.9802322387695312e-08, 1.1175870895385742e-07, 1.9371509552001953e-07, 2.7567148208618164e-07, 3.5762786865234375e-07, 4.3958425521850586e-07, 5.21540641784668e-07, 6.034970283508301e-07, 6.854534149169922e-07, 7.674098014831543e-07, 8.493661880493164e-07, 9.313225746154785e-07, 1.0132789611816406e-06, 1.0952353477478027e-06, 1.1771917343139648e-06, 1.259148120880127e-06, 1.341104507446289e-06, 1.4230608940124512e-06, 1.5050172805786133e-06, 1.5869736671447754e-06, 1.6689300537109375e-06, 1.7508864402770996e-06, 1.8328428268432617e-06, 1.914799213409424e-06, 1.996755599975586e-06, 2.078711986541748e-06, 2.16066837310791e-06, 2.2426247596740723e-06, 2.3245811462402344e-06, 2.4065375328063965e-06, 2.4884939193725586e-06, 2.5704503059387207e-06, 2.652406692504883e-06, 2.734363079071045e-06, 2.816319465637207e-06, 2.898275852203369e-06, 2.9802322387695312e-06, 3.0621886253356934e-06, 3.1441450119018555e-06, 3.2261013984680176e-06, 3.3080577850341797e-06, 3.390014171600342e-06, 3.471970558166504e-06, 3.553926944732666e-06, 3.635883331298828e-06]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 12.0, 7.0, 23.0, 22.0, 25.0, 43.0, 42.0, 94.0, 124.0, 236.0, 658.0, 17711.0, 1021885.0, 6612.0, 523.0, 186.0, 92.0, 71.0, 57.0, 32.0, 25.0, 19.0, 11.0, 7.0, 8.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.081031799316406e-05, -6.914045661687851e-05, -6.747059524059296e-05, -6.58007338643074e-05, -6.413087248802185e-05, -6.24610111117363e-05, -6.0791149735450745e-05, -5.912128835916519e-05, -5.745142698287964e-05, -5.5781565606594086e-05, -5.411170423030853e-05, -5.244184285402298e-05, -5.077198147773743e-05, -4.9102120101451874e-05, -4.743225872516632e-05, -4.576239734888077e-05, -4.4092535972595215e-05, -4.242267459630966e-05, -4.075281322002411e-05, -3.9082951843738556e-05, -3.7413090467453e-05, -3.574322909116745e-05, -3.40733677148819e-05, -3.2403506338596344e-05, -3.073364496231079e-05, -2.9063783586025238e-05, -2.7393922209739685e-05, -2.5724060833454132e-05, -2.405419945716858e-05, -2.2384338080883026e-05, -2.0714476704597473e-05, -1.904461532831192e-05, -1.7374753952026367e-05, -1.5704892575740814e-05, -1.4035031199455261e-05, -1.2365169823169708e-05, -1.0695308446884155e-05, -9.025447070598602e-06, -7.355585694313049e-06, -5.685724318027496e-06, -4.015862941741943e-06, -2.3460015654563904e-06, -6.761401891708374e-07, 9.937211871147156e-07, 2.6635825634002686e-06, 4.3334439396858215e-06, 6.0033053159713745e-06, 7.673166692256927e-06, 9.34302806854248e-06, 1.1012889444828033e-05, 1.2682750821113586e-05, 1.435261219739914e-05, 1.6022473573684692e-05, 1.7692334949970245e-05, 1.93621963262558e-05, 2.103205770254135e-05, 2.2701919078826904e-05, 2.4371780455112457e-05, 2.604164183139801e-05, 2.7711503207683563e-05, 2.9381364583969116e-05, 3.105122596025467e-05, 3.272108733654022e-05, 3.4390948712825775e-05, 3.606081008911133e-05]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 20.0, 62.0, 135.0, 318.0, 291.0, 124.0, 36.0, 14.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.361519015423255e-06, -5.249654350336641e-06, -5.137789230502676e-06, -5.025924565416062e-06, -4.914059445582097e-06, -4.8021947804954834e-06, -4.6903296606615186e-06, -4.578464995574905e-06, -4.466600330488291e-06, -4.354735665401677e-06, -4.242870545567712e-06, -4.131005880481098e-06, -4.019140760647133e-06, -3.907276095560519e-06, -3.7954112031002296e-06, -3.68354631063994e-06, -3.571681418179651e-06, -3.4598165257193614e-06, -3.347951633259072e-06, -3.2360867407987826e-06, -3.1242220757121686e-06, -3.012357183251879e-06, -2.9004922907915898e-06, -2.7886273983313004e-06, -2.676762505871011e-06, -2.5648976134107215e-06, -2.453032720950432e-06, -2.341168055863818e-06, -2.2293031634035287e-06, -2.1174382709432393e-06, -2.00557337848295e-06, -1.8937084860226605e-06, -1.7818437072492088e-06, -1.6699788147889194e-06, -1.5581140360154677e-06, -1.4462491435551783e-06, -1.334384251094889e-06, -1.2225194723214372e-06, -1.1106545798611478e-06, -9.98789801087696e-07, -8.869249086274067e-07, -7.750600730105361e-07, -6.631952373936656e-07, -5.513303449333762e-07, -4.3946550931650563e-07, -3.276006736996351e-07, -2.1573578123934567e-07, -1.0387094562247512e-07, 7.993889994395431e-09, 1.198587398221207e-07, 2.3172358964984596e-07, 3.4358845368842594e-07, 4.554532893052965e-07, 5.67318124922167e-07, 6.791830173824565e-07, 7.91047852999327e-07, 9.029126886161976e-07, 1.014777581076487e-06, 1.1266423598499387e-06, 1.238507252310228e-06, 1.3503720310836798e-06, 1.4622369235439692e-06, 1.5741018160042586e-06, 1.685966708464548e-06, 1.7978314872379997e-06]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 13.0, 0.0, 11.0, 0.0, 14.0, 0.0, 0.0, 22.0, 0.0, 36.0, 0.0, 53.0, 0.0, 71.0, 0.0, 94.0, 0.0, 0.0, 124.0, 0.0, 104.0, 0.0, 133.0, 0.0, 83.0, 0.0, 84.0, 0.0, 0.0, 61.0, 0.0, 43.0, 0.0, 25.0, 0.0, 16.0, 0.0, 10.0, 0.0, 0.0, 10.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.5367431640625e-07, -9.266659617424011e-07, -8.996576070785522e-07, -8.726492524147034e-07, -8.456408977508545e-07, -8.186325430870056e-07, -7.916241884231567e-07, -7.646158337593079e-07, -7.37607479095459e-07, -7.105991244316101e-07, -6.835907697677612e-07, -6.565824151039124e-07, -6.295740604400635e-07, -6.025657057762146e-07, -5.755573511123657e-07, -5.485489964485168e-07, -5.21540641784668e-07, -4.945322871208191e-07, -4.675239324569702e-07, -4.4051557779312134e-07, -4.1350722312927246e-07, -3.864988684654236e-07, -3.594905138015747e-07, -3.3248215913772583e-07, -3.0547380447387695e-07, -2.784654498100281e-07, -2.514570951461792e-07, -2.2444874048233032e-07, -1.9744038581848145e-07, -1.7043203115463257e-07, -1.434236764907837e-07, -1.1641532182693481e-07, -8.940696716308594e-08, -6.239861249923706e-08, -3.5390257835388184e-08, -8.381903171539307e-09, 1.862645149230957e-08, 4.563480615615845e-08, 7.264316082000732e-08, 9.96515154838562e-08, 1.2665987014770508e-07, 1.5366822481155396e-07, 1.8067657947540283e-07, 2.076849341392517e-07, 2.3469328880310059e-07, 2.6170164346694946e-07, 2.8870999813079834e-07, 3.157183527946472e-07, 3.427267074584961e-07, 3.6973506212234497e-07, 3.9674341678619385e-07, 4.237517714500427e-07, 4.507601261138916e-07, 4.777684807777405e-07, 5.047768354415894e-07, 5.317851901054382e-07, 5.587935447692871e-07, 5.85801899433136e-07, 6.128102540969849e-07, 6.398186087608337e-07, 6.668269634246826e-07, 6.938353180885315e-07, 7.208436727523804e-07, 7.478520274162292e-07, 7.748603820800781e-07]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 8.0, 5.0, 9.0, 9.0, 8.0, 14.0, 12.0, 17.0, 10.0, 17.0, 23.0, 27.0, 32.0, 25.0, 34.0, 43.0, 37.0, 56.0, 39.0, 37.0, 43.0, 44.0, 40.0, 56.0, 26.0, 23.0, 18.0, 32.0, 28.0, 29.0, 31.0, 23.0, 22.0, 22.0, 18.0, 12.0, 16.0, 11.0, 7.0, 6.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.654296875, -3.528656005859375, -3.40301513671875, -3.277374267578125, -3.1517333984375, -3.026092529296875, -2.90045166015625, -2.774810791015625, -2.649169921875, -2.523529052734375, -2.39788818359375, -2.272247314453125, -2.1466064453125, -2.020965576171875, -1.89532470703125, -1.769683837890625, -1.64404296875, -1.518402099609375, -1.39276123046875, -1.267120361328125, -1.1414794921875, -1.015838623046875, -0.89019775390625, -0.764556884765625, -0.638916015625, -0.513275146484375, -0.38763427734375, -0.261993408203125, -0.1363525390625, -0.010711669921875, 0.11492919921875, 0.240570068359375, 0.3662109375, 0.491851806640625, 0.61749267578125, 0.743133544921875, 0.8687744140625, 0.994415283203125, 1.12005615234375, 1.245697021484375, 1.371337890625, 1.496978759765625, 1.62261962890625, 1.748260498046875, 1.8739013671875, 1.999542236328125, 2.12518310546875, 2.250823974609375, 2.37646484375, 2.502105712890625, 2.62774658203125, 2.753387451171875, 2.8790283203125, 3.004669189453125, 3.13031005859375, 3.255950927734375, 3.381591796875, 3.507232666015625, 3.63287353515625, 3.758514404296875, 3.8841552734375, 4.009796142578125, 4.13543701171875, 4.261077880859375, 4.38671875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 1.0, 6.0, 10.0, 13.0, 10.0, 18.0, 34.0, 44.0, 57.0, 91.0, 103.0, 146.0, 217.0, 337.0, 480.0, 715.0, 1183.0, 2228.0, 4173.0, 8952.0, 21336.0, 51591.0, 126904.0, 340414.0, 298556.0, 109878.0, 45011.0, 18889.0, 8164.0, 3688.0, 1979.0, 1124.0, 717.0, 436.0, 317.0, 213.0, 141.0, 107.0, 75.0, 52.0, 44.0, 34.0, 19.0, 13.0, 8.0, 6.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.5078125, -7.27264404296875, -7.0374755859375, -6.80230712890625, -6.567138671875, -6.33197021484375, -6.0968017578125, -5.86163330078125, -5.62646484375, -5.39129638671875, -5.1561279296875, -4.92095947265625, -4.685791015625, -4.45062255859375, -4.2154541015625, -3.98028564453125, -3.7451171875, -3.50994873046875, -3.2747802734375, -3.03961181640625, -2.804443359375, -2.56927490234375, -2.3341064453125, -2.09893798828125, -1.86376953125, -1.62860107421875, -1.3934326171875, -1.15826416015625, -0.923095703125, -0.68792724609375, -0.4527587890625, -0.21759033203125, 0.017578125, 0.25274658203125, 0.4879150390625, 0.72308349609375, 0.958251953125, 1.19342041015625, 1.4285888671875, 1.66375732421875, 1.89892578125, 2.13409423828125, 2.3692626953125, 2.60443115234375, 2.839599609375, 3.07476806640625, 3.3099365234375, 3.54510498046875, 3.7802734375, 4.01544189453125, 4.2506103515625, 4.48577880859375, 4.720947265625, 4.95611572265625, 5.1912841796875, 5.42645263671875, 5.66162109375, 5.89678955078125, 6.1319580078125, 6.36712646484375, 6.602294921875, 6.83746337890625, 7.0726318359375, 7.30780029296875, 7.54296875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 3.0, 9.0, 13.0, 7.0, 7.0, 15.0, 12.0, 16.0, 17.0, 29.0, 22.0, 24.0, 36.0, 40.0, 54.0, 69.0, 65.0, 128.0, 195.0, 752.0, 773.0, 162.0, 113.0, 89.0, 68.0, 48.0, 45.0, 27.0, 27.0, 27.0, 31.0, 12.0, 23.0, 13.0, 12.0, 10.0, 13.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.2109375, -8.923095703125, -8.63525390625, -8.347412109375, -8.0595703125, -7.771728515625, -7.48388671875, -7.196044921875, -6.908203125, -6.620361328125, -6.33251953125, -6.044677734375, -5.7568359375, -5.468994140625, -5.18115234375, -4.893310546875, -4.60546875, -4.317626953125, -4.02978515625, -3.741943359375, -3.4541015625, -3.166259765625, -2.87841796875, -2.590576171875, -2.302734375, -2.014892578125, -1.72705078125, -1.439208984375, -1.1513671875, -0.863525390625, -0.57568359375, -0.287841796875, 0.0, 0.287841796875, 0.57568359375, 0.863525390625, 1.1513671875, 1.439208984375, 1.72705078125, 2.014892578125, 2.302734375, 2.590576171875, 2.87841796875, 3.166259765625, 3.4541015625, 3.741943359375, 4.02978515625, 4.317626953125, 4.60546875, 4.893310546875, 5.18115234375, 5.468994140625, 5.7568359375, 6.044677734375, 6.33251953125, 6.620361328125, 6.908203125, 7.196044921875, 7.48388671875, 7.771728515625, 8.0595703125, 8.347412109375, 8.63525390625, 8.923095703125, 9.2109375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 4.0, 11.0, 18.0, 17.0, 18.0, 21.0, 41.0, 47.0, 74.0, 90.0, 167.0, 212.0, 319.0, 533.0, 789.0, 1612.0, 5946.0, 581130.0, 2538619.0, 11270.0, 2093.0, 986.0, 521.0, 378.0, 224.0, 159.0, 100.0, 67.0, 58.0, 34.0, 26.0, 33.0, 15.0, 14.0, 10.0, 9.0, 3.0, 7.0, 8.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-27.515625, -26.684814453125, -25.85400390625, -25.023193359375, -24.1923828125, -23.361572265625, -22.53076171875, -21.699951171875, -20.869140625, -20.038330078125, -19.20751953125, -18.376708984375, -17.5458984375, -16.715087890625, -15.88427734375, -15.053466796875, -14.22265625, -13.391845703125, -12.56103515625, -11.730224609375, -10.8994140625, -10.068603515625, -9.23779296875, -8.406982421875, -7.576171875, -6.745361328125, -5.91455078125, -5.083740234375, -4.2529296875, -3.422119140625, -2.59130859375, -1.760498046875, -0.9296875, -0.098876953125, 0.73193359375, 1.562744140625, 2.3935546875, 3.224365234375, 4.05517578125, 4.885986328125, 5.716796875, 6.547607421875, 7.37841796875, 8.209228515625, 9.0400390625, 9.870849609375, 10.70166015625, 11.532470703125, 12.36328125, 13.194091796875, 14.02490234375, 14.855712890625, 15.6865234375, 16.517333984375, 17.34814453125, 18.178955078125, 19.009765625, 19.840576171875, 20.67138671875, 21.502197265625, 22.3330078125, 23.163818359375, 23.99462890625, 24.825439453125, 25.65625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 13.0, 59.0, 187.0, 320.0, 264.0, 135.0, 28.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-181.91429138183594, -178.2638397216797, -174.6134033203125, -170.96295166015625, -167.3125, -163.66204833984375, -160.01161193847656, -156.3611602783203, -152.71070861816406, -149.0602569580078, -145.40982055664062, -141.75936889648438, -138.10891723632812, -134.45846557617188, -130.8080291748047, -127.15757751464844, -123.50712585449219, -119.85668182373047, -116.20623016357422, -112.5557861328125, -108.90533447265625, -105.25489044189453, -101.60443878173828, -97.95399475097656, -94.30355072021484, -90.65310668945312, -87.00265502929688, -83.35221099853516, -79.7017593383789, -76.05131530761719, -72.40086364746094, -68.75041961669922, -65.09996795654297, -61.449520111083984, -57.799072265625, -54.148624420166016, -50.49817657470703, -46.84773254394531, -43.19728088378906, -39.546836853027344, -35.896385192871094, -32.24593734741211, -28.595489501953125, -24.94504165649414, -21.294593811035156, -17.644147872924805, -13.99370002746582, -10.343252182006836, -6.692806243896484, -3.042358636856079, 0.6080889701843262, 4.258536338806152, 7.908984184265137, 11.559431076049805, 15.209878921508789, 18.860326766967773, 22.510774612426758, 26.161222457885742, 29.811670303344727, 33.46211624145508, 37.11256408691406, 40.76301193237305, 44.41345977783203, 48.063907623291016, 51.71435546875]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 4.0, 10.0, 9.0, 16.0, 15.0, 17.0, 17.0, 19.0, 24.0, 27.0, 28.0, 22.0, 28.0, 30.0, 27.0, 39.0, 31.0, 46.0, 47.0, 39.0, 44.0, 48.0, 46.0, 35.0, 35.0, 37.0, 25.0, 26.0, 26.0, 26.0, 21.0, 15.0, 23.0, 18.0, 12.0, 11.0, 7.0, 9.0, 9.0, 5.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-34.04804229736328, -33.092899322509766, -32.13775634765625, -31.1826114654541, -30.227468490600586, -29.27232551574707, -28.317180633544922, -27.362037658691406, -26.40689468383789, -25.451751708984375, -24.49660873413086, -23.54146385192871, -22.586320877075195, -21.63117790222168, -20.67603302001953, -19.720890045166016, -18.7657470703125, -17.810604095458984, -16.85546112060547, -15.90031623840332, -14.945173263549805, -13.990030288696289, -13.034886360168457, -12.079742431640625, -11.12459945678711, -10.169456481933594, -9.214312553405762, -8.25916862487793, -7.304025650024414, -6.34888219833374, -5.393738746643066, -4.438595294952393, -3.4834518432617188, -2.528308391571045, -1.573164939880371, -0.6180214881896973, 0.33712196350097656, 1.2922654151916504, 2.247408866882324, 3.202552318572998, 4.157695770263672, 5.112839221954346, 6.0679826736450195, 7.023126125335693, 7.978269577026367, 8.933412551879883, 9.888556480407715, 10.843700408935547, 11.798843383789062, 12.753986358642578, 13.70913028717041, 14.664274215698242, 15.619417190551758, 16.574560165405273, 17.529705047607422, 18.484848022460938, 19.439990997314453, 20.39513397216797, 21.350276947021484, 22.305421829223633, 23.26056480407715, 24.215707778930664, 25.170852661132812, 26.125995635986328, 27.081138610839844]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 10.0, 13.0, 7.0, 17.0, 16.0, 18.0, 16.0, 24.0, 25.0, 21.0, 24.0, 26.0, 37.0, 30.0, 38.0, 37.0, 37.0, 43.0, 40.0, 34.0, 36.0, 35.0, 33.0, 36.0, 30.0, 29.0, 32.0, 37.0, 19.0, 28.0, 11.0, 27.0, 15.0, 19.0, 12.0, 14.0, 12.0, 11.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.05859375, -3.9326171875, -3.806640625, -3.6806640625, -3.5546875, -3.4287109375, -3.302734375, -3.1767578125, -3.05078125, -2.9248046875, -2.798828125, -2.6728515625, -2.546875, -2.4208984375, -2.294921875, -2.1689453125, -2.04296875, -1.9169921875, -1.791015625, -1.6650390625, -1.5390625, -1.4130859375, -1.287109375, -1.1611328125, -1.03515625, -0.9091796875, -0.783203125, -0.6572265625, -0.53125, -0.4052734375, -0.279296875, -0.1533203125, -0.02734375, 0.0986328125, 0.224609375, 0.3505859375, 0.4765625, 0.6025390625, 0.728515625, 0.8544921875, 0.98046875, 1.1064453125, 1.232421875, 1.3583984375, 1.484375, 1.6103515625, 1.736328125, 1.8623046875, 1.98828125, 2.1142578125, 2.240234375, 2.3662109375, 2.4921875, 2.6181640625, 2.744140625, 2.8701171875, 2.99609375, 3.1220703125, 3.248046875, 3.3740234375, 3.5, 3.6259765625, 3.751953125, 3.8779296875, 4.00390625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 14.0, 18.0, 13.0, 48.0, 76.0, 105.0, 222.0, 436.0, 771.0, 1688.0, 3947.0, 10297.0, 31213.0, 184602.0, 1972967.0, 1777305.0, 164526.0, 29111.0, 9685.0, 3852.0, 1655.0, 806.0, 389.0, 227.0, 125.0, 86.0, 34.0, 24.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.5, -11.140380859375, -10.78076171875, -10.421142578125, -10.0615234375, -9.701904296875, -9.34228515625, -8.982666015625, -8.623046875, -8.263427734375, -7.90380859375, -7.544189453125, -7.1845703125, -6.824951171875, -6.46533203125, -6.105712890625, -5.74609375, -5.386474609375, -5.02685546875, -4.667236328125, -4.3076171875, -3.947998046875, -3.58837890625, -3.228759765625, -2.869140625, -2.509521484375, -2.14990234375, -1.790283203125, -1.4306640625, -1.071044921875, -0.71142578125, -0.351806640625, 0.0078125, 0.367431640625, 0.72705078125, 1.086669921875, 1.4462890625, 1.805908203125, 2.16552734375, 2.525146484375, 2.884765625, 3.244384765625, 3.60400390625, 3.963623046875, 4.3232421875, 4.682861328125, 5.04248046875, 5.402099609375, 5.76171875, 6.121337890625, 6.48095703125, 6.840576171875, 7.2001953125, 7.559814453125, 7.91943359375, 8.279052734375, 8.638671875, 8.998291015625, 9.35791015625, 9.717529296875, 10.0771484375, 10.436767578125, 10.79638671875, 11.156005859375, 11.515625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 2.0, 4.0, 4.0, 9.0, 11.0, 9.0, 11.0, 28.0, 30.0, 29.0, 40.0, 62.0, 84.0, 95.0, 147.0, 144.0, 203.0, 250.0, 318.0, 381.0, 416.0, 402.0, 294.0, 249.0, 191.0, 149.0, 112.0, 89.0, 71.0, 47.0, 43.0, 35.0, 26.0, 19.0, 12.0, 11.0, 7.0, 6.0, 12.0, 4.0, 9.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.6484375, -5.48931884765625, -5.3302001953125, -5.17108154296875, -5.011962890625, -4.85284423828125, -4.6937255859375, -4.53460693359375, -4.37548828125, -4.21636962890625, -4.0572509765625, -3.89813232421875, -3.739013671875, -3.57989501953125, -3.4207763671875, -3.26165771484375, -3.1025390625, -2.94342041015625, -2.7843017578125, -2.62518310546875, -2.466064453125, -2.30694580078125, -2.1478271484375, -1.98870849609375, -1.82958984375, -1.67047119140625, -1.5113525390625, -1.35223388671875, -1.193115234375, -1.03399658203125, -0.8748779296875, -0.71575927734375, -0.556640625, -0.39752197265625, -0.2384033203125, -0.07928466796875, 0.079833984375, 0.23895263671875, 0.3980712890625, 0.55718994140625, 0.71630859375, 0.87542724609375, 1.0345458984375, 1.19366455078125, 1.352783203125, 1.51190185546875, 1.6710205078125, 1.83013916015625, 1.9892578125, 2.14837646484375, 2.3074951171875, 2.46661376953125, 2.625732421875, 2.78485107421875, 2.9439697265625, 3.10308837890625, 3.26220703125, 3.42132568359375, 3.5804443359375, 3.73956298828125, 3.898681640625, 4.05780029296875, 4.2169189453125, 4.37603759765625, 4.53515625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 7.0, 7.0, 11.0, 13.0, 6.0, 13.0, 16.0, 19.0, 44.0, 37.0, 50.0, 95.0, 118.0, 178.0, 293.0, 480.0, 1041.0, 2259.0, 7126.0, 30919.0, 234991.0, 2373074.0, 1381693.0, 132507.0, 20280.0, 5121.0, 1824.0, 777.0, 464.0, 251.0, 184.0, 98.0, 83.0, 46.0, 33.0, 28.0, 28.0, 17.0, 15.0, 7.0, 9.0, 7.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.6640625, -9.36083984375, -9.0576171875, -8.75439453125, -8.451171875, -8.14794921875, -7.8447265625, -7.54150390625, -7.23828125, -6.93505859375, -6.6318359375, -6.32861328125, -6.025390625, -5.72216796875, -5.4189453125, -5.11572265625, -4.8125, -4.50927734375, -4.2060546875, -3.90283203125, -3.599609375, -3.29638671875, -2.9931640625, -2.68994140625, -2.38671875, -2.08349609375, -1.7802734375, -1.47705078125, -1.173828125, -0.87060546875, -0.5673828125, -0.26416015625, 0.0390625, 0.34228515625, 0.6455078125, 0.94873046875, 1.251953125, 1.55517578125, 1.8583984375, 2.16162109375, 2.46484375, 2.76806640625, 3.0712890625, 3.37451171875, 3.677734375, 3.98095703125, 4.2841796875, 4.58740234375, 4.890625, 5.19384765625, 5.4970703125, 5.80029296875, 6.103515625, 6.40673828125, 6.7099609375, 7.01318359375, 7.31640625, 7.61962890625, 7.9228515625, 8.22607421875, 8.529296875, 8.83251953125, 9.1357421875, 9.43896484375, 9.7421875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 27.0, 47.0, 105.0, 151.0, 167.0, 179.0, 146.0, 103.0, 46.0, 17.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-65.17100524902344, -63.507144927978516, -61.843284606933594, -60.17942810058594, -58.515567779541016, -56.851707458496094, -55.18784713745117, -53.52398681640625, -51.860130310058594, -50.19626998901367, -48.53240966796875, -46.868553161621094, -45.20469284057617, -43.54083251953125, -41.87697219848633, -40.213111877441406, -38.549251556396484, -36.88539123535156, -35.22153091430664, -33.55767059326172, -31.893814086914062, -30.22995376586914, -28.56609344482422, -26.902233123779297, -25.238374710083008, -23.574514389038086, -21.910655975341797, -20.246795654296875, -18.582935333251953, -16.919076919555664, -15.255216598510742, -13.591357231140137, -11.927501678466797, -10.263642311096191, -8.599782943725586, -6.935922622680664, -5.272063255310059, -3.608203887939453, -1.9443435668945312, -0.2804841995239258, 1.3833751678466797, 3.0472347736358643, 4.711094379425049, 6.3749542236328125, 8.038813591003418, 9.702672958374023, 11.366533279418945, 13.03039264678955, 14.694252014160156, 16.358112335205078, 18.021970748901367, 19.68583106994629, 21.349689483642578, 23.0135498046875, 24.677410125732422, 26.341270446777344, 28.005128860473633, 29.668989181518555, 31.332847595214844, 32.996707916259766, 34.66056823730469, 36.324424743652344, 37.98828887939453, 39.65214538574219, 41.31600570678711]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 10.0, 9.0, 13.0, 7.0, 11.0, 11.0, 17.0, 13.0, 22.0, 19.0, 21.0, 28.0, 32.0, 43.0, 31.0, 41.0, 26.0, 49.0, 31.0, 40.0, 42.0, 35.0, 39.0, 35.0, 34.0, 37.0, 31.0, 31.0, 35.0, 22.0, 25.0, 25.0, 26.0, 14.0, 12.0, 17.0, 13.0, 13.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.790016174316406, -23.031953811645508, -22.27389144897461, -21.515830993652344, -20.757768630981445, -19.999706268310547, -19.24164390563965, -18.48358154296875, -17.725521087646484, -16.967458724975586, -16.209396362304688, -15.451334953308105, -14.693273544311523, -13.935211181640625, -13.177148818969727, -12.419086456298828, -11.66102409362793, -10.902961730957031, -10.14490032196045, -9.38683795928955, -8.628776550292969, -7.87071418762207, -7.112651824951172, -6.354589939117432, -5.596528053283691, -4.838466167449951, -4.080404281616211, -3.3223419189453125, -2.5642800331115723, -1.806218147277832, -1.0481557846069336, -0.29009389877319336, 0.4679679870605469, 1.2260299921035767, 1.9840919971466064, 2.742154121398926, 3.500216007232666, 4.258277893066406, 5.016340255737305, 5.774402141571045, 6.532464027404785, 7.290525913238525, 8.048587799072266, 8.806650161743164, 9.564712524414062, 10.322773933410645, 11.080836296081543, 11.838897705078125, 12.596960067749023, 13.355022430419922, 14.113083839416504, 14.871146202087402, 15.629207611083984, 16.387269973754883, 17.14533233642578, 17.90339469909668, 18.661457061767578, 19.419519424438477, 20.177581787109375, 20.93564224243164, 21.69370460510254, 22.451766967773438, 23.209829330444336, 23.967891693115234, 24.7259521484375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 1.0, 8.0, 3.0, 7.0, 9.0, 12.0, 8.0, 14.0, 17.0, 12.0, 26.0, 23.0, 26.0, 36.0, 30.0, 26.0, 35.0, 47.0, 40.0, 42.0, 44.0, 46.0, 40.0, 39.0, 41.0, 30.0, 29.0, 25.0, 35.0, 32.0, 29.0, 27.0, 24.0, 21.0, 24.0, 20.0, 12.0, 13.0, 13.0, 7.0, 8.0, 4.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.818359375, -3.690948486328125, -3.56353759765625, -3.436126708984375, -3.3087158203125, -3.181304931640625, -3.05389404296875, -2.926483154296875, -2.799072265625, -2.671661376953125, -2.54425048828125, -2.416839599609375, -2.2894287109375, -2.162017822265625, -2.03460693359375, -1.907196044921875, -1.77978515625, -1.652374267578125, -1.52496337890625, -1.397552490234375, -1.2701416015625, -1.142730712890625, -1.01531982421875, -0.887908935546875, -0.760498046875, -0.633087158203125, -0.50567626953125, -0.378265380859375, -0.2508544921875, -0.123443603515625, 0.00396728515625, 0.131378173828125, 0.2587890625, 0.386199951171875, 0.51361083984375, 0.641021728515625, 0.7684326171875, 0.895843505859375, 1.02325439453125, 1.150665283203125, 1.278076171875, 1.405487060546875, 1.53289794921875, 1.660308837890625, 1.7877197265625, 1.915130615234375, 2.04254150390625, 2.169952392578125, 2.29736328125, 2.424774169921875, 2.55218505859375, 2.679595947265625, 2.8070068359375, 2.934417724609375, 3.06182861328125, 3.189239501953125, 3.316650390625, 3.444061279296875, 3.57147216796875, 3.698883056640625, 3.8262939453125, 3.953704833984375, 4.08111572265625, 4.208526611328125, 4.3359375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 6.0, 8.0, 21.0, 14.0, 42.0, 64.0, 92.0, 132.0, 160.0, 259.0, 365.0, 556.0, 829.0, 1204.0, 1745.0, 2749.0, 4052.0, 6130.0, 9340.0, 14369.0, 22365.0, 35685.0, 57783.0, 102566.0, 261757.0, 263501.0, 104205.0, 58603.0, 35556.0, 22427.0, 14221.0, 9437.0, 6059.0, 4021.0, 2684.0, 1787.0, 1170.0, 875.0, 555.0, 359.0, 233.0, 186.0, 136.0, 91.0, 49.0, 42.0, 21.0, 18.0, 10.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.2052001953125, -0.19916534423828125, -0.1931304931640625, -0.18709564208984375, -0.181060791015625, -0.17502593994140625, -0.1689910888671875, -0.16295623779296875, -0.15692138671875, -0.15088653564453125, -0.1448516845703125, -0.13881683349609375, -0.132781982421875, -0.12674713134765625, -0.1207122802734375, -0.11467742919921875, -0.108642578125, -0.10260772705078125, -0.0965728759765625, -0.09053802490234375, -0.084503173828125, -0.07846832275390625, -0.0724334716796875, -0.06639862060546875, -0.06036376953125, -0.05432891845703125, -0.0482940673828125, -0.04225921630859375, -0.036224365234375, -0.03018951416015625, -0.0241546630859375, -0.01811981201171875, -0.0120849609375, -0.00605010986328125, -1.52587890625e-05, 0.00601959228515625, 0.012054443359375, 0.01808929443359375, 0.0241241455078125, 0.03015899658203125, 0.03619384765625, 0.04222869873046875, 0.0482635498046875, 0.05429840087890625, 0.060333251953125, 0.06636810302734375, 0.0724029541015625, 0.07843780517578125, 0.08447265625, 0.09050750732421875, 0.0965423583984375, 0.10257720947265625, 0.108612060546875, 0.11464691162109375, 0.1206817626953125, 0.12671661376953125, 0.13275146484375, 0.13878631591796875, 0.1448211669921875, 0.15085601806640625, 0.156890869140625, 0.16292572021484375, 0.1689605712890625, 0.17499542236328125, 0.1810302734375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 3.0, 7.0, 14.0, 17.0, 12.0, 17.0, 14.0, 18.0, 24.0, 29.0, 31.0, 20.0, 31.0, 29.0, 33.0, 38.0, 46.0, 32.0, 37.0, 46.0, 1058.0, 31.0, 35.0, 31.0, 36.0, 49.0, 28.0, 32.0, 31.0, 28.0, 18.0, 19.0, 26.0, 14.0, 10.0, 5.0, 9.0, 14.0, 9.0, 7.0, 9.0, 4.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.75390625, -2.66510009765625, -2.5762939453125, -2.48748779296875, -2.398681640625, -2.30987548828125, -2.2210693359375, -2.13226318359375, -2.04345703125, -1.95465087890625, -1.8658447265625, -1.77703857421875, -1.688232421875, -1.59942626953125, -1.5106201171875, -1.42181396484375, -1.3330078125, -1.24420166015625, -1.1553955078125, -1.06658935546875, -0.977783203125, -0.88897705078125, -0.8001708984375, -0.71136474609375, -0.62255859375, -0.53375244140625, -0.4449462890625, -0.35614013671875, -0.267333984375, -0.17852783203125, -0.0897216796875, -0.00091552734375, 0.087890625, 0.17669677734375, 0.2655029296875, 0.35430908203125, 0.443115234375, 0.53192138671875, 0.6207275390625, 0.70953369140625, 0.79833984375, 0.88714599609375, 0.9759521484375, 1.06475830078125, 1.153564453125, 1.24237060546875, 1.3311767578125, 1.41998291015625, 1.5087890625, 1.59759521484375, 1.6864013671875, 1.77520751953125, 1.864013671875, 1.95281982421875, 2.0416259765625, 2.13043212890625, 2.21923828125, 2.30804443359375, 2.3968505859375, 2.48565673828125, 2.574462890625, 2.66326904296875, 2.7520751953125, 2.84088134765625, 2.9296875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 10.0, 14.0, 17.0, 27.0, 43.0, 59.0, 81.0, 112.0, 168.0, 237.0, 374.0, 510.0, 730.0, 1075.0, 1548.0, 2103.0, 3088.0, 4361.0, 6041.0, 8705.0, 12807.0, 18115.0, 27530.0, 41765.0, 66909.0, 114096.0, 1304220.0, 199180.0, 102107.0, 60878.0, 38705.0, 25046.0, 17416.0, 11666.0, 8295.0, 5777.0, 3972.0, 2796.0, 1933.0, 1379.0, 947.0, 715.0, 479.0, 337.0, 235.0, 158.0, 122.0, 73.0, 51.0, 51.0, 25.0, 20.0, 12.0, 7.0, 5.0, 2.0, 3.0, 3.0], "bins": [-0.08447265625, -0.08190536499023438, -0.07933807373046875, -0.07677078247070312, -0.0742034912109375, -0.07163619995117188, -0.06906890869140625, -0.06650161743164062, -0.063934326171875, -0.061367034912109375, -0.05879974365234375, -0.056232452392578125, -0.0536651611328125, -0.051097869873046875, -0.04853057861328125, -0.045963287353515625, -0.04339599609375, -0.040828704833984375, -0.03826141357421875, -0.035694122314453125, -0.0331268310546875, -0.030559539794921875, -0.02799224853515625, -0.025424957275390625, -0.022857666015625, -0.020290374755859375, -0.01772308349609375, -0.015155792236328125, -0.0125885009765625, -0.010021209716796875, -0.00745391845703125, -0.004886627197265625, -0.0023193359375, 0.000247955322265625, 0.00281524658203125, 0.005382537841796875, 0.0079498291015625, 0.010517120361328125, 0.01308441162109375, 0.015651702880859375, 0.018218994140625, 0.020786285400390625, 0.02335357666015625, 0.025920867919921875, 0.0284881591796875, 0.031055450439453125, 0.03362274169921875, 0.036190032958984375, 0.03875732421875, 0.041324615478515625, 0.04389190673828125, 0.046459197998046875, 0.0490264892578125, 0.051593780517578125, 0.05416107177734375, 0.056728363037109375, 0.059295654296875, 0.061862945556640625, 0.06443023681640625, 0.06699752807617188, 0.0695648193359375, 0.07213211059570312, 0.07469940185546875, 0.07726669311523438, 0.079833984375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 6.0, 9.0, 11.0, 10.0, 12.0, 13.0, 16.0, 49.0, 29.0, 24.0, 31.0, 39.0, 50.0, 67.0, 83.0, 118.0, 84.0, 59.0, 48.0, 34.0, 37.0, 26.0, 32.0, 17.0, 19.0, 19.0, 12.0, 11.0, 16.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8477439880371094e-06, -1.7853453755378723e-06, -1.7229467630386353e-06, -1.6605481505393982e-06, -1.5981495380401611e-06, -1.535750925540924e-06, -1.473352313041687e-06, -1.41095370054245e-06, -1.3485550880432129e-06, -1.2861564755439758e-06, -1.2237578630447388e-06, -1.1613592505455017e-06, -1.0989606380462646e-06, -1.0365620255470276e-06, -9.741634130477905e-07, -9.117648005485535e-07, -8.493661880493164e-07, -7.869675755500793e-07, -7.245689630508423e-07, -6.621703505516052e-07, -5.997717380523682e-07, -5.373731255531311e-07, -4.7497451305389404e-07, -4.12575900554657e-07, -3.501772880554199e-07, -2.8777867555618286e-07, -2.253800630569458e-07, -1.6298145055770874e-07, -1.0058283805847168e-07, -3.818422555923462e-08, 2.421438694000244e-08, 8.66129994392395e-08, 1.4901161193847656e-07, 2.1141022443771362e-07, 2.738088369369507e-07, 3.3620744943618774e-07, 3.986060619354248e-07, 4.6100467443466187e-07, 5.234032869338989e-07, 5.85801899433136e-07, 6.48200511932373e-07, 7.105991244316101e-07, 7.729977369308472e-07, 8.353963494300842e-07, 8.977949619293213e-07, 9.601935744285583e-07, 1.0225921869277954e-06, 1.0849907994270325e-06, 1.1473894119262695e-06, 1.2097880244255066e-06, 1.2721866369247437e-06, 1.3345852494239807e-06, 1.3969838619232178e-06, 1.4593824744224548e-06, 1.521781086921692e-06, 1.584179699420929e-06, 1.646578311920166e-06, 1.708976924419403e-06, 1.7713755369186401e-06, 1.8337741494178772e-06, 1.8961727619171143e-06, 1.9585713744163513e-06, 2.0209699869155884e-06, 2.0833685994148254e-06, 2.1457672119140625e-06]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 9.0, 8.0, 7.0, 17.0, 26.0, 22.0, 34.0, 37.0, 60.0, 61.0, 108.0, 151.0, 187.0, 351.0, 936.0, 4102.0, 36720.0, 650106.0, 327137.0, 23737.0, 3007.0, 684.0, 323.0, 173.0, 123.0, 102.0, 67.0, 53.0, 41.0, 30.0, 22.0, 25.0, 19.0, 16.0, 7.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.212690353393555e-05, -3.117881715297699e-05, -3.0230730772018433e-05, -2.9282644391059875e-05, -2.833455801010132e-05, -2.738647162914276e-05, -2.6438385248184204e-05, -2.5490298867225647e-05, -2.454221248626709e-05, -2.3594126105308533e-05, -2.2646039724349976e-05, -2.169795334339142e-05, -2.074986696243286e-05, -1.9801780581474304e-05, -1.8853694200515747e-05, -1.790560781955719e-05, -1.6957521438598633e-05, -1.6009435057640076e-05, -1.5061348676681519e-05, -1.4113262295722961e-05, -1.3165175914764404e-05, -1.2217089533805847e-05, -1.126900315284729e-05, -1.0320916771888733e-05, -9.372830390930176e-06, -8.424744009971619e-06, -7.4766576290130615e-06, -6.528571248054504e-06, -5.580484867095947e-06, -4.63239848613739e-06, -3.684312105178833e-06, -2.736225724220276e-06, -1.7881393432617188e-06, -8.400529623031616e-07, 1.0803341865539551e-07, 1.0561197996139526e-06, 2.0042061805725098e-06, 2.952292561531067e-06, 3.900378942489624e-06, 4.848465323448181e-06, 5.796551704406738e-06, 6.744638085365295e-06, 7.692724466323853e-06, 8.64081084728241e-06, 9.588897228240967e-06, 1.0536983609199524e-05, 1.1485069990158081e-05, 1.2433156371116638e-05, 1.3381242752075195e-05, 1.4329329133033752e-05, 1.527741551399231e-05, 1.6225501894950867e-05, 1.7173588275909424e-05, 1.812167465686798e-05, 1.9069761037826538e-05, 2.0017847418785095e-05, 2.0965933799743652e-05, 2.191402018070221e-05, 2.2862106561660767e-05, 2.3810192942619324e-05, 2.475827932357788e-05, 2.5706365704536438e-05, 2.6654452085494995e-05, 2.7602538466453552e-05, 2.855062484741211e-05]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 10.0, 24.0, 51.0, 137.0, 275.0, 278.0, 143.0, 52.0, 23.0, 4.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0994086753489682e-06, -1.9088206499873195e-06, -1.7182326246256707e-06, -1.527644599264022e-06, -1.3370565739023732e-06, -1.1464685485407244e-06, -9.558806368659134e-07, -7.652926115042646e-07, -5.747045861426159e-07, -3.841165607809671e-07, -1.935285638410278e-07, -2.9405669010884594e-09, 1.876474584605603e-07, 3.7823548382220906e-07, 5.68823452340439e-07, 7.594114777020877e-07, 9.499995030637365e-07, 1.1405875284253852e-06, 1.331175553787034e-06, 1.5217635791486828e-06, 1.7123516045103315e-06, 1.9029396298719803e-06, 2.093527655233629e-06, 2.2841154532216024e-06, 2.4747037059569266e-06, 2.6652917313185753e-06, 2.855879756680224e-06, 3.046467782041873e-06, 3.2370558074035216e-06, 3.4276438327651704e-06, 3.618231858126819e-06, 3.8088196561147925e-06, 3.999407908850117e-06, 4.18999570683809e-06, 4.380583959573414e-06, 4.5711717575613875e-06, 4.761760010296712e-06, 4.952347808284685e-06, 5.142936061020009e-06, 5.3335238590079825e-06, 5.524112111743307e-06, 5.71469990973128e-06, 5.905288162466604e-06, 6.095875960454578e-06, 6.286464213189902e-06, 6.477052011177875e-06, 6.667640263913199e-06, 6.858228061901173e-06, 7.048815859889146e-06, 7.239403657877119e-06, 7.4299919106124435e-06, 7.620579708600417e-06, 7.811167961335741e-06, 8.001756214071065e-06, 8.192343557311688e-06, 8.382931810047012e-06, 8.573520062782336e-06, 8.76410831551766e-06, 8.954695658758283e-06, 9.145283911493607e-06, 9.335872164228931e-06, 9.526460416964255e-06, 9.717047760204878e-06, 9.907636012940202e-06, 1.0098224265675526e-05]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 8.0, 16.0, 20.0, 0.0, 24.0, 30.0, 35.0, 29.0, 40.0, 54.0, 65.0, 65.0, 62.0, 0.0, 72.0, 65.0, 50.0, 56.0, 48.0, 43.0, 37.0, 33.0, 36.0, 24.0, 0.0, 12.0, 15.0, 14.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6745179891586304e-06, -1.6205012798309326e-06, -1.5664845705032349e-06, -1.5124678611755371e-06, -1.4584511518478394e-06, -1.4044344425201416e-06, -1.3504177331924438e-06, -1.296401023864746e-06, -1.2423843145370483e-06, -1.1883676052093506e-06, -1.1343508958816528e-06, -1.080334186553955e-06, -1.0263174772262573e-06, -9.723007678985596e-07, -9.182840585708618e-07, -8.642673492431641e-07, -8.102506399154663e-07, -7.562339305877686e-07, -7.022172212600708e-07, -6.48200511932373e-07, -5.941838026046753e-07, -5.401670932769775e-07, -4.861503839492798e-07, -4.3213367462158203e-07, -3.781169652938843e-07, -3.241002559661865e-07, -2.7008354663848877e-07, -2.1606683731079102e-07, -1.6205012798309326e-07, -1.0803341865539551e-07, -5.4016709327697754e-08, 0.0, 5.4016709327697754e-08, 1.0803341865539551e-07, 1.6205012798309326e-07, 2.1606683731079102e-07, 2.7008354663848877e-07, 3.241002559661865e-07, 3.781169652938843e-07, 4.3213367462158203e-07, 4.861503839492798e-07, 5.401670932769775e-07, 5.941838026046753e-07, 6.48200511932373e-07, 7.022172212600708e-07, 7.562339305877686e-07, 8.102506399154663e-07, 8.642673492431641e-07, 9.182840585708618e-07, 9.723007678985596e-07, 1.0263174772262573e-06, 1.080334186553955e-06, 1.1343508958816528e-06, 1.1883676052093506e-06, 1.2423843145370483e-06, 1.296401023864746e-06, 1.3504177331924438e-06, 1.4044344425201416e-06, 1.4584511518478394e-06, 1.5124678611755371e-06, 1.5664845705032349e-06, 1.6205012798309326e-06, 1.6745179891586304e-06, 1.7285346984863281e-06]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 1.0, 8.0, 3.0, 7.0, 9.0, 12.0, 8.0, 14.0, 17.0, 12.0, 26.0, 23.0, 26.0, 36.0, 30.0, 26.0, 35.0, 47.0, 40.0, 42.0, 44.0, 46.0, 40.0, 39.0, 41.0, 30.0, 29.0, 25.0, 35.0, 32.0, 29.0, 27.0, 24.0, 21.0, 24.0, 20.0, 12.0, 13.0, 13.0, 7.0, 8.0, 4.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.818359375, -3.690948486328125, -3.56353759765625, -3.436126708984375, -3.3087158203125, -3.181304931640625, -3.05389404296875, -2.926483154296875, -2.799072265625, -2.671661376953125, -2.54425048828125, -2.416839599609375, -2.2894287109375, -2.162017822265625, -2.03460693359375, -1.907196044921875, -1.77978515625, -1.652374267578125, -1.52496337890625, -1.397552490234375, -1.2701416015625, -1.142730712890625, -1.01531982421875, -0.887908935546875, -0.760498046875, -0.633087158203125, -0.50567626953125, -0.378265380859375, -0.2508544921875, -0.123443603515625, 0.00396728515625, 0.131378173828125, 0.2587890625, 0.386199951171875, 0.51361083984375, 0.641021728515625, 0.7684326171875, 0.895843505859375, 1.02325439453125, 1.150665283203125, 1.278076171875, 1.405487060546875, 1.53289794921875, 1.660308837890625, 1.7877197265625, 1.915130615234375, 2.04254150390625, 2.169952392578125, 2.29736328125, 2.424774169921875, 2.55218505859375, 2.679595947265625, 2.8070068359375, 2.934417724609375, 3.06182861328125, 3.189239501953125, 3.316650390625, 3.444061279296875, 3.57147216796875, 3.698883056640625, 3.8262939453125, 3.953704833984375, 4.08111572265625, 4.208526611328125, 4.3359375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 11.0, 22.0, 18.0, 29.0, 41.0, 45.0, 55.0, 74.0, 78.0, 117.0, 135.0, 206.0, 275.0, 378.0, 561.0, 908.0, 1538.0, 2909.0, 5663.0, 11737.0, 25716.0, 59516.0, 141002.0, 270446.0, 272416.0, 142819.0, 60882.0, 26043.0, 11649.0, 5670.0, 2963.0, 1612.0, 903.0, 592.0, 417.0, 247.0, 186.0, 150.0, 139.0, 83.0, 67.0, 65.0, 45.0, 32.0, 24.0, 15.0, 11.0, 12.0, 8.0, 7.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.9140625, -3.78363037109375, -3.6531982421875, -3.52276611328125, -3.392333984375, -3.26190185546875, -3.1314697265625, -3.00103759765625, -2.87060546875, -2.74017333984375, -2.6097412109375, -2.47930908203125, -2.348876953125, -2.21844482421875, -2.0880126953125, -1.95758056640625, -1.8271484375, -1.69671630859375, -1.5662841796875, -1.43585205078125, -1.305419921875, -1.17498779296875, -1.0445556640625, -0.91412353515625, -0.78369140625, -0.65325927734375, -0.5228271484375, -0.39239501953125, -0.261962890625, -0.13153076171875, -0.0010986328125, 0.12933349609375, 0.259765625, 0.39019775390625, 0.5206298828125, 0.65106201171875, 0.781494140625, 0.91192626953125, 1.0423583984375, 1.17279052734375, 1.30322265625, 1.43365478515625, 1.5640869140625, 1.69451904296875, 1.824951171875, 1.95538330078125, 2.0858154296875, 2.21624755859375, 2.3466796875, 2.47711181640625, 2.6075439453125, 2.73797607421875, 2.868408203125, 2.99884033203125, 3.1292724609375, 3.25970458984375, 3.39013671875, 3.52056884765625, 3.6510009765625, 3.78143310546875, 3.911865234375, 4.04229736328125, 4.1727294921875, 4.30316162109375, 4.43359375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 7.0, 11.0, 19.0, 17.0, 21.0, 16.0, 39.0, 37.0, 26.0, 40.0, 60.0, 62.0, 81.0, 184.0, 358.0, 1415.0, 178.0, 95.0, 57.0, 59.0, 42.0, 31.0, 35.0, 28.0, 33.0, 16.0, 20.0, 12.0, 3.0, 9.0, 5.0, 10.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9375, -11.5654296875, -11.193359375, -10.8212890625, -10.44921875, -10.0771484375, -9.705078125, -9.3330078125, -8.9609375, -8.5888671875, -8.216796875, -7.8447265625, -7.47265625, -7.1005859375, -6.728515625, -6.3564453125, -5.984375, -5.6123046875, -5.240234375, -4.8681640625, -4.49609375, -4.1240234375, -3.751953125, -3.3798828125, -3.0078125, -2.6357421875, -2.263671875, -1.8916015625, -1.51953125, -1.1474609375, -0.775390625, -0.4033203125, -0.03125, 0.3408203125, 0.712890625, 1.0849609375, 1.45703125, 1.8291015625, 2.201171875, 2.5732421875, 2.9453125, 3.3173828125, 3.689453125, 4.0615234375, 4.43359375, 4.8056640625, 5.177734375, 5.5498046875, 5.921875, 6.2939453125, 6.666015625, 7.0380859375, 7.41015625, 7.7822265625, 8.154296875, 8.5263671875, 8.8984375, 9.2705078125, 9.642578125, 10.0146484375, 10.38671875, 10.7587890625, 11.130859375, 11.5029296875, 11.875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 5.0, 7.0, 11.0, 13.0, 18.0, 30.0, 22.0, 43.0, 52.0, 47.0, 69.0, 104.0, 140.0, 210.0, 395.0, 719.0, 2516.0, 69428.0, 3012451.0, 55147.0, 2330.0, 748.0, 379.0, 231.0, 136.0, 118.0, 69.0, 55.0, 54.0, 27.0, 28.0, 28.0, 16.0, 14.0, 7.0, 9.0, 3.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.359375, -16.789794921875, -16.22021484375, -15.650634765625, -15.0810546875, -14.511474609375, -13.94189453125, -13.372314453125, -12.802734375, -12.233154296875, -11.66357421875, -11.093994140625, -10.5244140625, -9.954833984375, -9.38525390625, -8.815673828125, -8.24609375, -7.676513671875, -7.10693359375, -6.537353515625, -5.9677734375, -5.398193359375, -4.82861328125, -4.259033203125, -3.689453125, -3.119873046875, -2.55029296875, -1.980712890625, -1.4111328125, -0.841552734375, -0.27197265625, 0.297607421875, 0.8671875, 1.436767578125, 2.00634765625, 2.575927734375, 3.1455078125, 3.715087890625, 4.28466796875, 4.854248046875, 5.423828125, 5.993408203125, 6.56298828125, 7.132568359375, 7.7021484375, 8.271728515625, 8.84130859375, 9.410888671875, 9.98046875, 10.550048828125, 11.11962890625, 11.689208984375, 12.2587890625, 12.828369140625, 13.39794921875, 13.967529296875, 14.537109375, 15.106689453125, 15.67626953125, 16.245849609375, 16.8154296875, 17.385009765625, 17.95458984375, 18.524169921875, 19.09375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 44.0, 282.0, 482.0, 165.0, 31.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.62942886352539, -51.48860168457031, -48.347774505615234, -45.206947326660156, -42.06611633300781, -38.925289154052734, -35.784461975097656, -32.64363098144531, -29.502805709838867, -26.36197853088379, -23.221149444580078, -20.080322265625, -16.939495086669922, -13.798666000366211, -10.657838821411133, -7.517009735107422, -4.376182556152344, -1.2353546619415283, 1.905473232269287, 5.046300888061523, 8.187129020690918, 11.327957153320312, 14.46878433227539, 17.6096134185791, 20.75044059753418, 23.891267776489258, 27.03209686279297, 30.172924041748047, 33.313751220703125, 36.45458221435547, 39.59540557861328, 42.736236572265625, 45.87706756591797, 49.01789474487305, 52.158721923828125, 55.29955291748047, 58.44038009643555, 61.581207275390625, 64.72203063964844, 67.86286163330078, 71.00369262695312, 74.14452362060547, 77.28534698486328, 80.42617797851562, 83.56700134277344, 86.70783233642578, 89.84866333007812, 92.98948669433594, 96.13031005859375, 99.2711410522461, 102.4119644165039, 105.55279541015625, 108.69361877441406, 111.8344497680664, 114.97528076171875, 118.11610412597656, 121.2569351196289, 124.39776611328125, 127.53858947753906, 130.67941284179688, 133.82025146484375, 136.96107482910156, 140.10189819335938, 143.24273681640625, 146.38356018066406]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 8.0, 7.0, 3.0, 5.0, 8.0, 15.0, 19.0, 16.0, 27.0, 32.0, 21.0, 37.0, 48.0, 30.0, 56.0, 45.0, 54.0, 52.0, 51.0, 45.0, 41.0, 40.0, 44.0, 48.0, 33.0, 27.0, 33.0, 29.0, 30.0, 21.0, 17.0, 16.0, 9.0, 8.0, 16.0, 7.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.740962982177734, -39.63297653198242, -38.524993896484375, -37.41700744628906, -36.30902099609375, -35.2010383605957, -34.09305191040039, -32.985069274902344, -31.87708282470703, -30.76909828186035, -29.661113739013672, -28.55312728881836, -27.44514274597168, -26.337158203125, -25.229171752929688, -24.121187210083008, -23.013202667236328, -21.90521812438965, -20.79723358154297, -19.689247131347656, -18.581262588500977, -17.473278045654297, -16.365291595458984, -15.257307052612305, -14.149322509765625, -13.041337966918945, -11.93335247039795, -10.825366973876953, -9.717382431030273, -8.609397888183594, -7.501412391662598, -6.39342737197876, -5.285442352294922, -4.177457332611084, -3.069472312927246, -1.9614872932434082, -0.8535022735595703, 0.2544827461242676, 1.3624677658081055, 2.4704527854919434, 3.5784378051757812, 4.686422824859619, 5.794407844543457, 6.902392864227295, 8.010377883911133, 9.118362426757812, 10.226347923278809, 11.334333419799805, 12.442317962646484, 13.550302505493164, 14.65828800201416, 15.766273498535156, 16.874258041381836, 17.982242584228516, 19.090229034423828, 20.198213577270508, 21.306198120117188, 22.414182662963867, 23.522167205810547, 24.63015365600586, 25.73813819885254, 26.84612274169922, 27.95410919189453, 29.06209373474121, 30.17007827758789]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 4.0, 4.0, 2.0, 7.0, 5.0, 6.0, 6.0, 5.0, 11.0, 10.0, 15.0, 22.0, 16.0, 20.0, 23.0, 25.0, 33.0, 26.0, 30.0, 38.0, 27.0, 27.0, 41.0, 39.0, 54.0, 40.0, 31.0, 36.0, 33.0, 27.0, 35.0, 18.0, 31.0, 28.0, 21.0, 16.0, 25.0, 23.0, 24.0, 23.0, 10.0, 11.0, 13.0, 12.0, 11.0, 8.0, 8.0, 5.0, 8.0, 5.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0], "bins": [-4.33203125, -4.203399658203125, -4.07476806640625, -3.946136474609375, -3.8175048828125, -3.688873291015625, -3.56024169921875, -3.431610107421875, -3.302978515625, -3.174346923828125, -3.04571533203125, -2.917083740234375, -2.7884521484375, -2.659820556640625, -2.53118896484375, -2.402557373046875, -2.27392578125, -2.145294189453125, -2.01666259765625, -1.888031005859375, -1.7593994140625, -1.630767822265625, -1.50213623046875, -1.373504638671875, -1.244873046875, -1.116241455078125, -0.98760986328125, -0.858978271484375, -0.7303466796875, -0.601715087890625, -0.47308349609375, -0.344451904296875, -0.2158203125, -0.087188720703125, 0.04144287109375, 0.170074462890625, 0.2987060546875, 0.427337646484375, 0.55596923828125, 0.684600830078125, 0.813232421875, 0.941864013671875, 1.07049560546875, 1.199127197265625, 1.3277587890625, 1.456390380859375, 1.58502197265625, 1.713653564453125, 1.84228515625, 1.970916748046875, 2.09954833984375, 2.228179931640625, 2.3568115234375, 2.485443115234375, 2.61407470703125, 2.742706298828125, 2.871337890625, 2.999969482421875, 3.12860107421875, 3.257232666015625, 3.3858642578125, 3.514495849609375, 3.64312744140625, 3.771759033203125, 3.900390625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 8.0, 7.0, 7.0, 8.0, 7.0, 22.0, 16.0, 27.0, 26.0, 60.0, 71.0, 95.0, 118.0, 166.0, 219.0, 316.0, 425.0, 655.0, 1216.0, 2775.0, 11505.0, 114488.0, 2172891.0, 1783821.0, 90025.0, 9515.0, 2506.0, 1081.0, 633.0, 416.0, 289.0, 219.0, 160.0, 114.0, 100.0, 79.0, 45.0, 33.0, 31.0, 17.0, 20.0, 16.0, 4.0, 5.0, 3.0, 5.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0], "bins": [-24.484375, -23.783935546875, -23.08349609375, -22.383056640625, -21.6826171875, -20.982177734375, -20.28173828125, -19.581298828125, -18.880859375, -18.180419921875, -17.47998046875, -16.779541015625, -16.0791015625, -15.378662109375, -14.67822265625, -13.977783203125, -13.27734375, -12.576904296875, -11.87646484375, -11.176025390625, -10.4755859375, -9.775146484375, -9.07470703125, -8.374267578125, -7.673828125, -6.973388671875, -6.27294921875, -5.572509765625, -4.8720703125, -4.171630859375, -3.47119140625, -2.770751953125, -2.0703125, -1.369873046875, -0.66943359375, 0.031005859375, 0.7314453125, 1.431884765625, 2.13232421875, 2.832763671875, 3.533203125, 4.233642578125, 4.93408203125, 5.634521484375, 6.3349609375, 7.035400390625, 7.73583984375, 8.436279296875, 9.13671875, 9.837158203125, 10.53759765625, 11.238037109375, 11.9384765625, 12.638916015625, 13.33935546875, 14.039794921875, 14.740234375, 15.440673828125, 16.14111328125, 16.841552734375, 17.5419921875, 18.242431640625, 18.94287109375, 19.643310546875, 20.34375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 9.0, 6.0, 10.0, 11.0, 14.0, 20.0, 30.0, 49.0, 63.0, 107.0, 175.0, 211.0, 295.0, 353.0, 434.0, 477.0, 469.0, 393.0, 276.0, 186.0, 155.0, 102.0, 63.0, 46.0, 32.0, 21.0, 23.0, 10.0, 8.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6640625, -9.3603515625, -9.056640625, -8.7529296875, -8.44921875, -8.1455078125, -7.841796875, -7.5380859375, -7.234375, -6.9306640625, -6.626953125, -6.3232421875, -6.01953125, -5.7158203125, -5.412109375, -5.1083984375, -4.8046875, -4.5009765625, -4.197265625, -3.8935546875, -3.58984375, -3.2861328125, -2.982421875, -2.6787109375, -2.375, -2.0712890625, -1.767578125, -1.4638671875, -1.16015625, -0.8564453125, -0.552734375, -0.2490234375, 0.0546875, 0.3583984375, 0.662109375, 0.9658203125, 1.26953125, 1.5732421875, 1.876953125, 2.1806640625, 2.484375, 2.7880859375, 3.091796875, 3.3955078125, 3.69921875, 4.0029296875, 4.306640625, 4.6103515625, 4.9140625, 5.2177734375, 5.521484375, 5.8251953125, 6.12890625, 6.4326171875, 6.736328125, 7.0400390625, 7.34375, 7.6474609375, 7.951171875, 8.2548828125, 8.55859375, 8.8623046875, 9.166015625, 9.4697265625, 9.7734375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 11.0, 12.0, 16.0, 46.0, 68.0, 154.0, 292.0, 712.0, 1845.0, 7132.0, 49782.0, 574114.0, 2890757.0, 606610.0, 52068.0, 7339.0, 1925.0, 732.0, 334.0, 146.0, 80.0, 39.0, 26.0, 7.0, 14.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.9296875, -12.4761962890625, -12.022705078125, -11.5692138671875, -11.11572265625, -10.6622314453125, -10.208740234375, -9.7552490234375, -9.3017578125, -8.8482666015625, -8.394775390625, -7.9412841796875, -7.48779296875, -7.0343017578125, -6.580810546875, -6.1273193359375, -5.673828125, -5.2203369140625, -4.766845703125, -4.3133544921875, -3.85986328125, -3.4063720703125, -2.952880859375, -2.4993896484375, -2.0458984375, -1.5924072265625, -1.138916015625, -0.6854248046875, -0.23193359375, 0.2215576171875, 0.675048828125, 1.1285400390625, 1.58203125, 2.0355224609375, 2.489013671875, 2.9425048828125, 3.39599609375, 3.8494873046875, 4.302978515625, 4.7564697265625, 5.2099609375, 5.6634521484375, 6.116943359375, 6.5704345703125, 7.02392578125, 7.4774169921875, 7.930908203125, 8.3843994140625, 8.837890625, 9.2913818359375, 9.744873046875, 10.1983642578125, 10.65185546875, 11.1053466796875, 11.558837890625, 12.0123291015625, 12.4658203125, 12.9193115234375, 13.372802734375, 13.8262939453125, 14.27978515625, 14.7332763671875, 15.186767578125, 15.6402587890625, 16.09375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 13.0, 22.0, 33.0, 54.0, 74.0, 100.0, 114.0, 118.0, 124.0, 121.0, 79.0, 54.0, 32.0, 22.0, 13.0, 11.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.53193664550781, -77.36991119384766, -74.2078857421875, -71.04585266113281, -67.88382720947266, -64.7218017578125, -61.559776306152344, -58.39774703979492, -55.2357177734375, -52.073692321777344, -48.91166305541992, -45.749637603759766, -42.587608337402344, -39.42558288574219, -36.26355743408203, -33.10152816772461, -29.939502716064453, -26.777475357055664, -23.615447998046875, -20.45342254638672, -17.291393280029297, -14.129366874694824, -10.967340469360352, -7.8053131103515625, -4.643285751342773, -1.4812586307525635, 1.6807684898376465, 4.842795372009277, 8.004822731018066, 11.166850090026855, 14.328876495361328, 17.490903854370117, 20.652931213378906, 23.814958572387695, 26.976985931396484, 30.13901138305664, 33.30104064941406, 36.46306610107422, 39.625091552734375, 42.7871208190918, 45.94915008544922, 49.111175537109375, 52.2732048034668, 55.43523025512695, 58.597259521484375, 61.75928497314453, 64.92131042480469, 68.08334350585938, 71.245361328125, 74.40738677978516, 77.56941223144531, 80.7314453125, 83.89347076416016, 87.05549621582031, 90.21752166748047, 93.37954711914062, 96.54158020019531, 99.70360565185547, 102.86563110351562, 106.02766418457031, 109.18968963623047, 112.35171508789062, 115.51374053955078, 118.67576599121094, 121.83779907226562]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 11.0, 14.0, 10.0, 10.0, 14.0, 19.0, 16.0, 29.0, 27.0, 24.0, 21.0, 31.0, 32.0, 31.0, 46.0, 30.0, 47.0, 32.0, 40.0, 42.0, 45.0, 31.0, 43.0, 42.0, 31.0, 36.0, 27.0, 23.0, 23.0, 18.0, 19.0, 16.0, 28.0, 20.0, 6.0, 11.0, 9.0, 10.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-45.17182159423828, -43.788028717041016, -42.404232025146484, -41.02043914794922, -39.63664245605469, -38.25284957885742, -36.869056701660156, -35.485260009765625, -34.101463317871094, -32.71767044067383, -31.333873748779297, -29.95008087158203, -28.5662841796875, -27.182491302490234, -25.798696517944336, -24.414901733398438, -23.031108856201172, -21.647314071655273, -20.263519287109375, -18.87972640991211, -17.495929718017578, -16.112136840820312, -14.728342056274414, -13.344547271728516, -11.960752487182617, -10.576957702636719, -9.19316291809082, -7.809369087219238, -6.42557430267334, -5.041779518127441, -3.6579856872558594, -2.274190902709961, -0.8903961181640625, 0.49339842796325684, 1.8771929740905762, 3.2609872817993164, 4.644782066345215, 6.028576850891113, 7.412370681762695, 8.796165466308594, 10.179960250854492, 11.56375503540039, 12.947549819946289, 14.331343650817871, 15.71513843536377, 17.098934173583984, 18.48272705078125, 19.86652183532715, 21.250316619873047, 22.634111404418945, 24.017906188964844, 25.40169906616211, 26.78549575805664, 28.169288635253906, 29.553083419799805, 30.936878204345703, 32.32067108154297, 33.704463958740234, 35.088260650634766, 36.47205352783203, 37.85585021972656, 39.23964309692383, 40.623435974121094, 42.007232666015625, 43.391029357910156]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 13.0, 8.0, 5.0, 13.0, 17.0, 21.0, 27.0, 24.0, 25.0, 30.0, 32.0, 38.0, 33.0, 34.0, 44.0, 46.0, 40.0, 44.0, 46.0, 37.0, 37.0, 48.0, 47.0, 36.0, 29.0, 29.0, 30.0, 26.0, 20.0, 24.0, 17.0, 22.0, 5.0, 10.0, 10.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-101.125, -97.84765625, -94.5703125, -91.29296875, -88.015625, -84.73828125, -81.4609375, -78.18359375, -74.90625, -71.62890625, -68.3515625, -65.07421875, -61.796875, -58.51953125, -55.2421875, -51.96484375, -48.6875, -45.41015625, -42.1328125, -38.85546875, -35.578125, -32.30078125, -29.0234375, -25.74609375, -22.46875, -19.19140625, -15.9140625, -12.63671875, -9.359375, -6.08203125, -2.8046875, 0.47265625, 3.75, 7.02734375, 10.3046875, 13.58203125, 16.859375, 20.13671875, 23.4140625, 26.69140625, 29.96875, 33.24609375, 36.5234375, 39.80078125, 43.078125, 46.35546875, 49.6328125, 52.91015625, 56.1875, 59.46484375, 62.7421875, 66.01953125, 69.296875, 72.57421875, 75.8515625, 79.12890625, 82.40625, 85.68359375, 88.9609375, 92.23828125, 95.515625, 98.79296875, 102.0703125, 105.34765625, 108.625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 19.0, 24.0, 30.0, 44.0, 78.0, 106.0, 159.0, 224.0, 367.0, 570.0, 885.0, 1286.0, 2097.0, 3218.0, 5266.0, 8036.0, 12892.0, 20736.0, 33053.0, 55151.0, 97546.0, 210835.0, 307353.0, 119870.0, 65136.0, 38911.0, 23650.0, 15039.0, 9360.0, 6001.0, 3753.0, 2431.0, 1497.0, 1027.0, 622.0, 411.0, 273.0, 196.0, 125.0, 75.0, 57.0, 44.0, 28.0, 22.0, 17.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.4765625, -4.341552734375, -4.20654296875, -4.071533203125, -3.9365234375, -3.801513671875, -3.66650390625, -3.531494140625, -3.396484375, -3.261474609375, -3.12646484375, -2.991455078125, -2.8564453125, -2.721435546875, -2.58642578125, -2.451416015625, -2.31640625, -2.181396484375, -2.04638671875, -1.911376953125, -1.7763671875, -1.641357421875, -1.50634765625, -1.371337890625, -1.236328125, -1.101318359375, -0.96630859375, -0.831298828125, -0.6962890625, -0.561279296875, -0.42626953125, -0.291259765625, -0.15625, -0.021240234375, 0.11376953125, 0.248779296875, 0.3837890625, 0.518798828125, 0.65380859375, 0.788818359375, 0.923828125, 1.058837890625, 1.19384765625, 1.328857421875, 1.4638671875, 1.598876953125, 1.73388671875, 1.868896484375, 2.00390625, 2.138916015625, 2.27392578125, 2.408935546875, 2.5439453125, 2.678955078125, 2.81396484375, 2.948974609375, 3.083984375, 3.218994140625, 3.35400390625, 3.489013671875, 3.6240234375, 3.759033203125, 3.89404296875, 4.029052734375, 4.1640625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 7.0, 10.0, 12.0, 5.0, 19.0, 11.0, 12.0, 19.0, 21.0, 23.0, 34.0, 30.0, 35.0, 30.0, 39.0, 36.0, 39.0, 33.0, 37.0, 1059.0, 39.0, 57.0, 47.0, 45.0, 37.0, 37.0, 29.0, 28.0, 33.0, 30.0, 26.0, 20.0, 16.0, 14.0, 8.0, 9.0, 12.0, 4.0, 3.0, 5.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.4375, -65.087890625, -62.73828125, -60.388671875, -58.0390625, -55.689453125, -53.33984375, -50.990234375, -48.640625, -46.291015625, -43.94140625, -41.591796875, -39.2421875, -36.892578125, -34.54296875, -32.193359375, -29.84375, -27.494140625, -25.14453125, -22.794921875, -20.4453125, -18.095703125, -15.74609375, -13.396484375, -11.046875, -8.697265625, -6.34765625, -3.998046875, -1.6484375, 0.701171875, 3.05078125, 5.400390625, 7.75, 10.099609375, 12.44921875, 14.798828125, 17.1484375, 19.498046875, 21.84765625, 24.197265625, 26.546875, 28.896484375, 31.24609375, 33.595703125, 35.9453125, 38.294921875, 40.64453125, 42.994140625, 45.34375, 47.693359375, 50.04296875, 52.392578125, 54.7421875, 57.091796875, 59.44140625, 61.791015625, 64.140625, 66.490234375, 68.83984375, 71.189453125, 73.5390625, 75.888671875, 78.23828125, 80.587890625, 82.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 13.0, 19.0, 35.0, 54.0, 66.0, 104.0, 195.0, 250.0, 377.0, 581.0, 875.0, 1257.0, 1843.0, 2775.0, 4029.0, 6481.0, 9632.0, 15090.0, 23662.0, 37691.0, 63651.0, 116625.0, 1328971.0, 223192.0, 104372.0, 57769.0, 35137.0, 21827.0, 13888.0, 9019.0, 5900.0, 4062.0, 2472.0, 1729.0, 1182.0, 722.0, 520.0, 337.0, 236.0, 156.0, 120.0, 68.0, 54.0, 28.0, 22.0, 15.0, 15.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.388671875, -2.31610107421875, -2.2435302734375, -2.17095947265625, -2.098388671875, -2.02581787109375, -1.9532470703125, -1.88067626953125, -1.80810546875, -1.73553466796875, -1.6629638671875, -1.59039306640625, -1.517822265625, -1.44525146484375, -1.3726806640625, -1.30010986328125, -1.2275390625, -1.15496826171875, -1.0823974609375, -1.00982666015625, -0.937255859375, -0.86468505859375, -0.7921142578125, -0.71954345703125, -0.64697265625, -0.57440185546875, -0.5018310546875, -0.42926025390625, -0.356689453125, -0.28411865234375, -0.2115478515625, -0.13897705078125, -0.06640625, 0.00616455078125, 0.0787353515625, 0.15130615234375, 0.223876953125, 0.29644775390625, 0.3690185546875, 0.44158935546875, 0.51416015625, 0.58673095703125, 0.6593017578125, 0.73187255859375, 0.804443359375, 0.87701416015625, 0.9495849609375, 1.02215576171875, 1.0947265625, 1.16729736328125, 1.2398681640625, 1.31243896484375, 1.385009765625, 1.45758056640625, 1.5301513671875, 1.60272216796875, 1.67529296875, 1.74786376953125, 1.8204345703125, 1.89300537109375, 1.965576171875, 2.03814697265625, 2.1107177734375, 2.18328857421875, 2.255859375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 6.0, 10.0, 9.0, 14.0, 12.0, 18.0, 19.0, 24.0, 31.0, 37.0, 51.0, 64.0, 87.0, 94.0, 110.0, 82.0, 62.0, 60.0, 51.0, 35.0, 27.0, 19.0, 16.0, 12.0, 10.0, 7.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0961971282958984e-05, -4.9219466745853424e-05, -4.7476962208747864e-05, -4.5734457671642303e-05, -4.399195313453674e-05, -4.224944859743118e-05, -4.050694406032562e-05, -3.876443952322006e-05, -3.70219349861145e-05, -3.527943044900894e-05, -3.353692591190338e-05, -3.179442137479782e-05, -3.005191683769226e-05, -2.83094123005867e-05, -2.656690776348114e-05, -2.482440322637558e-05, -2.308189868927002e-05, -2.133939415216446e-05, -1.95968896150589e-05, -1.785438507795334e-05, -1.611188054084778e-05, -1.4369376003742218e-05, -1.2626871466636658e-05, -1.0884366929531097e-05, -9.141862392425537e-06, -7.399357855319977e-06, -5.6568533182144165e-06, -3.914348781108856e-06, -2.171844244003296e-06, -4.293397068977356e-07, 1.3131648302078247e-06, 3.055669367313385e-06, 4.798173904418945e-06, 6.540678441524506e-06, 8.283182978630066e-06, 1.0025687515735626e-05, 1.1768192052841187e-05, 1.3510696589946747e-05, 1.5253201127052307e-05, 1.6995705664157867e-05, 1.8738210201263428e-05, 2.0480714738368988e-05, 2.222321927547455e-05, 2.396572381258011e-05, 2.570822834968567e-05, 2.745073288679123e-05, 2.919323742389679e-05, 3.093574196100235e-05, 3.267824649810791e-05, 3.442075103521347e-05, 3.616325557231903e-05, 3.790576010942459e-05, 3.964826464653015e-05, 4.139076918363571e-05, 4.313327372074127e-05, 4.487577825784683e-05, 4.661828279495239e-05, 4.836078733205795e-05, 5.010329186916351e-05, 5.1845796406269073e-05, 5.3588300943374634e-05, 5.5330805480480194e-05, 5.7073310017585754e-05, 5.8815814554691315e-05, 6.0558319091796875e-05]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 14.0, 8.0, 17.0, 27.0, 33.0, 56.0, 96.0, 138.0, 188.0, 320.0, 542.0, 984.0, 1764.0, 3517.0, 7526.0, 17231.0, 42015.0, 122735.0, 490472.0, 241510.0, 70852.0, 26365.0, 11354.0, 5125.0, 2497.0, 1279.0, 741.0, 394.0, 267.0, 153.0, 106.0, 65.0, 41.0, 36.0, 16.0, 16.0, 8.0, 8.0, 6.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002391338348388672, -0.00023204833269119263, -0.00022496283054351807, -0.0002178773283958435, -0.00021079182624816895, -0.00020370632410049438, -0.00019662082195281982, -0.00018953531980514526, -0.0001824498176574707, -0.00017536431550979614, -0.00016827881336212158, -0.00016119331121444702, -0.00015410780906677246, -0.0001470223069190979, -0.00013993680477142334, -0.00013285130262374878, -0.00012576580047607422, -0.00011868029832839966, -0.0001115947961807251, -0.00010450929403305054, -9.742379188537598e-05, -9.033828973770142e-05, -8.325278759002686e-05, -7.61672854423523e-05, -6.908178329467773e-05, -6.199628114700317e-05, -5.491077899932861e-05, -4.782527685165405e-05, -4.073977470397949e-05, -3.365427255630493e-05, -2.656877040863037e-05, -1.948326826095581e-05, -1.239776611328125e-05, -5.3122639656066895e-06, 1.773238182067871e-06, 8.858740329742432e-06, 1.5944242477416992e-05, 2.3029744625091553e-05, 3.0115246772766113e-05, 3.7200748920440674e-05, 4.4286251068115234e-05, 5.1371753215789795e-05, 5.8457255363464355e-05, 6.554275751113892e-05, 7.262825965881348e-05, 7.971376180648804e-05, 8.67992639541626e-05, 9.388476610183716e-05, 0.00010097026824951172, 0.00010805577039718628, 0.00011514127254486084, 0.0001222267746925354, 0.00012931227684020996, 0.00013639777898788452, 0.00014348328113555908, 0.00015056878328323364, 0.0001576542854309082, 0.00016473978757858276, 0.00017182528972625732, 0.00017891079187393188, 0.00018599629402160645, 0.000193081796169281, 0.00020016729831695557, 0.00020725280046463013, 0.0002143383026123047]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 12.0, 17.0, 26.0, 31.0, 55.0, 67.0, 98.0, 94.0, 109.0, 104.0, 82.0, 74.0, 53.0, 51.0, 27.0, 25.0, 16.0, 14.0, 8.0, 9.0, 3.0, 3.0, 1.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4051616239594296e-05, -3.2660464057698846e-05, -3.126930823782459e-05, -2.987815605592914e-05, -2.848700387403369e-05, -2.709585169213824e-05, -2.5704697691253386e-05, -2.4313543690368533e-05, -2.2922391508473083e-05, -2.1531239326577634e-05, -2.014008532569278e-05, -1.8748931324807927e-05, -1.7357779142912477e-05, -1.5966626961017027e-05, -1.4575472960132174e-05, -1.3184319868742023e-05, -1.1793166777351871e-05, -1.040201368596172e-05, -9.010860594571568e-06, -7.6197075031814165e-06, -6.228554411791265e-06, -4.8374013204011135e-06, -3.446248229010962e-06, -2.0550951376208104e-06, -6.639420462306589e-07, 7.272110451594926e-07, 2.118364136549644e-06, 3.5095172279397957e-06, 4.900670319329947e-06, 6.291823410720099e-06, 7.68297650211025e-06, 9.074129593500402e-06, 1.046528632286936e-05, 1.1856439414259512e-05, 1.3247592505649664e-05, 1.4638745597039815e-05, 1.6029898688429967e-05, 1.7421050870325416e-05, 1.881220487121027e-05, 2.0203358872095123e-05, 2.1594511053990573e-05, 2.2985663235886022e-05, 2.4376817236770876e-05, 2.576797123765573e-05, 2.715912341955118e-05, 2.855027560144663e-05, 2.9941429602331482e-05, 3.1332583603216335e-05, 3.2723735785111785e-05, 3.4114887967007235e-05, 3.5506040148902684e-05, 3.689719596877694e-05, 3.828834815067239e-05, 3.967950033256784e-05, 4.10706561524421e-05, 4.246180833433755e-05, 4.3852960516233e-05, 4.524411269812845e-05, 4.66352648800239e-05, 4.8026420699898154e-05, 4.94175728817936e-05, 5.080872506368905e-05, 5.219988088356331e-05, 5.359103306545876e-05, 5.498218524735421e-05]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 7.0, 5.0, 17.0, 8.0, 13.0, 10.0, 14.0, 18.0, 20.0, 18.0, 26.0, 31.0, 32.0, 30.0, 28.0, 23.0, 21.0, 42.0, 45.0, 37.0, 51.0, 36.0, 36.0, 43.0, 41.0, 37.0, 39.0, 30.0, 37.0, 27.0, 29.0, 18.0, 12.0, 15.0, 20.0, 19.0, 10.0, 10.0, 10.0, 9.0, 2.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.3245811462402344e-05, -2.2532418370246887e-05, -2.181902527809143e-05, -2.1105632185935974e-05, -2.0392239093780518e-05, -1.967884600162506e-05, -1.8965452909469604e-05, -1.8252059817314148e-05, -1.753866672515869e-05, -1.6825273633003235e-05, -1.611188054084778e-05, -1.5398487448692322e-05, -1.4685094356536865e-05, -1.3971701264381409e-05, -1.3258308172225952e-05, -1.2544915080070496e-05, -1.1831521987915039e-05, -1.1118128895759583e-05, -1.0404735803604126e-05, -9.69134271144867e-06, -8.977949619293213e-06, -8.264556527137756e-06, -7.5511634349823e-06, -6.837770342826843e-06, -6.124377250671387e-06, -5.41098415851593e-06, -4.697591066360474e-06, -3.984197974205017e-06, -3.2708048820495605e-06, -2.557411789894104e-06, -1.8440186977386475e-06, -1.130625605583191e-06, -4.172325134277344e-07, 2.9616057872772217e-07, 1.0095536708831787e-06, 1.7229467630386353e-06, 2.436339855194092e-06, 3.1497329473495483e-06, 3.863126039505005e-06, 4.5765191316604614e-06, 5.289912223815918e-06, 6.0033053159713745e-06, 6.716698408126831e-06, 7.430091500282288e-06, 8.143484592437744e-06, 8.8568776845932e-06, 9.570270776748657e-06, 1.0283663868904114e-05, 1.099705696105957e-05, 1.1710450053215027e-05, 1.2423843145370483e-05, 1.313723623752594e-05, 1.3850629329681396e-05, 1.4564022421836853e-05, 1.527741551399231e-05, 1.5990808606147766e-05, 1.6704201698303223e-05, 1.741759479045868e-05, 1.8130987882614136e-05, 1.8844380974769592e-05, 1.955777406692505e-05, 2.0271167159080505e-05, 2.0984560251235962e-05, 2.169795334339142e-05, 2.2411346435546875e-05]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 13.0, 8.0, 5.0, 13.0, 17.0, 21.0, 27.0, 24.0, 25.0, 30.0, 32.0, 38.0, 33.0, 34.0, 44.0, 46.0, 40.0, 44.0, 46.0, 37.0, 37.0, 48.0, 47.0, 36.0, 29.0, 29.0, 30.0, 26.0, 20.0, 24.0, 17.0, 22.0, 5.0, 10.0, 10.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-101.125, -97.84765625, -94.5703125, -91.29296875, -88.015625, -84.73828125, -81.4609375, -78.18359375, -74.90625, -71.62890625, -68.3515625, -65.07421875, -61.796875, -58.51953125, -55.2421875, -51.96484375, -48.6875, -45.41015625, -42.1328125, -38.85546875, -35.578125, -32.30078125, -29.0234375, -25.74609375, -22.46875, -19.19140625, -15.9140625, -12.63671875, -9.359375, -6.08203125, -2.8046875, 0.47265625, 3.75, 7.02734375, 10.3046875, 13.58203125, 16.859375, 20.13671875, 23.4140625, 26.69140625, 29.96875, 33.24609375, 36.5234375, 39.80078125, 43.078125, 46.35546875, 49.6328125, 52.91015625, 56.1875, 59.46484375, 62.7421875, 66.01953125, 69.296875, 72.57421875, 75.8515625, 79.12890625, 82.40625, 85.68359375, 88.9609375, 92.23828125, 95.515625, 98.79296875, 102.0703125, 105.34765625, 108.625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 8.0, 10.0, 9.0, 8.0, 17.0, 11.0, 22.0, 27.0, 24.0, 24.0, 41.0, 51.0, 82.0, 121.0, 346.0, 1056.0, 5678.0, 55293.0, 549378.0, 396796.0, 34065.0, 3995.0, 774.0, 264.0, 136.0, 65.0, 49.0, 32.0, 37.0, 21.0, 23.0, 18.0, 19.0, 11.0, 9.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.546875, -20.849609375, -20.15234375, -19.455078125, -18.7578125, -18.060546875, -17.36328125, -16.666015625, -15.96875, -15.271484375, -14.57421875, -13.876953125, -13.1796875, -12.482421875, -11.78515625, -11.087890625, -10.390625, -9.693359375, -8.99609375, -8.298828125, -7.6015625, -6.904296875, -6.20703125, -5.509765625, -4.8125, -4.115234375, -3.41796875, -2.720703125, -2.0234375, -1.326171875, -0.62890625, 0.068359375, 0.765625, 1.462890625, 2.16015625, 2.857421875, 3.5546875, 4.251953125, 4.94921875, 5.646484375, 6.34375, 7.041015625, 7.73828125, 8.435546875, 9.1328125, 9.830078125, 10.52734375, 11.224609375, 11.921875, 12.619140625, 13.31640625, 14.013671875, 14.7109375, 15.408203125, 16.10546875, 16.802734375, 17.5, 18.197265625, 18.89453125, 19.591796875, 20.2890625, 20.986328125, 21.68359375, 22.380859375, 23.078125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 7.0, 9.0, 13.0, 32.0, 41.0, 67.0, 111.0, 151.0, 2196.0, 131.0, 103.0, 92.0, 48.0, 25.0, 14.0, 9.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-506.75, -492.4453125, -478.140625, -463.8359375, -449.53125, -435.2265625, -420.921875, -406.6171875, -392.3125, -378.0078125, -363.703125, -349.3984375, -335.09375, -320.7890625, -306.484375, -292.1796875, -277.875, -263.5703125, -249.265625, -234.9609375, -220.65625, -206.3515625, -192.046875, -177.7421875, -163.4375, -149.1328125, -134.828125, -120.5234375, -106.21875, -91.9140625, -77.609375, -63.3046875, -49.0, -34.6953125, -20.390625, -6.0859375, 8.21875, 22.5234375, 36.828125, 51.1328125, 65.4375, 79.7421875, 94.046875, 108.3515625, 122.65625, 136.9609375, 151.265625, 165.5703125, 179.875, 194.1796875, 208.484375, 222.7890625, 237.09375, 251.3984375, 265.703125, 280.0078125, 294.3125, 308.6171875, 322.921875, 337.2265625, 351.53125, 365.8359375, 380.140625, 394.4453125, 408.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 8.0, 13.0, 17.0, 23.0, 33.0, 62.0, 104.0, 171.0, 329.0, 715.0, 1838.0, 7016.0, 72542.0, 2832490.0, 211946.0, 13746.0, 2736.0, 894.0, 460.0, 231.0, 125.0, 72.0, 47.0, 22.0, 23.0, 7.0, 13.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.578125, -17.005126953125, -16.43212890625, -15.859130859375, -15.2861328125, -14.713134765625, -14.14013671875, -13.567138671875, -12.994140625, -12.421142578125, -11.84814453125, -11.275146484375, -10.7021484375, -10.129150390625, -9.55615234375, -8.983154296875, -8.41015625, -7.837158203125, -7.26416015625, -6.691162109375, -6.1181640625, -5.545166015625, -4.97216796875, -4.399169921875, -3.826171875, -3.253173828125, -2.68017578125, -2.107177734375, -1.5341796875, -0.961181640625, -0.38818359375, 0.184814453125, 0.7578125, 1.330810546875, 1.90380859375, 2.476806640625, 3.0498046875, 3.622802734375, 4.19580078125, 4.768798828125, 5.341796875, 5.914794921875, 6.48779296875, 7.060791015625, 7.6337890625, 8.206787109375, 8.77978515625, 9.352783203125, 9.92578125, 10.498779296875, 11.07177734375, 11.644775390625, 12.2177734375, 12.790771484375, 13.36376953125, 13.936767578125, 14.509765625, 15.082763671875, 15.65576171875, 16.228759765625, 16.8017578125, 17.374755859375, 17.94775390625, 18.520751953125, 19.09375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 9.0, 13.0, 16.0, 29.0, 49.0, 112.0, 180.0, 201.0, 172.0, 94.0, 33.0, 25.0, 16.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-496.2736511230469, -485.98358154296875, -475.6935119628906, -465.4034423828125, -455.1133728027344, -444.82330322265625, -434.5332336425781, -424.2431640625, -413.9530944824219, -403.66302490234375, -393.3729553222656, -383.0828857421875, -372.7928161621094, -362.50274658203125, -352.2126770019531, -341.922607421875, -331.6325378417969, -321.34246826171875, -311.0523986816406, -300.7623291015625, -290.4722595214844, -280.18218994140625, -269.8921203613281, -259.60205078125, -249.31198120117188, -239.02191162109375, -228.73184204101562, -218.4417724609375, -208.15170288085938, -197.86163330078125, -187.57156372070312, -177.281494140625, -166.9914093017578, -156.7013397216797, -146.41127014160156, -136.12120056152344, -125.83113098144531, -115.54106140136719, -105.25099182128906, -94.96092224121094, -84.67085266113281, -74.38078308105469, -64.09071350097656, -53.80064392089844, -43.51057434082031, -33.22050476074219, -22.930435180664062, -12.640365600585938, -2.3502960205078125, 7.9397735595703125, 18.229843139648438, 28.519912719726562, 38.80998229980469, 49.10005187988281, 59.39012145996094, 69.68019104003906, 79.97026062011719, 90.26033020019531, 100.55039978027344, 110.84046936035156, 121.13053894042969, 131.4206085205078, 141.71067810058594, 152.00074768066406, 162.2908172607422]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 0.0, 7.0, 4.0, 7.0, 5.0, 7.0, 13.0, 12.0, 12.0, 9.0, 15.0, 9.0, 17.0, 22.0, 19.0, 32.0, 17.0, 27.0, 28.0, 44.0, 36.0, 33.0, 43.0, 38.0, 27.0, 38.0, 42.0, 29.0, 42.0, 37.0, 23.0, 39.0, 31.0, 28.0, 27.0, 22.0, 18.0, 20.0, 12.0, 17.0, 9.0, 15.0, 11.0, 9.0, 5.0, 9.0, 7.0, 8.0, 7.0, 2.0, 4.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-246.9398193359375, -239.129638671875, -231.31944274902344, -223.50926208496094, -215.69906616210938, -207.88888549804688, -200.07870483398438, -192.26852416992188, -184.4583282470703, -176.6481475830078, -168.83795166015625, -161.02777099609375, -153.21759033203125, -145.4073944091797, -137.5972137451172, -129.78701782226562, -121.97683715820312, -114.1666488647461, -106.35646057128906, -98.54627990722656, -90.73609161376953, -82.9259033203125, -75.11572265625, -67.30553436279297, -59.49534606933594, -51.685157775878906, -43.87497329711914, -36.064788818359375, -28.254600524902344, -20.444412231445312, -12.634227752685547, -4.824043273925781, 2.98614501953125, 10.796331405639648, 18.606517791748047, 26.416704177856445, 34.226890563964844, 42.037078857421875, 49.84726333618164, 57.657447814941406, 65.46763610839844, 73.27782440185547, 81.0880126953125, 88.898193359375, 96.70838165283203, 104.51856994628906, 112.32875061035156, 120.1389389038086, 127.94912719726562, 135.75930786132812, 143.5695037841797, 151.3796844482422, 159.18988037109375, 167.00006103515625, 174.81024169921875, 182.62042236328125, 190.4306182861328, 198.2407989501953, 206.05099487304688, 213.86117553710938, 221.67135620117188, 229.48155212402344, 237.29173278808594, 245.1019287109375, 252.912109375]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 8.0, 7.0, 13.0, 13.0, 18.0, 25.0, 48.0, 68.0, 96.0, 118.0, 139.0, 220.0, 317.0, 407.0, 533.0, 712.0, 973.0, 1404.0, 1811.0, 2395.0, 3095.0, 4102.0, 1018202.0, 3453.0, 2704.0, 1941.0, 1566.0, 1155.0, 796.0, 605.0, 443.0, 315.0, 254.0, 165.0, 144.0, 84.0, 58.0, 43.0, 35.0, 19.0, 11.0, 11.0, 13.0, 7.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-29.696792602539062, -28.773496627807617, -27.850200653076172, -26.92690658569336, -26.003610610961914, -25.08031463623047, -24.157020568847656, -23.23372459411621, -22.310428619384766, -21.38713264465332, -20.463836669921875, -19.540542602539062, -18.617246627807617, -17.693950653076172, -16.77065658569336, -15.847360610961914, -14.924064636230469, -14.000768661499023, -13.077473640441895, -12.154178619384766, -11.23088264465332, -10.307586669921875, -9.384291648864746, -8.460996627807617, -7.537700653076172, -6.614405155181885, -5.691109657287598, -4.7678141593933105, -3.8445186614990234, -2.9212231636047363, -1.9979276657104492, -1.074632167816162, -0.1513347625732422, 0.7719607353210449, 1.695256233215332, 2.618551731109619, 3.5418472290039062, 4.465142726898193, 5.3884382247924805, 6.311733722686768, 7.235029220581055, 8.1583251953125, 9.081620216369629, 10.004915237426758, 10.928211212158203, 11.851507186889648, 12.774802207946777, 13.698097229003906, 14.621393203735352, 15.544689178466797, 16.46798324584961, 17.391279220581055, 18.3145751953125, 19.237871170043945, 20.16116714477539, 21.084461212158203, 22.00775718688965, 22.931053161621094, 23.854347229003906, 24.77764320373535, 25.700939178466797, 26.624235153198242, 27.547531127929688, 28.4708251953125, 29.394121170043945]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 8.0, 19.0, 25.0, 32.0, 48.0, 96.0, 211.0, 883.0, 86618.0, 51373864.0, 1062.0, 187.0, 92.0, 38.0, 30.0, 13.0, 15.0, 13.0, 13.0, 3.0, 4.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-759.0606079101562, -733.8005981445312, -708.54052734375, -683.280517578125, -658.0205078125, -632.760498046875, -607.50048828125, -582.2404174804688, -556.9804077148438, -531.7203979492188, -506.4603576660156, -481.2003173828125, -455.9403076171875, -430.6802978515625, -405.4202575683594, -380.16021728515625, -354.90020751953125, -329.64019775390625, -304.3801574707031, -279.1201171875, -253.860107421875, -228.60008239746094, -203.34005737304688, -178.0800323486328, -152.82000732421875, -127.55998229980469, -102.29995727539062, -77.03993225097656, -51.7799072265625, -26.519882202148438, -1.259857177734375, 24.000167846679688, 49.26019287109375, 74.52021789550781, 99.78024291992188, 125.04026794433594, 150.30029296875, 175.56031799316406, 200.82034301757812, 226.0803680419922, 251.34039306640625, 276.60040283203125, 301.8604431152344, 327.1204833984375, 352.3804931640625, 377.6405029296875, 402.9005432128906, 428.16058349609375, 453.42059326171875, 478.68060302734375, 503.9406433105469, 529.20068359375, 554.460693359375, 579.720703125, 604.980712890625, 630.2407836914062, 655.5007934570312, 680.7608032226562, 706.0208740234375, 731.2808837890625, 756.5408935546875, 781.8009033203125, 807.0609130859375, 832.3209838867188, 857.5809936523438]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [6.0, 6.0, 5.0, 7.0, 18.0, 22.0, 35.0, 63.0, 79.0, 105.0, 141.0, 216.0, 272.0, 456.0, 610.0, 837.0, 1231.0, 1868.0, 2521.0, 3890.0, 5640.0, 8126.0, 11999.0, 18024.0, 26831.0, 39866.0, 59988.0, 94146.0, 151209.0, 250762.0, 478640.0, 4099761.0, 414703.0, 227114.0, 136192.0, 86722.0, 55941.0, 36412.0, 24592.0, 16589.0, 11200.0, 7565.0, 5188.0, 3672.0, 2520.0, 1756.0, 1226.0, 860.0, 562.0, 405.0, 257.0, 200.0, 140.0, 93.0, 35.0, 37.0, 24.0, 27.0, 14.0, 17.0, 4.0, 0.0, 3.0, 6.0], "bins": [-0.888671875, -0.8603744506835938, -0.8320770263671875, -0.8037796020507812, -0.775482177734375, -0.7471847534179688, -0.7188873291015625, -0.6905899047851562, -0.66229248046875, -0.6339950561523438, -0.6056976318359375, -0.5774002075195312, -0.549102783203125, -0.5208053588867188, -0.4925079345703125, -0.46421051025390625, -0.4359130859375, -0.40761566162109375, -0.3793182373046875, -0.35102081298828125, -0.322723388671875, -0.29442596435546875, -0.2661285400390625, -0.23783111572265625, -0.20953369140625, -0.18123626708984375, -0.1529388427734375, -0.12464141845703125, -0.096343994140625, -0.06804656982421875, -0.0397491455078125, -0.01145172119140625, 0.016845703125, 0.04514312744140625, 0.0734405517578125, 0.10173797607421875, 0.130035400390625, 0.15833282470703125, 0.1866302490234375, 0.21492767333984375, 0.24322509765625, 0.27152252197265625, 0.2998199462890625, 0.32811737060546875, 0.356414794921875, 0.38471221923828125, 0.4130096435546875, 0.44130706787109375, 0.4696044921875, 0.49790191650390625, 0.5261993408203125, 0.5544967651367188, 0.582794189453125, 0.6110916137695312, 0.6393890380859375, 0.6676864624023438, 0.69598388671875, 0.7242813110351562, 0.7525787353515625, 0.7808761596679688, 0.809173583984375, 0.8374710083007812, 0.8657684326171875, 0.8940658569335938, 0.92236328125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 2.0, 7.0, 3.0, 14.0, 14.0, 8.0, 14.0, 19.0, 17.0, 25.0, 19.0, 17.0, 26.0, 18.0, 27.0, 34.0, 36.0, 30.0, 37.0, 29.0, 38.0, 52.0, 1043.0, 32.0, 29.0, 38.0, 29.0, 23.0, 32.0, 38.0, 27.0, 31.0, 27.0, 25.0, 15.0, 22.0, 18.0, 19.0, 13.0, 8.0, 8.0, 9.0, 8.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0], "bins": [-39.1875, -38.01318359375, -36.8388671875, -35.66455078125, -34.490234375, -33.31591796875, -32.1416015625, -30.96728515625, -29.79296875, -28.61865234375, -27.4443359375, -26.27001953125, -25.095703125, -23.92138671875, -22.7470703125, -21.57275390625, -20.3984375, -19.22412109375, -18.0498046875, -16.87548828125, -15.701171875, -14.52685546875, -13.3525390625, -12.17822265625, -11.00390625, -9.82958984375, -8.6552734375, -7.48095703125, -6.306640625, -5.13232421875, -3.9580078125, -2.78369140625, -1.609375, -0.43505859375, 0.7392578125, 1.91357421875, 3.087890625, 4.26220703125, 5.4365234375, 6.61083984375, 7.78515625, 8.95947265625, 10.1337890625, 11.30810546875, 12.482421875, 13.65673828125, 14.8310546875, 16.00537109375, 17.1796875, 18.35400390625, 19.5283203125, 20.70263671875, 21.876953125, 23.05126953125, 24.2255859375, 25.39990234375, 26.57421875, 27.74853515625, 28.9228515625, 30.09716796875, 31.271484375, 32.44580078125, 33.6201171875, 34.79443359375, 35.96875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 9.0, 9.0, 18.0, 21.0, 35.0, 39.0, 77.0, 135.0, 217.0, 301.0, 467.0, 747.0, 1110.0, 1752.0, 2648.0, 4036.0, 6502.0, 10398.0, 16323.0, 25993.0, 41434.0, 66259.0, 109983.0, 195848.0, 404109.0, 4279443.0, 542423.0, 243177.0, 130033.0, 77718.0, 48321.0, 30000.0, 18883.0, 12031.0, 7460.0, 4878.0, 3094.0, 1883.0, 1316.0, 833.0, 516.0, 297.0, 230.0, 133.0, 92.0, 73.0, 54.0, 34.0, 20.0, 22.0, 1.0, 6.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.3291015625, -1.2884063720703125, -1.247711181640625, -1.2070159912109375, -1.16632080078125, -1.1256256103515625, -1.084930419921875, -1.0442352294921875, -1.0035400390625, -0.9628448486328125, -0.922149658203125, -0.8814544677734375, -0.84075927734375, -0.8000640869140625, -0.759368896484375, -0.7186737060546875, -0.677978515625, -0.6372833251953125, -0.596588134765625, -0.5558929443359375, -0.51519775390625, -0.4745025634765625, -0.433807373046875, -0.3931121826171875, -0.3524169921875, -0.3117218017578125, -0.271026611328125, -0.2303314208984375, -0.18963623046875, -0.1489410400390625, -0.108245849609375, -0.0675506591796875, -0.02685546875, 0.0138397216796875, 0.054534912109375, 0.0952301025390625, 0.13592529296875, 0.1766204833984375, 0.217315673828125, 0.2580108642578125, 0.2987060546875, 0.3394012451171875, 0.380096435546875, 0.4207916259765625, 0.46148681640625, 0.5021820068359375, 0.542877197265625, 0.5835723876953125, 0.624267578125, 0.6649627685546875, 0.705657958984375, 0.7463531494140625, 0.78704833984375, 0.8277435302734375, 0.868438720703125, 0.9091339111328125, 0.9498291015625, 0.9905242919921875, 1.031219482421875, 1.0719146728515625, 1.11260986328125, 1.1533050537109375, 1.194000244140625, 1.2346954345703125, 1.275390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 11.0, 17.0, 12.0, 21.0, 16.0, 25.0, 17.0, 26.0, 27.0, 40.0, 32.0, 43.0, 62.0, 46.0, 44.0, 1059.0, 50.0, 47.0, 49.0, 48.0, 41.0, 40.0, 29.0, 27.0, 25.0, 32.0, 16.0, 19.0, 20.0, 11.0, 11.0, 7.0, 5.0, 6.0, 5.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.5, -65.435546875, -63.37109375, -61.306640625, -59.2421875, -57.177734375, -55.11328125, -53.048828125, -50.984375, -48.919921875, -46.85546875, -44.791015625, -42.7265625, -40.662109375, -38.59765625, -36.533203125, -34.46875, -32.404296875, -30.33984375, -28.275390625, -26.2109375, -24.146484375, -22.08203125, -20.017578125, -17.953125, -15.888671875, -13.82421875, -11.759765625, -9.6953125, -7.630859375, -5.56640625, -3.501953125, -1.4375, 0.626953125, 2.69140625, 4.755859375, 6.8203125, 8.884765625, 10.94921875, 13.013671875, 15.078125, 17.142578125, 19.20703125, 21.271484375, 23.3359375, 25.400390625, 27.46484375, 29.529296875, 31.59375, 33.658203125, 35.72265625, 37.787109375, 39.8515625, 41.916015625, 43.98046875, 46.044921875, 48.109375, 50.173828125, 52.23828125, 54.302734375, 56.3671875, 58.431640625, 60.49609375, 62.560546875, 64.625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 6.0, 3.0, 15.0, 24.0, 18.0, 16.0, 46.0, 42.0, 57.0, 81.0, 96.0, 175.0, 237.0, 260.0, 392.0, 553.0, 751.0, 1244.0, 1949.0, 3100.0, 4717.0, 7686.0, 13151.0, 25295.0, 59100.0, 305384.0, 5601290.0, 169957.0, 46109.0, 20584.0, 11055.0, 6524.0, 3939.0, 2417.0, 1619.0, 1020.0, 734.0, 409.0, 374.0, 268.0, 187.0, 111.0, 108.0, 89.0, 65.0, 31.0, 35.0, 55.0, 12.0, 14.0, 12.0, 9.0, 10.0, 9.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.275390625, -3.170989990234375, -3.06658935546875, -2.962188720703125, -2.8577880859375, -2.753387451171875, -2.64898681640625, -2.544586181640625, -2.440185546875, -2.335784912109375, -2.23138427734375, -2.126983642578125, -2.0225830078125, -1.918182373046875, -1.81378173828125, -1.709381103515625, -1.60498046875, -1.500579833984375, -1.39617919921875, -1.291778564453125, -1.1873779296875, -1.082977294921875, -0.97857666015625, -0.874176025390625, -0.769775390625, -0.665374755859375, -0.56097412109375, -0.456573486328125, -0.3521728515625, -0.247772216796875, -0.14337158203125, -0.038970947265625, 0.0654296875, 0.169830322265625, 0.27423095703125, 0.378631591796875, 0.4830322265625, 0.587432861328125, 0.69183349609375, 0.796234130859375, 0.900634765625, 1.005035400390625, 1.10943603515625, 1.213836669921875, 1.3182373046875, 1.422637939453125, 1.52703857421875, 1.631439208984375, 1.73583984375, 1.840240478515625, 1.94464111328125, 2.049041748046875, 2.1534423828125, 2.257843017578125, 2.36224365234375, 2.466644287109375, 2.571044921875, 2.675445556640625, 2.77984619140625, 2.884246826171875, 2.9886474609375, 3.093048095703125, 3.19744873046875, 3.301849365234375, 3.40625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 9.0, 10.0, 12.0, 8.0, 21.0, 18.0, 17.0, 18.0, 12.0, 26.0, 29.0, 37.0, 28.0, 32.0, 32.0, 42.0, 42.0, 35.0, 54.0, 44.0, 1052.0, 28.0, 44.0, 31.0, 57.0, 35.0, 31.0, 26.0, 24.0, 25.0, 20.0, 24.0, 17.0, 15.0, 11.0, 10.0, 12.0, 9.0, 5.0, 3.0, 1.0, 3.0, 8.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.46875, -59.36376953125, -57.2587890625, -55.15380859375, -53.048828125, -50.94384765625, -48.8388671875, -46.73388671875, -44.62890625, -42.52392578125, -40.4189453125, -38.31396484375, -36.208984375, -34.10400390625, -31.9990234375, -29.89404296875, -27.7890625, -25.68408203125, -23.5791015625, -21.47412109375, -19.369140625, -17.26416015625, -15.1591796875, -13.05419921875, -10.94921875, -8.84423828125, -6.7392578125, -4.63427734375, -2.529296875, -0.42431640625, 1.6806640625, 3.78564453125, 5.890625, 7.99560546875, 10.1005859375, 12.20556640625, 14.310546875, 16.41552734375, 18.5205078125, 20.62548828125, 22.73046875, 24.83544921875, 26.9404296875, 29.04541015625, 31.150390625, 33.25537109375, 35.3603515625, 37.46533203125, 39.5703125, 41.67529296875, 43.7802734375, 45.88525390625, 47.990234375, 50.09521484375, 52.2001953125, 54.30517578125, 56.41015625, 58.51513671875, 60.6201171875, 62.72509765625, 64.830078125, 66.93505859375, 69.0400390625, 71.14501953125, 73.25]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 11.0, 9.0, 13.0, 16.0, 14.0, 29.0, 46.0, 240.0, 419.0, 51.0, 26.0, 29.0, 19.0, 15.0, 8.0, 10.0, 6.0, 3.0, 9.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-326.4184875488281, -309.28857421875, -292.1586608886719, -275.02874755859375, -257.8988037109375, -240.76889038085938, -223.63897705078125, -206.50906372070312, -189.37913513183594, -172.2492218017578, -155.11929321289062, -137.9893798828125, -120.85945892333984, -103.72953796386719, -86.59962463378906, -69.4697036743164, -52.33978271484375, -35.209861755371094, -18.079944610595703, -0.9500274658203125, 16.179893493652344, 33.309814453125, 50.439727783203125, 67.56964874267578, 84.69956970214844, 101.8294906616211, 118.95941162109375, 136.08932495117188, 153.21923828125, 170.3491668701172, 187.4790802001953, 204.6090087890625, 221.7388916015625, 238.86880493164062, 255.9987335205078, 273.128662109375, 290.2585754394531, 307.38848876953125, 324.5184020996094, 341.6483154296875, 358.77825927734375, 375.9081726074219, 393.0380859375, 410.16802978515625, 427.2979431152344, 444.4278564453125, 461.5577697753906, 478.68768310546875, 495.8175964355469, 512.947509765625, 530.0774536132812, 547.2073364257812, 564.3372802734375, 581.4671630859375, 598.5971069335938, 615.72705078125, 632.85693359375, 649.9868774414062, 667.1167602539062, 684.2467041015625, 701.3765869140625, 718.5065307617188, 735.636474609375, 752.766357421875, 769.8963012695312]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 2.0, 8.0, 7.0, 8.0, 16.0, 16.0, 21.0, 16.0, 16.0, 17.0, 27.0, 22.0, 20.0, 30.0, 33.0, 23.0, 38.0, 44.0, 49.0, 41.0, 41.0, 39.0, 30.0, 37.0, 32.0, 35.0, 42.0, 37.0, 38.0, 26.0, 23.0, 31.0, 23.0, 21.0, 18.0, 17.0, 10.0, 10.0, 8.0, 5.0, 3.0, 8.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-238.36233520507812, -231.1828155517578, -224.0032958984375, -216.82379150390625, -209.64427185058594, -202.46475219726562, -195.28524780273438, -188.10572814941406, -180.92620849609375, -173.74668884277344, -166.56716918945312, -159.38766479492188, -152.20814514160156, -145.02862548828125, -137.84912109375, -130.6696014404297, -123.49008178710938, -116.31056213378906, -109.13105010986328, -101.9515380859375, -94.77201843261719, -87.59249877929688, -80.4129867553711, -73.23347473144531, -66.053955078125, -58.87443923950195, -51.694923400878906, -44.51540756225586, -37.33589172363281, -30.156375885009766, -22.97686004638672, -15.797344207763672, -8.617843627929688, -1.4383277893066406, 5.741188049316406, 12.920703887939453, 20.1002197265625, 27.279735565185547, 34.459251403808594, 41.63876724243164, 48.81828308105469, 55.997798919677734, 63.17731475830078, 70.35682678222656, 77.53634643554688, 84.71586608886719, 91.89537811279297, 99.07489013671875, 106.25440979003906, 113.43392944335938, 120.61344146728516, 127.79295349121094, 134.97247314453125, 142.15199279785156, 149.33151245117188, 156.51101684570312, 163.69053649902344, 170.87005615234375, 178.049560546875, 185.2290802001953, 192.40859985351562, 199.58811950683594, 206.76763916015625, 213.9471435546875, 221.1266632080078]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 7.0, 10.0, 16.0, 16.0, 21.0, 49.0, 58.0, 79.0, 143.0, 145.0, 201.0, 278.0, 364.0, 454.0, 505.0, 574.0, 676.0, 844.0, 1070.0, 1258.0, 1837.0, 3050.0, 4103.0, 7972.0, 4129380.0, 11858.0, 6935.0, 4431.0, 3256.0, 2545.0, 2005.0, 1730.0, 1458.0, 1266.0, 1053.0, 882.0, 712.0, 541.0, 479.0, 363.0, 306.0, 236.0, 222.0, 180.0, 143.0, 143.0, 113.0, 74.0, 59.0, 58.0, 35.0, 29.0, 18.0, 21.0, 11.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0], "bins": [-1.5078125, -1.4535980224609375, -1.399383544921875, -1.3451690673828125, -1.29095458984375, -1.2367401123046875, -1.182525634765625, -1.1283111572265625, -1.0740966796875, -1.0198822021484375, -0.965667724609375, -0.9114532470703125, -0.85723876953125, -0.8030242919921875, -0.748809814453125, -0.6945953369140625, -0.640380859375, -0.5861663818359375, -0.531951904296875, -0.4777374267578125, -0.42352294921875, -0.3693084716796875, -0.315093994140625, -0.2608795166015625, -0.2066650390625, -0.1524505615234375, -0.098236083984375, -0.0440216064453125, 0.01019287109375, 0.0644073486328125, 0.118621826171875, 0.1728363037109375, 0.22705078125, 0.2812652587890625, 0.335479736328125, 0.3896942138671875, 0.44390869140625, 0.4981231689453125, 0.552337646484375, 0.6065521240234375, 0.6607666015625, 0.7149810791015625, 0.769195556640625, 0.8234100341796875, 0.87762451171875, 0.9318389892578125, 0.986053466796875, 1.0402679443359375, 1.094482421875, 1.1486968994140625, 1.202911376953125, 1.2571258544921875, 1.31134033203125, 1.3655548095703125, 1.419769287109375, 1.4739837646484375, 1.5281982421875, 1.5824127197265625, 1.636627197265625, 1.6908416748046875, 1.74505615234375, 1.7992706298828125, 1.853485107421875, 1.9076995849609375, 1.9619140625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 8.0, 10.0, 7.0, 14.0, 50.0, 760.0, 20.0, 15.0, 15.0, 10.0, 5.0, 9.0, 4.0, 7.0, 5.0, 2.0, 5.0, 6.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0791015625, -0.07625770568847656, -0.07341384887695312, -0.07056999206542969, -0.06772613525390625, -0.06488227844238281, -0.062038421630859375, -0.05919456481933594, -0.0563507080078125, -0.05350685119628906, -0.050662994384765625, -0.04781913757324219, -0.04497528076171875, -0.04213142395019531, -0.039287567138671875, -0.03644371032714844, -0.033599853515625, -0.030755996704101562, -0.027912139892578125, -0.025068283081054688, -0.02222442626953125, -0.019380569458007812, -0.016536712646484375, -0.013692855834960938, -0.0108489990234375, -0.008005142211914062, -0.005161285400390625, -0.0023174285888671875, 0.00052642822265625, 0.0033702850341796875, 0.006214141845703125, 0.009057998657226562, 0.01190185546875, 0.014745712280273438, 0.017589569091796875, 0.020433425903320312, 0.02327728271484375, 0.026121139526367188, 0.028964996337890625, 0.03180885314941406, 0.0346527099609375, 0.03749656677246094, 0.040340423583984375, 0.04318428039550781, 0.04602813720703125, 0.04887199401855469, 0.051715850830078125, 0.05455970764160156, 0.057403564453125, 0.06024742126464844, 0.06309127807617188, 0.06593513488769531, 0.06877899169921875, 0.07162284851074219, 0.07446670532226562, 0.07731056213378906, 0.0801544189453125, 0.08299827575683594, 0.08584213256835938, 0.08868598937988281, 0.09152984619140625, 0.09437370300292969, 0.09721755981445312, 0.10006141662597656, 0.1029052734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 12.0, 7.0, 9.0, 12.0, 10.0, 21.0, 27.0, 51.0, 84.0, 98.0, 161.0, 262.0, 493.0, 832.0, 1525.0, 2884.0, 5775.0, 13045.0, 49897.0, 4072225.0, 26754.0, 9878.0, 4643.0, 2417.0, 1252.0, 749.0, 444.0, 231.0, 165.0, 107.0, 80.0, 30.0, 25.0, 22.0, 10.0, 15.0, 3.0, 9.0, 10.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.1083221435546875, -1.075042724609375, -1.0417633056640625, -1.00848388671875, -0.9752044677734375, -0.941925048828125, -0.9086456298828125, -0.8753662109375, -0.8420867919921875, -0.808807373046875, -0.7755279541015625, -0.74224853515625, -0.7089691162109375, -0.675689697265625, -0.6424102783203125, -0.609130859375, -0.5758514404296875, -0.542572021484375, -0.5092926025390625, -0.47601318359375, -0.4427337646484375, -0.409454345703125, -0.3761749267578125, -0.3428955078125, -0.3096160888671875, -0.276336669921875, -0.2430572509765625, -0.20977783203125, -0.1764984130859375, -0.143218994140625, -0.1099395751953125, -0.07666015625, -0.0433807373046875, -0.010101318359375, 0.0231781005859375, 0.05645751953125, 0.0897369384765625, 0.123016357421875, 0.1562957763671875, 0.1895751953125, 0.2228546142578125, 0.256134033203125, 0.2894134521484375, 0.32269287109375, 0.3559722900390625, 0.389251708984375, 0.4225311279296875, 0.455810546875, 0.4890899658203125, 0.522369384765625, 0.5556488037109375, 0.58892822265625, 0.6222076416015625, 0.655487060546875, 0.6887664794921875, 0.7220458984375, 0.7553253173828125, 0.788604736328125, 0.8218841552734375, 0.85516357421875, 0.8884429931640625, 0.921722412109375, 0.9550018310546875, 0.98828125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 3.0, 6.0, 6.0, 9.0, 1.0, 13.0, 16.0, 9.0, 19.0, 14.0, 29.0, 3725.0, 78.0, 25.0, 19.0, 14.0, 19.0, 8.0, 16.0, 9.0, 11.0, 8.0, 4.0, 1.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.235107421875, -0.22481536865234375, -0.2145233154296875, -0.20423126220703125, -0.193939208984375, -0.18364715576171875, -0.1733551025390625, -0.16306304931640625, -0.15277099609375, -0.14247894287109375, -0.1321868896484375, -0.12189483642578125, -0.111602783203125, -0.10131072998046875, -0.0910186767578125, -0.08072662353515625, -0.0704345703125, -0.06014251708984375, -0.0498504638671875, -0.03955841064453125, -0.029266357421875, -0.01897430419921875, -0.0086822509765625, 0.00160980224609375, 0.01190185546875, 0.02219390869140625, 0.0324859619140625, 0.04277801513671875, 0.053070068359375, 0.06336212158203125, 0.0736541748046875, 0.08394622802734375, 0.09423828125, 0.10453033447265625, 0.1148223876953125, 0.12511444091796875, 0.135406494140625, 0.14569854736328125, 0.1559906005859375, 0.16628265380859375, 0.17657470703125, 0.18686676025390625, 0.1971588134765625, 0.20745086669921875, 0.217742919921875, 0.22803497314453125, 0.2383270263671875, 0.24861907958984375, 0.2589111328125, 0.26920318603515625, 0.2794952392578125, 0.28978729248046875, 0.300079345703125, 0.31037139892578125, 0.3206634521484375, 0.33095550537109375, 0.34124755859375, 0.35153961181640625, 0.3618316650390625, 0.37212371826171875, 0.382415771484375, 0.39270782470703125, 0.4029998779296875, 0.41329193115234375, 0.423583984375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 3.0, 14.0, 59.0, 639.0, 195.0, 55.0, 20.0, 13.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3403024673461914, -0.2676445245742798, -0.19498655200004578, -0.12232859432697296, -0.049670636653900146, 0.022987306118011475, 0.09564527869224548, 0.1683032512664795, 0.2409611940383911, 0.31361913681030273, 0.38627710938453674, 0.45893508195877075, 0.5315930247306824, 0.604250967502594, 0.6769089698791504, 0.749566912651062, 0.8222248554229736, 0.8948827981948853, 0.9675407409667969, 1.0401986837387085, 1.1128566265106201, 1.1855146884918213, 1.258172631263733, 1.3308305740356445, 1.4034885168075562, 1.4761464595794678, 1.5488044023513794, 1.621462345123291, 1.6941204071044922, 1.7667782306671143, 1.8394362926483154, 1.912094235420227, 1.9847521781921387, 2.05741024017334, 2.130068063735962, 2.202726125717163, 2.275383949279785, 2.3480420112609863, 2.4206998348236084, 2.4933578968048096, 2.5660157203674316, 2.638673782348633, 2.711331605911255, 2.783989667892456, 2.856647491455078, 2.9293055534362793, 3.0019633769989014, 3.0746214389801025, 3.1472795009613037, 3.219937562942505, 3.292595386505127, 3.365253448486328, 3.43791127204895, 3.5105693340301514, 3.5832271575927734, 3.6558852195739746, 3.728543281555176, 3.801201343536377, 3.873859167098999, 3.9465172290802, 4.019175052642822, 4.091833114624023, 4.164491176605225, 4.237149238586426, 4.309806823730469]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 7.0, 5.0, 10.0, 11.0, 14.0, 11.0, 15.0, 27.0, 42.0, 64.0, 74.0, 89.0, 103.0, 110.0, 102.0, 79.0, 68.0, 33.0, 33.0, 27.0, 15.0, 7.0, 11.0, 6.0, 4.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9741743206977844, -0.941252589225769, -0.9083309173583984, -0.8754091858863831, -0.8424875140190125, -0.8095657825469971, -0.7766441106796265, -0.7437223792076111, -0.7108006477355957, -0.6778789162635803, -0.6449572443962097, -0.6120355129241943, -0.5791138410568237, -0.5461921095848083, -0.513270378112793, -0.48034870624542236, -0.44742703437805176, -0.41450533270835876, -0.38158363103866577, -0.3486618995666504, -0.3157402276992798, -0.2828184962272644, -0.2498967945575714, -0.21697509288787842, -0.18405339121818542, -0.15113168954849243, -0.11820998042821884, -0.08528827130794525, -0.05236656963825226, -0.019444867968559265, 0.013476848602294922, 0.046398550271987915, 0.07932019233703613, 0.11224189400672913, 0.14516359567642212, 0.1780853122472763, 0.2110070139169693, 0.2439287155866623, 0.2768504321575165, 0.3097721338272095, 0.34269383549690247, 0.37561553716659546, 0.40853723883628845, 0.44145894050598145, 0.4743806719779968, 0.5073023438453674, 0.5402240753173828, 0.5731457471847534, 0.6060674786567688, 0.6389892101287842, 0.6719108819961548, 0.7048326134681702, 0.7377542853355408, 0.7706760168075562, 0.8035976886749268, 0.8365194201469421, 0.8694411516189575, 0.9023628830909729, 0.9352845549583435, 0.9682062864303589, 1.0011279582977295, 1.0340496301651, 1.0669714212417603, 1.0998930931091309, 1.1328147649765015]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 15.0, 22.0, 25.0, 38.0, 49.0, 70.0, 99.0, 118.0, 165.0, 228.0, 323.0, 469.0, 609.0, 899.0, 1269.0, 1716.0, 2618.0, 3977.0, 6209.0, 10890.0, 24140.0, 867617.0, 87720.0, 15249.0, 8173.0, 4932.0, 3286.0, 2200.0, 1511.0, 1095.0, 747.0, 563.0, 387.0, 298.0, 220.0, 158.0, 121.0, 85.0, 59.0, 43.0, 36.0, 25.0, 17.0, 18.0, 13.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.52734375, -0.5112380981445312, -0.4951324462890625, -0.47902679443359375, -0.462921142578125, -0.44681549072265625, -0.4307098388671875, -0.41460418701171875, -0.39849853515625, -0.38239288330078125, -0.3662872314453125, -0.35018157958984375, -0.334075927734375, -0.31797027587890625, -0.3018646240234375, -0.28575897216796875, -0.2696533203125, -0.25354766845703125, -0.2374420166015625, -0.22133636474609375, -0.205230712890625, -0.18912506103515625, -0.1730194091796875, -0.15691375732421875, -0.14080810546875, -0.12470245361328125, -0.1085968017578125, -0.09249114990234375, -0.076385498046875, -0.06027984619140625, -0.0441741943359375, -0.02806854248046875, -0.011962890625, 0.00414276123046875, 0.0202484130859375, 0.03635406494140625, 0.052459716796875, 0.06856536865234375, 0.0846710205078125, 0.10077667236328125, 0.11688232421875, 0.13298797607421875, 0.1490936279296875, 0.16519927978515625, 0.181304931640625, 0.19741058349609375, 0.2135162353515625, 0.22962188720703125, 0.2457275390625, 0.26183319091796875, 0.2779388427734375, 0.29404449462890625, 0.310150146484375, 0.32625579833984375, 0.3423614501953125, 0.35846710205078125, 0.37457275390625, 0.39067840576171875, 0.4067840576171875, 0.42288970947265625, 0.438995361328125, 0.45510101318359375, 0.4712066650390625, 0.48731231689453125, 0.50341796875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0, 4.0, 5.0, 12.0, 7.0, 9.0, 13.0, 700.0, 115.0, 14.0, 18.0, 11.0, 9.0, 5.0, 7.0, 6.0, 6.0, 5.0, 2.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07440185546875, -0.07169723510742188, -0.06899261474609375, -0.06628799438476562, -0.0635833740234375, -0.060878753662109375, -0.05817413330078125, -0.055469512939453125, -0.052764892578125, -0.050060272216796875, -0.04735565185546875, -0.044651031494140625, -0.0419464111328125, -0.039241790771484375, -0.03653717041015625, -0.033832550048828125, -0.0311279296875, -0.028423309326171875, -0.02571868896484375, -0.023014068603515625, -0.0203094482421875, -0.017604827880859375, -0.01490020751953125, -0.012195587158203125, -0.009490966796875, -0.006786346435546875, -0.00408172607421875, -0.001377105712890625, 0.0013275146484375, 0.004032135009765625, 0.00673675537109375, 0.009441375732421875, 0.01214599609375, 0.014850616455078125, 0.01755523681640625, 0.020259857177734375, 0.0229644775390625, 0.025669097900390625, 0.02837371826171875, 0.031078338623046875, 0.033782958984375, 0.036487579345703125, 0.03919219970703125, 0.041896820068359375, 0.0446014404296875, 0.047306060791015625, 0.05001068115234375, 0.052715301513671875, 0.055419921875, 0.058124542236328125, 0.06082916259765625, 0.06353378295898438, 0.0662384033203125, 0.06894302368164062, 0.07164764404296875, 0.07435226440429688, 0.077056884765625, 0.07976150512695312, 0.08246612548828125, 0.08517074584960938, 0.0878753662109375, 0.09057998657226562, 0.09328460693359375, 0.09598922729492188, 0.09869384765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 16.0, 14.0, 22.0, 27.0, 49.0, 66.0, 82.0, 123.0, 202.0, 269.0, 459.0, 634.0, 1087.0, 1671.0, 2749.0, 4530.0, 7631.0, 13334.0, 24206.0, 47383.0, 135774.0, 602937.0, 110295.0, 42533.0, 21833.0, 12381.0, 7103.0, 4215.0, 2483.0, 1563.0, 984.0, 628.0, 409.0, 252.0, 173.0, 132.0, 74.0, 62.0, 38.0, 37.0, 19.0, 23.0, 7.0, 16.0, 7.0, 7.0, 3.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.32568359375, -0.3146171569824219, -0.30355072021484375, -0.2924842834472656, -0.2814178466796875, -0.2703514099121094, -0.25928497314453125, -0.24821853637695312, -0.237152099609375, -0.22608566284179688, -0.21501922607421875, -0.20395278930664062, -0.1928863525390625, -0.18181991577148438, -0.17075347900390625, -0.15968704223632812, -0.14862060546875, -0.13755416870117188, -0.12648773193359375, -0.11542129516601562, -0.1043548583984375, -0.09328842163085938, -0.08222198486328125, -0.07115554809570312, -0.060089111328125, -0.049022674560546875, -0.03795623779296875, -0.026889801025390625, -0.0158233642578125, -0.004756927490234375, 0.00630950927734375, 0.017375946044921875, 0.0284423828125, 0.039508819580078125, 0.05057525634765625, 0.061641693115234375, 0.0727081298828125, 0.08377456665039062, 0.09484100341796875, 0.10590744018554688, 0.116973876953125, 0.12804031372070312, 0.13910675048828125, 0.15017318725585938, 0.1612396240234375, 0.17230606079101562, 0.18337249755859375, 0.19443893432617188, 0.20550537109375, 0.21657180786132812, 0.22763824462890625, 0.23870468139648438, 0.2497711181640625, 0.2608375549316406, 0.27190399169921875, 0.2829704284667969, 0.294036865234375, 0.3051033020019531, 0.31616973876953125, 0.3272361755371094, 0.3383026123046875, 0.3493690490722656, 0.36043548583984375, 0.3715019226074219, 0.382568359375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 1.0, 9.0, 4.0, 9.0, 13.0, 10.0, 14.0, 21.0, 14.0, 21.0, 22.0, 24.0, 26.0, 33.0, 29.0, 39.0, 52.0, 30.0, 38.0, 35.0, 41.0, 40.0, 30.0, 36.0, 47.0, 35.0, 35.0, 25.0, 35.0, 28.0, 29.0, 29.0, 15.0, 25.0, 18.0, 21.0, 10.0, 9.0, 12.0, 8.0, 5.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.377685546875, -0.3667564392089844, -0.35582733154296875, -0.3448982238769531, -0.3339691162109375, -0.3230400085449219, -0.31211090087890625, -0.3011817932128906, -0.290252685546875, -0.2793235778808594, -0.26839447021484375, -0.2574653625488281, -0.2465362548828125, -0.23560714721679688, -0.22467803955078125, -0.21374893188476562, -0.20281982421875, -0.19189071655273438, -0.18096160888671875, -0.17003250122070312, -0.1591033935546875, -0.14817428588867188, -0.13724517822265625, -0.12631607055664062, -0.115386962890625, -0.10445785522460938, -0.09352874755859375, -0.08259963989257812, -0.0716705322265625, -0.060741424560546875, -0.04981231689453125, -0.038883209228515625, -0.0279541015625, -0.017024993896484375, -0.00609588623046875, 0.004833221435546875, 0.0157623291015625, 0.026691436767578125, 0.03762054443359375, 0.048549652099609375, 0.059478759765625, 0.07040786743164062, 0.08133697509765625, 0.09226608276367188, 0.1031951904296875, 0.11412429809570312, 0.12505340576171875, 0.13598251342773438, 0.14691162109375, 0.15784072875976562, 0.16876983642578125, 0.17969894409179688, 0.1906280517578125, 0.20155715942382812, 0.21248626708984375, 0.22341537475585938, 0.234344482421875, 0.24527359008789062, 0.25620269775390625, 0.2671318054199219, 0.2780609130859375, 0.2889900207519531, 0.29991912841796875, 0.3108482360839844, 0.32177734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 18.0, 24.0, 46.0, 94.0, 137.0, 418.0, 1956.0, 70982.0, 967608.0, 6070.0, 695.0, 246.0, 127.0, 59.0, 24.0, 14.0, 8.0, 9.0, 6.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032787322998046875, -0.003192901611328125, -0.0031070709228515625, -0.003021240234375, -0.0029354095458984375, -0.002849578857421875, -0.0027637481689453125, -0.00267791748046875, -0.0025920867919921875, -0.002506256103515625, -0.0024204254150390625, -0.0023345947265625, -0.0022487640380859375, -0.002162933349609375, -0.0020771026611328125, -0.00199127197265625, -0.0019054412841796875, -0.001819610595703125, -0.0017337799072265625, -0.00164794921875, -0.0015621185302734375, -0.001476287841796875, -0.0013904571533203125, -0.00130462646484375, -0.0012187957763671875, -0.001132965087890625, -0.0010471343994140625, -0.0009613037109375, -0.0008754730224609375, -0.000789642333984375, -0.0007038116455078125, -0.00061798095703125, -0.0005321502685546875, -0.000446319580078125, -0.0003604888916015625, -0.000274658203125, -0.0001888275146484375, -0.000102996826171875, -1.71661376953125e-05, 6.866455078125e-05, 0.0001544952392578125, 0.000240325927734375, 0.0003261566162109375, 0.0004119873046875, 0.0004978179931640625, 0.000583648681640625, 0.0006694793701171875, 0.00075531005859375, 0.0008411407470703125, 0.000926971435546875, 0.0010128021240234375, 0.0010986328125, 0.0011844635009765625, 0.001270294189453125, 0.0013561248779296875, 0.00144195556640625, 0.0015277862548828125, 0.001613616943359375, 0.0016994476318359375, 0.0017852783203125, 0.0018711090087890625, 0.001956939697265625, 0.0020427703857421875, 0.00212860107421875, 0.0022144317626953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 14.0, 12.0, 23.0, 26.0, 44.0, 76.0, 185.0, 274.0, 154.0, 73.0, 37.0, 31.0, 16.0, 9.0, 10.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006814002990722656, -0.0006631985306739807, -0.0006449967622756958, -0.0006267949938774109, -0.000608593225479126, -0.0005903914570808411, -0.0005721896886825562, -0.0005539879202842712, -0.0005357861518859863, -0.0005175843834877014, -0.0004993826150894165, -0.0004811808466911316, -0.0004629790782928467, -0.00044477730989456177, -0.00042657554149627686, -0.00040837377309799194, -0.00039017200469970703, -0.0003719702363014221, -0.0003537684679031372, -0.0003355666995048523, -0.0003173649311065674, -0.00029916316270828247, -0.00028096139430999756, -0.00026275962591171265, -0.00024455785751342773, -0.00022635608911514282, -0.0002081543207168579, -0.000189952552318573, -0.00017175078392028809, -0.00015354901552200317, -0.00013534724712371826, -0.00011714547872543335, -9.894371032714844e-05, -8.074194192886353e-05, -6.254017353057861e-05, -4.43384051322937e-05, -2.613663673400879e-05, -7.934868335723877e-06, 1.0266900062561035e-05, 2.8468668460845947e-05, 4.667043685913086e-05, 6.487220525741577e-05, 8.307397365570068e-05, 0.0001012757420539856, 0.00011947751045227051, 0.00013767927885055542, 0.00015588104724884033, 0.00017408281564712524, 0.00019228458404541016, 0.00021048635244369507, 0.00022868812084197998, 0.0002468898892402649, 0.0002650916576385498, 0.0002832934260368347, 0.00030149519443511963, 0.00031969696283340454, 0.00033789873123168945, 0.00035610049962997437, 0.0003743022680282593, 0.0003925040364265442, 0.0004107058048248291, 0.000428907573223114, 0.0004471093416213989, 0.00046531111001968384, 0.00048351287841796875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 9.0, 14.0, 11.0, 27.0, 24.0, 40.0, 58.0, 86.0, 99.0, 173.0, 258.0, 421.0, 655.0, 1067.0, 1795.0, 3222.0, 6617.0, 14964.0, 45895.0, 739457.0, 179243.0, 31226.0, 11254.0, 5193.0, 2687.0, 1518.0, 869.0, 549.0, 350.0, 235.0, 168.0, 107.0, 78.0, 56.0, 31.0, 33.0, 10.0, 14.0, 10.0, 4.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004382133483886719, -0.0004230216145515442, -0.0004078298807144165, -0.0003926381468772888, -0.00037744641304016113, -0.00036225467920303345, -0.00034706294536590576, -0.0003318712115287781, -0.0003166794776916504, -0.0003014877438545227, -0.000286296010017395, -0.00027110427618026733, -0.00025591254234313965, -0.00024072080850601196, -0.00022552907466888428, -0.0002103373408317566, -0.0001951456069946289, -0.00017995387315750122, -0.00016476213932037354, -0.00014957040548324585, -0.00013437867164611816, -0.00011918693780899048, -0.00010399520397186279, -8.880347013473511e-05, -7.361173629760742e-05, -5.8420002460479736e-05, -4.322826862335205e-05, -2.8036534786224365e-05, -1.284480094909668e-05, 2.346932888031006e-06, 1.753866672515869e-05, 3.273040056228638e-05, 4.792213439941406e-05, 6.311386823654175e-05, 7.830560207366943e-05, 9.349733591079712e-05, 0.0001086890697479248, 0.0001238808035850525, 0.00013907253742218018, 0.00015426427125930786, 0.00016945600509643555, 0.00018464773893356323, 0.00019983947277069092, 0.0002150312066078186, 0.0002302229404449463, 0.000245414674282074, 0.00026060640811920166, 0.00027579814195632935, 0.00029098987579345703, 0.0003061816096305847, 0.0003213733434677124, 0.0003365650773048401, 0.0003517568111419678, 0.00036694854497909546, 0.00038214027881622314, 0.00039733201265335083, 0.0004125237464904785, 0.0004277154803276062, 0.0004429072141647339, 0.00045809894800186157, 0.00047329068183898926, 0.0004884824156761169, 0.0005036741495132446, 0.0005188658833503723, 0.0005340576171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 5.0, 10.0, 5.0, 11.0, 19.0, 17.0, 36.0, 27.0, 43.0, 51.0, 68.0, 119.0, 189.0, 86.0, 68.0, 52.0, 41.0, 30.0, 21.0, 15.0, 23.0, 7.0, 8.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0005273818969726562, -0.0005123801529407501, -0.000497378408908844, -0.00048237666487693787, -0.00046737492084503174, -0.0004523731768131256, -0.0004373714327812195, -0.00042236968874931335, -0.0004073679447174072, -0.0003923662006855011, -0.00037736445665359497, -0.00036236271262168884, -0.0003473609685897827, -0.0003323592245578766, -0.00031735748052597046, -0.00030235573649406433, -0.0002873539924621582, -0.0002723522484302521, -0.00025735050439834595, -0.00024234876036643982, -0.0002273470163345337, -0.00021234527230262756, -0.00019734352827072144, -0.0001823417842388153, -0.00016734004020690918, -0.00015233829617500305, -0.00013733655214309692, -0.0001223348081111908, -0.00010733306407928467, -9.233132004737854e-05, -7.732957601547241e-05, -6.232783198356628e-05, -4.7326087951660156e-05, -3.232434391975403e-05, -1.73225998878479e-05, -2.3208558559417725e-06, 1.2680888175964355e-05, 2.7682632207870483e-05, 4.268437623977661e-05, 5.768612027168274e-05, 7.268786430358887e-05, 8.7689608335495e-05, 0.00010269135236740112, 0.00011769309639930725, 0.00013269484043121338, 0.0001476965844631195, 0.00016269832849502563, 0.00017770007252693176, 0.0001927018165588379, 0.00020770356059074402, 0.00022270530462265015, 0.00023770704865455627, 0.0002527087926864624, 0.00026771053671836853, 0.00028271228075027466, 0.0002977140247821808, 0.0003127157688140869, 0.00032771751284599304, 0.00034271925687789917, 0.0003577210009098053, 0.0003727227449417114, 0.00038772448897361755, 0.0004027262330055237, 0.0004177279770374298, 0.00043272972106933594]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 6.0, 4.0, 6.0, 2.0, 9.0, 8.0, 18.0, 26.0, 33.0, 49.0, 94.0, 414.0, 178.0, 61.0, 31.0, 22.0, 14.0, 11.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.104447364807129, -4.988015174865723, -4.871582508087158, -4.755150318145752, -4.638718128204346, -4.5222859382629395, -4.405853271484375, -4.289421081542969, -4.1729888916015625, -4.056556701660156, -3.940124273300171, -3.8236918449401855, -3.7072596549987793, -3.590827226638794, -3.4743950366973877, -3.3579626083374023, -3.241530418395996, -3.1250979900360107, -3.0086658000946045, -2.892233371734619, -2.775801181793213, -2.6593687534332275, -2.5429365634918213, -2.426504135131836, -2.3100717067718506, -2.1936392784118652, -2.077207088470459, -1.9607747793197632, -1.8443424701690674, -1.727910041809082, -1.6114778518676758, -1.4950454235076904, -1.3786132335662842, -1.2621809244155884, -1.1457486152648926, -1.0293163061141968, -0.912883996963501, -0.7964516282081604, -0.6800193190574646, -0.5635870099067688, -0.447154700756073, -0.3307223916053772, -0.2142900675535202, -0.09785774350166321, 0.018574565649032593, 0.13500690460205078, 0.2514392137527466, 0.3678715229034424, 0.4843038320541382, 0.600736141204834, 0.7171684503555298, 0.8336007595062256, 0.9500330686569214, 1.0664653778076172, 1.1828978061676025, 1.2993299961090088, 1.4157624244689941, 1.53219473361969, 1.6486270427703857, 1.7650593519210815, 1.8814916610717773, 1.9979240894317627, 2.114356279373169, 2.2307887077331543, 2.3472208976745605]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 5.0, 16.0, 14.0, 16.0, 18.0, 38.0, 75.0, 100.0, 153.0, 181.0, 135.0, 92.0, 56.0, 20.0, 20.0, 7.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.555797576904297, -8.305106163024902, -8.054415702819824, -7.80372428894043, -7.553033351898193, -7.302342414855957, -7.0516510009765625, -6.800960063934326, -6.55026912689209, -6.2995781898498535, -6.048886775970459, -5.798195838928223, -5.547504901885986, -5.29681396484375, -5.0461225509643555, -4.795431613922119, -4.544740200042725, -4.294049263000488, -4.043357849121094, -3.7926669120788574, -3.541975975036621, -3.2912847995758057, -3.0405936241149902, -2.789902687072754, -2.5392115116119385, -2.288520336151123, -2.0378293991088867, -1.7871382236480713, -1.5364471673965454, -1.2857561111450195, -1.035064935684204, -0.7843738794326782, -0.5336823463439941, -0.2829912602901459, -0.03230017423629761, 0.21839094161987305, 0.4690819978713989, 0.7197730541229248, 0.9704642295837402, 1.2211552858352661, 1.471846342086792, 1.7225373983383179, 1.9732284545898438, 2.223919630050659, 2.4746108055114746, 2.725301742553711, 2.9759929180145264, 3.226684093475342, 3.477375030517578, 3.7280662059783936, 3.97875714302063, 4.229448318481445, 4.480139255523682, 4.730830192565918, 4.9815216064453125, 5.232212543487549, 5.482903480529785, 5.7335944175720215, 5.984285831451416, 6.234976768493652, 6.485667705535889, 6.736358642578125, 6.9870500564575195, 7.237740993499756, 7.48843240737915]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 3.0, 8.0, 10.0, 13.0, 21.0, 35.0, 67.0, 134.0, 321.0, 744.0, 2063.0, 5571.0, 29780.0, 4129031.0, 15669.0, 6076.0, 2561.0, 1016.0, 537.0, 232.0, 127.0, 72.0, 45.0, 38.0, 19.0, 10.0, 13.0, 5.0, 12.0, 9.0, 5.0, 1.0, 3.0, 4.0, 4.0, 6.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-7.1953125, -6.9405517578125, -6.685791015625, -6.4310302734375, -6.17626953125, -5.9215087890625, -5.666748046875, -5.4119873046875, -5.1572265625, -4.9024658203125, -4.647705078125, -4.3929443359375, -4.13818359375, -3.8834228515625, -3.628662109375, -3.3739013671875, -3.119140625, -2.8643798828125, -2.609619140625, -2.3548583984375, -2.10009765625, -1.8453369140625, -1.590576171875, -1.3358154296875, -1.0810546875, -0.8262939453125, -0.571533203125, -0.3167724609375, -0.06201171875, 0.1927490234375, 0.447509765625, 0.7022705078125, 0.95703125, 1.2117919921875, 1.466552734375, 1.7213134765625, 1.97607421875, 2.2308349609375, 2.485595703125, 2.7403564453125, 2.9951171875, 3.2498779296875, 3.504638671875, 3.7593994140625, 4.01416015625, 4.2689208984375, 4.523681640625, 4.7784423828125, 5.033203125, 5.2879638671875, 5.542724609375, 5.7974853515625, 6.05224609375, 6.3070068359375, 6.561767578125, 6.8165283203125, 7.0712890625, 7.3260498046875, 7.580810546875, 7.8355712890625, 8.09033203125, 8.3450927734375, 8.599853515625, 8.8546142578125, 9.109375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 3.0, 5.0, 9.0, 6.0, 7.0, 12.0, 35.0, 743.0, 41.0, 14.0, 11.0, 10.0, 10.0, 7.0, 10.0, 3.0, 3.0, 5.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 7.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.061309814453125, -0.05913972854614258, -0.056969642639160156, -0.054799556732177734, -0.05262947082519531, -0.05045938491821289, -0.04828929901123047, -0.04611921310424805, -0.043949127197265625, -0.0417790412902832, -0.03960895538330078, -0.03743886947631836, -0.03526878356933594, -0.033098697662353516, -0.030928611755371094, -0.028758525848388672, -0.02658843994140625, -0.024418354034423828, -0.022248268127441406, -0.020078182220458984, -0.017908096313476562, -0.01573801040649414, -0.013567924499511719, -0.011397838592529297, -0.009227752685546875, -0.007057666778564453, -0.004887580871582031, -0.0027174949645996094, -0.0005474090576171875, 0.0016226768493652344, 0.0037927627563476562, 0.005962848663330078, 0.0081329345703125, 0.010303020477294922, 0.012473106384277344, 0.014643192291259766, 0.016813278198242188, 0.01898336410522461, 0.02115345001220703, 0.023323535919189453, 0.025493621826171875, 0.027663707733154297, 0.02983379364013672, 0.03200387954711914, 0.03417396545410156, 0.036344051361083984, 0.038514137268066406, 0.04068422317504883, 0.04285430908203125, 0.04502439498901367, 0.047194480895996094, 0.049364566802978516, 0.05153465270996094, 0.05370473861694336, 0.05587482452392578, 0.0580449104309082, 0.060214996337890625, 0.06238508224487305, 0.06455516815185547, 0.06672525405883789, 0.06889533996582031, 0.07106542587280273, 0.07323551177978516, 0.07540559768676758, 0.07757568359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 15.0, 15.0, 29.0, 34.0, 53.0, 103.0, 126.0, 227.0, 418.0, 805.0, 1400.0, 2772.0, 5711.0, 13052.0, 36308.0, 3877999.0, 197351.0, 33839.0, 12465.0, 5576.0, 2746.0, 1394.0, 741.0, 431.0, 260.0, 140.0, 99.0, 47.0, 33.0, 24.0, 19.0, 10.0, 6.0, 6.0, 7.0, 0.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.40234375, -1.3654098510742188, -1.3284759521484375, -1.2915420532226562, -1.254608154296875, -1.2176742553710938, -1.1807403564453125, -1.1438064575195312, -1.10687255859375, -1.0699386596679688, -1.0330047607421875, -0.9960708618164062, -0.959136962890625, -0.9222030639648438, -0.8852691650390625, -0.8483352661132812, -0.8114013671875, -0.7744674682617188, -0.7375335693359375, -0.7005996704101562, -0.663665771484375, -0.6267318725585938, -0.5897979736328125, -0.5528640747070312, -0.51593017578125, -0.47899627685546875, -0.4420623779296875, -0.40512847900390625, -0.368194580078125, -0.33126068115234375, -0.2943267822265625, -0.25739288330078125, -0.220458984375, -0.18352508544921875, -0.1465911865234375, -0.10965728759765625, -0.072723388671875, -0.03578948974609375, 0.0011444091796875, 0.03807830810546875, 0.07501220703125, 0.11194610595703125, 0.1488800048828125, 0.18581390380859375, 0.222747802734375, 0.25968170166015625, 0.2966156005859375, 0.33354949951171875, 0.3704833984375, 0.40741729736328125, 0.4443511962890625, 0.48128509521484375, 0.518218994140625, 0.5551528930664062, 0.5920867919921875, 0.6290206909179688, 0.66595458984375, 0.7028884887695312, 0.7398223876953125, 0.7767562866210938, 0.813690185546875, 0.8506240844726562, 0.8875579833984375, 0.9244918823242188, 0.96142578125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 9.0, 7.0, 9.0, 17.0, 20.0, 19.0, 17.0, 14.0, 29.0, 26.0, 23.0, 21.0, 44.0, 3561.0, 28.0, 20.0, 28.0, 15.0, 26.0, 17.0, 15.0, 17.0, 15.0, 12.0, 7.0, 10.0, 6.0, 6.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1300048828125, -0.12502098083496094, -0.12003707885742188, -0.11505317687988281, -0.11006927490234375, -0.10508537292480469, -0.10010147094726562, -0.09511756896972656, -0.0901336669921875, -0.08514976501464844, -0.08016586303710938, -0.07518196105957031, -0.07019805908203125, -0.06521415710449219, -0.060230255126953125, -0.05524635314941406, -0.050262451171875, -0.04527854919433594, -0.040294647216796875, -0.03531074523925781, -0.03032684326171875, -0.025342941284179688, -0.020359039306640625, -0.015375137329101562, -0.0103912353515625, -0.0054073333740234375, -0.000423431396484375, 0.0045604705810546875, 0.00954437255859375, 0.014528274536132812, 0.019512176513671875, 0.024496078491210938, 0.02947998046875, 0.03446388244628906, 0.039447784423828125, 0.04443168640136719, 0.04941558837890625, 0.05439949035644531, 0.059383392333984375, 0.06436729431152344, 0.0693511962890625, 0.07433509826660156, 0.07931900024414062, 0.08430290222167969, 0.08928680419921875, 0.09427070617675781, 0.09925460815429688, 0.10423851013183594, 0.109222412109375, 0.11420631408691406, 0.11919021606445312, 0.12417411804199219, 0.12915802001953125, 0.1341419219970703, 0.13912582397460938, 0.14410972595214844, 0.1490936279296875, 0.15407752990722656, 0.15906143188476562, 0.1640453338623047, 0.16902923583984375, 0.1740131378173828, 0.17899703979492188, 0.18398094177246094, 0.18896484375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 6.0, 10.0, 37.0, 236.0, 578.0, 87.0, 26.0, 17.0, 9.0, 4.0, 0.0, 2.0], "bins": [-2.3651981353759766, -2.323052167892456, -2.2809059619903564, -2.238759994506836, -2.1966140270233154, -2.154467821121216, -2.1123218536376953, -2.070175886154175, -2.028029680252075, -1.9858835935592651, -1.9437376260757446, -1.9015915393829346, -1.8594454526901245, -1.8172993659973145, -1.775153398513794, -1.7330073118209839, -1.6908613443374634, -1.6487152576446533, -1.6065692901611328, -1.5644232034683228, -1.5222771167755127, -1.4801311492919922, -1.4379850625991821, -1.395838975906372, -1.3536930084228516, -1.3115469217300415, -1.269400954246521, -1.227254867553711, -1.1851087808609009, -1.1429626941680908, -1.1008167266845703, -1.0586706399917603, -1.0165245532989502, -0.9743785262107849, -0.9322324395179749, -0.8900864124298096, -0.8479403257369995, -0.8057942986488342, -0.763648271560669, -0.7215021848678589, -0.6793560981750488, -0.6372100710868835, -0.5950639843940735, -0.5529179573059082, -0.5107718706130981, -0.46862584352493286, -0.4264798164367676, -0.3843337595462799, -0.34218770265579224, -0.30004164576530457, -0.2578955888748169, -0.2157495617866516, -0.17360350489616394, -0.13145744800567627, -0.08931142091751099, -0.047165364027023315, -0.0050193071365356445, 0.03712674230337143, 0.0792727917432785, 0.12141883373260498, 0.16356489062309265, 0.20571094751358032, 0.2478569746017456, 0.2900030314922333, 0.33214908838272095]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 5.0, 7.0, 9.0, 13.0, 13.0, 17.0, 29.0, 37.0, 70.0, 106.0, 87.0, 117.0, 104.0, 116.0, 72.0, 51.0, 41.0, 18.0, 17.0, 12.0, 4.0, 5.0, 6.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8739718794822693, -0.8499200940132141, -0.8258683085441589, -0.8018165826797485, -0.7777647972106934, -0.7537130117416382, -0.729661226272583, -0.7056094408035278, -0.6815576553344727, -0.6575058698654175, -0.6334540843963623, -0.6094022989273071, -0.5853505730628967, -0.5612987875938416, -0.5372470021247864, -0.5131952166557312, -0.4891434907913208, -0.4650917053222656, -0.44103994965553284, -0.41698816418647766, -0.3929364085197449, -0.3688846230506897, -0.3448328375816345, -0.32078105211257935, -0.29672929644584656, -0.2726775109767914, -0.2486257553100586, -0.22457396984100342, -0.20052219927310944, -0.17647042870521545, -0.15241864323616028, -0.1283668726682663, -0.10431504249572754, -0.08026327192783356, -0.05621149390935898, -0.0321597158908844, -0.008107945322990417, 0.015943825244903564, 0.03999561071395874, 0.06404738128185272, 0.0880991518497467, 0.11215092241764069, 0.13620269298553467, 0.16025447845458984, 0.18430624902248383, 0.2083580195903778, 0.23240980505943298, 0.25646156072616577, 0.28051334619522095, 0.3045651316642761, 0.3286168873310089, 0.3526686728000641, 0.3767204284667969, 0.40077221393585205, 0.4248239994049072, 0.4488757848739624, 0.4729275405406952, 0.49697932600975037, 0.5210310816764832, 0.5450828671455383, 0.5691346526145935, 0.5931863784790039, 0.6172381639480591, 0.6412899494171143, 0.6653417348861694]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 9.0, 9.0, 9.0, 22.0, 32.0, 45.0, 61.0, 93.0, 143.0, 235.0, 315.0, 470.0, 778.0, 1136.0, 1751.0, 2660.0, 4041.0, 6794.0, 12319.0, 32333.0, 879173.0, 68551.0, 15626.0, 8082.0, 4779.0, 3068.0, 1969.0, 1343.0, 909.0, 575.0, 394.0, 271.0, 173.0, 109.0, 81.0, 59.0, 37.0, 28.0, 25.0, 14.0, 10.0, 7.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.373046875, -0.35955810546875, -0.3460693359375, -0.33258056640625, -0.319091796875, -0.30560302734375, -0.2921142578125, -0.27862548828125, -0.26513671875, -0.25164794921875, -0.2381591796875, -0.22467041015625, -0.211181640625, -0.19769287109375, -0.1842041015625, -0.17071533203125, -0.1572265625, -0.14373779296875, -0.1302490234375, -0.11676025390625, -0.103271484375, -0.08978271484375, -0.0762939453125, -0.06280517578125, -0.04931640625, -0.03582763671875, -0.0223388671875, -0.00885009765625, 0.004638671875, 0.01812744140625, 0.0316162109375, 0.04510498046875, 0.05859375, 0.07208251953125, 0.0855712890625, 0.09906005859375, 0.112548828125, 0.12603759765625, 0.1395263671875, 0.15301513671875, 0.16650390625, 0.17999267578125, 0.1934814453125, 0.20697021484375, 0.220458984375, 0.23394775390625, 0.2474365234375, 0.26092529296875, 0.2744140625, 0.28790283203125, 0.3013916015625, 0.31488037109375, 0.328369140625, 0.34185791015625, 0.3553466796875, 0.36883544921875, 0.38232421875, 0.39581298828125, 0.4093017578125, 0.42279052734375, 0.436279296875, 0.44976806640625, 0.4632568359375, 0.47674560546875, 0.490234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 3.0, 4.0, 11.0, 3.0, 6.0, 10.0, 12.0, 107.0, 514.0, 175.0, 30.0, 12.0, 16.0, 5.0, 8.0, 5.0, 9.0, 2.0, 3.0, 5.0, 7.0, 3.0, 7.0, 6.0, 2.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048614501953125, -0.04676389694213867, -0.044913291931152344, -0.043062686920166016, -0.04121208190917969, -0.03936147689819336, -0.03751087188720703, -0.0356602668762207, -0.033809661865234375, -0.03195905685424805, -0.03010845184326172, -0.02825784683227539, -0.026407241821289062, -0.024556636810302734, -0.022706031799316406, -0.020855426788330078, -0.01900482177734375, -0.017154216766357422, -0.015303611755371094, -0.013453006744384766, -0.011602401733398438, -0.00975179672241211, -0.007901191711425781, -0.006050586700439453, -0.004199981689453125, -0.002349376678466797, -0.0004987716674804688, 0.0013518333435058594, 0.0032024383544921875, 0.005053043365478516, 0.006903648376464844, 0.008754253387451172, 0.0106048583984375, 0.012455463409423828, 0.014306068420410156, 0.016156673431396484, 0.018007278442382812, 0.01985788345336914, 0.02170848846435547, 0.023559093475341797, 0.025409698486328125, 0.027260303497314453, 0.02911090850830078, 0.03096151351928711, 0.03281211853027344, 0.034662723541259766, 0.036513328552246094, 0.03836393356323242, 0.04021453857421875, 0.04206514358520508, 0.043915748596191406, 0.045766353607177734, 0.04761695861816406, 0.04946756362915039, 0.05131816864013672, 0.05316877365112305, 0.055019378662109375, 0.0568699836730957, 0.05872058868408203, 0.06057119369506836, 0.06242179870605469, 0.06427240371704102, 0.06612300872802734, 0.06797361373901367, 0.06982421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 6.0, 7.0, 17.0, 21.0, 17.0, 27.0, 34.0, 40.0, 50.0, 68.0, 110.0, 211.0, 389.0, 871.0, 2474.0, 8966.0, 49075.0, 819639.0, 141846.0, 17947.0, 4178.0, 1255.0, 553.0, 249.0, 163.0, 87.0, 72.0, 41.0, 28.0, 23.0, 16.0, 13.0, 10.0, 10.0, 9.0, 2.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.70361328125, -0.6827392578125, -0.661865234375, -0.6409912109375, -0.6201171875, -0.5992431640625, -0.578369140625, -0.5574951171875, -0.53662109375, -0.5157470703125, -0.494873046875, -0.4739990234375, -0.453125, -0.4322509765625, -0.411376953125, -0.3905029296875, -0.36962890625, -0.3487548828125, -0.327880859375, -0.3070068359375, -0.2861328125, -0.2652587890625, -0.244384765625, -0.2235107421875, -0.20263671875, -0.1817626953125, -0.160888671875, -0.1400146484375, -0.119140625, -0.0982666015625, -0.077392578125, -0.0565185546875, -0.03564453125, -0.0147705078125, 0.006103515625, 0.0269775390625, 0.0478515625, 0.0687255859375, 0.089599609375, 0.1104736328125, 0.13134765625, 0.1522216796875, 0.173095703125, 0.1939697265625, 0.21484375, 0.2357177734375, 0.256591796875, 0.2774658203125, 0.29833984375, 0.3192138671875, 0.340087890625, 0.3609619140625, 0.3818359375, 0.4027099609375, 0.423583984375, 0.4444580078125, 0.46533203125, 0.4862060546875, 0.507080078125, 0.5279541015625, 0.548828125, 0.5697021484375, 0.590576171875, 0.6114501953125, 0.63232421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 9.0, 11.0, 6.0, 13.0, 18.0, 20.0, 19.0, 26.0, 22.0, 35.0, 31.0, 27.0, 41.0, 38.0, 35.0, 48.0, 49.0, 59.0, 46.0, 36.0, 45.0, 45.0, 37.0, 39.0, 25.0, 26.0, 21.0, 30.0, 27.0, 22.0, 15.0, 15.0, 18.0, 7.0, 5.0, 7.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18896484375, -0.18268775939941406, -0.17641067504882812, -0.1701335906982422, -0.16385650634765625, -0.1575794219970703, -0.15130233764648438, -0.14502525329589844, -0.1387481689453125, -0.13247108459472656, -0.12619400024414062, -0.11991691589355469, -0.11363983154296875, -0.10736274719238281, -0.10108566284179688, -0.09480857849121094, -0.088531494140625, -0.08225440979003906, -0.07597732543945312, -0.06970024108886719, -0.06342315673828125, -0.05714607238769531, -0.050868988037109375, -0.04459190368652344, -0.0383148193359375, -0.03203773498535156, -0.025760650634765625, -0.019483566284179688, -0.01320648193359375, -0.0069293975830078125, -0.000652313232421875, 0.0056247711181640625, 0.01190185546875, 0.018178939819335938, 0.024456024169921875, 0.030733108520507812, 0.03701019287109375, 0.04328727722167969, 0.049564361572265625, 0.05584144592285156, 0.0621185302734375, 0.06839561462402344, 0.07467269897460938, 0.08094978332519531, 0.08722686767578125, 0.09350395202636719, 0.09978103637695312, 0.10605812072753906, 0.112335205078125, 0.11861228942871094, 0.12488937377929688, 0.1311664581298828, 0.13744354248046875, 0.1437206268310547, 0.14999771118164062, 0.15627479553222656, 0.1625518798828125, 0.16882896423339844, 0.17510604858398438, 0.1813831329345703, 0.18766021728515625, 0.1939373016357422, 0.20021438598632812, 0.20649147033691406, 0.2127685546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 4.0, 5.0, 19.0, 22.0, 17.0, 37.0, 60.0, 269.0, 1793.0, 919620.0, 124843.0, 1434.0, 234.0, 74.0, 33.0, 24.0, 16.0, 18.0, 10.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0242462158203125, -0.023552417755126953, -0.022858619689941406, -0.02216482162475586, -0.021471023559570312, -0.020777225494384766, -0.02008342742919922, -0.019389629364013672, -0.018695831298828125, -0.018002033233642578, -0.01730823516845703, -0.016614437103271484, -0.015920639038085938, -0.01522684097290039, -0.014533042907714844, -0.013839244842529297, -0.01314544677734375, -0.012451648712158203, -0.011757850646972656, -0.01106405258178711, -0.010370254516601562, -0.009676456451416016, -0.008982658386230469, -0.008288860321044922, -0.007595062255859375, -0.006901264190673828, -0.006207466125488281, -0.005513668060302734, -0.0048198699951171875, -0.004126071929931641, -0.0034322738647460938, -0.002738475799560547, -0.002044677734375, -0.0013508796691894531, -0.0006570816040039062, 3.6716461181640625e-05, 0.0007305145263671875, 0.0014243125915527344, 0.0021181106567382812, 0.002811908721923828, 0.003505706787109375, 0.004199504852294922, 0.004893302917480469, 0.005587100982666016, 0.0062808990478515625, 0.006974697113037109, 0.007668495178222656, 0.008362293243408203, 0.00905609130859375, 0.009749889373779297, 0.010443687438964844, 0.01113748550415039, 0.011831283569335938, 0.012525081634521484, 0.013218879699707031, 0.013912677764892578, 0.014606475830078125, 0.015300273895263672, 0.01599407196044922, 0.016687870025634766, 0.017381668090820312, 0.01807546615600586, 0.018769264221191406, 0.019463062286376953, 0.0201568603515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 0.0, 3.0, 4.0, 8.0, 5.0, 5.0, 8.0, 22.0, 18.0, 31.0, 30.0, 52.0, 60.0, 160.0, 256.0, 112.0, 52.0, 48.0, 33.0, 29.0, 17.0, 13.0, 9.0, 8.0, 2.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.41157341003418e-05, -9.054038673639297e-05, -8.696503937244415e-05, -8.338969200849533e-05, -7.981434464454651e-05, -7.623899728059769e-05, -7.266364991664886e-05, -6.908830255270004e-05, -6.551295518875122e-05, -6.19376078248024e-05, -5.836226046085358e-05, -5.4786913096904755e-05, -5.121156573295593e-05, -4.763621836900711e-05, -4.406087100505829e-05, -4.0485523641109467e-05, -3.6910176277160645e-05, -3.333482891321182e-05, -2.9759481549263e-05, -2.618413418531418e-05, -2.2608786821365356e-05, -1.9033439457416534e-05, -1.5458092093467712e-05, -1.188274472951889e-05, -8.307397365570068e-06, -4.732050001621246e-06, -1.1567026376724243e-06, 2.4186447262763977e-06, 5.99399209022522e-06, 9.569339454174042e-06, 1.3144686818122864e-05, 1.6720034182071686e-05, 2.0295381546020508e-05, 2.387072890996933e-05, 2.7446076273918152e-05, 3.1021423637866974e-05, 3.4596771001815796e-05, 3.817211836576462e-05, 4.174746572971344e-05, 4.532281309366226e-05, 4.8898160457611084e-05, 5.2473507821559906e-05, 5.604885518550873e-05, 5.962420254945755e-05, 6.319954991340637e-05, 6.67748972773552e-05, 7.035024464130402e-05, 7.392559200525284e-05, 7.750093936920166e-05, 8.107628673315048e-05, 8.46516340970993e-05, 8.822698146104813e-05, 9.180232882499695e-05, 9.537767618894577e-05, 9.895302355289459e-05, 0.00010252837091684341, 0.00010610371828079224, 0.00010967906564474106, 0.00011325441300868988, 0.0001168297603726387, 0.00012040510773658752, 0.00012398045510053635, 0.00012755580246448517, 0.000131131149828434, 0.0001347064971923828]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 8.0, 10.0, 24.0, 37.0, 61.0, 143.0, 309.0, 708.0, 2049.0, 12011.0, 1019944.0, 9935.0, 1957.0, 708.0, 310.0, 147.0, 58.0, 35.0, 25.0, 21.0, 6.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0235443115234375, -0.022861242294311523, -0.022178173065185547, -0.02149510383605957, -0.020812034606933594, -0.020128965377807617, -0.01944589614868164, -0.018762826919555664, -0.018079757690429688, -0.01739668846130371, -0.016713619232177734, -0.016030550003051758, -0.015347480773925781, -0.014664411544799805, -0.013981342315673828, -0.013298273086547852, -0.012615203857421875, -0.011932134628295898, -0.011249065399169922, -0.010565996170043945, -0.009882926940917969, -0.009199857711791992, -0.008516788482666016, -0.007833719253540039, -0.0071506500244140625, -0.006467580795288086, -0.005784511566162109, -0.005101442337036133, -0.004418373107910156, -0.0037353038787841797, -0.003052234649658203, -0.0023691654205322266, -0.00168609619140625, -0.0010030269622802734, -0.0003199577331542969, 0.0003631114959716797, 0.0010461807250976562, 0.0017292499542236328, 0.0024123191833496094, 0.003095388412475586, 0.0037784576416015625, 0.004461526870727539, 0.005144596099853516, 0.005827665328979492, 0.006510734558105469, 0.007193803787231445, 0.007876873016357422, 0.008559942245483398, 0.009243011474609375, 0.009926080703735352, 0.010609149932861328, 0.011292219161987305, 0.011975288391113281, 0.012658357620239258, 0.013341426849365234, 0.014024496078491211, 0.014707565307617188, 0.015390634536743164, 0.01607370376586914, 0.016756772994995117, 0.017439842224121094, 0.01812291145324707, 0.018805980682373047, 0.019489049911499023, 0.020172119140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 23.0, 22.0, 45.0, 154.0, 462.0, 166.0, 54.0, 27.0, 11.0, 4.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00649261474609375, -0.006272792816162109, -0.006052970886230469, -0.005833148956298828, -0.0056133270263671875, -0.005393505096435547, -0.005173683166503906, -0.004953861236572266, -0.004734039306640625, -0.004514217376708984, -0.004294395446777344, -0.004074573516845703, -0.0038547515869140625, -0.003634929656982422, -0.0034151077270507812, -0.0031952857971191406, -0.0029754638671875, -0.0027556419372558594, -0.0025358200073242188, -0.002315998077392578, -0.0020961761474609375, -0.0018763542175292969, -0.0016565322875976562, -0.0014367103576660156, -0.001216888427734375, -0.0009970664978027344, -0.0007772445678710938, -0.0005574226379394531, -0.0003376007080078125, -0.00011777877807617188, 0.00010204315185546875, 0.0003218650817871094, 0.00054168701171875, 0.0007615089416503906, 0.0009813308715820312, 0.0012011528015136719, 0.0014209747314453125, 0.0016407966613769531, 0.0018606185913085938, 0.0020804405212402344, 0.002300262451171875, 0.0025200843811035156, 0.0027399063110351562, 0.002959728240966797, 0.0031795501708984375, 0.003399372100830078, 0.0036191940307617188, 0.0038390159606933594, 0.004058837890625, 0.004278659820556641, 0.004498481750488281, 0.004718303680419922, 0.0049381256103515625, 0.005157947540283203, 0.005377769470214844, 0.005597591400146484, 0.005817413330078125, 0.006037235260009766, 0.006257057189941406, 0.006476879119873047, 0.0066967010498046875, 0.006916522979736328, 0.007136344909667969, 0.007356166839599609, 0.00757598876953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 32.0, 922.0, 57.0, 6.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.794506072998047, -26.329580307006836, -25.864656448364258, -25.399730682373047, -24.934804916381836, -24.469879150390625, -24.004955291748047, -23.540029525756836, -23.075103759765625, -22.610177993774414, -22.145254135131836, -21.680328369140625, -21.215402603149414, -20.750476837158203, -20.285552978515625, -19.820627212524414, -19.355703353881836, -18.890777587890625, -18.425853729248047, -17.960927963256836, -17.496002197265625, -17.031078338623047, -16.566152572631836, -16.101226806640625, -15.636301040649414, -15.17137622833252, -14.706450462341309, -14.241525650024414, -13.776599884033203, -13.311675071716309, -12.846750259399414, -12.381824493408203, -11.916900634765625, -11.45197582244873, -10.98705005645752, -10.522125244140625, -10.057199478149414, -9.59227466583252, -9.127349853515625, -8.662424087524414, -8.197498321533203, -7.73257303237915, -7.267647743225098, -6.802722930908203, -6.33779764175415, -5.872872352600098, -5.407947063446045, -4.943021774291992, -4.478096961975098, -4.013171672821045, -3.5482466220855713, -3.0833213329315186, -2.618396282196045, -2.153470993041992, -1.6885457038879395, -1.2236206531524658, -0.7586953639984131, -0.2937701642513275, 0.17115503549575806, 0.636080265045166, 1.1010054349899292, 1.5659306049346924, 2.030855894088745, 2.4957809448242188, 2.9607062339782715]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 3.0, 4.0, 8.0, 3.0, 7.0, 14.0, 18.0, 24.0, 28.0, 56.0, 59.0, 68.0, 80.0, 90.0, 102.0, 85.0, 68.0, 62.0, 51.0, 43.0, 25.0, 28.0, 11.0, 12.0, 9.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.3362526893615723, -2.2663745880126953, -2.1964962482452393, -2.1266181468963623, -2.0567398071289062, -1.9868617057800293, -1.9169836044311523, -1.8471053838729858, -1.7772271633148193, -1.7073489427566528, -1.6374707221984863, -1.5675926208496094, -1.4977144002914429, -1.4278361797332764, -1.3579580783843994, -1.288079857826233, -1.2182016372680664, -1.1483234167099, -1.0784451961517334, -1.0085670948028564, -0.9386888742446899, -0.8688106536865234, -0.7989324927330017, -0.72905433177948, -0.6591761112213135, -0.589297890663147, -0.5194197297096252, -0.44954153895378113, -0.379663348197937, -0.3097851574420929, -0.23990696668624878, -0.17002877593040466, -0.10015058517456055, -0.03027239441871643, 0.039605796337127686, 0.1094839870929718, 0.17936217784881592, 0.24924036860466003, 0.31911855936050415, 0.38899675011634827, 0.4588749408721924, 0.5287531614303589, 0.5986313223838806, 0.6685094833374023, 0.7383877038955688, 0.8082659244537354, 0.8781440854072571, 0.9480222463607788, 1.0179004669189453, 1.0877786874771118, 1.1576569080352783, 1.2275350093841553, 1.2974132299423218, 1.3672914505004883, 1.4371695518493652, 1.5070477724075317, 1.5769259929656982, 1.6468042135238647, 1.7166824340820312, 1.7865605354309082, 1.8564387559890747, 1.9263169765472412, 1.9961950778961182, 2.066073417663574, 2.135951519012451]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 5.0, 13.0, 49.0, 174.0, 735.0, 2850.0, 11600.0, 3987534.0, 166485.0, 17533.0, 5133.0, 1461.0, 436.0, 122.0, 49.0, 15.0, 10.0, 8.0, 7.0, 4.0, 4.0, 4.0, 4.0, 5.0, 2.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9814453125, -1.9079742431640625, -1.834503173828125, -1.7610321044921875, -1.68756103515625, -1.6140899658203125, -1.540618896484375, -1.4671478271484375, -1.3936767578125, -1.3202056884765625, -1.246734619140625, -1.1732635498046875, -1.09979248046875, -1.0263214111328125, -0.952850341796875, -0.8793792724609375, -0.805908203125, -0.7324371337890625, -0.658966064453125, -0.5854949951171875, -0.51202392578125, -0.4385528564453125, -0.365081787109375, -0.2916107177734375, -0.2181396484375, -0.1446685791015625, -0.071197509765625, 0.0022735595703125, 0.07574462890625, 0.1492156982421875, 0.222686767578125, 0.2961578369140625, 0.36962890625, 0.4430999755859375, 0.516571044921875, 0.5900421142578125, 0.66351318359375, 0.7369842529296875, 0.810455322265625, 0.8839263916015625, 0.9573974609375, 1.0308685302734375, 1.104339599609375, 1.1778106689453125, 1.25128173828125, 1.3247528076171875, 1.398223876953125, 1.4716949462890625, 1.545166015625, 1.6186370849609375, 1.692108154296875, 1.7655792236328125, 1.83905029296875, 1.9125213623046875, 1.985992431640625, 2.0594635009765625, 2.1329345703125, 2.2064056396484375, 2.279876708984375, 2.3533477783203125, 2.42681884765625, 2.5002899169921875, 2.573760986328125, 2.6472320556640625, 2.720703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 4.0, 7.0, 6.0, 13.0, 7.0, 41.0, 235.0, 369.0, 151.0, 33.0, 20.0, 7.0, 11.0, 6.0, 7.0, 3.0, 5.0, 7.0, 7.0, 4.0, 4.0, 4.0, 4.0, 5.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043914794921875, -0.04228544235229492, -0.040656089782714844, -0.039026737213134766, -0.03739738464355469, -0.03576803207397461, -0.03413867950439453, -0.03250932693481445, -0.030879974365234375, -0.029250621795654297, -0.02762126922607422, -0.02599191665649414, -0.024362564086914062, -0.022733211517333984, -0.021103858947753906, -0.019474506378173828, -0.01784515380859375, -0.016215801239013672, -0.014586448669433594, -0.012957096099853516, -0.011327743530273438, -0.00969839096069336, -0.008069038391113281, -0.006439685821533203, -0.004810333251953125, -0.003180980682373047, -0.0015516281127929688, 7.772445678710938e-05, 0.0017070770263671875, 0.0033364295959472656, 0.004965782165527344, 0.006595134735107422, 0.0082244873046875, 0.009853839874267578, 0.011483192443847656, 0.013112545013427734, 0.014741897583007812, 0.01637125015258789, 0.01800060272216797, 0.019629955291748047, 0.021259307861328125, 0.022888660430908203, 0.02451801300048828, 0.02614736557006836, 0.027776718139648438, 0.029406070709228516, 0.031035423278808594, 0.03266477584838867, 0.03429412841796875, 0.03592348098754883, 0.037552833557128906, 0.039182186126708984, 0.04081153869628906, 0.04244089126586914, 0.04407024383544922, 0.0456995964050293, 0.047328948974609375, 0.04895830154418945, 0.05058765411376953, 0.05221700668334961, 0.05384635925292969, 0.055475711822509766, 0.057105064392089844, 0.05873441696166992, 0.06036376953125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 16.0, 14.0, 24.0, 26.0, 42.0, 42.0, 77.0, 118.0, 228.0, 606.0, 3125.0, 65248.0, 4110409.0, 12099.0, 1362.0, 383.0, 156.0, 86.0, 59.0, 50.0, 26.0, 22.0, 20.0, 13.0, 14.0, 4.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.646484375, -2.5838775634765625, -2.521270751953125, -2.4586639404296875, -2.39605712890625, -2.3334503173828125, -2.270843505859375, -2.2082366943359375, -2.1456298828125, -2.0830230712890625, -2.020416259765625, -1.9578094482421875, -1.89520263671875, -1.8325958251953125, -1.769989013671875, -1.7073822021484375, -1.644775390625, -1.5821685791015625, -1.519561767578125, -1.4569549560546875, -1.39434814453125, -1.3317413330078125, -1.269134521484375, -1.2065277099609375, -1.1439208984375, -1.0813140869140625, -1.018707275390625, -0.9561004638671875, -0.89349365234375, -0.8308868408203125, -0.768280029296875, -0.7056732177734375, -0.64306640625, -0.5804595947265625, -0.517852783203125, -0.4552459716796875, -0.39263916015625, -0.3300323486328125, -0.267425537109375, -0.2048187255859375, -0.1422119140625, -0.0796051025390625, -0.016998291015625, 0.0456085205078125, 0.10821533203125, 0.1708221435546875, 0.233428955078125, 0.2960357666015625, 0.358642578125, 0.4212493896484375, 0.483856201171875, 0.5464630126953125, 0.60906982421875, 0.6716766357421875, 0.734283447265625, 0.7968902587890625, 0.8594970703125, 0.9221038818359375, 0.984710693359375, 1.0473175048828125, 1.10992431640625, 1.1725311279296875, 1.235137939453125, 1.2977447509765625, 1.3603515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 1.0, 2.0, 12.0, 13.0, 13.0, 15.0, 16.0, 23.0, 34.0, 39.0, 46.0, 57.0, 85.0, 100.0, 2976.0, 211.0, 98.0, 61.0, 57.0, 54.0, 39.0, 24.0, 27.0, 18.0, 17.0, 10.0, 17.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11981201171875, -0.11431598663330078, -0.10881996154785156, -0.10332393646240234, -0.09782791137695312, -0.0923318862915039, -0.08683586120605469, -0.08133983612060547, -0.07584381103515625, -0.07034778594970703, -0.06485176086425781, -0.059355735778808594, -0.053859710693359375, -0.048363685607910156, -0.04286766052246094, -0.03737163543701172, -0.0318756103515625, -0.02637958526611328, -0.020883560180664062, -0.015387535095214844, -0.009891510009765625, -0.004395484924316406, 0.0011005401611328125, 0.006596565246582031, 0.01209259033203125, 0.01758861541748047, 0.023084640502929688, 0.028580665588378906, 0.034076690673828125, 0.039572715759277344, 0.04506874084472656, 0.05056476593017578, 0.056060791015625, 0.06155681610107422, 0.06705284118652344, 0.07254886627197266, 0.07804489135742188, 0.0835409164428711, 0.08903694152832031, 0.09453296661376953, 0.10002899169921875, 0.10552501678466797, 0.11102104187011719, 0.1165170669555664, 0.12201309204101562, 0.12750911712646484, 0.13300514221191406, 0.13850116729736328, 0.1439971923828125, 0.14949321746826172, 0.15498924255371094, 0.16048526763916016, 0.16598129272460938, 0.1714773178100586, 0.1769733428955078, 0.18246936798095703, 0.18796539306640625, 0.19346141815185547, 0.1989574432373047, 0.2044534683227539, 0.20994949340820312, 0.21544551849365234, 0.22094154357910156, 0.22643756866455078, 0.23193359375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 55.0, 742.0, 164.0, 26.0, 3.0, 8.0, 2.0, 3.0, 0.0, 3.0], "bins": [-2.836090564727783, -2.785233497619629, -2.7343766689300537, -2.6835196018218994, -2.632662534713745, -2.58180570602417, -2.5309486389160156, -2.4800915718078613, -2.429234743118286, -2.378377676010132, -2.3275208473205566, -2.2766637802124023, -2.225806713104248, -2.174949884414673, -2.1240928173065186, -2.0732357501983643, -2.02237868309021, -1.9715217351913452, -1.920664668083191, -1.8698077201843262, -1.8189507722854614, -1.7680937051773071, -1.7172367572784424, -1.666379690170288, -1.615522861480713, -1.5646659135818481, -1.5138088464736938, -1.462951898574829, -1.4120949506759644, -1.36123788356781, -1.3103809356689453, -1.259523868560791, -1.2086668014526367, -1.157809853553772, -1.1069527864456177, -1.056095838546753, -1.0052388906478882, -0.9543818235397339, -0.9035248756408691, -0.8526678681373596, -0.8018109798431396, -0.7509539723396301, -0.7000970244407654, -0.6492400169372559, -0.5983830094337463, -0.5475260019302368, -0.49666905403137207, -0.44581204652786255, -0.394955039024353, -0.3440980613231659, -0.29324105381965637, -0.24238407611846924, -0.1915270835161209, -0.14067009091377258, -0.08981311321258545, -0.03895610570907593, 0.011900871992111206, 0.06275786459445953, 0.11361484974622726, 0.164471834897995, 0.21532882750034332, 0.26618582010269165, 0.3170427978038788, 0.3678998053073883, 0.41875678300857544]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 8.0, 7.0, 8.0, 23.0, 21.0, 27.0, 34.0, 51.0, 51.0, 69.0, 77.0, 80.0, 82.0, 94.0, 83.0, 60.0, 45.0, 48.0, 24.0, 27.0, 17.0, 8.0, 8.0, 2.0, 2.0, 2.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7812978625297546, -0.7593730688095093, -0.7374482750892639, -0.7155234813690186, -0.6935986876487732, -0.6716738939285278, -0.6497490406036377, -0.6278243064880371, -0.605899453163147, -0.5839746594429016, -0.5620498657226562, -0.5401250720024109, -0.5182002782821655, -0.49627548456192017, -0.4743506610393524, -0.45242586731910706, -0.4305011034011841, -0.4085763096809387, -0.38665151596069336, -0.364726722240448, -0.34280192852020264, -0.3208771347999573, -0.2989523112773895, -0.27702751755714417, -0.2551027238368988, -0.23317793011665344, -0.21125313639640808, -0.18932832777500153, -0.16740353405475616, -0.1454787403345108, -0.12355393171310425, -0.10162913799285889, -0.07970428466796875, -0.05777948722243309, -0.03585468977689743, -0.013929888606071472, 0.00799490511417389, 0.02991969883441925, 0.051844507455825806, 0.07376930117607117, 0.09569409489631653, 0.11761888861656189, 0.13954368233680725, 0.1614684909582138, 0.18339328467845917, 0.20531807839870453, 0.22724288702011108, 0.24916768074035645, 0.2710924744606018, 0.29301726818084717, 0.31494206190109253, 0.3368668556213379, 0.35879164934158325, 0.3807164430618286, 0.40264126658439636, 0.4245660603046417, 0.4464908540248871, 0.46841564774513245, 0.4903404414653778, 0.5122652649879456, 0.5341900587081909, 0.5561148524284363, 0.5780396461486816, 0.599964439868927, 0.6218892335891724]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 5.0, 9.0, 8.0, 19.0, 25.0, 24.0, 36.0, 64.0, 69.0, 114.0, 148.0, 194.0, 257.0, 378.0, 507.0, 759.0, 1094.0, 1611.0, 2495.0, 4149.0, 7706.0, 17401.0, 66869.0, 776559.0, 121318.0, 23383.0, 9365.0, 4875.0, 2977.0, 1896.0, 1266.0, 844.0, 591.0, 415.0, 309.0, 232.0, 152.0, 127.0, 78.0, 69.0, 49.0, 30.0, 24.0, 21.0, 8.0, 13.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20556640625, -0.19885826110839844, -0.19215011596679688, -0.1854419708251953, -0.17873382568359375, -0.1720256805419922, -0.16531753540039062, -0.15860939025878906, -0.1519012451171875, -0.14519309997558594, -0.13848495483398438, -0.1317768096923828, -0.12506866455078125, -0.11836051940917969, -0.11165237426757812, -0.10494422912597656, -0.098236083984375, -0.09152793884277344, -0.08481979370117188, -0.07811164855957031, -0.07140350341796875, -0.06469535827636719, -0.057987213134765625, -0.05127906799316406, -0.0445709228515625, -0.03786277770996094, -0.031154632568359375, -0.024446487426757812, -0.01773834228515625, -0.011030197143554688, -0.004322052001953125, 0.0023860931396484375, 0.00909423828125, 0.015802383422851562, 0.022510528564453125, 0.029218673706054688, 0.03592681884765625, 0.04263496398925781, 0.049343109130859375, 0.05605125427246094, 0.0627593994140625, 0.06946754455566406, 0.07617568969726562, 0.08288383483886719, 0.08959197998046875, 0.09630012512207031, 0.10300827026367188, 0.10971641540527344, 0.116424560546875, 0.12313270568847656, 0.12984085083007812, 0.1365489959716797, 0.14325714111328125, 0.1499652862548828, 0.15667343139648438, 0.16338157653808594, 0.1700897216796875, 0.17679786682128906, 0.18350601196289062, 0.1902141571044922, 0.19692230224609375, 0.2036304473876953, 0.21033859252929688, 0.21704673767089844, 0.2237548828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 3.0, 8.0, 13.0, 40.0, 84.0, 131.0, 181.0, 176.0, 116.0, 67.0, 44.0, 15.0, 19.0, 9.0, 11.0, 7.0, 5.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 4.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034515380859375, -0.03338289260864258, -0.032250404357910156, -0.031117916107177734, -0.029985427856445312, -0.02885293960571289, -0.02772045135498047, -0.026587963104248047, -0.025455474853515625, -0.024322986602783203, -0.02319049835205078, -0.02205801010131836, -0.020925521850585938, -0.019793033599853516, -0.018660545349121094, -0.017528057098388672, -0.01639556884765625, -0.015263080596923828, -0.014130592346191406, -0.012998104095458984, -0.011865615844726562, -0.01073312759399414, -0.009600639343261719, -0.008468151092529297, -0.007335662841796875, -0.006203174591064453, -0.005070686340332031, -0.003938198089599609, -0.0028057098388671875, -0.0016732215881347656, -0.0005407333374023438, 0.0005917549133300781, 0.0017242431640625, 0.002856731414794922, 0.003989219665527344, 0.005121707916259766, 0.0062541961669921875, 0.007386684417724609, 0.008519172668457031, 0.009651660919189453, 0.010784149169921875, 0.011916637420654297, 0.013049125671386719, 0.01418161392211914, 0.015314102172851562, 0.016446590423583984, 0.017579078674316406, 0.018711566925048828, 0.01984405517578125, 0.020976543426513672, 0.022109031677246094, 0.023241519927978516, 0.024374008178710938, 0.02550649642944336, 0.02663898468017578, 0.027771472930908203, 0.028903961181640625, 0.030036449432373047, 0.03116893768310547, 0.03230142593383789, 0.03343391418457031, 0.034566402435302734, 0.035698890686035156, 0.03683137893676758, 0.0379638671875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 11.0, 11.0, 13.0, 21.0, 19.0, 35.0, 49.0, 54.0, 111.0, 165.0, 331.0, 648.0, 1643.0, 6661.0, 322897.0, 704593.0, 7935.0, 1793.0, 708.0, 319.0, 169.0, 118.0, 63.0, 61.0, 30.0, 21.0, 21.0, 18.0, 7.0, 6.0, 9.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.470947265625, -0.4557762145996094, -0.44060516357421875, -0.4254341125488281, -0.4102630615234375, -0.3950920104980469, -0.37992095947265625, -0.3647499084472656, -0.349578857421875, -0.3344078063964844, -0.31923675537109375, -0.3040657043457031, -0.2888946533203125, -0.2737236022949219, -0.25855255126953125, -0.24338150024414062, -0.22821044921875, -0.21303939819335938, -0.19786834716796875, -0.18269729614257812, -0.1675262451171875, -0.15235519409179688, -0.13718414306640625, -0.12201309204101562, -0.106842041015625, -0.09167098999023438, -0.07649993896484375, -0.061328887939453125, -0.0461578369140625, -0.030986785888671875, -0.01581573486328125, -0.000644683837890625, 0.0145263671875, 0.029697418212890625, 0.04486846923828125, 0.060039520263671875, 0.0752105712890625, 0.09038162231445312, 0.10555267333984375, 0.12072372436523438, 0.135894775390625, 0.15106582641601562, 0.16623687744140625, 0.18140792846679688, 0.1965789794921875, 0.21175003051757812, 0.22692108154296875, 0.24209213256835938, 0.25726318359375, 0.2724342346191406, 0.28760528564453125, 0.3027763366699219, 0.3179473876953125, 0.3331184387207031, 0.34828948974609375, 0.3634605407714844, 0.378631591796875, 0.3938026428222656, 0.40897369384765625, 0.4241447448730469, 0.4393157958984375, 0.4544868469238281, 0.46965789794921875, 0.4848289489746094, 0.5]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 9.0, 7.0, 11.0, 12.0, 19.0, 24.0, 24.0, 39.0, 37.0, 41.0, 49.0, 47.0, 37.0, 45.0, 53.0, 58.0, 59.0, 56.0, 51.0, 47.0, 56.0, 48.0, 32.0, 29.0, 23.0, 19.0, 18.0, 14.0, 12.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138916015625, -0.13463211059570312, -0.13034820556640625, -0.12606430053710938, -0.1217803955078125, -0.11749649047851562, -0.11321258544921875, -0.10892868041992188, -0.104644775390625, -0.10036087036132812, -0.09607696533203125, -0.09179306030273438, -0.0875091552734375, -0.08322525024414062, -0.07894134521484375, -0.07465744018554688, -0.07037353515625, -0.06608963012695312, -0.06180572509765625, -0.057521820068359375, -0.0532379150390625, -0.048954010009765625, -0.04467010498046875, -0.040386199951171875, -0.036102294921875, -0.031818389892578125, -0.02753448486328125, -0.023250579833984375, -0.0189666748046875, -0.014682769775390625, -0.01039886474609375, -0.006114959716796875, -0.0018310546875, 0.002452850341796875, 0.00673675537109375, 0.011020660400390625, 0.0153045654296875, 0.019588470458984375, 0.02387237548828125, 0.028156280517578125, 0.032440185546875, 0.036724090576171875, 0.04100799560546875, 0.045291900634765625, 0.0495758056640625, 0.053859710693359375, 0.05814361572265625, 0.062427520751953125, 0.06671142578125, 0.07099533081054688, 0.07527923583984375, 0.07956314086914062, 0.0838470458984375, 0.08813095092773438, 0.09241485595703125, 0.09669876098632812, 0.100982666015625, 0.10526657104492188, 0.10955047607421875, 0.11383438110351562, 0.1181182861328125, 0.12240219116210938, 0.12668609619140625, 0.13097000122070312, 0.13525390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 6.0, 3.0, 13.0, 25.0, 34.0, 20.0, 29.0, 51.0, 55.0, 81.0, 134.0, 190.0, 289.0, 537.0, 1272.0, 4262.0, 44398.0, 967360.0, 24149.0, 3117.0, 1106.0, 512.0, 281.0, 181.0, 111.0, 79.0, 47.0, 46.0, 38.0, 28.0, 17.0, 14.0, 9.0, 14.0, 5.0, 6.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00838470458984375, -0.008108973503112793, -0.007833242416381836, -0.007557511329650879, -0.007281780242919922, -0.007006049156188965, -0.006730318069458008, -0.006454586982727051, -0.006178855895996094, -0.005903124809265137, -0.00562739372253418, -0.005351662635803223, -0.005075931549072266, -0.004800200462341309, -0.0045244693756103516, -0.0042487382888793945, -0.0039730072021484375, -0.0036972761154174805, -0.0034215450286865234, -0.0031458139419555664, -0.0028700828552246094, -0.0025943517684936523, -0.0023186206817626953, -0.0020428895950317383, -0.0017671585083007812, -0.0014914274215698242, -0.0012156963348388672, -0.0009399652481079102, -0.0006642341613769531, -0.0003885030746459961, -0.00011277198791503906, 0.00016295909881591797, 0.000438690185546875, 0.000714421272277832, 0.000990152359008789, 0.001265883445739746, 0.0015416145324707031, 0.0018173456192016602, 0.002093076705932617, 0.0023688077926635742, 0.0026445388793945312, 0.0029202699661254883, 0.0031960010528564453, 0.0034717321395874023, 0.0037474632263183594, 0.004023194313049316, 0.0042989253997802734, 0.0045746564865112305, 0.0048503875732421875, 0.0051261186599731445, 0.0054018497467041016, 0.005677580833435059, 0.005953311920166016, 0.006229043006896973, 0.00650477409362793, 0.006780505180358887, 0.007056236267089844, 0.007331967353820801, 0.007607698440551758, 0.007883429527282715, 0.008159160614013672, 0.008434891700744629, 0.008710622787475586, 0.008986353874206543, 0.0092620849609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 3.0, 1.0, 4.0, 9.0, 9.0, 2.0, 6.0, 7.0, 11.0, 11.0, 24.0, 21.0, 17.0, 31.0, 38.0, 98.0, 159.0, 229.0, 90.0, 62.0, 43.0, 27.0, 20.0, 21.0, 13.0, 15.0, 7.0, 6.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.728006362915039e-05, -5.549192428588867e-05, -5.370378494262695e-05, -5.1915645599365234e-05, -5.0127506256103516e-05, -4.83393669128418e-05, -4.655122756958008e-05, -4.476308822631836e-05, -4.297494888305664e-05, -4.118680953979492e-05, -3.93986701965332e-05, -3.7610530853271484e-05, -3.5822391510009766e-05, -3.403425216674805e-05, -3.224611282348633e-05, -3.045797348022461e-05, -2.866983413696289e-05, -2.6881694793701172e-05, -2.5093555450439453e-05, -2.3305416107177734e-05, -2.1517276763916016e-05, -1.9729137420654297e-05, -1.7940998077392578e-05, -1.615285873413086e-05, -1.436471939086914e-05, -1.2576580047607422e-05, -1.0788440704345703e-05, -9.000301361083984e-06, -7.212162017822266e-06, -5.424022674560547e-06, -3.635883331298828e-06, -1.8477439880371094e-06, -5.960464477539063e-08, 1.7285346984863281e-06, 3.516674041748047e-06, 5.304813385009766e-06, 7.092952728271484e-06, 8.881092071533203e-06, 1.0669231414794922e-05, 1.245737075805664e-05, 1.424551010131836e-05, 1.6033649444580078e-05, 1.7821788787841797e-05, 1.9609928131103516e-05, 2.1398067474365234e-05, 2.3186206817626953e-05, 2.4974346160888672e-05, 2.676248550415039e-05, 2.855062484741211e-05, 3.0338764190673828e-05, 3.212690353393555e-05, 3.3915042877197266e-05, 3.5703182220458984e-05, 3.74913215637207e-05, 3.927946090698242e-05, 4.106760025024414e-05, 4.285573959350586e-05, 4.464387893676758e-05, 4.64320182800293e-05, 4.8220157623291016e-05, 5.0008296966552734e-05, 5.179643630981445e-05, 5.358457565307617e-05, 5.537271499633789e-05, 5.716085433959961e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 10.0, 9.0, 12.0, 18.0, 36.0, 51.0, 93.0, 226.0, 608.0, 2816.0, 788820.0, 252174.0, 2612.0, 585.0, 217.0, 108.0, 49.0, 35.0, 22.0, 14.0, 12.0, 6.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0249481201171875, -0.024254560470581055, -0.02356100082397461, -0.022867441177368164, -0.02217388153076172, -0.021480321884155273, -0.020786762237548828, -0.020093202590942383, -0.019399642944335938, -0.018706083297729492, -0.018012523651123047, -0.0173189640045166, -0.016625404357910156, -0.01593184471130371, -0.015238285064697266, -0.01454472541809082, -0.013851165771484375, -0.01315760612487793, -0.012464046478271484, -0.011770486831665039, -0.011076927185058594, -0.010383367538452148, -0.009689807891845703, -0.008996248245239258, -0.008302688598632812, -0.007609128952026367, -0.006915569305419922, -0.0062220096588134766, -0.005528450012207031, -0.004834890365600586, -0.004141330718994141, -0.0034477710723876953, -0.00275421142578125, -0.0020606517791748047, -0.0013670921325683594, -0.0006735324859619141, 2.002716064453125e-05, 0.0007135868072509766, 0.0014071464538574219, 0.002100706100463867, 0.0027942657470703125, 0.003487825393676758, 0.004181385040283203, 0.0048749446868896484, 0.005568504333496094, 0.006262063980102539, 0.006955623626708984, 0.00764918327331543, 0.008342742919921875, 0.00903630256652832, 0.009729862213134766, 0.010423421859741211, 0.011116981506347656, 0.011810541152954102, 0.012504100799560547, 0.013197660446166992, 0.013891220092773438, 0.014584779739379883, 0.015278339385986328, 0.015971899032592773, 0.01666545867919922, 0.017359018325805664, 0.01805257797241211, 0.018746137619018555, 0.019439697265625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 15.0, 14.0, 21.0, 34.0, 44.0, 72.0, 109.0, 169.0, 167.0, 127.0, 76.0, 39.0, 26.0, 20.0, 16.0, 10.0, 4.0, 2.0, 9.0, 5.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005382537841796875, -0.005190372467041016, -0.004998207092285156, -0.004806041717529297, -0.0046138763427734375, -0.004421710968017578, -0.004229545593261719, -0.004037380218505859, -0.00384521484375, -0.0036530494689941406, -0.0034608840942382812, -0.003268718719482422, -0.0030765533447265625, -0.002884387969970703, -0.0026922225952148438, -0.0025000572204589844, -0.002307891845703125, -0.0021157264709472656, -0.0019235610961914062, -0.0017313957214355469, -0.0015392303466796875, -0.0013470649719238281, -0.0011548995971679688, -0.0009627342224121094, -0.00077056884765625, -0.0005784034729003906, -0.00038623809814453125, -0.00019407272338867188, -1.9073486328125e-06, 0.00019025802612304688, 0.00038242340087890625, 0.0005745887756347656, 0.000766754150390625, 0.0009589195251464844, 0.0011510848999023438, 0.0013432502746582031, 0.0015354156494140625, 0.0017275810241699219, 0.0019197463989257812, 0.0021119117736816406, 0.0023040771484375, 0.0024962425231933594, 0.0026884078979492188, 0.002880573272705078, 0.0030727386474609375, 0.003264904022216797, 0.0034570693969726562, 0.0036492347717285156, 0.003841400146484375, 0.004033565521240234, 0.004225730895996094, 0.004417896270751953, 0.0046100616455078125, 0.004802227020263672, 0.004994392395019531, 0.005186557769775391, 0.00537872314453125, 0.005570888519287109, 0.005763053894042969, 0.005955219268798828, 0.0061473846435546875, 0.006339550018310547, 0.006531715393066406, 0.006723880767822266, 0.006916046142578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 14.0, 669.0, 328.0, 5.0, 0.0, 2.0, 1.0], "bins": [-9.949470520019531, -9.780729293823242, -9.611988067626953, -9.443246841430664, -9.274505615234375, -9.105764389038086, -8.937023162841797, -8.768281936645508, -8.599540710449219, -8.43079948425293, -8.26205825805664, -8.093317031860352, -7.9245758056640625, -7.755834579467773, -7.587093353271484, -7.418352127075195, -7.249610424041748, -7.080869197845459, -6.91212797164917, -6.743386745452881, -6.574645519256592, -6.405904293060303, -6.2371625900268555, -6.068421363830566, -5.899680137634277, -5.730938911437988, -5.562197685241699, -5.39345645904541, -5.224715232849121, -5.055974006652832, -4.887232780456543, -4.718491554260254, -4.549750804901123, -4.381009578704834, -4.212268352508545, -4.043527126312256, -3.874785900115967, -3.7060446739196777, -3.5373032093048096, -3.3685619831085205, -3.1998207569122314, -3.0310795307159424, -2.8623383045196533, -2.693596839904785, -2.524855613708496, -2.356114387512207, -2.187373161315918, -2.018631935119629, -1.8498907089233398, -1.6811494827270508, -1.5124082565307617, -1.343666911125183, -1.174925684928894, -1.006184458732605, -0.8374431133270264, -0.6687018871307373, -0.49996060132980347, -0.331219345331192, -0.16247808933258057, 0.0062631964683532715, 0.17500442266464233, 0.3437456488609314, 0.51248699426651, 0.6812282204627991, 0.8499694466590881]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 18.0, 19.0, 15.0, 13.0, 22.0, 35.0, 24.0, 46.0, 53.0, 59.0, 50.0, 54.0, 52.0, 58.0, 67.0, 58.0, 52.0, 45.0, 44.0, 41.0, 26.0, 32.0, 21.0, 21.0, 18.0, 13.0, 8.0, 3.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7800173163414001, -0.7510339617729187, -0.722050666809082, -0.6930673122406006, -0.6640839576721191, -0.6351006031036377, -0.606117308139801, -0.5771339535713196, -0.5481506586074829, -0.5191673040390015, -0.4901839792728424, -0.46120065450668335, -0.4322172999382019, -0.40323397517204285, -0.3742506504058838, -0.34526729583740234, -0.3162839412689209, -0.28730061650276184, -0.2583172619342804, -0.22933393716812134, -0.2003505975008011, -0.17136725783348083, -0.14238393306732178, -0.11340059340000153, -0.08441725373268127, -0.05543391779065132, -0.02645058184862137, 0.002532750368118286, 0.03151609003543854, 0.06049942970275879, 0.08948275446891785, 0.1184660941362381, 0.14744937419891357, 0.17643271386623383, 0.20541605353355408, 0.23439937829971313, 0.2633827328681946, 0.29236605763435364, 0.3213493824005127, 0.35033273696899414, 0.3793160617351532, 0.40829938650131226, 0.4372827410697937, 0.46626606583595276, 0.4952493906021118, 0.5242327451705933, 0.5532160997390747, 0.5821993947029114, 0.6111827492713928, 0.6401661038398743, 0.6691493988037109, 0.6981327533721924, 0.7271161079406738, 0.7560994625091553, 0.7850827574729919, 0.8140661120414734, 0.8430494070053101, 0.8720327615737915, 0.9010160565376282, 0.9299994111061096, 0.9589827656745911, 0.9879660606384277, 1.0169494152069092, 1.0459327697753906, 1.074916124343872]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 5.0, 12.0, 16.0, 28.0, 63.0, 184.0, 536.0, 2178.0, 51733.0, 4133052.0, 4799.0, 1071.0, 312.0, 119.0, 57.0, 31.0, 11.0, 12.0, 10.0, 5.0, 3.0, 5.0, 5.0, 2.0, 1.0, 7.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89111328125, -0.8633804321289062, -0.8356475830078125, -0.8079147338867188, -0.780181884765625, -0.7524490356445312, -0.7247161865234375, -0.6969833374023438, -0.66925048828125, -0.6415176391601562, -0.6137847900390625, -0.5860519409179688, -0.558319091796875, -0.5305862426757812, -0.5028533935546875, -0.47512054443359375, -0.4473876953125, -0.41965484619140625, -0.3919219970703125, -0.36418914794921875, -0.336456298828125, -0.30872344970703125, -0.2809906005859375, -0.25325775146484375, -0.22552490234375, -0.19779205322265625, -0.1700592041015625, -0.14232635498046875, -0.114593505859375, -0.08686065673828125, -0.0591278076171875, -0.03139495849609375, -0.003662109375, 0.02407073974609375, 0.0518035888671875, 0.07953643798828125, 0.107269287109375, 0.13500213623046875, 0.1627349853515625, 0.19046783447265625, 0.21820068359375, 0.24593353271484375, 0.2736663818359375, 0.30139923095703125, 0.329132080078125, 0.35686492919921875, 0.3845977783203125, 0.41233062744140625, 0.4400634765625, 0.46779632568359375, 0.4955291748046875, 0.5232620239257812, 0.550994873046875, 0.5787277221679688, 0.6064605712890625, 0.6341934204101562, 0.66192626953125, 0.6896591186523438, 0.7173919677734375, 0.7451248168945312, 0.772857666015625, 0.8005905151367188, 0.8283233642578125, 0.8560562133789062, 0.8837890625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 9.0, 14.0, 19.0, 60.0, 98.0, 159.0, 159.0, 149.0, 96.0, 62.0, 31.0, 27.0, 19.0, 15.0, 6.0, 8.0, 9.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 7.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03594970703125, -0.03483009338378906, -0.033710479736328125, -0.03259086608886719, -0.03147125244140625, -0.030351638793945312, -0.029232025146484375, -0.028112411499023438, -0.0269927978515625, -0.025873184204101562, -0.024753570556640625, -0.023633956909179688, -0.02251434326171875, -0.021394729614257812, -0.020275115966796875, -0.019155502319335938, -0.018035888671875, -0.016916275024414062, -0.015796661376953125, -0.014677047729492188, -0.01355743408203125, -0.012437820434570312, -0.011318206787109375, -0.010198593139648438, -0.0090789794921875, -0.007959365844726562, -0.006839752197265625, -0.0057201385498046875, -0.00460052490234375, -0.0034809112548828125, -0.002361297607421875, -0.0012416839599609375, -0.0001220703125, 0.0009975433349609375, 0.002117156982421875, 0.0032367706298828125, 0.00435638427734375, 0.0054759979248046875, 0.006595611572265625, 0.0077152252197265625, 0.0088348388671875, 0.009954452514648438, 0.011074066162109375, 0.012193679809570312, 0.01331329345703125, 0.014432907104492188, 0.015552520751953125, 0.016672134399414062, 0.017791748046875, 0.018911361694335938, 0.020030975341796875, 0.021150588989257812, 0.02227020263671875, 0.023389816284179688, 0.024509429931640625, 0.025629043579101562, 0.0267486572265625, 0.027868270874023438, 0.028987884521484375, 0.030107498168945312, 0.03122711181640625, 0.03234672546386719, 0.033466339111328125, 0.03458595275878906, 0.03570556640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 0.0, 14.0, 13.0, 20.0, 22.0, 44.0, 84.0, 151.0, 413.0, 1744.0, 14324.0, 4142069.0, 31938.0, 2423.0, 561.0, 197.0, 96.0, 44.0, 25.0, 20.0, 17.0, 11.0, 14.0, 7.0, 4.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57861328125, -0.5603485107421875, -0.542083740234375, -0.5238189697265625, -0.50555419921875, -0.4872894287109375, -0.469024658203125, -0.4507598876953125, -0.4324951171875, -0.4142303466796875, -0.395965576171875, -0.3777008056640625, -0.35943603515625, -0.3411712646484375, -0.322906494140625, -0.3046417236328125, -0.286376953125, -0.2681121826171875, -0.249847412109375, -0.2315826416015625, -0.21331787109375, -0.1950531005859375, -0.176788330078125, -0.1585235595703125, -0.1402587890625, -0.1219940185546875, -0.103729248046875, -0.0854644775390625, -0.06719970703125, -0.0489349365234375, -0.030670166015625, -0.0124053955078125, 0.005859375, 0.0241241455078125, 0.042388916015625, 0.0606536865234375, 0.07891845703125, 0.0971832275390625, 0.115447998046875, 0.1337127685546875, 0.1519775390625, 0.1702423095703125, 0.188507080078125, 0.2067718505859375, 0.22503662109375, 0.2433013916015625, 0.261566162109375, 0.2798309326171875, 0.298095703125, 0.3163604736328125, 0.334625244140625, 0.3528900146484375, 0.37115478515625, 0.3894195556640625, 0.407684326171875, 0.4259490966796875, 0.4442138671875, 0.4624786376953125, 0.480743408203125, 0.4990081787109375, 0.51727294921875, 0.5355377197265625, 0.553802490234375, 0.5720672607421875, 0.59033203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 4.0, 3.0, 11.0, 6.0, 13.0, 11.0, 10.0, 8.0, 14.0, 14.0, 24.0, 40.0, 45.0, 3472.0, 228.0, 42.0, 26.0, 19.0, 20.0, 16.0, 7.0, 7.0, 8.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08392333984375, -0.08136558532714844, -0.07880783081054688, -0.07625007629394531, -0.07369232177734375, -0.07113456726074219, -0.06857681274414062, -0.06601905822753906, -0.0634613037109375, -0.06090354919433594, -0.058345794677734375, -0.05578804016113281, -0.05323028564453125, -0.05067253112792969, -0.048114776611328125, -0.04555702209472656, -0.042999267578125, -0.04044151306152344, -0.037883758544921875, -0.03532600402832031, -0.03276824951171875, -0.030210494995117188, -0.027652740478515625, -0.025094985961914062, -0.0225372314453125, -0.019979476928710938, -0.017421722412109375, -0.014863967895507812, -0.01230621337890625, -0.009748458862304688, -0.007190704345703125, -0.0046329498291015625, -0.0020751953125, 0.0004825592041015625, 0.003040313720703125, 0.0055980682373046875, 0.00815582275390625, 0.010713577270507812, 0.013271331787109375, 0.015829086303710938, 0.0183868408203125, 0.020944595336914062, 0.023502349853515625, 0.026060104370117188, 0.02861785888671875, 0.031175613403320312, 0.033733367919921875, 0.03629112243652344, 0.038848876953125, 0.04140663146972656, 0.043964385986328125, 0.04652214050292969, 0.04907989501953125, 0.05163764953613281, 0.054195404052734375, 0.05675315856933594, 0.0593109130859375, 0.06186866760253906, 0.06442642211914062, 0.06698417663574219, 0.06954193115234375, 0.07209968566894531, 0.07465744018554688, 0.07721519470214844, 0.07977294921875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 239.0, 774.0, 5.0], "bins": [-3.634164810180664, -3.5756020545959473, -3.5170395374298096, -3.4584767818450928, -3.399914264678955, -3.3413515090942383, -3.2827889919281006, -3.224226236343384, -3.165663719177246, -3.1071009635925293, -3.0485384464263916, -2.989975690841675, -2.931413173675537, -2.8728504180908203, -2.8142879009246826, -2.755725145339966, -2.697162628173828, -2.6385998725891113, -2.5800373554229736, -2.521474599838257, -2.462912082672119, -2.4043493270874023, -2.3457868099212646, -2.287224054336548, -2.22866153717041, -2.1700987815856934, -2.1115362644195557, -2.052973508834839, -1.9944109916687012, -1.935848355293274, -1.8772857189178467, -1.8187230825424194, -1.7601604461669922, -1.701597809791565, -1.6430351734161377, -1.5844725370407104, -1.5259099006652832, -1.467347264289856, -1.4087846279144287, -1.3502219915390015, -1.2916593551635742, -1.233096718788147, -1.1745340824127197, -1.1159714460372925, -1.0574088096618652, -0.998846173286438, -0.9402835369110107, -0.8817209005355835, -0.8231581449508667, -0.7645955085754395, -0.7060328722000122, -0.647470235824585, -0.5889075994491577, -0.5303449630737305, -0.47178229689598083, -0.4132196605205536, -0.35465705394744873, -0.2960944175720215, -0.23753178119659424, -0.1789691299200058, -0.12040649354457855, -0.06184384226799011, -0.003281205892562866, 0.05528143048286438, 0.11384406685829163]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 8.0, 12.0, 9.0, 12.0, 21.0, 34.0, 28.0, 41.0, 42.0, 45.0, 52.0, 50.0, 57.0, 50.0, 64.0, 50.0, 62.0, 45.0, 54.0, 62.0, 42.0, 30.0, 28.0, 29.0, 13.0, 11.0, 12.0, 7.0, 9.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23556888103485107, -0.2282554805278778, -0.22094208002090454, -0.21362867951393127, -0.2063152939081192, -0.19900189340114594, -0.19168849289417267, -0.1843750923871994, -0.17706170678138733, -0.16974830627441406, -0.1624349057674408, -0.15512150526046753, -0.14780811965465546, -0.1404947191476822, -0.13318131864070892, -0.12586791813373566, -0.11855451762676239, -0.11124111711978912, -0.10392772406339645, -0.09661432355642319, -0.08930093050003052, -0.08198752999305725, -0.07467412948608398, -0.06736072897911072, -0.06004733592271805, -0.05273393914103508, -0.04542054235935211, -0.038107141852378845, -0.030793745070695877, -0.02348034828901291, -0.016166947782039642, -0.008853551000356674, -0.001540154218673706, 0.005773243494331837, 0.01308664120733738, 0.020400039851665497, 0.027713436633348465, 0.03502683341503143, 0.0423402339220047, 0.04965363070368767, 0.056967027485370636, 0.0642804279923439, 0.07159382104873657, 0.07890722155570984, 0.0862206220626831, 0.09353401511907578, 0.10084741562604904, 0.10816080868244171, 0.11547420918941498, 0.12278760969638824, 0.1301010102033615, 0.13741439580917358, 0.14472779631614685, 0.15204119682312012, 0.15935459733009338, 0.16666799783706665, 0.17398139834403992, 0.18129479885101318, 0.18860819935798645, 0.19592159986495972, 0.2032349854707718, 0.21054838597774506, 0.21786178648471832, 0.2251751869916916, 0.23248857259750366]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 2.0, 5.0, 8.0, 11.0, 9.0, 22.0, 29.0, 38.0, 46.0, 67.0, 97.0, 155.0, 206.0, 306.0, 380.0, 624.0, 990.0, 1500.0, 2370.0, 4369.0, 8777.0, 23098.0, 105017.0, 761661.0, 97966.0, 21523.0, 8328.0, 4204.0, 2272.0, 1443.0, 993.0, 632.0, 437.0, 273.0, 182.0, 126.0, 106.0, 89.0, 56.0, 47.0, 20.0, 28.0, 15.0, 9.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.166015625, -0.16074180603027344, -0.15546798706054688, -0.1501941680908203, -0.14492034912109375, -0.1396465301513672, -0.13437271118164062, -0.12909889221191406, -0.1238250732421875, -0.11855125427246094, -0.11327743530273438, -0.10800361633300781, -0.10272979736328125, -0.09745597839355469, -0.09218215942382812, -0.08690834045410156, -0.081634521484375, -0.07636070251464844, -0.07108688354492188, -0.06581306457519531, -0.06053924560546875, -0.05526542663574219, -0.049991607666015625, -0.04471778869628906, -0.0394439697265625, -0.03417015075683594, -0.028896331787109375, -0.023622512817382812, -0.01834869384765625, -0.013074874877929688, -0.007801055908203125, -0.0025272369384765625, 0.00274658203125, 0.008020401000976562, 0.013294219970703125, 0.018568038940429688, 0.02384185791015625, 0.029115676879882812, 0.034389495849609375, 0.03966331481933594, 0.0449371337890625, 0.05021095275878906, 0.055484771728515625, 0.06075859069824219, 0.06603240966796875, 0.07130622863769531, 0.07658004760742188, 0.08185386657714844, 0.087127685546875, 0.09240150451660156, 0.09767532348632812, 0.10294914245605469, 0.10822296142578125, 0.11349678039550781, 0.11877059936523438, 0.12404441833496094, 0.1293182373046875, 0.13459205627441406, 0.13986587524414062, 0.1451396942138672, 0.15041351318359375, 0.1556873321533203, 0.16096115112304688, 0.16623497009277344, 0.1715087890625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 5.0, 9.0, 17.0, 41.0, 57.0, 110.0, 139.0, 143.0, 129.0, 107.0, 57.0, 45.0, 27.0, 23.0, 8.0, 8.0, 5.0, 8.0, 8.0, 5.0, 2.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0335693359375, -0.03258347511291504, -0.03159761428833008, -0.030611753463745117, -0.029625892639160156, -0.028640031814575195, -0.027654170989990234, -0.026668310165405273, -0.025682449340820312, -0.02469658851623535, -0.02371072769165039, -0.02272486686706543, -0.02173900604248047, -0.020753145217895508, -0.019767284393310547, -0.018781423568725586, -0.017795562744140625, -0.016809701919555664, -0.015823841094970703, -0.014837980270385742, -0.013852119445800781, -0.01286625862121582, -0.01188039779663086, -0.010894536972045898, -0.009908676147460938, -0.008922815322875977, -0.007936954498291016, -0.006951093673706055, -0.005965232849121094, -0.004979372024536133, -0.003993511199951172, -0.003007650375366211, -0.00202178955078125, -0.001035928726196289, -5.0067901611328125e-05, 0.0009357929229736328, 0.0019216537475585938, 0.0029075145721435547, 0.0038933753967285156, 0.0048792362213134766, 0.0058650970458984375, 0.0068509578704833984, 0.00783681869506836, 0.00882267951965332, 0.009808540344238281, 0.010794401168823242, 0.011780261993408203, 0.012766122817993164, 0.013751983642578125, 0.014737844467163086, 0.015723705291748047, 0.016709566116333008, 0.01769542694091797, 0.01868128776550293, 0.01966714859008789, 0.02065300941467285, 0.021638870239257812, 0.022624731063842773, 0.023610591888427734, 0.024596452713012695, 0.025582313537597656, 0.026568174362182617, 0.027554035186767578, 0.02853989601135254, 0.0295257568359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 8.0, 14.0, 23.0, 16.0, 22.0, 40.0, 38.0, 56.0, 73.0, 121.0, 154.0, 298.0, 728.0, 1957.0, 9024.0, 831282.0, 196166.0, 5606.0, 1507.0, 609.0, 256.0, 152.0, 106.0, 81.0, 58.0, 33.0, 29.0, 21.0, 16.0, 12.0, 8.0, 7.0, 8.0, 6.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4375, -0.4253082275390625, -0.413116455078125, -0.4009246826171875, -0.38873291015625, -0.3765411376953125, -0.364349365234375, -0.3521575927734375, -0.3399658203125, -0.3277740478515625, -0.315582275390625, -0.3033905029296875, -0.29119873046875, -0.2790069580078125, -0.266815185546875, -0.2546234130859375, -0.242431640625, -0.2302398681640625, -0.218048095703125, -0.2058563232421875, -0.19366455078125, -0.1814727783203125, -0.169281005859375, -0.1570892333984375, -0.1448974609375, -0.1327056884765625, -0.120513916015625, -0.1083221435546875, -0.09613037109375, -0.0839385986328125, -0.071746826171875, -0.0595550537109375, -0.04736328125, -0.0351715087890625, -0.022979736328125, -0.0107879638671875, 0.00140380859375, 0.0135955810546875, 0.025787353515625, 0.0379791259765625, 0.0501708984375, 0.0623626708984375, 0.074554443359375, 0.0867462158203125, 0.09893798828125, 0.1111297607421875, 0.123321533203125, 0.1355133056640625, 0.147705078125, 0.1598968505859375, 0.172088623046875, 0.1842803955078125, 0.19647216796875, 0.2086639404296875, 0.220855712890625, 0.2330474853515625, 0.2452392578125, 0.2574310302734375, 0.269622802734375, 0.2818145751953125, 0.29400634765625, 0.3061981201171875, 0.318389892578125, 0.3305816650390625, 0.3427734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 4.0, 4.0, 12.0, 16.0, 11.0, 19.0, 19.0, 23.0, 27.0, 46.0, 39.0, 45.0, 41.0, 39.0, 48.0, 43.0, 49.0, 58.0, 59.0, 60.0, 33.0, 33.0, 29.0, 38.0, 35.0, 28.0, 22.0, 25.0, 24.0, 15.0, 13.0, 11.0, 12.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10858154296875, -0.1049795150756836, -0.10137748718261719, -0.09777545928955078, -0.09417343139648438, -0.09057140350341797, -0.08696937561035156, -0.08336734771728516, -0.07976531982421875, -0.07616329193115234, -0.07256126403808594, -0.06895923614501953, -0.06535720825195312, -0.06175518035888672, -0.05815315246582031, -0.054551124572753906, -0.0509490966796875, -0.047347068786621094, -0.04374504089355469, -0.04014301300048828, -0.036540985107421875, -0.03293895721435547, -0.029336929321289062, -0.025734901428222656, -0.02213287353515625, -0.018530845642089844, -0.014928817749023438, -0.011326789855957031, -0.007724761962890625, -0.004122734069824219, -0.0005207061767578125, 0.0030813217163085938, 0.006683349609375, 0.010285377502441406, 0.013887405395507812, 0.01748943328857422, 0.021091461181640625, 0.02469348907470703, 0.028295516967773438, 0.031897544860839844, 0.03549957275390625, 0.039101600646972656, 0.04270362854003906, 0.04630565643310547, 0.049907684326171875, 0.05350971221923828, 0.05711174011230469, 0.060713768005371094, 0.0643157958984375, 0.0679178237915039, 0.07151985168457031, 0.07512187957763672, 0.07872390747070312, 0.08232593536376953, 0.08592796325683594, 0.08952999114990234, 0.09313201904296875, 0.09673404693603516, 0.10033607482910156, 0.10393810272216797, 0.10754013061523438, 0.11114215850830078, 0.11474418640136719, 0.1183462142944336, 0.1219482421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 1.0, 5.0, 1.0, 9.0, 12.0, 13.0, 13.0, 26.0, 47.0, 55.0, 115.0, 245.0, 708.0, 2798.0, 362112.0, 677929.0, 3195.0, 640.0, 278.0, 151.0, 66.0, 36.0, 23.0, 21.0, 8.0, 12.0, 3.0, 6.0, 7.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015228271484375, -0.014720916748046875, -0.01421356201171875, -0.013706207275390625, -0.0131988525390625, -0.012691497802734375, -0.01218414306640625, -0.011676788330078125, -0.01116943359375, -0.010662078857421875, -0.01015472412109375, -0.009647369384765625, -0.0091400146484375, -0.008632659912109375, -0.00812530517578125, -0.007617950439453125, -0.007110595703125, -0.006603240966796875, -0.00609588623046875, -0.005588531494140625, -0.0050811767578125, -0.004573822021484375, -0.00406646728515625, -0.003559112548828125, -0.0030517578125, -0.002544403076171875, -0.00203704833984375, -0.001529693603515625, -0.0010223388671875, -0.000514984130859375, -7.62939453125e-06, 0.000499725341796875, 0.001007080078125, 0.001514434814453125, 0.00202178955078125, 0.002529144287109375, 0.0030364990234375, 0.003543853759765625, 0.00405120849609375, 0.004558563232421875, 0.00506591796875, 0.005573272705078125, 0.00608062744140625, 0.006587982177734375, 0.0070953369140625, 0.007602691650390625, 0.00811004638671875, 0.008617401123046875, 0.009124755859375, 0.009632110595703125, 0.01013946533203125, 0.010646820068359375, 0.0111541748046875, 0.011661529541015625, 0.01216888427734375, 0.012676239013671875, 0.01318359375, 0.013690948486328125, 0.01419830322265625, 0.014705657958984375, 0.0152130126953125, 0.015720367431640625, 0.01622772216796875, 0.016735076904296875, 0.017242431640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 7.0, 0.0, 6.0, 6.0, 8.0, 11.0, 8.0, 8.0, 22.0, 18.0, 15.0, 30.0, 23.0, 45.0, 79.0, 85.0, 93.0, 92.0, 87.0, 72.0, 59.0, 53.0, 35.0, 34.0, 21.0, 24.0, 14.0, 16.0, 3.0, 9.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.279613494873047e-05, -4.143174737691879e-05, -4.006735980510712e-05, -3.870297223329544e-05, -3.7338584661483765e-05, -3.597419708967209e-05, -3.460980951786041e-05, -3.3245421946048737e-05, -3.188103437423706e-05, -3.0516646802425385e-05, -2.915225923061371e-05, -2.7787871658802032e-05, -2.6423484086990356e-05, -2.505909651517868e-05, -2.3694708943367004e-05, -2.233032137155533e-05, -2.0965933799743652e-05, -1.9601546227931976e-05, -1.82371586561203e-05, -1.6872771084308624e-05, -1.5508383512496948e-05, -1.4143995940685272e-05, -1.2779608368873596e-05, -1.141522079706192e-05, -1.0050833225250244e-05, -8.686445653438568e-06, -7.322058081626892e-06, -5.957670509815216e-06, -4.59328293800354e-06, -3.228895366191864e-06, -1.864507794380188e-06, -5.00120222568512e-07, 8.642673492431641e-07, 2.22865492105484e-06, 3.593042492866516e-06, 4.957430064678192e-06, 6.321817636489868e-06, 7.686205208301544e-06, 9.05059278011322e-06, 1.0414980351924896e-05, 1.1779367923736572e-05, 1.3143755495548248e-05, 1.4508143067359924e-05, 1.58725306391716e-05, 1.7236918210983276e-05, 1.8601305782794952e-05, 1.996569335460663e-05, 2.1330080926418304e-05, 2.269446849822998e-05, 2.4058856070041656e-05, 2.5423243641853333e-05, 2.678763121366501e-05, 2.8152018785476685e-05, 2.951640635728836e-05, 3.088079392910004e-05, 3.224518150091171e-05, 3.360956907272339e-05, 3.4973956644535065e-05, 3.633834421634674e-05, 3.770273178815842e-05, 3.906711935997009e-05, 4.043150693178177e-05, 4.1795894503593445e-05, 4.316028207540512e-05, 4.45246696472168e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 13.0, 16.0, 21.0, 35.0, 48.0, 74.0, 126.0, 289.0, 1016.0, 7942.0, 1025832.0, 11094.0, 1296.0, 352.0, 142.0, 79.0, 47.0, 34.0, 24.0, 15.0, 8.0, 13.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02947998046875, -0.028574228286743164, -0.027668476104736328, -0.026762723922729492, -0.025856971740722656, -0.02495121955871582, -0.024045467376708984, -0.02313971519470215, -0.022233963012695312, -0.021328210830688477, -0.02042245864868164, -0.019516706466674805, -0.01861095428466797, -0.017705202102661133, -0.016799449920654297, -0.01589369773864746, -0.014987945556640625, -0.014082193374633789, -0.013176441192626953, -0.012270689010620117, -0.011364936828613281, -0.010459184646606445, -0.00955343246459961, -0.008647680282592773, -0.0077419281005859375, -0.0068361759185791016, -0.005930423736572266, -0.00502467155456543, -0.004118919372558594, -0.003213167190551758, -0.002307415008544922, -0.001401662826538086, -0.00049591064453125, 0.00040984153747558594, 0.0013155937194824219, 0.002221345901489258, 0.0031270980834960938, 0.00403285026550293, 0.004938602447509766, 0.0058443546295166016, 0.0067501068115234375, 0.0076558589935302734, 0.00856161117553711, 0.009467363357543945, 0.010373115539550781, 0.011278867721557617, 0.012184619903564453, 0.013090372085571289, 0.013996124267578125, 0.014901876449584961, 0.015807628631591797, 0.016713380813598633, 0.01761913299560547, 0.018524885177612305, 0.01943063735961914, 0.020336389541625977, 0.021242141723632812, 0.02214789390563965, 0.023053646087646484, 0.02395939826965332, 0.024865150451660156, 0.025770902633666992, 0.026676654815673828, 0.027582406997680664, 0.0284881591796875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 6.0, 5.0, 6.0, 22.0, 16.0, 37.0, 103.0, 166.0, 292.0, 164.0, 83.0, 34.0, 28.0, 11.0, 6.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0108184814453125, -0.010473847389221191, -0.010129213333129883, -0.009784579277038574, -0.009439945220947266, -0.009095311164855957, -0.008750677108764648, -0.00840604305267334, -0.008061408996582031, -0.007716774940490723, -0.007372140884399414, -0.0070275068283081055, -0.006682872772216797, -0.006338238716125488, -0.00599360466003418, -0.005648970603942871, -0.0053043365478515625, -0.004959702491760254, -0.004615068435668945, -0.004270434379577637, -0.003925800323486328, -0.0035811662673950195, -0.003236532211303711, -0.0028918981552124023, -0.0025472640991210938, -0.002202630043029785, -0.0018579959869384766, -0.001513361930847168, -0.0011687278747558594, -0.0008240938186645508, -0.0004794597625732422, -0.0001348257064819336, 0.000209808349609375, 0.0005544424057006836, 0.0008990764617919922, 0.0012437105178833008, 0.0015883445739746094, 0.001932978630065918, 0.0022776126861572266, 0.002622246742248535, 0.0029668807983398438, 0.0033115148544311523, 0.003656148910522461, 0.0040007829666137695, 0.004345417022705078, 0.004690051078796387, 0.005034685134887695, 0.005379319190979004, 0.0057239532470703125, 0.006068587303161621, 0.00641322135925293, 0.006757855415344238, 0.007102489471435547, 0.0074471235275268555, 0.007791757583618164, 0.008136391639709473, 0.008481025695800781, 0.00882565975189209, 0.009170293807983398, 0.009514927864074707, 0.009859561920166016, 0.010204195976257324, 0.010548830032348633, 0.010893464088439941, 0.01123809814453125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 68.0, 924.0, 21.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.005024909973145, -7.865721225738525, -7.726417541503906, -7.587113857269287, -7.447810173034668, -7.308506488800049, -7.16920280456543, -7.029898643493652, -6.890595436096191, -6.751291751861572, -6.611988067626953, -6.472684383392334, -6.333380699157715, -6.194077014923096, -6.054773330688477, -5.915469169616699, -5.77616548538208, -5.636861801147461, -5.497558116912842, -5.358254432678223, -5.2189507484436035, -5.079647064208984, -4.940343379974365, -4.801039695739746, -4.661735534667969, -4.52243185043335, -4.3831281661987305, -4.243824481964111, -4.104520797729492, -3.965217113494873, -3.825913190841675, -3.6866095066070557, -3.547306537628174, -3.4080028533935547, -3.2686991691589355, -3.1293954849243164, -2.9900918006896973, -2.850788116455078, -2.71148419380188, -2.5721805095672607, -2.4328765869140625, -2.2935729026794434, -2.154269218444824, -2.014965534210205, -1.8756617307662964, -1.7363580465316772, -1.5970542430877686, -1.4577505588531494, -1.3184469938278198, -1.1791433095932007, -1.039839506149292, -0.9005358219146729, -0.7612321376800537, -0.6219284534454346, -0.48262470960617065, -0.34332096576690674, -0.2040172815322876, -0.06471356749534607, 0.07459014654159546, 0.213893860578537, 0.3531975746154785, 0.49250125885009766, 0.6318050026893616, 0.7711087465286255, 0.9104124307632446]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 7.0, 3.0, 8.0, 13.0, 16.0, 15.0, 11.0, 17.0, 25.0, 27.0, 30.0, 24.0, 34.0, 38.0, 34.0, 47.0, 33.0, 59.0, 54.0, 38.0, 44.0, 39.0, 44.0, 37.0, 24.0, 32.0, 33.0, 28.0, 29.0, 23.0, 23.0, 18.0, 14.0, 12.0, 9.0, 8.0, 10.0, 7.0, 6.0, 3.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.6520004868507385, -0.6329001784324646, -0.6137998700141907, -0.5946995615959167, -0.5755993127822876, -0.5564990043640137, -0.5373986959457397, -0.5182983875274658, -0.4991980791091919, -0.48009777069091797, -0.46099746227264404, -0.4418971836566925, -0.4227968752384186, -0.40369656682014465, -0.3845962882041931, -0.3654959797859192, -0.34639567136764526, -0.32729536294937134, -0.3081950545310974, -0.2890947759151459, -0.26999446749687195, -0.250894159078598, -0.2317938655614853, -0.21269357204437256, -0.19359326362609863, -0.1744929552078247, -0.15539266169071198, -0.13629236817359924, -0.11719205975532532, -0.09809175878763199, -0.07899145781993866, -0.05989116430282593, -0.040790855884552, -0.021690554916858673, -0.0025902539491653442, 0.016510047018527985, 0.035610347986221313, 0.05471064895391464, 0.07381094992160797, 0.0929112434387207, 0.11201155185699463, 0.13111186027526855, 0.1502121537923813, 0.16931244730949402, 0.18841275572776794, 0.20751306414604187, 0.2266133576631546, 0.24571365118026733, 0.26481395959854126, 0.2839142680168152, 0.3030145764350891, 0.32211485505104065, 0.3412151634693146, 0.3603154718875885, 0.37941575050354004, 0.39851605892181396, 0.4176163673400879, 0.4367166757583618, 0.45581698417663574, 0.4749172627925873, 0.4940175712108612, 0.5131178498268127, 0.5322181582450867, 0.5513184666633606, 0.5704187750816345]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 5.0, 10.0, 16.0, 23.0, 41.0, 61.0, 120.0, 257.0, 720.0, 5805.0, 4182173.0, 3808.0, 637.0, 247.0, 113.0, 81.0, 40.0, 26.0, 19.0, 13.0, 7.0, 9.0, 8.0, 7.0, 4.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.467529296875, -0.4531059265136719, -0.43868255615234375, -0.4242591857910156, -0.4098358154296875, -0.3954124450683594, -0.38098907470703125, -0.3665657043457031, -0.352142333984375, -0.3377189636230469, -0.32329559326171875, -0.3088722229003906, -0.2944488525390625, -0.2800254821777344, -0.26560211181640625, -0.2511787414550781, -0.23675537109375, -0.22233200073242188, -0.20790863037109375, -0.19348526000976562, -0.1790618896484375, -0.16463851928710938, -0.15021514892578125, -0.13579177856445312, -0.121368408203125, -0.10694503784179688, -0.09252166748046875, -0.07809829711914062, -0.0636749267578125, -0.049251556396484375, -0.03482818603515625, -0.020404815673828125, -0.0059814453125, 0.008441925048828125, 0.02286529541015625, 0.037288665771484375, 0.0517120361328125, 0.06613540649414062, 0.08055877685546875, 0.09498214721679688, 0.109405517578125, 0.12382888793945312, 0.13825225830078125, 0.15267562866210938, 0.1670989990234375, 0.18152236938476562, 0.19594573974609375, 0.21036911010742188, 0.22479248046875, 0.23921585083007812, 0.25363922119140625, 0.2680625915527344, 0.2824859619140625, 0.2969093322753906, 0.31133270263671875, 0.3257560729980469, 0.340179443359375, 0.3546028137207031, 0.36902618408203125, 0.3834495544433594, 0.3978729248046875, 0.4122962951660156, 0.42671966552734375, 0.4411430358886719, 0.45556640625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 3.0, 5.0, 14.0, 16.0, 26.0, 32.0, 62.0, 93.0, 114.0, 131.0, 116.0, 89.0, 70.0, 69.0, 31.0, 33.0, 14.0, 12.0, 9.0, 4.0, 6.0, 7.0, 7.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0292816162109375, -0.028374433517456055, -0.02746725082397461, -0.026560068130493164, -0.02565288543701172, -0.024745702743530273, -0.023838520050048828, -0.022931337356567383, -0.022024154663085938, -0.021116971969604492, -0.020209789276123047, -0.0193026065826416, -0.018395423889160156, -0.01748824119567871, -0.016581058502197266, -0.01567387580871582, -0.014766693115234375, -0.01385951042175293, -0.012952327728271484, -0.012045145034790039, -0.011137962341308594, -0.010230779647827148, -0.009323596954345703, -0.008416414260864258, -0.0075092315673828125, -0.006602048873901367, -0.005694866180419922, -0.0047876834869384766, -0.0038805007934570312, -0.002973318099975586, -0.0020661354064941406, -0.0011589527130126953, -0.00025177001953125, 0.0006554126739501953, 0.0015625953674316406, 0.002469778060913086, 0.0033769607543945312, 0.0042841434478759766, 0.005191326141357422, 0.006098508834838867, 0.0070056915283203125, 0.007912874221801758, 0.008820056915283203, 0.009727239608764648, 0.010634422302246094, 0.011541604995727539, 0.012448787689208984, 0.01335597038269043, 0.014263153076171875, 0.01517033576965332, 0.016077518463134766, 0.01698470115661621, 0.017891883850097656, 0.0187990665435791, 0.019706249237060547, 0.020613431930541992, 0.021520614624023438, 0.022427797317504883, 0.023334980010986328, 0.024242162704467773, 0.02514934539794922, 0.026056528091430664, 0.02696371078491211, 0.027870893478393555, 0.028778076171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 5.0, 8.0, 13.0, 16.0, 25.0, 61.0, 106.0, 332.0, 1121.0, 7589.0, 4140858.0, 39710.0, 3214.0, 793.0, 218.0, 84.0, 33.0, 23.0, 13.0, 11.0, 8.0, 11.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.304443359375, -0.29456329345703125, -0.2846832275390625, -0.27480316162109375, -0.264923095703125, -0.25504302978515625, -0.2451629638671875, -0.23528289794921875, -0.22540283203125, -0.21552276611328125, -0.2056427001953125, -0.19576263427734375, -0.185882568359375, -0.17600250244140625, -0.1661224365234375, -0.15624237060546875, -0.1463623046875, -0.13648223876953125, -0.1266021728515625, -0.11672210693359375, -0.106842041015625, -0.09696197509765625, -0.0870819091796875, -0.07720184326171875, -0.06732177734375, -0.05744171142578125, -0.0475616455078125, -0.03768157958984375, -0.027801513671875, -0.01792144775390625, -0.0080413818359375, 0.00183868408203125, 0.01171875, 0.02159881591796875, 0.0314788818359375, 0.04135894775390625, 0.051239013671875, 0.06111907958984375, 0.0709991455078125, 0.08087921142578125, 0.09075927734375, 0.10063934326171875, 0.1105194091796875, 0.12039947509765625, 0.130279541015625, 0.14015960693359375, 0.1500396728515625, 0.15991973876953125, 0.1697998046875, 0.17967987060546875, 0.1895599365234375, 0.19944000244140625, 0.209320068359375, 0.21920013427734375, 0.2290802001953125, 0.23896026611328125, 0.24884033203125, 0.25872039794921875, 0.2686004638671875, 0.27848052978515625, 0.288360595703125, 0.29824066162109375, 0.3081207275390625, 0.31800079345703125, 0.327880859375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 4.0, 7.0, 5.0, 7.0, 7.0, 11.0, 25.0, 31.0, 175.0, 3645.0, 67.0, 11.0, 12.0, 10.0, 10.0, 5.0, 2.0, 7.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.053619384765625, -0.0519556999206543, -0.050292015075683594, -0.04862833023071289, -0.04696464538574219, -0.045300960540771484, -0.04363727569580078, -0.04197359085083008, -0.040309906005859375, -0.03864622116088867, -0.03698253631591797, -0.035318851470947266, -0.03365516662597656, -0.03199148178100586, -0.030327796936035156, -0.028664112091064453, -0.02700042724609375, -0.025336742401123047, -0.023673057556152344, -0.02200937271118164, -0.020345687866210938, -0.018682003021240234, -0.01701831817626953, -0.015354633331298828, -0.013690948486328125, -0.012027263641357422, -0.010363578796386719, -0.008699893951416016, -0.0070362091064453125, -0.005372524261474609, -0.0037088394165039062, -0.002045154571533203, -0.0003814697265625, 0.0012822151184082031, 0.0029458999633789062, 0.004609584808349609, 0.0062732696533203125, 0.007936954498291016, 0.009600639343261719, 0.011264324188232422, 0.012928009033203125, 0.014591693878173828, 0.01625537872314453, 0.017919063568115234, 0.019582748413085938, 0.02124643325805664, 0.022910118103027344, 0.024573802947998047, 0.02623748779296875, 0.027901172637939453, 0.029564857482910156, 0.03122854232788086, 0.03289222717285156, 0.034555912017822266, 0.03621959686279297, 0.03788328170776367, 0.039546966552734375, 0.04121065139770508, 0.04287433624267578, 0.044538021087646484, 0.04620170593261719, 0.04786539077758789, 0.049529075622558594, 0.0511927604675293, 0.0528564453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 1006.0, 6.0], "bins": [-4.4444966316223145, -4.373301029205322, -4.30210542678833, -4.230909824371338, -4.159714221954346, -4.0885186195373535, -4.017323017120361, -3.9461276531219482, -3.874932050704956, -3.803736448287964, -3.7325408458709717, -3.6613452434539795, -3.5901498794555664, -3.518954277038574, -3.447758674621582, -3.37656307220459, -3.3053674697875977, -3.2341718673706055, -3.1629762649536133, -3.091780662536621, -3.020585060119629, -2.949389696121216, -2.8781940937042236, -2.8069984912872314, -2.7358028888702393, -2.664607286453247, -2.593411684036255, -2.5222160816192627, -2.4510207176208496, -2.3798251152038574, -2.3086295127868652, -2.237433910369873, -2.166238307952881, -2.0950427055358887, -2.0238471031188965, -1.9526516199111938, -1.8814560174942017, -1.8102604150772095, -1.7390649318695068, -1.6678693294525146, -1.596673846244812, -1.5254782438278198, -1.4542827606201172, -1.383087158203125, -1.3118915557861328, -1.2406959533691406, -1.1695003509521484, -1.0983048677444458, -1.0271092653274536, -0.9559136629104614, -0.884718120098114, -0.8135225772857666, -0.7423269748687744, -0.6711313724517822, -0.5999358296394348, -0.5287402868270874, -0.45754462480545044, -0.38634905219078064, -0.31515347957611084, -0.24395790696144104, -0.17276233434677124, -0.10156676173210144, -0.03037118911743164, 0.04082438349723816, 0.11201994866132736]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 13.0, 6.0, 8.0, 17.0, 21.0, 20.0, 15.0, 26.0, 38.0, 38.0, 38.0, 54.0, 54.0, 53.0, 54.0, 64.0, 53.0, 49.0, 73.0, 45.0, 45.0, 44.0, 36.0, 38.0, 17.0, 18.0, 15.0, 19.0, 10.0, 6.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1196402907371521, -0.11546975374221802, -0.11129921674728394, -0.10712868720293045, -0.10295815020799637, -0.09878761321306229, -0.0946170836687088, -0.09044654667377472, -0.08627600967884064, -0.08210547268390656, -0.07793493568897247, -0.07376440614461899, -0.0695938691496849, -0.06542333215475082, -0.06125279888510704, -0.05708226561546326, -0.052911728620529175, -0.04874119162559509, -0.04457065835595131, -0.040400125086307526, -0.036229588091373444, -0.03205905109643936, -0.027888517826795578, -0.023717982694506645, -0.019547447562217712, -0.01537691242992878, -0.011206377297639847, -0.007035842165350914, -0.002865307033061981, 0.0013052280992269516, 0.005475763231515884, 0.009646298363804817, 0.01381683349609375, 0.017987368628382683, 0.022157903760671616, 0.02632843889296055, 0.03049897402524948, 0.03466951102018356, 0.03884004428982735, 0.04301057755947113, 0.04718111455440521, 0.051351651549339294, 0.05552218481898308, 0.05969271808862686, 0.06386325508356094, 0.06803379207849503, 0.07220432162284851, 0.07637485861778259, 0.08054539561271667, 0.08471593260765076, 0.08888646960258484, 0.09305699914693832, 0.0972275361418724, 0.10139807313680649, 0.10556860268115997, 0.10973913967609406, 0.11390967667102814, 0.11808021366596222, 0.1222507506608963, 0.12642128765583038, 0.13059180974960327, 0.13476234674453735, 0.13893288373947144, 0.14310342073440552, 0.1472739577293396]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 2.0, 6.0, 9.0, 6.0, 14.0, 25.0, 42.0, 43.0, 66.0, 76.0, 110.0, 177.0, 246.0, 368.0, 525.0, 786.0, 1252.0, 1976.0, 3369.0, 6215.0, 13042.0, 35114.0, 153241.0, 673946.0, 105207.0, 27963.0, 11116.0, 5448.0, 3006.0, 1753.0, 1129.0, 709.0, 503.0, 303.0, 214.0, 152.0, 110.0, 86.0, 52.0, 39.0, 25.0, 25.0, 17.0, 11.0, 9.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0775146484375, -0.07512187957763672, -0.07272911071777344, -0.07033634185791016, -0.06794357299804688, -0.0655508041381836, -0.06315803527832031, -0.06076526641845703, -0.05837249755859375, -0.05597972869873047, -0.05358695983886719, -0.051194190979003906, -0.048801422119140625, -0.046408653259277344, -0.04401588439941406, -0.04162311553955078, -0.0392303466796875, -0.03683757781982422, -0.03444480895996094, -0.032052040100097656, -0.029659271240234375, -0.027266502380371094, -0.024873733520507812, -0.02248096466064453, -0.02008819580078125, -0.01769542694091797, -0.015302658081054688, -0.012909889221191406, -0.010517120361328125, -0.008124351501464844, -0.0057315826416015625, -0.0033388137817382812, -0.000946044921875, 0.0014467239379882812, 0.0038394927978515625, 0.006232261657714844, 0.008625030517578125, 0.011017799377441406, 0.013410568237304688, 0.01580333709716797, 0.01819610595703125, 0.02058887481689453, 0.022981643676757812, 0.025374412536621094, 0.027767181396484375, 0.030159950256347656, 0.03255271911621094, 0.03494548797607422, 0.0373382568359375, 0.03973102569580078, 0.04212379455566406, 0.044516563415527344, 0.046909332275390625, 0.049302101135253906, 0.05169486999511719, 0.05408763885498047, 0.05648040771484375, 0.05887317657470703, 0.06126594543457031, 0.0636587142944336, 0.06605148315429688, 0.06844425201416016, 0.07083702087402344, 0.07322978973388672, 0.07562255859375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 6.0, 6.0, 2.0, 7.0, 11.0, 24.0, 22.0, 35.0, 54.0, 88.0, 112.0, 127.0, 124.0, 80.0, 80.0, 54.0, 48.0, 23.0, 22.0, 13.0, 11.0, 8.0, 3.0, 8.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.02813720703125, -0.027268648147583008, -0.026400089263916016, -0.025531530380249023, -0.02466297149658203, -0.02379441261291504, -0.022925853729248047, -0.022057294845581055, -0.021188735961914062, -0.02032017707824707, -0.019451618194580078, -0.018583059310913086, -0.017714500427246094, -0.0168459415435791, -0.01597738265991211, -0.015108823776245117, -0.014240264892578125, -0.013371706008911133, -0.01250314712524414, -0.011634588241577148, -0.010766029357910156, -0.009897470474243164, -0.009028911590576172, -0.00816035270690918, -0.0072917938232421875, -0.006423234939575195, -0.005554676055908203, -0.004686117172241211, -0.0038175582885742188, -0.0029489994049072266, -0.0020804405212402344, -0.0012118816375732422, -0.00034332275390625, 0.0005252361297607422, 0.0013937950134277344, 0.0022623538970947266, 0.0031309127807617188, 0.003999471664428711, 0.004868030548095703, 0.005736589431762695, 0.0066051483154296875, 0.00747370719909668, 0.008342266082763672, 0.009210824966430664, 0.010079383850097656, 0.010947942733764648, 0.01181650161743164, 0.012685060501098633, 0.013553619384765625, 0.014422178268432617, 0.01529073715209961, 0.0161592960357666, 0.017027854919433594, 0.017896413803100586, 0.018764972686767578, 0.01963353157043457, 0.020502090454101562, 0.021370649337768555, 0.022239208221435547, 0.02310776710510254, 0.02397632598876953, 0.024844884872436523, 0.025713443756103516, 0.026582002639770508, 0.0274505615234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 4.0, 4.0, 8.0, 10.0, 17.0, 5.0, 28.0, 24.0, 30.0, 43.0, 46.0, 48.0, 56.0, 91.0, 143.0, 285.0, 571.0, 1279.0, 3418.0, 32756.0, 957643.0, 45363.0, 3816.0, 1347.0, 626.0, 295.0, 170.0, 92.0, 72.0, 59.0, 44.0, 29.0, 25.0, 16.0, 20.0, 13.0, 11.0, 15.0, 5.0, 13.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2109375, -0.20425033569335938, -0.19756317138671875, -0.19087600708007812, -0.1841888427734375, -0.17750167846679688, -0.17081451416015625, -0.16412734985351562, -0.157440185546875, -0.15075302124023438, -0.14406585693359375, -0.13737869262695312, -0.1306915283203125, -0.12400436401367188, -0.11731719970703125, -0.11063003540039062, -0.10394287109375, -0.09725570678710938, -0.09056854248046875, -0.08388137817382812, -0.0771942138671875, -0.07050704956054688, -0.06381988525390625, -0.057132720947265625, -0.050445556640625, -0.043758392333984375, -0.03707122802734375, -0.030384063720703125, -0.0236968994140625, -0.017009735107421875, -0.01032257080078125, -0.003635406494140625, 0.0030517578125, 0.009738922119140625, 0.01642608642578125, 0.023113250732421875, 0.0298004150390625, 0.036487579345703125, 0.04317474365234375, 0.049861907958984375, 0.056549072265625, 0.06323623657226562, 0.06992340087890625, 0.07661056518554688, 0.0832977294921875, 0.08998489379882812, 0.09667205810546875, 0.10335922241210938, 0.11004638671875, 0.11673355102539062, 0.12342071533203125, 0.13010787963867188, 0.1367950439453125, 0.14348220825195312, 0.15016937255859375, 0.15685653686523438, 0.163543701171875, 0.17023086547851562, 0.17691802978515625, 0.18360519409179688, 0.1902923583984375, 0.19697952270507812, 0.20366668701171875, 0.21035385131835938, 0.217041015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 10.0, 8.0, 13.0, 12.0, 12.0, 11.0, 16.0, 21.0, 19.0, 28.0, 22.0, 29.0, 25.0, 40.0, 37.0, 40.0, 33.0, 50.0, 34.0, 43.0, 54.0, 54.0, 44.0, 36.0, 35.0, 25.0, 33.0, 28.0, 24.0, 18.0, 28.0, 19.0, 26.0, 16.0, 11.0, 10.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083984375, -0.0813741683959961, -0.07876396179199219, -0.07615375518798828, -0.07354354858398438, -0.07093334197998047, -0.06832313537597656, -0.06571292877197266, -0.06310272216796875, -0.060492515563964844, -0.05788230895996094, -0.05527210235595703, -0.052661895751953125, -0.05005168914794922, -0.04744148254394531, -0.044831275939941406, -0.0422210693359375, -0.039610862731933594, -0.03700065612792969, -0.03439044952392578, -0.031780242919921875, -0.02917003631591797, -0.026559829711914062, -0.023949623107910156, -0.02133941650390625, -0.018729209899902344, -0.016119003295898438, -0.013508796691894531, -0.010898590087890625, -0.008288383483886719, -0.0056781768798828125, -0.0030679702758789062, -0.000457763671875, 0.0021524429321289062, 0.0047626495361328125, 0.007372856140136719, 0.009983062744140625, 0.012593269348144531, 0.015203475952148438, 0.017813682556152344, 0.02042388916015625, 0.023034095764160156, 0.025644302368164062, 0.02825450897216797, 0.030864715576171875, 0.03347492218017578, 0.03608512878417969, 0.038695335388183594, 0.0413055419921875, 0.043915748596191406, 0.04652595520019531, 0.04913616180419922, 0.051746368408203125, 0.05435657501220703, 0.05696678161621094, 0.059576988220214844, 0.06218719482421875, 0.06479740142822266, 0.06740760803222656, 0.07001781463623047, 0.07262802124023438, 0.07523822784423828, 0.07784843444824219, 0.0804586410522461, 0.08306884765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 7.0, 4.0, 2.0, 3.0, 9.0, 5.0, 7.0, 14.0, 30.0, 32.0, 42.0, 71.0, 160.0, 382.0, 1724.0, 40426.0, 999745.0, 4657.0, 695.0, 222.0, 103.0, 63.0, 31.0, 24.0, 23.0, 12.0, 17.0, 9.0, 11.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01221466064453125, -0.011835575103759766, -0.011456489562988281, -0.011077404022216797, -0.010698318481445312, -0.010319232940673828, -0.009940147399902344, -0.00956106185913086, -0.009181976318359375, -0.00880289077758789, -0.008423805236816406, -0.008044719696044922, -0.0076656341552734375, -0.007286548614501953, -0.006907463073730469, -0.006528377532958984, -0.0061492919921875, -0.005770206451416016, -0.005391120910644531, -0.005012035369873047, -0.0046329498291015625, -0.004253864288330078, -0.0038747787475585938, -0.0034956932067871094, -0.003116607666015625, -0.0027375221252441406, -0.0023584365844726562, -0.001979351043701172, -0.0016002655029296875, -0.0012211799621582031, -0.0008420944213867188, -0.0004630088806152344, -8.392333984375e-05, 0.0002951622009277344, 0.0006742477416992188, 0.0010533332824707031, 0.0014324188232421875, 0.0018115043640136719, 0.0021905899047851562, 0.0025696754455566406, 0.002948760986328125, 0.0033278465270996094, 0.0037069320678710938, 0.004086017608642578, 0.0044651031494140625, 0.004844188690185547, 0.005223274230957031, 0.005602359771728516, 0.0059814453125, 0.006360530853271484, 0.006739616394042969, 0.007118701934814453, 0.0074977874755859375, 0.007876873016357422, 0.008255958557128906, 0.00863504409790039, 0.009014129638671875, 0.00939321517944336, 0.009772300720214844, 0.010151386260986328, 0.010530471801757812, 0.010909557342529297, 0.011288642883300781, 0.011667728424072266, 0.01204681396484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 4.0, 4.0, 4.0, 10.0, 11.0, 13.0, 15.0, 13.0, 13.0, 27.0, 31.0, 29.0, 30.0, 67.0, 96.0, 143.0, 148.0, 72.0, 46.0, 37.0, 35.0, 30.0, 15.0, 17.0, 12.0, 8.0, 15.0, 12.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.166364669799805e-05, -4.0261074900627136e-05, -3.8858503103256226e-05, -3.7455931305885315e-05, -3.6053359508514404e-05, -3.4650787711143494e-05, -3.324821591377258e-05, -3.184564411640167e-05, -3.0443072319030762e-05, -2.904050052165985e-05, -2.763792872428894e-05, -2.623535692691803e-05, -2.483278512954712e-05, -2.343021333217621e-05, -2.2027641534805298e-05, -2.0625069737434387e-05, -1.9222497940063477e-05, -1.7819926142692566e-05, -1.6417354345321655e-05, -1.5014782547950745e-05, -1.3612210750579834e-05, -1.2209638953208923e-05, -1.0807067155838013e-05, -9.404495358467102e-06, -8.001923561096191e-06, -6.599351763725281e-06, -5.19677996635437e-06, -3.7942081689834595e-06, -2.391636371612549e-06, -9.890645742416382e-07, 4.1350722312927246e-07, 1.816079020500183e-06, 3.2186508178710938e-06, 4.621222615242004e-06, 6.023794412612915e-06, 7.426366209983826e-06, 8.828938007354736e-06, 1.0231509804725647e-05, 1.1634081602096558e-05, 1.3036653399467468e-05, 1.4439225196838379e-05, 1.584179699420929e-05, 1.72443687915802e-05, 1.864694058895111e-05, 2.004951238632202e-05, 2.1452084183692932e-05, 2.2854655981063843e-05, 2.4257227778434753e-05, 2.5659799575805664e-05, 2.7062371373176575e-05, 2.8464943170547485e-05, 2.9867514967918396e-05, 3.127008676528931e-05, 3.267265856266022e-05, 3.407523036003113e-05, 3.547780215740204e-05, 3.688037395477295e-05, 3.828294575214386e-05, 3.968551754951477e-05, 4.108808934688568e-05, 4.249066114425659e-05, 4.38932329416275e-05, 4.529580473899841e-05, 4.6698376536369324e-05, 4.8100948333740234e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 7.0, 11.0, 10.0, 13.0, 18.0, 44.0, 48.0, 134.0, 291.0, 1058.0, 15970.0, 1025587.0, 4264.0, 648.0, 210.0, 99.0, 47.0, 28.0, 18.0, 13.0, 5.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.035614013671875, -0.034708261489868164, -0.03380250930786133, -0.03289675712585449, -0.031991004943847656, -0.03108525276184082, -0.030179500579833984, -0.02927374839782715, -0.028367996215820312, -0.027462244033813477, -0.02655649185180664, -0.025650739669799805, -0.02474498748779297, -0.023839235305786133, -0.022933483123779297, -0.02202773094177246, -0.021121978759765625, -0.02021622657775879, -0.019310474395751953, -0.018404722213745117, -0.01749897003173828, -0.016593217849731445, -0.01568746566772461, -0.014781713485717773, -0.013875961303710938, -0.012970209121704102, -0.012064456939697266, -0.01115870475769043, -0.010252952575683594, -0.009347200393676758, -0.008441448211669922, -0.007535696029663086, -0.00662994384765625, -0.005724191665649414, -0.004818439483642578, -0.003912687301635742, -0.0030069351196289062, -0.0021011829376220703, -0.0011954307556152344, -0.00028967857360839844, 0.0006160736083984375, 0.0015218257904052734, 0.0024275779724121094, 0.0033333301544189453, 0.004239082336425781, 0.005144834518432617, 0.006050586700439453, 0.006956338882446289, 0.007862091064453125, 0.008767843246459961, 0.009673595428466797, 0.010579347610473633, 0.011485099792480469, 0.012390851974487305, 0.01329660415649414, 0.014202356338500977, 0.015108108520507812, 0.01601386070251465, 0.016919612884521484, 0.01782536506652832, 0.018731117248535156, 0.019636869430541992, 0.020542621612548828, 0.021448373794555664, 0.0223541259765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 7.0, 9.0, 4.0, 16.0, 27.0, 47.0, 97.0, 190.0, 245.0, 135.0, 81.0, 45.0, 21.0, 14.0, 11.0, 8.0, 4.0, 8.0, 4.0, 5.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008636474609375, -0.00829458236694336, -0.007952690124511719, -0.007610797882080078, -0.0072689056396484375, -0.006927013397216797, -0.006585121154785156, -0.006243228912353516, -0.005901336669921875, -0.005559444427490234, -0.005217552185058594, -0.004875659942626953, -0.0045337677001953125, -0.004191875457763672, -0.0038499832153320312, -0.0035080909729003906, -0.00316619873046875, -0.0028243064880371094, -0.0024824142456054688, -0.002140522003173828, -0.0017986297607421875, -0.0014567375183105469, -0.0011148452758789062, -0.0007729530334472656, -0.000431060791015625, -8.916854858398438e-05, 0.00025272369384765625, 0.0005946159362792969, 0.0009365081787109375, 0.0012784004211425781, 0.0016202926635742188, 0.0019621849060058594, 0.0023040771484375, 0.0026459693908691406, 0.0029878616333007812, 0.003329753875732422, 0.0036716461181640625, 0.004013538360595703, 0.004355430603027344, 0.004697322845458984, 0.005039215087890625, 0.005381107330322266, 0.005722999572753906, 0.006064891815185547, 0.0064067840576171875, 0.006748676300048828, 0.007090568542480469, 0.007432460784912109, 0.00777435302734375, 0.00811624526977539, 0.008458137512207031, 0.008800029754638672, 0.009141921997070312, 0.009483814239501953, 0.009825706481933594, 0.010167598724365234, 0.010509490966796875, 0.010851383209228516, 0.011193275451660156, 0.011535167694091797, 0.011877059936523438, 0.012218952178955078, 0.012560844421386719, 0.01290273666381836, 0.01324462890625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 21.0, 208.0, 734.0, 46.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.108874797821045, -3.05159592628479, -2.994317054748535, -2.9370384216308594, -2.8797595500946045, -2.8224806785583496, -2.765202045440674, -2.707923173904419, -2.650644302368164, -2.593365430831909, -2.5360865592956543, -2.4788079261779785, -2.4215290546417236, -2.3642501831054688, -2.306971549987793, -2.249692678451538, -2.192413806915283, -2.1351349353790283, -2.0778560638427734, -2.0205774307250977, -1.9632985591888428, -1.906019687652588, -1.8487409353256226, -1.7914621829986572, -1.7341833114624023, -1.6769044399261475, -1.6196256875991821, -1.5623469352722168, -1.505068063735962, -1.447789192199707, -1.3905104398727417, -1.3332316875457764, -1.275952696800232, -1.2186739444732666, -1.1613950729370117, -1.1041162014007568, -1.0468374490737915, -0.9895586371421814, -0.9322798252105713, -0.8750010132789612, -0.8177222013473511, -0.760443389415741, -0.7031645774841309, -0.6458857655525208, -0.5886069536209106, -0.5313281416893005, -0.47404932975769043, -0.4167705178260803, -0.3594917058944702, -0.3022128939628601, -0.24493408203125, -0.1876552700996399, -0.13037645816802979, -0.07309764623641968, -0.01581883430480957, 0.04145997762680054, 0.09873878955841064, 0.15601760149002075, 0.21329641342163086, 0.27057522535324097, 0.3278540372848511, 0.3851328492164612, 0.4424116611480713, 0.4996904730796814, 0.5569692850112915]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 8.0, 7.0, 12.0, 21.0, 13.0, 20.0, 11.0, 17.0, 27.0, 31.0, 28.0, 40.0, 45.0, 32.0, 45.0, 45.0, 54.0, 35.0, 41.0, 38.0, 53.0, 36.0, 34.0, 36.0, 29.0, 29.0, 33.0, 32.0, 25.0, 13.0, 17.0, 12.0, 11.0, 6.0, 10.0, 13.0, 4.0, 5.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4919113516807556, -0.4765775203704834, -0.46124371886253357, -0.44590988755226135, -0.43057605624198914, -0.4152422547340393, -0.3999084234237671, -0.3845745921134949, -0.36924076080322266, -0.35390692949295044, -0.3385731279850006, -0.3232392966747284, -0.3079054653644562, -0.29257166385650635, -0.27723783254623413, -0.2619040012359619, -0.2465701848268509, -0.23123636841773987, -0.21590253710746765, -0.20056872069835663, -0.1852348893880844, -0.1699010729789734, -0.15456724166870117, -0.13923342525959015, -0.12389960139989853, -0.10856577754020691, -0.09323195368051529, -0.07789812982082367, -0.06256431341171265, -0.04723048955202103, -0.03189666569232941, -0.016562841832637787, -0.001229017972946167, 0.014104804955422878, 0.029438627883791924, 0.044772449880838394, 0.060106273740530014, 0.07544009387493134, 0.09077391773462296, 0.10610774159431458, 0.1214415654540062, 0.13677538931369781, 0.15210920572280884, 0.16744303703308105, 0.18277685344219208, 0.1981106698513031, 0.21344450116157532, 0.22877833247184753, 0.24411214888095856, 0.2594459652900696, 0.2747797966003418, 0.290113627910614, 0.30544742941856384, 0.32078126072883606, 0.3361150920391083, 0.3514488935470581, 0.3667827248573303, 0.38211655616760254, 0.39745035767555237, 0.4127841889858246, 0.4281180202960968, 0.44345182180404663, 0.45878565311431885, 0.47411948442459106, 0.4894533157348633]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 6.0, 4.0, 5.0, 16.0, 21.0, 30.0, 42.0, 63.0, 112.0, 183.0, 806.0, 4191336.0, 1107.0, 227.0, 85.0, 71.0, 34.0, 23.0, 22.0, 16.0, 8.0, 10.0, 14.0, 6.0, 4.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.390625, -0.3782463073730469, -0.36586761474609375, -0.3534889221191406, -0.3411102294921875, -0.3287315368652344, -0.31635284423828125, -0.3039741516113281, -0.291595458984375, -0.2792167663574219, -0.26683807373046875, -0.2544593811035156, -0.2420806884765625, -0.22970199584960938, -0.21732330322265625, -0.20494461059570312, -0.19256591796875, -0.18018722534179688, -0.16780853271484375, -0.15542984008789062, -0.1430511474609375, -0.13067245483398438, -0.11829376220703125, -0.10591506958007812, -0.093536376953125, -0.08115768432617188, -0.06877899169921875, -0.056400299072265625, -0.0440216064453125, -0.031642913818359375, -0.01926422119140625, -0.006885528564453125, 0.0054931640625, 0.017871856689453125, 0.03025054931640625, 0.042629241943359375, 0.0550079345703125, 0.06738662719726562, 0.07976531982421875, 0.09214401245117188, 0.104522705078125, 0.11690139770507812, 0.12928009033203125, 0.14165878295898438, 0.1540374755859375, 0.16641616821289062, 0.17879486083984375, 0.19117355346679688, 0.20355224609375, 0.21593093872070312, 0.22830963134765625, 0.24068832397460938, 0.2530670166015625, 0.2654457092285156, 0.27782440185546875, 0.2902030944824219, 0.302581787109375, 0.3149604797363281, 0.32733917236328125, 0.3397178649902344, 0.3520965576171875, 0.3644752502441406, 0.37685394287109375, 0.3892326354980469, 0.401611328125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 4.0, 8.0, 26.0, 21.0, 38.0, 49.0, 81.0, 105.0, 99.0, 103.0, 90.0, 84.0, 69.0, 51.0, 28.0, 24.0, 16.0, 19.0, 8.0, 12.0, 14.0, 6.0, 6.0, 1.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.025146484375, -0.024355649948120117, -0.023564815521240234, -0.02277398109436035, -0.02198314666748047, -0.021192312240600586, -0.020401477813720703, -0.01961064338684082, -0.018819808959960938, -0.018028974533081055, -0.017238140106201172, -0.01644730567932129, -0.015656471252441406, -0.014865636825561523, -0.01407480239868164, -0.013283967971801758, -0.012493133544921875, -0.011702299118041992, -0.01091146469116211, -0.010120630264282227, -0.009329795837402344, -0.008538961410522461, -0.007748126983642578, -0.006957292556762695, -0.0061664581298828125, -0.00537562370300293, -0.004584789276123047, -0.003793954849243164, -0.0030031204223632812, -0.0022122859954833984, -0.0014214515686035156, -0.0006306171417236328, 0.00016021728515625, 0.0009510517120361328, 0.0017418861389160156, 0.0025327205657958984, 0.0033235549926757812, 0.004114389419555664, 0.004905223846435547, 0.00569605827331543, 0.0064868927001953125, 0.007277727127075195, 0.008068561553955078, 0.008859395980834961, 0.009650230407714844, 0.010441064834594727, 0.01123189926147461, 0.012022733688354492, 0.012813568115234375, 0.013604402542114258, 0.01439523696899414, 0.015186071395874023, 0.015976905822753906, 0.01676774024963379, 0.017558574676513672, 0.018349409103393555, 0.019140243530273438, 0.01993107795715332, 0.020721912384033203, 0.021512746810913086, 0.02230358123779297, 0.02309441566467285, 0.023885250091552734, 0.024676084518432617, 0.0254669189453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 5.0, 19.0, 38.0, 96.0, 238.0, 704.0, 2225.0, 13427.0, 4169797.0, 5771.0, 1334.0, 389.0, 113.0, 50.0, 28.0, 14.0, 11.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1220703125, -0.11850929260253906, -0.11494827270507812, -0.11138725280761719, -0.10782623291015625, -0.10426521301269531, -0.10070419311523438, -0.09714317321777344, -0.0935821533203125, -0.09002113342285156, -0.08646011352539062, -0.08289909362792969, -0.07933807373046875, -0.07577705383300781, -0.07221603393554688, -0.06865501403808594, -0.065093994140625, -0.06153297424316406, -0.057971954345703125, -0.05441093444824219, -0.05084991455078125, -0.04728889465332031, -0.043727874755859375, -0.04016685485839844, -0.0366058349609375, -0.03304481506347656, -0.029483795166015625, -0.025922775268554688, -0.02236175537109375, -0.018800735473632812, -0.015239715576171875, -0.011678695678710938, -0.00811767578125, -0.0045566558837890625, -0.000995635986328125, 0.0025653839111328125, 0.00612640380859375, 0.009687423706054688, 0.013248443603515625, 0.016809463500976562, 0.0203704833984375, 0.023931503295898438, 0.027492523193359375, 0.031053543090820312, 0.03461456298828125, 0.03817558288574219, 0.041736602783203125, 0.04529762268066406, 0.048858642578125, 0.05241966247558594, 0.055980682373046875, 0.05954170227050781, 0.06310272216796875, 0.06666374206542969, 0.07022476196289062, 0.07378578186035156, 0.0773468017578125, 0.08090782165527344, 0.08446884155273438, 0.08802986145019531, 0.09159088134765625, 0.09515190124511719, 0.09871292114257812, 0.10227394104003906, 0.1058349609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 10.0, 27.0, 139.0, 3774.0, 66.0, 23.0, 10.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0230255126953125, -0.022264480590820312, -0.021503448486328125, -0.020742416381835938, -0.01998138427734375, -0.019220352172851562, -0.018459320068359375, -0.017698287963867188, -0.016937255859375, -0.016176223754882812, -0.015415191650390625, -0.014654159545898438, -0.01389312744140625, -0.013132095336914062, -0.012371063232421875, -0.011610031127929688, -0.0108489990234375, -0.010087966918945312, -0.009326934814453125, -0.008565902709960938, -0.00780487060546875, -0.0070438385009765625, -0.006282806396484375, -0.0055217742919921875, -0.0047607421875, -0.0039997100830078125, -0.003238677978515625, -0.0024776458740234375, -0.00171661376953125, -0.0009555816650390625, -0.000194549560546875, 0.0005664825439453125, 0.0013275146484375, 0.0020885467529296875, 0.002849578857421875, 0.0036106109619140625, 0.00437164306640625, 0.0051326751708984375, 0.005893707275390625, 0.0066547393798828125, 0.007415771484375, 0.008176803588867188, 0.008937835693359375, 0.009698867797851562, 0.01045989990234375, 0.011220932006835938, 0.011981964111328125, 0.012742996215820312, 0.0135040283203125, 0.014265060424804688, 0.015026092529296875, 0.015787124633789062, 0.01654815673828125, 0.017309188842773438, 0.018070220947265625, 0.018831253051757812, 0.01959228515625, 0.020353317260742188, 0.021114349365234375, 0.021875381469726562, 0.02263641357421875, 0.023397445678710938, 0.024158477783203125, 0.024919509887695312, 0.0256805419921875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 26.0, 95.0, 664.0, 182.0, 23.0, 11.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02374577894806862, -0.021013734862208366, -0.018281690776348114, -0.015549646690487862, -0.01281760260462761, -0.010085558518767357, -0.0073535144329071045, -0.004621470347046852, -0.0018894262611865997, 0.0008426178246736526, 0.003574661910533905, 0.006306705996394157, 0.00903875008225441, 0.011770794168114662, 0.014502838253974915, 0.017234882339835167, 0.01996692642569542, 0.02269897051155567, 0.025431014597415924, 0.028163058683276176, 0.03089510276913643, 0.03362714499235153, 0.036359190940856934, 0.039091236889362335, 0.04182327911257744, 0.04455532133579254, 0.04728736728429794, 0.050019413232803345, 0.05275145545601845, 0.05548349767923355, 0.05821554362773895, 0.060947589576244354, 0.06367963552474976, 0.06641168147325516, 0.06914372742176056, 0.07187576591968536, 0.07460781186819077, 0.07733985781669617, 0.08007189631462097, 0.08280394226312637, 0.08553598821163177, 0.08826803416013718, 0.09100008010864258, 0.09373211860656738, 0.09646416455507278, 0.09919621050357819, 0.10192824900150299, 0.10466029495000839, 0.1073923408985138, 0.1101243868470192, 0.1128564327955246, 0.1155884712934494, 0.1183205172419548, 0.1210525631904602, 0.12378460168838501, 0.126516655087471, 0.1292486935853958, 0.13198073208332062, 0.13471278548240662, 0.13744482398033142, 0.14017686247825623, 0.14290891587734222, 0.14564095437526703, 0.14837300777435303, 0.15110504627227783]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 10.0, 12.0, 15.0, 19.0, 25.0, 24.0, 31.0, 31.0, 44.0, 38.0, 36.0, 76.0, 54.0, 55.0, 51.0, 53.0, 46.0, 56.0, 40.0, 35.0, 46.0, 32.0, 32.0, 38.0, 31.0, 12.0, 9.0, 12.0, 7.0, 2.0, 6.0, 0.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034337759017944336, -0.03314549848437309, -0.03195323795080185, -0.030760977417230606, -0.029568716883659363, -0.02837645635008812, -0.027184195816516876, -0.025991935282945633, -0.02479967474937439, -0.023607414215803146, -0.022415153682231903, -0.02122289314866066, -0.020030632615089417, -0.018838372081518173, -0.01764611154794693, -0.016453851014375687, -0.015261590480804443, -0.0140693299472332, -0.012877069413661957, -0.011684808880090714, -0.01049254834651947, -0.009300287812948227, -0.008108027279376984, -0.00691576674580574, -0.005723506212234497, -0.004531245678663254, -0.0033389851450920105, -0.002146724611520767, -0.0009544640779495239, 0.00023779645562171936, 0.0014300569891929626, 0.002622317522764206, 0.0038145780563354492, 0.0050068385899066925, 0.006199099123477936, 0.007391359657049179, 0.008583620190620422, 0.009775880724191666, 0.010968141257762909, 0.012160401791334152, 0.013352662324905396, 0.014544922858476639, 0.015737183392047882, 0.016929443925619125, 0.01812170445919037, 0.019313964992761612, 0.020506225526332855, 0.0216984860599041, 0.022890746593475342, 0.024083007127046585, 0.02527526766061783, 0.02646752819418907, 0.027659788727760315, 0.028852049261331558, 0.0300443097949028, 0.031236570328474045, 0.03242883086204529, 0.03362109139561653, 0.034813351929187775, 0.03600561246275902, 0.03719787299633026, 0.038390133529901505, 0.03958239406347275, 0.04077465459704399, 0.041966915130615234]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 10.0, 8.0, 15.0, 13.0, 19.0, 47.0, 47.0, 79.0, 118.0, 175.0, 273.0, 376.0, 635.0, 1032.0, 1763.0, 3183.0, 5731.0, 12789.0, 32893.0, 125702.0, 647680.0, 150027.0, 36870.0, 13889.0, 6707.0, 3441.0, 1830.0, 1136.0, 764.0, 473.0, 253.0, 188.0, 118.0, 86.0, 52.0, 42.0, 38.0, 17.0, 6.0, 10.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.052703857421875, -0.05108499526977539, -0.04946613311767578, -0.04784727096557617, -0.04622840881347656, -0.04460954666137695, -0.042990684509277344, -0.041371822357177734, -0.039752960205078125, -0.038134098052978516, -0.036515235900878906, -0.0348963737487793, -0.03327751159667969, -0.03165864944458008, -0.03003978729248047, -0.02842092514038086, -0.02680206298828125, -0.02518320083618164, -0.02356433868408203, -0.021945476531982422, -0.020326614379882812, -0.018707752227783203, -0.017088890075683594, -0.015470027923583984, -0.013851165771484375, -0.012232303619384766, -0.010613441467285156, -0.008994579315185547, -0.0073757171630859375, -0.005756855010986328, -0.004137992858886719, -0.0025191307067871094, -0.0009002685546875, 0.0007185935974121094, 0.0023374557495117188, 0.003956317901611328, 0.0055751800537109375, 0.007194042205810547, 0.008812904357910156, 0.010431766510009766, 0.012050628662109375, 0.013669490814208984, 0.015288352966308594, 0.016907215118408203, 0.018526077270507812, 0.020144939422607422, 0.02176380157470703, 0.02338266372680664, 0.02500152587890625, 0.02662038803100586, 0.02823925018310547, 0.029858112335205078, 0.03147697448730469, 0.0330958366394043, 0.034714698791503906, 0.036333560943603516, 0.037952423095703125, 0.039571285247802734, 0.041190147399902344, 0.04280900955200195, 0.04442787170410156, 0.04604673385620117, 0.04766559600830078, 0.04928445816040039, 0.0509033203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 5.0, 3.0, 8.0, 4.0, 5.0, 5.0, 15.0, 24.0, 30.0, 37.0, 60.0, 89.0, 104.0, 101.0, 96.0, 88.0, 82.0, 62.0, 48.0, 22.0, 20.0, 18.0, 15.0, 8.0, 14.0, 10.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0245361328125, -0.02375626564025879, -0.022976398468017578, -0.022196531295776367, -0.021416664123535156, -0.020636796951293945, -0.019856929779052734, -0.019077062606811523, -0.018297195434570312, -0.0175173282623291, -0.01673746109008789, -0.01595759391784668, -0.015177726745605469, -0.014397859573364258, -0.013617992401123047, -0.012838125228881836, -0.012058258056640625, -0.011278390884399414, -0.010498523712158203, -0.009718656539916992, -0.008938789367675781, -0.00815892219543457, -0.007379055023193359, -0.0065991878509521484, -0.0058193206787109375, -0.0050394535064697266, -0.004259586334228516, -0.0034797191619873047, -0.0026998519897460938, -0.0019199848175048828, -0.0011401176452636719, -0.00036025047302246094, 0.00041961669921875, 0.001199483871459961, 0.001979351043701172, 0.002759218215942383, 0.0035390853881835938, 0.004318952560424805, 0.005098819732666016, 0.0058786869049072266, 0.0066585540771484375, 0.0074384212493896484, 0.00821828842163086, 0.00899815559387207, 0.009778022766113281, 0.010557889938354492, 0.011337757110595703, 0.012117624282836914, 0.012897491455078125, 0.013677358627319336, 0.014457225799560547, 0.015237092971801758, 0.01601696014404297, 0.01679682731628418, 0.01757669448852539, 0.0183565616607666, 0.019136428833007812, 0.019916296005249023, 0.020696163177490234, 0.021476030349731445, 0.022255897521972656, 0.023035764694213867, 0.023815631866455078, 0.02459549903869629, 0.0253753662109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 7.0, 12.0, 19.0, 11.0, 21.0, 19.0, 33.0, 41.0, 54.0, 55.0, 76.0, 119.0, 156.0, 253.0, 400.0, 556.0, 971.0, 1850.0, 4997.0, 28305.0, 606758.0, 371921.0, 23186.0, 4382.0, 1643.0, 916.0, 552.0, 352.0, 244.0, 156.0, 112.0, 86.0, 66.0, 36.0, 48.0, 27.0, 22.0, 19.0, 17.0, 12.0, 7.0, 6.0, 5.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09161376953125, -0.08844947814941406, -0.08528518676757812, -0.08212089538574219, -0.07895660400390625, -0.07579231262207031, -0.07262802124023438, -0.06946372985839844, -0.0662994384765625, -0.06313514709472656, -0.059970855712890625, -0.05680656433105469, -0.05364227294921875, -0.05047798156738281, -0.047313690185546875, -0.04414939880371094, -0.040985107421875, -0.03782081604003906, -0.034656524658203125, -0.03149223327636719, -0.02832794189453125, -0.025163650512695312, -0.021999359130859375, -0.018835067749023438, -0.0156707763671875, -0.012506484985351562, -0.009342193603515625, -0.0061779022216796875, -0.00301361083984375, 0.0001506805419921875, 0.003314971923828125, 0.0064792633056640625, 0.0096435546875, 0.012807846069335938, 0.015972137451171875, 0.019136428833007812, 0.02230072021484375, 0.025465011596679688, 0.028629302978515625, 0.03179359436035156, 0.0349578857421875, 0.03812217712402344, 0.041286468505859375, 0.04445075988769531, 0.04761505126953125, 0.05077934265136719, 0.053943634033203125, 0.05710792541503906, 0.060272216796875, 0.06343650817871094, 0.06660079956054688, 0.06976509094238281, 0.07292938232421875, 0.07609367370605469, 0.07925796508789062, 0.08242225646972656, 0.0855865478515625, 0.08875083923339844, 0.09191513061523438, 0.09507942199707031, 0.09824371337890625, 0.10140800476074219, 0.10457229614257812, 0.10773658752441406, 0.11090087890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 8.0, 10.0, 14.0, 14.0, 18.0, 18.0, 20.0, 26.0, 27.0, 33.0, 28.0, 30.0, 30.0, 35.0, 36.0, 52.0, 30.0, 42.0, 38.0, 39.0, 43.0, 36.0, 39.0, 26.0, 34.0, 27.0, 41.0, 26.0, 16.0, 25.0, 18.0, 19.0, 15.0, 13.0, 10.0, 10.0, 10.0, 8.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.07598876953125, -0.07383108139038086, -0.07167339324951172, -0.06951570510864258, -0.06735801696777344, -0.0652003288269043, -0.06304264068603516, -0.060884952545166016, -0.058727264404296875, -0.056569576263427734, -0.054411888122558594, -0.05225419998168945, -0.05009651184082031, -0.04793882369995117, -0.04578113555908203, -0.04362344741821289, -0.04146575927734375, -0.03930807113647461, -0.03715038299560547, -0.03499269485473633, -0.03283500671386719, -0.030677318572998047, -0.028519630432128906, -0.026361942291259766, -0.024204254150390625, -0.022046566009521484, -0.019888877868652344, -0.017731189727783203, -0.015573501586914062, -0.013415813446044922, -0.011258125305175781, -0.00910043716430664, -0.0069427490234375, -0.004785060882568359, -0.0026273727416992188, -0.0004696846008300781, 0.0016880035400390625, 0.003845691680908203, 0.006003379821777344, 0.008161067962646484, 0.010318756103515625, 0.012476444244384766, 0.014634132385253906, 0.016791820526123047, 0.018949508666992188, 0.021107196807861328, 0.02326488494873047, 0.02542257308959961, 0.02758026123046875, 0.02973794937133789, 0.03189563751220703, 0.03405332565307617, 0.03621101379394531, 0.03836870193481445, 0.040526390075683594, 0.042684078216552734, 0.044841766357421875, 0.046999454498291016, 0.049157142639160156, 0.0513148307800293, 0.05347251892089844, 0.05563020706176758, 0.05778789520263672, 0.05994558334350586, 0.062103271484375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 3.0, 2.0, 6.0, 4.0, 8.0, 9.0, 8.0, 25.0, 25.0, 21.0, 22.0, 27.0, 54.0, 70.0, 84.0, 123.0, 174.0, 314.0, 580.0, 1559.0, 5723.0, 52761.0, 949563.0, 30380.0, 4316.0, 1233.0, 558.0, 244.0, 176.0, 129.0, 85.0, 60.0, 51.0, 27.0, 27.0, 16.0, 21.0, 14.0, 10.0, 9.0, 7.0, 5.0, 7.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00449371337890625, -0.004359185695648193, -0.004224658012390137, -0.00409013032913208, -0.0039556026458740234, -0.003821074962615967, -0.00368654727935791, -0.0035520195960998535, -0.003417491912841797, -0.0032829642295837402, -0.0031484365463256836, -0.003013908863067627, -0.0028793811798095703, -0.0027448534965515137, -0.002610325813293457, -0.0024757981300354004, -0.0023412704467773438, -0.002206742763519287, -0.0020722150802612305, -0.0019376873970031738, -0.0018031597137451172, -0.0016686320304870605, -0.001534104347229004, -0.0013995766639709473, -0.0012650489807128906, -0.001130521297454834, -0.0009959936141967773, -0.0008614659309387207, -0.0007269382476806641, -0.0005924105644226074, -0.0004578828811645508, -0.00032335519790649414, -0.0001888275146484375, -5.429983139038086e-05, 8.022785186767578e-05, 0.00021475553512573242, 0.00034928321838378906, 0.0004838109016418457, 0.0006183385848999023, 0.000752866268157959, 0.0008873939514160156, 0.0010219216346740723, 0.001156449317932129, 0.0012909770011901855, 0.0014255046844482422, 0.0015600323677062988, 0.0016945600509643555, 0.0018290877342224121, 0.0019636154174804688, 0.0020981431007385254, 0.002232670783996582, 0.0023671984672546387, 0.0025017261505126953, 0.002636253833770752, 0.0027707815170288086, 0.0029053092002868652, 0.003039836883544922, 0.0031743645668029785, 0.003308892250061035, 0.003443419933319092, 0.0035779476165771484, 0.003712475299835205, 0.0038470029830932617, 0.003981530666351318, 0.004116058349609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 3.0, 3.0, 7.0, 7.0, 16.0, 22.0, 15.0, 27.0, 50.0, 66.0, 83.0, 162.0, 171.0, 106.0, 79.0, 38.0, 32.0, 30.0, 15.0, 14.0, 11.0, 7.0, 7.0, 3.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.0558319091796875e-05, -5.8671459555625916e-05, -5.6784600019454956e-05, -5.4897740483283997e-05, -5.301088094711304e-05, -5.112402141094208e-05, -4.923716187477112e-05, -4.735030233860016e-05, -4.54634428024292e-05, -4.357658326625824e-05, -4.168972373008728e-05, -3.980286419391632e-05, -3.791600465774536e-05, -3.60291451215744e-05, -3.414228558540344e-05, -3.225542604923248e-05, -3.0368566513061523e-05, -2.8481706976890564e-05, -2.6594847440719604e-05, -2.4707987904548645e-05, -2.2821128368377686e-05, -2.0934268832206726e-05, -1.9047409296035767e-05, -1.7160549759864807e-05, -1.5273690223693848e-05, -1.3386830687522888e-05, -1.1499971151351929e-05, -9.61311161518097e-06, -7.72625207901001e-06, -5.83939254283905e-06, -3.952533006668091e-06, -2.0656734704971313e-06, -1.7881393432617188e-07, 1.7080456018447876e-06, 3.594905138015747e-06, 5.4817646741867065e-06, 7.368624210357666e-06, 9.255483746528625e-06, 1.1142343282699585e-05, 1.3029202818870544e-05, 1.4916062355041504e-05, 1.6802921891212463e-05, 1.8689781427383423e-05, 2.0576640963554382e-05, 2.2463500499725342e-05, 2.43503600358963e-05, 2.623721957206726e-05, 2.812407910823822e-05, 3.001093864440918e-05, 3.189779818058014e-05, 3.37846577167511e-05, 3.567151725292206e-05, 3.755837678909302e-05, 3.944523632526398e-05, 4.1332095861434937e-05, 4.3218955397605896e-05, 4.5105814933776855e-05, 4.6992674469947815e-05, 4.8879534006118774e-05, 5.0766393542289734e-05, 5.265325307846069e-05, 5.454011261463165e-05, 5.642697215080261e-05, 5.831383168697357e-05, 6.020069122314453e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 23.0, 14.0, 27.0, 31.0, 48.0, 62.0, 100.0, 177.0, 320.0, 719.0, 2729.0, 23573.0, 995007.0, 21240.0, 2796.0, 843.0, 319.0, 176.0, 93.0, 66.0, 43.0, 35.0, 30.0, 16.0, 10.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0117645263671875, -0.011423349380493164, -0.011082172393798828, -0.010740995407104492, -0.010399818420410156, -0.01005864143371582, -0.009717464447021484, -0.009376287460327148, -0.009035110473632812, -0.008693933486938477, -0.00835275650024414, -0.008011579513549805, -0.007670402526855469, -0.007329225540161133, -0.006988048553466797, -0.006646871566772461, -0.006305694580078125, -0.005964517593383789, -0.005623340606689453, -0.005282163619995117, -0.004940986633300781, -0.004599809646606445, -0.004258632659912109, -0.0039174556732177734, -0.0035762786865234375, -0.0032351016998291016, -0.0028939247131347656, -0.0025527477264404297, -0.0022115707397460938, -0.0018703937530517578, -0.0015292167663574219, -0.001188039779663086, -0.00084686279296875, -0.0005056858062744141, -0.00016450881958007812, 0.0001766681671142578, 0.0005178451538085938, 0.0008590221405029297, 0.0012001991271972656, 0.0015413761138916016, 0.0018825531005859375, 0.0022237300872802734, 0.0025649070739746094, 0.0029060840606689453, 0.0032472610473632812, 0.003588438034057617, 0.003929615020751953, 0.004270792007446289, 0.004611968994140625, 0.004953145980834961, 0.005294322967529297, 0.005635499954223633, 0.005976676940917969, 0.006317853927612305, 0.006659030914306641, 0.0070002079010009766, 0.0073413848876953125, 0.0076825618743896484, 0.008023738861083984, 0.00836491584777832, 0.008706092834472656, 0.009047269821166992, 0.009388446807861328, 0.009729623794555664, 0.01007080078125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 7.0, 6.0, 12.0, 21.0, 27.0, 28.0, 61.0, 91.0, 155.0, 202.0, 136.0, 65.0, 46.0, 23.0, 23.0, 17.0, 11.0, 4.0, 8.0, 6.0, 6.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0066375732421875, -0.0064125657081604, -0.006187558174133301, -0.005962550640106201, -0.0057375431060791016, -0.005512535572052002, -0.005287528038024902, -0.005062520503997803, -0.004837512969970703, -0.0046125054359436035, -0.004387497901916504, -0.004162490367889404, -0.003937482833862305, -0.003712475299835205, -0.0034874677658081055, -0.003262460231781006, -0.0030374526977539062, -0.0028124451637268066, -0.002587437629699707, -0.0023624300956726074, -0.002137422561645508, -0.0019124150276184082, -0.0016874074935913086, -0.001462399959564209, -0.0012373924255371094, -0.0010123848915100098, -0.0007873773574829102, -0.0005623698234558105, -0.00033736228942871094, -0.00011235475540161133, 0.00011265277862548828, 0.0003376603126525879, 0.0005626678466796875, 0.0007876753807067871, 0.0010126829147338867, 0.0012376904487609863, 0.001462697982788086, 0.0016877055168151855, 0.0019127130508422852, 0.0021377205848693848, 0.0023627281188964844, 0.002587735652923584, 0.0028127431869506836, 0.003037750720977783, 0.003262758255004883, 0.0034877657890319824, 0.003712773323059082, 0.003937780857086182, 0.004162788391113281, 0.004387795925140381, 0.0046128034591674805, 0.00483781099319458, 0.00506281852722168, 0.005287826061248779, 0.005512833595275879, 0.0057378411293029785, 0.005962848663330078, 0.006187856197357178, 0.006412863731384277, 0.006637871265411377, 0.0068628787994384766, 0.007087886333465576, 0.007312893867492676, 0.007537901401519775, 0.007762908935546875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 13.0, 17.0, 69.0, 297.0, 535.0, 54.0, 15.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5895233154296875, -1.5601515769958496, -1.5307799577713013, -1.501408338546753, -1.472036600112915, -1.4426648616790771, -1.4132932424545288, -1.3839216232299805, -1.3545498847961426, -1.3251781463623047, -1.2958065271377563, -1.266434907913208, -1.2370631694793701, -1.2076914310455322, -1.1783198118209839, -1.1489481925964355, -1.1195764541625977, -1.0902047157287598, -1.0608330965042114, -1.031461477279663, -1.0020897388458252, -0.9727180600166321, -0.943346381187439, -0.9139747023582458, -0.8846030235290527, -0.8552313446998596, -0.8258596658706665, -0.7964879870414734, -0.7671163082122803, -0.7377446293830872, -0.708372950553894, -0.6790012717247009, -0.6496295928955078, -0.6202579140663147, -0.5908862352371216, -0.5615145564079285, -0.5321428775787354, -0.5027711987495422, -0.4733995199203491, -0.444027841091156, -0.4146561622619629, -0.3852844834327698, -0.35591280460357666, -0.32654112577438354, -0.29716944694519043, -0.2677977681159973, -0.2384260892868042, -0.20905441045761108, -0.17968273162841797, -0.15031105279922485, -0.12093937397003174, -0.09156769514083862, -0.06219601631164551, -0.03282433748245239, -0.0034526586532592773, 0.025919020175933838, 0.05529069900512695, 0.08466237783432007, 0.11403405666351318, 0.1434057354927063, 0.17277741432189941, 0.20214909315109253, 0.23152077198028564, 0.26089245080947876, 0.2902641296386719]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 4.0, 7.0, 6.0, 10.0, 13.0, 15.0, 22.0, 19.0, 18.0, 35.0, 33.0, 36.0, 41.0, 46.0, 37.0, 49.0, 62.0, 54.0, 55.0, 64.0, 47.0, 44.0, 43.0, 27.0, 42.0, 36.0, 20.0, 21.0, 16.0, 14.0, 8.0, 12.0, 6.0, 7.0, 6.0, 5.0, 6.0, 6.0, 0.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.5914543867111206, -0.5761537551879883, -0.560853123664856, -0.5455524921417236, -0.5302518606185913, -0.5149512887001038, -0.49965065717697144, -0.4843500256538391, -0.4690493941307068, -0.45374876260757446, -0.43844813108444214, -0.4231475293636322, -0.4078468978404999, -0.39254626631736755, -0.3772456645965576, -0.3619450330734253, -0.34664440155029297, -0.33134377002716064, -0.3160431385040283, -0.3007425367832184, -0.28544190526008606, -0.27014127373695374, -0.2548406720161438, -0.23954004049301147, -0.22423940896987915, -0.20893877744674683, -0.1936381608247757, -0.17833754420280457, -0.16303691267967224, -0.14773628115653992, -0.1324356645345688, -0.11713504046201706, -0.10183441638946533, -0.0865337923169136, -0.07123316824436188, -0.05593254417181015, -0.04063192009925842, -0.025331296026706696, -0.010030671954154968, 0.005269952118396759, 0.020570576190948486, 0.035871200263500214, 0.05117182433605194, 0.06647244840860367, 0.0817730724811554, 0.09707369655370712, 0.11237432062625885, 0.12767493724822998, 0.1429755687713623, 0.15827620029449463, 0.17357681691646576, 0.1888774335384369, 0.2041780650615692, 0.21947869658470154, 0.23477931320667267, 0.2500799298286438, 0.2653805613517761, 0.28068119287490845, 0.29598182439804077, 0.3112824261188507, 0.32658305764198303, 0.34188368916511536, 0.3571842908859253, 0.3724849224090576, 0.38778555393218994]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 9.0, 3.0, 5.0, 11.0, 14.0, 16.0, 29.0, 33.0, 43.0, 58.0, 81.0, 93.0, 167.0, 280.0, 467.0, 822.0, 1455.0, 3965.0, 51894.0, 4117068.0, 12179.0, 2467.0, 1092.0, 661.0, 394.0, 274.0, 164.0, 145.0, 93.0, 71.0, 46.0, 48.0, 31.0, 29.0, 9.0, 19.0, 9.0, 8.0, 8.0, 5.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.050140380859375, -0.04848670959472656, -0.046833038330078125, -0.04517936706542969, -0.04352569580078125, -0.04187202453613281, -0.040218353271484375, -0.03856468200683594, -0.0369110107421875, -0.03525733947753906, -0.033603668212890625, -0.03194999694824219, -0.03029632568359375, -0.028642654418945312, -0.026988983154296875, -0.025335311889648438, -0.023681640625, -0.022027969360351562, -0.020374298095703125, -0.018720626831054688, -0.01706695556640625, -0.015413284301757812, -0.013759613037109375, -0.012105941772460938, -0.0104522705078125, -0.008798599243164062, -0.007144927978515625, -0.0054912567138671875, -0.00383758544921875, -0.0021839141845703125, -0.000530242919921875, 0.0011234283447265625, 0.002777099609375, 0.0044307708740234375, 0.006084442138671875, 0.0077381134033203125, 0.00939178466796875, 0.011045455932617188, 0.012699127197265625, 0.014352798461914062, 0.0160064697265625, 0.017660140991210938, 0.019313812255859375, 0.020967483520507812, 0.02262115478515625, 0.024274826049804688, 0.025928497314453125, 0.027582168579101562, 0.02923583984375, 0.030889511108398438, 0.032543182373046875, 0.03419685363769531, 0.03585052490234375, 0.03750419616699219, 0.039157867431640625, 0.04081153869628906, 0.0424652099609375, 0.04411888122558594, 0.045772552490234375, 0.04742622375488281, 0.04907989501953125, 0.05073356628417969, 0.052387237548828125, 0.05404090881347656, 0.055694580078125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 3.0, 3.0, 6.0, 11.0, 17.0, 21.0, 34.0, 52.0, 55.0, 90.0, 98.0, 108.0, 80.0, 96.0, 67.0, 63.0, 36.0, 35.0, 24.0, 14.0, 22.0, 8.0, 9.0, 5.0, 10.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0225677490234375, -0.021822690963745117, -0.021077632904052734, -0.02033257484436035, -0.01958751678466797, -0.018842458724975586, -0.018097400665283203, -0.01735234260559082, -0.016607284545898438, -0.015862226486206055, -0.015117168426513672, -0.014372110366821289, -0.013627052307128906, -0.012881994247436523, -0.01213693618774414, -0.011391878128051758, -0.010646820068359375, -0.009901762008666992, -0.00915670394897461, -0.008411645889282227, -0.007666587829589844, -0.006921529769897461, -0.006176471710205078, -0.005431413650512695, -0.0046863555908203125, -0.00394129753112793, -0.003196239471435547, -0.002451181411743164, -0.0017061233520507812, -0.0009610652923583984, -0.00021600723266601562, 0.0005290508270263672, 0.00127410888671875, 0.002019166946411133, 0.0027642250061035156, 0.0035092830657958984, 0.004254341125488281, 0.004999399185180664, 0.005744457244873047, 0.00648951530456543, 0.0072345733642578125, 0.007979631423950195, 0.008724689483642578, 0.009469747543334961, 0.010214805603027344, 0.010959863662719727, 0.01170492172241211, 0.012449979782104492, 0.013195037841796875, 0.013940095901489258, 0.01468515396118164, 0.015430212020874023, 0.016175270080566406, 0.01692032814025879, 0.017665386199951172, 0.018410444259643555, 0.019155502319335938, 0.01990056037902832, 0.020645618438720703, 0.021390676498413086, 0.02213573455810547, 0.02288079261779785, 0.023625850677490234, 0.024370908737182617, 0.025115966796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 20.0, 21.0, 47.0, 132.0, 511.0, 2511.0, 4009577.0, 179171.0, 1652.0, 392.0, 130.0, 62.0, 18.0, 18.0, 1.0, 7.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218994140625, -0.2121448516845703, -0.20529556274414062, -0.19844627380371094, -0.19159698486328125, -0.18474769592285156, -0.17789840698242188, -0.1710491180419922, -0.1641998291015625, -0.1573505401611328, -0.15050125122070312, -0.14365196228027344, -0.13680267333984375, -0.12995338439941406, -0.12310409545898438, -0.11625480651855469, -0.109405517578125, -0.10255622863769531, -0.09570693969726562, -0.08885765075683594, -0.08200836181640625, -0.07515907287597656, -0.06830978393554688, -0.06146049499511719, -0.0546112060546875, -0.04776191711425781, -0.040912628173828125, -0.03406333923339844, -0.02721405029296875, -0.020364761352539062, -0.013515472412109375, -0.0066661834716796875, 0.00018310546875, 0.0070323944091796875, 0.013881683349609375, 0.020730972290039062, 0.02758026123046875, 0.03442955017089844, 0.041278839111328125, 0.04812812805175781, 0.0549774169921875, 0.06182670593261719, 0.06867599487304688, 0.07552528381347656, 0.08237457275390625, 0.08922386169433594, 0.09607315063476562, 0.10292243957519531, 0.109771728515625, 0.11662101745605469, 0.12347030639648438, 0.13031959533691406, 0.13716888427734375, 0.14401817321777344, 0.15086746215820312, 0.1577167510986328, 0.1645660400390625, 0.1714153289794922, 0.17826461791992188, 0.18511390686035156, 0.19196319580078125, 0.19881248474121094, 0.20566177368164062, 0.2125110626220703, 0.2193603515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 4.0, 2.0, 8.0, 3.0, 17.0, 48.0, 2816.0, 1091.0, 51.0, 15.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05950927734375, -0.057587623596191406, -0.05566596984863281, -0.05374431610107422, -0.051822662353515625, -0.04990100860595703, -0.04797935485839844, -0.046057701110839844, -0.04413604736328125, -0.042214393615722656, -0.04029273986816406, -0.03837108612060547, -0.036449432373046875, -0.03452777862548828, -0.03260612487792969, -0.030684471130371094, -0.0287628173828125, -0.026841163635253906, -0.024919509887695312, -0.02299785614013672, -0.021076202392578125, -0.01915454864501953, -0.017232894897460938, -0.015311241149902344, -0.01338958740234375, -0.011467933654785156, -0.009546279907226562, -0.007624626159667969, -0.005702972412109375, -0.0037813186645507812, -0.0018596649169921875, 6.198883056640625e-05, 0.001983642578125, 0.0039052963256835938, 0.0058269500732421875, 0.007748603820800781, 0.009670257568359375, 0.011591911315917969, 0.013513565063476562, 0.015435218811035156, 0.01735687255859375, 0.019278526306152344, 0.021200180053710938, 0.02312183380126953, 0.025043487548828125, 0.02696514129638672, 0.028886795043945312, 0.030808448791503906, 0.0327301025390625, 0.034651756286621094, 0.03657341003417969, 0.03849506378173828, 0.040416717529296875, 0.04233837127685547, 0.04426002502441406, 0.046181678771972656, 0.04810333251953125, 0.050024986267089844, 0.05194664001464844, 0.05386829376220703, 0.055789947509765625, 0.05771160125732422, 0.05963325500488281, 0.061554908752441406, 0.0634765625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 15.0, 46.0, 381.0, 462.0, 70.0, 18.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138719379901886, -0.13294430077075958, -0.12716922163963318, -0.12139414250850677, -0.11561906337738037, -0.10984398424625397, -0.10406890511512756, -0.09829382598400116, -0.09251874685287476, -0.08674366772174835, -0.08096858859062195, -0.07519350945949554, -0.06941843032836914, -0.06364335119724274, -0.05786827206611633, -0.05209319293498993, -0.046318113803863525, -0.04054303467273712, -0.03476795554161072, -0.028992876410484314, -0.02321779727935791, -0.017442718148231506, -0.011667639017105103, -0.005892559885978699, -0.00011748075485229492, 0.005657598376274109, 0.011432677507400513, 0.017207756638526917, 0.02298283576965332, 0.028757914900779724, 0.03453299403190613, 0.04030807316303253, 0.046083152294158936, 0.05185823142528534, 0.05763331055641174, 0.06340838968753815, 0.06918346881866455, 0.07495854794979095, 0.08073362708091736, 0.08650870621204376, 0.09228378534317017, 0.09805886447429657, 0.10383394360542297, 0.10960902273654938, 0.11538410186767578, 0.12115918099880219, 0.1269342601299286, 0.132709339261055, 0.1384844183921814, 0.1442594975233078, 0.1500345766544342, 0.1558096557855606, 0.161584734916687, 0.16735981404781342, 0.17313489317893982, 0.17890997231006622, 0.18468505144119263, 0.19046013057231903, 0.19623520970344543, 0.20201028883457184, 0.20778536796569824, 0.21356044709682465, 0.21933552622795105, 0.22511060535907745, 0.23088568449020386]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 10.0, 12.0, 11.0, 13.0, 24.0, 32.0, 40.0, 52.0, 60.0, 58.0, 66.0, 73.0, 68.0, 71.0, 72.0, 71.0, 43.0, 50.0, 45.0, 29.0, 23.0, 18.0, 18.0, 9.0, 11.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0848386287689209, -0.08125575631856918, -0.07767288386821747, -0.07409001141786575, -0.07050713896751404, -0.06692426651716232, -0.06334139406681061, -0.05975852161645889, -0.05617564916610718, -0.05259277671575546, -0.04900990426540375, -0.04542703181505203, -0.04184415936470032, -0.0382612869143486, -0.03467841446399689, -0.031095542013645172, -0.027512669563293457, -0.023929797112941742, -0.020346924662590027, -0.016764052212238312, -0.013181179761886597, -0.009598307311534882, -0.0060154348611831665, -0.0024325624108314514, 0.0011503100395202637, 0.004733182489871979, 0.008316054940223694, 0.011898927390575409, 0.015481799840927124, 0.01906467229127884, 0.022647544741630554, 0.02623041719198227, 0.029813289642333984, 0.0333961620926857, 0.036979034543037415, 0.04056190699338913, 0.044144779443740845, 0.04772765189409256, 0.051310524344444275, 0.05489339679479599, 0.058476269245147705, 0.06205914169549942, 0.06564201414585114, 0.06922488659620285, 0.07280775904655457, 0.07639063149690628, 0.079973503947258, 0.08355637639760971, 0.08713924884796143, 0.09072212129831314, 0.09430499374866486, 0.09788786619901657, 0.10147073864936829, 0.10505361109972, 0.10863648355007172, 0.11221935600042343, 0.11580222845077515, 0.11938510090112686, 0.12296797335147858, 0.1265508532524109, 0.130133718252182, 0.13371658325195312, 0.13729946315288544, 0.14088234305381775, 0.14446520805358887]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 5.0, 10.0, 13.0, 14.0, 18.0, 20.0, 31.0, 56.0, 71.0, 133.0, 164.0, 262.0, 419.0, 704.0, 1209.0, 2345.0, 4778.0, 10989.0, 34388.0, 201238.0, 687438.0, 70991.0, 18548.0, 7119.0, 3310.0, 1726.0, 956.0, 529.0, 347.0, 242.0, 150.0, 96.0, 63.0, 43.0, 41.0, 30.0, 18.0, 11.0, 7.0, 3.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0721435546875, -0.06975841522216797, -0.06737327575683594, -0.0649881362915039, -0.06260299682617188, -0.060217857360839844, -0.05783271789550781, -0.05544757843017578, -0.05306243896484375, -0.05067729949951172, -0.04829216003417969, -0.045907020568847656, -0.043521881103515625, -0.041136741638183594, -0.03875160217285156, -0.03636646270751953, -0.0339813232421875, -0.03159618377685547, -0.029211044311523438, -0.026825904846191406, -0.024440765380859375, -0.022055625915527344, -0.019670486450195312, -0.01728534698486328, -0.01490020751953125, -0.012515068054199219, -0.010129928588867188, -0.007744789123535156, -0.005359649658203125, -0.0029745101928710938, -0.0005893707275390625, 0.0017957687377929688, 0.004180908203125, 0.006566047668457031, 0.008951187133789062, 0.011336326599121094, 0.013721466064453125, 0.016106605529785156, 0.018491744995117188, 0.02087688446044922, 0.02326202392578125, 0.02564716339111328, 0.028032302856445312, 0.030417442321777344, 0.032802581787109375, 0.035187721252441406, 0.03757286071777344, 0.03995800018310547, 0.0423431396484375, 0.04472827911376953, 0.04711341857910156, 0.049498558044433594, 0.051883697509765625, 0.054268836975097656, 0.05665397644042969, 0.05903911590576172, 0.06142425537109375, 0.06380939483642578, 0.06619453430175781, 0.06857967376708984, 0.07096481323242188, 0.0733499526977539, 0.07573509216308594, 0.07812023162841797, 0.08050537109375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 2.0, 5.0, 4.0, 5.0, 5.0, 17.0, 9.0, 33.0, 38.0, 54.0, 72.0, 81.0, 95.0, 104.0, 96.0, 82.0, 65.0, 63.0, 37.0, 23.0, 24.0, 13.0, 15.0, 13.0, 6.0, 6.0, 7.0, 3.0, 8.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0223236083984375, -0.02157878875732422, -0.020833969116210938, -0.020089149475097656, -0.019344329833984375, -0.018599510192871094, -0.017854690551757812, -0.01710987091064453, -0.01636505126953125, -0.015620231628417969, -0.014875411987304688, -0.014130592346191406, -0.013385772705078125, -0.012640953063964844, -0.011896133422851562, -0.011151313781738281, -0.010406494140625, -0.009661674499511719, -0.008916854858398438, -0.008172035217285156, -0.007427215576171875, -0.006682395935058594, -0.0059375762939453125, -0.005192756652832031, -0.00444793701171875, -0.0037031173706054688, -0.0029582977294921875, -0.0022134780883789062, -0.001468658447265625, -0.0007238388061523438, 2.09808349609375e-05, 0.0007658004760742188, 0.0015106201171875, 0.0022554397583007812, 0.0030002593994140625, 0.0037450790405273438, 0.004489898681640625, 0.005234718322753906, 0.0059795379638671875, 0.006724357604980469, 0.00746917724609375, 0.008213996887207031, 0.008958816528320312, 0.009703636169433594, 0.010448455810546875, 0.011193275451660156, 0.011938095092773438, 0.012682914733886719, 0.013427734375, 0.014172554016113281, 0.014917373657226562, 0.015662193298339844, 0.016407012939453125, 0.017151832580566406, 0.017896652221679688, 0.01864147186279297, 0.01938629150390625, 0.02013111114501953, 0.020875930786132812, 0.021620750427246094, 0.022365570068359375, 0.023110389709472656, 0.023855209350585938, 0.02460002899169922, 0.0253448486328125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 11.0, 12.0, 14.0, 10.0, 20.0, 24.0, 30.0, 42.0, 40.0, 76.0, 81.0, 99.0, 187.0, 288.0, 468.0, 1088.0, 3462.0, 28012.0, 823952.0, 176568.0, 10000.0, 2026.0, 818.0, 396.0, 214.0, 149.0, 111.0, 65.0, 59.0, 44.0, 32.0, 28.0, 27.0, 23.0, 12.0, 16.0, 10.0, 3.0, 9.0, 5.0, 6.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11138916015625, -0.10752010345458984, -0.10365104675292969, -0.09978199005126953, -0.09591293334960938, -0.09204387664794922, -0.08817481994628906, -0.0843057632446289, -0.08043670654296875, -0.0765676498413086, -0.07269859313964844, -0.06882953643798828, -0.06496047973632812, -0.06109142303466797, -0.05722236633300781, -0.053353309631347656, -0.0494842529296875, -0.045615196228027344, -0.04174613952636719, -0.03787708282470703, -0.034008026123046875, -0.03013896942138672, -0.026269912719726562, -0.022400856018066406, -0.01853179931640625, -0.014662742614746094, -0.010793685913085938, -0.006924629211425781, -0.003055572509765625, 0.0008134841918945312, 0.0046825408935546875, 0.008551597595214844, 0.012420654296875, 0.016289710998535156, 0.020158767700195312, 0.02402782440185547, 0.027896881103515625, 0.03176593780517578, 0.03563499450683594, 0.039504051208496094, 0.04337310791015625, 0.047242164611816406, 0.05111122131347656, 0.05498027801513672, 0.058849334716796875, 0.06271839141845703, 0.06658744812011719, 0.07045650482177734, 0.0743255615234375, 0.07819461822509766, 0.08206367492675781, 0.08593273162841797, 0.08980178833007812, 0.09367084503173828, 0.09753990173339844, 0.1014089584350586, 0.10527801513671875, 0.1091470718383789, 0.11301612854003906, 0.11688518524169922, 0.12075424194335938, 0.12462329864501953, 0.1284923553466797, 0.13236141204833984, 0.13623046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 6.0, 7.0, 6.0, 8.0, 11.0, 13.0, 13.0, 15.0, 23.0, 21.0, 22.0, 38.0, 29.0, 24.0, 37.0, 38.0, 33.0, 32.0, 32.0, 49.0, 36.0, 46.0, 37.0, 47.0, 35.0, 39.0, 31.0, 41.0, 30.0, 28.0, 32.0, 19.0, 28.0, 15.0, 15.0, 18.0, 9.0, 12.0, 5.0, 7.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0], "bins": [-0.07342529296875, -0.07135438919067383, -0.06928348541259766, -0.06721258163452148, -0.06514167785644531, -0.06307077407836914, -0.06099987030029297, -0.0589289665222168, -0.056858062744140625, -0.05478715896606445, -0.05271625518798828, -0.05064535140991211, -0.04857444763183594, -0.046503543853759766, -0.044432640075683594, -0.04236173629760742, -0.04029083251953125, -0.03821992874145508, -0.036149024963378906, -0.034078121185302734, -0.03200721740722656, -0.02993631362915039, -0.02786540985107422, -0.025794506072998047, -0.023723602294921875, -0.021652698516845703, -0.01958179473876953, -0.01751089096069336, -0.015439987182617188, -0.013369083404541016, -0.011298179626464844, -0.009227275848388672, -0.0071563720703125, -0.005085468292236328, -0.0030145645141601562, -0.0009436607360839844, 0.0011272430419921875, 0.0031981468200683594, 0.005269050598144531, 0.007339954376220703, 0.009410858154296875, 0.011481761932373047, 0.013552665710449219, 0.01562356948852539, 0.017694473266601562, 0.019765377044677734, 0.021836280822753906, 0.023907184600830078, 0.02597808837890625, 0.028048992156982422, 0.030119895935058594, 0.032190799713134766, 0.03426170349121094, 0.03633260726928711, 0.03840351104736328, 0.04047441482543945, 0.042545318603515625, 0.0446162223815918, 0.04668712615966797, 0.04875802993774414, 0.05082893371582031, 0.052899837493896484, 0.054970741271972656, 0.05704164505004883, 0.059112548828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 6.0, 6.0, 13.0, 22.0, 29.0, 47.0, 66.0, 119.0, 289.0, 756.0, 2338.0, 14479.0, 1013316.0, 13411.0, 2308.0, 716.0, 270.0, 135.0, 57.0, 42.0, 38.0, 16.0, 14.0, 16.0, 5.0, 5.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011444091796875, -0.01106870174407959, -0.01069331169128418, -0.01031792163848877, -0.00994253158569336, -0.00956714153289795, -0.009191751480102539, -0.008816361427307129, -0.008440971374511719, -0.008065581321716309, -0.0076901912689208984, -0.007314801216125488, -0.006939411163330078, -0.006564021110534668, -0.006188631057739258, -0.005813241004943848, -0.0054378509521484375, -0.005062460899353027, -0.004687070846557617, -0.004311680793762207, -0.003936290740966797, -0.0035609006881713867, -0.0031855106353759766, -0.0028101205825805664, -0.0024347305297851562, -0.002059340476989746, -0.001683950424194336, -0.0013085603713989258, -0.0009331703186035156, -0.0005577802658081055, -0.0001823902130126953, 0.00019299983978271484, 0.000568389892578125, 0.0009437799453735352, 0.0013191699981689453, 0.0016945600509643555, 0.0020699501037597656, 0.0024453401565551758, 0.002820730209350586, 0.003196120262145996, 0.0035715103149414062, 0.003946900367736816, 0.0043222904205322266, 0.004697680473327637, 0.005073070526123047, 0.005448460578918457, 0.005823850631713867, 0.006199240684509277, 0.0065746307373046875, 0.006950020790100098, 0.007325410842895508, 0.007700800895690918, 0.008076190948486328, 0.008451581001281738, 0.008826971054077148, 0.009202361106872559, 0.009577751159667969, 0.009953141212463379, 0.010328531265258789, 0.0107039213180542, 0.01107931137084961, 0.01145470142364502, 0.01183009147644043, 0.01220548152923584, 0.01258087158203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 7.0, 5.0, 6.0, 23.0, 125.0, 525.0, 183.0, 44.0, 9.0, 9.0, 11.0, 3.0, 4.0, 2.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002741813659667969, -0.00026551634073257446, -0.00025685131549835205, -0.00024818629026412964, -0.00023952126502990723, -0.00023085623979568481, -0.0002221912145614624, -0.00021352618932724, -0.00020486116409301758, -0.00019619613885879517, -0.00018753111362457275, -0.00017886608839035034, -0.00017020106315612793, -0.00016153603792190552, -0.0001528710126876831, -0.0001442059874534607, -0.00013554096221923828, -0.00012687593698501587, -0.00011821091175079346, -0.00010954588651657104, -0.00010088086128234863, -9.221583604812622e-05, -8.355081081390381e-05, -7.48857855796814e-05, -6.622076034545898e-05, -5.755573511123657e-05, -4.889070987701416e-05, -4.022568464279175e-05, -3.1560659408569336e-05, -2.2895634174346924e-05, -1.4230608940124512e-05, -5.5655837059021e-06, 3.0994415283203125e-06, 1.1764466762542725e-05, 2.0429491996765137e-05, 2.909451723098755e-05, 3.775954246520996e-05, 4.642456769943237e-05, 5.5089592933654785e-05, 6.37546181678772e-05, 7.241964340209961e-05, 8.108466863632202e-05, 8.974969387054443e-05, 9.841471910476685e-05, 0.00010707974433898926, 0.00011574476957321167, 0.00012440979480743408, 0.0001330748200416565, 0.0001417398452758789, 0.00015040487051010132, 0.00015906989574432373, 0.00016773492097854614, 0.00017639994621276855, 0.00018506497144699097, 0.00019372999668121338, 0.0002023950219154358, 0.0002110600471496582, 0.00021972507238388062, 0.00022839009761810303, 0.00023705512285232544, 0.00024572014808654785, 0.00025438517332077026, 0.0002630501985549927, 0.0002717152237892151, 0.0002803802490234375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 9.0, 11.0, 17.0, 34.0, 73.0, 167.0, 622.0, 6612.0, 1032828.0, 7174.0, 679.0, 153.0, 69.0, 31.0, 20.0, 17.0, 13.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.033050537109375, -0.03203392028808594, -0.031017303466796875, -0.030000686645507812, -0.02898406982421875, -0.027967453002929688, -0.026950836181640625, -0.025934219360351562, -0.0249176025390625, -0.023900985717773438, -0.022884368896484375, -0.021867752075195312, -0.02085113525390625, -0.019834518432617188, -0.018817901611328125, -0.017801284790039062, -0.01678466796875, -0.015768051147460938, -0.014751434326171875, -0.013734817504882812, -0.01271820068359375, -0.011701583862304688, -0.010684967041015625, -0.009668350219726562, -0.0086517333984375, -0.0076351165771484375, -0.006618499755859375, -0.0056018829345703125, -0.00458526611328125, -0.0035686492919921875, -0.002552032470703125, -0.0015354156494140625, -0.000518798828125, 0.0004978179931640625, 0.001514434814453125, 0.0025310516357421875, 0.00354766845703125, 0.0045642852783203125, 0.005580902099609375, 0.0065975189208984375, 0.0076141357421875, 0.008630752563476562, 0.009647369384765625, 0.010663986206054688, 0.01168060302734375, 0.012697219848632812, 0.013713836669921875, 0.014730453491210938, 0.0157470703125, 0.016763687133789062, 0.017780303955078125, 0.018796920776367188, 0.01981353759765625, 0.020830154418945312, 0.021846771240234375, 0.022863388061523438, 0.0238800048828125, 0.024896621704101562, 0.025913238525390625, 0.026929855346679688, 0.02794647216796875, 0.028963088989257812, 0.029979705810546875, 0.030996322631835938, 0.032012939453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 11.0, 11.0, 16.0, 28.0, 55.0, 176.0, 408.0, 152.0, 49.0, 33.0, 15.0, 6.0, 9.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0156097412109375, -0.01511383056640625, -0.014617919921875, -0.01412200927734375, -0.0136260986328125, -0.01313018798828125, -0.01263427734375, -0.01213836669921875, -0.0116424560546875, -0.01114654541015625, -0.010650634765625, -0.01015472412109375, -0.0096588134765625, -0.00916290283203125, -0.0086669921875, -0.00817108154296875, -0.0076751708984375, -0.00717926025390625, -0.006683349609375, -0.00618743896484375, -0.0056915283203125, -0.00519561767578125, -0.00469970703125, -0.00420379638671875, -0.0037078857421875, -0.00321197509765625, -0.002716064453125, -0.00222015380859375, -0.0017242431640625, -0.00122833251953125, -0.000732421875, -0.00023651123046875, 0.0002593994140625, 0.00075531005859375, 0.001251220703125, 0.00174713134765625, 0.0022430419921875, 0.00273895263671875, 0.00323486328125, 0.00373077392578125, 0.0042266845703125, 0.00472259521484375, 0.005218505859375, 0.00571441650390625, 0.0062103271484375, 0.00670623779296875, 0.0072021484375, 0.00769805908203125, 0.0081939697265625, 0.00868988037109375, 0.009185791015625, 0.00968170166015625, 0.0101776123046875, 0.01067352294921875, 0.01116943359375, 0.01166534423828125, 0.0121612548828125, 0.01265716552734375, 0.013153076171875, 0.01364898681640625, 0.0141448974609375, 0.01464080810546875, 0.01513671875, 0.01563262939453125, 0.0161285400390625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 12.0, 23.0, 42.0, 165.0, 491.0, 187.0, 56.0, 15.0, 10.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18612724542617798, -0.1666599065065384, -0.1471925675868988, -0.12772522866725922, -0.10825788974761963, -0.08879055082798004, -0.06932321190834045, -0.04985587298870087, -0.03038853406906128, -0.010921195149421692, 0.008546143770217896, 0.028013482689857483, 0.04748082160949707, 0.06694816052913666, 0.08641549944877625, 0.10588283836841583, 0.12535017728805542, 0.144817516207695, 0.1642848551273346, 0.18375219404697418, 0.20321953296661377, 0.22268687188625336, 0.24215421080589294, 0.26162153482437134, 0.2810888886451721, 0.3005562424659729, 0.3200235664844513, 0.3394908905029297, 0.35895824432373047, 0.37842559814453125, 0.39789292216300964, 0.41736024618148804, 0.43682754039764404, 0.4562948942184448, 0.4757622182369232, 0.4952295422554016, 0.5146968960762024, 0.5341642498970032, 0.5536315441131592, 0.57309889793396, 0.5925662517547607, 0.6120336055755615, 0.6315009593963623, 0.6509682536125183, 0.6704356074333191, 0.6899029612541199, 0.7093702554702759, 0.7288376092910767, 0.7483049631118774, 0.7677723169326782, 0.787239670753479, 0.806706964969635, 0.8261743187904358, 0.8456416726112366, 0.8651089668273926, 0.8845763206481934, 0.9040436744689941, 0.9235110282897949, 0.9429783821105957, 0.9624456763267517, 0.9819130301475525, 1.0013803243637085, 1.0208476781845093, 1.04031503200531, 1.0597823858261108]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 8.0, 5.0, 10.0, 9.0, 13.0, 19.0, 12.0, 18.0, 23.0, 28.0, 29.0, 29.0, 38.0, 29.0, 49.0, 52.0, 44.0, 46.0, 42.0, 42.0, 42.0, 37.0, 29.0, 43.0, 44.0, 34.0, 20.0, 30.0, 30.0, 21.0, 22.0, 20.0, 18.0, 9.0, 6.0, 8.0, 8.0, 9.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36525487899780273, -0.3532108962535858, -0.3411669433116913, -0.32912296056747437, -0.31707900762557983, -0.3050350248813629, -0.292991042137146, -0.28094708919525146, -0.26890313625335693, -0.25685915350914, -0.24481520056724548, -0.23277121782302856, -0.22072726488113403, -0.20868328213691711, -0.1966393142938614, -0.18459534645080566, -0.17255136370658875, -0.16050739586353302, -0.1484634280204773, -0.13641944527626038, -0.12437548488378525, -0.11233151704072952, -0.1002875417470932, -0.08824357390403748, -0.07619960606098175, -0.06415563821792603, -0.05211166664958, -0.04006769508123398, -0.028023727238178253, -0.015979759395122528, -0.003935784101486206, 0.008108183741569519, 0.020152151584625244, 0.03219611942768097, 0.04424009099602699, 0.056284062564373016, 0.06832803040742874, 0.08037199825048447, 0.09241597354412079, 0.10445994138717651, 0.11650390923023224, 0.12854787707328796, 0.1405918449163437, 0.15263581275939941, 0.16467979550361633, 0.17672374844551086, 0.18876773118972778, 0.2008116990327835, 0.21285566687583923, 0.22489963471889496, 0.23694360256195068, 0.2489875853061676, 0.26103153824806213, 0.27307552099227905, 0.2851194739341736, 0.2971634566783905, 0.3092074394226074, 0.32125142216682434, 0.33329537510871887, 0.3453393578529358, 0.3573833107948303, 0.36942729353904724, 0.38147127628326416, 0.3935152292251587, 0.4055591821670532]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 6.0, 5.0, 6.0, 5.0, 12.0, 18.0, 35.0, 41.0, 54.0, 76.0, 112.0, 252.0, 3029.0, 4189715.0, 483.0, 126.0, 80.0, 63.0, 39.0, 24.0, 18.0, 16.0, 15.0, 7.0, 7.0, 8.0, 6.0, 4.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.26416015625, -0.2551116943359375, -0.246063232421875, -0.2370147705078125, -0.22796630859375, -0.2189178466796875, -0.209869384765625, -0.2008209228515625, -0.1917724609375, -0.1827239990234375, -0.173675537109375, -0.1646270751953125, -0.15557861328125, -0.1465301513671875, -0.137481689453125, -0.1284332275390625, -0.119384765625, -0.1103363037109375, -0.101287841796875, -0.0922393798828125, -0.08319091796875, -0.0741424560546875, -0.065093994140625, -0.0560455322265625, -0.0469970703125, -0.0379486083984375, -0.028900146484375, -0.0198516845703125, -0.01080322265625, -0.0017547607421875, 0.007293701171875, 0.0163421630859375, 0.025390625, 0.0344390869140625, 0.043487548828125, 0.0525360107421875, 0.06158447265625, 0.0706329345703125, 0.079681396484375, 0.0887298583984375, 0.0977783203125, 0.1068267822265625, 0.115875244140625, 0.1249237060546875, 0.13397216796875, 0.1430206298828125, 0.152069091796875, 0.1611175537109375, 0.170166015625, 0.1792144775390625, 0.188262939453125, 0.1973114013671875, 0.20635986328125, 0.2154083251953125, 0.224456787109375, 0.2335052490234375, 0.2425537109375, 0.2516021728515625, 0.260650634765625, 0.2696990966796875, 0.27874755859375, 0.2877960205078125, 0.296844482421875, 0.3058929443359375, 0.31494140625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 6.0, 5.0, 12.0, 14.0, 33.0, 33.0, 55.0, 65.0, 76.0, 88.0, 91.0, 81.0, 98.0, 52.0, 65.0, 59.0, 30.0, 33.0, 16.0, 12.0, 15.0, 9.0, 6.0, 6.0, 8.0, 4.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02093505859375, -0.020221710205078125, -0.01950836181640625, -0.018795013427734375, -0.0180816650390625, -0.017368316650390625, -0.01665496826171875, -0.015941619873046875, -0.015228271484375, -0.014514923095703125, -0.01380157470703125, -0.013088226318359375, -0.0123748779296875, -0.011661529541015625, -0.01094818115234375, -0.010234832763671875, -0.009521484375, -0.008808135986328125, -0.00809478759765625, -0.007381439208984375, -0.0066680908203125, -0.005954742431640625, -0.00524139404296875, -0.004528045654296875, -0.003814697265625, -0.003101348876953125, -0.00238800048828125, -0.001674652099609375, -0.0009613037109375, -0.000247955322265625, 0.00046539306640625, 0.001178741455078125, 0.00189208984375, 0.002605438232421875, 0.00331878662109375, 0.004032135009765625, 0.0047454833984375, 0.005458831787109375, 0.00617218017578125, 0.006885528564453125, 0.007598876953125, 0.008312225341796875, 0.00902557373046875, 0.009738922119140625, 0.0104522705078125, 0.011165618896484375, 0.01187896728515625, 0.012592315673828125, 0.0133056640625, 0.014019012451171875, 0.01473236083984375, 0.015445709228515625, 0.0161590576171875, 0.016872406005859375, 0.01758575439453125, 0.018299102783203125, 0.019012451171875, 0.019725799560546875, 0.02043914794921875, 0.021152496337890625, 0.0218658447265625, 0.022579193115234375, 0.02329254150390625, 0.024005889892578125, 0.02471923828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 25.0, 50.0, 190.0, 713.0, 3134.0, 4149615.0, 37978.0, 1774.0, 500.0, 190.0, 52.0, 19.0, 13.0, 9.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.08020210266113281, -0.07776260375976562, -0.07532310485839844, -0.07288360595703125, -0.07044410705566406, -0.06800460815429688, -0.06556510925292969, -0.0631256103515625, -0.06068611145019531, -0.058246612548828125, -0.05580711364746094, -0.05336761474609375, -0.05092811584472656, -0.048488616943359375, -0.04604911804199219, -0.043609619140625, -0.04117012023925781, -0.038730621337890625, -0.03629112243652344, -0.03385162353515625, -0.03141212463378906, -0.028972625732421875, -0.026533126831054688, -0.0240936279296875, -0.021654129028320312, -0.019214630126953125, -0.016775131225585938, -0.01433563232421875, -0.011896133422851562, -0.009456634521484375, -0.0070171356201171875, -0.00457763671875, -0.0021381378173828125, 0.000301361083984375, 0.0027408599853515625, 0.00518035888671875, 0.0076198577880859375, 0.010059356689453125, 0.012498855590820312, 0.0149383544921875, 0.017377853393554688, 0.019817352294921875, 0.022256851196289062, 0.02469635009765625, 0.027135848999023438, 0.029575347900390625, 0.03201484680175781, 0.034454345703125, 0.03689384460449219, 0.039333343505859375, 0.04177284240722656, 0.04421234130859375, 0.04665184020996094, 0.049091339111328125, 0.05153083801269531, 0.0539703369140625, 0.05640983581542969, 0.058849334716796875, 0.06128883361816406, 0.06372833251953125, 0.06616783142089844, 0.06860733032226562, 0.07104682922363281, 0.073486328125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 7.0, 15.0, 26.0, 88.0, 3779.0, 93.0, 20.0, 13.0, 13.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01548004150390625, -0.014955401420593262, -0.014430761337280273, -0.013906121253967285, -0.013381481170654297, -0.012856841087341309, -0.01233220100402832, -0.011807560920715332, -0.011282920837402344, -0.010758280754089355, -0.010233640670776367, -0.009709000587463379, -0.00918436050415039, -0.008659720420837402, -0.008135080337524414, -0.007610440254211426, -0.0070858001708984375, -0.006561160087585449, -0.006036520004272461, -0.005511879920959473, -0.004987239837646484, -0.004462599754333496, -0.003937959671020508, -0.0034133195877075195, -0.0028886795043945312, -0.002364039421081543, -0.0018393993377685547, -0.0013147592544555664, -0.0007901191711425781, -0.00026547908782958984, 0.00025916099548339844, 0.0007838010787963867, 0.001308441162109375, 0.0018330812454223633, 0.0023577213287353516, 0.00288236141204834, 0.003407001495361328, 0.003931641578674316, 0.004456281661987305, 0.004980921745300293, 0.005505561828613281, 0.0060302019119262695, 0.006554841995239258, 0.007079482078552246, 0.007604122161865234, 0.008128762245178223, 0.008653402328491211, 0.0091780424118042, 0.009702682495117188, 0.010227322578430176, 0.010751962661743164, 0.011276602745056152, 0.01180124282836914, 0.012325882911682129, 0.012850522994995117, 0.013375163078308105, 0.013899803161621094, 0.014424443244934082, 0.01494908332824707, 0.015473723411560059, 0.015998363494873047, 0.016523003578186035, 0.017047643661499023, 0.01757228374481201, 0.018096923828125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 22.0, 78.0, 650.0, 221.0, 31.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12705132365226746, -0.12464351952075958, -0.12223571538925171, -0.11982790380716324, -0.11742009967565536, -0.11501229554414749, -0.11260449141263962, -0.11019668728113174, -0.10778887569904327, -0.1053810715675354, -0.10297326743602753, -0.10056545585393906, -0.09815765172243118, -0.09574984759092331, -0.09334204345941544, -0.09093423932790756, -0.08852643519639969, -0.08611863106489182, -0.08371082693338394, -0.08130301535129547, -0.0788952112197876, -0.07648740708827972, -0.07407960295677185, -0.07167179882526398, -0.0692639946937561, -0.06685619056224823, -0.06444838643074036, -0.062040578573942184, -0.05963277071714401, -0.05722496658563614, -0.054817162454128265, -0.05240935832262039, -0.05000155046582222, -0.047593746334314346, -0.045185938477516174, -0.0427781343460083, -0.04037033021450043, -0.037962522357702255, -0.03555471822619438, -0.03314691036939621, -0.030739106237888336, -0.028331300243735313, -0.02592349424958229, -0.023515690118074417, -0.021107884123921394, -0.01870007812976837, -0.016292273998260498, -0.013884468004107475, -0.011476662009954453, -0.00906885601580143, -0.006661050952970982, -0.004253245424479246, -0.0018454398959875107, 0.0005623660981655121, 0.0029701711609959602, 0.005377976223826408, 0.007785782217979431, 0.010193588212132454, 0.012601393274962902, 0.01500919833779335, 0.017417004331946373, 0.019824810326099396, 0.02223261445760727, 0.024640420451760292, 0.027048226445913315]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 3.0, 11.0, 6.0, 13.0, 18.0, 31.0, 32.0, 41.0, 47.0, 45.0, 61.0, 57.0, 77.0, 85.0, 72.0, 52.0, 56.0, 61.0, 50.0, 39.0, 48.0, 27.0, 22.0, 17.0, 5.0, 7.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026152849197387695, -0.02509773150086403, -0.024042613804340363, -0.022987496107816696, -0.02193237841129303, -0.020877260714769363, -0.019822143018245697, -0.01876702532172203, -0.017711907625198364, -0.016656789928674698, -0.015601672232151031, -0.014546554535627365, -0.013491436839103699, -0.012436319142580032, -0.011381201446056366, -0.0103260837495327, -0.009270966053009033, -0.008215848356485367, -0.0071607306599617004, -0.006105612963438034, -0.005050495266914368, -0.003995377570390701, -0.002940259873867035, -0.0018851421773433685, -0.0008300244808197021, 0.00022509321570396423, 0.0012802109122276306, 0.002335328608751297, 0.0033904463052749634, 0.00444556400179863, 0.005500681698322296, 0.0065557993948459625, 0.007610917091369629, 0.008666034787893295, 0.009721152484416962, 0.010776270180940628, 0.011831387877464294, 0.01288650557398796, 0.013941623270511627, 0.014996740967035294, 0.01605185866355896, 0.017106976360082626, 0.018162094056606293, 0.01921721175312996, 0.020272329449653625, 0.021327447146177292, 0.022382564842700958, 0.023437682539224625, 0.02449280023574829, 0.025547917932271957, 0.026603035628795624, 0.02765815332531929, 0.028713271021842957, 0.029768388718366623, 0.03082350641489029, 0.031878624111413956, 0.03293374180793762, 0.03398885950446129, 0.035043977200984955, 0.03609909489750862, 0.03715421259403229, 0.038209330290555954, 0.03926444798707962, 0.04031956568360329, 0.04137468338012695]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 12.0, 14.0, 10.0, 19.0, 44.0, 37.0, 90.0, 111.0, 169.0, 255.0, 411.0, 754.0, 1409.0, 2865.0, 6383.0, 16929.0, 63722.0, 614746.0, 274258.0, 43086.0, 12726.0, 5188.0, 2437.0, 1143.0, 672.0, 354.0, 215.0, 160.0, 94.0, 67.0, 46.0, 38.0, 26.0, 12.0, 12.0, 5.0, 3.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06756591796875, -0.06530380249023438, -0.06304168701171875, -0.060779571533203125, -0.0585174560546875, -0.056255340576171875, -0.05399322509765625, -0.051731109619140625, -0.049468994140625, -0.047206878662109375, -0.04494476318359375, -0.042682647705078125, -0.0404205322265625, -0.038158416748046875, -0.03589630126953125, -0.033634185791015625, -0.0313720703125, -0.029109954833984375, -0.02684783935546875, -0.024585723876953125, -0.0223236083984375, -0.020061492919921875, -0.01779937744140625, -0.015537261962890625, -0.013275146484375, -0.011013031005859375, -0.00875091552734375, -0.006488800048828125, -0.0042266845703125, -0.001964569091796875, 0.00029754638671875, 0.002559661865234375, 0.00482177734375, 0.007083892822265625, 0.00934600830078125, 0.011608123779296875, 0.0138702392578125, 0.016132354736328125, 0.01839447021484375, 0.020656585693359375, 0.022918701171875, 0.025180816650390625, 0.02744293212890625, 0.029705047607421875, 0.0319671630859375, 0.034229278564453125, 0.03649139404296875, 0.038753509521484375, 0.041015625, 0.043277740478515625, 0.04553985595703125, 0.047801971435546875, 0.0500640869140625, 0.052326202392578125, 0.05458831787109375, 0.056850433349609375, 0.059112548828125, 0.061374664306640625, 0.06363677978515625, 0.06589889526367188, 0.0681610107421875, 0.07042312622070312, 0.07268524169921875, 0.07494735717773438, 0.07720947265625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 7.0, 3.0, 6.0, 4.0, 14.0, 15.0, 32.0, 37.0, 53.0, 62.0, 80.0, 85.0, 96.0, 85.0, 90.0, 52.0, 65.0, 56.0, 41.0, 20.0, 16.0, 14.0, 14.0, 10.0, 9.0, 3.0, 8.0, 5.0, 7.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020904541015625, -0.020190715789794922, -0.019476890563964844, -0.018763065338134766, -0.018049240112304688, -0.01733541488647461, -0.01662158966064453, -0.015907764434814453, -0.015193939208984375, -0.014480113983154297, -0.013766288757324219, -0.01305246353149414, -0.012338638305664062, -0.011624813079833984, -0.010910987854003906, -0.010197162628173828, -0.00948333740234375, -0.008769512176513672, -0.008055686950683594, -0.007341861724853516, -0.0066280364990234375, -0.005914211273193359, -0.005200386047363281, -0.004486560821533203, -0.003772735595703125, -0.003058910369873047, -0.0023450851440429688, -0.0016312599182128906, -0.0009174346923828125, -0.00020360946655273438, 0.0005102157592773438, 0.0012240409851074219, 0.0019378662109375, 0.002651691436767578, 0.0033655166625976562, 0.004079341888427734, 0.0047931671142578125, 0.005506992340087891, 0.006220817565917969, 0.006934642791748047, 0.007648468017578125, 0.008362293243408203, 0.009076118469238281, 0.00978994369506836, 0.010503768920898438, 0.011217594146728516, 0.011931419372558594, 0.012645244598388672, 0.01335906982421875, 0.014072895050048828, 0.014786720275878906, 0.015500545501708984, 0.016214370727539062, 0.01692819595336914, 0.01764202117919922, 0.018355846405029297, 0.019069671630859375, 0.019783496856689453, 0.02049732208251953, 0.02121114730834961, 0.021924972534179688, 0.022638797760009766, 0.023352622985839844, 0.024066448211669922, 0.0247802734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 6.0, 1.0, 8.0, 6.0, 8.0, 4.0, 5.0, 11.0, 18.0, 17.0, 19.0, 28.0, 29.0, 46.0, 60.0, 74.0, 81.0, 127.0, 247.0, 349.0, 777.0, 1951.0, 11103.0, 443339.0, 573835.0, 12432.0, 2005.0, 819.0, 379.0, 216.0, 143.0, 101.0, 71.0, 51.0, 41.0, 32.0, 23.0, 25.0, 25.0, 12.0, 12.0, 8.0, 2.0, 5.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1370849609375, -0.1329326629638672, -0.12878036499023438, -0.12462806701660156, -0.12047576904296875, -0.11632347106933594, -0.11217117309570312, -0.10801887512207031, -0.1038665771484375, -0.09971427917480469, -0.09556198120117188, -0.09140968322753906, -0.08725738525390625, -0.08310508728027344, -0.07895278930664062, -0.07480049133300781, -0.070648193359375, -0.06649589538574219, -0.062343597412109375, -0.05819129943847656, -0.05403900146484375, -0.04988670349121094, -0.045734405517578125, -0.04158210754394531, -0.0374298095703125, -0.03327751159667969, -0.029125213623046875, -0.024972915649414062, -0.02082061767578125, -0.016668319702148438, -0.012516021728515625, -0.008363723754882812, -0.00421142578125, -5.91278076171875e-05, 0.004093170166015625, 0.008245468139648438, 0.01239776611328125, 0.016550064086914062, 0.020702362060546875, 0.024854660034179688, 0.0290069580078125, 0.03315925598144531, 0.037311553955078125, 0.04146385192871094, 0.04561614990234375, 0.04976844787597656, 0.053920745849609375, 0.05807304382324219, 0.062225341796875, 0.06637763977050781, 0.07052993774414062, 0.07468223571777344, 0.07883453369140625, 0.08298683166503906, 0.08713912963867188, 0.09129142761230469, 0.0954437255859375, 0.09959602355957031, 0.10374832153320312, 0.10790061950683594, 0.11205291748046875, 0.11620521545410156, 0.12035751342773438, 0.12450981140136719, 0.128662109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 9.0, 9.0, 16.0, 9.0, 16.0, 14.0, 19.0, 22.0, 32.0, 38.0, 24.0, 33.0, 32.0, 39.0, 44.0, 43.0, 39.0, 41.0, 50.0, 45.0, 44.0, 32.0, 34.0, 39.0, 43.0, 34.0, 30.0, 23.0, 18.0, 25.0, 16.0, 17.0, 13.0, 11.0, 11.0, 8.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0631103515625, -0.06107807159423828, -0.05904579162597656, -0.057013511657714844, -0.054981231689453125, -0.052948951721191406, -0.05091667175292969, -0.04888439178466797, -0.04685211181640625, -0.04481983184814453, -0.04278755187988281, -0.040755271911621094, -0.038722991943359375, -0.036690711975097656, -0.03465843200683594, -0.03262615203857422, -0.0305938720703125, -0.02856159210205078, -0.026529312133789062, -0.024497032165527344, -0.022464752197265625, -0.020432472229003906, -0.018400192260742188, -0.01636791229248047, -0.01433563232421875, -0.012303352355957031, -0.010271072387695312, -0.008238792419433594, -0.006206512451171875, -0.004174232482910156, -0.0021419525146484375, -0.00010967254638671875, 0.001922607421875, 0.003954887390136719, 0.0059871673583984375, 0.008019447326660156, 0.010051727294921875, 0.012084007263183594, 0.014116287231445312, 0.01614856719970703, 0.01818084716796875, 0.02021312713623047, 0.022245407104492188, 0.024277687072753906, 0.026309967041015625, 0.028342247009277344, 0.030374526977539062, 0.03240680694580078, 0.0344390869140625, 0.03647136688232422, 0.03850364685058594, 0.040535926818847656, 0.042568206787109375, 0.044600486755371094, 0.04663276672363281, 0.04866504669189453, 0.05069732666015625, 0.05272960662841797, 0.05476188659667969, 0.056794166564941406, 0.058826446533203125, 0.060858726501464844, 0.06289100646972656, 0.06492328643798828, 0.06695556640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 5.0, 8.0, 12.0, 24.0, 31.0, 44.0, 62.0, 114.0, 220.0, 403.0, 785.0, 1890.0, 4632.0, 19574.0, 999092.0, 14420.0, 4017.0, 1601.0, 731.0, 355.0, 204.0, 104.0, 59.0, 37.0, 26.0, 19.0, 20.0, 14.0, 13.0, 3.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01654052734375, -0.016045808792114258, -0.015551090240478516, -0.015056371688842773, -0.014561653137207031, -0.014066934585571289, -0.013572216033935547, -0.013077497482299805, -0.012582778930664062, -0.01208806037902832, -0.011593341827392578, -0.011098623275756836, -0.010603904724121094, -0.010109186172485352, -0.00961446762084961, -0.009119749069213867, -0.008625030517578125, -0.008130311965942383, -0.007635593414306641, -0.0071408748626708984, -0.006646156311035156, -0.006151437759399414, -0.005656719207763672, -0.00516200065612793, -0.0046672821044921875, -0.004172563552856445, -0.003677845001220703, -0.003183126449584961, -0.0026884078979492188, -0.0021936893463134766, -0.0016989707946777344, -0.0012042522430419922, -0.00070953369140625, -0.0002148151397705078, 0.0002799034118652344, 0.0007746219635009766, 0.0012693405151367188, 0.001764059066772461, 0.002258777618408203, 0.0027534961700439453, 0.0032482147216796875, 0.0037429332733154297, 0.004237651824951172, 0.004732370376586914, 0.005227088928222656, 0.0057218074798583984, 0.006216526031494141, 0.006711244583129883, 0.007205963134765625, 0.007700681686401367, 0.00819540023803711, 0.008690118789672852, 0.009184837341308594, 0.009679555892944336, 0.010174274444580078, 0.01066899299621582, 0.011163711547851562, 0.011658430099487305, 0.012153148651123047, 0.012647867202758789, 0.013142585754394531, 0.013637304306030273, 0.014132022857666016, 0.014626741409301758, 0.0151214599609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 4.0, 17.0, 50.0, 178.0, 526.0, 145.0, 33.0, 12.0, 4.0, 5.0, 0.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003387928009033203, -0.00032726675271987915, -0.000315740704536438, -0.0003042146563529968, -0.00029268860816955566, -0.0002811625599861145, -0.00026963651180267334, -0.0002581104636192322, -0.000246584415435791, -0.00023505836725234985, -0.0002235323190689087, -0.00021200627088546753, -0.00020048022270202637, -0.0001889541745185852, -0.00017742812633514404, -0.00016590207815170288, -0.00015437602996826172, -0.00014284998178482056, -0.0001313239336013794, -0.00011979788541793823, -0.00010827183723449707, -9.674578905105591e-05, -8.521974086761475e-05, -7.369369268417358e-05, -6.216764450073242e-05, -5.064159631729126e-05, -3.91155481338501e-05, -2.7589499950408936e-05, -1.6063451766967773e-05, -4.537403583526611e-06, 6.988644599914551e-06, 1.8514692783355713e-05, 3.0040740966796875e-05, 4.156678915023804e-05, 5.30928373336792e-05, 6.461888551712036e-05, 7.614493370056152e-05, 8.767098188400269e-05, 9.919703006744385e-05, 0.00011072307825088501, 0.00012224912643432617, 0.00013377517461776733, 0.0001453012228012085, 0.00015682727098464966, 0.00016835331916809082, 0.00017987936735153198, 0.00019140541553497314, 0.0002029314637184143, 0.00021445751190185547, 0.00022598356008529663, 0.0002375096082687378, 0.00024903565645217896, 0.0002605617046356201, 0.0002720877528190613, 0.00028361380100250244, 0.0002951398491859436, 0.00030666589736938477, 0.00031819194555282593, 0.0003297179937362671, 0.00034124404191970825, 0.0003527700901031494, 0.0003642961382865906, 0.00037582218647003174, 0.0003873482346534729, 0.00039887428283691406]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 10.0, 13.0, 14.0, 45.0, 52.0, 136.0, 452.0, 4718.0, 1032084.0, 10018.0, 640.0, 185.0, 67.0, 41.0, 16.0, 16.0, 7.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.047271728515625, -0.04586505889892578, -0.04445838928222656, -0.043051719665527344, -0.041645050048828125, -0.040238380432128906, -0.03883171081542969, -0.03742504119873047, -0.03601837158203125, -0.03461170196533203, -0.03320503234863281, -0.031798362731933594, -0.030391693115234375, -0.028985023498535156, -0.027578353881835938, -0.02617168426513672, -0.0247650146484375, -0.02335834503173828, -0.021951675415039062, -0.020545005798339844, -0.019138336181640625, -0.017731666564941406, -0.016324996948242188, -0.014918327331542969, -0.01351165771484375, -0.012104988098144531, -0.010698318481445312, -0.009291648864746094, -0.007884979248046875, -0.006478309631347656, -0.0050716400146484375, -0.0036649703979492188, -0.00225830078125, -0.0008516311645507812, 0.0005550384521484375, 0.0019617080688476562, 0.003368377685546875, 0.004775047302246094, 0.0061817169189453125, 0.007588386535644531, 0.00899505615234375, 0.010401725769042969, 0.011808395385742188, 0.013215065002441406, 0.014621734619140625, 0.016028404235839844, 0.017435073852539062, 0.01884174346923828, 0.0202484130859375, 0.02165508270263672, 0.023061752319335938, 0.024468421936035156, 0.025875091552734375, 0.027281761169433594, 0.028688430786132812, 0.03009510040283203, 0.03150177001953125, 0.03290843963623047, 0.03431510925292969, 0.035721778869628906, 0.037128448486328125, 0.038535118103027344, 0.03994178771972656, 0.04134845733642578, 0.042755126953125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 9.0, 10.0, 11.0, 16.0, 29.0, 65.0, 192.0, 352.0, 145.0, 58.0, 21.0, 16.0, 17.0, 8.0, 9.0, 6.0, 5.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016326904296875, -0.015790224075317383, -0.015253543853759766, -0.014716863632202148, -0.014180183410644531, -0.013643503189086914, -0.013106822967529297, -0.01257014274597168, -0.012033462524414062, -0.011496782302856445, -0.010960102081298828, -0.010423421859741211, -0.009886741638183594, -0.009350061416625977, -0.00881338119506836, -0.008276700973510742, -0.007740020751953125, -0.007203340530395508, -0.006666660308837891, -0.0061299800872802734, -0.005593299865722656, -0.005056619644165039, -0.004519939422607422, -0.003983259201049805, -0.0034465789794921875, -0.0029098987579345703, -0.002373218536376953, -0.001836538314819336, -0.0012998580932617188, -0.0007631778717041016, -0.00022649765014648438, 0.0003101825714111328, 0.00084686279296875, 0.0013835430145263672, 0.0019202232360839844, 0.0024569034576416016, 0.0029935836791992188, 0.003530263900756836, 0.004066944122314453, 0.00460362434387207, 0.0051403045654296875, 0.005676984786987305, 0.006213665008544922, 0.006750345230102539, 0.007287025451660156, 0.007823705673217773, 0.00836038589477539, 0.008897066116333008, 0.009433746337890625, 0.009970426559448242, 0.01050710678100586, 0.011043787002563477, 0.011580467224121094, 0.012117147445678711, 0.012653827667236328, 0.013190507888793945, 0.013727188110351562, 0.01426386833190918, 0.014800548553466797, 0.015337228775024414, 0.01587390899658203, 0.01641058921813965, 0.016947269439697266, 0.017483949661254883, 0.0180206298828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 6.0, 77.0, 795.0, 121.0, 13.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18552322685718536, -0.13408255577087402, -0.08264187723398209, -0.03120119869709015, 0.02023947238922119, 0.07168014347553253, 0.12312082946300507, 0.1745614856481552, 0.22600217163562775, 0.2774428427219391, 0.3288835287094116, 0.38032418489456177, 0.4317648708820343, 0.48320555686950684, 0.534646213054657, 0.5860868692398071, 0.637527585029602, 0.6889682412147522, 0.7404089570045471, 0.7918496131896973, 0.8432902693748474, 0.8947309255599976, 0.9461716413497925, 0.9976122975349426, 1.0490529537200928, 1.1004936695098877, 1.151934266090393, 1.203374981880188, 1.254815697669983, 1.3062562942504883, 1.3576970100402832, 1.4091377258300781, 1.4605783224105835, 1.5120190382003784, 1.5634596347808838, 1.6149003505706787, 1.6663410663604736, 1.717781662940979, 1.769222378730774, 1.8206629753112793, 1.8721036911010742, 1.9235444068908691, 1.9749850034713745, 2.026425838470459, 2.077866315841675, 2.1293070316314697, 2.1807477474212646, 2.2321884632110596, 2.2836291790008545, 2.3350698947906494, 2.3865106105804443, 2.43795108795166, 2.489391803741455, 2.54083251953125, 2.592273235321045, 2.64371395111084, 2.6951544284820557, 2.7465951442718506, 2.7980358600616455, 2.8494763374328613, 2.9009170532226562, 2.952357769012451, 3.003798484802246, 3.055239200592041, 3.106679916381836]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 6.0, 7.0, 8.0, 11.0, 11.0, 14.0, 15.0, 26.0, 20.0, 28.0, 35.0, 46.0, 50.0, 44.0, 53.0, 62.0, 61.0, 54.0, 55.0, 51.0, 58.0, 45.0, 43.0, 40.0, 32.0, 21.0, 25.0, 16.0, 13.0, 19.0, 13.0, 7.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4125663638114929, -0.3979475796222687, -0.38332876563072205, -0.3687099814414978, -0.35409119725227356, -0.3394724130630493, -0.3248535990715027, -0.31023481488227844, -0.2956160306930542, -0.28099724650382996, -0.2663784325122833, -0.2517596483230591, -0.23714086413383484, -0.2225220650434494, -0.20790326595306396, -0.19328448176383972, -0.17866568267345428, -0.16404688358306885, -0.1494280993938446, -0.13480930030345917, -0.12019051611423492, -0.10557171702384949, -0.09095292538404465, -0.07633413374423981, -0.06171534210443497, -0.04709655046463013, -0.03247775882482529, -0.01785896345973015, -0.0032401718199253082, 0.01137862354516983, 0.02599741518497467, 0.04061620682477951, 0.05523499846458435, 0.06985379010438919, 0.08447258174419403, 0.09909138083457947, 0.11371016502380371, 0.12832896411418915, 0.14294776320457458, 0.15756654739379883, 0.17218533158302307, 0.1868041306734085, 0.20142291486263275, 0.2160417139530182, 0.23066049814224243, 0.24527929723262787, 0.2598980963230133, 0.27451688051223755, 0.2891356945037842, 0.3037544786930084, 0.31837329268455505, 0.3329920768737793, 0.34761086106300354, 0.3622296452522278, 0.3768484592437744, 0.39146724343299866, 0.4060860276222229, 0.42070481181144714, 0.4353236258029938, 0.449942409992218, 0.46456119418144226, 0.4791799783706665, 0.49379879236221313, 0.5084176063537598, 0.5230363607406616]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 1.0, 6.0, 4.0, 6.0, 11.0, 19.0, 18.0, 32.0, 43.0, 60.0, 84.0, 130.0, 181.0, 333.0, 669.0, 19541.0, 4171276.0, 843.0, 348.0, 225.0, 122.0, 93.0, 65.0, 45.0, 27.0, 28.0, 14.0, 8.0, 19.0, 7.0, 6.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.15952110290527344, -0.15363693237304688, -0.1477527618408203, -0.14186859130859375, -0.1359844207763672, -0.13010025024414062, -0.12421607971191406, -0.1183319091796875, -0.11244773864746094, -0.10656356811523438, -0.10067939758300781, -0.09479522705078125, -0.08891105651855469, -0.08302688598632812, -0.07714271545410156, -0.071258544921875, -0.06537437438964844, -0.059490203857421875, -0.05360603332519531, -0.04772186279296875, -0.04183769226074219, -0.035953521728515625, -0.030069351196289062, -0.0241851806640625, -0.018301010131835938, -0.012416839599609375, -0.0065326690673828125, -0.00064849853515625, 0.0052356719970703125, 0.011119842529296875, 0.017004013061523438, 0.02288818359375, 0.028772354125976562, 0.034656524658203125, 0.04054069519042969, 0.04642486572265625, 0.05230903625488281, 0.058193206787109375, 0.06407737731933594, 0.0699615478515625, 0.07584571838378906, 0.08172988891601562, 0.08761405944824219, 0.09349822998046875, 0.09938240051269531, 0.10526657104492188, 0.11115074157714844, 0.117034912109375, 0.12291908264160156, 0.12880325317382812, 0.1346874237060547, 0.14057159423828125, 0.1464557647705078, 0.15233993530273438, 0.15822410583496094, 0.1641082763671875, 0.16999244689941406, 0.17587661743164062, 0.1817607879638672, 0.18764495849609375, 0.1935291290283203, 0.19941329956054688, 0.20529747009277344, 0.211181640625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 11.0, 16.0, 20.0, 34.0, 35.0, 56.0, 63.0, 79.0, 76.0, 87.0, 93.0, 54.0, 69.0, 64.0, 52.0, 36.0, 27.0, 26.0, 12.0, 14.0, 14.0, 6.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019805908203125, -0.01912665367126465, -0.018447399139404297, -0.017768144607543945, -0.017088890075683594, -0.016409635543823242, -0.01573038101196289, -0.015051126480102539, -0.014371871948242188, -0.013692617416381836, -0.013013362884521484, -0.012334108352661133, -0.011654853820800781, -0.01097559928894043, -0.010296344757080078, -0.009617090225219727, -0.008937835693359375, -0.008258581161499023, -0.007579326629638672, -0.00690007209777832, -0.006220817565917969, -0.005541563034057617, -0.004862308502197266, -0.004183053970336914, -0.0035037994384765625, -0.002824544906616211, -0.0021452903747558594, -0.0014660358428955078, -0.0007867813110351562, -0.00010752677917480469, 0.0005717277526855469, 0.0012509822845458984, 0.00193023681640625, 0.0026094913482666016, 0.003288745880126953, 0.003968000411987305, 0.004647254943847656, 0.005326509475708008, 0.006005764007568359, 0.006685018539428711, 0.0073642730712890625, 0.008043527603149414, 0.008722782135009766, 0.009402036666870117, 0.010081291198730469, 0.01076054573059082, 0.011439800262451172, 0.012119054794311523, 0.012798309326171875, 0.013477563858032227, 0.014156818389892578, 0.01483607292175293, 0.015515327453613281, 0.016194581985473633, 0.016873836517333984, 0.017553091049194336, 0.018232345581054688, 0.01891160011291504, 0.01959085464477539, 0.020270109176635742, 0.020949363708496094, 0.021628618240356445, 0.022307872772216797, 0.02298712730407715, 0.0236663818359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 14.0, 30.0, 103.0, 214.0, 488.0, 1732.0, 4174460.0, 15837.0, 1005.0, 262.0, 83.0, 29.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08349609375, -0.07983207702636719, -0.07616806030273438, -0.07250404357910156, -0.06884002685546875, -0.06517601013183594, -0.061511993408203125, -0.05784797668457031, -0.0541839599609375, -0.05051994323730469, -0.046855926513671875, -0.04319190979003906, -0.03952789306640625, -0.03586387634277344, -0.032199859619140625, -0.028535842895507812, -0.024871826171875, -0.021207809448242188, -0.017543792724609375, -0.013879776000976562, -0.01021575927734375, -0.0065517425537109375, -0.002887725830078125, 0.0007762908935546875, 0.0044403076171875, 0.008104324340820312, 0.011768341064453125, 0.015432357788085938, 0.01909637451171875, 0.022760391235351562, 0.026424407958984375, 0.030088424682617188, 0.03375244140625, 0.03741645812988281, 0.041080474853515625, 0.04474449157714844, 0.04840850830078125, 0.05207252502441406, 0.055736541748046875, 0.05940055847167969, 0.0630645751953125, 0.06672859191894531, 0.07039260864257812, 0.07405662536621094, 0.07772064208984375, 0.08138465881347656, 0.08504867553710938, 0.08871269226074219, 0.092376708984375, 0.09604072570800781, 0.09970474243164062, 0.10336875915527344, 0.10703277587890625, 0.11069679260253906, 0.11436080932617188, 0.11802482604980469, 0.1216888427734375, 0.1253528594970703, 0.12901687622070312, 0.13268089294433594, 0.13634490966796875, 0.14000892639160156, 0.14367294311523438, 0.1473369598388672, 0.1510009765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 16.0, 41.0, 167.0, 3720.0, 83.0, 22.0, 11.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03985595703125, -0.038936614990234375, -0.03801727294921875, -0.037097930908203125, -0.0361785888671875, -0.035259246826171875, -0.03433990478515625, -0.033420562744140625, -0.032501220703125, -0.031581878662109375, -0.03066253662109375, -0.029743194580078125, -0.0288238525390625, -0.027904510498046875, -0.02698516845703125, -0.026065826416015625, -0.025146484375, -0.024227142333984375, -0.02330780029296875, -0.022388458251953125, -0.0214691162109375, -0.020549774169921875, -0.01963043212890625, -0.018711090087890625, -0.017791748046875, -0.016872406005859375, -0.01595306396484375, -0.015033721923828125, -0.0141143798828125, -0.013195037841796875, -0.01227569580078125, -0.011356353759765625, -0.01043701171875, -0.009517669677734375, -0.00859832763671875, -0.007678985595703125, -0.0067596435546875, -0.005840301513671875, -0.00492095947265625, -0.004001617431640625, -0.003082275390625, -0.002162933349609375, -0.00124359130859375, -0.000324249267578125, 0.0005950927734375, 0.001514434814453125, 0.00243377685546875, 0.003353118896484375, 0.0042724609375, 0.005191802978515625, 0.00611114501953125, 0.007030487060546875, 0.0079498291015625, 0.008869171142578125, 0.00978851318359375, 0.010707855224609375, 0.011627197265625, 0.012546539306640625, 0.01346588134765625, 0.014385223388671875, 0.0153045654296875, 0.016223907470703125, 0.01714324951171875, 0.018062591552734375, 0.01898193359375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 783.0, 236.0, 3.0], "bins": [-1.6484768390655518, -1.6218676567077637, -1.5952584743499756, -1.5686492919921875, -1.5420401096343994, -1.5154309272766113, -1.4888217449188232, -1.4622125625610352, -1.4356034994125366, -1.4089943170547485, -1.3823851346969604, -1.3557759523391724, -1.3291667699813843, -1.3025575876235962, -1.2759485244750977, -1.2493393421173096, -1.222730040550232, -1.1961208581924438, -1.1695116758346558, -1.1429024934768677, -1.1162933111190796, -1.0896841287612915, -1.063075065612793, -1.0364658832550049, -1.0098567008972168, -0.9832475185394287, -0.9566383361816406, -0.9300291538238525, -0.9034200310707092, -0.8768108487129211, -0.8502016663551331, -0.823592483997345, -0.7969832420349121, -0.770374059677124, -0.7437648773193359, -0.7171556949615479, -0.6905465722084045, -0.6639373898506165, -0.6373282074928284, -0.6107190251350403, -0.5841098427772522, -0.5575006604194641, -0.530891478061676, -0.5042823553085327, -0.47767314314842224, -0.45106399059295654, -0.42445480823516846, -0.39784562587738037, -0.3712364733219147, -0.3446272909641266, -0.3180181384086609, -0.2914089560508728, -0.2647997736930847, -0.23819060623645782, -0.21158143877983093, -0.18497225642204285, -0.15836310386657715, -0.13175393640995026, -0.10514475405216217, -0.07853558659553528, -0.05192641168832779, -0.0253172367811203, 0.0012919306755065918, 0.027901113033294678, 0.05451028794050217]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 8.0, 13.0, 16.0, 23.0, 46.0, 56.0, 58.0, 72.0, 73.0, 75.0, 78.0, 65.0, 83.0, 88.0, 56.0, 44.0, 38.0, 36.0, 18.0, 15.0, 15.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048928022384643555, -0.0472177192568779, -0.045507416129112244, -0.04379710927605629, -0.042086806148290634, -0.04037650302052498, -0.038666196167469025, -0.03695589303970337, -0.035245589911937714, -0.03353528678417206, -0.0318249836564064, -0.03011467680335045, -0.028404373675584793, -0.026694070547819138, -0.024983765557408333, -0.023273460566997528, -0.021563157439231873, -0.019852854311466217, -0.018142549321055412, -0.016432244330644608, -0.014721941202878952, -0.013011637143790722, -0.011301333084702492, -0.009591029025614262, -0.007880724966526031, -0.006170420907437801, -0.004460116848349571, -0.002749812789261341, -0.001039508730173111, 0.0006707953289151192, 0.0023810993880033493, 0.0040914034470915794, 0.00580170750617981, 0.00751201156526804, 0.00922231562435627, 0.0109326196834445, 0.01264292374253273, 0.01435322780162096, 0.01606353186070919, 0.017773836851119995, 0.01948413997888565, 0.021194443106651306, 0.02290474809706211, 0.024615053087472916, 0.02632535621523857, 0.028035659343004227, 0.02974596433341503, 0.031456269323825836, 0.03316657245159149, 0.03487687557935715, 0.0365871787071228, 0.03829748556017876, 0.04000778868794441, 0.04171809181571007, 0.04342839866876602, 0.04513870179653168, 0.04684900492429733, 0.04855930805206299, 0.050269611179828644, 0.0519799180328846, 0.05369022116065025, 0.05540052428841591, 0.05711083114147186, 0.05882113426923752, 0.060531437397003174]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 9.0, 13.0, 17.0, 21.0, 31.0, 60.0, 74.0, 121.0, 201.0, 307.0, 538.0, 1046.0, 2063.0, 4525.0, 12246.0, 44698.0, 471023.0, 446801.0, 43751.0, 11993.0, 4448.0, 2103.0, 1012.0, 564.0, 338.0, 188.0, 124.0, 70.0, 54.0, 26.0, 29.0, 15.0, 11.0, 8.0, 8.0, 2.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06402587890625, -0.06219625473022461, -0.06036663055419922, -0.05853700637817383, -0.05670738220214844, -0.05487775802612305, -0.053048133850097656, -0.051218509674072266, -0.049388885498046875, -0.047559261322021484, -0.045729637145996094, -0.0439000129699707, -0.04207038879394531, -0.04024076461791992, -0.03841114044189453, -0.03658151626586914, -0.03475189208984375, -0.03292226791381836, -0.03109264373779297, -0.029263019561767578, -0.027433395385742188, -0.025603771209716797, -0.023774147033691406, -0.021944522857666016, -0.020114898681640625, -0.018285274505615234, -0.016455650329589844, -0.014626026153564453, -0.012796401977539062, -0.010966777801513672, -0.009137153625488281, -0.007307529449462891, -0.0054779052734375, -0.0036482810974121094, -0.0018186569213867188, 1.0967254638671875e-05, 0.0018405914306640625, 0.003670215606689453, 0.005499839782714844, 0.007329463958740234, 0.009159088134765625, 0.010988712310791016, 0.012818336486816406, 0.014647960662841797, 0.016477584838867188, 0.018307209014892578, 0.02013683319091797, 0.02196645736694336, 0.02379608154296875, 0.02562570571899414, 0.02745532989501953, 0.029284954071044922, 0.031114578247070312, 0.0329442024230957, 0.034773826599121094, 0.036603450775146484, 0.038433074951171875, 0.040262699127197266, 0.042092323303222656, 0.04392194747924805, 0.04575157165527344, 0.04758119583129883, 0.04941082000732422, 0.05124044418334961, 0.053070068359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 5.0, 4.0, 8.0, 10.0, 18.0, 21.0, 30.0, 39.0, 51.0, 62.0, 87.0, 64.0, 92.0, 93.0, 59.0, 64.0, 65.0, 53.0, 37.0, 23.0, 27.0, 12.0, 11.0, 16.0, 7.0, 7.0, 8.0, 3.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196990966796875, -0.019023895263671875, -0.01834869384765625, -0.017673492431640625, -0.016998291015625, -0.016323089599609375, -0.01564788818359375, -0.014972686767578125, -0.0142974853515625, -0.013622283935546875, -0.01294708251953125, -0.012271881103515625, -0.0115966796875, -0.010921478271484375, -0.01024627685546875, -0.009571075439453125, -0.0088958740234375, -0.008220672607421875, -0.00754547119140625, -0.006870269775390625, -0.006195068359375, -0.005519866943359375, -0.00484466552734375, -0.004169464111328125, -0.0034942626953125, -0.002819061279296875, -0.00214385986328125, -0.001468658447265625, -0.00079345703125, -0.000118255615234375, 0.00055694580078125, 0.001232147216796875, 0.0019073486328125, 0.002582550048828125, 0.00325775146484375, 0.003932952880859375, 0.004608154296875, 0.005283355712890625, 0.00595855712890625, 0.006633758544921875, 0.0073089599609375, 0.007984161376953125, 0.00865936279296875, 0.009334564208984375, 0.010009765625, 0.010684967041015625, 0.01136016845703125, 0.012035369873046875, 0.0127105712890625, 0.013385772705078125, 0.01406097412109375, 0.014736175537109375, 0.015411376953125, 0.016086578369140625, 0.01676177978515625, 0.017436981201171875, 0.0181121826171875, 0.018787384033203125, 0.01946258544921875, 0.020137786865234375, 0.02081298828125, 0.021488189697265625, 0.02216339111328125, 0.022838592529296875, 0.0235137939453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 5.0, 9.0, 16.0, 16.0, 16.0, 29.0, 39.0, 48.0, 67.0, 69.0, 110.0, 138.0, 217.0, 344.0, 716.0, 2289.0, 23290.0, 946470.0, 68751.0, 3734.0, 870.0, 382.0, 280.0, 163.0, 129.0, 86.0, 56.0, 43.0, 34.0, 37.0, 20.0, 18.0, 10.0, 14.0, 9.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12234115600585938, -0.11870574951171875, -0.11507034301757812, -0.1114349365234375, -0.10779953002929688, -0.10416412353515625, -0.10052871704101562, -0.096893310546875, -0.09325790405273438, -0.08962249755859375, -0.08598709106445312, -0.0823516845703125, -0.07871627807617188, -0.07508087158203125, -0.07144546508789062, -0.06781005859375, -0.06417465209960938, -0.06053924560546875, -0.056903839111328125, -0.0532684326171875, -0.049633026123046875, -0.04599761962890625, -0.042362213134765625, -0.038726806640625, -0.035091400146484375, -0.03145599365234375, -0.027820587158203125, -0.0241851806640625, -0.020549774169921875, -0.01691436767578125, -0.013278961181640625, -0.0096435546875, -0.006008148193359375, -0.00237274169921875, 0.001262664794921875, 0.0048980712890625, 0.008533477783203125, 0.01216888427734375, 0.015804290771484375, 0.019439697265625, 0.023075103759765625, 0.02671051025390625, 0.030345916748046875, 0.0339813232421875, 0.037616729736328125, 0.04125213623046875, 0.044887542724609375, 0.04852294921875, 0.052158355712890625, 0.05579376220703125, 0.059429168701171875, 0.0630645751953125, 0.06669998168945312, 0.07033538818359375, 0.07397079467773438, 0.077606201171875, 0.08124160766601562, 0.08487701416015625, 0.08851242065429688, 0.0921478271484375, 0.09578323364257812, 0.09941864013671875, 0.10305404663085938, 0.106689453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 8.0, 13.0, 16.0, 14.0, 16.0, 13.0, 24.0, 23.0, 29.0, 35.0, 34.0, 31.0, 37.0, 45.0, 44.0, 55.0, 45.0, 46.0, 47.0, 42.0, 46.0, 32.0, 32.0, 43.0, 32.0, 36.0, 24.0, 17.0, 24.0, 12.0, 16.0, 8.0, 8.0, 12.0, 9.0, 6.0, 1.0, 4.0, 0.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07293701171875, -0.07087850570678711, -0.06881999969482422, -0.06676149368286133, -0.06470298767089844, -0.06264448165893555, -0.060585975646972656, -0.058527469635009766, -0.056468963623046875, -0.054410457611083984, -0.052351951599121094, -0.0502934455871582, -0.04823493957519531, -0.04617643356323242, -0.04411792755126953, -0.04205942153930664, -0.04000091552734375, -0.03794240951538086, -0.03588390350341797, -0.03382539749145508, -0.03176689147949219, -0.029708385467529297, -0.027649879455566406, -0.025591373443603516, -0.023532867431640625, -0.021474361419677734, -0.019415855407714844, -0.017357349395751953, -0.015298843383789062, -0.013240337371826172, -0.011181831359863281, -0.00912332534790039, -0.0070648193359375, -0.005006313323974609, -0.0029478073120117188, -0.0008893013000488281, 0.0011692047119140625, 0.003227710723876953, 0.005286216735839844, 0.007344722747802734, 0.009403228759765625, 0.011461734771728516, 0.013520240783691406, 0.015578746795654297, 0.017637252807617188, 0.019695758819580078, 0.02175426483154297, 0.02381277084350586, 0.02587127685546875, 0.02792978286743164, 0.02998828887939453, 0.03204679489135742, 0.03410530090332031, 0.0361638069152832, 0.038222312927246094, 0.040280818939208984, 0.042339324951171875, 0.044397830963134766, 0.046456336975097656, 0.04851484298706055, 0.05057334899902344, 0.05263185501098633, 0.05469036102294922, 0.05674886703491211, 0.058807373046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 10.0, 25.0, 28.0, 37.0, 57.0, 108.0, 282.0, 667.0, 2249.0, 9801.0, 902036.0, 123234.0, 7194.0, 1670.0, 580.0, 227.0, 101.0, 58.0, 50.0, 25.0, 22.0, 17.0, 12.0, 8.0, 1.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.015655517578125, -0.015149116516113281, -0.014642715454101562, -0.014136314392089844, -0.013629913330078125, -0.013123512268066406, -0.012617111206054688, -0.012110710144042969, -0.01160430908203125, -0.011097908020019531, -0.010591506958007812, -0.010085105895996094, -0.009578704833984375, -0.009072303771972656, -0.008565902709960938, -0.008059501647949219, -0.0075531005859375, -0.007046699523925781, -0.0065402984619140625, -0.006033897399902344, -0.005527496337890625, -0.005021095275878906, -0.0045146942138671875, -0.004008293151855469, -0.00350189208984375, -0.0029954910278320312, -0.0024890899658203125, -0.0019826889038085938, -0.001476287841796875, -0.0009698867797851562, -0.0004634857177734375, 4.291534423828125e-05, 0.00054931640625, 0.0010557174682617188, 0.0015621185302734375, 0.0020685195922851562, 0.002574920654296875, 0.0030813217163085938, 0.0035877227783203125, 0.004094123840332031, 0.00460052490234375, 0.005106925964355469, 0.0056133270263671875, 0.006119728088378906, 0.006626129150390625, 0.007132530212402344, 0.0076389312744140625, 0.008145332336425781, 0.0086517333984375, 0.009158134460449219, 0.009664535522460938, 0.010170936584472656, 0.010677337646484375, 0.011183738708496094, 0.011690139770507812, 0.012196540832519531, 0.01270294189453125, 0.013209342956542969, 0.013715744018554688, 0.014222145080566406, 0.014728546142578125, 0.015234947204589844, 0.015741348266601562, 0.01624774932861328, 0.016754150390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 9.0, 28.0, 56.0, 82.0, 227.0, 361.0, 113.0, 59.0, 19.0, 13.0, 7.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008444786071777344, -0.0008133724331855774, -0.0007822662591934204, -0.0007511600852012634, -0.0007200539112091064, -0.0006889477372169495, -0.0006578415632247925, -0.0006267353892326355, -0.0005956292152404785, -0.0005645230412483215, -0.0005334168672561646, -0.0005023106932640076, -0.0004712045192718506, -0.0004400983452796936, -0.0004089921712875366, -0.00037788599729537964, -0.00034677982330322266, -0.0003156736493110657, -0.0002845674753189087, -0.0002534613013267517, -0.00022235512733459473, -0.00019124895334243774, -0.00016014277935028076, -0.00012903660535812378, -9.79304313659668e-05, -6.682425737380981e-05, -3.571808338165283e-05, -4.61190938949585e-06, 2.6494264602661133e-05, 5.7600438594818115e-05, 8.87066125869751e-05, 0.00011981278657913208, 0.00015091896057128906, 0.00018202513456344604, 0.00021313130855560303, 0.00024423748254776, 0.000275343656539917, 0.000306449830532074, 0.00033755600452423096, 0.00036866217851638794, 0.0003997683525085449, 0.0004308745265007019, 0.0004619807004928589, 0.0004930868744850159, 0.0005241930484771729, 0.0005552992224693298, 0.0005864053964614868, 0.0006175115704536438, 0.0006486177444458008, 0.0006797239184379578, 0.0007108300924301147, 0.0007419362664222717, 0.0007730424404144287, 0.0008041486144065857, 0.0008352547883987427, 0.0008663609623908997, 0.0008974671363830566, 0.0009285733103752136, 0.0009596794843673706, 0.0009907856583595276, 0.0010218918323516846, 0.0010529980063438416, 0.0010841041803359985, 0.0011152103543281555, 0.0011463165283203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 13.0, 28.0, 80.0, 337.0, 4478.0, 1034398.0, 8474.0, 497.0, 121.0, 35.0, 17.0, 7.0, 9.0, 10.0, 4.0, 7.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.051727294921875, -0.050452470779418945, -0.04917764663696289, -0.047902822494506836, -0.04662799835205078, -0.04535317420959473, -0.04407835006713867, -0.04280352592468262, -0.04152870178222656, -0.04025387763977051, -0.03897905349731445, -0.0377042293548584, -0.036429405212402344, -0.03515458106994629, -0.033879756927490234, -0.03260493278503418, -0.031330108642578125, -0.03005528450012207, -0.028780460357666016, -0.02750563621520996, -0.026230812072753906, -0.02495598793029785, -0.023681163787841797, -0.022406339645385742, -0.021131515502929688, -0.019856691360473633, -0.018581867218017578, -0.017307043075561523, -0.01603221893310547, -0.014757394790649414, -0.01348257064819336, -0.012207746505737305, -0.01093292236328125, -0.009658098220825195, -0.00838327407836914, -0.007108449935913086, -0.005833625793457031, -0.0045588016510009766, -0.003283977508544922, -0.002009153366088867, -0.0007343292236328125, 0.0005404949188232422, 0.0018153190612792969, 0.0030901432037353516, 0.004364967346191406, 0.005639791488647461, 0.006914615631103516, 0.00818943977355957, 0.009464263916015625, 0.01073908805847168, 0.012013912200927734, 0.013288736343383789, 0.014563560485839844, 0.0158383846282959, 0.017113208770751953, 0.018388032913208008, 0.019662857055664062, 0.020937681198120117, 0.022212505340576172, 0.023487329483032227, 0.02476215362548828, 0.026036977767944336, 0.02731180191040039, 0.028586626052856445, 0.0298614501953125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 8.0, 3.0, 5.0, 8.0, 9.0, 3.0, 16.0, 20.0, 29.0, 36.0, 115.0, 419.0, 173.0, 58.0, 28.0, 18.0, 14.0, 5.0, 6.0, 7.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011627197265625, -0.01113438606262207, -0.01064157485961914, -0.010148763656616211, -0.009655952453613281, -0.009163141250610352, -0.008670330047607422, -0.008177518844604492, -0.0076847076416015625, -0.007191896438598633, -0.006699085235595703, -0.0062062740325927734, -0.005713462829589844, -0.005220651626586914, -0.004727840423583984, -0.004235029220581055, -0.003742218017578125, -0.0032494068145751953, -0.0027565956115722656, -0.002263784408569336, -0.0017709732055664062, -0.0012781620025634766, -0.0007853507995605469, -0.0002925395965576172, 0.0002002716064453125, 0.0006930828094482422, 0.0011858940124511719, 0.0016787052154541016, 0.0021715164184570312, 0.002664327621459961, 0.0031571388244628906, 0.0036499500274658203, 0.00414276123046875, 0.00463557243347168, 0.005128383636474609, 0.005621194839477539, 0.006114006042480469, 0.0066068172454833984, 0.007099628448486328, 0.007592439651489258, 0.008085250854492188, 0.008578062057495117, 0.009070873260498047, 0.009563684463500977, 0.010056495666503906, 0.010549306869506836, 0.011042118072509766, 0.011534929275512695, 0.012027740478515625, 0.012520551681518555, 0.013013362884521484, 0.013506174087524414, 0.013998985290527344, 0.014491796493530273, 0.014984607696533203, 0.015477418899536133, 0.015970230102539062, 0.016463041305541992, 0.016955852508544922, 0.01744866371154785, 0.01794147491455078, 0.01843428611755371, 0.01892709732055664, 0.01941990852355957, 0.0199127197265625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 18.0, 141.0, 721.0, 109.0, 12.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2854030132293701, -0.2550022006034851, -0.2246014028787613, -0.19420060515403748, -0.16379979252815247, -0.13339897990226746, -0.10299818217754364, -0.07259738445281982, -0.042196571826934814, -0.011795766651630402, 0.01860503852367401, 0.049005843698978424, 0.07940664887428284, 0.10980746150016785, 0.14020825922489166, 0.17060905694961548, 0.2010098695755005, 0.2314106822013855, 0.2618114948272705, 0.29221227765083313, 0.32261309027671814, 0.35301390290260315, 0.38341468572616577, 0.4138154983520508, 0.4442163109779358, 0.4746171236038208, 0.5050179362297058, 0.5354187488555908, 0.565819501876831, 0.5962203741073608, 0.6266211271286011, 0.6570219397544861, 0.6874227523803711, 0.7178235650062561, 0.7482243776321411, 0.7786251902580261, 0.8090260028839111, 0.8394267559051514, 0.8698275685310364, 0.9002283811569214, 0.9306291937828064, 0.9610300064086914, 0.9914308190345764, 1.0218316316604614, 1.0522323846817017, 1.0826332569122314, 1.1130340099334717, 1.143434762954712, 1.1738356351852417, 1.204236388206482, 1.2346372604370117, 1.265038013458252, 1.2954388856887817, 1.325839638710022, 1.3562405109405518, 1.386641263961792, 1.4170420169830322, 1.4474427700042725, 1.4778436422348022, 1.5082443952560425, 1.5386452674865723, 1.5690460205078125, 1.5994468927383423, 1.6298476457595825, 1.6602485179901123]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 5.0, 8.0, 7.0, 12.0, 14.0, 19.0, 13.0, 21.0, 28.0, 28.0, 20.0, 20.0, 32.0, 29.0, 30.0, 36.0, 37.0, 45.0, 45.0, 55.0, 43.0, 48.0, 40.0, 46.0, 28.0, 38.0, 31.0, 27.0, 31.0, 27.0, 18.0, 19.0, 15.0, 19.0, 9.0, 14.0, 11.0, 6.0, 11.0, 3.0, 0.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2896274924278259, -0.28044748306274414, -0.27126750349998474, -0.26208749413490295, -0.25290748476982117, -0.24372749030590057, -0.23454749584197998, -0.2253674864768982, -0.2161874771118164, -0.2070074826478958, -0.19782747328281403, -0.18864747881889343, -0.17946746945381165, -0.17028747498989105, -0.16110748052597046, -0.15192747116088867, -0.14274747669696808, -0.13356748223304749, -0.1243874728679657, -0.1152074784040451, -0.10602746903896332, -0.09684747457504272, -0.08766747266054153, -0.07848747074604034, -0.06930746883153915, -0.060127466917037964, -0.050947465002536774, -0.04176746681332588, -0.03258746489882469, -0.0234074629843235, -0.01422746479511261, -0.00504746288061142, 0.0041325390338897705, 0.013312540017068386, 0.022492541000247, 0.03167254105210304, 0.04085254296660423, 0.05003254488110542, 0.059212543070316315, 0.0683925449848175, 0.0775725468993187, 0.08675254881381989, 0.09593255072832108, 0.10511255264282227, 0.11429254710674286, 0.12347255647182465, 0.13265255093574524, 0.14183256030082703, 0.15101255476474762, 0.1601925492286682, 0.16937255859375, 0.1785525530576706, 0.18773256242275238, 0.19691255688667297, 0.20609256625175476, 0.21527256071567535, 0.22445255517959595, 0.23363254964351654, 0.24281255900859833, 0.2519925534725189, 0.2611725628376007, 0.2703525722026825, 0.2795325517654419, 0.2887125611305237, 0.29789257049560547]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 8.0, 4.0, 8.0, 9.0, 18.0, 12.0, 28.0, 44.0, 45.0, 69.0, 69.0, 300.0, 6157.0, 4184446.0, 2529.0, 208.0, 82.0, 58.0, 49.0, 29.0, 20.0, 17.0, 9.0, 14.0, 14.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0521240234375, -0.05040931701660156, -0.048694610595703125, -0.04697990417480469, -0.04526519775390625, -0.04355049133300781, -0.041835784912109375, -0.04012107849121094, -0.0384063720703125, -0.03669166564941406, -0.034976959228515625, -0.03326225280761719, -0.03154754638671875, -0.029832839965820312, -0.028118133544921875, -0.026403427124023438, -0.024688720703125, -0.022974014282226562, -0.021259307861328125, -0.019544601440429688, -0.01782989501953125, -0.016115188598632812, -0.014400482177734375, -0.012685775756835938, -0.0109710693359375, -0.009256362915039062, -0.007541656494140625, -0.0058269500732421875, -0.00411224365234375, -0.0023975372314453125, -0.000682830810546875, 0.0010318756103515625, 0.00274658203125, 0.0044612884521484375, 0.006175994873046875, 0.007890701293945312, 0.00960540771484375, 0.011320114135742188, 0.013034820556640625, 0.014749526977539062, 0.0164642333984375, 0.018178939819335938, 0.019893646240234375, 0.021608352661132812, 0.02332305908203125, 0.025037765502929688, 0.026752471923828125, 0.028467178344726562, 0.030181884765625, 0.03189659118652344, 0.033611297607421875, 0.03532600402832031, 0.03704071044921875, 0.03875541687011719, 0.040470123291015625, 0.04218482971191406, 0.0438995361328125, 0.04561424255371094, 0.047328948974609375, 0.04904365539550781, 0.05075836181640625, 0.05247306823730469, 0.054187774658203125, 0.05590248107910156, 0.0576171875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 7.0, 4.0, 7.0, 13.0, 15.0, 13.0, 30.0, 40.0, 49.0, 64.0, 59.0, 72.0, 103.0, 96.0, 67.0, 58.0, 59.0, 57.0, 44.0, 26.0, 23.0, 21.0, 10.0, 10.0, 13.0, 11.0, 6.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020294189453125, -0.019627094268798828, -0.018959999084472656, -0.018292903900146484, -0.017625808715820312, -0.01695871353149414, -0.01629161834716797, -0.015624523162841797, -0.014957427978515625, -0.014290332794189453, -0.013623237609863281, -0.01295614242553711, -0.012289047241210938, -0.011621952056884766, -0.010954856872558594, -0.010287761688232422, -0.00962066650390625, -0.008953571319580078, -0.008286476135253906, -0.007619380950927734, -0.0069522857666015625, -0.006285190582275391, -0.005618095397949219, -0.004951000213623047, -0.004283905029296875, -0.003616809844970703, -0.0029497146606445312, -0.0022826194763183594, -0.0016155242919921875, -0.0009484291076660156, -0.00028133392333984375, 0.0003857612609863281, 0.0010528564453125, 0.0017199516296386719, 0.0023870468139648438, 0.0030541419982910156, 0.0037212371826171875, 0.004388332366943359, 0.005055427551269531, 0.005722522735595703, 0.006389617919921875, 0.007056713104248047, 0.007723808288574219, 0.00839090347290039, 0.009057998657226562, 0.009725093841552734, 0.010392189025878906, 0.011059284210205078, 0.01172637939453125, 0.012393474578857422, 0.013060569763183594, 0.013727664947509766, 0.014394760131835938, 0.01506185531616211, 0.01572895050048828, 0.016396045684814453, 0.017063140869140625, 0.017730236053466797, 0.01839733123779297, 0.01906442642211914, 0.019731521606445312, 0.020398616790771484, 0.021065711975097656, 0.021732807159423828, 0.02239990234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 4.0, 12.0, 28.0, 103.0, 336.0, 1141.0, 6974.0, 4176963.0, 7167.0, 1089.0, 298.0, 96.0, 32.0, 16.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0654296875, -0.0634164810180664, -0.06140327453613281, -0.05939006805419922, -0.057376861572265625, -0.05536365509033203, -0.05335044860839844, -0.051337242126464844, -0.04932403564453125, -0.047310829162597656, -0.04529762268066406, -0.04328441619873047, -0.041271209716796875, -0.03925800323486328, -0.03724479675292969, -0.035231590270996094, -0.0332183837890625, -0.031205177307128906, -0.029191970825195312, -0.02717876434326172, -0.025165557861328125, -0.02315235137939453, -0.021139144897460938, -0.019125938415527344, -0.01711273193359375, -0.015099525451660156, -0.013086318969726562, -0.011073112487792969, -0.009059906005859375, -0.007046699523925781, -0.0050334930419921875, -0.0030202865600585938, -0.001007080078125, 0.0010061264038085938, 0.0030193328857421875, 0.005032539367675781, 0.007045745849609375, 0.009058952331542969, 0.011072158813476562, 0.013085365295410156, 0.01509857177734375, 0.017111778259277344, 0.019124984741210938, 0.02113819122314453, 0.023151397705078125, 0.02516460418701172, 0.027177810668945312, 0.029191017150878906, 0.0312042236328125, 0.033217430114746094, 0.03523063659667969, 0.03724384307861328, 0.039257049560546875, 0.04127025604248047, 0.04328346252441406, 0.045296669006347656, 0.04730987548828125, 0.049323081970214844, 0.05133628845214844, 0.05334949493408203, 0.055362701416015625, 0.05737590789794922, 0.05938911437988281, 0.061402320861816406, 0.06341552734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 10.0, 24.0, 328.0, 3633.0, 36.0, 16.0, 7.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0162353515625, -0.015729427337646484, -0.015223503112792969, -0.014717578887939453, -0.014211654663085938, -0.013705730438232422, -0.013199806213378906, -0.01269388198852539, -0.012187957763671875, -0.01168203353881836, -0.011176109313964844, -0.010670185089111328, -0.010164260864257812, -0.009658336639404297, -0.009152412414550781, -0.008646488189697266, -0.00814056396484375, -0.007634639739990234, -0.007128715515136719, -0.006622791290283203, -0.0061168670654296875, -0.005610942840576172, -0.005105018615722656, -0.004599094390869141, -0.004093170166015625, -0.0035872459411621094, -0.0030813217163085938, -0.002575397491455078, -0.0020694732666015625, -0.0015635490417480469, -0.0010576248168945312, -0.0005517005920410156, -4.57763671875e-05, 0.0004601478576660156, 0.0009660720825195312, 0.0014719963073730469, 0.0019779205322265625, 0.002483844757080078, 0.0029897689819335938, 0.0034956932067871094, 0.004001617431640625, 0.004507541656494141, 0.005013465881347656, 0.005519390106201172, 0.0060253143310546875, 0.006531238555908203, 0.007037162780761719, 0.007543087005615234, 0.00804901123046875, 0.008554935455322266, 0.009060859680175781, 0.009566783905029297, 0.010072708129882812, 0.010578632354736328, 0.011084556579589844, 0.01159048080444336, 0.012096405029296875, 0.01260232925415039, 0.013108253479003906, 0.013614177703857422, 0.014120101928710938, 0.014626026153564453, 0.015131950378417969, 0.015637874603271484, 0.016143798828125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 19.0, 62.0, 369.0, 447.0, 88.0, 12.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09399300068616867, -0.09218736737966537, -0.09038172662258148, -0.08857609331607819, -0.08677046000957489, -0.084964819252491, -0.0831591859459877, -0.0813535526394844, -0.07954791188240051, -0.07774227857589722, -0.07593663781881332, -0.07413100451231003, -0.07232537120580673, -0.07051973044872284, -0.06871409714221954, -0.06690846383571625, -0.06510283052921295, -0.06329719722270966, -0.06149156019091606, -0.05968592315912247, -0.05788028612732887, -0.05607464909553528, -0.05426901578903198, -0.05246337875723839, -0.050657741725444794, -0.0488521046936512, -0.0470464713871479, -0.04524083435535431, -0.043435197323560715, -0.04162956029176712, -0.039823926985263824, -0.03801828995347023, -0.036212652921676636, -0.03440701588988304, -0.032601382583379745, -0.03079574555158615, -0.028990108519792557, -0.02718447335064411, -0.025378838181495667, -0.023573201149702072, -0.021767565980553627, -0.019961930811405182, -0.018156293779611588, -0.016350658610463142, -0.014545022509992123, -0.012739386409521103, -0.010933751240372658, -0.009128115139901638, -0.007322479039430618, -0.0055168429389595985, -0.003711207304149866, -0.0019055716693401337, -9.993556886911392e-05, 0.0017057005316019058, 0.003511335700750351, 0.005316971801221371, 0.0071226079016923904, 0.00892824400216341, 0.01073388010263443, 0.012539515271782875, 0.014345151372253895, 0.016150787472724915, 0.01795642264187336, 0.019762057811021805, 0.0215676948428154]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 1.0, 4.0, 9.0, 11.0, 14.0, 18.0, 7.0, 15.0, 31.0, 28.0, 33.0, 39.0, 43.0, 38.0, 44.0, 53.0, 66.0, 47.0, 50.0, 56.0, 49.0, 58.0, 50.0, 36.0, 41.0, 22.0, 28.0, 31.0, 23.0, 17.0, 11.0, 5.0, 6.0, 5.0, 7.0, 0.0, 5.0, 5.0, 1.0, 1.0, 3.0], "bins": [-0.02752143144607544, -0.026845330372452736, -0.026169229298830032, -0.02549312822520733, -0.024817027151584625, -0.02414092607796192, -0.023464825004339218, -0.022788723930716515, -0.02211262285709381, -0.021436521783471107, -0.020760420709848404, -0.0200843196362257, -0.019408218562602997, -0.018732117488980293, -0.01805601641535759, -0.017379915341734886, -0.016703814268112183, -0.01602771319448948, -0.015351612120866776, -0.014675511047244072, -0.013999409973621368, -0.013323308899998665, -0.012647207826375961, -0.011971106752753258, -0.011295005679130554, -0.01061890460550785, -0.009942803531885147, -0.009266702458262444, -0.00859060138463974, -0.007914500311017036, -0.007238399237394333, -0.006562298163771629, -0.005886197090148926, -0.005210096016526222, -0.004533994942903519, -0.003857893869280815, -0.0031817927956581116, -0.002505691722035408, -0.0018295906484127045, -0.001153489574790001, -0.00047738850116729736, 0.0001987125724554062, 0.0008748136460781097, 0.0015509147197008133, 0.002227015793323517, 0.0029031168669462204, 0.003579217940568924, 0.0042553190141916275, 0.004931420087814331, 0.005607521161437035, 0.006283622235059738, 0.006959723308682442, 0.007635824382305145, 0.008311925455927849, 0.008988026529550552, 0.009664127603173256, 0.01034022867679596, 0.011016329750418663, 0.011692430824041367, 0.01236853189766407, 0.013044632971286774, 0.013720734044909477, 0.01439683511853218, 0.015072936192154884, 0.015749037265777588]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 8.0, 15.0, 11.0, 16.0, 23.0, 37.0, 49.0, 78.0, 106.0, 145.0, 198.0, 324.0, 418.0, 692.0, 1049.0, 1664.0, 2749.0, 4711.0, 9253.0, 19131.0, 46417.0, 154268.0, 582688.0, 141296.0, 43934.0, 18321.0, 8767.0, 4762.0, 2638.0, 1663.0, 1051.0, 639.0, 415.0, 304.0, 217.0, 141.0, 90.0, 77.0, 49.0, 36.0, 33.0, 18.0, 9.0, 9.0, 11.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0241851806640625, -0.0233914852142334, -0.022597789764404297, -0.021804094314575195, -0.021010398864746094, -0.020216703414916992, -0.01942300796508789, -0.01862931251525879, -0.017835617065429688, -0.017041921615600586, -0.016248226165771484, -0.015454530715942383, -0.014660835266113281, -0.01386713981628418, -0.013073444366455078, -0.012279748916625977, -0.011486053466796875, -0.010692358016967773, -0.009898662567138672, -0.00910496711730957, -0.008311271667480469, -0.007517576217651367, -0.006723880767822266, -0.005930185317993164, -0.0051364898681640625, -0.004342794418334961, -0.0035490989685058594, -0.002755403518676758, -0.0019617080688476562, -0.0011680126190185547, -0.0003743171691894531, 0.00041937828063964844, 0.00121307373046875, 0.0020067691802978516, 0.002800464630126953, 0.0035941600799560547, 0.004387855529785156, 0.005181550979614258, 0.005975246429443359, 0.006768941879272461, 0.0075626373291015625, 0.008356332778930664, 0.009150028228759766, 0.009943723678588867, 0.010737419128417969, 0.01153111457824707, 0.012324810028076172, 0.013118505477905273, 0.013912200927734375, 0.014705896377563477, 0.015499591827392578, 0.01629328727722168, 0.01708698272705078, 0.017880678176879883, 0.018674373626708984, 0.019468069076538086, 0.020261764526367188, 0.02105545997619629, 0.02184915542602539, 0.022642850875854492, 0.023436546325683594, 0.024230241775512695, 0.025023937225341797, 0.0258176326751709, 0.026611328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 7.0, 8.0, 20.0, 13.0, 23.0, 46.0, 48.0, 62.0, 65.0, 70.0, 101.0, 98.0, 66.0, 62.0, 56.0, 54.0, 49.0, 25.0, 23.0, 20.0, 10.0, 13.0, 11.0, 9.0, 8.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020294189453125, -0.01962733268737793, -0.01896047592163086, -0.01829361915588379, -0.01762676239013672, -0.01695990562438965, -0.016293048858642578, -0.015626192092895508, -0.014959335327148438, -0.014292478561401367, -0.013625621795654297, -0.012958765029907227, -0.012291908264160156, -0.011625051498413086, -0.010958194732666016, -0.010291337966918945, -0.009624481201171875, -0.008957624435424805, -0.008290767669677734, -0.007623910903930664, -0.006957054138183594, -0.0062901973724365234, -0.005623340606689453, -0.004956483840942383, -0.0042896270751953125, -0.003622770309448242, -0.002955913543701172, -0.0022890567779541016, -0.0016222000122070312, -0.0009553432464599609, -0.0002884864807128906, 0.0003783702850341797, 0.00104522705078125, 0.0017120838165283203, 0.0023789405822753906, 0.003045797348022461, 0.0037126541137695312, 0.0043795108795166016, 0.005046367645263672, 0.005713224411010742, 0.0063800811767578125, 0.007046937942504883, 0.007713794708251953, 0.008380651473999023, 0.009047508239746094, 0.009714365005493164, 0.010381221771240234, 0.011048078536987305, 0.011714935302734375, 0.012381792068481445, 0.013048648834228516, 0.013715505599975586, 0.014382362365722656, 0.015049219131469727, 0.015716075897216797, 0.016382932662963867, 0.017049789428710938, 0.017716646194458008, 0.018383502960205078, 0.01905035972595215, 0.01971721649169922, 0.02038407325744629, 0.02105093002319336, 0.02171778678894043, 0.0223846435546875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 9.0, 1.0, 5.0, 3.0, 10.0, 13.0, 14.0, 12.0, 11.0, 18.0, 32.0, 37.0, 47.0, 51.0, 50.0, 80.0, 105.0, 157.0, 291.0, 646.0, 3578.0, 74931.0, 936540.0, 28504.0, 2132.0, 453.0, 225.0, 141.0, 82.0, 93.0, 64.0, 54.0, 27.0, 27.0, 24.0, 22.0, 10.0, 13.0, 7.0, 6.0, 5.0, 6.0, 5.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.10369873046875, -0.10076618194580078, -0.09783363342285156, -0.09490108489990234, -0.09196853637695312, -0.0890359878540039, -0.08610343933105469, -0.08317089080810547, -0.08023834228515625, -0.07730579376220703, -0.07437324523925781, -0.0714406967163086, -0.06850814819335938, -0.06557559967041016, -0.06264305114746094, -0.05971050262451172, -0.0567779541015625, -0.05384540557861328, -0.05091285705566406, -0.047980308532714844, -0.045047760009765625, -0.042115211486816406, -0.03918266296386719, -0.03625011444091797, -0.03331756591796875, -0.03038501739501953, -0.027452468872070312, -0.024519920349121094, -0.021587371826171875, -0.018654823303222656, -0.015722274780273438, -0.012789726257324219, -0.009857177734375, -0.006924629211425781, -0.0039920806884765625, -0.0010595321655273438, 0.001873016357421875, 0.004805564880371094, 0.0077381134033203125, 0.010670661926269531, 0.01360321044921875, 0.01653575897216797, 0.019468307495117188, 0.022400856018066406, 0.025333404541015625, 0.028265953063964844, 0.031198501586914062, 0.03413105010986328, 0.0370635986328125, 0.03999614715576172, 0.04292869567871094, 0.045861244201660156, 0.048793792724609375, 0.051726341247558594, 0.05465888977050781, 0.05759143829345703, 0.06052398681640625, 0.06345653533935547, 0.06638908386230469, 0.0693216323852539, 0.07225418090820312, 0.07518672943115234, 0.07811927795410156, 0.08105182647705078, 0.083984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 4.0, 5.0, 4.0, 4.0, 6.0, 8.0, 8.0, 8.0, 7.0, 15.0, 26.0, 16.0, 24.0, 26.0, 19.0, 26.0, 24.0, 33.0, 30.0, 28.0, 49.0, 49.0, 40.0, 46.0, 55.0, 49.0, 42.0, 25.0, 28.0, 28.0, 31.0, 33.0, 22.0, 28.0, 22.0, 15.0, 16.0, 17.0, 15.0, 15.0, 16.0, 4.0, 4.0, 4.0, 5.0, 6.0, 4.0, 10.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05029296875, -0.048638343811035156, -0.04698371887207031, -0.04532909393310547, -0.043674468994140625, -0.04201984405517578, -0.04036521911621094, -0.038710594177246094, -0.03705596923828125, -0.035401344299316406, -0.03374671936035156, -0.03209209442138672, -0.030437469482421875, -0.02878284454345703, -0.027128219604492188, -0.025473594665527344, -0.0238189697265625, -0.022164344787597656, -0.020509719848632812, -0.01885509490966797, -0.017200469970703125, -0.015545845031738281, -0.013891220092773438, -0.012236595153808594, -0.01058197021484375, -0.008927345275878906, -0.0072727203369140625, -0.005618095397949219, -0.003963470458984375, -0.0023088455200195312, -0.0006542205810546875, 0.0010004043579101562, 0.002655029296875, 0.004309654235839844, 0.0059642791748046875, 0.007618904113769531, 0.009273529052734375, 0.010928153991699219, 0.012582778930664062, 0.014237403869628906, 0.01589202880859375, 0.017546653747558594, 0.019201278686523438, 0.02085590362548828, 0.022510528564453125, 0.02416515350341797, 0.025819778442382812, 0.027474403381347656, 0.0291290283203125, 0.030783653259277344, 0.03243827819824219, 0.03409290313720703, 0.035747528076171875, 0.03740215301513672, 0.03905677795410156, 0.040711402893066406, 0.04236602783203125, 0.044020652770996094, 0.04567527770996094, 0.04732990264892578, 0.048984527587890625, 0.05063915252685547, 0.05229377746582031, 0.053948402404785156, 0.05560302734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 14.0, 10.0, 16.0, 25.0, 55.0, 77.0, 217.0, 990.0, 893407.0, 152589.0, 732.0, 183.0, 90.0, 50.0, 24.0, 17.0, 13.0, 6.0, 12.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01480865478515625, -0.01431429386138916, -0.01381993293762207, -0.01332557201385498, -0.01283121109008789, -0.0123368501663208, -0.011842489242553711, -0.011348128318786621, -0.010853767395019531, -0.010359406471252441, -0.009865045547485352, -0.009370684623718262, -0.008876323699951172, -0.008381962776184082, -0.007887601852416992, -0.007393240928649902, -0.0068988800048828125, -0.006404519081115723, -0.005910158157348633, -0.005415797233581543, -0.004921436309814453, -0.004427075386047363, -0.0039327144622802734, -0.0034383535385131836, -0.0029439926147460938, -0.002449631690979004, -0.001955270767211914, -0.0014609098434448242, -0.0009665489196777344, -0.00047218799591064453, 2.2172927856445312e-05, 0.0005165338516235352, 0.001010894775390625, 0.0015052556991577148, 0.0019996166229248047, 0.0024939775466918945, 0.0029883384704589844, 0.0034826993942260742, 0.003977060317993164, 0.004471421241760254, 0.004965782165527344, 0.005460143089294434, 0.0059545040130615234, 0.006448864936828613, 0.006943225860595703, 0.007437586784362793, 0.007931947708129883, 0.008426308631896973, 0.008920669555664062, 0.009415030479431152, 0.009909391403198242, 0.010403752326965332, 0.010898113250732422, 0.011392474174499512, 0.011886835098266602, 0.012381196022033691, 0.012875556945800781, 0.013369917869567871, 0.013864278793334961, 0.01435863971710205, 0.01485300064086914, 0.01534736156463623, 0.01584172248840332, 0.01633608341217041, 0.0168304443359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 5.0, 4.0, 2.0, 3.0, 11.0, 9.0, 9.0, 19.0, 30.0, 62.0, 115.0, 314.0, 219.0, 77.0, 40.0, 23.0, 15.0, 3.0, 8.0, 8.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017976760864257812, -0.00017371401190757751, -0.0001676604151725769, -0.0001616068184375763, -0.00015555322170257568, -0.00014949962496757507, -0.00014344602823257446, -0.00013739243149757385, -0.00013133883476257324, -0.00012528523802757263, -0.00011923164129257202, -0.00011317804455757141, -0.0001071244478225708, -0.00010107085108757019, -9.501725435256958e-05, -8.896365761756897e-05, -8.291006088256836e-05, -7.685646414756775e-05, -7.080286741256714e-05, -6.474927067756653e-05, -5.869567394256592e-05, -5.264207720756531e-05, -4.65884804725647e-05, -4.053488373756409e-05, -3.4481287002563477e-05, -2.8427690267562866e-05, -2.2374093532562256e-05, -1.6320496797561646e-05, -1.0266900062561035e-05, -4.213303327560425e-06, 1.8402934074401855e-06, 7.893890142440796e-06, 1.3947486877441406e-05, 2.0001083612442017e-05, 2.6054680347442627e-05, 3.210827708244324e-05, 3.816187381744385e-05, 4.421547055244446e-05, 5.026906728744507e-05, 5.632266402244568e-05, 6.237626075744629e-05, 6.84298574924469e-05, 7.448345422744751e-05, 8.053705096244812e-05, 8.659064769744873e-05, 9.264424443244934e-05, 9.869784116744995e-05, 0.00010475143790245056, 0.00011080503463745117, 0.00011685863137245178, 0.0001229122281074524, 0.000128965824842453, 0.0001350194215774536, 0.00014107301831245422, 0.00014712661504745483, 0.00015318021178245544, 0.00015923380851745605, 0.00016528740525245667, 0.00017134100198745728, 0.00017739459872245789, 0.0001834481954574585, 0.0001895017921924591, 0.00019555538892745972, 0.00020160898566246033, 0.00020766258239746094]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 17.0, 17.0, 35.0, 92.0, 524.0, 9922.0, 1033834.0, 3600.0, 347.0, 70.0, 24.0, 16.0, 14.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.020538330078125, -0.019922733306884766, -0.01930713653564453, -0.018691539764404297, -0.018075942993164062, -0.017460346221923828, -0.016844749450683594, -0.01622915267944336, -0.015613555908203125, -0.01499795913696289, -0.014382362365722656, -0.013766765594482422, -0.013151168823242188, -0.012535572052001953, -0.011919975280761719, -0.011304378509521484, -0.01068878173828125, -0.010073184967041016, -0.009457588195800781, -0.008841991424560547, -0.008226394653320312, -0.007610797882080078, -0.006995201110839844, -0.006379604339599609, -0.005764007568359375, -0.005148410797119141, -0.004532814025878906, -0.003917217254638672, -0.0033016204833984375, -0.002686023712158203, -0.0020704269409179688, -0.0014548301696777344, -0.0008392333984375, -0.00022363662719726562, 0.00039196014404296875, 0.0010075569152832031, 0.0016231536865234375, 0.002238750457763672, 0.0028543472290039062, 0.0034699440002441406, 0.004085540771484375, 0.004701137542724609, 0.005316734313964844, 0.005932331085205078, 0.0065479278564453125, 0.007163524627685547, 0.007779121398925781, 0.008394718170166016, 0.00901031494140625, 0.009625911712646484, 0.010241508483886719, 0.010857105255126953, 0.011472702026367188, 0.012088298797607422, 0.012703895568847656, 0.01331949234008789, 0.013935089111328125, 0.01455068588256836, 0.015166282653808594, 0.015781879425048828, 0.016397476196289062, 0.017013072967529297, 0.01762866973876953, 0.018244266510009766, 0.01885986328125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 15.0, 18.0, 35.0, 62.0, 132.0, 285.0, 199.0, 99.0, 48.0, 28.0, 17.0, 14.0, 10.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00852203369140625, -0.00824582576751709, -0.00796961784362793, -0.0076934099197387695, -0.007417201995849609, -0.007140994071960449, -0.006864786148071289, -0.006588578224182129, -0.006312370300292969, -0.006036162376403809, -0.0057599544525146484, -0.005483746528625488, -0.005207538604736328, -0.004931330680847168, -0.004655122756958008, -0.004378914833068848, -0.0041027069091796875, -0.0038264989852905273, -0.003550291061401367, -0.003274083137512207, -0.002997875213623047, -0.0027216672897338867, -0.0024454593658447266, -0.0021692514419555664, -0.0018930435180664062, -0.001616835594177246, -0.001340627670288086, -0.0010644197463989258, -0.0007882118225097656, -0.0005120038986206055, -0.0002357959747314453, 4.0411949157714844e-05, 0.000316619873046875, 0.0005928277969360352, 0.0008690357208251953, 0.0011452436447143555, 0.0014214515686035156, 0.0016976594924926758, 0.001973867416381836, 0.002250075340270996, 0.0025262832641601562, 0.0028024911880493164, 0.0030786991119384766, 0.0033549070358276367, 0.003631114959716797, 0.003907322883605957, 0.004183530807495117, 0.004459738731384277, 0.0047359466552734375, 0.005012154579162598, 0.005288362503051758, 0.005564570426940918, 0.005840778350830078, 0.006116986274719238, 0.0063931941986083984, 0.006669402122497559, 0.006945610046386719, 0.007221817970275879, 0.007498025894165039, 0.007774233818054199, 0.00805044174194336, 0.00832664966583252, 0.00860285758972168, 0.00887906551361084, 0.0091552734375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 11.0, 449.0, 531.0, 21.0, 5.0, 0.0, 2.0], "bins": [-2.8113479614257812, -2.7637081146240234, -2.7160680294036865, -2.6684279441833496, -2.620788097381592, -2.573148250579834, -2.525508165359497, -2.47786808013916, -2.4302282333374023, -2.3825883865356445, -2.3349483013153076, -2.2873082160949707, -2.239668369293213, -2.192028522491455, -2.144388437271118, -2.0967483520507812, -2.0491085052490234, -2.0014686584472656, -1.9538285732269287, -1.9061886072158813, -1.858548641204834, -1.8109086751937866, -1.7632687091827393, -1.715628743171692, -1.6679887771606445, -1.6203488111495972, -1.5727088451385498, -1.5250688791275024, -1.477428913116455, -1.4297889471054077, -1.3821489810943604, -1.334509015083313, -1.286868929862976, -1.2392289638519287, -1.1915889978408813, -1.143949031829834, -1.0963090658187866, -1.0486690998077393, -1.001029133796692, -0.9533891677856445, -0.9057492017745972, -0.8581092357635498, -0.8104692697525024, -0.7628293037414551, -0.7151893377304077, -0.6675493717193604, -0.619909405708313, -0.5722694396972656, -0.5246294736862183, -0.4769895076751709, -0.42934954166412354, -0.38170957565307617, -0.3340696096420288, -0.28642964363098145, -0.23878967761993408, -0.19114971160888672, -0.14350977540016174, -0.09586980938911438, -0.04822984337806702, -0.0005898773670196533, 0.04705008864402771, 0.09469005465507507, 0.14233002066612244, 0.1899699866771698, 0.23760995268821716]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 8.0, 6.0, 7.0, 5.0, 11.0, 22.0, 13.0, 22.0, 18.0, 25.0, 31.0, 33.0, 38.0, 34.0, 31.0, 41.0, 52.0, 53.0, 35.0, 44.0, 35.0, 41.0, 39.0, 28.0, 43.0, 30.0, 32.0, 36.0, 24.0, 37.0, 21.0, 21.0, 15.0, 11.0, 12.0, 10.0, 8.0, 7.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2521507740020752, -0.24320858716964722, -0.23426640033721924, -0.22532421350479126, -0.21638204157352448, -0.2074398547410965, -0.19849766790866852, -0.18955549597740173, -0.18061330914497375, -0.17167112231254578, -0.1627289354801178, -0.15378674864768982, -0.14484457671642303, -0.13590238988399506, -0.12696020305156708, -0.1180180236697197, -0.10907582938671112, -0.10013364255428314, -0.09119146317243576, -0.08224927634000778, -0.0733070969581604, -0.06436491012573242, -0.05542272329330444, -0.04648054391145706, -0.03753835707902908, -0.028596173971891403, -0.019653989002108574, -0.010711804032325745, -0.0017696209251880646, 0.0071725621819496155, 0.016114749014377594, 0.025056928396224976, 0.033999115228652954, 0.042941298335790634, 0.051883481442928314, 0.06082566827535629, 0.06976784765720367, 0.07871003448963165, 0.08765222132205963, 0.09659440070390701, 0.10553658753633499, 0.11447877436876297, 0.12342095375061035, 0.13236314058303833, 0.1413053274154663, 0.1502475142478943, 0.15918970108032227, 0.16813187301158905, 0.17707405984401703, 0.186016246676445, 0.19495843350887299, 0.20390060544013977, 0.21284279227256775, 0.22178497910499573, 0.2307271659374237, 0.23966935276985168, 0.24861153960227966, 0.25755372643470764, 0.2664959132671356, 0.2754381000995636, 0.2843802869319916, 0.29332244396209717, 0.30226463079452515, 0.3112068176269531, 0.3201490044593811]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 5.0, 7.0, 11.0, 9.0, 17.0, 23.0, 36.0, 66.0, 88.0, 112.0, 228.0, 476.0, 2141.0, 4187700.0, 2230.0, 468.0, 222.0, 130.0, 92.0, 69.0, 32.0, 23.0, 16.0, 22.0, 13.0, 9.0, 7.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11077880859375, -0.10737228393554688, -0.10396575927734375, -0.10055923461914062, -0.0971527099609375, -0.09374618530273438, -0.09033966064453125, -0.08693313598632812, -0.083526611328125, -0.08012008666992188, -0.07671356201171875, -0.07330703735351562, -0.0699005126953125, -0.06649398803710938, -0.06308746337890625, -0.059680938720703125, -0.0562744140625, -0.052867889404296875, -0.04946136474609375, -0.046054840087890625, -0.0426483154296875, -0.039241790771484375, -0.03583526611328125, -0.032428741455078125, -0.029022216796875, -0.025615692138671875, -0.02220916748046875, -0.018802642822265625, -0.0153961181640625, -0.011989593505859375, -0.00858306884765625, -0.005176544189453125, -0.00177001953125, 0.001636505126953125, 0.00504302978515625, 0.008449554443359375, 0.0118560791015625, 0.015262603759765625, 0.01866912841796875, 0.022075653076171875, 0.025482177734375, 0.028888702392578125, 0.03229522705078125, 0.035701751708984375, 0.0391082763671875, 0.042514801025390625, 0.04592132568359375, 0.049327850341796875, 0.052734375, 0.056140899658203125, 0.05954742431640625, 0.06295394897460938, 0.0663604736328125, 0.06976699829101562, 0.07317352294921875, 0.07658004760742188, 0.079986572265625, 0.08339309692382812, 0.08679962158203125, 0.09020614624023438, 0.0936126708984375, 0.09701919555664062, 0.10042572021484375, 0.10383224487304688, 0.10723876953125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 5.0, 6.0, 11.0, 9.0, 11.0, 19.0, 26.0, 42.0, 49.0, 52.0, 83.0, 75.0, 95.0, 83.0, 78.0, 52.0, 70.0, 49.0, 40.0, 38.0, 18.0, 17.0, 11.0, 15.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0207977294921875, -0.02015519142150879, -0.019512653350830078, -0.018870115280151367, -0.018227577209472656, -0.017585039138793945, -0.016942501068115234, -0.016299962997436523, -0.015657424926757812, -0.015014886856079102, -0.01437234878540039, -0.01372981071472168, -0.013087272644042969, -0.012444734573364258, -0.011802196502685547, -0.011159658432006836, -0.010517120361328125, -0.009874582290649414, -0.009232044219970703, -0.008589506149291992, -0.007946968078613281, -0.00730443000793457, -0.006661891937255859, -0.0060193538665771484, -0.0053768157958984375, -0.0047342777252197266, -0.004091739654541016, -0.0034492015838623047, -0.0028066635131835938, -0.002164125442504883, -0.0015215873718261719, -0.0008790493011474609, -0.00023651123046875, 0.00040602684020996094, 0.0010485649108886719, 0.0016911029815673828, 0.0023336410522460938, 0.0029761791229248047, 0.0036187171936035156, 0.0042612552642822266, 0.0049037933349609375, 0.0055463314056396484, 0.006188869476318359, 0.00683140754699707, 0.007473945617675781, 0.008116483688354492, 0.008759021759033203, 0.009401559829711914, 0.010044097900390625, 0.010686635971069336, 0.011329174041748047, 0.011971712112426758, 0.012614250183105469, 0.01325678825378418, 0.01389932632446289, 0.014541864395141602, 0.015184402465820312, 0.015826940536499023, 0.016469478607177734, 0.017112016677856445, 0.017754554748535156, 0.018397092819213867, 0.019039630889892578, 0.01968216896057129, 0.02032470703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 9.0, 15.0, 38.0, 111.0, 416.0, 1997.0, 14459.0, 4169203.0, 6231.0, 1375.0, 316.0, 63.0, 20.0, 4.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.052276611328125, -0.0505523681640625, -0.048828125, -0.0471038818359375, -0.045379638671875, -0.0436553955078125, -0.04193115234375, -0.0402069091796875, -0.038482666015625, -0.0367584228515625, -0.0350341796875, -0.0333099365234375, -0.031585693359375, -0.0298614501953125, -0.02813720703125, -0.0264129638671875, -0.024688720703125, -0.0229644775390625, -0.021240234375, -0.0195159912109375, -0.017791748046875, -0.0160675048828125, -0.01434326171875, -0.0126190185546875, -0.010894775390625, -0.0091705322265625, -0.0074462890625, -0.0057220458984375, -0.003997802734375, -0.0022735595703125, -0.00054931640625, 0.0011749267578125, 0.002899169921875, 0.0046234130859375, 0.00634765625, 0.0080718994140625, 0.009796142578125, 0.0115203857421875, 0.01324462890625, 0.0149688720703125, 0.016693115234375, 0.0184173583984375, 0.0201416015625, 0.0218658447265625, 0.023590087890625, 0.0253143310546875, 0.02703857421875, 0.0287628173828125, 0.030487060546875, 0.0322113037109375, 0.033935546875, 0.0356597900390625, 0.037384033203125, 0.0391082763671875, 0.04083251953125, 0.0425567626953125, 0.044281005859375, 0.0460052490234375, 0.0477294921875, 0.0494537353515625, 0.051177978515625, 0.0529022216796875, 0.05462646484375, 0.0563507080078125, 0.058074951171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 18.0, 36.0, 146.0, 3799.0, 20.0, 14.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01149749755859375, -0.011160492897033691, -0.010823488235473633, -0.010486483573913574, -0.010149478912353516, -0.009812474250793457, -0.009475469589233398, -0.00913846492767334, -0.008801460266113281, -0.008464455604553223, -0.008127450942993164, -0.0077904462814331055, -0.007453441619873047, -0.007116436958312988, -0.00677943229675293, -0.006442427635192871, -0.0061054229736328125, -0.005768418312072754, -0.005431413650512695, -0.005094408988952637, -0.004757404327392578, -0.0044203996658325195, -0.004083395004272461, -0.0037463903427124023, -0.0034093856811523438, -0.003072381019592285, -0.0027353763580322266, -0.002398371696472168, -0.0020613670349121094, -0.0017243623733520508, -0.0013873577117919922, -0.0010503530502319336, -0.000713348388671875, -0.0003763437271118164, -3.933906555175781e-05, 0.0002976655960083008, 0.0006346702575683594, 0.000971674919128418, 0.0013086795806884766, 0.0016456842422485352, 0.0019826889038085938, 0.0023196935653686523, 0.002656698226928711, 0.0029937028884887695, 0.003330707550048828, 0.0036677122116088867, 0.004004716873168945, 0.004341721534729004, 0.0046787261962890625, 0.005015730857849121, 0.00535273551940918, 0.005689740180969238, 0.006026744842529297, 0.0063637495040893555, 0.006700754165649414, 0.007037758827209473, 0.007374763488769531, 0.00771176815032959, 0.008048772811889648, 0.008385777473449707, 0.008722782135009766, 0.009059786796569824, 0.009396791458129883, 0.009733796119689941, 0.01007080078125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 18.0, 826.0, 164.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16483236849308014, -0.16170695424079895, -0.15858155488967896, -0.15545614063739777, -0.15233074128627777, -0.14920532703399658, -0.1460799276828766, -0.1429545134305954, -0.1398291140794754, -0.1367036998271942, -0.13357830047607422, -0.13045288622379303, -0.12732748687267303, -0.12420208007097244, -0.12107667326927185, -0.11795126646757126, -0.11482585966587067, -0.11170045286417007, -0.10857504606246948, -0.10544963926076889, -0.1023242324590683, -0.0991988256573677, -0.09607341885566711, -0.09294801205396652, -0.08982259780168533, -0.08669719099998474, -0.08357178419828415, -0.08044637739658356, -0.07732097059488297, -0.07419556379318237, -0.07107015699148178, -0.06794475018978119, -0.0648193359375, -0.06169392913579941, -0.058568522334098816, -0.055443115532398224, -0.05231770873069763, -0.04919230192899704, -0.04606689512729645, -0.042941488325595856, -0.039816081523895264, -0.03669067472219467, -0.03356526792049408, -0.030439861118793488, -0.027314454317092896, -0.024189045652747154, -0.021063638851046562, -0.01793823204934597, -0.014812827110290527, -0.011687420308589935, -0.008562013506889343, -0.005436605773866177, -0.0023111989721655846, 0.0008142087608575821, 0.003939615562558174, 0.007065022364258766, 0.010190429165959358, 0.01331583596765995, 0.016441242769360542, 0.019566651433706284, 0.022692058235406876, 0.025817465037107468, 0.02894287183880806, 0.03206827864050865, 0.035193685442209244]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 4.0, 4.0, 6.0, 10.0, 10.0, 10.0, 11.0, 15.0, 18.0, 21.0, 23.0, 27.0, 26.0, 30.0, 26.0, 41.0, 45.0, 41.0, 36.0, 46.0, 44.0, 39.0, 38.0, 35.0, 47.0, 40.0, 28.0, 36.0, 22.0, 29.0, 23.0, 23.0, 21.0, 18.0, 17.0, 12.0, 14.0, 10.0, 7.0, 10.0, 6.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.011601507663726807, -0.011241189204156399, -0.010880870744585991, -0.010520552285015583, -0.010160233825445175, -0.009799915365874767, -0.00943959690630436, -0.009079278446733952, -0.008718959987163544, -0.008358641527593136, -0.007998323068022728, -0.00763800460845232, -0.007277686148881912, -0.006917367689311504, -0.0065570492297410965, -0.006196730770170689, -0.005836412310600281, -0.005476093851029873, -0.005115775391459465, -0.004755456931889057, -0.004395138472318649, -0.004034820012748241, -0.0036745015531778336, -0.0033141830936074257, -0.002953864634037018, -0.00259354617446661, -0.002233227714896202, -0.0018729092553257942, -0.0015125907957553864, -0.0011522723361849785, -0.0007919538766145706, -0.00043163541704416275, -7.131695747375488e-05, 0.000289001502096653, 0.0006493199616670609, 0.0010096384212374687, 0.0013699568808078766, 0.0017302753403782845, 0.0020905937999486923, 0.0024509122595191, 0.002811230719089508, 0.003171549178659916, 0.003531867638230324, 0.0038921860978007317, 0.0042525045573711395, 0.004612823016941547, 0.004973141476511955, 0.005333459936082363, 0.005693778395652771, 0.006054096855223179, 0.006414415314793587, 0.006774733774363995, 0.0071350522339344025, 0.00749537069350481, 0.007855689153075218, 0.008216007612645626, 0.008576326072216034, 0.008936644531786442, 0.00929696299135685, 0.009657281450927258, 0.010017599910497665, 0.010377918370068073, 0.010738236829638481, 0.011098555289208889, 0.011458873748779297]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 13.0, 13.0, 12.0, 16.0, 31.0, 51.0, 72.0, 118.0, 166.0, 271.0, 475.0, 762.0, 1375.0, 2772.0, 5725.0, 13108.0, 37134.0, 146360.0, 644157.0, 136419.0, 35297.0, 12616.0, 5527.0, 2654.0, 1414.0, 773.0, 415.0, 303.0, 175.0, 103.0, 72.0, 43.0, 31.0, 32.0, 15.0, 9.0, 4.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035919189453125, -0.03477811813354492, -0.033637046813964844, -0.032495975494384766, -0.03135490417480469, -0.03021383285522461, -0.02907276153564453, -0.027931690216064453, -0.026790618896484375, -0.025649547576904297, -0.02450847625732422, -0.02336740493774414, -0.022226333618164062, -0.021085262298583984, -0.019944190979003906, -0.018803119659423828, -0.01766204833984375, -0.016520977020263672, -0.015379905700683594, -0.014238834381103516, -0.013097763061523438, -0.01195669174194336, -0.010815620422363281, -0.009674549102783203, -0.008533477783203125, -0.007392406463623047, -0.006251335144042969, -0.005110263824462891, -0.0039691925048828125, -0.0028281211853027344, -0.0016870498657226562, -0.0005459785461425781, 0.0005950927734375, 0.0017361640930175781, 0.0028772354125976562, 0.004018306732177734, 0.0051593780517578125, 0.006300449371337891, 0.007441520690917969, 0.008582592010498047, 0.009723663330078125, 0.010864734649658203, 0.012005805969238281, 0.01314687728881836, 0.014287948608398438, 0.015429019927978516, 0.016570091247558594, 0.017711162567138672, 0.01885223388671875, 0.019993305206298828, 0.021134376525878906, 0.022275447845458984, 0.023416519165039062, 0.02455759048461914, 0.02569866180419922, 0.026839733123779297, 0.027980804443359375, 0.029121875762939453, 0.03026294708251953, 0.03140401840209961, 0.03254508972167969, 0.033686161041259766, 0.034827232360839844, 0.03596830368041992, 0.037109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 11.0, 5.0, 15.0, 14.0, 30.0, 41.0, 47.0, 50.0, 87.0, 72.0, 100.0, 81.0, 81.0, 53.0, 68.0, 45.0, 45.0, 31.0, 22.0, 17.0, 12.0, 14.0, 11.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02069091796875, -0.02005171775817871, -0.019412517547607422, -0.018773317337036133, -0.018134117126464844, -0.017494916915893555, -0.016855716705322266, -0.016216516494750977, -0.015577316284179688, -0.014938116073608398, -0.01429891586303711, -0.01365971565246582, -0.013020515441894531, -0.012381315231323242, -0.011742115020751953, -0.011102914810180664, -0.010463714599609375, -0.009824514389038086, -0.009185314178466797, -0.008546113967895508, -0.007906913757324219, -0.00726771354675293, -0.006628513336181641, -0.0059893131256103516, -0.0053501129150390625, -0.0047109127044677734, -0.004071712493896484, -0.0034325122833251953, -0.0027933120727539062, -0.002154111862182617, -0.0015149116516113281, -0.0008757114410400391, -0.00023651123046875, 0.00040268898010253906, 0.0010418891906738281, 0.0016810894012451172, 0.0023202896118164062, 0.0029594898223876953, 0.0035986900329589844, 0.0042378902435302734, 0.0048770904541015625, 0.0055162906646728516, 0.006155490875244141, 0.00679469108581543, 0.007433891296386719, 0.008073091506958008, 0.008712291717529297, 0.009351491928100586, 0.009990692138671875, 0.010629892349243164, 0.011269092559814453, 0.011908292770385742, 0.012547492980957031, 0.01318669319152832, 0.01382589340209961, 0.014465093612670898, 0.015104293823242188, 0.015743494033813477, 0.016382694244384766, 0.017021894454956055, 0.017661094665527344, 0.018300294876098633, 0.018939495086669922, 0.01957869529724121, 0.0202178955078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 2.0, 5.0, 4.0, 6.0, 8.0, 10.0, 15.0, 15.0, 12.0, 22.0, 29.0, 34.0, 32.0, 44.0, 64.0, 82.0, 106.0, 133.0, 220.0, 429.0, 935.0, 4763.0, 113487.0, 907729.0, 16847.0, 1906.0, 607.0, 271.0, 179.0, 134.0, 107.0, 56.0, 56.0, 35.0, 26.0, 27.0, 20.0, 20.0, 25.0, 6.0, 9.0, 10.0, 4.0, 4.0, 4.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.098388671875, -0.09513568878173828, -0.09188270568847656, -0.08862972259521484, -0.08537673950195312, -0.0821237564086914, -0.07887077331542969, -0.07561779022216797, -0.07236480712890625, -0.06911182403564453, -0.06585884094238281, -0.0626058578491211, -0.059352874755859375, -0.056099891662597656, -0.05284690856933594, -0.04959392547607422, -0.0463409423828125, -0.04308795928955078, -0.03983497619628906, -0.036581993103027344, -0.033329010009765625, -0.030076026916503906, -0.026823043823242188, -0.02357006072998047, -0.02031707763671875, -0.01706409454345703, -0.013811111450195312, -0.010558128356933594, -0.007305145263671875, -0.004052162170410156, -0.0007991790771484375, 0.0024538040161132812, 0.005706787109375, 0.008959770202636719, 0.012212753295898438, 0.015465736389160156, 0.018718719482421875, 0.021971702575683594, 0.025224685668945312, 0.02847766876220703, 0.03173065185546875, 0.03498363494873047, 0.03823661804199219, 0.041489601135253906, 0.044742584228515625, 0.047995567321777344, 0.05124855041503906, 0.05450153350830078, 0.0577545166015625, 0.06100749969482422, 0.06426048278808594, 0.06751346588134766, 0.07076644897460938, 0.0740194320678711, 0.07727241516113281, 0.08052539825439453, 0.08377838134765625, 0.08703136444091797, 0.09028434753417969, 0.0935373306274414, 0.09679031372070312, 0.10004329681396484, 0.10329627990722656, 0.10654926300048828, 0.10980224609375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 9.0, 5.0, 11.0, 15.0, 13.0, 15.0, 24.0, 23.0, 20.0, 27.0, 26.0, 28.0, 36.0, 39.0, 36.0, 40.0, 52.0, 43.0, 27.0, 42.0, 44.0, 49.0, 37.0, 32.0, 34.0, 37.0, 34.0, 34.0, 20.0, 21.0, 20.0, 18.0, 12.0, 6.0, 14.0, 8.0, 8.0, 6.0, 4.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.052642822265625, -0.051000118255615234, -0.04935741424560547, -0.0477147102355957, -0.04607200622558594, -0.04442930221557617, -0.042786598205566406, -0.04114389419555664, -0.039501190185546875, -0.03785848617553711, -0.036215782165527344, -0.03457307815551758, -0.03293037414550781, -0.03128767013549805, -0.02964496612548828, -0.028002262115478516, -0.02635955810546875, -0.024716854095458984, -0.02307415008544922, -0.021431446075439453, -0.019788742065429688, -0.018146038055419922, -0.016503334045410156, -0.01486063003540039, -0.013217926025390625, -0.01157522201538086, -0.009932518005371094, -0.008289813995361328, -0.0066471099853515625, -0.005004405975341797, -0.0033617019653320312, -0.0017189979553222656, -7.62939453125e-05, 0.0015664100646972656, 0.0032091140747070312, 0.004851818084716797, 0.0064945220947265625, 0.008137226104736328, 0.009779930114746094, 0.01142263412475586, 0.013065338134765625, 0.01470804214477539, 0.016350746154785156, 0.017993450164794922, 0.019636154174804688, 0.021278858184814453, 0.02292156219482422, 0.024564266204833984, 0.02620697021484375, 0.027849674224853516, 0.02949237823486328, 0.031135082244873047, 0.03277778625488281, 0.03442049026489258, 0.036063194274902344, 0.03770589828491211, 0.039348602294921875, 0.04099130630493164, 0.042634010314941406, 0.04427671432495117, 0.04591941833496094, 0.0475621223449707, 0.04920482635498047, 0.050847530364990234, 0.052490234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 4.0, 11.0, 11.0, 18.0, 24.0, 26.0, 45.0, 49.0, 68.0, 105.0, 153.0, 351.0, 1463.0, 8400.0, 909885.0, 121765.0, 4451.0, 940.0, 300.0, 142.0, 82.0, 52.0, 43.0, 32.0, 24.0, 20.0, 11.0, 13.0, 7.0, 9.0, 5.0, 4.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00897979736328125, -0.008714556694030762, -0.008449316024780273, -0.008184075355529785, -0.007918834686279297, -0.007653594017028809, -0.00738835334777832, -0.007123112678527832, -0.006857872009277344, -0.0065926313400268555, -0.006327390670776367, -0.006062150001525879, -0.005796909332275391, -0.005531668663024902, -0.005266427993774414, -0.005001187324523926, -0.0047359466552734375, -0.004470705986022949, -0.004205465316772461, -0.003940224647521973, -0.0036749839782714844, -0.003409743309020996, -0.003144502639770508, -0.0028792619705200195, -0.0026140213012695312, -0.002348780632019043, -0.0020835399627685547, -0.0018182992935180664, -0.0015530586242675781, -0.0012878179550170898, -0.0010225772857666016, -0.0007573366165161133, -0.000492095947265625, -0.00022685527801513672, 3.838539123535156e-05, 0.00030362606048583984, 0.0005688667297363281, 0.0008341073989868164, 0.0010993480682373047, 0.001364588737487793, 0.0016298294067382812, 0.0018950700759887695, 0.002160310745239258, 0.002425551414489746, 0.0026907920837402344, 0.0029560327529907227, 0.003221273422241211, 0.0034865140914916992, 0.0037517547607421875, 0.004016995429992676, 0.004282236099243164, 0.004547476768493652, 0.004812717437744141, 0.005077958106994629, 0.005343198776245117, 0.0056084394454956055, 0.005873680114746094, 0.006138920783996582, 0.00640416145324707, 0.006669402122497559, 0.006934642791748047, 0.007199883460998535, 0.0074651241302490234, 0.007730364799499512, 0.00799560546875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 2.0, 6.0, 11.0, 8.0, 16.0, 42.0, 70.0, 346.0, 290.0, 74.0, 25.0, 16.0, 8.0, 5.0, 6.0, 2.0, 7.0, 4.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0003542900085449219, -0.0003444477915763855, -0.0003346055746078491, -0.00032476335763931274, -0.00031492114067077637, -0.00030507892370224, -0.0002952367067337036, -0.00028539448976516724, -0.00027555227279663086, -0.0002657100558280945, -0.0002558678388595581, -0.00024602562189102173, -0.00023618340492248535, -0.00022634118795394897, -0.0002164989709854126, -0.00020665675401687622, -0.00019681453704833984, -0.00018697232007980347, -0.0001771301031112671, -0.0001672878861427307, -0.00015744566917419434, -0.00014760345220565796, -0.00013776123523712158, -0.0001279190182685852, -0.00011807680130004883, -0.00010823458433151245, -9.839236736297607e-05, -8.85501503944397e-05, -7.870793342590332e-05, -6.886571645736694e-05, -5.9023499488830566e-05, -4.918128252029419e-05, -3.933906555175781e-05, -2.9496848583221436e-05, -1.965463161468506e-05, -9.812414646148682e-06, 2.9802322387695312e-08, 9.872019290924072e-06, 1.971423625946045e-05, 2.9556453227996826e-05, 3.93986701965332e-05, 4.924088716506958e-05, 5.908310413360596e-05, 6.892532110214233e-05, 7.876753807067871e-05, 8.860975503921509e-05, 9.845197200775146e-05, 0.00010829418897628784, 0.00011813640594482422, 0.0001279786229133606, 0.00013782083988189697, 0.00014766305685043335, 0.00015750527381896973, 0.0001673474907875061, 0.00017718970775604248, 0.00018703192472457886, 0.00019687414169311523, 0.0002067163586616516, 0.000216558575630188, 0.00022640079259872437, 0.00023624300956726074, 0.0002460852265357971, 0.0002559274435043335, 0.0002657696604728699, 0.00027561187744140625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 7.0, 8.0, 12.0, 13.0, 22.0, 37.0, 76.0, 151.0, 443.0, 3135.0, 983800.0, 58693.0, 1514.0, 354.0, 103.0, 70.0, 35.0, 22.0, 15.0, 18.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02386474609375, -0.023216962814331055, -0.02256917953491211, -0.021921396255493164, -0.02127361297607422, -0.020625829696655273, -0.019978046417236328, -0.019330263137817383, -0.018682479858398438, -0.018034696578979492, -0.017386913299560547, -0.0167391300201416, -0.016091346740722656, -0.015443563461303711, -0.014795780181884766, -0.01414799690246582, -0.013500213623046875, -0.01285243034362793, -0.012204647064208984, -0.011556863784790039, -0.010909080505371094, -0.010261297225952148, -0.009613513946533203, -0.008965730667114258, -0.008317947387695312, -0.007670164108276367, -0.007022380828857422, -0.0063745975494384766, -0.005726814270019531, -0.005079030990600586, -0.004431247711181641, -0.0037834644317626953, -0.00313568115234375, -0.0024878978729248047, -0.0018401145935058594, -0.001192331314086914, -0.0005445480346679688, 0.00010323524475097656, 0.0007510185241699219, 0.0013988018035888672, 0.0020465850830078125, 0.002694368362426758, 0.003342151641845703, 0.0039899349212646484, 0.004637718200683594, 0.005285501480102539, 0.005933284759521484, 0.00658106803894043, 0.007228851318359375, 0.00787663459777832, 0.008524417877197266, 0.009172201156616211, 0.009819984436035156, 0.010467767715454102, 0.011115550994873047, 0.011763334274291992, 0.012411117553710938, 0.013058900833129883, 0.013706684112548828, 0.014354467391967773, 0.015002250671386719, 0.015650033950805664, 0.01629781723022461, 0.016945600509643555, 0.0175933837890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 14.0, 10.0, 10.0, 15.0, 25.0, 42.0, 55.0, 130.0, 245.0, 196.0, 93.0, 54.0, 40.0, 20.0, 16.0, 8.0, 7.0, 3.0, 6.0, 3.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008514404296875, -0.008172154426574707, -0.007829904556274414, -0.007487654685974121, -0.007145404815673828, -0.006803154945373535, -0.006460905075073242, -0.006118655204772949, -0.005776405334472656, -0.005434155464172363, -0.00509190559387207, -0.004749655723571777, -0.004407405853271484, -0.004065155982971191, -0.0037229061126708984, -0.0033806562423706055, -0.0030384063720703125, -0.0026961565017700195, -0.0023539066314697266, -0.0020116567611694336, -0.0016694068908691406, -0.0013271570205688477, -0.0009849071502685547, -0.0006426572799682617, -0.00030040740966796875, 4.184246063232422e-05, 0.0003840923309326172, 0.0007263422012329102, 0.0010685920715332031, 0.001410841941833496, 0.001753091812133789, 0.002095341682434082, 0.002437591552734375, 0.002779841423034668, 0.003122091293334961, 0.003464341163635254, 0.003806591033935547, 0.00414884090423584, 0.004491090774536133, 0.004833340644836426, 0.005175590515136719, 0.005517840385437012, 0.005860090255737305, 0.006202340126037598, 0.006544589996337891, 0.006886839866638184, 0.0072290897369384766, 0.0075713396072387695, 0.007913589477539062, 0.008255839347839355, 0.008598089218139648, 0.008940339088439941, 0.009282588958740234, 0.009624838829040527, 0.00996708869934082, 0.010309338569641113, 0.010651588439941406, 0.0109938383102417, 0.011336088180541992, 0.011678338050842285, 0.012020587921142578, 0.012362837791442871, 0.012705087661743164, 0.013047337532043457, 0.01338958740234375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 116.0, 803.0, 82.0, 8.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9232122898101807, -1.8808120489120483, -1.8384116888046265, -1.7960114479064941, -1.7536112070083618, -1.7112109661102295, -1.6688106060028076, -1.6264103651046753, -1.584010124206543, -1.5416098833084106, -1.4992095232009888, -1.4568092823028564, -1.4144090414047241, -1.3720088005065918, -1.32960844039917, -1.2872081995010376, -1.2448078393936157, -1.2024075984954834, -1.1600072383880615, -1.1176069974899292, -1.0752067565917969, -1.032806396484375, -0.9904061555862427, -0.9480059146881104, -0.9056056141853333, -0.8632053136825562, -0.8208050727844238, -0.7784047722816467, -0.7360044717788696, -0.6936042308807373, -0.6512039303779602, -0.6088036298751831, -0.5664033889770508, -0.5240030884742737, -0.48160284757614136, -0.43920254707336426, -0.39680227637290955, -0.35440200567245483, -0.31200170516967773, -0.269601434469223, -0.2272011637687683, -0.1848008930683136, -0.1424006074666977, -0.10000032186508179, -0.057600051164627075, -0.015199780464172363, 0.027200520038604736, 0.06960079073905945, 0.11200106143951416, 0.15440133213996887, 0.19680161774158478, 0.23920190334320068, 0.2816021740436554, 0.3240024447441101, 0.3664027452468872, 0.4088030159473419, 0.45120328664779663, 0.49360355734825134, 0.536003828048706, 0.5784041285514832, 0.6208044290542603, 0.6632046699523926, 0.7056049704551697, 0.7480052709579468, 0.7904055118560791]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 6.0, 9.0, 10.0, 6.0, 11.0, 13.0, 13.0, 15.0, 13.0, 19.0, 35.0, 33.0, 27.0, 37.0, 33.0, 47.0, 37.0, 43.0, 36.0, 57.0, 52.0, 45.0, 33.0, 48.0, 31.0, 39.0, 31.0, 32.0, 27.0, 40.0, 28.0, 13.0, 20.0, 16.0, 10.0, 13.0, 8.0, 3.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2909756302833557, -0.2822502851486206, -0.2735249400138855, -0.2647995948791504, -0.2560742497444153, -0.24734888970851898, -0.23862352967262268, -0.22989818453788757, -0.22117283940315247, -0.21244749426841736, -0.20372214913368225, -0.19499678909778595, -0.18627144396305084, -0.17754609882831573, -0.16882073879241943, -0.16009539365768433, -0.15137004852294922, -0.1426447033882141, -0.133919358253479, -0.1251939982175827, -0.1164686530828476, -0.10774330794811249, -0.09901795536279678, -0.09029260277748108, -0.08156725764274597, -0.07284191250801086, -0.06411655992269516, -0.055391211062669754, -0.04666586220264435, -0.03794051334261894, -0.029215164482593536, -0.02048981562256813, -0.011764466762542725, -0.0030391179025173187, 0.005686230957508087, 0.014411579817533493, 0.0231369286775589, 0.031862277537584305, 0.04058762639760971, 0.04931297525763512, 0.05803832411766052, 0.06676366925239563, 0.07548902183771133, 0.08421437442302704, 0.09293971955776215, 0.10166506469249725, 0.11039041727781296, 0.11911576986312866, 0.12784111499786377, 0.13656646013259888, 0.14529180526733398, 0.15401716530323029, 0.1627425104379654, 0.1714678555727005, 0.1801932156085968, 0.1889185607433319, 0.19764390587806702, 0.20636925101280212, 0.21509459614753723, 0.22381995618343353, 0.23254530131816864, 0.24127064645290375, 0.24999600648880005, 0.25872135162353516, 0.26744669675827026]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 15.0, 12.0, 25.0, 42.0, 53.0, 102.0, 132.0, 277.0, 626.0, 6930.0, 4184543.0, 732.0, 279.0, 166.0, 115.0, 64.0, 36.0, 31.0, 16.0, 13.0, 14.0, 7.0, 9.0, 3.0, 9.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2578125, -0.24978256225585938, -0.24175262451171875, -0.23372268676757812, -0.2256927490234375, -0.21766281127929688, -0.20963287353515625, -0.20160293579101562, -0.193572998046875, -0.18554306030273438, -0.17751312255859375, -0.16948318481445312, -0.1614532470703125, -0.15342330932617188, -0.14539337158203125, -0.13736343383789062, -0.12933349609375, -0.12130355834960938, -0.11327362060546875, -0.10524368286132812, -0.0972137451171875, -0.08918380737304688, -0.08115386962890625, -0.07312393188476562, -0.065093994140625, -0.057064056396484375, -0.04903411865234375, -0.041004180908203125, -0.0329742431640625, -0.024944305419921875, -0.01691436767578125, -0.008884429931640625, -0.0008544921875, 0.007175445556640625, 0.01520538330078125, 0.023235321044921875, 0.0312652587890625, 0.039295196533203125, 0.04732513427734375, 0.055355072021484375, 0.063385009765625, 0.07141494750976562, 0.07944488525390625, 0.08747482299804688, 0.0955047607421875, 0.10353469848632812, 0.11156463623046875, 0.11959457397460938, 0.12762451171875, 0.13565444946289062, 0.14368438720703125, 0.15171432495117188, 0.1597442626953125, 0.16777420043945312, 0.17580413818359375, 0.18383407592773438, 0.191864013671875, 0.19989395141601562, 0.20792388916015625, 0.21595382690429688, 0.2239837646484375, 0.23201370239257812, 0.24004364013671875, 0.24807357788085938, 0.256103515625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 11.0, 10.0, 11.0, 18.0, 25.0, 35.0, 55.0, 51.0, 79.0, 90.0, 92.0, 105.0, 67.0, 59.0, 61.0, 59.0, 46.0, 23.0, 21.0, 19.0, 11.0, 10.0, 6.0, 6.0, 7.0, 7.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020751953125, -0.020109176635742188, -0.019466400146484375, -0.018823623657226562, -0.01818084716796875, -0.017538070678710938, -0.016895294189453125, -0.016252517700195312, -0.0156097412109375, -0.014966964721679688, -0.014324188232421875, -0.013681411743164062, -0.01303863525390625, -0.012395858764648438, -0.011753082275390625, -0.011110305786132812, -0.010467529296875, -0.009824752807617188, -0.009181976318359375, -0.008539199829101562, -0.00789642333984375, -0.0072536468505859375, -0.006610870361328125, -0.0059680938720703125, -0.0053253173828125, -0.0046825408935546875, -0.004039764404296875, -0.0033969879150390625, -0.00275421142578125, -0.0021114349365234375, -0.001468658447265625, -0.0008258819580078125, -0.00018310546875, 0.0004596710205078125, 0.001102447509765625, 0.0017452239990234375, 0.00238800048828125, 0.0030307769775390625, 0.003673553466796875, 0.0043163299560546875, 0.0049591064453125, 0.0056018829345703125, 0.006244659423828125, 0.0068874359130859375, 0.00753021240234375, 0.008172988891601562, 0.008815765380859375, 0.009458541870117188, 0.010101318359375, 0.010744094848632812, 0.011386871337890625, 0.012029647827148438, 0.01267242431640625, 0.013315200805664062, 0.013957977294921875, 0.014600753784179688, 0.0152435302734375, 0.015886306762695312, 0.016529083251953125, 0.017171859741210938, 0.01781463623046875, 0.018457412719726562, 0.019100189208984375, 0.019742965698242188, 0.0203857421875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 39.0, 128.0, 484.0, 7355.0, 4184123.0, 1783.0, 281.0, 51.0, 25.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08624267578125, -0.0832986831665039, -0.08035469055175781, -0.07741069793701172, -0.07446670532226562, -0.07152271270751953, -0.06857872009277344, -0.06563472747802734, -0.06269073486328125, -0.059746742248535156, -0.05680274963378906, -0.05385875701904297, -0.050914764404296875, -0.04797077178955078, -0.04502677917480469, -0.042082786560058594, -0.0391387939453125, -0.036194801330566406, -0.03325080871582031, -0.03030681610107422, -0.027362823486328125, -0.02441883087158203, -0.021474838256835938, -0.018530845642089844, -0.01558685302734375, -0.012642860412597656, -0.009698867797851562, -0.006754875183105469, -0.003810882568359375, -0.0008668899536132812, 0.0020771026611328125, 0.005021095275878906, 0.007965087890625, 0.010909080505371094, 0.013853073120117188, 0.01679706573486328, 0.019741058349609375, 0.02268505096435547, 0.025629043579101562, 0.028573036193847656, 0.03151702880859375, 0.034461021423339844, 0.03740501403808594, 0.04034900665283203, 0.043292999267578125, 0.04623699188232422, 0.04918098449707031, 0.052124977111816406, 0.0550689697265625, 0.058012962341308594, 0.06095695495605469, 0.06390094757080078, 0.06684494018554688, 0.06978893280029297, 0.07273292541503906, 0.07567691802978516, 0.07862091064453125, 0.08156490325927734, 0.08450889587402344, 0.08745288848876953, 0.09039688110351562, 0.09334087371826172, 0.09628486633300781, 0.0992288589477539, 0.1021728515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 9.0, 12.0, 46.0, 3682.0, 246.0, 40.0, 18.0, 9.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018341064453125, -0.017800092697143555, -0.01725912094116211, -0.016718149185180664, -0.01617717742919922, -0.015636205673217773, -0.015095233917236328, -0.014554262161254883, -0.014013290405273438, -0.013472318649291992, -0.012931346893310547, -0.012390375137329102, -0.011849403381347656, -0.011308431625366211, -0.010767459869384766, -0.01022648811340332, -0.009685516357421875, -0.00914454460144043, -0.008603572845458984, -0.008062601089477539, -0.007521629333496094, -0.0069806575775146484, -0.006439685821533203, -0.005898714065551758, -0.0053577423095703125, -0.004816770553588867, -0.004275798797607422, -0.0037348270416259766, -0.0031938552856445312, -0.002652883529663086, -0.0021119117736816406, -0.0015709400177001953, -0.00102996826171875, -0.0004889965057373047, 5.1975250244140625e-05, 0.0005929470062255859, 0.0011339187622070312, 0.0016748905181884766, 0.002215862274169922, 0.002756834030151367, 0.0032978057861328125, 0.003838777542114258, 0.004379749298095703, 0.0049207210540771484, 0.005461692810058594, 0.006002664566040039, 0.006543636322021484, 0.00708460807800293, 0.007625579833984375, 0.00816655158996582, 0.008707523345947266, 0.009248495101928711, 0.009789466857910156, 0.010330438613891602, 0.010871410369873047, 0.011412382125854492, 0.011953353881835938, 0.012494325637817383, 0.013035297393798828, 0.013576269149780273, 0.014117240905761719, 0.014658212661743164, 0.01519918441772461, 0.015740156173706055, 0.0162811279296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 24.0, 254.0, 689.0, 39.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1266936957836151, -0.12328440696001053, -0.11987511813640594, -0.11646582931280136, -0.11305654048919678, -0.1096472516655922, -0.10623796284198761, -0.10282867401838303, -0.09941938519477844, -0.09601009637117386, -0.09260080754756927, -0.08919151872396469, -0.08578222990036011, -0.08237294107675552, -0.07896365225315094, -0.07555436342954636, -0.07214507460594177, -0.06873578578233719, -0.0653264969587326, -0.06191720813512802, -0.05850791931152344, -0.055098630487918854, -0.05168934166431427, -0.048280052840709686, -0.0448707640171051, -0.04146147519350052, -0.038052186369895935, -0.03464289754629135, -0.031233608722686768, -0.027824319899082184, -0.0244150310754776, -0.021005742251873016, -0.017596445977687836, -0.014187157154083252, -0.010777868330478668, -0.0073685795068740845, -0.003959290683269501, -0.000550001859664917, 0.0028592869639396667, 0.0062685757875442505, 0.009677864611148834, 0.013087153434753418, 0.016496442258358, 0.019905731081962585, 0.02331501990556717, 0.026724308729171753, 0.030133597552776337, 0.03354288637638092, 0.036952175199985504, 0.04036146402359009, 0.04377075284719467, 0.047180041670799255, 0.05058933049440384, 0.05399861931800842, 0.05740790814161301, 0.06081719696521759, 0.06422648578882217, 0.06763577461242676, 0.07104506343603134, 0.07445435225963593, 0.07786364108324051, 0.08127292990684509, 0.08468221873044968, 0.08809150755405426, 0.09150079637765884]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 10.0, 11.0, 12.0, 22.0, 26.0, 24.0, 27.0, 31.0, 41.0, 42.0, 52.0, 44.0, 56.0, 56.0, 70.0, 64.0, 45.0, 54.0, 45.0, 50.0, 42.0, 29.0, 39.0, 19.0, 20.0, 14.0, 17.0, 12.0, 5.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.018992483615875244, -0.0183461494743824, -0.017699817195534706, -0.01705348491668701, -0.016407150775194168, -0.015760816633701324, -0.01511448435485363, -0.014468151144683361, -0.013821817934513092, -0.013175484724342823, -0.012529151514172554, -0.011882818304002285, -0.011236485093832016, -0.010590151883661747, -0.009943818673491478, -0.009297485463321209, -0.00865115225315094, -0.008004819042980671, -0.007358485832810402, -0.006712152622640133, -0.006065819412469864, -0.005419486202299595, -0.004773152992129326, -0.004126819781959057, -0.003480486571788788, -0.002834153361618519, -0.00218782015144825, -0.0015414869412779808, -0.0008951537311077118, -0.0002488205209374428, 0.00039751268923282623, 0.0010438458994030952, 0.0016901791095733643, 0.0023365123197436333, 0.0029828455299139023, 0.0036291787400841713, 0.00427551195025444, 0.004921845160424709, 0.005568178370594978, 0.006214511580765247, 0.006860844790935516, 0.007507178001105785, 0.008153511211276054, 0.008799844421446323, 0.009446177631616592, 0.010092510841786861, 0.01073884405195713, 0.0113851772621274, 0.012031510472297668, 0.012677843682467937, 0.013324176892638206, 0.013970510102808475, 0.014616843312978745, 0.015263176523149014, 0.015909509733319283, 0.016555842012166977, 0.01720217615365982, 0.017848510295152664, 0.01849484257400036, 0.019141174852848053, 0.019787508994340897, 0.02043384313583374, 0.021080175414681435, 0.02172650769352913, 0.022372841835021973]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 10.0, 4.0, 7.0, 11.0, 23.0, 20.0, 30.0, 43.0, 54.0, 102.0, 142.0, 257.0, 325.0, 554.0, 922.0, 1611.0, 3241.0, 6919.0, 17021.0, 55413.0, 347947.0, 511509.0, 67026.0, 19542.0, 7767.0, 3530.0, 1787.0, 1036.0, 582.0, 397.0, 241.0, 148.0, 87.0, 68.0, 50.0, 39.0, 23.0, 15.0, 11.0, 15.0, 7.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.032135009765625, -0.03116321563720703, -0.030191421508789062, -0.029219627380371094, -0.028247833251953125, -0.027276039123535156, -0.026304244995117188, -0.02533245086669922, -0.02436065673828125, -0.02338886260986328, -0.022417068481445312, -0.021445274353027344, -0.020473480224609375, -0.019501686096191406, -0.018529891967773438, -0.01755809783935547, -0.0165863037109375, -0.015614509582519531, -0.014642715454101562, -0.013670921325683594, -0.012699127197265625, -0.011727333068847656, -0.010755538940429688, -0.009783744812011719, -0.00881195068359375, -0.007840156555175781, -0.0068683624267578125, -0.005896568298339844, -0.004924774169921875, -0.003952980041503906, -0.0029811859130859375, -0.0020093917846679688, -0.00103759765625, -6.580352783203125e-05, 0.0009059906005859375, 0.0018777847290039062, 0.002849578857421875, 0.0038213729858398438, 0.0047931671142578125, 0.005764961242675781, 0.00673675537109375, 0.007708549499511719, 0.008680343627929688, 0.009652137756347656, 0.010623931884765625, 0.011595726013183594, 0.012567520141601562, 0.013539314270019531, 0.0145111083984375, 0.015482902526855469, 0.016454696655273438, 0.017426490783691406, 0.018398284912109375, 0.019370079040527344, 0.020341873168945312, 0.02131366729736328, 0.02228546142578125, 0.02325725555419922, 0.024229049682617188, 0.025200843811035156, 0.026172637939453125, 0.027144432067871094, 0.028116226196289062, 0.02908802032470703, 0.030059814453125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 8.0, 9.0, 8.0, 13.0, 14.0, 33.0, 35.0, 45.0, 53.0, 87.0, 87.0, 95.0, 104.0, 72.0, 52.0, 67.0, 56.0, 41.0, 27.0, 19.0, 21.0, 10.0, 10.0, 5.0, 6.0, 8.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0208740234375, -0.020227670669555664, -0.019581317901611328, -0.018934965133666992, -0.018288612365722656, -0.01764225959777832, -0.016995906829833984, -0.01634955406188965, -0.015703201293945312, -0.015056848526000977, -0.01441049575805664, -0.013764142990112305, -0.013117790222167969, -0.012471437454223633, -0.011825084686279297, -0.011178731918334961, -0.010532379150390625, -0.009886026382446289, -0.009239673614501953, -0.008593320846557617, -0.007946968078613281, -0.007300615310668945, -0.006654262542724609, -0.0060079097747802734, -0.0053615570068359375, -0.0047152042388916016, -0.004068851470947266, -0.0034224987030029297, -0.0027761459350585938, -0.002129793167114258, -0.0014834403991699219, -0.0008370876312255859, -0.00019073486328125, 0.00045561790466308594, 0.0011019706726074219, 0.0017483234405517578, 0.0023946762084960938, 0.0030410289764404297, 0.0036873817443847656, 0.0043337345123291016, 0.0049800872802734375, 0.0056264400482177734, 0.006272792816162109, 0.006919145584106445, 0.007565498352050781, 0.008211851119995117, 0.008858203887939453, 0.009504556655883789, 0.010150909423828125, 0.010797262191772461, 0.011443614959716797, 0.012089967727661133, 0.012736320495605469, 0.013382673263549805, 0.01402902603149414, 0.014675378799438477, 0.015321731567382812, 0.01596808433532715, 0.016614437103271484, 0.01726078987121582, 0.017907142639160156, 0.018553495407104492, 0.019199848175048828, 0.019846200942993164, 0.0204925537109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 10.0, 6.0, 8.0, 18.0, 21.0, 20.0, 28.0, 39.0, 69.0, 79.0, 102.0, 163.0, 376.0, 875.0, 9438.0, 1013298.0, 21695.0, 1223.0, 406.0, 230.0, 126.0, 69.0, 62.0, 52.0, 41.0, 15.0, 14.0, 7.0, 9.0, 14.0, 8.0, 6.0, 2.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.12841796875, -0.12459468841552734, -0.12077140808105469, -0.11694812774658203, -0.11312484741210938, -0.10930156707763672, -0.10547828674316406, -0.1016550064086914, -0.09783172607421875, -0.0940084457397461, -0.09018516540527344, -0.08636188507080078, -0.08253860473632812, -0.07871532440185547, -0.07489204406738281, -0.07106876373291016, -0.0672454833984375, -0.06342220306396484, -0.05959892272949219, -0.05577564239501953, -0.051952362060546875, -0.04812908172607422, -0.04430580139160156, -0.040482521057128906, -0.03665924072265625, -0.032835960388183594, -0.029012680053710938, -0.02518939971923828, -0.021366119384765625, -0.01754283905029297, -0.013719558715820312, -0.009896278381347656, -0.006072998046875, -0.0022497177124023438, 0.0015735626220703125, 0.005396842956542969, 0.009220123291015625, 0.013043403625488281, 0.016866683959960938, 0.020689964294433594, 0.02451324462890625, 0.028336524963378906, 0.03215980529785156, 0.03598308563232422, 0.039806365966796875, 0.04362964630126953, 0.04745292663574219, 0.051276206970214844, 0.0550994873046875, 0.058922767639160156, 0.06274604797363281, 0.06656932830810547, 0.07039260864257812, 0.07421588897705078, 0.07803916931152344, 0.0818624496459961, 0.08568572998046875, 0.0895090103149414, 0.09333229064941406, 0.09715557098388672, 0.10097885131835938, 0.10480213165283203, 0.10862541198730469, 0.11244869232177734, 0.11627197265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 9.0, 4.0, 13.0, 17.0, 16.0, 25.0, 19.0, 20.0, 35.0, 30.0, 40.0, 34.0, 53.0, 46.0, 50.0, 44.0, 67.0, 56.0, 46.0, 39.0, 43.0, 46.0, 34.0, 32.0, 42.0, 24.0, 25.0, 13.0, 13.0, 14.0, 14.0, 4.0, 2.0, 12.0, 5.0, 7.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0511474609375, -0.04936027526855469, -0.047573089599609375, -0.04578590393066406, -0.04399871826171875, -0.04221153259277344, -0.040424346923828125, -0.03863716125488281, -0.0368499755859375, -0.03506278991699219, -0.033275604248046875, -0.03148841857910156, -0.02970123291015625, -0.027914047241210938, -0.026126861572265625, -0.024339675903320312, -0.022552490234375, -0.020765304565429688, -0.018978118896484375, -0.017190933227539062, -0.01540374755859375, -0.013616561889648438, -0.011829376220703125, -0.010042190551757812, -0.0082550048828125, -0.0064678192138671875, -0.004680633544921875, -0.0028934478759765625, -0.00110626220703125, 0.0006809234619140625, 0.002468109130859375, 0.0042552947998046875, 0.00604248046875, 0.007829666137695312, 0.009616851806640625, 0.011404037475585938, 0.01319122314453125, 0.014978408813476562, 0.016765594482421875, 0.018552780151367188, 0.0203399658203125, 0.022127151489257812, 0.023914337158203125, 0.025701522827148438, 0.02748870849609375, 0.029275894165039062, 0.031063079833984375, 0.03285026550292969, 0.034637451171875, 0.03642463684082031, 0.038211822509765625, 0.03999900817871094, 0.04178619384765625, 0.04357337951660156, 0.045360565185546875, 0.04714775085449219, 0.0489349365234375, 0.05072212219238281, 0.052509307861328125, 0.05429649353027344, 0.05608367919921875, 0.05787086486816406, 0.059658050537109375, 0.06144523620605469, 0.063232421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 19.0, 16.0, 23.0, 60.0, 153.0, 999.0, 1024091.0, 22551.0, 392.0, 100.0, 53.0, 24.0, 21.0, 7.0, 10.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01363372802734375, -0.01312553882598877, -0.012617349624633789, -0.012109160423278809, -0.011600971221923828, -0.011092782020568848, -0.010584592819213867, -0.010076403617858887, -0.009568214416503906, -0.009060025215148926, -0.008551836013793945, -0.008043646812438965, -0.007535457611083984, -0.007027268409729004, -0.0065190792083740234, -0.006010890007019043, -0.0055027008056640625, -0.004994511604309082, -0.0044863224029541016, -0.003978133201599121, -0.0034699440002441406, -0.00296175479888916, -0.0024535655975341797, -0.0019453763961791992, -0.0014371871948242188, -0.0009289979934692383, -0.0004208087921142578, 8.738040924072266e-05, 0.0005955696105957031, 0.0011037588119506836, 0.001611948013305664, 0.0021201372146606445, 0.002628326416015625, 0.0031365156173706055, 0.003644704818725586, 0.004152894020080566, 0.004661083221435547, 0.005169272422790527, 0.005677461624145508, 0.006185650825500488, 0.006693840026855469, 0.007202029228210449, 0.00771021842956543, 0.00821840763092041, 0.00872659683227539, 0.009234786033630371, 0.009742975234985352, 0.010251164436340332, 0.010759353637695312, 0.011267542839050293, 0.011775732040405273, 0.012283921241760254, 0.012792110443115234, 0.013300299644470215, 0.013808488845825195, 0.014316678047180176, 0.014824867248535156, 0.015333056449890137, 0.015841245651245117, 0.016349434852600098, 0.016857624053955078, 0.01736581325531006, 0.01787400245666504, 0.01838219165802002, 0.018890380859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 4.0, 9.0, 12.0, 16.0, 14.0, 20.0, 34.0, 47.0, 106.0, 454.0, 81.0, 41.0, 22.0, 21.0, 21.0, 13.0, 11.0, 8.0, 9.0, 4.0, 5.0, 4.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003314018249511719, -0.0003217644989490509, -0.00031212717294692993, -0.00030248984694480896, -0.000292852520942688, -0.000283215194940567, -0.00027357786893844604, -0.0002639405429363251, -0.0002543032169342041, -0.00024466589093208313, -0.00023502856492996216, -0.0002253912389278412, -0.00021575391292572021, -0.00020611658692359924, -0.00019647926092147827, -0.0001868419349193573, -0.00017720460891723633, -0.00016756728291511536, -0.00015792995691299438, -0.0001482926309108734, -0.00013865530490875244, -0.00012901797890663147, -0.0001193806529045105, -0.00010974332690238953, -0.00010010600090026855, -9.046867489814758e-05, -8.083134889602661e-05, -7.119402289390564e-05, -6.155669689178467e-05, -5.1919370889663696e-05, -4.2282044887542725e-05, -3.264471888542175e-05, -2.300739288330078e-05, -1.337006688117981e-05, -3.732740879058838e-06, 5.904585123062134e-06, 1.5541911125183105e-05, 2.5179237127304077e-05, 3.481656312942505e-05, 4.445388913154602e-05, 5.409121513366699e-05, 6.372854113578796e-05, 7.336586713790894e-05, 8.300319314002991e-05, 9.264051914215088e-05, 0.00010227784514427185, 0.00011191517114639282, 0.0001215524971485138, 0.00013118982315063477, 0.00014082714915275574, 0.0001504644751548767, 0.00016010180115699768, 0.00016973912715911865, 0.00017937645316123962, 0.0001890137791633606, 0.00019865110516548157, 0.00020828843116760254, 0.0002179257571697235, 0.00022756308317184448, 0.00023720040917396545, 0.0002468377351760864, 0.0002564750611782074, 0.00026611238718032837, 0.00027574971318244934, 0.0002853870391845703]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 8.0, 7.0, 16.0, 33.0, 31.0, 84.0, 294.0, 8870.0, 1036859.0, 2005.0, 176.0, 63.0, 31.0, 28.0, 11.0, 14.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.026153564453125, -0.02541375160217285, -0.024673938751220703, -0.023934125900268555, -0.023194313049316406, -0.022454500198364258, -0.02171468734741211, -0.02097487449645996, -0.020235061645507812, -0.019495248794555664, -0.018755435943603516, -0.018015623092651367, -0.01727581024169922, -0.01653599739074707, -0.015796184539794922, -0.015056371688842773, -0.014316558837890625, -0.013576745986938477, -0.012836933135986328, -0.01209712028503418, -0.011357307434082031, -0.010617494583129883, -0.009877681732177734, -0.009137868881225586, -0.008398056030273438, -0.007658243179321289, -0.006918430328369141, -0.006178617477416992, -0.005438804626464844, -0.004698991775512695, -0.003959178924560547, -0.0032193660736083984, -0.00247955322265625, -0.0017397403717041016, -0.0009999275207519531, -0.0002601146697998047, 0.00047969818115234375, 0.0012195110321044922, 0.0019593238830566406, 0.002699136734008789, 0.0034389495849609375, 0.004178762435913086, 0.004918575286865234, 0.005658388137817383, 0.006398200988769531, 0.00713801383972168, 0.007877826690673828, 0.008617639541625977, 0.009357452392578125, 0.010097265243530273, 0.010837078094482422, 0.01157689094543457, 0.012316703796386719, 0.013056516647338867, 0.013796329498291016, 0.014536142349243164, 0.015275955200195312, 0.01601576805114746, 0.01675558090209961, 0.017495393753051758, 0.018235206604003906, 0.018975019454956055, 0.019714832305908203, 0.02045464515686035, 0.0211944580078125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 1.0, 5.0, 15.0, 13.0, 23.0, 22.0, 14.0, 52.0, 64.0, 147.0, 314.0, 119.0, 63.0, 43.0, 28.0, 23.0, 10.0, 9.0, 11.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007007598876953125, -0.006761133670806885, -0.0065146684646606445, -0.006268203258514404, -0.006021738052368164, -0.005775272846221924, -0.005528807640075684, -0.005282342433929443, -0.005035877227783203, -0.004789412021636963, -0.004542946815490723, -0.004296481609344482, -0.004050016403198242, -0.003803551197052002, -0.0035570859909057617, -0.0033106207847595215, -0.0030641555786132812, -0.002817690372467041, -0.0025712251663208008, -0.0023247599601745605, -0.0020782947540283203, -0.00183182954788208, -0.0015853643417358398, -0.0013388991355895996, -0.0010924339294433594, -0.0008459687232971191, -0.0005995035171508789, -0.00035303831100463867, -0.00010657310485839844, 0.0001398921012878418, 0.00038635730743408203, 0.0006328225135803223, 0.0008792877197265625, 0.0011257529258728027, 0.001372218132019043, 0.0016186833381652832, 0.0018651485443115234, 0.0021116137504577637, 0.002358078956604004, 0.002604544162750244, 0.0028510093688964844, 0.0030974745750427246, 0.003343939781188965, 0.003590404987335205, 0.0038368701934814453, 0.0040833353996276855, 0.004329800605773926, 0.004576265811920166, 0.004822731018066406, 0.0050691962242126465, 0.005315661430358887, 0.005562126636505127, 0.005808591842651367, 0.006055057048797607, 0.006301522254943848, 0.006547987461090088, 0.006794452667236328, 0.007040917873382568, 0.007287383079528809, 0.007533848285675049, 0.007780313491821289, 0.00802677869796753, 0.00827324390411377, 0.00851970911026001, 0.00876617431640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 49.0, 774.0, 176.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8410512208938599, -1.8073618412017822, -1.7736724615097046, -1.739983081817627, -1.7062937021255493, -1.6726043224334717, -1.638914942741394, -1.6052255630493164, -1.5715363025665283, -1.5378469228744507, -1.504157543182373, -1.4704681634902954, -1.4367787837982178, -1.4030894041061401, -1.3694000244140625, -1.3357107639312744, -1.3020212650299072, -1.2683318853378296, -1.234642505645752, -1.2009531259536743, -1.1672637462615967, -1.133574366569519, -1.0998849868774414, -1.0661957263946533, -1.0325062274932861, -0.9988168478012085, -0.9651274681091309, -0.9314380884170532, -0.8977487087249756, -0.864059329032898, -0.8303700089454651, -0.7966806292533875, -0.7629913091659546, -0.729301929473877, -0.6956125497817993, -0.6619231700897217, -0.628233790397644, -0.5945444107055664, -0.5608550906181335, -0.5271657109260559, -0.49347633123397827, -0.45978695154190063, -0.426097571849823, -0.39240822196006775, -0.3587188422679901, -0.3250294625759125, -0.2913401126861572, -0.2576507329940796, -0.22396135330200195, -0.19027197360992432, -0.15658260881900787, -0.12289323657751083, -0.0892038643360138, -0.05551448464393616, -0.021825119853019714, 0.011864244937896729, 0.045553624629974365, 0.0792429968714714, 0.11293236911296844, 0.1466217339038849, 0.18031111359596252, 0.21400049328804016, 0.2476898580789566, 0.28137922286987305, 0.3150686025619507]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 6.0, 10.0, 11.0, 5.0, 7.0, 18.0, 15.0, 12.0, 19.0, 12.0, 15.0, 19.0, 31.0, 24.0, 39.0, 34.0, 37.0, 43.0, 42.0, 30.0, 33.0, 31.0, 54.0, 40.0, 38.0, 32.0, 28.0, 29.0, 30.0, 39.0, 25.0, 28.0, 24.0, 23.0, 17.0, 18.0, 18.0, 11.0, 13.0, 8.0, 7.0, 7.0, 2.0, 5.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.20592063665390015, -0.1988634467124939, -0.19180627167224884, -0.18474909663200378, -0.17769190669059753, -0.17063471674919128, -0.16357754170894623, -0.15652036666870117, -0.14946317672729492, -0.14240598678588867, -0.13534881174564362, -0.12829163670539856, -0.12123444676399231, -0.11417726427316666, -0.107120081782341, -0.10006289929151535, -0.0930057168006897, -0.08594853430986404, -0.07889135181903839, -0.07183416932821274, -0.06477698683738708, -0.05771980434656143, -0.05066262185573578, -0.043605439364910126, -0.03654825687408447, -0.02949107438325882, -0.022433891892433167, -0.015376709401607513, -0.00831952691078186, -0.0012623444199562073, 0.005794838070869446, 0.012852020561695099, 0.019909203052520752, 0.026966385543346405, 0.03402356803417206, 0.04108075052499771, 0.048137933015823364, 0.05519511550664902, 0.06225229799747467, 0.06930948048830032, 0.07636666297912598, 0.08342384546995163, 0.09048102796077728, 0.09753821045160294, 0.10459539294242859, 0.11165257543325424, 0.1187097579240799, 0.12576693296432495, 0.1328241229057312, 0.13988131284713745, 0.1469384878873825, 0.15399566292762756, 0.1610528528690338, 0.16811004281044006, 0.17516721785068512, 0.18222439289093018, 0.18928158283233643, 0.19633877277374268, 0.20339594781398773, 0.2104531228542328, 0.21751031279563904, 0.2245675027370453, 0.23162467777729034, 0.2386818528175354, 0.24573904275894165]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 6.0, 8.0, 8.0, 14.0, 10.0, 18.0, 27.0, 48.0, 55.0, 76.0, 78.0, 97.0, 4193370.0, 87.0, 65.0, 66.0, 57.0, 43.0, 39.0, 26.0, 25.0, 13.0, 11.0, 10.0, 7.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.177734375, -0.17232513427734375, -0.1669158935546875, -0.16150665283203125, -0.156097412109375, -0.15068817138671875, -0.1452789306640625, -0.13986968994140625, -0.13446044921875, -0.12905120849609375, -0.1236419677734375, -0.11823272705078125, -0.112823486328125, -0.10741424560546875, -0.1020050048828125, -0.09659576416015625, -0.0911865234375, -0.08577728271484375, -0.0803680419921875, -0.07495880126953125, -0.069549560546875, -0.06414031982421875, -0.0587310791015625, -0.05332183837890625, -0.04791259765625, -0.04250335693359375, -0.0370941162109375, -0.03168487548828125, -0.026275634765625, -0.02086639404296875, -0.0154571533203125, -0.01004791259765625, -0.004638671875, 0.00077056884765625, 0.0061798095703125, 0.01158905029296875, 0.016998291015625, 0.02240753173828125, 0.0278167724609375, 0.03322601318359375, 0.03863525390625, 0.04404449462890625, 0.0494537353515625, 0.05486297607421875, 0.060272216796875, 0.06568145751953125, 0.0710906982421875, 0.07649993896484375, 0.0819091796875, 0.08731842041015625, 0.0927276611328125, 0.09813690185546875, 0.103546142578125, 0.10895538330078125, 0.1143646240234375, 0.11977386474609375, 0.12518310546875, 0.13059234619140625, 0.1360015869140625, 0.14141082763671875, 0.146820068359375, 0.15222930908203125, 0.1576385498046875, 0.16304779052734375, 0.16845703125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 5.0, 4.0, 10.0, 7.0, 16.0, 11.0, 26.0, 41.0, 52.0, 61.0, 81.0, 91.0, 100.0, 83.0, 72.0, 61.0, 69.0, 49.0, 43.0, 26.0, 26.0, 17.0, 8.0, 14.0, 6.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0203094482421875, -0.01967906951904297, -0.019048690795898438, -0.018418312072753906, -0.017787933349609375, -0.017157554626464844, -0.016527175903320312, -0.01589679718017578, -0.01526641845703125, -0.014636039733886719, -0.014005661010742188, -0.013375282287597656, -0.012744903564453125, -0.012114524841308594, -0.011484146118164062, -0.010853767395019531, -0.010223388671875, -0.009593009948730469, -0.008962631225585938, -0.008332252502441406, -0.007701873779296875, -0.007071495056152344, -0.0064411163330078125, -0.005810737609863281, -0.00518035888671875, -0.004549980163574219, -0.0039196014404296875, -0.0032892227172851562, -0.002658843994140625, -0.0020284652709960938, -0.0013980865478515625, -0.0007677078247070312, -0.0001373291015625, 0.0004930496215820312, 0.0011234283447265625, 0.0017538070678710938, 0.002384185791015625, 0.0030145645141601562, 0.0036449432373046875, 0.004275321960449219, 0.00490570068359375, 0.005536079406738281, 0.0061664581298828125, 0.006796836853027344, 0.007427215576171875, 0.008057594299316406, 0.008687973022460938, 0.009318351745605469, 0.00994873046875, 0.010579109191894531, 0.011209487915039062, 0.011839866638183594, 0.012470245361328125, 0.013100624084472656, 0.013731002807617188, 0.014361381530761719, 0.01499176025390625, 0.015622138977050781, 0.016252517700195312, 0.016882896423339844, 0.017513275146484375, 0.018143653869628906, 0.018774032592773438, 0.01940441131591797, 0.0200347900390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 3.0, 8.0, 6.0, 7.0, 9.0, 17.0, 25.0, 21.0, 21.0, 25.0, 35.0, 38.0, 46.0, 59.0, 88.0, 200.0, 1835.0, 4190965.0, 263.0, 129.0, 87.0, 66.0, 45.0, 36.0, 42.0, 33.0, 27.0, 29.0, 26.0, 13.0, 18.0, 14.0, 11.0, 11.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.004913330078125, -0.004784703254699707, -0.004656076431274414, -0.004527449607849121, -0.004398822784423828, -0.004270195960998535, -0.004141569137573242, -0.004012942314147949, -0.0038843154907226562, -0.0037556886672973633, -0.0036270618438720703, -0.0034984350204467773, -0.0033698081970214844, -0.0032411813735961914, -0.0031125545501708984, -0.0029839277267456055, -0.0028553009033203125, -0.0027266740798950195, -0.0025980472564697266, -0.0024694204330444336, -0.0023407936096191406, -0.0022121667861938477, -0.0020835399627685547, -0.0019549131393432617, -0.0018262863159179688, -0.0016976594924926758, -0.0015690326690673828, -0.0014404058456420898, -0.0013117790222167969, -0.001183152198791504, -0.001054525375366211, -0.000925898551940918, -0.000797271728515625, -0.000668644905090332, -0.0005400180816650391, -0.0004113912582397461, -0.0002827644348144531, -0.00015413761138916016, -2.5510787963867188e-05, 0.00010311603546142578, 0.00023174285888671875, 0.0003603696823120117, 0.0004889965057373047, 0.0006176233291625977, 0.0007462501525878906, 0.0008748769760131836, 0.0010035037994384766, 0.0011321306228637695, 0.0012607574462890625, 0.0013893842697143555, 0.0015180110931396484, 0.0016466379165649414, 0.0017752647399902344, 0.0019038915634155273, 0.0020325183868408203, 0.0021611452102661133, 0.0022897720336914062, 0.0024183988571166992, 0.002547025680541992, 0.002675652503967285, 0.002804279327392578, 0.002932906150817871, 0.003061532974243164, 0.003190159797668457, 0.00331878662109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [5.0, 4083.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0590763092041016e-05, -1.4564953744411469e-05, 1.1460855603218079e-05, 3.7486664950847626e-05, 6.351247429847717e-05, 8.953828364610672e-05, 0.00011556409299373627, 0.00014158990234136581, 0.00016761571168899536, 0.0001936415210366249, 0.00021966733038425446, 0.000245693139731884, 0.00027171894907951355, 0.0002977447584271431, 0.00032377056777477264, 0.0003497963771224022, 0.00037582218647003174, 0.0004018479958176613, 0.00042787380516529083, 0.0004538996145129204, 0.0004799254238605499, 0.0005059512332081795, 0.000531977042555809, 0.0005580028519034386, 0.0005840286612510681, 0.0006100544705986977, 0.0006360802799463272, 0.0006621060892939568, 0.0006881318986415863, 0.0007141577079892159, 0.0007401835173368454, 0.0007662093266844749, 0.0007922351360321045, 0.000818260945379734, 0.0008442867547273636, 0.0008703125640749931, 0.0008963383734226227, 0.0009223641827702522, 0.0009483899921178818, 0.0009744158014655113, 0.0010004416108131409, 0.0010264674201607704, 0.0010524932295084, 0.0010785190388560295, 0.001104544848203659, 0.0011305706575512886, 0.0011565964668989182, 0.0011826222762465477, 0.0012086480855941772, 0.0012346738949418068, 0.0012606997042894363, 0.0012867255136370659, 0.0013127513229846954, 0.001338777132332325, 0.0013648029416799545, 0.001390828751027584, 0.0014168545603752136, 0.0014428803697228432, 0.0014689061790704727, 0.0014949319884181023, 0.0015209577977657318, 0.0015469836071133614, 0.001573009416460991, 0.0015990352258086205, 0.00162506103515625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 16.0, 811.0, 176.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.016410663723945618, -0.01611698605120182, -0.015823308378458023, -0.0155296316370368, -0.015235954895615578, -0.01494227722287178, -0.014648599550127983, -0.01435492280870676, -0.014061245135962963, -0.013767567463219166, -0.013473890721797943, -0.013180213049054146, -0.012886536307632923, -0.012592858634889126, -0.012299181893467903, -0.012005504220724106, -0.011711826547980309, -0.011418148875236511, -0.011124472133815289, -0.010830794461071491, -0.010537117719650269, -0.010243440046906471, -0.009949762374162674, -0.009656085632741451, -0.009362408891320229, -0.009068731218576431, -0.008775054477155209, -0.008481376804411411, -0.008187700062990189, -0.007894022390246391, -0.007600345183163881, -0.007306667976081371, -0.007012990303337574, -0.006719313096255064, -0.006425635889172554, -0.006131958216428757, -0.005838281009346247, -0.005544603802263737, -0.005250926595181227, -0.004957249388098717, -0.004663572181016207, -0.004369894973933697, -0.004076217766851187, -0.003782540326938033, -0.0034888628870248795, -0.0031951856799423695, -0.0029015084728598595, -0.002607831032946706, -0.002314153825864196, -0.002020476618781686, -0.0017267991788685322, -0.0014331219717860222, -0.0011394446482881904, -0.0008457673247903585, -0.0005520901177078485, -0.0002584126777946949, 3.5264529287815094e-05, 0.00032894182368181646, 0.0006226191180758178, 0.0009162963833659887, 0.0012099737068638206, 0.0015036510303616524, 0.0017973282374441624, 0.002091005677357316, 0.002384682884439826]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 12.0, 18.0, 37.0, 63.0, 122.0, 172.0, 164.0, 142.0, 107.0, 79.0, 31.0, 28.0, 9.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014180541038513184, -0.001345757395029068, -0.0012734606862068176, -0.0012011639773845673, -0.001128867268562317, -0.0010565705597400665, -0.0009842738509178162, -0.0009119771420955658, -0.0008396804332733154, -0.0007673837244510651, -0.0006950870156288147, -0.0006227903068065643, -0.000550493597984314, -0.0004781968891620636, -0.00040590018033981323, -0.00033360347151756287, -0.0002613067626953125, -0.00018901005387306213, -0.00011671334505081177, -4.44166362285614e-05, 2.7880072593688965e-05, 0.00010017678141593933, 0.0001724734902381897, 0.00024477019906044006, 0.00031706690788269043, 0.0003893636167049408, 0.00046166032552719116, 0.0005339570343494415, 0.0006062537431716919, 0.0006785504519939423, 0.0007508471608161926, 0.000823143869638443, 0.0008954405784606934, 0.0009677372872829437, 0.001040033996105194, 0.0011123307049274445, 0.0011846274137496948, 0.0012569241225719452, 0.0013292208313941956, 0.001401517540216446, 0.0014738142490386963, 0.0015461109578609467, 0.001618407666683197, 0.0016907043755054474, 0.0017630010843276978, 0.0018352977931499481, 0.0019075945019721985, 0.001979891210794449, 0.0020521879196166992, 0.0021244846284389496, 0.0021967813372612, 0.0022690780460834503, 0.0023413747549057007, 0.002413671463727951, 0.0024859681725502014, 0.0025582648813724518, 0.002630561590194702, 0.0027028582990169525, 0.002775155007839203, 0.0028474517166614532, 0.0029197484254837036, 0.002992045134305954, 0.0030643418431282043, 0.0031366385519504547, 0.003208935260772705]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 6.0, 5.0, 4.0, 9.0, 10.0, 21.0, 25.0, 28.0, 49.0, 58.0, 91.0, 152.0, 230.0, 345.0, 574.0, 1024.0, 1986.0, 4118.0, 10061.0, 31578.0, 162042.0, 697282.0, 100448.0, 23091.0, 7939.0, 3451.0, 1617.0, 871.0, 553.0, 284.0, 185.0, 125.0, 81.0, 57.0, 50.0, 29.0, 19.0, 13.0, 15.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.03460693359375, -0.03350400924682617, -0.032401084899902344, -0.031298160552978516, -0.030195236206054688, -0.02909231185913086, -0.02798938751220703, -0.026886463165283203, -0.025783538818359375, -0.024680614471435547, -0.02357769012451172, -0.02247476577758789, -0.021371841430664062, -0.020268917083740234, -0.019165992736816406, -0.018063068389892578, -0.01696014404296875, -0.015857219696044922, -0.014754295349121094, -0.013651371002197266, -0.012548446655273438, -0.01144552230834961, -0.010342597961425781, -0.009239673614501953, -0.008136749267578125, -0.007033824920654297, -0.005930900573730469, -0.004827976226806641, -0.0037250518798828125, -0.0026221275329589844, -0.0015192031860351562, -0.0004162788391113281, 0.0006866455078125, 0.0017895698547363281, 0.0028924942016601562, 0.003995418548583984, 0.0050983428955078125, 0.006201267242431641, 0.007304191589355469, 0.008407115936279297, 0.009510040283203125, 0.010612964630126953, 0.011715888977050781, 0.01281881332397461, 0.013921737670898438, 0.015024662017822266, 0.016127586364746094, 0.017230510711669922, 0.01833343505859375, 0.019436359405517578, 0.020539283752441406, 0.021642208099365234, 0.022745132446289062, 0.02384805679321289, 0.02495098114013672, 0.026053905487060547, 0.027156829833984375, 0.028259754180908203, 0.02936267852783203, 0.03046560287475586, 0.03156852722167969, 0.032671451568603516, 0.033774375915527344, 0.03487730026245117, 0.035980224609375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 5.0, 4.0, 10.0, 9.0, 14.0, 11.0, 28.0, 39.0, 53.0, 60.0, 80.0, 92.0, 100.0, 85.0, 71.0, 60.0, 72.0, 46.0, 44.0, 26.0, 25.0, 17.0, 8.0, 14.0, 6.0, 3.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0203094482421875, -0.019678831100463867, -0.019048213958740234, -0.0184175968170166, -0.01778697967529297, -0.017156362533569336, -0.016525745391845703, -0.01589512825012207, -0.015264511108398438, -0.014633893966674805, -0.014003276824951172, -0.013372659683227539, -0.012742042541503906, -0.012111425399780273, -0.01148080825805664, -0.010850191116333008, -0.010219573974609375, -0.009588956832885742, -0.00895833969116211, -0.008327722549438477, -0.007697105407714844, -0.007066488265991211, -0.006435871124267578, -0.005805253982543945, -0.0051746368408203125, -0.00454401969909668, -0.003913402557373047, -0.003282785415649414, -0.0026521682739257812, -0.0020215511322021484, -0.0013909339904785156, -0.0007603168487548828, -0.00012969970703125, 0.0005009174346923828, 0.0011315345764160156, 0.0017621517181396484, 0.0023927688598632812, 0.003023386001586914, 0.003654003143310547, 0.00428462028503418, 0.0049152374267578125, 0.005545854568481445, 0.006176471710205078, 0.006807088851928711, 0.007437705993652344, 0.008068323135375977, 0.00869894027709961, 0.009329557418823242, 0.009960174560546875, 0.010590791702270508, 0.01122140884399414, 0.011852025985717773, 0.012482643127441406, 0.013113260269165039, 0.013743877410888672, 0.014374494552612305, 0.015005111694335938, 0.01563572883605957, 0.016266345977783203, 0.016896963119506836, 0.01752758026123047, 0.0181581974029541, 0.018788814544677734, 0.019419431686401367, 0.020050048828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 1.0, 5.0, 5.0, 7.0, 4.0, 9.0, 12.0, 12.0, 13.0, 21.0, 29.0, 36.0, 42.0, 59.0, 83.0, 148.0, 305.0, 865.0, 11790.0, 1010737.0, 22455.0, 1003.0, 385.0, 180.0, 87.0, 67.0, 44.0, 43.0, 19.0, 21.0, 21.0, 14.0, 8.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.105224609375, -0.10166549682617188, -0.09810638427734375, -0.09454727172851562, -0.0909881591796875, -0.08742904663085938, -0.08386993408203125, -0.08031082153320312, -0.076751708984375, -0.07319259643554688, -0.06963348388671875, -0.06607437133789062, -0.0625152587890625, -0.058956146240234375, -0.05539703369140625, -0.051837921142578125, -0.04827880859375, -0.044719696044921875, -0.04116058349609375, -0.037601470947265625, -0.0340423583984375, -0.030483245849609375, -0.02692413330078125, -0.023365020751953125, -0.019805908203125, -0.016246795654296875, -0.01268768310546875, -0.009128570556640625, -0.0055694580078125, -0.002010345458984375, 0.00154876708984375, 0.005107879638671875, 0.0086669921875, 0.012226104736328125, 0.01578521728515625, 0.019344329833984375, 0.0229034423828125, 0.026462554931640625, 0.03002166748046875, 0.033580780029296875, 0.037139892578125, 0.040699005126953125, 0.04425811767578125, 0.047817230224609375, 0.0513763427734375, 0.054935455322265625, 0.05849456787109375, 0.062053680419921875, 0.06561279296875, 0.06917190551757812, 0.07273101806640625, 0.07629013061523438, 0.0798492431640625, 0.08340835571289062, 0.08696746826171875, 0.09052658081054688, 0.094085693359375, 0.09764480590820312, 0.10120391845703125, 0.10476303100585938, 0.1083221435546875, 0.11188125610351562, 0.11544036865234375, 0.11899948120117188, 0.12255859375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 5.0, 11.0, 11.0, 12.0, 13.0, 12.0, 13.0, 21.0, 24.0, 34.0, 32.0, 37.0, 32.0, 24.0, 42.0, 49.0, 43.0, 42.0, 44.0, 40.0, 42.0, 43.0, 43.0, 40.0, 38.0, 38.0, 35.0, 26.0, 25.0, 21.0, 19.0, 19.0, 14.0, 11.0, 8.0, 15.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048187255859375, -0.046746253967285156, -0.04530525207519531, -0.04386425018310547, -0.042423248291015625, -0.04098224639892578, -0.03954124450683594, -0.038100242614746094, -0.03665924072265625, -0.035218238830566406, -0.03377723693847656, -0.03233623504638672, -0.030895233154296875, -0.02945423126220703, -0.028013229370117188, -0.026572227478027344, -0.0251312255859375, -0.023690223693847656, -0.022249221801757812, -0.02080821990966797, -0.019367218017578125, -0.01792621612548828, -0.016485214233398438, -0.015044212341308594, -0.01360321044921875, -0.012162208557128906, -0.010721206665039062, -0.009280204772949219, -0.007839202880859375, -0.006398200988769531, -0.0049571990966796875, -0.0035161972045898438, -0.0020751953125, -0.0006341934204101562, 0.0008068084716796875, 0.0022478103637695312, 0.003688812255859375, 0.005129814147949219, 0.0065708160400390625, 0.008011817932128906, 0.00945281982421875, 0.010893821716308594, 0.012334823608398438, 0.013775825500488281, 0.015216827392578125, 0.01665782928466797, 0.018098831176757812, 0.019539833068847656, 0.0209808349609375, 0.022421836853027344, 0.023862838745117188, 0.02530384063720703, 0.026744842529296875, 0.02818584442138672, 0.029626846313476562, 0.031067848205566406, 0.03250885009765625, 0.033949851989746094, 0.03539085388183594, 0.03683185577392578, 0.038272857666015625, 0.03971385955810547, 0.04115486145019531, 0.042595863342285156, 0.044036865234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 7.0, 6.0, 4.0, 8.0, 25.0, 33.0, 59.0, 203.0, 686.0, 8524.0, 1029593.0, 8397.0, 655.0, 172.0, 73.0, 27.0, 26.0, 16.0, 12.0, 4.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013671875, -0.013251185417175293, -0.012830495834350586, -0.012409806251525879, -0.011989116668701172, -0.011568427085876465, -0.011147737503051758, -0.01072704792022705, -0.010306358337402344, -0.009885668754577637, -0.00946497917175293, -0.009044289588928223, -0.008623600006103516, -0.008202910423278809, -0.0077822208404541016, -0.0073615312576293945, -0.0069408416748046875, -0.0065201520919799805, -0.0060994625091552734, -0.005678772926330566, -0.005258083343505859, -0.004837393760681152, -0.004416704177856445, -0.003996014595031738, -0.0035753250122070312, -0.0031546354293823242, -0.002733945846557617, -0.00231325626373291, -0.0018925666809082031, -0.001471877098083496, -0.001051187515258789, -0.000630497932434082, -0.000209808349609375, 0.00021088123321533203, 0.0006315708160400391, 0.001052260398864746, 0.0014729499816894531, 0.0018936395645141602, 0.002314329147338867, 0.0027350187301635742, 0.0031557083129882812, 0.0035763978958129883, 0.003997087478637695, 0.004417777061462402, 0.004838466644287109, 0.005259156227111816, 0.0056798458099365234, 0.0061005353927612305, 0.0065212249755859375, 0.0069419145584106445, 0.0073626041412353516, 0.007783293724060059, 0.008203983306884766, 0.008624672889709473, 0.00904536247253418, 0.009466052055358887, 0.009886741638183594, 0.0103074312210083, 0.010728120803833008, 0.011148810386657715, 0.011569499969482422, 0.011990189552307129, 0.012410879135131836, 0.012831568717956543, 0.01325225830078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 1.0, 5.0, 7.0, 10.0, 12.0, 17.0, 23.0, 29.0, 47.0, 79.0, 228.0, 283.0, 90.0, 48.0, 34.0, 17.0, 11.0, 14.0, 8.0, 8.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003342628479003906, -0.00032474473118782043, -0.00031522661447525024, -0.00030570849776268005, -0.00029619038105010986, -0.00028667226433753967, -0.0002771541476249695, -0.0002676360309123993, -0.0002581179141998291, -0.0002485997974872589, -0.00023908168077468872, -0.00022956356406211853, -0.00022004544734954834, -0.00021052733063697815, -0.00020100921392440796, -0.00019149109721183777, -0.00018197298049926758, -0.0001724548637866974, -0.0001629367470741272, -0.000153418630361557, -0.00014390051364898682, -0.00013438239693641663, -0.00012486428022384644, -0.00011534616351127625, -0.00010582804679870605, -9.630993008613586e-05, -8.679181337356567e-05, -7.727369666099548e-05, -6.775557994842529e-05, -5.82374632358551e-05, -4.871934652328491e-05, -3.920122981071472e-05, -2.968311309814453e-05, -2.016499638557434e-05, -1.064687967300415e-05, -1.12876296043396e-06, 8.38935375213623e-06, 1.790747046470642e-05, 2.742558717727661e-05, 3.69437038898468e-05, 4.646182060241699e-05, 5.597993731498718e-05, 6.549805402755737e-05, 7.501617074012756e-05, 8.453428745269775e-05, 9.405240416526794e-05, 0.00010357052087783813, 0.00011308863759040833, 0.00012260675430297852, 0.0001321248710155487, 0.0001416429877281189, 0.0001511611044406891, 0.00016067922115325928, 0.00017019733786582947, 0.00017971545457839966, 0.00018923357129096985, 0.00019875168800354004, 0.00020826980471611023, 0.00021778792142868042, 0.0002273060381412506, 0.0002368241548538208, 0.000246342271566391, 0.0002558603882789612, 0.00026537850499153137, 0.00027489662170410156]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 13.0, 8.0, 15.0, 34.0, 49.0, 77.0, 243.0, 2401.0, 1024924.0, 19918.0, 588.0, 128.0, 58.0, 25.0, 18.0, 10.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.015716552734375, -0.015221118927001953, -0.014725685119628906, -0.01423025131225586, -0.013734817504882812, -0.013239383697509766, -0.012743949890136719, -0.012248516082763672, -0.011753082275390625, -0.011257648468017578, -0.010762214660644531, -0.010266780853271484, -0.009771347045898438, -0.00927591323852539, -0.008780479431152344, -0.008285045623779297, -0.00778961181640625, -0.007294178009033203, -0.006798744201660156, -0.006303310394287109, -0.0058078765869140625, -0.005312442779541016, -0.004817008972167969, -0.004321575164794922, -0.003826141357421875, -0.003330707550048828, -0.0028352737426757812, -0.0023398399353027344, -0.0018444061279296875, -0.0013489723205566406, -0.0008535385131835938, -0.0003581047058105469, 0.0001373291015625, 0.0006327629089355469, 0.0011281967163085938, 0.0016236305236816406, 0.0021190643310546875, 0.0026144981384277344, 0.0031099319458007812, 0.003605365753173828, 0.004100799560546875, 0.004596233367919922, 0.005091667175292969, 0.005587100982666016, 0.0060825347900390625, 0.006577968597412109, 0.007073402404785156, 0.007568836212158203, 0.00806427001953125, 0.008559703826904297, 0.009055137634277344, 0.00955057144165039, 0.010046005249023438, 0.010541439056396484, 0.011036872863769531, 0.011532306671142578, 0.012027740478515625, 0.012523174285888672, 0.013018608093261719, 0.013514041900634766, 0.014009475708007812, 0.01450490951538086, 0.015000343322753906, 0.015495777130126953, 0.0159912109375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 2.0, 8.0, 10.0, 18.0, 15.0, 28.0, 20.0, 40.0, 66.0, 82.0, 118.0, 105.0, 122.0, 101.0, 64.0, 40.0, 32.0, 25.0, 19.0, 17.0, 13.0, 14.0, 4.0, 7.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.005321502685546875, -0.005158364772796631, -0.004995226860046387, -0.004832088947296143, -0.0046689510345458984, -0.004505813121795654, -0.00434267520904541, -0.004179537296295166, -0.004016399383544922, -0.0038532614707946777, -0.0036901235580444336, -0.0035269856452941895, -0.0033638477325439453, -0.003200709819793701, -0.003037571907043457, -0.002874433994293213, -0.0027112960815429688, -0.0025481581687927246, -0.0023850202560424805, -0.0022218823432922363, -0.002058744430541992, -0.001895606517791748, -0.001732468605041504, -0.0015693306922912598, -0.0014061927795410156, -0.0012430548667907715, -0.0010799169540405273, -0.0009167790412902832, -0.0007536411285400391, -0.0005905032157897949, -0.0004273653030395508, -0.00026422739028930664, -0.0001010894775390625, 6.204843521118164e-05, 0.00022518634796142578, 0.0003883242607116699, 0.0005514621734619141, 0.0007146000862121582, 0.0008777379989624023, 0.0010408759117126465, 0.0012040138244628906, 0.0013671517372131348, 0.001530289649963379, 0.001693427562713623, 0.0018565654754638672, 0.0020197033882141113, 0.0021828413009643555, 0.0023459792137145996, 0.0025091171264648438, 0.002672255039215088, 0.002835392951965332, 0.002998530864715576, 0.0031616687774658203, 0.0033248066902160645, 0.0034879446029663086, 0.0036510825157165527, 0.003814220428466797, 0.003977358341217041, 0.004140496253967285, 0.004303634166717529, 0.0044667720794677734, 0.004629909992218018, 0.004793047904968262, 0.004956185817718506, 0.00511932373046875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 11.0, 8.0, 15.0, 18.0, 34.0, 54.0, 85.0, 152.0, 214.0, 143.0, 80.0, 50.0, 32.0, 21.0, 18.0, 19.0, 13.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15116441249847412, -0.1470138430595398, -0.14286325871944427, -0.13871268928050995, -0.13456210494041443, -0.1304115355014801, -0.12626096606254578, -0.12211038917303085, -0.11795981228351593, -0.11380923539400101, -0.10965865850448608, -0.10550808906555176, -0.10135751217603683, -0.09720693528652191, -0.09305636584758759, -0.08890578895807266, -0.08475521206855774, -0.08060463517904282, -0.0764540582895279, -0.07230348885059357, -0.06815291196107864, -0.06400233507156372, -0.059851761907339096, -0.05570118874311447, -0.05155061185359955, -0.047400034964084625, -0.04324946179986, -0.039098888635635376, -0.03494831174612045, -0.03079773671925068, -0.026647161692380905, -0.02249658666551113, -0.01834602653980255, -0.014195451512932777, -0.010044876486063004, -0.00589430145919323, -0.0017437264323234558, 0.002406848594546318, 0.006557423621416092, 0.010707998648285866, 0.01485857367515564, 0.019009148702025414, 0.023159723728895187, 0.02731029875576496, 0.031460873782634735, 0.03561145067214966, 0.03976202383637428, 0.04391259700059891, 0.04806317389011383, 0.052213750779628754, 0.05636432394385338, 0.060514897108078, 0.06466547399759293, 0.06881605088710785, 0.07296662032604218, 0.0771171972155571, 0.08126777410507202, 0.08541835099458694, 0.08956892788410187, 0.0937194973230362, 0.09787007421255112, 0.10202065110206604, 0.10617122054100037, 0.11032179743051529, 0.11447237432003021]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 8.0, 5.0, 9.0, 6.0, 8.0, 13.0, 17.0, 20.0, 22.0, 17.0, 30.0, 22.0, 44.0, 35.0, 33.0, 45.0, 54.0, 36.0, 46.0, 49.0, 54.0, 51.0, 36.0, 45.0, 35.0, 34.0, 22.0, 31.0, 24.0, 18.0, 20.0, 13.0, 12.0, 10.0, 6.0, 11.0, 19.0, 8.0, 12.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0], "bins": [-0.24026131629943848, -0.23348981142044067, -0.22671830654144287, -0.21994680166244507, -0.21317531168460846, -0.20640380680561066, -0.19963230192661285, -0.19286079704761505, -0.18608930706977844, -0.17931780219078064, -0.17254629731178284, -0.16577479243278503, -0.15900330245494843, -0.15223179757595062, -0.14546029269695282, -0.13868878781795502, -0.13191728293895721, -0.1251457780599594, -0.1183742806315422, -0.1116027757525444, -0.1048312783241272, -0.0980597734451294, -0.09128826856613159, -0.08451676368713379, -0.07774526625871658, -0.07097376137971878, -0.06420226395130157, -0.05743075907230377, -0.05065925791859627, -0.04388775676488876, -0.03711625188589096, -0.030344750732183456, -0.023573249578475952, -0.016801748424768448, -0.010030245408415794, -0.003258742392063141, 0.0035127587616443634, 0.010284259915351868, 0.01705576479434967, 0.023827265948057175, 0.03059876710176468, 0.03737026825547218, 0.04414176940917969, 0.05091327428817749, 0.057684775441884995, 0.0644562765955925, 0.0712277814745903, 0.07799927890300751, 0.08477078378200531, 0.09154228866100311, 0.09831378608942032, 0.10508529096841812, 0.11185678839683533, 0.11862829327583313, 0.12539979815483093, 0.13217130303382874, 0.13894280791282654, 0.14571431279182434, 0.15248581767082214, 0.15925732254981995, 0.16602881252765656, 0.17280031740665436, 0.17957182228565216, 0.18634332716464996, 0.19311481714248657]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 7.0, 6.0, 6.0, 10.0, 11.0, 20.0, 37.0, 36.0, 63.0, 60.0, 77.0, 127.0, 225.0, 479.0, 2137.0, 4187797.0, 2077.0, 456.0, 217.0, 126.0, 87.0, 60.0, 35.0, 30.0, 18.0, 21.0, 25.0, 10.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00174713134765625, -0.0016857683658599854, -0.0016244053840637207, -0.001563042402267456, -0.0015016794204711914, -0.0014403164386749268, -0.0013789534568786621, -0.0013175904750823975, -0.0012562274932861328, -0.0011948645114898682, -0.0011335015296936035, -0.0010721385478973389, -0.0010107755661010742, -0.0009494125843048096, -0.0008880496025085449, -0.0008266866207122803, -0.0007653236389160156, -0.000703960657119751, -0.0006425976753234863, -0.0005812346935272217, -0.000519871711730957, -0.0004585087299346924, -0.00039714574813842773, -0.0003357827663421631, -0.00027441978454589844, -0.0002130568027496338, -0.00015169382095336914, -9.033083915710449e-05, -2.8967857360839844e-05, 3.2395124435424805e-05, 9.375810623168945e-05, 0.0001551210880279541, 0.00021648406982421875, 0.0002778470516204834, 0.00033921003341674805, 0.0004005730152130127, 0.00046193599700927734, 0.000523298978805542, 0.0005846619606018066, 0.0006460249423980713, 0.0007073879241943359, 0.0007687509059906006, 0.0008301138877868652, 0.0008914768695831299, 0.0009528398513793945, 0.0010142028331756592, 0.0010755658149719238, 0.0011369287967681885, 0.0011982917785644531, 0.0012596547603607178, 0.0013210177421569824, 0.001382380723953247, 0.0014437437057495117, 0.0015051066875457764, 0.001566469669342041, 0.0016278326511383057, 0.0016891956329345703, 0.001750558614730835, 0.0018119215965270996, 0.0018732845783233643, 0.001934647560119629, 0.0019960105419158936, 0.002057373523712158, 0.002118736505508423, 0.0021800994873046875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 7.0, 7.0, 13.0, 16.0, 32.0, 29.0, 53.0, 65.0, 76.0, 80.0, 95.0, 95.0, 91.0, 65.0, 65.0, 51.0, 39.0, 31.0, 20.0, 18.0, 12.0, 9.0, 7.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0202178955078125, -0.01959395408630371, -0.018970012664794922, -0.018346071243286133, -0.017722129821777344, -0.017098188400268555, -0.016474246978759766, -0.015850305557250977, -0.015226364135742188, -0.014602422714233398, -0.01397848129272461, -0.01335453987121582, -0.012730598449707031, -0.012106657028198242, -0.011482715606689453, -0.010858774185180664, -0.010234832763671875, -0.009610891342163086, -0.008986949920654297, -0.008363008499145508, -0.007739067077636719, -0.00711512565612793, -0.006491184234619141, -0.0058672428131103516, -0.0052433013916015625, -0.0046193599700927734, -0.003995418548583984, -0.0033714771270751953, -0.0027475357055664062, -0.002123594284057617, -0.0014996528625488281, -0.0008757114410400391, -0.00025177001953125, 0.00037217140197753906, 0.0009961128234863281, 0.0016200542449951172, 0.0022439956665039062, 0.0028679370880126953, 0.0034918785095214844, 0.0041158199310302734, 0.0047397613525390625, 0.0053637027740478516, 0.005987644195556641, 0.00661158561706543, 0.007235527038574219, 0.007859468460083008, 0.008483409881591797, 0.009107351303100586, 0.009731292724609375, 0.010355234146118164, 0.010979175567626953, 0.011603116989135742, 0.012227058410644531, 0.01285099983215332, 0.01347494125366211, 0.014098882675170898, 0.014722824096679688, 0.015346765518188477, 0.015970706939697266, 0.016594648361206055, 0.017218589782714844, 0.017842531204223633, 0.018466472625732422, 0.01909041404724121, 0.01971435546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 4.0, 6.0, 15.0, 16.0, 24.0, 25.0, 47.0, 73.0, 99.0, 159.0, 264.0, 444.0, 812.0, 7540.0, 4181688.0, 1503.0, 545.0, 365.0, 213.0, 151.0, 104.0, 61.0, 38.0, 27.0, 12.0, 14.0, 6.0, 5.0, 3.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013666152954101562, -0.001322820782661438, -0.0012790262699127197, -0.0012352317571640015, -0.0011914372444152832, -0.001147642731666565, -0.0011038482189178467, -0.0010600537061691284, -0.0010162591934204102, -0.0009724646806716919, -0.0009286701679229736, -0.0008848756551742554, -0.0008410811424255371, -0.0007972866296768188, -0.0007534921169281006, -0.0007096976041793823, -0.0006659030914306641, -0.0006221085786819458, -0.0005783140659332275, -0.0005345195531845093, -0.000490725040435791, -0.00044693052768707275, -0.0004031360149383545, -0.00035934150218963623, -0.00031554698944091797, -0.0002717524766921997, -0.00022795796394348145, -0.00018416345119476318, -0.00014036893844604492, -9.657442569732666e-05, -5.27799129486084e-05, -8.985400199890137e-06, 3.4809112548828125e-05, 7.860362529754639e-05, 0.00012239813804626465, 0.0001661926507949829, 0.00020998716354370117, 0.00025378167629241943, 0.0002975761890411377, 0.00034137070178985596, 0.0003851652145385742, 0.0004289597272872925, 0.00047275424003601074, 0.000516548752784729, 0.0005603432655334473, 0.0006041377782821655, 0.0006479322910308838, 0.000691726803779602, 0.0007355213165283203, 0.0007793158292770386, 0.0008231103420257568, 0.0008669048547744751, 0.0009106993675231934, 0.0009544938802719116, 0.0009982883930206299, 0.0010420829057693481, 0.0010858774185180664, 0.0011296719312667847, 0.001173466444015503, 0.0012172609567642212, 0.0012610554695129395, 0.0013048499822616577, 0.001348644495010376, 0.0013924390077590942, 0.0014362335205078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 4064.0, 9.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00035762786865234375, -0.00034628063440322876, -0.00033493340015411377, -0.0003235861659049988, -0.0003122389316558838, -0.0003008916974067688, -0.0002895444631576538, -0.0002781972289085388, -0.00026684999465942383, -0.00025550276041030884, -0.00024415552616119385, -0.00023280829191207886, -0.00022146105766296387, -0.00021011382341384888, -0.0001987665891647339, -0.0001874193549156189, -0.0001760721206665039, -0.00016472488641738892, -0.00015337765216827393, -0.00014203041791915894, -0.00013068318367004395, -0.00011933594942092896, -0.00010798871517181396, -9.664148092269897e-05, -8.529424667358398e-05, -7.3947012424469e-05, -6.2599778175354e-05, -5.1252543926239014e-05, -3.9905309677124023e-05, -2.8558075428009033e-05, -1.7210841178894043e-05, -5.863606929779053e-06, 5.4836273193359375e-06, 1.6830861568450928e-05, 2.8178095817565918e-05, 3.952533006668091e-05, 5.08725643157959e-05, 6.221979856491089e-05, 7.356703281402588e-05, 8.491426706314087e-05, 9.626150131225586e-05, 0.00010760873556137085, 0.00011895596981048584, 0.00013030320405960083, 0.00014165043830871582, 0.0001529976725578308, 0.0001643449068069458, 0.0001756921410560608, 0.00018703937530517578, 0.00019838660955429077, 0.00020973384380340576, 0.00022108107805252075, 0.00023242831230163574, 0.00024377554655075073, 0.0002551227807998657, 0.0002664700150489807, 0.0002778172492980957, 0.0002891644835472107, 0.0003005117177963257, 0.0003118589520454407, 0.00032320618629455566, 0.00033455342054367065, 0.00034590065479278564, 0.00035724788904190063, 0.0003685951232910156]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 39.0, 921.0, 47.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00319444527849555, -0.0030787005089223385, -0.002962955739349127, -0.002847210969775915, -0.00273146596737206, -0.002615721197798848, -0.0024999764282256365, -0.002384231658652425, -0.002268486889079213, -0.0021527421195060015, -0.00203699734993279, -0.0019212524639442563, -0.0018055076943710446, -0.0016897628083825111, -0.0015740180388092995, -0.0014582732692360878, -0.0013425283832475543, -0.0012267836136743426, -0.0011110387276858091, -0.0009952939581125975, -0.0008795491885393858, -0.0007638043607585132, -0.0006480595329776406, -0.000532314763404429, -0.0004165699356235564, -0.00030082513694651425, -0.0001850803237175569, -6.933551048859954e-05, 4.640928818844259e-05, 0.00016215408686548471, 0.0002778989146463573, 0.00039364368421956897, 0.0005093885120004416, 0.0006251333397813141, 0.0007408781093545258, 0.0008566229371353984, 0.0009723677067086101, 0.0010881125926971436, 0.0012038573622703552, 0.001319602131843567, 0.0014353469014167786, 0.0015510916709899902, 0.0016668365569785237, 0.0017825813265517354, 0.001898326096124947, 0.0020140709821134806, 0.0021298157516866922, 0.002245560521259904, 0.0023613055236637592, 0.002477050293236971, 0.0025927950628101826, 0.0027085398323833942, 0.0028242848347872496, 0.0029400296043604612, 0.003055774373933673, 0.0031715191435068846, 0.0032872639130800962, 0.003403008682653308, 0.0035187534522265196, 0.003634498454630375, 0.0037502432242035866, 0.0038659879937767982, 0.00398173276335001, 0.004097477532923222, 0.004213222302496433]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 22.0, 44.0, 31.0, 58.0, 79.0, 91.0, 94.0, 111.0, 92.0, 86.0, 85.0, 58.0, 40.0, 28.0, 27.0, 12.0, 11.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032806396484375, -0.00031471624970436096, -0.0003013685345649719, -0.0002880208194255829, -0.00027467310428619385, -0.0002613253891468048, -0.00024797767400741577, -0.00023462995886802673, -0.0002212822437286377, -0.00020793452858924866, -0.00019458681344985962, -0.00018123909831047058, -0.00016789138317108154, -0.0001545436680316925, -0.00014119595289230347, -0.00012784823775291443, -0.00011450052261352539, -0.00010115280747413635, -8.780509233474731e-05, -7.445737719535828e-05, -6.110966205596924e-05, -4.77619469165802e-05, -3.441423177719116e-05, -2.1066516637802124e-05, -7.718801498413086e-06, 5.628913640975952e-06, 1.897662878036499e-05, 3.232434391975403e-05, 4.5672059059143066e-05, 5.9019774198532104e-05, 7.236748933792114e-05, 8.571520447731018e-05, 9.906291961669922e-05, 0.00011241063475608826, 0.0001257583498954773, 0.00013910606503486633, 0.00015245378017425537, 0.0001658014953136444, 0.00017914921045303345, 0.00019249692559242249, 0.00020584464073181152, 0.00021919235587120056, 0.0002325400710105896, 0.00024588778614997864, 0.0002592355012893677, 0.0002725832164287567, 0.00028593093156814575, 0.0002992786467075348, 0.00031262636184692383, 0.00032597407698631287, 0.0003393217921257019, 0.00035266950726509094, 0.00036601722240448, 0.000379364937543869, 0.00039271265268325806, 0.0004060603678226471, 0.00041940808296203613, 0.00043275579810142517, 0.0004461035132408142, 0.00045945122838020325, 0.0004727989435195923, 0.0004861466586589813, 0.0004994943737983704, 0.0005128420889377594, 0.0005261898040771484]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 8.0, 13.0, 20.0, 27.0, 42.0, 47.0, 63.0, 81.0, 142.0, 215.0, 307.0, 442.0, 794.0, 1362.0, 2374.0, 4618.0, 10207.0, 25876.0, 83979.0, 520448.0, 299400.0, 60011.0, 20329.0, 8389.0, 4014.0, 2134.0, 1137.0, 709.0, 444.0, 272.0, 183.0, 130.0, 91.0, 65.0, 43.0, 36.0, 21.0, 18.0, 10.0, 13.0, 6.0, 3.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.024627685546875, -0.02387857437133789, -0.02312946319580078, -0.022380352020263672, -0.021631240844726562, -0.020882129669189453, -0.020133018493652344, -0.019383907318115234, -0.018634796142578125, -0.017885684967041016, -0.017136573791503906, -0.016387462615966797, -0.015638351440429688, -0.014889240264892578, -0.014140129089355469, -0.01339101791381836, -0.01264190673828125, -0.01189279556274414, -0.011143684387207031, -0.010394573211669922, -0.009645462036132812, -0.008896350860595703, -0.008147239685058594, -0.007398128509521484, -0.006649017333984375, -0.005899906158447266, -0.005150794982910156, -0.004401683807373047, -0.0036525726318359375, -0.002903461456298828, -0.0021543502807617188, -0.0014052391052246094, -0.0006561279296875, 9.298324584960938e-05, 0.0008420944213867188, 0.0015912055969238281, 0.0023403167724609375, 0.003089427947998047, 0.0038385391235351562, 0.004587650299072266, 0.005336761474609375, 0.006085872650146484, 0.006834983825683594, 0.007584095001220703, 0.008333206176757812, 0.009082317352294922, 0.009831428527832031, 0.01058053970336914, 0.01132965087890625, 0.01207876205444336, 0.012827873229980469, 0.013576984405517578, 0.014326095581054688, 0.015075206756591797, 0.015824317932128906, 0.016573429107666016, 0.017322540283203125, 0.018071651458740234, 0.018820762634277344, 0.019569873809814453, 0.020318984985351562, 0.021068096160888672, 0.02181720733642578, 0.02256631851196289, 0.0233154296875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 7.0, 7.0, 12.0, 17.0, 32.0, 28.0, 54.0, 63.0, 76.0, 80.0, 96.0, 92.0, 94.0, 66.0, 64.0, 52.0, 39.0, 31.0, 19.0, 19.0, 12.0, 9.0, 6.0, 9.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0202178955078125, -0.019594192504882812, -0.018970489501953125, -0.018346786499023438, -0.01772308349609375, -0.017099380493164062, -0.016475677490234375, -0.015851974487304688, -0.015228271484375, -0.014604568481445312, -0.013980865478515625, -0.013357162475585938, -0.01273345947265625, -0.012109756469726562, -0.011486053466796875, -0.010862350463867188, -0.0102386474609375, -0.009614944458007812, -0.008991241455078125, -0.008367538452148438, -0.00774383544921875, -0.0071201324462890625, -0.006496429443359375, -0.0058727264404296875, -0.0052490234375, -0.0046253204345703125, -0.004001617431640625, -0.0033779144287109375, -0.00275421142578125, -0.0021305084228515625, -0.001506805419921875, -0.0008831024169921875, -0.0002593994140625, 0.0003643035888671875, 0.000988006591796875, 0.0016117095947265625, 0.00223541259765625, 0.0028591156005859375, 0.003482818603515625, 0.0041065216064453125, 0.004730224609375, 0.0053539276123046875, 0.005977630615234375, 0.0066013336181640625, 0.00722503662109375, 0.007848739624023438, 0.008472442626953125, 0.009096145629882812, 0.0097198486328125, 0.010343551635742188, 0.010967254638671875, 0.011590957641601562, 0.01221466064453125, 0.012838363647460938, 0.013462066650390625, 0.014085769653320312, 0.01470947265625, 0.015333175659179688, 0.015956878662109375, 0.016580581665039062, 0.01720428466796875, 0.017827987670898438, 0.018451690673828125, 0.019075393676757812, 0.0196990966796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 6.0, 11.0, 14.0, 10.0, 13.0, 22.0, 21.0, 26.0, 33.0, 47.0, 42.0, 90.0, 120.0, 197.0, 386.0, 1004.0, 9510.0, 895738.0, 136390.0, 3325.0, 689.0, 283.0, 149.0, 107.0, 66.0, 40.0, 48.0, 30.0, 24.0, 17.0, 15.0, 13.0, 11.0, 6.0, 7.0, 7.0, 6.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0736083984375, -0.07121944427490234, -0.06883049011230469, -0.06644153594970703, -0.06405258178710938, -0.06166362762451172, -0.05927467346191406, -0.056885719299316406, -0.05449676513671875, -0.052107810974121094, -0.04971885681152344, -0.04732990264892578, -0.044940948486328125, -0.04255199432373047, -0.04016304016113281, -0.037774085998535156, -0.0353851318359375, -0.032996177673339844, -0.030607223510742188, -0.02821826934814453, -0.025829315185546875, -0.02344036102294922, -0.021051406860351562, -0.018662452697753906, -0.01627349853515625, -0.013884544372558594, -0.011495590209960938, -0.009106636047363281, -0.006717681884765625, -0.004328727722167969, -0.0019397735595703125, 0.00044918060302734375, 0.002838134765625, 0.005227088928222656, 0.0076160430908203125, 0.010004997253417969, 0.012393951416015625, 0.014782905578613281, 0.017171859741210938, 0.019560813903808594, 0.02194976806640625, 0.024338722229003906, 0.026727676391601562, 0.02911663055419922, 0.031505584716796875, 0.03389453887939453, 0.03628349304199219, 0.038672447204589844, 0.0410614013671875, 0.043450355529785156, 0.04583930969238281, 0.04822826385498047, 0.050617218017578125, 0.05300617218017578, 0.05539512634277344, 0.057784080505371094, 0.06017303466796875, 0.0625619888305664, 0.06495094299316406, 0.06733989715576172, 0.06972885131835938, 0.07211780548095703, 0.07450675964355469, 0.07689571380615234, 0.07928466796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 7.0, 5.0, 6.0, 7.0, 10.0, 15.0, 15.0, 11.0, 15.0, 21.0, 32.0, 22.0, 31.0, 31.0, 22.0, 45.0, 42.0, 37.0, 41.0, 25.0, 47.0, 52.0, 37.0, 21.0, 31.0, 52.0, 40.0, 18.0, 22.0, 22.0, 31.0, 33.0, 21.0, 17.0, 18.0, 14.0, 10.0, 10.0, 13.0, 10.0, 9.0, 5.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032684326171875, -0.031556129455566406, -0.030427932739257812, -0.02929973602294922, -0.028171539306640625, -0.02704334259033203, -0.025915145874023438, -0.024786949157714844, -0.02365875244140625, -0.022530555725097656, -0.021402359008789062, -0.02027416229248047, -0.019145965576171875, -0.01801776885986328, -0.016889572143554688, -0.015761375427246094, -0.0146331787109375, -0.013504981994628906, -0.012376785278320312, -0.011248588562011719, -0.010120391845703125, -0.008992195129394531, -0.007863998413085938, -0.006735801696777344, -0.00560760498046875, -0.004479408264160156, -0.0033512115478515625, -0.0022230148315429688, -0.001094818115234375, 3.337860107421875e-05, 0.0011615753173828125, 0.0022897720336914062, 0.00341796875, 0.004546165466308594, 0.0056743621826171875, 0.006802558898925781, 0.007930755615234375, 0.009058952331542969, 0.010187149047851562, 0.011315345764160156, 0.01244354248046875, 0.013571739196777344, 0.014699935913085938, 0.01582813262939453, 0.016956329345703125, 0.01808452606201172, 0.019212722778320312, 0.020340919494628906, 0.0214691162109375, 0.022597312927246094, 0.023725509643554688, 0.02485370635986328, 0.025981903076171875, 0.02711009979248047, 0.028238296508789062, 0.029366493225097656, 0.03049468994140625, 0.031622886657714844, 0.03275108337402344, 0.03387928009033203, 0.035007476806640625, 0.03613567352294922, 0.03726387023925781, 0.038392066955566406, 0.039520263671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 9.0, 36.0, 100.0, 1110.0, 1046273.0, 848.0, 97.0, 22.0, 17.0, 9.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.052703857421875, -0.05151820182800293, -0.05033254623413086, -0.04914689064025879, -0.04796123504638672, -0.04677557945251465, -0.04558992385864258, -0.04440426826477051, -0.04321861267089844, -0.04203295707702637, -0.0408473014831543, -0.03966164588928223, -0.038475990295410156, -0.037290334701538086, -0.036104679107666016, -0.034919023513793945, -0.033733367919921875, -0.032547712326049805, -0.031362056732177734, -0.030176401138305664, -0.028990745544433594, -0.027805089950561523, -0.026619434356689453, -0.025433778762817383, -0.024248123168945312, -0.023062467575073242, -0.021876811981201172, -0.0206911563873291, -0.01950550079345703, -0.01831984519958496, -0.01713418960571289, -0.01594853401184082, -0.01476287841796875, -0.01357722282409668, -0.01239156723022461, -0.011205911636352539, -0.010020256042480469, -0.008834600448608398, -0.007648944854736328, -0.006463289260864258, -0.0052776336669921875, -0.004091978073120117, -0.002906322479248047, -0.0017206668853759766, -0.0005350112915039062, 0.0006506443023681641, 0.0018362998962402344, 0.0030219554901123047, 0.004207611083984375, 0.005393266677856445, 0.006578922271728516, 0.007764577865600586, 0.008950233459472656, 0.010135889053344727, 0.011321544647216797, 0.012507200241088867, 0.013692855834960938, 0.014878511428833008, 0.016064167022705078, 0.01724982261657715, 0.01843547821044922, 0.01962113380432129, 0.02080678939819336, 0.02199244499206543, 0.0231781005859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 20.0, 621.0, 317.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005645751953125, -0.0005450323224067688, -0.0005254894495010376, -0.0005059465765953064, -0.0004864037036895752, -0.000466860830783844, -0.0004473179578781128, -0.0004277750849723816, -0.0004082322120666504, -0.0003886893391609192, -0.000369146466255188, -0.0003496035933494568, -0.0003300607204437256, -0.0003105178475379944, -0.0002909749746322632, -0.000271432101726532, -0.0002518892288208008, -0.00023234635591506958, -0.00021280348300933838, -0.00019326061010360718, -0.00017371773719787598, -0.00015417486429214478, -0.00013463199138641357, -0.00011508911848068237, -9.554624557495117e-05, -7.600337266921997e-05, -5.646049976348877e-05, -3.691762685775757e-05, -1.7374753952026367e-05, 2.168118953704834e-06, 2.1710991859436035e-05, 4.1253864765167236e-05, 6.079673767089844e-05, 8.033961057662964e-05, 9.988248348236084e-05, 0.00011942535638809204, 0.00013896822929382324, 0.00015851110219955444, 0.00017805397510528564, 0.00019759684801101685, 0.00021713972091674805, 0.00023668259382247925, 0.00025622546672821045, 0.00027576833963394165, 0.00029531121253967285, 0.00031485408544540405, 0.00033439695835113525, 0.00035393983125686646, 0.00037348270416259766, 0.00039302557706832886, 0.00041256844997406006, 0.00043211132287979126, 0.00045165419578552246, 0.00047119706869125366, 0.0004907399415969849, 0.0005102828145027161, 0.0005298256874084473, 0.0005493685603141785, 0.0005689114332199097, 0.0005884543061256409, 0.0006079971790313721, 0.0006275400519371033, 0.0006470829248428345, 0.0006666257977485657, 0.0006861686706542969]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 18.0, 33.0, 140.0, 561.0, 1042538.0, 4937.0, 228.0, 59.0, 13.0, 8.0, 10.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0172882080078125, -0.015819311141967773, -0.014350414276123047, -0.01288151741027832, -0.011412620544433594, -0.009943723678588867, -0.00847482681274414, -0.007005929946899414, -0.0055370330810546875, -0.004068136215209961, -0.0025992393493652344, -0.0011303424835205078, 0.00033855438232421875, 0.0018074512481689453, 0.003276348114013672, 0.0047452449798583984, 0.006214141845703125, 0.0076830387115478516, 0.009151935577392578, 0.010620832443237305, 0.012089729309082031, 0.013558626174926758, 0.015027523040771484, 0.01649641990661621, 0.017965316772460938, 0.019434213638305664, 0.02090311050415039, 0.022372007369995117, 0.023840904235839844, 0.02530980110168457, 0.026778697967529297, 0.028247594833374023, 0.02971649169921875, 0.031185388565063477, 0.0326542854309082, 0.03412318229675293, 0.035592079162597656, 0.03706097602844238, 0.03852987289428711, 0.039998769760131836, 0.04146766662597656, 0.04293656349182129, 0.044405460357666016, 0.04587435722351074, 0.04734325408935547, 0.048812150955200195, 0.05028104782104492, 0.05174994468688965, 0.053218841552734375, 0.0546877384185791, 0.05615663528442383, 0.057625532150268555, 0.05909442901611328, 0.06056332588195801, 0.062032222747802734, 0.06350111961364746, 0.06497001647949219, 0.06643891334533691, 0.06790781021118164, 0.06937670707702637, 0.0708456039428711, 0.07231450080871582, 0.07378339767456055, 0.07525229454040527, 0.07672119140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 10.0, 12.0, 26.0, 80.0, 342.0, 369.0, 88.0, 47.0, 19.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03271484375, -0.03204786777496338, -0.03138089179992676, -0.030713915824890137, -0.030046939849853516, -0.029379963874816895, -0.028712987899780273, -0.028046011924743652, -0.02737903594970703, -0.02671205997467041, -0.02604508399963379, -0.025378108024597168, -0.024711132049560547, -0.024044156074523926, -0.023377180099487305, -0.022710204124450684, -0.022043228149414062, -0.02137625217437744, -0.02070927619934082, -0.0200423002243042, -0.019375324249267578, -0.018708348274230957, -0.018041372299194336, -0.017374396324157715, -0.016707420349121094, -0.016040444374084473, -0.015373468399047852, -0.01470649242401123, -0.01403951644897461, -0.013372540473937988, -0.012705564498901367, -0.012038588523864746, -0.011371612548828125, -0.010704636573791504, -0.010037660598754883, -0.009370684623718262, -0.00870370864868164, -0.00803673267364502, -0.0073697566986083984, -0.006702780723571777, -0.006035804748535156, -0.005368828773498535, -0.004701852798461914, -0.004034876823425293, -0.003367900848388672, -0.0027009248733520508, -0.0020339488983154297, -0.0013669729232788086, -0.0006999969482421875, -3.3020973205566406e-05, 0.0006339550018310547, 0.0013009309768676758, 0.001967906951904297, 0.002634882926940918, 0.003301858901977539, 0.00396883487701416, 0.004635810852050781, 0.005302786827087402, 0.0059697628021240234, 0.0066367387771606445, 0.007303714752197266, 0.007970690727233887, 0.008637666702270508, 0.009304642677307129, 0.00997161865234375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 15.0, 291.0, 668.0, 38.0, 6.0, 2.0, 1.0, 1.0], "bins": [-1.9654268026351929, -1.9315918684005737, -1.8977569341659546, -1.8639219999313354, -1.8300870656967163, -1.7962521314620972, -1.762417197227478, -1.7285822629928589, -1.6947473287582397, -1.6609123945236206, -1.6270774602890015, -1.5932425260543823, -1.5594075918197632, -1.525572657585144, -1.491737723350525, -1.4579027891159058, -1.4240678548812866, -1.3902329206466675, -1.3563979864120483, -1.3225630521774292, -1.28872811794281, -1.254893183708191, -1.2210582494735718, -1.1872233152389526, -1.1533883810043335, -1.1195534467697144, -1.0857185125350952, -1.051883578300476, -1.018048644065857, -0.9842137098312378, -0.9503787755966187, -0.9165438413619995, -0.8827088475227356, -0.8488739132881165, -0.8150389790534973, -0.7812040448188782, -0.747369110584259, -0.7135341763496399, -0.6796992421150208, -0.6458643078804016, -0.6120293736457825, -0.5781944394111633, -0.5443595051765442, -0.510524570941925, -0.4766896367073059, -0.44285470247268677, -0.4090197682380676, -0.3751848340034485, -0.34134989976882935, -0.3075149655342102, -0.27368003129959106, -0.23984509706497192, -0.20601016283035278, -0.17217522859573364, -0.1383402943611145, -0.10450536012649536, -0.07067042589187622, -0.03683549165725708, -0.0030005574226379395, 0.0308343768119812, 0.06466931104660034, 0.09850424528121948, 0.13233917951583862, 0.16617411375045776, 0.2000090479850769]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 3.0, 5.0, 9.0, 11.0, 9.0, 7.0, 10.0, 21.0, 11.0, 19.0, 22.0, 24.0, 31.0, 28.0, 31.0, 39.0, 31.0, 38.0, 43.0, 43.0, 44.0, 46.0, 27.0, 48.0, 27.0, 31.0, 41.0, 28.0, 30.0, 32.0, 30.0, 28.0, 25.0, 23.0, 20.0, 11.0, 15.0, 10.0, 7.0, 11.0, 6.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.18563055992126465, -0.18013067543506622, -0.1746307909488678, -0.16913089156150818, -0.16363100707530975, -0.15813112258911133, -0.1526312232017517, -0.14713133871555328, -0.14163145422935486, -0.13613156974315643, -0.130631685256958, -0.1251317858695984, -0.11963190138339996, -0.11413201689720154, -0.10863212496042252, -0.1031322330236435, -0.09763234853744507, -0.09213246405124664, -0.08663257211446762, -0.0811326801776886, -0.07563279569149017, -0.07013291120529175, -0.06463301926851273, -0.059133131057024, -0.05363324284553528, -0.048133354634046555, -0.04263346642255783, -0.03713357821106911, -0.03163368999958038, -0.02613380178809166, -0.020633913576602936, -0.015134025365114212, -0.009634137153625488, -0.0041342489421367645, 0.0013656392693519592, 0.006865527480840683, 0.012365415692329407, 0.01786530390381813, 0.023365192115306854, 0.028865080326795578, 0.0343649685382843, 0.039864856749773026, 0.04536474496126175, 0.05086463317275047, 0.0563645213842392, 0.06186440959572792, 0.06736429780721664, 0.07286418974399567, 0.07836407423019409, 0.08386395871639252, 0.08936385065317154, 0.09486374258995056, 0.10036362707614899, 0.10586351156234741, 0.11136340349912643, 0.11686329543590546, 0.12236317992210388, 0.1278630644083023, 0.13336294889450073, 0.13886284828186035, 0.14436273276805878, 0.1498626172542572, 0.15536251664161682, 0.16086240112781525, 0.16636228561401367]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 4.0, 8.0, 3.0, 7.0, 15.0, 33.0, 30.0, 39.0, 50.0, 77.0, 105.0, 159.0, 238.0, 414.0, 837.0, 2128.0, 7651.0, 4172090.0, 6660.0, 1820.0, 752.0, 379.0, 220.0, 129.0, 102.0, 96.0, 55.0, 39.0, 27.0, 22.0, 21.0, 11.0, 11.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0004711151123046875, -0.0004565976560115814, -0.00044208019971847534, -0.00042756274342536926, -0.0004130452871322632, -0.0003985278308391571, -0.000384010374546051, -0.00036949291825294495, -0.00035497546195983887, -0.0003404580056667328, -0.0003259405493736267, -0.00031142309308052063, -0.00029690563678741455, -0.00028238818049430847, -0.0002678707242012024, -0.0002533532679080963, -0.00023883581161499023, -0.00022431835532188416, -0.00020980089902877808, -0.000195283442735672, -0.00018076598644256592, -0.00016624853014945984, -0.00015173107385635376, -0.00013721361756324768, -0.0001226961612701416, -0.00010817870497703552, -9.366124868392944e-05, -7.914379239082336e-05, -6.462633609771729e-05, -5.0108879804611206e-05, -3.559142351150513e-05, -2.1073967218399048e-05, -6.556510925292969e-06, 7.96094536781311e-06, 2.247840166091919e-05, 3.699585795402527e-05, 5.151331424713135e-05, 6.603077054023743e-05, 8.05482268333435e-05, 9.506568312644958e-05, 0.00010958313941955566, 0.00012410059571266174, 0.00013861805200576782, 0.0001531355082988739, 0.00016765296459197998, 0.00018217042088508606, 0.00019668787717819214, 0.00021120533347129822, 0.0002257227897644043, 0.00024024024605751038, 0.00025475770235061646, 0.00026927515864372253, 0.0002837926149368286, 0.0002983100712299347, 0.00031282752752304077, 0.00032734498381614685, 0.00034186244010925293, 0.000356379896402359, 0.0003708973526954651, 0.00038541480898857117, 0.00039993226528167725, 0.0004144497215747833, 0.0004289671778678894, 0.0004434846341609955, 0.00045800209045410156]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 9.0, 5.0, 16.0, 19.0, 29.0, 31.0, 56.0, 64.0, 82.0, 78.0, 87.0, 109.0, 83.0, 74.0, 49.0, 57.0, 38.0, 27.0, 22.0, 13.0, 12.0, 9.0, 9.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0202484130859375, -0.019620656967163086, -0.018992900848388672, -0.018365144729614258, -0.017737388610839844, -0.01710963249206543, -0.016481876373291016, -0.0158541202545166, -0.015226364135742188, -0.014598608016967773, -0.01397085189819336, -0.013343095779418945, -0.012715339660644531, -0.012087583541870117, -0.011459827423095703, -0.010832071304321289, -0.010204315185546875, -0.009576559066772461, -0.008948802947998047, -0.008321046829223633, -0.007693290710449219, -0.007065534591674805, -0.006437778472900391, -0.0058100223541259766, -0.0051822662353515625, -0.0045545101165771484, -0.003926753997802734, -0.0032989978790283203, -0.0026712417602539062, -0.002043485641479492, -0.0014157295227050781, -0.0007879734039306641, -0.00016021728515625, 0.00046753883361816406, 0.0010952949523925781, 0.0017230510711669922, 0.0023508071899414062, 0.0029785633087158203, 0.0036063194274902344, 0.0042340755462646484, 0.0048618316650390625, 0.0054895877838134766, 0.006117343902587891, 0.006745100021362305, 0.007372856140136719, 0.008000612258911133, 0.008628368377685547, 0.009256124496459961, 0.009883880615234375, 0.010511636734008789, 0.011139392852783203, 0.011767148971557617, 0.012394905090332031, 0.013022661209106445, 0.01365041732788086, 0.014278173446655273, 0.014905929565429688, 0.015533685684204102, 0.016161441802978516, 0.01678919792175293, 0.017416954040527344, 0.018044710159301758, 0.018672466278076172, 0.019300222396850586, 0.019927978515625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 11.0, 10.0, 17.0, 34.0, 27.0, 33.0, 35.0, 75.0, 91.0, 118.0, 143.0, 292.0, 711.0, 2345.0, 14793.0, 4169319.0, 3907.0, 1144.0, 423.0, 191.0, 121.0, 101.0, 75.0, 56.0, 55.0, 31.0, 24.0, 27.0, 14.0, 17.0, 15.0, 5.0, 4.0, 1.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010328292846679688, -0.0010017156600952148, -0.0009706020355224609, -0.000939488410949707, -0.0009083747863769531, -0.0008772611618041992, -0.0008461475372314453, -0.0008150339126586914, -0.0007839202880859375, -0.0007528066635131836, -0.0007216930389404297, -0.0006905794143676758, -0.0006594657897949219, -0.000628352165222168, -0.0005972385406494141, -0.0005661249160766602, -0.0005350112915039062, -0.0005038976669311523, -0.00047278404235839844, -0.00044167041778564453, -0.0004105567932128906, -0.0003794431686401367, -0.0003483295440673828, -0.0003172159194946289, -0.000286102294921875, -0.0002549886703491211, -0.0002238750457763672, -0.00019276142120361328, -0.00016164779663085938, -0.00013053417205810547, -9.942054748535156e-05, -6.830692291259766e-05, -3.719329833984375e-05, -6.079673767089844e-06, 2.5033950805664062e-05, 5.614757537841797e-05, 8.726119995117188e-05, 0.00011837482452392578, 0.0001494884490966797, 0.0001806020736694336, 0.0002117156982421875, 0.0002428293228149414, 0.0002739429473876953, 0.0003050565719604492, 0.0003361701965332031, 0.00036728382110595703, 0.00039839744567871094, 0.00042951107025146484, 0.00046062469482421875, 0.0004917383193969727, 0.0005228519439697266, 0.0005539655685424805, 0.0005850791931152344, 0.0006161928176879883, 0.0006473064422607422, 0.0006784200668334961, 0.00070953369140625, 0.0007406473159790039, 0.0007717609405517578, 0.0008028745651245117, 0.0008339881896972656, 0.0008651018142700195, 0.0008962154388427734, 0.0009273290634155273, 0.0009584426879882812]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 22.0, 4028.0, 7.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012350082397460938, -0.00011544302105903625, -0.00010738521814346313, -9.932741522789001e-05, -9.12696123123169e-05, -8.321180939674377e-05, -7.515400648117065e-05, -6.709620356559753e-05, -5.9038400650024414e-05, -5.0980597734451294e-05, -4.2922794818878174e-05, -3.4864991903305054e-05, -2.6807188987731934e-05, -1.8749386072158813e-05, -1.0691583156585693e-05, -2.6337802410125732e-06, 5.424022674560547e-06, 1.3481825590133667e-05, 2.1539628505706787e-05, 2.9597431421279907e-05, 3.765523433685303e-05, 4.571303725242615e-05, 5.377084016799927e-05, 6.182864308357239e-05, 6.988644599914551e-05, 7.794424891471863e-05, 8.600205183029175e-05, 9.405985474586487e-05, 0.00010211765766143799, 0.00011017546057701111, 0.00011823326349258423, 0.00012629106640815735, 0.00013434886932373047, 0.0001424066722393036, 0.0001504644751548767, 0.00015852227807044983, 0.00016658008098602295, 0.00017463788390159607, 0.0001826956868171692, 0.0001907534897327423, 0.00019881129264831543, 0.00020686909556388855, 0.00021492689847946167, 0.0002229847013950348, 0.0002310425043106079, 0.00023910030722618103, 0.00024715811014175415, 0.00025521591305732727, 0.0002632737159729004, 0.0002713315188884735, 0.00027938932180404663, 0.00028744712471961975, 0.00029550492763519287, 0.000303562730550766, 0.0003116205334663391, 0.00031967833638191223, 0.00032773613929748535, 0.00033579394221305847, 0.0003438517451286316, 0.0003519095480442047, 0.00035996735095977783, 0.00036802515387535095, 0.00037608295679092407, 0.0003841407597064972, 0.0003921985626220703]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 26.0, 95.0, 577.0, 229.0, 60.0, 13.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003884966135956347, -0.0003482723259367049, -0.00030804803827777505, -0.0002678237797226757, -0.00022759949206374586, -0.00018737520440481603, -0.00014715093129780143, -0.00010692665819078684, -6.670237053185701e-05, -2.6478090148884803e-05, 1.3746190234087408e-05, 5.397047061705962e-05, 9.419475100003183e-05, 0.00013441903865896165, 0.00017464331176597625, 0.00021486758487299085, 0.00025509187253192067, 0.0002953161601908505, 0.0003355404478497803, 0.0003757647064048797, 0.0004159889940638095, 0.00045621328172273934, 0.0004964375402778387, 0.0005366618279367685, 0.0005768861155956984, 0.0006171104032546282, 0.000657334690913558, 0.0006975589785724878, 0.0007377832662314177, 0.0007780075538903475, 0.0008182317833416164, 0.0008584560710005462, 0.000898680416867137, 0.0009389047045260668, 0.0009791289921849966, 0.0010193532798439264, 0.0010595775675028563, 0.001099801855161786, 0.001140026142820716, 0.0011802504304796457, 0.0012204747181385756, 0.0012606990057975054, 0.0013009232934564352, 0.001341147581115365, 0.0013813718687742949, 0.0014215961564332247, 0.0014618204440921545, 0.0015020447317510843, 0.0015422689029946923, 0.0015824931906536222, 0.001622717478312552, 0.0016629417659714818, 0.0017031660536304116, 0.0017433903412893414, 0.0017836146289482713, 0.0018238388001918793, 0.001864063087850809, 0.001904287375509739, 0.0019445116631686687, 0.0019847359508275986, 0.0020249602384865284, 0.0020651845261454582, 0.002105408813804388, 0.002145633101463318, 0.0021858573891222477]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 10.0, 3.0, 10.0, 7.0, 7.0, 17.0, 14.0, 22.0, 17.0, 21.0, 29.0, 40.0, 41.0, 51.0, 44.0, 55.0, 48.0, 58.0, 46.0, 50.0, 43.0, 48.0, 49.0, 43.0, 42.0, 38.0, 30.0, 14.0, 16.0, 18.0, 20.0, 14.0, 7.0, 10.0, 5.0, 9.0, 0.0, 5.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.0003345012664794922, -0.0003262395039200783, -0.00031797774136066437, -0.00030971597880125046, -0.00030145421624183655, -0.00029319245368242264, -0.00028493069112300873, -0.0002766689285635948, -0.0002684071660041809, -0.000260145403444767, -0.0002518836408853531, -0.00024362187832593918, -0.00023536011576652527, -0.00022709835320711136, -0.00021883659064769745, -0.00021057482808828354, -0.00020231306552886963, -0.00019405130296945572, -0.0001857895404100418, -0.0001775277778506279, -0.000169266015291214, -0.00016100425273180008, -0.00015274249017238617, -0.00014448072761297226, -0.00013621896505355835, -0.00012795720249414444, -0.00011969543993473053, -0.00011143367737531662, -0.00010317191481590271, -9.49101522564888e-05, -8.664838969707489e-05, -7.838662713766098e-05, -7.012486457824707e-05, -6.186310201883316e-05, -5.360133945941925e-05, -4.533957690000534e-05, -3.707781434059143e-05, -2.881605178117752e-05, -2.055428922176361e-05, -1.2292526662349701e-05, -4.030764102935791e-06, 4.230998456478119e-06, 1.2492761015892029e-05, 2.075452357530594e-05, 2.901628613471985e-05, 3.727804869413376e-05, 4.553981125354767e-05, 5.380157381296158e-05, 6.206333637237549e-05, 7.03250989317894e-05, 7.858686149120331e-05, 8.684862405061722e-05, 9.511038661003113e-05, 0.00010337214916944504, 0.00011163391172885895, 0.00011989567428827286, 0.00012815743684768677, 0.00013641919940710068, 0.0001446809619665146, 0.0001529427245259285, 0.0001612044870853424, 0.00016946624964475632, 0.00017772801220417023, 0.00018598977476358414, 0.00019425153732299805]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 2.0, 9.0, 9.0, 5.0, 4.0, 14.0, 20.0, 30.0, 25.0, 48.0, 55.0, 88.0, 118.0, 147.0, 218.0, 357.0, 543.0, 823.0, 1406.0, 2450.0, 4724.0, 9321.0, 20529.0, 53369.0, 197486.0, 568318.0, 119003.0, 37587.0, 15288.0, 7251.0, 3593.0, 2154.0, 1236.0, 749.0, 486.0, 317.0, 229.0, 145.0, 108.0, 83.0, 46.0, 31.0, 33.0, 31.0, 21.0, 10.0, 6.0, 8.0, 9.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0], "bins": [-0.0214385986328125, -0.020775556564331055, -0.02011251449584961, -0.019449472427368164, -0.01878643035888672, -0.018123388290405273, -0.017460346221923828, -0.016797304153442383, -0.016134262084960938, -0.015471220016479492, -0.014808177947998047, -0.014145135879516602, -0.013482093811035156, -0.012819051742553711, -0.012156009674072266, -0.01149296760559082, -0.010829925537109375, -0.01016688346862793, -0.009503841400146484, -0.008840799331665039, -0.008177757263183594, -0.0075147151947021484, -0.006851673126220703, -0.006188631057739258, -0.0055255889892578125, -0.004862546920776367, -0.004199504852294922, -0.0035364627838134766, -0.0028734207153320312, -0.002210378646850586, -0.0015473365783691406, -0.0008842945098876953, -0.00022125244140625, 0.0004417896270751953, 0.0011048316955566406, 0.001767873764038086, 0.0024309158325195312, 0.0030939579010009766, 0.003756999969482422, 0.004420042037963867, 0.0050830841064453125, 0.005746126174926758, 0.006409168243408203, 0.0070722103118896484, 0.007735252380371094, 0.008398294448852539, 0.009061336517333984, 0.00972437858581543, 0.010387420654296875, 0.01105046272277832, 0.011713504791259766, 0.012376546859741211, 0.013039588928222656, 0.013702630996704102, 0.014365673065185547, 0.015028715133666992, 0.015691757202148438, 0.016354799270629883, 0.017017841339111328, 0.017680883407592773, 0.01834392547607422, 0.019006967544555664, 0.01967000961303711, 0.020333051681518555, 0.02099609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 10.0, 4.0, 16.0, 19.0, 30.0, 30.0, 57.0, 63.0, 83.0, 79.0, 85.0, 109.0, 84.0, 74.0, 51.0, 56.0, 36.0, 27.0, 22.0, 13.0, 12.0, 9.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.020233154296875, -0.019605636596679688, -0.018978118896484375, -0.018350601196289062, -0.01772308349609375, -0.017095565795898438, -0.016468048095703125, -0.015840530395507812, -0.0152130126953125, -0.014585494995117188, -0.013957977294921875, -0.013330459594726562, -0.01270294189453125, -0.012075424194335938, -0.011447906494140625, -0.010820388793945312, -0.01019287109375, -0.009565353393554688, -0.008937835693359375, -0.008310317993164062, -0.00768280029296875, -0.0070552825927734375, -0.006427764892578125, -0.0058002471923828125, -0.0051727294921875, -0.0045452117919921875, -0.003917694091796875, -0.0032901763916015625, -0.00266265869140625, -0.0020351409912109375, -0.001407623291015625, -0.0007801055908203125, -0.000152587890625, 0.0004749298095703125, 0.001102447509765625, 0.0017299652099609375, 0.00235748291015625, 0.0029850006103515625, 0.003612518310546875, 0.0042400360107421875, 0.0048675537109375, 0.0054950714111328125, 0.006122589111328125, 0.0067501068115234375, 0.00737762451171875, 0.008005142211914062, 0.008632659912109375, 0.009260177612304688, 0.0098876953125, 0.010515213012695312, 0.011142730712890625, 0.011770248413085938, 0.01239776611328125, 0.013025283813476562, 0.013652801513671875, 0.014280319213867188, 0.0149078369140625, 0.015535354614257812, 0.016162872314453125, 0.016790390014648438, 0.01741790771484375, 0.018045425415039062, 0.018672943115234375, 0.019300460815429688, 0.019927978515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 11.0, 6.0, 13.0, 12.0, 14.0, 18.0, 17.0, 31.0, 38.0, 44.0, 70.0, 104.0, 148.0, 301.0, 734.0, 3476.0, 91051.0, 935994.0, 13895.0, 1472.0, 443.0, 211.0, 118.0, 72.0, 54.0, 42.0, 38.0, 30.0, 17.0, 12.0, 14.0, 16.0, 9.0, 4.0, 3.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07122802734375, -0.06894969940185547, -0.06667137145996094, -0.0643930435180664, -0.062114715576171875, -0.059836387634277344, -0.05755805969238281, -0.05527973175048828, -0.05300140380859375, -0.05072307586669922, -0.04844474792480469, -0.046166419982910156, -0.043888092041015625, -0.041609764099121094, -0.03933143615722656, -0.03705310821533203, -0.0347747802734375, -0.03249645233154297, -0.030218124389648438, -0.027939796447753906, -0.025661468505859375, -0.023383140563964844, -0.021104812622070312, -0.01882648468017578, -0.01654815673828125, -0.014269828796386719, -0.011991500854492188, -0.009713172912597656, -0.007434844970703125, -0.005156517028808594, -0.0028781890869140625, -0.0005998611450195312, 0.001678466796875, 0.003956794738769531, 0.0062351226806640625, 0.008513450622558594, 0.010791778564453125, 0.013070106506347656, 0.015348434448242188, 0.01762676239013672, 0.01990509033203125, 0.02218341827392578, 0.024461746215820312, 0.026740074157714844, 0.029018402099609375, 0.031296730041503906, 0.03357505798339844, 0.03585338592529297, 0.0381317138671875, 0.04041004180908203, 0.04268836975097656, 0.044966697692871094, 0.047245025634765625, 0.049523353576660156, 0.05180168151855469, 0.05408000946044922, 0.05635833740234375, 0.05863666534423828, 0.06091499328613281, 0.06319332122802734, 0.06547164916992188, 0.0677499771118164, 0.07002830505371094, 0.07230663299560547, 0.0745849609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 9.0, 9.0, 11.0, 16.0, 12.0, 20.0, 23.0, 21.0, 29.0, 27.0, 36.0, 27.0, 36.0, 38.0, 45.0, 37.0, 38.0, 35.0, 24.0, 45.0, 41.0, 33.0, 45.0, 37.0, 42.0, 20.0, 27.0, 27.0, 28.0, 21.0, 14.0, 18.0, 16.0, 19.0, 14.0, 7.0, 11.0, 4.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.038848876953125, -0.03767251968383789, -0.03649616241455078, -0.03531980514526367, -0.03414344787597656, -0.03296709060668945, -0.031790733337402344, -0.030614376068115234, -0.029438018798828125, -0.028261661529541016, -0.027085304260253906, -0.025908946990966797, -0.024732589721679688, -0.023556232452392578, -0.02237987518310547, -0.02120351791381836, -0.02002716064453125, -0.01885080337524414, -0.01767444610595703, -0.016498088836669922, -0.015321731567382812, -0.014145374298095703, -0.012969017028808594, -0.011792659759521484, -0.010616302490234375, -0.009439945220947266, -0.008263587951660156, -0.007087230682373047, -0.0059108734130859375, -0.004734516143798828, -0.0035581588745117188, -0.0023818016052246094, -0.0012054443359375, -2.9087066650390625e-05, 0.0011472702026367188, 0.002323627471923828, 0.0034999847412109375, 0.004676342010498047, 0.005852699279785156, 0.007029056549072266, 0.008205413818359375, 0.009381771087646484, 0.010558128356933594, 0.011734485626220703, 0.012910842895507812, 0.014087200164794922, 0.015263557434082031, 0.01643991470336914, 0.01761627197265625, 0.01879262924194336, 0.01996898651123047, 0.021145343780517578, 0.022321701049804688, 0.023498058319091797, 0.024674415588378906, 0.025850772857666016, 0.027027130126953125, 0.028203487396240234, 0.029379844665527344, 0.030556201934814453, 0.03173255920410156, 0.03290891647338867, 0.03408527374267578, 0.03526163101196289, 0.03643798828125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 6.0, 8.0, 18.0, 14.0, 17.0, 14.0, 34.0, 53.0, 107.0, 257.0, 2400.0, 1032287.0, 12558.0, 437.0, 117.0, 69.0, 30.0, 28.0, 15.0, 18.0, 12.0, 7.0, 7.0, 5.0, 6.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01131439208984375, -0.010919928550720215, -0.01052546501159668, -0.010131001472473145, -0.00973653793334961, -0.009342074394226074, -0.008947610855102539, -0.008553147315979004, -0.008158683776855469, -0.007764220237731934, -0.0073697566986083984, -0.006975293159484863, -0.006580829620361328, -0.006186366081237793, -0.005791902542114258, -0.005397439002990723, -0.0050029754638671875, -0.004608511924743652, -0.004214048385620117, -0.003819584846496582, -0.003425121307373047, -0.0030306577682495117, -0.0026361942291259766, -0.0022417306900024414, -0.0018472671508789062, -0.001452803611755371, -0.001058340072631836, -0.0006638765335083008, -0.0002694129943847656, 0.00012505054473876953, 0.0005195140838623047, 0.0009139776229858398, 0.001308441162109375, 0.0017029047012329102, 0.0020973682403564453, 0.0024918317794799805, 0.0028862953186035156, 0.0032807588577270508, 0.003675222396850586, 0.004069685935974121, 0.004464149475097656, 0.004858613014221191, 0.0052530765533447266, 0.005647540092468262, 0.006042003631591797, 0.006436467170715332, 0.006830930709838867, 0.007225394248962402, 0.0076198577880859375, 0.008014321327209473, 0.008408784866333008, 0.008803248405456543, 0.009197711944580078, 0.009592175483703613, 0.009986639022827148, 0.010381102561950684, 0.010775566101074219, 0.011170029640197754, 0.011564493179321289, 0.011958956718444824, 0.01235342025756836, 0.012747883796691895, 0.01314234733581543, 0.013536810874938965, 0.0139312744140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 4.0, 12.0, 3.0, 4.0, 19.0, 45.0, 490.0, 322.0, 37.0, 9.0, 15.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00037860870361328125, -0.00036710500717163086, -0.00035560131072998047, -0.0003440976142883301, -0.0003325939178466797, -0.0003210902214050293, -0.0003095865249633789, -0.0002980828285217285, -0.0002865791320800781, -0.00027507543563842773, -0.00026357173919677734, -0.00025206804275512695, -0.00024056434631347656, -0.00022906064987182617, -0.00021755695343017578, -0.0002060532569885254, -0.000194549560546875, -0.0001830458641052246, -0.00017154216766357422, -0.00016003847122192383, -0.00014853477478027344, -0.00013703107833862305, -0.00012552738189697266, -0.00011402368545532227, -0.00010251998901367188, -9.101629257202148e-05, -7.95125961303711e-05, -6.80088996887207e-05, -5.650520324707031e-05, -4.500150680541992e-05, -3.349781036376953e-05, -2.199411392211914e-05, -1.049041748046875e-05, 1.0132789611816406e-06, 1.2516975402832031e-05, 2.4020671844482422e-05, 3.552436828613281e-05, 4.70280647277832e-05, 5.8531761169433594e-05, 7.003545761108398e-05, 8.153915405273438e-05, 9.304285049438477e-05, 0.00010454654693603516, 0.00011605024337768555, 0.00012755393981933594, 0.00013905763626098633, 0.00015056133270263672, 0.0001620650291442871, 0.0001735687255859375, 0.0001850724220275879, 0.00019657611846923828, 0.00020807981491088867, 0.00021958351135253906, 0.00023108720779418945, 0.00024259090423583984, 0.00025409460067749023, 0.0002655982971191406, 0.000277101993560791, 0.0002886056900024414, 0.0003001093864440918, 0.0003116130828857422, 0.0003231167793273926, 0.00033462047576904297, 0.00034612417221069336, 0.00035762786865234375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 8.0, 9.0, 10.0, 9.0, 14.0, 25.0, 31.0, 64.0, 87.0, 217.0, 878.0, 12391.0, 1024568.0, 9044.0, 724.0, 216.0, 97.0, 52.0, 25.0, 16.0, 12.0, 12.0, 11.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.01509857177734375, -0.014684438705444336, -0.014270305633544922, -0.013856172561645508, -0.013442039489746094, -0.01302790641784668, -0.012613773345947266, -0.012199640274047852, -0.011785507202148438, -0.011371374130249023, -0.01095724105834961, -0.010543107986450195, -0.010128974914550781, -0.009714841842651367, -0.009300708770751953, -0.008886575698852539, -0.008472442626953125, -0.008058309555053711, -0.007644176483154297, -0.007230043411254883, -0.006815910339355469, -0.006401777267456055, -0.005987644195556641, -0.0055735111236572266, -0.0051593780517578125, -0.0047452449798583984, -0.004331111907958984, -0.00391697883605957, -0.0035028457641601562, -0.003088712692260742, -0.002674579620361328, -0.002260446548461914, -0.0018463134765625, -0.001432180404663086, -0.0010180473327636719, -0.0006039142608642578, -0.00018978118896484375, 0.0002243518829345703, 0.0006384849548339844, 0.0010526180267333984, 0.0014667510986328125, 0.0018808841705322266, 0.0022950172424316406, 0.0027091503143310547, 0.0031232833862304688, 0.003537416458129883, 0.003951549530029297, 0.004365682601928711, 0.004779815673828125, 0.005193948745727539, 0.005608081817626953, 0.006022214889526367, 0.006436347961425781, 0.006850481033325195, 0.007264614105224609, 0.0076787471771240234, 0.008092880249023438, 0.008507013320922852, 0.008921146392822266, 0.00933527946472168, 0.009749412536621094, 0.010163545608520508, 0.010577678680419922, 0.010991811752319336, 0.01140594482421875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 11.0, 3.0, 5.0, 11.0, 7.0, 16.0, 31.0, 41.0, 68.0, 201.0, 271.0, 135.0, 78.0, 32.0, 21.0, 14.0, 14.0, 7.0, 5.0, 2.0, 10.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00937652587890625, -0.009095072746276855, -0.008813619613647461, -0.008532166481018066, -0.008250713348388672, -0.007969260215759277, -0.007687807083129883, -0.007406353950500488, -0.007124900817871094, -0.006843447685241699, -0.006561994552612305, -0.00628054141998291, -0.005999088287353516, -0.005717635154724121, -0.0054361820220947266, -0.005154728889465332, -0.0048732757568359375, -0.004591822624206543, -0.0043103694915771484, -0.004028916358947754, -0.0037474632263183594, -0.003466010093688965, -0.0031845569610595703, -0.0029031038284301758, -0.0026216506958007812, -0.0023401975631713867, -0.002058744430541992, -0.0017772912979125977, -0.0014958381652832031, -0.0012143850326538086, -0.0009329319000244141, -0.0006514787673950195, -0.000370025634765625, -8.857250213623047e-05, 0.00019288063049316406, 0.0004743337631225586, 0.0007557868957519531, 0.0010372400283813477, 0.0013186931610107422, 0.0016001462936401367, 0.0018815994262695312, 0.0021630525588989258, 0.0024445056915283203, 0.002725958824157715, 0.0030074119567871094, 0.003288865089416504, 0.0035703182220458984, 0.003851771354675293, 0.0041332244873046875, 0.004414677619934082, 0.0046961307525634766, 0.004977583885192871, 0.005259037017822266, 0.00554049015045166, 0.005821943283081055, 0.006103396415710449, 0.006384849548339844, 0.006666302680969238, 0.006947755813598633, 0.007229208946228027, 0.007510662078857422, 0.007792115211486816, 0.008073568344116211, 0.008355021476745605, 0.008636474609375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 22.0, 176.0, 757.0, 49.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5261597037315369, -0.49573713541030884, -0.4653145372867584, -0.4348919689655304, -0.40446937084198, -0.37404680252075195, -0.3436242341995239, -0.3132016658782959, -0.2827790677547455, -0.25235649943351746, -0.22193390130996704, -0.191511332988739, -0.1610887497663498, -0.13066616654396057, -0.10024359822273254, -0.06982101500034332, -0.0393984317779541, -0.008975852280855179, 0.021446727216243744, 0.05186930298805237, 0.08229188621044159, 0.11271446943283081, 0.14313703775405884, 0.17355962097644806, 0.20398220419883728, 0.2344047874212265, 0.2648273706436157, 0.29524993896484375, 0.3256725072860718, 0.3560951054096222, 0.3865176737308502, 0.41694027185440063, 0.4473627805709839, 0.4777853488922119, 0.5082079172134399, 0.538630485534668, 0.5690531134605408, 0.5994756817817688, 0.6298982501029968, 0.6603208184242249, 0.6907434463500977, 0.7211660146713257, 0.7515885829925537, 0.7820111513137817, 0.8124337792396545, 0.8428563475608826, 0.8732789158821106, 0.9037014842033386, 0.9341240525245667, 0.9645466208457947, 0.9949691891670227, 1.0253918170928955, 1.0558143854141235, 1.0862369537353516, 1.1166595220565796, 1.1470820903778076, 1.1775046586990356, 1.2079272270202637, 1.2383497953414917, 1.2687723636627197, 1.2991949319839478, 1.3296175003051758, 1.3600401878356934, 1.3904627561569214, 1.4208853244781494]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 7.0, 3.0, 9.0, 4.0, 9.0, 18.0, 11.0, 10.0, 21.0, 21.0, 16.0, 25.0, 36.0, 38.0, 33.0, 40.0, 45.0, 48.0, 44.0, 54.0, 58.0, 44.0, 58.0, 37.0, 21.0, 35.0, 42.0, 25.0, 31.0, 27.0, 24.0, 22.0, 12.0, 14.0, 19.0, 10.0, 5.0, 4.0, 5.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1732161045074463, -0.16705545783042908, -0.16089482605457306, -0.15473417937755585, -0.14857354760169983, -0.14241290092468262, -0.1362522542476654, -0.1300916075706482, -0.12393097579479218, -0.11777033656835556, -0.11160969734191895, -0.10544905066490173, -0.09928841143846512, -0.0931277722120285, -0.08696712553501129, -0.08080648630857468, -0.07464584708213806, -0.06848520785570145, -0.06232456490397453, -0.05616392195224762, -0.050003282725811005, -0.04384264349937439, -0.037682000547647476, -0.03152135759592056, -0.025360718369483948, -0.019200077280402184, -0.01303943619132042, -0.006878795102238655, -0.0007181540131568909, 0.005442487075924873, 0.011603128165006638, 0.01776377111673355, 0.023924410343170166, 0.03008505143225193, 0.036245692521333694, 0.04240633547306061, 0.04856697469949722, 0.05472761392593384, 0.06088825687766075, 0.06704889982938766, 0.07320953905582428, 0.0793701782822609, 0.08553081750869751, 0.09169146418571472, 0.09785210341215134, 0.10401274263858795, 0.11017338931560516, 0.11633402854204178, 0.1224946677684784, 0.1286553144454956, 0.13481594622135162, 0.14097659289836884, 0.14713722467422485, 0.15329787135124207, 0.15945851802825928, 0.1656191647052765, 0.1717797964811325, 0.17794044315814972, 0.18410107493400574, 0.19026172161102295, 0.19642236828804016, 0.20258300006389618, 0.2087436467409134, 0.2149042785167694, 0.22106492519378662]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 4.0, 8.0, 11.0, 23.0, 36.0, 55.0, 51.0, 90.0, 167.0, 506.0, 1952.0, 4169092.0, 20328.0, 1239.0, 319.0, 140.0, 76.0, 41.0, 37.0, 26.0, 19.0, 12.0, 5.0, 9.0, 8.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005279541015625, -0.005102813243865967, -0.004926085472106934, -0.0047493577003479, -0.004572629928588867, -0.004395902156829834, -0.004219174385070801, -0.004042446613311768, -0.0038657188415527344, -0.003688991069793701, -0.003512263298034668, -0.0033355355262756348, -0.0031588077545166016, -0.0029820799827575684, -0.002805352210998535, -0.002628624439239502, -0.0024518966674804688, -0.0022751688957214355, -0.0020984411239624023, -0.0019217133522033691, -0.001744985580444336, -0.0015682578086853027, -0.0013915300369262695, -0.0012148022651672363, -0.0010380744934082031, -0.0008613467216491699, -0.0006846189498901367, -0.0005078911781311035, -0.0003311634063720703, -0.0001544356346130371, 2.2292137145996094e-05, 0.0001990199089050293, 0.0003757476806640625, 0.0005524754524230957, 0.0007292032241821289, 0.0009059309959411621, 0.0010826587677001953, 0.0012593865394592285, 0.0014361143112182617, 0.001612842082977295, 0.0017895698547363281, 0.0019662976264953613, 0.0021430253982543945, 0.0023197531700134277, 0.002496480941772461, 0.002673208713531494, 0.0028499364852905273, 0.0030266642570495605, 0.0032033920288085938, 0.003380119800567627, 0.00355684757232666, 0.0037335753440856934, 0.0039103031158447266, 0.00408703088760376, 0.004263758659362793, 0.004440486431121826, 0.004617214202880859, 0.004793941974639893, 0.004970669746398926, 0.005147397518157959, 0.005324125289916992, 0.005500853061676025, 0.005677580833435059, 0.005854308605194092, 0.006031036376953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 19.0, 14.0, 37.0, 27.0, 37.0, 51.0, 80.0, 75.0, 75.0, 99.0, 97.0, 82.0, 59.0, 71.0, 40.0, 32.0, 17.0, 24.0, 11.0, 11.0, 6.0, 11.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0186920166015625, -0.018103837966918945, -0.01751565933227539, -0.016927480697631836, -0.01633930206298828, -0.015751123428344727, -0.015162944793701172, -0.014574766159057617, -0.013986587524414062, -0.013398408889770508, -0.012810230255126953, -0.012222051620483398, -0.011633872985839844, -0.011045694351196289, -0.010457515716552734, -0.00986933708190918, -0.009281158447265625, -0.00869297981262207, -0.008104801177978516, -0.007516622543334961, -0.006928443908691406, -0.0063402652740478516, -0.005752086639404297, -0.005163908004760742, -0.0045757293701171875, -0.003987550735473633, -0.003399372100830078, -0.0028111934661865234, -0.0022230148315429688, -0.001634836196899414, -0.0010466575622558594, -0.0004584789276123047, 0.00012969970703125, 0.0007178783416748047, 0.0013060569763183594, 0.001894235610961914, 0.0024824142456054688, 0.0030705928802490234, 0.003658771514892578, 0.004246950149536133, 0.0048351287841796875, 0.005423307418823242, 0.006011486053466797, 0.0065996646881103516, 0.007187843322753906, 0.007776021957397461, 0.008364200592041016, 0.00895237922668457, 0.009540557861328125, 0.01012873649597168, 0.010716915130615234, 0.011305093765258789, 0.011893272399902344, 0.012481451034545898, 0.013069629669189453, 0.013657808303833008, 0.014245986938476562, 0.014834165573120117, 0.015422344207763672, 0.016010522842407227, 0.01659870147705078, 0.017186880111694336, 0.01777505874633789, 0.018363237380981445, 0.018951416015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 4.0, 5.0, 16.0, 17.0, 22.0, 19.0, 20.0, 19.0, 29.0, 25.0, 25.0, 36.0, 43.0, 49.0, 80.0, 179.0, 560.0, 3100.0, 4176375.0, 11904.0, 1013.0, 297.0, 112.0, 50.0, 33.0, 36.0, 22.0, 38.0, 24.0, 15.0, 14.0, 22.0, 18.0, 10.0, 15.0, 6.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.005706787109375, -0.005547046661376953, -0.005387306213378906, -0.005227565765380859, -0.0050678253173828125, -0.004908084869384766, -0.004748344421386719, -0.004588603973388672, -0.004428863525390625, -0.004269123077392578, -0.004109382629394531, -0.003949642181396484, -0.0037899017333984375, -0.0036301612854003906, -0.0034704208374023438, -0.003310680389404297, -0.00315093994140625, -0.002991199493408203, -0.0028314590454101562, -0.0026717185974121094, -0.0025119781494140625, -0.0023522377014160156, -0.0021924972534179688, -0.002032756805419922, -0.001873016357421875, -0.0017132759094238281, -0.0015535354614257812, -0.0013937950134277344, -0.0012340545654296875, -0.0010743141174316406, -0.0009145736694335938, -0.0007548332214355469, -0.0005950927734375, -0.0004353523254394531, -0.00027561187744140625, -0.00011587142944335938, 4.38690185546875e-05, 0.00020360946655273438, 0.00036334991455078125, 0.0005230903625488281, 0.000682830810546875, 0.0008425712585449219, 0.0010023117065429688, 0.0011620521545410156, 0.0013217926025390625, 0.0014815330505371094, 0.0016412734985351562, 0.0018010139465332031, 0.00196075439453125, 0.002120494842529297, 0.0022802352905273438, 0.0024399757385253906, 0.0025997161865234375, 0.0027594566345214844, 0.0029191970825195312, 0.003078937530517578, 0.003238677978515625, 0.003398418426513672, 0.0035581588745117188, 0.0037178993225097656, 0.0038776397705078125, 0.004037380218505859, 0.004197120666503906, 0.004356861114501953, 0.0045166015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 8.0, 20.0, 4015.0, 32.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005016326904296875, -0.004924491047859192, -0.004832655191421509, -0.004740819334983826, -0.004648983478546143, -0.0045571476221084595, -0.004465311765670776, -0.004373475909233093, -0.00428164005279541, -0.004189804196357727, -0.004097968339920044, -0.004006132483482361, -0.003914296627044678, -0.0038224607706069946, -0.0037306249141693115, -0.0036387890577316284, -0.0035469532012939453, -0.003455117344856262, -0.003363281488418579, -0.003271445631980896, -0.003179609775543213, -0.00308777391910553, -0.0029959380626678467, -0.0029041022062301636, -0.0028122663497924805, -0.0027204304933547974, -0.0026285946369171143, -0.002536758780479431, -0.002444922924041748, -0.002353087067604065, -0.002261251211166382, -0.0021694153547286987, -0.0020775794982910156, -0.0019857436418533325, -0.0018939077854156494, -0.0018020719289779663, -0.0017102360725402832, -0.0016184002161026, -0.001526564359664917, -0.0014347285032272339, -0.0013428926467895508, -0.0012510567903518677, -0.0011592209339141846, -0.0010673850774765015, -0.0009755492210388184, -0.0008837133646011353, -0.0007918775081634521, -0.000700041651725769, -0.0006082057952880859, -0.0005163699388504028, -0.0004245340824127197, -0.0003326982259750366, -0.00024086236953735352, -0.0001490265130996704, -5.7190656661987305e-05, 3.46451997756958e-05, 0.0001264810562133789, 0.000218316912651062, 0.0003101527690887451, 0.0004019886255264282, 0.0004938244819641113, 0.0005856603384017944, 0.0006774961948394775, 0.0007693320512771606, 0.0008611679077148438]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 10.0, 25.0, 52.0, 174.0, 507.0, 158.0, 51.0, 17.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006068538874387741, -0.005855209659785032, -0.0056418804451823235, -0.005428551230579615, -0.005215222015976906, -0.005001893267035484, -0.0047885640524327755, -0.004575234837830067, -0.004361905623227358, -0.004148576408624649, -0.00393524719402194, -0.003721918212249875, -0.0035085889976471663, -0.0032952597830444574, -0.0030819308012723923, -0.0028686015866696835, -0.0026552723720669746, -0.002441943157464266, -0.002228613942861557, -0.002015284961089492, -0.001801955746486783, -0.0015886265318840742, -0.0013752974336966872, -0.0011619683355093002, -0.0009486391209065914, -0.0007353099645115435, -0.0005219808081164956, -0.0003086516517214477, -9.53224953263998e-05, 0.00011800671927630901, 0.000331335817463696, 0.000544664915651083, 0.0007579936645925045, 0.0009713228209875524, 0.0011846519773826003, 0.0013979810755699873, 0.0016113102901726961, 0.001824639504775405, 0.00203796848654747, 0.002251297701150179, 0.0024646269157528877, 0.0026779561303555965, 0.0028912853449583054, 0.0031046143267303705, 0.0033179435413330793, 0.003531272755935788, 0.0037446017377078533, 0.003957930952310562, 0.004171260166913271, 0.00438458938151598, 0.004597918596118689, 0.004811247810721397, 0.005024576559662819, 0.005237906239926815, 0.0054512349888682365, 0.005664564203470945, 0.005877893418073654, 0.006091222632676363, 0.006304551847279072, 0.006517881061881781, 0.0067312102764844894, 0.006944539025425911, 0.00715786824002862, 0.007371197454631329, 0.007584526669234037]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 8.0, 4.0, 7.0, 10.0, 14.0, 29.0, 46.0, 62.0, 87.0, 85.0, 115.0, 129.0, 127.0, 89.0, 63.0, 36.0, 30.0, 22.0, 12.0, 9.0, 6.0, 6.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.009160101413726807, -0.008966248482465744, -0.008772395551204681, -0.008578542619943619, -0.008384689688682556, -0.008190836757421494, -0.007996983826160431, -0.007803130894899368, -0.007609277963638306, -0.007415425032377243, -0.00722157210111618, -0.007027719169855118, -0.006833866238594055, -0.0066400133073329926, -0.00644616037607193, -0.006252307444810867, -0.006058454513549805, -0.005864601582288742, -0.0056707486510276794, -0.005476895719766617, -0.005283042788505554, -0.005089189857244492, -0.004895336925983429, -0.004701483994722366, -0.004507631063461304, -0.004313778132200241, -0.0041199252009391785, -0.003926072269678116, -0.0037322193384170532, -0.0035383664071559906, -0.003344513475894928, -0.0031506605446338654, -0.0029568076133728027, -0.00276295468211174, -0.0025691017508506775, -0.002375248819589615, -0.0021813958883285522, -0.0019875429570674896, -0.001793690025806427, -0.0015998370945453644, -0.0014059841632843018, -0.0012121312320232391, -0.0010182783007621765, -0.0008244253695011139, -0.0006305724382400513, -0.00043671950697898865, -0.00024286657571792603, -4.90136444568634e-05, 0.00014483928680419922, 0.00033869221806526184, 0.0005325451493263245, 0.0007263980805873871, 0.0009202510118484497, 0.0011141039431095123, 0.001307956874370575, 0.0015018098056316376, 0.0016956627368927002, 0.0018895156681537628, 0.0020833685994148254, 0.002277221530675888, 0.0024710744619369507, 0.0026649273931980133, 0.002858780324459076, 0.0030526332557201385, 0.003246486186981201]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 8.0, 9.0, 8.0, 16.0, 18.0, 46.0, 55.0, 87.0, 150.0, 227.0, 474.0, 827.0, 1846.0, 4931.0, 16907.0, 100527.0, 781190.0, 114025.0, 18087.0, 5036.0, 2029.0, 907.0, 482.0, 248.0, 135.0, 74.0, 60.0, 40.0, 35.0, 16.0, 11.0, 4.0, 12.0, 10.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03863525390625, -0.03740978240966797, -0.03618431091308594, -0.034958839416503906, -0.033733367919921875, -0.032507896423339844, -0.03128242492675781, -0.03005695343017578, -0.02883148193359375, -0.02760601043701172, -0.026380538940429688, -0.025155067443847656, -0.023929595947265625, -0.022704124450683594, -0.021478652954101562, -0.02025318145751953, -0.0190277099609375, -0.01780223846435547, -0.016576766967773438, -0.015351295471191406, -0.014125823974609375, -0.012900352478027344, -0.011674880981445312, -0.010449409484863281, -0.00922393798828125, -0.007998466491699219, -0.0067729949951171875, -0.005547523498535156, -0.004322052001953125, -0.0030965805053710938, -0.0018711090087890625, -0.0006456375122070312, 0.000579833984375, 0.0018053054809570312, 0.0030307769775390625, 0.004256248474121094, 0.005481719970703125, 0.006707191467285156, 0.007932662963867188, 0.009158134460449219, 0.01038360595703125, 0.011609077453613281, 0.012834548950195312, 0.014060020446777344, 0.015285491943359375, 0.016510963439941406, 0.017736434936523438, 0.01896190643310547, 0.0201873779296875, 0.02141284942626953, 0.022638320922851562, 0.023863792419433594, 0.025089263916015625, 0.026314735412597656, 0.027540206909179688, 0.02876567840576172, 0.02999114990234375, 0.03121662139892578, 0.03244209289550781, 0.033667564392089844, 0.034893035888671875, 0.036118507385253906, 0.03734397888183594, 0.03856945037841797, 0.039794921875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 18.0, 17.0, 34.0, 32.0, 31.0, 56.0, 81.0, 69.0, 79.0, 96.0, 103.0, 78.0, 64.0, 64.0, 43.0, 31.0, 17.0, 25.0, 10.0, 11.0, 6.0, 10.0, 5.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0186920166015625, -0.018103837966918945, -0.01751565933227539, -0.016927480697631836, -0.01633930206298828, -0.015751123428344727, -0.015162944793701172, -0.014574766159057617, -0.013986587524414062, -0.013398408889770508, -0.012810230255126953, -0.012222051620483398, -0.011633872985839844, -0.011045694351196289, -0.010457515716552734, -0.00986933708190918, -0.009281158447265625, -0.00869297981262207, -0.008104801177978516, -0.007516622543334961, -0.006928443908691406, -0.0063402652740478516, -0.005752086639404297, -0.005163908004760742, -0.0045757293701171875, -0.003987550735473633, -0.003399372100830078, -0.0028111934661865234, -0.0022230148315429688, -0.001634836196899414, -0.0010466575622558594, -0.0004584789276123047, 0.00012969970703125, 0.0007178783416748047, 0.0013060569763183594, 0.001894235610961914, 0.0024824142456054688, 0.0030705928802490234, 0.003658771514892578, 0.004246950149536133, 0.0048351287841796875, 0.005423307418823242, 0.006011486053466797, 0.0065996646881103516, 0.007187843322753906, 0.007776021957397461, 0.008364200592041016, 0.00895237922668457, 0.009540557861328125, 0.01012873649597168, 0.010716915130615234, 0.011305093765258789, 0.011893272399902344, 0.012481451034545898, 0.013069629669189453, 0.013657808303833008, 0.014245986938476562, 0.014834165573120117, 0.015422344207763672, 0.016010522842407227, 0.01659870147705078, 0.017186880111694336, 0.01777505874633789, 0.018363237380981445, 0.018951416015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 10.0, 7.0, 13.0, 10.0, 10.0, 10.0, 20.0, 21.0, 26.0, 47.0, 73.0, 95.0, 163.0, 295.0, 550.0, 1361.0, 5705.0, 69024.0, 901414.0, 62072.0, 5017.0, 1241.0, 563.0, 285.0, 165.0, 72.0, 84.0, 43.0, 34.0, 22.0, 19.0, 11.0, 17.0, 9.0, 20.0, 12.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.051788330078125, -0.050328731536865234, -0.04886913299560547, -0.0474095344543457, -0.04594993591308594, -0.04449033737182617, -0.043030738830566406, -0.04157114028930664, -0.040111541748046875, -0.03865194320678711, -0.037192344665527344, -0.03573274612426758, -0.03427314758300781, -0.03281354904174805, -0.03135395050048828, -0.029894351959228516, -0.02843475341796875, -0.026975154876708984, -0.02551555633544922, -0.024055957794189453, -0.022596359252929688, -0.021136760711669922, -0.019677162170410156, -0.01821756362915039, -0.016757965087890625, -0.01529836654663086, -0.013838768005371094, -0.012379169464111328, -0.010919570922851562, -0.009459972381591797, -0.008000373840332031, -0.006540775299072266, -0.0050811767578125, -0.0036215782165527344, -0.0021619796752929688, -0.0007023811340332031, 0.0007572174072265625, 0.002216815948486328, 0.0036764144897460938, 0.005136013031005859, 0.006595611572265625, 0.00805521011352539, 0.009514808654785156, 0.010974407196044922, 0.012434005737304688, 0.013893604278564453, 0.015353202819824219, 0.016812801361083984, 0.01827239990234375, 0.019731998443603516, 0.02119159698486328, 0.022651195526123047, 0.024110794067382812, 0.025570392608642578, 0.027029991149902344, 0.02848958969116211, 0.029949188232421875, 0.03140878677368164, 0.032868385314941406, 0.03432798385620117, 0.03578758239746094, 0.0372471809387207, 0.03870677947998047, 0.040166378021240234, 0.0416259765625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 6.0, 11.0, 9.0, 12.0, 11.0, 22.0, 14.0, 14.0, 20.0, 21.0, 43.0, 31.0, 36.0, 35.0, 39.0, 53.0, 42.0, 56.0, 42.0, 52.0, 42.0, 48.0, 50.0, 43.0, 40.0, 40.0, 30.0, 14.0, 26.0, 20.0, 19.0, 16.0, 9.0, 8.0, 9.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04437255859375, -0.043074607849121094, -0.04177665710449219, -0.04047870635986328, -0.039180755615234375, -0.03788280487060547, -0.03658485412597656, -0.035286903381347656, -0.03398895263671875, -0.032691001892089844, -0.03139305114746094, -0.03009510040283203, -0.028797149658203125, -0.02749919891357422, -0.026201248168945312, -0.024903297424316406, -0.0236053466796875, -0.022307395935058594, -0.021009445190429688, -0.01971149444580078, -0.018413543701171875, -0.01711559295654297, -0.015817642211914062, -0.014519691467285156, -0.01322174072265625, -0.011923789978027344, -0.010625839233398438, -0.009327888488769531, -0.008029937744140625, -0.006731986999511719, -0.0054340362548828125, -0.004136085510253906, -0.002838134765625, -0.0015401840209960938, -0.0002422332763671875, 0.0010557174682617188, 0.002353668212890625, 0.0036516189575195312, 0.0049495697021484375, 0.006247520446777344, 0.00754547119140625, 0.008843421936035156, 0.010141372680664062, 0.011439323425292969, 0.012737274169921875, 0.014035224914550781, 0.015333175659179688, 0.016631126403808594, 0.0179290771484375, 0.019227027893066406, 0.020524978637695312, 0.02182292938232422, 0.023120880126953125, 0.02441883087158203, 0.025716781616210938, 0.027014732360839844, 0.02831268310546875, 0.029610633850097656, 0.030908584594726562, 0.03220653533935547, 0.033504486083984375, 0.03480243682861328, 0.03610038757324219, 0.037398338317871094, 0.0386962890625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 15.0, 13.0, 37.0, 56.0, 164.0, 1448.0, 1042664.0, 3697.0, 290.0, 88.0, 45.0, 12.0, 9.0, 1.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.024932861328125, -0.024397850036621094, -0.023862838745117188, -0.02332782745361328, -0.022792816162109375, -0.02225780487060547, -0.021722793579101562, -0.021187782287597656, -0.02065277099609375, -0.020117759704589844, -0.019582748413085938, -0.01904773712158203, -0.018512725830078125, -0.01797771453857422, -0.017442703247070312, -0.016907691955566406, -0.0163726806640625, -0.015837669372558594, -0.015302658081054688, -0.014767646789550781, -0.014232635498046875, -0.013697624206542969, -0.013162612915039062, -0.012627601623535156, -0.01209259033203125, -0.011557579040527344, -0.011022567749023438, -0.010487556457519531, -0.009952545166015625, -0.009417533874511719, -0.008882522583007812, -0.008347511291503906, -0.0078125, -0.007277488708496094, -0.0067424774169921875, -0.006207466125488281, -0.005672454833984375, -0.005137443542480469, -0.0046024322509765625, -0.004067420959472656, -0.00353240966796875, -0.0029973983764648438, -0.0024623870849609375, -0.0019273757934570312, -0.001392364501953125, -0.0008573532104492188, -0.0003223419189453125, 0.00021266937255859375, 0.0007476806640625, 0.0012826919555664062, 0.0018177032470703125, 0.0023527145385742188, 0.002887725830078125, 0.0034227371215820312, 0.0039577484130859375, 0.004492759704589844, 0.00502777099609375, 0.005562782287597656, 0.0060977935791015625, 0.006632804870605469, 0.007167816162109375, 0.007702827453613281, 0.008237838745117188, 0.008772850036621094, 0.009307861328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 11.0, 5.0, 12.0, 43.0, 61.0, 137.0, 408.0, 166.0, 67.0, 33.0, 27.0, 11.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003120899200439453, -0.00030553434044122696, -0.0002989787608385086, -0.00029242318123579025, -0.0002858676016330719, -0.00027931202203035355, -0.0002727564424276352, -0.00026620086282491684, -0.0002596452832221985, -0.00025308970361948013, -0.0002465341240167618, -0.00023997854441404343, -0.00023342296481132507, -0.00022686738520860672, -0.00022031180560588837, -0.00021375622600317, -0.00020720064640045166, -0.0002006450667977333, -0.00019408948719501495, -0.0001875339075922966, -0.00018097832798957825, -0.0001744227483868599, -0.00016786716878414154, -0.0001613115891814232, -0.00015475600957870483, -0.00014820042997598648, -0.00014164485037326813, -0.00013508927077054977, -0.00012853369116783142, -0.00012197811156511307, -0.00011542253196239471, -0.00010886695235967636, -0.00010231137275695801, -9.575579315423965e-05, -8.92002135515213e-05, -8.264463394880295e-05, -7.60890543460846e-05, -6.953347474336624e-05, -6.297789514064789e-05, -5.6422315537929535e-05, -4.986673593521118e-05, -4.331115633249283e-05, -3.6755576729774475e-05, -3.0199997127056122e-05, -2.364441752433777e-05, -1.7088837921619415e-05, -1.0533258318901062e-05, -3.977678716182709e-06, 2.5779008865356445e-06, 9.133480489253998e-06, 1.568906009197235e-05, 2.2244639694690704e-05, 2.8800219297409058e-05, 3.535579890012741e-05, 4.1911378502845764e-05, 4.846695810556412e-05, 5.502253770828247e-05, 6.157811731100082e-05, 6.813369691371918e-05, 7.468927651643753e-05, 8.124485611915588e-05, 8.780043572187424e-05, 9.435601532459259e-05, 0.00010091159492731094, 0.0001074671745300293]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 4.0, 10.0, 12.0, 41.0, 93.0, 228.0, 900.0, 18872.0, 1025167.0, 2572.0, 411.0, 141.0, 38.0, 27.0, 10.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0163116455078125, -0.015712976455688477, -0.015114307403564453, -0.01451563835144043, -0.013916969299316406, -0.013318300247192383, -0.01271963119506836, -0.012120962142944336, -0.011522293090820312, -0.010923624038696289, -0.010324954986572266, -0.009726285934448242, -0.009127616882324219, -0.008528947830200195, -0.007930278778076172, -0.0073316097259521484, -0.006732940673828125, -0.0061342716217041016, -0.005535602569580078, -0.004936933517456055, -0.004338264465332031, -0.003739595413208008, -0.0031409263610839844, -0.002542257308959961, -0.0019435882568359375, -0.001344919204711914, -0.0007462501525878906, -0.0001475811004638672, 0.00045108795166015625, 0.0010497570037841797, 0.0016484260559082031, 0.0022470951080322266, 0.00284576416015625, 0.0034444332122802734, 0.004043102264404297, 0.00464177131652832, 0.005240440368652344, 0.005839109420776367, 0.006437778472900391, 0.007036447525024414, 0.0076351165771484375, 0.008233785629272461, 0.008832454681396484, 0.009431123733520508, 0.010029792785644531, 0.010628461837768555, 0.011227130889892578, 0.011825799942016602, 0.012424468994140625, 0.013023138046264648, 0.013621807098388672, 0.014220476150512695, 0.014819145202636719, 0.015417814254760742, 0.016016483306884766, 0.01661515235900879, 0.017213821411132812, 0.017812490463256836, 0.01841115951538086, 0.019009828567504883, 0.019608497619628906, 0.02020716667175293, 0.020805835723876953, 0.021404504776000977, 0.022003173828125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 3.0, 16.0, 30.0, 71.0, 297.0, 399.0, 110.0, 34.0, 21.0, 9.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01983642578125, -0.019272327423095703, -0.018708229064941406, -0.01814413070678711, -0.017580032348632812, -0.017015933990478516, -0.01645183563232422, -0.015887737274169922, -0.015323638916015625, -0.014759540557861328, -0.014195442199707031, -0.013631343841552734, -0.013067245483398438, -0.01250314712524414, -0.011939048767089844, -0.011374950408935547, -0.01081085205078125, -0.010246753692626953, -0.009682655334472656, -0.00911855697631836, -0.008554458618164062, -0.007990360260009766, -0.007426261901855469, -0.006862163543701172, -0.006298065185546875, -0.005733966827392578, -0.005169868469238281, -0.004605770111083984, -0.0040416717529296875, -0.0034775733947753906, -0.0029134750366210938, -0.002349376678466797, -0.0017852783203125, -0.0012211799621582031, -0.0006570816040039062, -9.298324584960938e-05, 0.0004711151123046875, 0.0010352134704589844, 0.0015993118286132812, 0.002163410186767578, 0.002727508544921875, 0.003291606903076172, 0.0038557052612304688, 0.004419803619384766, 0.0049839019775390625, 0.005548000335693359, 0.006112098693847656, 0.006676197052001953, 0.00724029541015625, 0.007804393768310547, 0.008368492126464844, 0.00893259048461914, 0.009496688842773438, 0.010060787200927734, 0.010624885559082031, 0.011188983917236328, 0.011753082275390625, 0.012317180633544922, 0.012881278991699219, 0.013445377349853516, 0.014009475708007812, 0.01457357406616211, 0.015137672424316406, 0.015701770782470703, 0.016265869140625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 24.0, 234.0, 689.0, 55.0, 11.0, 2.0], "bins": [-1.5053203105926514, -1.4803191423416138, -1.4553178548812866, -1.430316686630249, -1.4053155183792114, -1.3803143501281738, -1.3553130626678467, -1.330311894416809, -1.3053107261657715, -1.2803095579147339, -1.2553082704544067, -1.2303071022033691, -1.2053059339523315, -1.180304765701294, -1.1553034782409668, -1.1303023099899292, -1.1053011417388916, -1.080299973487854, -1.0552986860275269, -1.0302975177764893, -1.0052963495254517, -0.9802951216697693, -0.9552939534187317, -0.9302927255630493, -0.9052914977073669, -0.8802902698516846, -0.855289101600647, -0.8302878737449646, -0.805286705493927, -0.7802854776382446, -0.755284309387207, -0.7302830815315247, -0.7052818536758423, -0.6802806258201599, -0.6552794575691223, -0.6302782297134399, -0.6052770614624023, -0.58027583360672, -0.5552746653556824, -0.5302734375, -0.5052722692489624, -0.4802710711956024, -0.45526987314224243, -0.43026867508888245, -0.40526747703552246, -0.3802662491798401, -0.3552650809288025, -0.3302638530731201, -0.3052626848220825, -0.28026148676872253, -0.25526028871536255, -0.23025909066200256, -0.20525789260864258, -0.1802566796541214, -0.1552554816007614, -0.13025428354740143, -0.10525307804346085, -0.08025187999010086, -0.05525067821145058, -0.030249476432800293, -0.005248278379440308, 0.019752927124500275, 0.04475412517786026, 0.06975532323122025, 0.09475652128458023]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 8.0, 5.0, 2.0, 3.0, 5.0, 12.0, 8.0, 7.0, 14.0, 9.0, 15.0, 19.0, 19.0, 23.0, 18.0, 27.0, 30.0, 24.0, 34.0, 46.0, 49.0, 33.0, 40.0, 44.0, 46.0, 60.0, 54.0, 33.0, 30.0, 34.0, 30.0, 35.0, 23.0, 28.0, 20.0, 23.0, 16.0, 12.0, 9.0, 14.0, 12.0, 11.0, 9.0, 5.0, 1.0, 3.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.14891719818115234, -0.14399610459804535, -0.13907501101493835, -0.13415393233299255, -0.12923283874988556, -0.12431174516677856, -0.11939065903425217, -0.11446957290172577, -0.10954847931861877, -0.10462738573551178, -0.09970629960298538, -0.09478521347045898, -0.08986411988735199, -0.084943026304245, -0.0800219401717186, -0.0751008540391922, -0.0701797604560852, -0.06525866687297821, -0.06033758074045181, -0.05541649088263512, -0.05049540102481842, -0.045574311167001724, -0.04065322130918503, -0.03573213145136833, -0.030811041593551636, -0.02588995173573494, -0.020968861877918243, -0.016047772020101547, -0.011126682162284851, -0.006205592304468155, -0.0012845024466514587, 0.0036365874111652374, 0.008557677268981934, 0.01347876712679863, 0.018399856984615326, 0.023320946842432022, 0.028242036700248718, 0.033163126558065414, 0.03808421641588211, 0.04300530627369881, 0.0479263961315155, 0.0528474859893322, 0.057768575847148895, 0.06268966197967529, 0.06761075556278229, 0.07253184914588928, 0.07745293527841568, 0.08237402141094208, 0.08729511499404907, 0.09221620857715607, 0.09713729470968246, 0.10205838084220886, 0.10697947442531586, 0.11190056800842285, 0.11682165414094925, 0.12174274027347565, 0.12666383385658264, 0.13158492743968964, 0.13650602102279663, 0.14142709970474243, 0.14634819328784943, 0.15126928687095642, 0.15619036555290222, 0.16111145913600922, 0.1660325527191162]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 11.0, 9.0, 16.0, 17.0, 22.0, 41.0, 50.0, 91.0, 126.0, 197.0, 327.0, 566.0, 1468.0, 3290.0, 13133.0, 150524.0, 3908791.0, 101624.0, 8815.0, 2633.0, 963.0, 526.0, 359.0, 192.0, 147.0, 102.0, 60.0, 38.0, 35.0, 25.0, 19.0, 14.0, 8.0, 10.0, 7.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.016357421875, -0.01578235626220703, -0.015207290649414062, -0.014632225036621094, -0.014057159423828125, -0.013482093811035156, -0.012907028198242188, -0.012331962585449219, -0.01175689697265625, -0.011181831359863281, -0.010606765747070312, -0.010031700134277344, -0.009456634521484375, -0.008881568908691406, -0.008306503295898438, -0.007731437683105469, -0.0071563720703125, -0.006581306457519531, -0.0060062408447265625, -0.005431175231933594, -0.004856109619140625, -0.004281044006347656, -0.0037059783935546875, -0.0031309127807617188, -0.00255584716796875, -0.0019807815551757812, -0.0014057159423828125, -0.0008306503295898438, -0.000255584716796875, 0.00031948089599609375, 0.0008945465087890625, 0.0014696121215820312, 0.002044677734375, 0.0026197433471679688, 0.0031948089599609375, 0.0037698745727539062, 0.004344940185546875, 0.004920005798339844, 0.0054950714111328125, 0.006070137023925781, 0.00664520263671875, 0.007220268249511719, 0.0077953338623046875, 0.008370399475097656, 0.008945465087890625, 0.009520530700683594, 0.010095596313476562, 0.010670661926269531, 0.0112457275390625, 0.011820793151855469, 0.012395858764648438, 0.012970924377441406, 0.013545989990234375, 0.014121055603027344, 0.014696121215820312, 0.015271186828613281, 0.01584625244140625, 0.01642131805419922, 0.016996383666992188, 0.017571449279785156, 0.018146514892578125, 0.018721580505371094, 0.019296646118164062, 0.01987171173095703, 0.02044677734375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 11.0, 18.0, 21.0, 26.0, 36.0, 50.0, 63.0, 79.0, 76.0, 88.0, 88.0, 93.0, 98.0, 72.0, 47.0, 26.0, 30.0, 10.0, 14.0, 17.0, 5.0, 4.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0179290771484375, -0.017354726791381836, -0.016780376434326172, -0.016206026077270508, -0.015631675720214844, -0.01505732536315918, -0.014482975006103516, -0.013908624649047852, -0.013334274291992188, -0.012759923934936523, -0.01218557357788086, -0.011611223220825195, -0.011036872863769531, -0.010462522506713867, -0.009888172149658203, -0.009313821792602539, -0.008739471435546875, -0.008165121078491211, -0.007590770721435547, -0.007016420364379883, -0.006442070007324219, -0.005867719650268555, -0.005293369293212891, -0.0047190189361572266, -0.0041446685791015625, -0.0035703182220458984, -0.0029959678649902344, -0.0024216175079345703, -0.0018472671508789062, -0.0012729167938232422, -0.0006985664367675781, -0.00012421607971191406, 0.00045013427734375, 0.001024484634399414, 0.0015988349914550781, 0.002173185348510742, 0.0027475357055664062, 0.0033218860626220703, 0.0038962364196777344, 0.0044705867767333984, 0.0050449371337890625, 0.0056192874908447266, 0.006193637847900391, 0.006767988204956055, 0.007342338562011719, 0.007916688919067383, 0.008491039276123047, 0.009065389633178711, 0.009639739990234375, 0.010214090347290039, 0.010788440704345703, 0.011362791061401367, 0.011937141418457031, 0.012511491775512695, 0.01308584213256836, 0.013660192489624023, 0.014234542846679688, 0.014808893203735352, 0.015383243560791016, 0.01595759391784668, 0.016531944274902344, 0.017106294631958008, 0.017680644989013672, 0.018254995346069336, 0.018829345703125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 4.0, 7.0, 3.0, 11.0, 3.0, 20.0, 47.0, 84.0, 264.0, 721.0, 2338.0, 9412.0, 3733183.0, 437195.0, 7689.0, 2080.0, 738.0, 261.0, 110.0, 45.0, 23.0, 10.0, 9.0, 7.0, 2.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.034698486328125, -0.0336761474609375, -0.03265380859375, -0.0316314697265625, -0.030609130859375, -0.0295867919921875, -0.028564453125, -0.0275421142578125, -0.026519775390625, -0.0254974365234375, -0.02447509765625, -0.0234527587890625, -0.022430419921875, -0.0214080810546875, -0.0203857421875, -0.0193634033203125, -0.018341064453125, -0.0173187255859375, -0.01629638671875, -0.0152740478515625, -0.014251708984375, -0.0132293701171875, -0.01220703125, -0.0111846923828125, -0.010162353515625, -0.0091400146484375, -0.00811767578125, -0.0070953369140625, -0.006072998046875, -0.0050506591796875, -0.0040283203125, -0.0030059814453125, -0.001983642578125, -0.0009613037109375, 6.103515625e-05, 0.0010833740234375, 0.002105712890625, 0.0031280517578125, 0.004150390625, 0.0051727294921875, 0.006195068359375, 0.0072174072265625, 0.00823974609375, 0.0092620849609375, 0.010284423828125, 0.0113067626953125, 0.0123291015625, 0.0133514404296875, 0.014373779296875, 0.0153961181640625, 0.01641845703125, 0.0174407958984375, 0.018463134765625, 0.0194854736328125, 0.0205078125, 0.0215301513671875, 0.022552490234375, 0.0235748291015625, 0.02459716796875, 0.0256195068359375, 0.026641845703125, 0.0276641845703125, 0.0286865234375, 0.0297088623046875, 0.030731201171875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 8.0, 1.0, 2.0, 7.0, 12.0, 14.0, 15.0, 49.0, 131.0, 504.0, 2313.0, 727.0, 175.0, 55.0, 20.0, 8.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.023162841796875, -0.022454261779785156, -0.021745681762695312, -0.02103710174560547, -0.020328521728515625, -0.01961994171142578, -0.018911361694335938, -0.018202781677246094, -0.01749420166015625, -0.016785621643066406, -0.016077041625976562, -0.015368461608886719, -0.014659881591796875, -0.013951301574707031, -0.013242721557617188, -0.012534141540527344, -0.0118255615234375, -0.011116981506347656, -0.010408401489257812, -0.009699821472167969, -0.008991241455078125, -0.008282661437988281, -0.0075740814208984375, -0.006865501403808594, -0.00615692138671875, -0.005448341369628906, -0.0047397613525390625, -0.004031181335449219, -0.003322601318359375, -0.0026140213012695312, -0.0019054412841796875, -0.0011968612670898438, -0.00048828125, 0.00022029876708984375, 0.0009288787841796875, 0.0016374588012695312, 0.002346038818359375, 0.0030546188354492188, 0.0037631988525390625, 0.004471778869628906, 0.00518035888671875, 0.005888938903808594, 0.0065975189208984375, 0.007306098937988281, 0.008014678955078125, 0.008723258972167969, 0.009431838989257812, 0.010140419006347656, 0.0108489990234375, 0.011557579040527344, 0.012266159057617188, 0.012974739074707031, 0.013683319091796875, 0.014391899108886719, 0.015100479125976562, 0.015809059143066406, 0.01651763916015625, 0.017226219177246094, 0.017934799194335938, 0.01864337921142578, 0.019351959228515625, 0.02006053924560547, 0.020769119262695312, 0.021477699279785156, 0.022186279296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 12.0, 15.0, 36.0, 81.0, 267.0, 386.0, 125.0, 35.0, 29.0, 12.0, 3.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.19926783442497253, -0.19537487626075745, -0.19148191809654236, -0.18758895993232727, -0.18369600176811218, -0.1798030436038971, -0.175910085439682, -0.17201711237430573, -0.16812415421009064, -0.16423119604587555, -0.16033823788166046, -0.15644527971744537, -0.15255232155323029, -0.148659348487854, -0.14476639032363892, -0.14087343215942383, -0.13698047399520874, -0.13308751583099365, -0.12919455766677856, -0.12530159950256348, -0.12140863388776779, -0.1175156757235527, -0.11362271755933762, -0.10972975939512253, -0.10583680868148804, -0.10194385051727295, -0.09805089235305786, -0.09415793418884277, -0.09026496857404709, -0.086372010409832, -0.08247905224561691, -0.07858609408140182, -0.07469313591718674, -0.07080017775297165, -0.06690721958875656, -0.06301425397396088, -0.05912129580974579, -0.0552283376455307, -0.05133537948131561, -0.047442421317100525, -0.04354945942759514, -0.03965650126338005, -0.035763539373874664, -0.031870581209659576, -0.02797762118279934, -0.024084661155939102, -0.020191702991724014, -0.016298742964863777, -0.01240578293800354, -0.008512822911143303, -0.00461986381560564, -0.0007269047200679779, 0.003166055306792259, 0.007059015333652496, 0.010951973497867584, 0.014844933524727821, 0.01873789355158806, 0.022630853578448296, 0.026523813605308533, 0.03041677176952362, 0.03430972993373871, 0.038202691823244095, 0.04209564998745918, 0.04598861187696457, 0.04988157004117966]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 3.0, 3.0, 8.0, 7.0, 7.0, 6.0, 20.0, 9.0, 20.0, 23.0, 30.0, 22.0, 33.0, 30.0, 46.0, 44.0, 35.0, 50.0, 45.0, 50.0, 47.0, 55.0, 48.0, 44.0, 39.0, 33.0, 33.0, 40.0, 31.0, 24.0, 18.0, 15.0, 16.0, 19.0, 9.0, 11.0, 8.0, 5.0, 7.0, 8.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05647921562194824, -0.054582379758358, -0.05268554389476776, -0.05078870430588722, -0.04889186844229698, -0.04699503257870674, -0.0450981929898262, -0.04320135712623596, -0.04130452126264572, -0.03940768539905548, -0.03751084953546524, -0.0356140099465847, -0.03371717408299446, -0.03182033821940422, -0.02992350049316883, -0.02802666276693344, -0.0261298269033432, -0.02423299103975296, -0.02233615331351757, -0.02043931558728218, -0.01854247972369194, -0.0166456438601017, -0.01474880613386631, -0.012851969338953495, -0.01095513254404068, -0.009058295749127865, -0.00716145895421505, -0.005264622159302235, -0.0033677853643894196, -0.0014709485694766045, 0.00042588822543621063, 0.0023227250203490257, 0.004219561815261841, 0.006116398610174656, 0.008013235405087471, 0.009910072200000286, 0.011806908994913101, 0.013703745789825916, 0.015600582584738731, 0.01749742031097412, 0.01939425617456436, 0.021291092038154602, 0.023187929764389992, 0.02508476749062538, 0.026981603354215622, 0.028878439217805862, 0.030775276944041252, 0.03267211467027664, 0.03456895053386688, 0.03646578639745712, 0.03836262226104736, 0.0402594618499279, 0.04215629771351814, 0.04405313357710838, 0.04594997316598892, 0.04784680902957916, 0.0497436448931694, 0.051640480756759644, 0.053537316620349884, 0.05543415620923042, 0.05733099207282066, 0.059227827936410904, 0.06112466752529144, 0.06302150338888168, 0.06491833925247192]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 12.0, 21.0, 12.0, 21.0, 38.0, 42.0, 71.0, 80.0, 116.0, 186.0, 273.0, 463.0, 650.0, 1095.0, 2041.0, 3776.0, 8095.0, 19869.0, 63256.0, 409999.0, 434710.0, 66680.0, 19895.0, 8092.0, 3808.0, 2104.0, 1080.0, 714.0, 434.0, 278.0, 195.0, 129.0, 81.0, 52.0, 59.0, 29.0, 25.0, 15.0, 13.0, 9.0, 10.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.0321044921875, -0.031131982803344727, -0.030159473419189453, -0.02918696403503418, -0.028214454650878906, -0.027241945266723633, -0.02626943588256836, -0.025296926498413086, -0.024324417114257812, -0.02335190773010254, -0.022379398345947266, -0.021406888961791992, -0.02043437957763672, -0.019461870193481445, -0.018489360809326172, -0.0175168514251709, -0.016544342041015625, -0.015571832656860352, -0.014599323272705078, -0.013626813888549805, -0.012654304504394531, -0.011681795120239258, -0.010709285736083984, -0.009736776351928711, -0.008764266967773438, -0.007791757583618164, -0.006819248199462891, -0.005846738815307617, -0.004874229431152344, -0.0039017200469970703, -0.002929210662841797, -0.0019567012786865234, -0.00098419189453125, -1.1682510375976562e-05, 0.0009608268737792969, 0.0019333362579345703, 0.0029058456420898438, 0.003878355026245117, 0.004850864410400391, 0.005823373794555664, 0.0067958831787109375, 0.007768392562866211, 0.008740901947021484, 0.009713411331176758, 0.010685920715332031, 0.011658430099487305, 0.012630939483642578, 0.013603448867797852, 0.014575958251953125, 0.015548467636108398, 0.016520977020263672, 0.017493486404418945, 0.01846599578857422, 0.019438505172729492, 0.020411014556884766, 0.02138352394104004, 0.022356033325195312, 0.023328542709350586, 0.02430105209350586, 0.025273561477661133, 0.026246070861816406, 0.02721858024597168, 0.028191089630126953, 0.029163599014282227, 0.0301361083984375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 17.0, 22.0, 21.0, 41.0, 41.0, 58.0, 82.0, 72.0, 77.0, 93.0, 97.0, 92.0, 77.0, 65.0, 32.0, 30.0, 7.0, 15.0, 10.0, 11.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0170745849609375, -0.016513586044311523, -0.015952587127685547, -0.01539158821105957, -0.014830589294433594, -0.014269590377807617, -0.01370859146118164, -0.013147592544555664, -0.012586593627929688, -0.012025594711303711, -0.011464595794677734, -0.010903596878051758, -0.010342597961425781, -0.009781599044799805, -0.009220600128173828, -0.008659601211547852, -0.008098602294921875, -0.0075376033782958984, -0.006976604461669922, -0.006415605545043945, -0.005854606628417969, -0.005293607711791992, -0.004732608795166016, -0.004171609878540039, -0.0036106109619140625, -0.003049612045288086, -0.0024886131286621094, -0.0019276142120361328, -0.0013666152954101562, -0.0008056163787841797, -0.0002446174621582031, 0.00031638145446777344, 0.00087738037109375, 0.0014383792877197266, 0.001999378204345703, 0.0025603771209716797, 0.0031213760375976562, 0.003682374954223633, 0.004243373870849609, 0.004804372787475586, 0.0053653717041015625, 0.005926370620727539, 0.006487369537353516, 0.007048368453979492, 0.007609367370605469, 0.008170366287231445, 0.008731365203857422, 0.009292364120483398, 0.009853363037109375, 0.010414361953735352, 0.010975360870361328, 0.011536359786987305, 0.012097358703613281, 0.012658357620239258, 0.013219356536865234, 0.013780355453491211, 0.014341354370117188, 0.014902353286743164, 0.01546335220336914, 0.016024351119995117, 0.016585350036621094, 0.01714634895324707, 0.017707347869873047, 0.018268346786499023, 0.018829345703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 10.0, 10.0, 13.0, 19.0, 20.0, 40.0, 43.0, 63.0, 80.0, 165.0, 298.0, 550.0, 1070.0, 2891.0, 12548.0, 142717.0, 827099.0, 50545.0, 6579.0, 1918.0, 811.0, 401.0, 237.0, 144.0, 95.0, 63.0, 39.0, 18.0, 12.0, 8.0, 7.0, 9.0, 6.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.051544189453125, -0.05016279220581055, -0.048781394958496094, -0.04739999771118164, -0.04601860046386719, -0.044637203216552734, -0.04325580596923828, -0.04187440872192383, -0.040493011474609375, -0.03911161422729492, -0.03773021697998047, -0.036348819732666016, -0.03496742248535156, -0.03358602523803711, -0.032204627990722656, -0.030823230743408203, -0.02944183349609375, -0.028060436248779297, -0.026679039001464844, -0.02529764175415039, -0.023916244506835938, -0.022534847259521484, -0.02115345001220703, -0.019772052764892578, -0.018390655517578125, -0.017009258270263672, -0.01562786102294922, -0.014246463775634766, -0.012865066528320312, -0.01148366928100586, -0.010102272033691406, -0.008720874786376953, -0.0073394775390625, -0.005958080291748047, -0.004576683044433594, -0.0031952857971191406, -0.0018138885498046875, -0.0004324913024902344, 0.0009489059448242188, 0.002330303192138672, 0.003711700439453125, 0.005093097686767578, 0.006474494934082031, 0.007855892181396484, 0.009237289428710938, 0.01061868667602539, 0.012000083923339844, 0.013381481170654297, 0.01476287841796875, 0.016144275665283203, 0.017525672912597656, 0.01890707015991211, 0.020288467407226562, 0.021669864654541016, 0.02305126190185547, 0.024432659149169922, 0.025814056396484375, 0.027195453643798828, 0.02857685089111328, 0.029958248138427734, 0.03133964538574219, 0.03272104263305664, 0.034102439880371094, 0.03548383712768555, 0.036865234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 4.0, 13.0, 14.0, 15.0, 20.0, 22.0, 26.0, 27.0, 27.0, 31.0, 31.0, 33.0, 23.0, 47.0, 49.0, 35.0, 49.0, 45.0, 48.0, 36.0, 51.0, 37.0, 36.0, 33.0, 37.0, 30.0, 29.0, 32.0, 12.0, 13.0, 15.0, 10.0, 15.0, 8.0, 6.0, 7.0, 4.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036865234375, -0.035726070404052734, -0.03458690643310547, -0.0334477424621582, -0.03230857849121094, -0.031169414520263672, -0.030030250549316406, -0.02889108657836914, -0.027751922607421875, -0.02661275863647461, -0.025473594665527344, -0.024334430694580078, -0.023195266723632812, -0.022056102752685547, -0.02091693878173828, -0.019777774810791016, -0.01863861083984375, -0.017499446868896484, -0.01636028289794922, -0.015221118927001953, -0.014081954956054688, -0.012942790985107422, -0.011803627014160156, -0.01066446304321289, -0.009525299072265625, -0.00838613510131836, -0.007246971130371094, -0.006107807159423828, -0.0049686431884765625, -0.003829479217529297, -0.0026903152465820312, -0.0015511512756347656, -0.0004119873046875, 0.0007271766662597656, 0.0018663406372070312, 0.003005504608154297, 0.0041446685791015625, 0.005283832550048828, 0.006422996520996094, 0.007562160491943359, 0.008701324462890625, 0.00984048843383789, 0.010979652404785156, 0.012118816375732422, 0.013257980346679688, 0.014397144317626953, 0.015536308288574219, 0.016675472259521484, 0.01781463623046875, 0.018953800201416016, 0.02009296417236328, 0.021232128143310547, 0.022371292114257812, 0.023510456085205078, 0.024649620056152344, 0.02578878402709961, 0.026927947998046875, 0.02806711196899414, 0.029206275939941406, 0.030345439910888672, 0.03148460388183594, 0.0326237678527832, 0.03376293182373047, 0.034902095794677734, 0.036041259765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 9.0, 22.0, 19.0, 57.0, 77.0, 190.0, 451.0, 1878.0, 61387.0, 976390.0, 6605.0, 894.0, 305.0, 125.0, 56.0, 43.0, 23.0, 9.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01141357421875, -0.011115193367004395, -0.010816812515258789, -0.010518431663513184, -0.010220050811767578, -0.009921669960021973, -0.009623289108276367, -0.009324908256530762, -0.009026527404785156, -0.00872814655303955, -0.008429765701293945, -0.00813138484954834, -0.007833003997802734, -0.007534623146057129, -0.0072362422943115234, -0.006937861442565918, -0.0066394805908203125, -0.006341099739074707, -0.0060427188873291016, -0.005744338035583496, -0.005445957183837891, -0.005147576332092285, -0.00484919548034668, -0.004550814628601074, -0.004252433776855469, -0.003954052925109863, -0.003655672073364258, -0.0033572912216186523, -0.003058910369873047, -0.0027605295181274414, -0.002462148666381836, -0.0021637678146362305, -0.001865386962890625, -0.0015670061111450195, -0.001268625259399414, -0.0009702444076538086, -0.0006718635559082031, -0.00037348270416259766, -7.510185241699219e-05, 0.00022327899932861328, 0.0005216598510742188, 0.0008200407028198242, 0.0011184215545654297, 0.0014168024063110352, 0.0017151832580566406, 0.002013564109802246, 0.0023119449615478516, 0.002610325813293457, 0.0029087066650390625, 0.003207087516784668, 0.0035054683685302734, 0.003803849220275879, 0.004102230072021484, 0.00440061092376709, 0.004698991775512695, 0.004997372627258301, 0.005295753479003906, 0.005594134330749512, 0.005892515182495117, 0.006190896034240723, 0.006489276885986328, 0.006787657737731934, 0.007086038589477539, 0.0073844194412231445, 0.00768280029296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 7.0, 5.0, 12.0, 21.0, 16.0, 38.0, 64.0, 61.0, 93.0, 141.0, 157.0, 116.0, 82.0, 51.0, 31.0, 32.0, 13.0, 11.0, 12.0, 13.0, 2.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011163949966430664, -0.0001084720715880394, -0.00010530464351177216, -0.00010213721543550491, -9.896978735923767e-05, -9.580235928297043e-05, -9.263493120670319e-05, -8.946750313043594e-05, -8.63000750541687e-05, -8.313264697790146e-05, -7.996521890163422e-05, -7.679779082536697e-05, -7.363036274909973e-05, -7.046293467283249e-05, -6.729550659656525e-05, -6.4128078520298e-05, -6.096065044403076e-05, -5.779322236776352e-05, -5.462579429149628e-05, -5.1458366215229034e-05, -4.829093813896179e-05, -4.512351006269455e-05, -4.195608198642731e-05, -3.8788653910160065e-05, -3.562122583389282e-05, -3.245379775762558e-05, -2.9286369681358337e-05, -2.6118941605091095e-05, -2.2951513528823853e-05, -1.978408545255661e-05, -1.6616657376289368e-05, -1.3449229300022125e-05, -1.0281801223754883e-05, -7.11437314748764e-06, -3.946945071220398e-06, -7.795169949531555e-07, 2.387911081314087e-06, 5.555339157581329e-06, 8.722767233848572e-06, 1.1890195310115814e-05, 1.5057623386383057e-05, 1.82250514626503e-05, 2.139247953891754e-05, 2.4559907615184784e-05, 2.7727335691452026e-05, 3.089476376771927e-05, 3.406219184398651e-05, 3.7229619920253754e-05, 4.0397047996520996e-05, 4.356447607278824e-05, 4.673190414905548e-05, 4.9899332225322723e-05, 5.3066760301589966e-05, 5.623418837785721e-05, 5.940161645412445e-05, 6.256904453039169e-05, 6.573647260665894e-05, 6.890390068292618e-05, 7.207132875919342e-05, 7.523875683546066e-05, 7.84061849117279e-05, 8.157361298799515e-05, 8.474104106426239e-05, 8.790846914052963e-05, 9.107589721679688e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 3.0, 10.0, 14.0, 18.0, 23.0, 34.0, 39.0, 73.0, 150.0, 361.0, 917.0, 4207.0, 105135.0, 920752.0, 14117.0, 1671.0, 555.0, 196.0, 115.0, 55.0, 37.0, 23.0, 18.0, 11.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007022857666015625, -0.006755173206329346, -0.006487488746643066, -0.006219804286956787, -0.005952119827270508, -0.0056844353675842285, -0.005416750907897949, -0.00514906644821167, -0.004881381988525391, -0.004613697528839111, -0.004346013069152832, -0.004078328609466553, -0.0038106441497802734, -0.003542959690093994, -0.003275275230407715, -0.0030075907707214355, -0.0027399063110351562, -0.002472221851348877, -0.0022045373916625977, -0.0019368529319763184, -0.001669168472290039, -0.0014014840126037598, -0.0011337995529174805, -0.0008661150932312012, -0.0005984306335449219, -0.0003307461738586426, -6.306171417236328e-05, 0.00020462274551391602, 0.0004723072052001953, 0.0007399916648864746, 0.001007676124572754, 0.0012753605842590332, 0.0015430450439453125, 0.0018107295036315918, 0.002078413963317871, 0.0023460984230041504, 0.0026137828826904297, 0.002881467342376709, 0.0031491518020629883, 0.0034168362617492676, 0.003684520721435547, 0.003952205181121826, 0.0042198896408081055, 0.004487574100494385, 0.004755258560180664, 0.005022943019866943, 0.005290627479553223, 0.005558311939239502, 0.005825996398925781, 0.0060936808586120605, 0.00636136531829834, 0.006629049777984619, 0.0068967342376708984, 0.007164418697357178, 0.007432103157043457, 0.007699787616729736, 0.007967472076416016, 0.008235156536102295, 0.008502840995788574, 0.008770525455474854, 0.009038209915161133, 0.009305894374847412, 0.009573578834533691, 0.00984126329421997, 0.01010894775390625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 4.0, 3.0, 6.0, 9.0, 15.0, 16.0, 21.0, 16.0, 24.0, 35.0, 37.0, 31.0, 58.0, 74.0, 82.0, 66.0, 93.0, 73.0, 58.0, 54.0, 39.0, 38.0, 25.0, 20.0, 12.0, 19.0, 14.0, 13.0, 16.0, 6.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042572021484375, -0.004114091396331787, -0.003970980644226074, -0.0038278698921203613, -0.0036847591400146484, -0.0035416483879089355, -0.0033985376358032227, -0.0032554268836975098, -0.003112316131591797, -0.002969205379486084, -0.002826094627380371, -0.002682983875274658, -0.0025398731231689453, -0.0023967623710632324, -0.0022536516189575195, -0.0021105408668518066, -0.0019674301147460938, -0.0018243193626403809, -0.001681208610534668, -0.001538097858428955, -0.0013949871063232422, -0.0012518763542175293, -0.0011087656021118164, -0.0009656548500061035, -0.0008225440979003906, -0.0006794333457946777, -0.0005363225936889648, -0.00039321184158325195, -0.00025010108947753906, -0.00010699033737182617, 3.612041473388672e-05, 0.0001792311668395996, 0.0003223419189453125, 0.0004654526710510254, 0.0006085634231567383, 0.0007516741752624512, 0.0008947849273681641, 0.001037895679473877, 0.0011810064315795898, 0.0013241171836853027, 0.0014672279357910156, 0.0016103386878967285, 0.0017534494400024414, 0.0018965601921081543, 0.002039670944213867, 0.00218278169631958, 0.002325892448425293, 0.002469003200531006, 0.0026121139526367188, 0.0027552247047424316, 0.0028983354568481445, 0.0030414462089538574, 0.0031845569610595703, 0.003327667713165283, 0.003470778465270996, 0.003613889217376709, 0.003756999969482422, 0.0039001107215881348, 0.004043221473693848, 0.0041863322257995605, 0.0043294429779052734, 0.004472553730010986, 0.004615664482116699, 0.004758775234222412, 0.004901885986328125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 8.0, 79.0, 800.0, 114.0, 13.0, 2.0, 1.0, 1.0], "bins": [-1.8321216106414795, -1.8008090257644653, -1.7694965600967407, -1.7381839752197266, -1.706871509552002, -1.6755589246749878, -1.6442463397979736, -1.612933874130249, -1.5816212892532349, -1.5503087043762207, -1.518996238708496, -1.487683653831482, -1.4563710689544678, -1.4250586032867432, -1.393746018409729, -1.3624335527420044, -1.3311209678649902, -1.299808382987976, -1.2684959173202515, -1.2371833324432373, -1.2058708667755127, -1.1745582818984985, -1.1432456970214844, -1.1119332313537598, -1.0806206464767456, -1.0493080615997314, -1.0179955959320068, -0.9866830110549927, -0.9553704857826233, -0.9240579605102539, -0.8927453756332397, -0.8614328503608704, -0.8301204442977905, -0.7988079190254211, -0.7674953937530518, -0.7361828088760376, -0.7048702836036682, -0.6735577583312988, -0.6422451734542847, -0.6109326481819153, -0.5796201229095459, -0.5483075976371765, -0.5169950723648071, -0.48568248748779297, -0.4543699622154236, -0.4230574369430542, -0.3917448818683624, -0.36043232679367065, -0.32911980152130127, -0.2978072762489319, -0.2664947211742401, -0.23518218100070953, -0.20386964082717896, -0.17255710065364838, -0.1412445604801178, -0.10993202030658722, -0.07861948013305664, -0.04730693995952606, -0.015994399785995483, 0.015318140387535095, 0.046630680561065674, 0.07794322073459625, 0.10925576090812683, 0.1405683010816574, 0.171880841255188]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 4.0, 8.0, 4.0, 6.0, 11.0, 13.0, 26.0, 16.0, 19.0, 19.0, 22.0, 25.0, 31.0, 25.0, 44.0, 51.0, 52.0, 57.0, 58.0, 58.0, 66.0, 41.0, 56.0, 38.0, 39.0, 28.0, 30.0, 31.0, 20.0, 18.0, 20.0, 9.0, 9.0, 9.0, 4.0, 5.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.16554975509643555, -0.16077828407287598, -0.1560068130493164, -0.15123534202575684, -0.14646387100219727, -0.1416924148797989, -0.13692094385623932, -0.13214947283267975, -0.12737800180912018, -0.12260653078556061, -0.11783505976200104, -0.11306359618902206, -0.1082921251654625, -0.10352065414190292, -0.09874919056892395, -0.09397771954536438, -0.08920624852180481, -0.08443477749824524, -0.07966330647468567, -0.0748918429017067, -0.07012037187814713, -0.06534890085458755, -0.06057743355631828, -0.05580596625804901, -0.05103449523448944, -0.04626302421092987, -0.0414915569126606, -0.03672008961439133, -0.03194861859083176, -0.027177149429917336, -0.022405680269002914, -0.017634212970733643, -0.012862741947174072, -0.008091272786259651, -0.00331980362534523, 0.001451665535569191, 0.006223134696483612, 0.010994603857398033, 0.015766073018312454, 0.020537540316581726, 0.025309011340141296, 0.030080480501055717, 0.03485194966197014, 0.03962341696023941, 0.04439488798379898, 0.04916635900735855, 0.05393782630562782, 0.058709293603897095, 0.06348076462745667, 0.06825223565101624, 0.0730237066745758, 0.07779517024755478, 0.08256664127111435, 0.08733811229467392, 0.0921095758676529, 0.09688104689121246, 0.10165251791477203, 0.1064239889383316, 0.11119545996189117, 0.11596692353487015, 0.12073839455842972, 0.1255098581314087, 0.13028132915496826, 0.13505280017852783, 0.1398242712020874]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 0.0, 5.0, 8.0, 20.0, 12.0, 24.0, 47.0, 65.0, 92.0, 141.0, 192.0, 337.0, 1062.0, 4190995.0, 511.0, 255.0, 160.0, 109.0, 67.0, 64.0, 32.0, 20.0, 18.0, 12.0, 5.0, 12.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.385986328125, -0.3694496154785156, -0.35291290283203125, -0.3363761901855469, -0.3198394775390625, -0.3033027648925781, -0.28676605224609375, -0.2702293395996094, -0.253692626953125, -0.23715591430664062, -0.22061920166015625, -0.20408248901367188, -0.1875457763671875, -0.17100906372070312, -0.15447235107421875, -0.13793563842773438, -0.12139892578125, -0.10486221313476562, -0.08832550048828125, -0.07178878784179688, -0.0552520751953125, -0.038715362548828125, -0.02217864990234375, -0.005641937255859375, 0.010894775390625, 0.027431488037109375, 0.04396820068359375, 0.060504913330078125, 0.0770416259765625, 0.09357833862304688, 0.11011505126953125, 0.12665176391601562, 0.1431884765625, 0.15972518920898438, 0.17626190185546875, 0.19279861450195312, 0.2093353271484375, 0.22587203979492188, 0.24240875244140625, 0.2589454650878906, 0.275482177734375, 0.2920188903808594, 0.30855560302734375, 0.3250923156738281, 0.3416290283203125, 0.3581657409667969, 0.37470245361328125, 0.3912391662597656, 0.40777587890625, 0.4243125915527344, 0.44084930419921875, 0.4573860168457031, 0.4739227294921875, 0.4904594421386719, 0.5069961547851562, 0.5235328674316406, 0.540069580078125, 0.5566062927246094, 0.5731430053710938, 0.5896797180175781, 0.6062164306640625, 0.6227531433105469, 0.6392898559570312, 0.6558265686035156, 0.67236328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 15.0, 14.0, 21.0, 27.0, 48.0, 48.0, 58.0, 71.0, 77.0, 86.0, 85.0, 104.0, 75.0, 65.0, 51.0, 43.0, 32.0, 13.0, 12.0, 13.0, 7.0, 4.0, 8.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0157318115234375, -0.01519465446472168, -0.01465749740600586, -0.014120340347290039, -0.013583183288574219, -0.013046026229858398, -0.012508869171142578, -0.011971712112426758, -0.011434555053710938, -0.010897397994995117, -0.010360240936279297, -0.009823083877563477, -0.009285926818847656, -0.008748769760131836, -0.008211612701416016, -0.007674455642700195, -0.007137298583984375, -0.006600141525268555, -0.006062984466552734, -0.005525827407836914, -0.004988670349121094, -0.0044515132904052734, -0.003914356231689453, -0.003377199172973633, -0.0028400421142578125, -0.002302885055541992, -0.0017657279968261719, -0.0012285709381103516, -0.0006914138793945312, -0.00015425682067871094, 0.0003829002380371094, 0.0009200572967529297, 0.00145721435546875, 0.0019943714141845703, 0.0025315284729003906, 0.003068685531616211, 0.0036058425903320312, 0.0041429996490478516, 0.004680156707763672, 0.005217313766479492, 0.0057544708251953125, 0.006291627883911133, 0.006828784942626953, 0.0073659420013427734, 0.007903099060058594, 0.008440256118774414, 0.008977413177490234, 0.009514570236206055, 0.010051727294921875, 0.010588884353637695, 0.011126041412353516, 0.011663198471069336, 0.012200355529785156, 0.012737512588500977, 0.013274669647216797, 0.013811826705932617, 0.014348983764648438, 0.014886140823364258, 0.015423297882080078, 0.0159604549407959, 0.01649761199951172, 0.01703476905822754, 0.01757192611694336, 0.01810908317565918, 0.018646240234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 6.0, 19.0, 10.0, 23.0, 36.0, 63.0, 136.0, 265.0, 394.0, 780.0, 1541.0, 2960.0, 6398.0, 17658.0, 187983.0, 3922658.0, 34808.0, 9878.0, 4337.0, 2066.0, 1053.0, 545.0, 299.0, 152.0, 68.0, 53.0, 25.0, 25.0, 11.0, 9.0, 8.0, 7.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014923095703125, -0.014354228973388672, -0.013785362243652344, -0.013216495513916016, -0.012647628784179688, -0.01207876205444336, -0.011509895324707031, -0.010941028594970703, -0.010372161865234375, -0.009803295135498047, -0.009234428405761719, -0.00866556167602539, -0.008096694946289062, -0.007527828216552734, -0.006958961486816406, -0.006390094757080078, -0.00582122802734375, -0.005252361297607422, -0.004683494567871094, -0.004114627838134766, -0.0035457611083984375, -0.0029768943786621094, -0.0024080276489257812, -0.0018391609191894531, -0.001270294189453125, -0.0007014274597167969, -0.00013256072998046875, 0.0004363059997558594, 0.0010051727294921875, 0.0015740394592285156, 0.0021429061889648438, 0.002711772918701172, 0.0032806396484375, 0.003849506378173828, 0.004418373107910156, 0.004987239837646484, 0.0055561065673828125, 0.006124973297119141, 0.006693840026855469, 0.007262706756591797, 0.007831573486328125, 0.008400440216064453, 0.008969306945800781, 0.00953817367553711, 0.010107040405273438, 0.010675907135009766, 0.011244773864746094, 0.011813640594482422, 0.01238250732421875, 0.012951374053955078, 0.013520240783691406, 0.014089107513427734, 0.014657974243164062, 0.01522684097290039, 0.01579570770263672, 0.016364574432373047, 0.016933441162109375, 0.017502307891845703, 0.01807117462158203, 0.01864004135131836, 0.019208908081054688, 0.019777774810791016, 0.020346641540527344, 0.020915508270263672, 0.021484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 5.0, 11.0, 12.0, 15.0, 25.0, 107.0, 416.0, 2505.0, 723.0, 106.0, 36.0, 27.0, 14.0, 7.0, 4.0, 7.0, 7.0, 2.0, 4.0, 2.0, 5.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01880502700805664, -0.01824665069580078, -0.017688274383544922, -0.017129898071289062, -0.016571521759033203, -0.016013145446777344, -0.015454769134521484, -0.014896392822265625, -0.014338016510009766, -0.013779640197753906, -0.013221263885498047, -0.012662887573242188, -0.012104511260986328, -0.011546134948730469, -0.01098775863647461, -0.01042938232421875, -0.00987100601196289, -0.009312629699707031, -0.008754253387451172, -0.008195877075195312, -0.007637500762939453, -0.007079124450683594, -0.006520748138427734, -0.005962371826171875, -0.005403995513916016, -0.004845619201660156, -0.004287242889404297, -0.0037288665771484375, -0.003170490264892578, -0.0026121139526367188, -0.0020537376403808594, -0.001495361328125, -0.0009369850158691406, -0.00037860870361328125, 0.00017976760864257812, 0.0007381439208984375, 0.0012965202331542969, 0.0018548965454101562, 0.0024132728576660156, 0.002971649169921875, 0.0035300254821777344, 0.004088401794433594, 0.004646778106689453, 0.0052051544189453125, 0.005763530731201172, 0.006321907043457031, 0.006880283355712891, 0.00743865966796875, 0.00799703598022461, 0.008555412292480469, 0.009113788604736328, 0.009672164916992188, 0.010230541229248047, 0.010788917541503906, 0.011347293853759766, 0.011905670166015625, 0.012464046478271484, 0.013022422790527344, 0.013580799102783203, 0.014139175415039062, 0.014697551727294922, 0.015255928039550781, 0.01581430435180664, 0.0163726806640625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 6.0, 12.0, 21.0, 41.0, 63.0, 144.0, 277.0, 206.0, 112.0, 41.0, 32.0, 17.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11407141387462616, -0.11077532172203064, -0.10747922211885452, -0.104183129966259, -0.10088703036308289, -0.09759093821048737, -0.09429483860731125, -0.09099874645471573, -0.08770264685153961, -0.08440655469894409, -0.08111045509576797, -0.07781436294317245, -0.07451826333999634, -0.07122217118740082, -0.0679260715842247, -0.06462997943162918, -0.06133388355374336, -0.058037787675857544, -0.054741691797971725, -0.05144559592008591, -0.04814950004220009, -0.04485340416431427, -0.04155731201171875, -0.03826121240854263, -0.03496512025594711, -0.031669024378061295, -0.028372928500175476, -0.025076832622289658, -0.02178073674440384, -0.01848464272916317, -0.015188546851277351, -0.011892450973391533, -0.008596353232860565, -0.005300257354974747, -0.0020041619427502155, 0.0012919334694743156, 0.004588029347360134, 0.007884124293923378, 0.011180220171809196, 0.014476316049695015, 0.017772411927580833, 0.021068507805466652, 0.02436460368335247, 0.02766069769859314, 0.030956793576478958, 0.03425288945436478, 0.037548985332250595, 0.040845081210136414, 0.04414117708802223, 0.04743727296590805, 0.05073336884379387, 0.05402946472167969, 0.057325560599565506, 0.060621656477451324, 0.06391774863004684, 0.06721384823322296, 0.07050994038581848, 0.073806032538414, 0.07710213214159012, 0.08039822429418564, 0.08369432389736176, 0.08699041604995728, 0.09028651565313339, 0.09358260780572891, 0.09687870740890503]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 1.0, 14.0, 7.0, 7.0, 15.0, 13.0, 16.0, 15.0, 26.0, 16.0, 28.0, 22.0, 23.0, 33.0, 38.0, 43.0, 52.0, 47.0, 59.0, 46.0, 44.0, 54.0, 52.0, 34.0, 35.0, 37.0, 32.0, 28.0, 21.0, 29.0, 18.0, 18.0, 10.0, 13.0, 8.0, 8.0, 7.0, 3.0, 6.0, 0.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.05529212951660156, -0.053685516119003296, -0.05207889899611473, -0.050472281873226166, -0.0488656684756279, -0.04725905507802963, -0.04565243795514107, -0.0440458208322525, -0.042439207434654236, -0.04083259403705597, -0.039225976914167404, -0.03761935979127884, -0.03601274639368057, -0.034406132996082306, -0.03279951587319374, -0.031192900612950325, -0.02958628535270691, -0.027979670092463493, -0.026373054832220078, -0.02476643957197666, -0.023159824311733246, -0.02155320905148983, -0.019946593791246414, -0.018339978531003, -0.016733363270759583, -0.015126748010516167, -0.01352013275027275, -0.011913517490029335, -0.01030690222978592, -0.008700286969542503, -0.0070936717092990875, -0.005487056449055672, -0.003880441188812256, -0.00227382592856884, -0.0006672106683254242, 0.0009394045919179916, 0.0025460198521614075, 0.004152635112404823, 0.005759250372648239, 0.007365865632891655, 0.00897248089313507, 0.010579096153378487, 0.012185711413621902, 0.013792326673865318, 0.015398941934108734, 0.01700555719435215, 0.018612172454595566, 0.02021878771483898, 0.021825402975082397, 0.023432018235325813, 0.02503863349556923, 0.026645248755812645, 0.02825186401605606, 0.029858479276299477, 0.03146509453654289, 0.03307171165943146, 0.034678325057029724, 0.03628493845462799, 0.037891555577516556, 0.03949817270040512, 0.04110478609800339, 0.042711399495601654, 0.04431801661849022, 0.045924633741378784, 0.04753124713897705]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 10.0, 20.0, 47.0, 70.0, 109.0, 214.0, 410.0, 953.0, 2534.0, 9247.0, 56105.0, 780967.0, 173063.0, 17777.0, 4329.0, 1433.0, 637.0, 273.0, 141.0, 81.0, 44.0, 23.0, 21.0, 17.0, 7.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043212890625, -0.04165363311767578, -0.04009437561035156, -0.038535118103027344, -0.036975860595703125, -0.035416603088378906, -0.03385734558105469, -0.03229808807373047, -0.03073883056640625, -0.02917957305908203, -0.027620315551757812, -0.026061058044433594, -0.024501800537109375, -0.022942543029785156, -0.021383285522460938, -0.01982402801513672, -0.0182647705078125, -0.01670551300048828, -0.015146255493164062, -0.013586997985839844, -0.012027740478515625, -0.010468482971191406, -0.008909225463867188, -0.007349967956542969, -0.00579071044921875, -0.004231452941894531, -0.0026721954345703125, -0.0011129379272460938, 0.000446319580078125, 0.0020055770874023438, 0.0035648345947265625, 0.005124092102050781, 0.006683349609375, 0.008242607116699219, 0.009801864624023438, 0.011361122131347656, 0.012920379638671875, 0.014479637145996094, 0.016038894653320312, 0.01759815216064453, 0.01915740966796875, 0.02071666717529297, 0.022275924682617188, 0.023835182189941406, 0.025394439697265625, 0.026953697204589844, 0.028512954711914062, 0.03007221221923828, 0.0316314697265625, 0.03319072723388672, 0.03474998474121094, 0.036309242248535156, 0.037868499755859375, 0.039427757263183594, 0.04098701477050781, 0.04254627227783203, 0.04410552978515625, 0.04566478729248047, 0.04722404479980469, 0.048783302307128906, 0.050342559814453125, 0.051901817321777344, 0.05346107482910156, 0.05502033233642578, 0.05657958984375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 0.0, 3.0, 11.0, 13.0, 20.0, 24.0, 33.0, 53.0, 62.0, 72.0, 67.0, 85.0, 91.0, 99.0, 89.0, 65.0, 67.0, 38.0, 26.0, 17.0, 20.0, 15.0, 2.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0152587890625, -0.014724016189575195, -0.01418924331665039, -0.013654470443725586, -0.013119697570800781, -0.012584924697875977, -0.012050151824951172, -0.011515378952026367, -0.010980606079101562, -0.010445833206176758, -0.009911060333251953, -0.009376287460327148, -0.008841514587402344, -0.008306741714477539, -0.007771968841552734, -0.00723719596862793, -0.006702423095703125, -0.00616765022277832, -0.005632877349853516, -0.005098104476928711, -0.004563331604003906, -0.0040285587310791016, -0.003493785858154297, -0.002959012985229492, -0.0024242401123046875, -0.0018894672393798828, -0.0013546943664550781, -0.0008199214935302734, -0.00028514862060546875, 0.00024962425231933594, 0.0007843971252441406, 0.0013191699981689453, 0.00185394287109375, 0.0023887157440185547, 0.0029234886169433594, 0.003458261489868164, 0.003993034362792969, 0.0045278072357177734, 0.005062580108642578, 0.005597352981567383, 0.0061321258544921875, 0.006666898727416992, 0.007201671600341797, 0.0077364444732666016, 0.008271217346191406, 0.008805990219116211, 0.009340763092041016, 0.00987553596496582, 0.010410308837890625, 0.01094508171081543, 0.011479854583740234, 0.012014627456665039, 0.012549400329589844, 0.013084173202514648, 0.013618946075439453, 0.014153718948364258, 0.014688491821289062, 0.015223264694213867, 0.015758037567138672, 0.016292810440063477, 0.01682758331298828, 0.017362356185913086, 0.01789712905883789, 0.018431901931762695, 0.0189666748046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 13.0, 21.0, 20.0, 40.0, 37.0, 87.0, 105.0, 141.0, 248.0, 431.0, 855.0, 1834.0, 4517.0, 12538.0, 38032.0, 152969.0, 632465.0, 146951.0, 36880.0, 12032.0, 4504.0, 1810.0, 855.0, 409.0, 251.0, 166.0, 90.0, 66.0, 42.0, 30.0, 23.0, 18.0, 16.0, 8.0, 10.0, 6.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0213623046875, -0.02070474624633789, -0.02004718780517578, -0.019389629364013672, -0.018732070922851562, -0.018074512481689453, -0.017416954040527344, -0.016759395599365234, -0.016101837158203125, -0.015444278717041016, -0.014786720275878906, -0.014129161834716797, -0.013471603393554688, -0.012814044952392578, -0.012156486511230469, -0.01149892807006836, -0.01084136962890625, -0.01018381118774414, -0.009526252746582031, -0.008868694305419922, -0.008211135864257812, -0.007553577423095703, -0.006896018981933594, -0.006238460540771484, -0.005580902099609375, -0.004923343658447266, -0.004265785217285156, -0.003608226776123047, -0.0029506683349609375, -0.002293109893798828, -0.0016355514526367188, -0.0009779930114746094, -0.0003204345703125, 0.0003371238708496094, 0.0009946823120117188, 0.0016522407531738281, 0.0023097991943359375, 0.002967357635498047, 0.0036249160766601562, 0.004282474517822266, 0.004940032958984375, 0.005597591400146484, 0.006255149841308594, 0.006912708282470703, 0.0075702667236328125, 0.008227825164794922, 0.008885383605957031, 0.00954294204711914, 0.01020050048828125, 0.01085805892944336, 0.011515617370605469, 0.012173175811767578, 0.012830734252929688, 0.013488292694091797, 0.014145851135253906, 0.014803409576416016, 0.015460968017578125, 0.016118526458740234, 0.016776084899902344, 0.017433643341064453, 0.018091201782226562, 0.018748760223388672, 0.01940631866455078, 0.02006387710571289, 0.020721435546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 4.0, 6.0, 7.0, 8.0, 7.0, 17.0, 7.0, 16.0, 20.0, 15.0, 16.0, 22.0, 25.0, 24.0, 38.0, 31.0, 42.0, 43.0, 39.0, 39.0, 38.0, 52.0, 35.0, 49.0, 36.0, 35.0, 34.0, 38.0, 37.0, 23.0, 34.0, 20.0, 29.0, 18.0, 14.0, 23.0, 7.0, 7.0, 10.0, 9.0, 6.0, 8.0, 1.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0278778076171875, -0.026966571807861328, -0.026055335998535156, -0.025144100189208984, -0.024232864379882812, -0.02332162857055664, -0.02241039276123047, -0.021499156951904297, -0.020587921142578125, -0.019676685333251953, -0.01876544952392578, -0.01785421371459961, -0.016942977905273438, -0.016031742095947266, -0.015120506286621094, -0.014209270477294922, -0.01329803466796875, -0.012386798858642578, -0.011475563049316406, -0.010564327239990234, -0.009653091430664062, -0.00874185562133789, -0.007830619812011719, -0.006919384002685547, -0.006008148193359375, -0.005096912384033203, -0.004185676574707031, -0.0032744407653808594, -0.0023632049560546875, -0.0014519691467285156, -0.0005407333374023438, 0.0003705024719238281, 0.00128173828125, 0.002192974090576172, 0.0031042098999023438, 0.004015445709228516, 0.0049266815185546875, 0.005837917327880859, 0.006749153137207031, 0.007660388946533203, 0.008571624755859375, 0.009482860565185547, 0.010394096374511719, 0.01130533218383789, 0.012216567993164062, 0.013127803802490234, 0.014039039611816406, 0.014950275421142578, 0.01586151123046875, 0.016772747039794922, 0.017683982849121094, 0.018595218658447266, 0.019506454467773438, 0.02041769027709961, 0.02132892608642578, 0.022240161895751953, 0.023151397705078125, 0.024062633514404297, 0.02497386932373047, 0.02588510513305664, 0.026796340942382812, 0.027707576751708984, 0.028618812561035156, 0.029530048370361328, 0.0304412841796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 8.0, 20.0, 25.0, 49.0, 91.0, 210.0, 546.0, 2527.0, 987552.0, 54659.0, 2014.0, 479.0, 177.0, 80.0, 44.0, 25.0, 11.0, 13.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140869140625, -0.13659286499023438, -0.13231658935546875, -0.12804031372070312, -0.1237640380859375, -0.11948776245117188, -0.11521148681640625, -0.11093521118164062, -0.106658935546875, -0.10238265991210938, -0.09810638427734375, -0.09383010864257812, -0.0895538330078125, -0.08527755737304688, -0.08100128173828125, -0.07672500610351562, -0.07244873046875, -0.06817245483398438, -0.06389617919921875, -0.059619903564453125, -0.0553436279296875, -0.051067352294921875, -0.04679107666015625, -0.042514801025390625, -0.038238525390625, -0.033962249755859375, -0.02968597412109375, -0.025409698486328125, -0.0211334228515625, -0.016857147216796875, -0.01258087158203125, -0.008304595947265625, -0.0040283203125, 0.000247955322265625, 0.00452423095703125, 0.008800506591796875, 0.0130767822265625, 0.017353057861328125, 0.02162933349609375, 0.025905609130859375, 0.030181884765625, 0.034458160400390625, 0.03873443603515625, 0.043010711669921875, 0.0472869873046875, 0.051563262939453125, 0.05583953857421875, 0.060115814208984375, 0.06439208984375, 0.06866836547851562, 0.07294464111328125, 0.07722091674804688, 0.0814971923828125, 0.08577346801757812, 0.09004974365234375, 0.09432601928710938, 0.098602294921875, 0.10287857055664062, 0.10715484619140625, 0.11143112182617188, 0.1157073974609375, 0.11998367309570312, 0.12425994873046875, 0.12853622436523438, 0.1328125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 11.0, 6.0, 9.0, 13.0, 10.0, 12.0, 13.0, 19.0, 21.0, 37.0, 33.0, 72.0, 85.0, 107.0, 77.0, 99.0, 70.0, 58.0, 61.0, 26.0, 25.0, 26.0, 21.0, 11.0, 16.0, 2.0, 9.0, 9.0, 4.0, 4.0, 2.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.933906555175781e-05, -3.795977681875229e-05, -3.6580488085746765e-05, -3.520119935274124e-05, -3.382191061973572e-05, -3.2442621886730194e-05, -3.106333315372467e-05, -2.9684044420719147e-05, -2.8304755687713623e-05, -2.69254669547081e-05, -2.5546178221702576e-05, -2.4166889488697052e-05, -2.278760075569153e-05, -2.1408312022686005e-05, -2.002902328968048e-05, -1.8649734556674957e-05, -1.7270445823669434e-05, -1.589115709066391e-05, -1.4511868357658386e-05, -1.3132579624652863e-05, -1.1753290891647339e-05, -1.0374002158641815e-05, -8.994713425636292e-06, -7.615424692630768e-06, -6.236135959625244e-06, -4.8568472266197205e-06, -3.4775584936141968e-06, -2.098269760608673e-06, -7.189810276031494e-07, 6.603077054023743e-07, 2.039596438407898e-06, 3.4188851714134216e-06, 4.798173904418945e-06, 6.177462637424469e-06, 7.556751370429993e-06, 8.936040103435516e-06, 1.031532883644104e-05, 1.1694617569446564e-05, 1.3073906302452087e-05, 1.4453195035457611e-05, 1.5832483768463135e-05, 1.721177250146866e-05, 1.8591061234474182e-05, 1.9970349967479706e-05, 2.134963870048523e-05, 2.2728927433490753e-05, 2.4108216166496277e-05, 2.54875048995018e-05, 2.6866793632507324e-05, 2.8246082365512848e-05, 2.962537109851837e-05, 3.1004659831523895e-05, 3.238394856452942e-05, 3.376323729753494e-05, 3.5142526030540466e-05, 3.652181476354599e-05, 3.7901103496551514e-05, 3.928039222955704e-05, 4.065968096256256e-05, 4.2038969695568085e-05, 4.341825842857361e-05, 4.479754716157913e-05, 4.6176835894584656e-05, 4.755612462759018e-05, 4.89354133605957e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 13.0, 14.0, 18.0, 31.0, 64.0, 171.0, 596.0, 3587.0, 1026843.0, 15478.0, 1267.0, 266.0, 88.0, 54.0, 27.0, 11.0, 12.0, 7.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12078857421875, -0.11750125885009766, -0.11421394348144531, -0.11092662811279297, -0.10763931274414062, -0.10435199737548828, -0.10106468200683594, -0.0977773666381836, -0.09449005126953125, -0.0912027359008789, -0.08791542053222656, -0.08462810516357422, -0.08134078979492188, -0.07805347442626953, -0.07476615905761719, -0.07147884368896484, -0.0681915283203125, -0.06490421295166016, -0.06161689758300781, -0.05832958221435547, -0.055042266845703125, -0.05175495147705078, -0.04846763610839844, -0.045180320739746094, -0.04189300537109375, -0.038605690002441406, -0.03531837463378906, -0.03203105926513672, -0.028743743896484375, -0.02545642852783203, -0.022169113159179688, -0.018881797790527344, -0.015594482421875, -0.012307167053222656, -0.009019851684570312, -0.005732536315917969, -0.002445220947265625, 0.0008420944213867188, 0.0041294097900390625, 0.007416725158691406, 0.01070404052734375, 0.013991355895996094, 0.017278671264648438, 0.02056598663330078, 0.023853302001953125, 0.02714061737060547, 0.030427932739257812, 0.033715248107910156, 0.0370025634765625, 0.040289878845214844, 0.04357719421386719, 0.04686450958251953, 0.050151824951171875, 0.05343914031982422, 0.05672645568847656, 0.060013771057128906, 0.06330108642578125, 0.0665884017944336, 0.06987571716308594, 0.07316303253173828, 0.07645034790039062, 0.07973766326904297, 0.08302497863769531, 0.08631229400634766, 0.089599609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 7.0, 30.0, 120.0, 579.0, 190.0, 25.0, 10.0, 7.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033477783203125, -0.03192472457885742, -0.030371665954589844, -0.028818607330322266, -0.027265548706054688, -0.02571249008178711, -0.02415943145751953, -0.022606372833251953, -0.021053314208984375, -0.019500255584716797, -0.01794719696044922, -0.01639413833618164, -0.014841079711914062, -0.013288021087646484, -0.011734962463378906, -0.010181903839111328, -0.00862884521484375, -0.007075786590576172, -0.005522727966308594, -0.003969669342041016, -0.0024166107177734375, -0.0008635520935058594, 0.0006895065307617188, 0.002242565155029297, 0.003795623779296875, 0.005348682403564453, 0.006901741027832031, 0.00845479965209961, 0.010007858276367188, 0.011560916900634766, 0.013113975524902344, 0.014667034149169922, 0.0162200927734375, 0.017773151397705078, 0.019326210021972656, 0.020879268646240234, 0.022432327270507812, 0.02398538589477539, 0.02553844451904297, 0.027091503143310547, 0.028644561767578125, 0.030197620391845703, 0.03175067901611328, 0.03330373764038086, 0.03485679626464844, 0.036409854888916016, 0.037962913513183594, 0.03951597213745117, 0.04106903076171875, 0.04262208938598633, 0.044175148010253906, 0.045728206634521484, 0.04728126525878906, 0.04883432388305664, 0.05038738250732422, 0.0519404411315918, 0.053493499755859375, 0.05504655838012695, 0.05659961700439453, 0.05815267562866211, 0.05970573425292969, 0.061258792877197266, 0.06281185150146484, 0.06436491012573242, 0.06591796875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 11.0, 48.0, 161.0, 557.0, 174.0, 38.0, 11.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1114814281463623, -1.0865565538406372, -1.0616317987442017, -1.0367069244384766, -1.0117820501327515, -0.9868572354316711, -0.9619324207305908, -0.9370075464248657, -0.9120827317237854, -0.8871579170227051, -0.86223304271698, -0.8373082280158997, -0.8123834133148193, -0.7874585390090942, -0.7625337243080139, -0.7376089096069336, -0.7126840353012085, -0.6877592206001282, -0.6628343462944031, -0.6379095315933228, -0.6129847168922424, -0.5880598425865173, -0.563135027885437, -0.5382101535797119, -0.5132853984832764, -0.48836055397987366, -0.46343573927879333, -0.4385108947753906, -0.4135860502719879, -0.3886612057685852, -0.3637363910675049, -0.3388115465641022, -0.31388670206069946, -0.28896185755729675, -0.26403704285621643, -0.23911219835281372, -0.214187353849411, -0.1892625242471695, -0.16433769464492798, -0.13941285014152527, -0.11448802053928375, -0.08956318348646164, -0.06463834643363953, -0.03971351683139801, -0.014788679778575897, 0.010136157274246216, 0.03506098687648773, 0.05998583137989044, 0.08491066098213196, 0.10983549803495407, 0.13476033508777618, 0.1596851646900177, 0.1846100091934204, 0.20953483879566193, 0.23445966839790344, 0.25938451290130615, 0.2843093276023865, 0.3092341721057892, 0.3341589868068695, 0.3590838313102722, 0.3840086758136749, 0.40893352031707764, 0.43385833501815796, 0.45878317952156067, 0.4837080240249634]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 8.0, 6.0, 8.0, 5.0, 8.0, 12.0, 19.0, 19.0, 23.0, 36.0, 34.0, 29.0, 38.0, 50.0, 38.0, 52.0, 56.0, 43.0, 65.0, 63.0, 62.0, 40.0, 35.0, 31.0, 35.0, 28.0, 25.0, 22.0, 13.0, 16.0, 14.0, 13.0, 13.0, 10.0, 7.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1524093747138977, -0.14752794802188873, -0.14264653623104095, -0.13776510953903198, -0.1328836977481842, -0.12800227105617523, -0.12312085181474686, -0.11823943257331848, -0.1133580133318901, -0.10847659409046173, -0.10359517484903336, -0.09871375560760498, -0.09383232891559601, -0.08895091712474823, -0.08406949043273926, -0.07918807119131088, -0.07430665194988251, -0.06942523270845413, -0.06454381346702576, -0.05966239050030708, -0.05478097125887871, -0.04989955201745033, -0.04501812905073166, -0.040136709809303284, -0.03525529056787491, -0.030373871326446533, -0.02549245022237301, -0.020611029118299484, -0.01572960987687111, -0.010848190635442734, -0.005966769531369209, -0.0010853484272956848, 0.0037960708141326904, 0.00867749098688364, 0.01355891115963459, 0.018440332263708115, 0.02332175150513649, 0.028203170746564865, 0.03308459371328354, 0.037966012954711914, 0.04284743219614029, 0.047728851437568665, 0.05261027067899704, 0.057491693645715714, 0.06237311288714409, 0.06725452840328217, 0.07213595509529114, 0.07701737433671951, 0.08189879357814789, 0.08678021281957626, 0.09166163206100464, 0.09654305130243301, 0.10142447054386139, 0.10630589723587036, 0.11118731647729874, 0.11606873571872711, 0.12095015496015549, 0.12583157420158386, 0.13071300089359283, 0.1355944126844406, 0.14047583937644958, 0.14535725116729736, 0.15023867785930634, 0.1551201045513153, 0.16000151634216309]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 9.0, 7.0, 9.0, 18.0, 21.0, 21.0, 29.0, 29.0, 55.0, 107.0, 170.0, 367.0, 1018.0, 8573.0, 4155253.0, 25872.0, 1664.0, 497.0, 210.0, 108.0, 67.0, 47.0, 27.0, 25.0, 18.0, 16.0, 9.0, 12.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052581787109375, -0.05044698715209961, -0.04831218719482422, -0.04617738723754883, -0.04404258728027344, -0.04190778732299805, -0.039772987365722656, -0.037638187408447266, -0.035503387451171875, -0.033368587493896484, -0.031233787536621094, -0.029098987579345703, -0.026964187622070312, -0.024829387664794922, -0.02269458770751953, -0.02055978775024414, -0.01842498779296875, -0.01629018783569336, -0.014155387878417969, -0.012020587921142578, -0.009885787963867188, -0.007750988006591797, -0.005616188049316406, -0.0034813880920410156, -0.001346588134765625, 0.0007882118225097656, 0.0029230117797851562, 0.005057811737060547, 0.0071926116943359375, 0.009327411651611328, 0.011462211608886719, 0.01359701156616211, 0.0157318115234375, 0.01786661148071289, 0.02000141143798828, 0.022136211395263672, 0.024271011352539062, 0.026405811309814453, 0.028540611267089844, 0.030675411224365234, 0.032810211181640625, 0.034945011138916016, 0.037079811096191406, 0.0392146110534668, 0.04134941101074219, 0.04348421096801758, 0.04561901092529297, 0.04775381088256836, 0.04988861083984375, 0.05202341079711914, 0.05415821075439453, 0.05629301071166992, 0.05842781066894531, 0.0605626106262207, 0.0626974105834961, 0.06483221054077148, 0.06696701049804688, 0.06910181045532227, 0.07123661041259766, 0.07337141036987305, 0.07550621032714844, 0.07764101028442383, 0.07977581024169922, 0.08191061019897461, 0.08404541015625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 13.0, 8.0, 9.0, 22.0, 25.0, 30.0, 58.0, 55.0, 81.0, 70.0, 80.0, 109.0, 83.0, 79.0, 71.0, 64.0, 34.0, 24.0, 27.0, 22.0, 8.0, 5.0, 7.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01534271240234375, -0.01482236385345459, -0.01430201530456543, -0.01378166675567627, -0.01326131820678711, -0.01274096965789795, -0.012220621109008789, -0.011700272560119629, -0.011179924011230469, -0.010659575462341309, -0.010139226913452148, -0.009618878364562988, -0.009098529815673828, -0.008578181266784668, -0.008057832717895508, -0.007537484169006348, -0.0070171356201171875, -0.006496787071228027, -0.005976438522338867, -0.005456089973449707, -0.004935741424560547, -0.004415392875671387, -0.0038950443267822266, -0.0033746957778930664, -0.0028543472290039062, -0.002333998680114746, -0.001813650131225586, -0.0012933015823364258, -0.0007729530334472656, -0.00025260448455810547, 0.0002677440643310547, 0.0007880926132202148, 0.001308441162109375, 0.0018287897109985352, 0.0023491382598876953, 0.0028694868087768555, 0.0033898353576660156, 0.003910183906555176, 0.004430532455444336, 0.004950881004333496, 0.005471229553222656, 0.005991578102111816, 0.0065119266510009766, 0.007032275199890137, 0.007552623748779297, 0.008072972297668457, 0.008593320846557617, 0.009113669395446777, 0.009634017944335938, 0.010154366493225098, 0.010674715042114258, 0.011195063591003418, 0.011715412139892578, 0.012235760688781738, 0.012756109237670898, 0.013276457786560059, 0.013796806335449219, 0.014317154884338379, 0.014837503433227539, 0.0153578519821167, 0.01587820053100586, 0.01639854907989502, 0.01691889762878418, 0.01743924617767334, 0.0179595947265625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 16.0, 12.0, 19.0, 40.0, 74.0, 138.0, 390.0, 3710.0, 4137344.0, 50724.0, 1046.0, 285.0, 160.0, 109.0, 64.0, 56.0, 32.0, 21.0, 16.0, 10.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12017822265625, -0.117156982421875, -0.1141357421875, -0.111114501953125, -0.10809326171875, -0.105072021484375, -0.10205078125, -0.099029541015625, -0.09600830078125, -0.092987060546875, -0.0899658203125, -0.086944580078125, -0.08392333984375, -0.080902099609375, -0.077880859375, -0.074859619140625, -0.07183837890625, -0.068817138671875, -0.0657958984375, -0.062774658203125, -0.05975341796875, -0.056732177734375, -0.0537109375, -0.050689697265625, -0.04766845703125, -0.044647216796875, -0.0416259765625, -0.038604736328125, -0.03558349609375, -0.032562255859375, -0.029541015625, -0.026519775390625, -0.02349853515625, -0.020477294921875, -0.0174560546875, -0.014434814453125, -0.01141357421875, -0.008392333984375, -0.00537109375, -0.002349853515625, 0.00067138671875, 0.003692626953125, 0.0067138671875, 0.009735107421875, 0.01275634765625, 0.015777587890625, 0.018798828125, 0.021820068359375, 0.02484130859375, 0.027862548828125, 0.0308837890625, 0.033905029296875, 0.03692626953125, 0.039947509765625, 0.04296875, 0.045989990234375, 0.04901123046875, 0.052032470703125, 0.0550537109375, 0.058074951171875, 0.06109619140625, 0.064117431640625, 0.067138671875, 0.070159912109375, 0.07318115234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 8.0, 15.0, 22.0, 52.0, 181.0, 2529.0, 1073.0, 125.0, 44.0, 16.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290679931640625, -0.02711176872253418, -0.02515554428100586, -0.02319931983947754, -0.02124309539794922, -0.0192868709564209, -0.017330646514892578, -0.015374422073364258, -0.013418197631835938, -0.011461973190307617, -0.009505748748779297, -0.0075495243072509766, -0.005593299865722656, -0.003637075424194336, -0.0016808509826660156, 0.0002753734588623047, 0.002231597900390625, 0.004187822341918945, 0.006144046783447266, 0.008100271224975586, 0.010056495666503906, 0.012012720108032227, 0.013968944549560547, 0.015925168991088867, 0.017881393432617188, 0.019837617874145508, 0.021793842315673828, 0.02375006675720215, 0.02570629119873047, 0.02766251564025879, 0.02961874008178711, 0.03157496452331543, 0.03353118896484375, 0.03548741340637207, 0.03744363784790039, 0.03939986228942871, 0.04135608673095703, 0.04331231117248535, 0.04526853561401367, 0.04722476005554199, 0.04918098449707031, 0.05113720893859863, 0.05309343338012695, 0.05504965782165527, 0.057005882263183594, 0.058962106704711914, 0.060918331146240234, 0.06287455558776855, 0.06483078002929688, 0.0667870044708252, 0.06874322891235352, 0.07069945335388184, 0.07265567779541016, 0.07461190223693848, 0.0765681266784668, 0.07852435111999512, 0.08048057556152344, 0.08243680000305176, 0.08439302444458008, 0.0863492488861084, 0.08830547332763672, 0.09026169776916504, 0.09221792221069336, 0.09417414665222168, 0.09613037109375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 11.0, 14.0, 16.0, 21.0, 38.0, 79.0, 155.0, 199.0, 168.0, 79.0, 57.0, 42.0, 31.0, 20.0, 11.0, 19.0, 10.0, 8.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28262707591056824, -0.2751024663448334, -0.2675778269767761, -0.26005321741104126, -0.2525286078453064, -0.24500398337841034, -0.23747935891151428, -0.22995474934577942, -0.22243012487888336, -0.2149055004119873, -0.20738089084625244, -0.19985626637935638, -0.19233165681362152, -0.18480703234672546, -0.1772824227809906, -0.16975779831409454, -0.1622331738471985, -0.15470854938030243, -0.14718393981456757, -0.1396593153476715, -0.13213470578193665, -0.12461008131504059, -0.11708546429872513, -0.10956084728240967, -0.1020362377166748, -0.09451162070035934, -0.08698700368404388, -0.07946237921714783, -0.07193776220083237, -0.0644131451845169, -0.05688852816820145, -0.04936390742659569, -0.04183928668498993, -0.03431466966867447, -0.02679004892706871, -0.01926543191075325, -0.01174081303179264, -0.004216194152832031, 0.003308422863483429, 0.010833043605089188, 0.018357660621404648, 0.025882279500365257, 0.03340689837932587, 0.04093151539564133, 0.04845613241195679, 0.055980753153562546, 0.06350536644458771, 0.07102999091148376, 0.07855460792779922, 0.08607922494411469, 0.09360384196043015, 0.1011284589767456, 0.10865308344364166, 0.11617770045995712, 0.12370231747627258, 0.13122694194316864, 0.1387515515089035, 0.14627617597579956, 0.15380078554153442, 0.16132541000843048, 0.16885001957416534, 0.1763746440410614, 0.18389925360679626, 0.19142387807369232, 0.19894850254058838]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 12.0, 8.0, 5.0, 8.0, 7.0, 7.0, 16.0, 19.0, 11.0, 33.0, 25.0, 25.0, 30.0, 30.0, 27.0, 28.0, 36.0, 46.0, 50.0, 48.0, 49.0, 45.0, 38.0, 56.0, 56.0, 42.0, 32.0, 29.0, 30.0, 19.0, 28.0, 11.0, 17.0, 11.0, 12.0, 9.0, 10.0, 9.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.14713478088378906, -0.14239844679832458, -0.1376621127128601, -0.13292576372623444, -0.12818942964076996, -0.12345309555530548, -0.1187167540192604, -0.11398041248321533, -0.10924407839775085, -0.10450774431228638, -0.0997714027762413, -0.09503506124019623, -0.09029872715473175, -0.08556239306926727, -0.0808260515332222, -0.07608970999717712, -0.07135337591171265, -0.06661704182624817, -0.061880700290203094, -0.05714436247944832, -0.05240802466869354, -0.047671686857938766, -0.04293534904718399, -0.038199011236429214, -0.03346267342567444, -0.028726335614919662, -0.023989997804164886, -0.01925365999341011, -0.014517322182655334, -0.009780984371900558, -0.0050446465611457825, -0.00030830875039100647, 0.0044280290603637695, 0.009164366871118546, 0.013900704681873322, 0.018637042492628098, 0.023373380303382874, 0.02810971811413765, 0.032846055924892426, 0.0375823937356472, 0.04231873154640198, 0.047055069357156754, 0.05179140716791153, 0.056527744978666306, 0.06126408278942108, 0.06600041687488556, 0.07073675841093063, 0.07547309994697571, 0.08020943403244019, 0.08494576811790466, 0.08968210965394974, 0.09441845118999481, 0.09915478527545929, 0.10389111936092377, 0.10862746089696884, 0.11336380243301392, 0.1181001365184784, 0.12283647060394287, 0.12757280468940735, 0.13230915367603302, 0.1370454877614975, 0.14178182184696198, 0.14651817083358765, 0.15125450491905212, 0.1559908390045166]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 11.0, 5.0, 15.0, 33.0, 43.0, 82.0, 115.0, 144.0, 242.0, 364.0, 732.0, 1230.0, 2434.0, 4948.0, 10648.0, 26336.0, 71049.0, 236234.0, 462555.0, 147715.0, 49019.0, 18586.0, 7923.0, 3710.0, 1843.0, 1052.0, 565.0, 308.0, 223.0, 122.0, 93.0, 50.0, 37.0, 27.0, 11.0, 18.0, 12.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01611328125, -0.015523433685302734, -0.014933586120605469, -0.014343738555908203, -0.013753890991210938, -0.013164043426513672, -0.012574195861816406, -0.01198434829711914, -0.011394500732421875, -0.01080465316772461, -0.010214805603027344, -0.009624958038330078, -0.009035110473632812, -0.008445262908935547, -0.007855415344238281, -0.007265567779541016, -0.00667572021484375, -0.006085872650146484, -0.005496025085449219, -0.004906177520751953, -0.0043163299560546875, -0.003726482391357422, -0.0031366348266601562, -0.0025467872619628906, -0.001956939697265625, -0.0013670921325683594, -0.0007772445678710938, -0.00018739700317382812, 0.0004024505615234375, 0.0009922981262207031, 0.0015821456909179688, 0.0021719932556152344, 0.0027618408203125, 0.0033516883850097656, 0.003941535949707031, 0.004531383514404297, 0.0051212310791015625, 0.005711078643798828, 0.006300926208496094, 0.006890773773193359, 0.007480621337890625, 0.00807046890258789, 0.008660316467285156, 0.009250164031982422, 0.009840011596679688, 0.010429859161376953, 0.011019706726074219, 0.011609554290771484, 0.01219940185546875, 0.012789249420166016, 0.013379096984863281, 0.013968944549560547, 0.014558792114257812, 0.015148639678955078, 0.015738487243652344, 0.01632833480834961, 0.016918182373046875, 0.01750802993774414, 0.018097877502441406, 0.018687725067138672, 0.019277572631835938, 0.019867420196533203, 0.02045726776123047, 0.021047115325927734, 0.021636962890625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 13.0, 10.0, 20.0, 28.0, 42.0, 45.0, 70.0, 65.0, 73.0, 85.0, 61.0, 93.0, 75.0, 64.0, 59.0, 48.0, 37.0, 29.0, 25.0, 6.0, 12.0, 10.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01473236083984375, -0.014180302619934082, -0.013628244400024414, -0.013076186180114746, -0.012524127960205078, -0.01197206974029541, -0.011420011520385742, -0.010867953300476074, -0.010315895080566406, -0.009763836860656738, -0.00921177864074707, -0.008659720420837402, -0.008107662200927734, -0.007555603981018066, -0.0070035457611083984, -0.0064514875411987305, -0.0058994293212890625, -0.0053473711013793945, -0.0047953128814697266, -0.004243254661560059, -0.0036911964416503906, -0.0031391382217407227, -0.0025870800018310547, -0.0020350217819213867, -0.0014829635620117188, -0.0009309053421020508, -0.0003788471221923828, 0.00017321109771728516, 0.0007252693176269531, 0.001277327537536621, 0.001829385757446289, 0.002381443977355957, 0.002933502197265625, 0.003485560417175293, 0.004037618637084961, 0.004589676856994629, 0.005141735076904297, 0.005693793296813965, 0.006245851516723633, 0.006797909736633301, 0.007349967956542969, 0.007902026176452637, 0.008454084396362305, 0.009006142616271973, 0.00955820083618164, 0.010110259056091309, 0.010662317276000977, 0.011214375495910645, 0.011766433715820312, 0.01231849193572998, 0.012870550155639648, 0.013422608375549316, 0.013974666595458984, 0.014526724815368652, 0.01507878303527832, 0.01563084125518799, 0.016182899475097656, 0.016734957695007324, 0.017287015914916992, 0.01783907413482666, 0.018391132354736328, 0.018943190574645996, 0.019495248794555664, 0.020047307014465332, 0.020599365234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 16.0, 6.0, 26.0, 28.0, 54.0, 78.0, 169.0, 336.0, 816.0, 2798.0, 14832.0, 375730.0, 631742.0, 17153.0, 3074.0, 897.0, 396.0, 168.0, 93.0, 49.0, 32.0, 19.0, 11.0, 7.0, 4.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07696533203125, -0.07463550567626953, -0.07230567932128906, -0.0699758529663086, -0.06764602661132812, -0.06531620025634766, -0.06298637390136719, -0.06065654754638672, -0.05832672119140625, -0.05599689483642578, -0.05366706848144531, -0.051337242126464844, -0.049007415771484375, -0.046677589416503906, -0.04434776306152344, -0.04201793670654297, -0.0396881103515625, -0.03735828399658203, -0.03502845764160156, -0.032698631286621094, -0.030368804931640625, -0.028038978576660156, -0.025709152221679688, -0.02337932586669922, -0.02104949951171875, -0.01871967315673828, -0.016389846801757812, -0.014060020446777344, -0.011730194091796875, -0.009400367736816406, -0.0070705413818359375, -0.004740715026855469, -0.002410888671875, -8.106231689453125e-05, 0.0022487640380859375, 0.004578590393066406, 0.006908416748046875, 0.009238243103027344, 0.011568069458007812, 0.013897895812988281, 0.01622772216796875, 0.01855754852294922, 0.020887374877929688, 0.023217201232910156, 0.025547027587890625, 0.027876853942871094, 0.030206680297851562, 0.03253650665283203, 0.0348663330078125, 0.03719615936279297, 0.03952598571777344, 0.041855812072753906, 0.044185638427734375, 0.046515464782714844, 0.04884529113769531, 0.05117511749267578, 0.05350494384765625, 0.05583477020263672, 0.05816459655761719, 0.060494422912597656, 0.06282424926757812, 0.0651540756225586, 0.06748390197753906, 0.06981372833251953, 0.0721435546875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 9.0, 4.0, 11.0, 7.0, 11.0, 16.0, 32.0, 31.0, 43.0, 47.0, 55.0, 69.0, 65.0, 72.0, 93.0, 64.0, 63.0, 42.0, 62.0, 50.0, 38.0, 24.0, 18.0, 14.0, 9.0, 15.0, 9.0, 8.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.071533203125, -0.069305419921875, -0.06707763671875, -0.064849853515625, -0.0626220703125, -0.060394287109375, -0.05816650390625, -0.055938720703125, -0.0537109375, -0.051483154296875, -0.04925537109375, -0.047027587890625, -0.0447998046875, -0.042572021484375, -0.04034423828125, -0.038116455078125, -0.035888671875, -0.033660888671875, -0.03143310546875, -0.029205322265625, -0.0269775390625, -0.024749755859375, -0.02252197265625, -0.020294189453125, -0.01806640625, -0.015838623046875, -0.01361083984375, -0.011383056640625, -0.0091552734375, -0.006927490234375, -0.00469970703125, -0.002471923828125, -0.000244140625, 0.001983642578125, 0.00421142578125, 0.006439208984375, 0.0086669921875, 0.010894775390625, 0.01312255859375, 0.015350341796875, 0.017578125, 0.019805908203125, 0.02203369140625, 0.024261474609375, 0.0264892578125, 0.028717041015625, 0.03094482421875, 0.033172607421875, 0.035400390625, 0.037628173828125, 0.03985595703125, 0.042083740234375, 0.0443115234375, 0.046539306640625, 0.04876708984375, 0.050994873046875, 0.05322265625, 0.055450439453125, 0.05767822265625, 0.059906005859375, 0.0621337890625, 0.064361572265625, 0.06658935546875, 0.068817138671875, 0.071044921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 8.0, 11.0, 8.0, 19.0, 29.0, 49.0, 40.0, 74.0, 111.0, 177.0, 280.0, 470.0, 801.0, 1539.0, 3057.0, 7669.0, 25775.0, 929813.0, 57059.0, 12454.0, 4502.0, 2000.0, 1007.0, 594.0, 358.0, 207.0, 146.0, 80.0, 50.0, 42.0, 35.0, 17.0, 15.0, 11.0, 9.0, 6.0, 5.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038177490234375, -0.03689289093017578, -0.03560829162597656, -0.034323692321777344, -0.033039093017578125, -0.031754493713378906, -0.030469894409179688, -0.02918529510498047, -0.02790069580078125, -0.02661609649658203, -0.025331497192382812, -0.024046897888183594, -0.022762298583984375, -0.021477699279785156, -0.020193099975585938, -0.01890850067138672, -0.0176239013671875, -0.01633930206298828, -0.015054702758789062, -0.013770103454589844, -0.012485504150390625, -0.011200904846191406, -0.009916305541992188, -0.008631706237792969, -0.00734710693359375, -0.006062507629394531, -0.0047779083251953125, -0.0034933090209960938, -0.002208709716796875, -0.0009241104125976562, 0.0003604888916015625, 0.0016450881958007812, 0.0029296875, 0.004214286804199219, 0.0054988861083984375, 0.006783485412597656, 0.008068084716796875, 0.009352684020996094, 0.010637283325195312, 0.011921882629394531, 0.01320648193359375, 0.014491081237792969, 0.015775680541992188, 0.017060279846191406, 0.018344879150390625, 0.019629478454589844, 0.020914077758789062, 0.02219867706298828, 0.0234832763671875, 0.02476787567138672, 0.026052474975585938, 0.027337074279785156, 0.028621673583984375, 0.029906272888183594, 0.031190872192382812, 0.03247547149658203, 0.03376007080078125, 0.03504467010498047, 0.03632926940917969, 0.037613868713378906, 0.038898468017578125, 0.040183067321777344, 0.04146766662597656, 0.04275226593017578, 0.044036865234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 5.0, 4.0, 8.0, 7.0, 7.0, 6.0, 8.0, 18.0, 20.0, 30.0, 36.0, 47.0, 92.0, 86.0, 96.0, 121.0, 102.0, 73.0, 57.0, 39.0, 28.0, 21.0, 19.0, 14.0, 7.0, 7.0, 6.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8710575103759766e-05, -5.676690489053726e-05, -5.482323467731476e-05, -5.2879564464092255e-05, -5.093589425086975e-05, -4.899222403764725e-05, -4.7048553824424744e-05, -4.510488361120224e-05, -4.3161213397979736e-05, -4.121754318475723e-05, -3.927387297153473e-05, -3.7330202758312225e-05, -3.538653254508972e-05, -3.344286233186722e-05, -3.1499192118644714e-05, -2.955552190542221e-05, -2.7611851692199707e-05, -2.5668181478977203e-05, -2.37245112657547e-05, -2.1780841052532196e-05, -1.9837170839309692e-05, -1.789350062608719e-05, -1.5949830412864685e-05, -1.4006160199642181e-05, -1.2062489986419678e-05, -1.0118819773197174e-05, -8.17514955997467e-06, -6.231479346752167e-06, -4.287809133529663e-06, -2.3441389203071594e-06, -4.0046870708465576e-07, 1.543201506137848e-06, 3.4868717193603516e-06, 5.430541932582855e-06, 7.374212145805359e-06, 9.317882359027863e-06, 1.1261552572250366e-05, 1.320522278547287e-05, 1.5148892998695374e-05, 1.7092563211917877e-05, 1.903623342514038e-05, 2.0979903638362885e-05, 2.2923573851585388e-05, 2.4867244064807892e-05, 2.6810914278030396e-05, 2.87545844912529e-05, 3.06982547044754e-05, 3.2641924917697906e-05, 3.458559513092041e-05, 3.6529265344142914e-05, 3.847293555736542e-05, 4.041660577058792e-05, 4.2360275983810425e-05, 4.430394619703293e-05, 4.624761641025543e-05, 4.8191286623477936e-05, 5.013495683670044e-05, 5.207862704992294e-05, 5.402229726314545e-05, 5.596596747636795e-05, 5.7909637689590454e-05, 5.985330790281296e-05, 6.179697811603546e-05, 6.374064832925797e-05, 6.568431854248047e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 6.0, 4.0, 5.0, 11.0, 4.0, 12.0, 21.0, 34.0, 57.0, 129.0, 240.0, 736.0, 2265.0, 9146.0, 82464.0, 934213.0, 14435.0, 3141.0, 952.0, 358.0, 148.0, 60.0, 42.0, 22.0, 14.0, 9.0, 5.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07110595703125, -0.06908226013183594, -0.06705856323242188, -0.06503486633300781, -0.06301116943359375, -0.06098747253417969, -0.058963775634765625, -0.05694007873535156, -0.0549163818359375, -0.05289268493652344, -0.050868988037109375, -0.04884529113769531, -0.04682159423828125, -0.04479789733886719, -0.042774200439453125, -0.04075050354003906, -0.038726806640625, -0.03670310974121094, -0.034679412841796875, -0.03265571594238281, -0.03063201904296875, -0.028608322143554688, -0.026584625244140625, -0.024560928344726562, -0.0225372314453125, -0.020513534545898438, -0.018489837646484375, -0.016466140747070312, -0.01444244384765625, -0.012418746948242188, -0.010395050048828125, -0.008371353149414062, -0.00634765625, -0.0043239593505859375, -0.002300262451171875, -0.0002765655517578125, 0.00174713134765625, 0.0037708282470703125, 0.005794525146484375, 0.007818222045898438, 0.0098419189453125, 0.011865615844726562, 0.013889312744140625, 0.015913009643554688, 0.01793670654296875, 0.019960403442382812, 0.021984100341796875, 0.024007797241210938, 0.026031494140625, 0.028055191040039062, 0.030078887939453125, 0.03210258483886719, 0.03412628173828125, 0.03614997863769531, 0.038173675537109375, 0.04019737243652344, 0.0422210693359375, 0.04424476623535156, 0.046268463134765625, 0.04829216003417969, 0.05031585693359375, 0.05233955383300781, 0.054363250732421875, 0.05638694763183594, 0.05841064453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 7.0, 6.0, 9.0, 13.0, 11.0, 13.0, 29.0, 136.0, 453.0, 167.0, 43.0, 15.0, 14.0, 6.0, 6.0, 4.0, 7.0, 7.0, 7.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03997802734375, -0.03862476348876953, -0.03727149963378906, -0.035918235778808594, -0.034564971923828125, -0.033211708068847656, -0.03185844421386719, -0.03050518035888672, -0.02915191650390625, -0.02779865264892578, -0.026445388793945312, -0.025092124938964844, -0.023738861083984375, -0.022385597229003906, -0.021032333374023438, -0.01967906951904297, -0.0183258056640625, -0.01697254180908203, -0.015619277954101562, -0.014266014099121094, -0.012912750244140625, -0.011559486389160156, -0.010206222534179688, -0.008852958679199219, -0.00749969482421875, -0.006146430969238281, -0.0047931671142578125, -0.0034399032592773438, -0.002086639404296875, -0.0007333755493164062, 0.0006198883056640625, 0.0019731521606445312, 0.003326416015625, 0.004679679870605469, 0.0060329437255859375, 0.007386207580566406, 0.008739471435546875, 0.010092735290527344, 0.011445999145507812, 0.012799263000488281, 0.01415252685546875, 0.015505790710449219, 0.016859054565429688, 0.018212318420410156, 0.019565582275390625, 0.020918846130371094, 0.022272109985351562, 0.02362537384033203, 0.0249786376953125, 0.02633190155029297, 0.027685165405273438, 0.029038429260253906, 0.030391693115234375, 0.031744956970214844, 0.03309822082519531, 0.03445148468017578, 0.03580474853515625, 0.03715801239013672, 0.03851127624511719, 0.039864540100097656, 0.041217803955078125, 0.042571067810058594, 0.04392433166503906, 0.04527759552001953, 0.046630859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 9.0, 20.0, 29.0, 42.0, 66.0, 132.0, 246.0, 213.0, 116.0, 59.0, 21.0, 14.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4694001078605652, -0.45262354612350464, -0.4358469545841217, -0.41907039284706116, -0.4022938311100006, -0.3855172395706177, -0.36874067783355713, -0.3519641160964966, -0.33518755435943604, -0.3184109926223755, -0.30163440108299255, -0.284857839345932, -0.26808127760887146, -0.2513046860694885, -0.23452812433242798, -0.21775156259536743, -0.2009749710559845, -0.18419839441776276, -0.1674218326807022, -0.15064525604248047, -0.13386869430541992, -0.11709211766719818, -0.10031554102897644, -0.0835389718413353, -0.06676240265369415, -0.04998583346605301, -0.03320926055312157, -0.016432687640190125, 0.0003438815474510193, 0.017120450735092163, 0.033897027373313904, 0.05067359656095505, 0.06745016574859619, 0.08422673493623734, 0.10100330412387848, 0.11777988076210022, 0.13455644249916077, 0.1513330191373825, 0.16810959577560425, 0.1848861575126648, 0.20166273415088654, 0.21843931078910828, 0.23521587252616882, 0.25199246406555176, 0.2687690258026123, 0.28554558753967285, 0.3023221492767334, 0.31909874081611633, 0.3358753025531769, 0.3526518642902374, 0.36942845582962036, 0.3862050175666809, 0.40298157930374146, 0.419758141040802, 0.43653473258018494, 0.4533112943172455, 0.4700878858566284, 0.48686444759368896, 0.5036410093307495, 0.5204175710678101, 0.5371941924095154, 0.5539707541465759, 0.5707473158836365, 0.587523877620697, 0.6043004393577576]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 1.0, 8.0, 11.0, 16.0, 15.0, 13.0, 21.0, 19.0, 19.0, 23.0, 23.0, 25.0, 37.0, 32.0, 44.0, 41.0, 56.0, 63.0, 70.0, 56.0, 44.0, 34.0, 41.0, 36.0, 32.0, 26.0, 21.0, 22.0, 20.0, 18.0, 15.0, 13.0, 11.0, 14.0, 11.0, 2.0, 11.0, 10.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2635602355003357, -0.25540804862976074, -0.2472558319568634, -0.23910364508628845, -0.2309514433145523, -0.22279924154281616, -0.2146470546722412, -0.20649485290050507, -0.19834265112876892, -0.19019044935703278, -0.18203824758529663, -0.17388606071472168, -0.16573385894298553, -0.1575816571712494, -0.14942947030067444, -0.1412772685289383, -0.13312506675720215, -0.124972864985466, -0.11682067066431046, -0.10866847634315491, -0.10051627457141876, -0.09236407279968262, -0.08421187847852707, -0.07605968415737152, -0.06790748238563538, -0.05975528433918953, -0.05160308629274368, -0.043450888246297836, -0.03529869019985199, -0.027146492153406143, -0.018994294106960297, -0.01084209606051445, -0.0026898980140686035, 0.005462300032377243, 0.01361449807882309, 0.021766696125268936, 0.029918894171714783, 0.03807109221816063, 0.046223290264606476, 0.05437548831105232, 0.06252768635749817, 0.07067988812923431, 0.07883208245038986, 0.08698427677154541, 0.09513647854328156, 0.1032886803150177, 0.11144087463617325, 0.1195930689573288, 0.12774527072906494, 0.1358974725008011, 0.14404967427253723, 0.15220186114311218, 0.16035406291484833, 0.16850626468658447, 0.17665845155715942, 0.18481065332889557, 0.1929628551006317, 0.20111505687236786, 0.209267258644104, 0.21741944551467896, 0.2255716472864151, 0.23372384905815125, 0.2418760359287262, 0.25002825260162354, 0.2581804394721985]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 11.0, 15.0, 13.0, 16.0, 22.0, 42.0, 50.0, 52.0, 87.0, 147.0, 242.0, 457.0, 1042.0, 2611.0, 8130.0, 50952.0, 3364708.0, 733292.0, 22956.0, 5410.0, 2008.0, 914.0, 413.0, 240.0, 141.0, 88.0, 50.0, 50.0, 42.0, 19.0, 15.0, 13.0, 8.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.034149169921875, -0.033246755599975586, -0.03234434127807617, -0.03144192695617676, -0.030539512634277344, -0.02963709831237793, -0.028734683990478516, -0.0278322696685791, -0.026929855346679688, -0.026027441024780273, -0.02512502670288086, -0.024222612380981445, -0.02332019805908203, -0.022417783737182617, -0.021515369415283203, -0.02061295509338379, -0.019710540771484375, -0.01880812644958496, -0.017905712127685547, -0.017003297805786133, -0.01610088348388672, -0.015198469161987305, -0.01429605484008789, -0.013393640518188477, -0.012491226196289062, -0.011588811874389648, -0.010686397552490234, -0.00978398323059082, -0.008881568908691406, -0.007979154586791992, -0.007076740264892578, -0.006174325942993164, -0.00527191162109375, -0.004369497299194336, -0.003467082977294922, -0.002564668655395508, -0.0016622543334960938, -0.0007598400115966797, 0.00014257431030273438, 0.0010449886322021484, 0.0019474029541015625, 0.0028498172760009766, 0.0037522315979003906, 0.004654645919799805, 0.005557060241699219, 0.006459474563598633, 0.007361888885498047, 0.008264303207397461, 0.009166717529296875, 0.010069131851196289, 0.010971546173095703, 0.011873960494995117, 0.012776374816894531, 0.013678789138793945, 0.01458120346069336, 0.015483617782592773, 0.016386032104492188, 0.0172884464263916, 0.018190860748291016, 0.01909327507019043, 0.019995689392089844, 0.020898103713989258, 0.021800518035888672, 0.022702932357788086, 0.0236053466796875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 10.0, 11.0, 13.0, 17.0, 29.0, 31.0, 38.0, 41.0, 50.0, 74.0, 50.0, 79.0, 61.0, 85.0, 63.0, 60.0, 53.0, 43.0, 50.0, 32.0, 20.0, 25.0, 12.0, 6.0, 10.0, 9.0, 10.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01512908935546875, -0.014623284339904785, -0.01411747932434082, -0.013611674308776855, -0.01310586929321289, -0.012600064277648926, -0.012094259262084961, -0.011588454246520996, -0.011082649230957031, -0.010576844215393066, -0.010071039199829102, -0.009565234184265137, -0.009059429168701172, -0.008553624153137207, -0.008047819137573242, -0.007542014122009277, -0.0070362091064453125, -0.006530404090881348, -0.006024599075317383, -0.005518794059753418, -0.005012989044189453, -0.004507184028625488, -0.0040013790130615234, -0.0034955739974975586, -0.0029897689819335938, -0.002483963966369629, -0.001978158950805664, -0.0014723539352416992, -0.0009665489196777344, -0.00046074390411376953, 4.506111145019531e-05, 0.0005508661270141602, 0.001056671142578125, 0.0015624761581420898, 0.0020682811737060547, 0.0025740861892700195, 0.0030798912048339844, 0.0035856962203979492, 0.004091501235961914, 0.004597306251525879, 0.005103111267089844, 0.005608916282653809, 0.0061147212982177734, 0.006620526313781738, 0.007126331329345703, 0.007632136344909668, 0.008137941360473633, 0.008643746376037598, 0.009149551391601562, 0.009655356407165527, 0.010161161422729492, 0.010666966438293457, 0.011172771453857422, 0.011678576469421387, 0.012184381484985352, 0.012690186500549316, 0.013195991516113281, 0.013701796531677246, 0.014207601547241211, 0.014713406562805176, 0.01521921157836914, 0.015725016593933105, 0.01623082160949707, 0.016736626625061035, 0.017242431640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 9.0, 8.0, 13.0, 29.0, 25.0, 50.0, 61.0, 87.0, 131.0, 203.0, 438.0, 928.0, 3336.0, 24751.0, 3947400.0, 200883.0, 11019.0, 2590.0, 958.0, 487.0, 264.0, 201.0, 123.0, 74.0, 76.0, 33.0, 32.0, 25.0, 8.0, 15.0, 7.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052947998046875, -0.05116987228393555, -0.049391746520996094, -0.04761362075805664, -0.04583549499511719, -0.044057369232177734, -0.04227924346923828, -0.04050111770629883, -0.038722991943359375, -0.03694486618041992, -0.03516674041748047, -0.033388614654541016, -0.03161048889160156, -0.02983236312866211, -0.028054237365722656, -0.026276111602783203, -0.02449798583984375, -0.022719860076904297, -0.020941734313964844, -0.01916360855102539, -0.017385482788085938, -0.015607357025146484, -0.013829231262207031, -0.012051105499267578, -0.010272979736328125, -0.008494853973388672, -0.006716728210449219, -0.004938602447509766, -0.0031604766845703125, -0.0013823509216308594, 0.00039577484130859375, 0.002173900604248047, 0.0039520263671875, 0.005730152130126953, 0.007508277893066406, 0.00928640365600586, 0.011064529418945312, 0.012842655181884766, 0.014620780944824219, 0.016398906707763672, 0.018177032470703125, 0.019955158233642578, 0.02173328399658203, 0.023511409759521484, 0.025289535522460938, 0.02706766128540039, 0.028845787048339844, 0.030623912811279297, 0.03240203857421875, 0.0341801643371582, 0.035958290100097656, 0.03773641586303711, 0.03951454162597656, 0.041292667388916016, 0.04307079315185547, 0.04484891891479492, 0.046627044677734375, 0.04840517044067383, 0.05018329620361328, 0.051961421966552734, 0.05373954772949219, 0.05551767349243164, 0.057295799255371094, 0.05907392501831055, 0.06085205078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 5.0, 15.0, 22.0, 50.0, 94.0, 235.0, 1187.0, 1767.0, 400.0, 118.0, 54.0, 28.0, 23.0, 14.0, 12.0, 7.0, 8.0, 5.0, 4.0, 7.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.025299072265625, -0.02415752410888672, -0.023015975952148438, -0.021874427795410156, -0.020732879638671875, -0.019591331481933594, -0.018449783325195312, -0.01730823516845703, -0.01616668701171875, -0.015025138854980469, -0.013883590698242188, -0.012742042541503906, -0.011600494384765625, -0.010458946228027344, -0.009317398071289062, -0.008175849914550781, -0.0070343017578125, -0.005892753601074219, -0.0047512054443359375, -0.0036096572875976562, -0.002468109130859375, -0.0013265609741210938, -0.0001850128173828125, 0.0009565353393554688, 0.00209808349609375, 0.0032396316528320312, 0.0043811798095703125, 0.005522727966308594, 0.006664276123046875, 0.007805824279785156, 0.008947372436523438, 0.010088920593261719, 0.01123046875, 0.012372016906738281, 0.013513565063476562, 0.014655113220214844, 0.015796661376953125, 0.016938209533691406, 0.018079757690429688, 0.01922130584716797, 0.02036285400390625, 0.02150440216064453, 0.022645950317382812, 0.023787498474121094, 0.024929046630859375, 0.026070594787597656, 0.027212142944335938, 0.02835369110107422, 0.0294952392578125, 0.03063678741455078, 0.03177833557128906, 0.032919883728027344, 0.034061431884765625, 0.035202980041503906, 0.03634452819824219, 0.03748607635498047, 0.03862762451171875, 0.03976917266845703, 0.04091072082519531, 0.042052268981933594, 0.043193817138671875, 0.044335365295410156, 0.04547691345214844, 0.04661846160888672, 0.047760009765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 16.0, 39.0, 61.0, 135.0, 233.0, 219.0, 126.0, 69.0, 34.0, 21.0, 14.0, 11.0, 7.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3248322010040283, -0.31391409039497375, -0.3029959797859192, -0.2920778691768646, -0.28115975856781006, -0.2702416181564331, -0.2593235373497009, -0.24840539693832397, -0.2374872863292694, -0.22656917572021484, -0.21565106511116028, -0.2047329545021057, -0.19381482899188995, -0.1828967183828354, -0.17197860777378082, -0.16106048226356506, -0.1501423865556717, -0.13922427594661713, -0.12830616533756256, -0.1173880472779274, -0.10646992921829224, -0.09555181860923767, -0.0846337080001831, -0.07371558994054794, -0.06279747933149338, -0.051879364997148514, -0.04096125066280365, -0.030043140053749084, -0.01912502571940422, -0.008206911385059357, 0.0027111992239952087, 0.013629317283630371, 0.024547427892684937, 0.0354655422270298, 0.046383656561374664, 0.05730176717042923, 0.06821988523006439, 0.07913799583911896, 0.09005610644817352, 0.10097422450780869, 0.11189233511686325, 0.12281044572591782, 0.13372856378555298, 0.14464667439460754, 0.1555647850036621, 0.16648289561271667, 0.17740100622177124, 0.188319131731987, 0.19923724234104156, 0.21015535295009613, 0.2210734635591507, 0.23199158906936646, 0.24290969967842102, 0.2538278102874756, 0.26474592089653015, 0.2756640315055847, 0.2865821421146393, 0.29750025272369385, 0.3084183633327484, 0.319336473941803, 0.33025458455085754, 0.3411726951599121, 0.35209083557128906, 0.36300894618034363, 0.3739270567893982]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 6.0, 12.0, 8.0, 11.0, 10.0, 11.0, 21.0, 25.0, 22.0, 26.0, 45.0, 36.0, 54.0, 55.0, 43.0, 53.0, 55.0, 60.0, 47.0, 55.0, 45.0, 52.0, 36.0, 36.0, 27.0, 23.0, 22.0, 21.0, 16.0, 17.0, 14.0, 12.0, 2.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12280076742172241, -0.1182720810174942, -0.1137433871626854, -0.10921470075845718, -0.10468600690364838, -0.10015732049942017, -0.09562863409519196, -0.09109994769096375, -0.08657125383615494, -0.08204256743192673, -0.07751387357711792, -0.07298518717288971, -0.0684565007686615, -0.06392780691385269, -0.05939912050962448, -0.05487043038010597, -0.05034174025058746, -0.045813050121068954, -0.041284359991550446, -0.036755673587322235, -0.032226983457803726, -0.027698293328285217, -0.023169605061411858, -0.018640916794538498, -0.014112226665019989, -0.009583537466824055, -0.00505484826862812, -0.0005261590704321861, 0.004002530127763748, 0.008531220257282257, 0.013059908524155617, 0.017588596791028976, 0.022117286920547485, 0.026645977050065994, 0.031174665316939354, 0.035703353583812714, 0.04023204371333122, 0.04476073384284973, 0.04928942024707794, 0.05381811037659645, 0.05834680050611496, 0.06287548691034317, 0.06740418076515198, 0.07193286716938019, 0.0764615535736084, 0.0809902474284172, 0.08551893383264542, 0.09004762768745422, 0.09457631409168243, 0.09910500049591064, 0.10363369435071945, 0.10816238075494766, 0.11269107460975647, 0.11721976101398468, 0.12174844741821289, 0.1262771338224411, 0.1308058202266693, 0.13533450663089752, 0.13986319303512573, 0.14439189434051514, 0.14892058074474335, 0.15344926714897156, 0.15797795355319977, 0.16250663995742798, 0.16703534126281738]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 3.0, 5.0, 4.0, 8.0, 19.0, 15.0, 30.0, 64.0, 104.0, 133.0, 202.0, 381.0, 682.0, 1332.0, 2336.0, 4567.0, 9702.0, 21728.0, 53459.0, 152650.0, 416720.0, 245100.0, 81522.0, 31709.0, 13427.0, 6106.0, 2984.0, 1556.0, 845.0, 479.0, 257.0, 172.0, 87.0, 58.0, 28.0, 31.0, 16.0, 13.0, 11.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0213470458984375, -0.02062845230102539, -0.01990985870361328, -0.019191265106201172, -0.018472671508789062, -0.017754077911376953, -0.017035484313964844, -0.016316890716552734, -0.015598297119140625, -0.014879703521728516, -0.014161109924316406, -0.013442516326904297, -0.012723922729492188, -0.012005329132080078, -0.011286735534667969, -0.01056814193725586, -0.00984954833984375, -0.00913095474243164, -0.008412361145019531, -0.007693767547607422, -0.0069751739501953125, -0.006256580352783203, -0.005537986755371094, -0.004819393157958984, -0.004100799560546875, -0.0033822059631347656, -0.0026636123657226562, -0.0019450187683105469, -0.0012264251708984375, -0.0005078315734863281, 0.00021076202392578125, 0.0009293556213378906, 0.00164794921875, 0.0023665428161621094, 0.0030851364135742188, 0.003803730010986328, 0.0045223236083984375, 0.005240917205810547, 0.005959510803222656, 0.006678104400634766, 0.007396697998046875, 0.008115291595458984, 0.008833885192871094, 0.009552478790283203, 0.010271072387695312, 0.010989665985107422, 0.011708259582519531, 0.01242685317993164, 0.01314544677734375, 0.01386404037475586, 0.014582633972167969, 0.015301227569580078, 0.016019821166992188, 0.016738414764404297, 0.017457008361816406, 0.018175601959228516, 0.018894195556640625, 0.019612789154052734, 0.020331382751464844, 0.021049976348876953, 0.021768569946289062, 0.022487163543701172, 0.02320575714111328, 0.02392435073852539, 0.0246429443359375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 9.0, 13.0, 8.0, 25.0, 30.0, 37.0, 45.0, 48.0, 54.0, 63.0, 53.0, 69.0, 81.0, 74.0, 76.0, 58.0, 43.0, 36.0, 40.0, 36.0, 33.0, 14.0, 11.0, 12.0, 5.0, 7.0, 5.0, 8.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01506805419921875, -0.01455986499786377, -0.014051675796508789, -0.013543486595153809, -0.013035297393798828, -0.012527108192443848, -0.012018918991088867, -0.011510729789733887, -0.011002540588378906, -0.010494351387023926, -0.009986162185668945, -0.009477972984313965, -0.008969783782958984, -0.008461594581604004, -0.007953405380249023, -0.007445216178894043, -0.0069370269775390625, -0.006428837776184082, -0.0059206485748291016, -0.005412459373474121, -0.004904270172119141, -0.00439608097076416, -0.0038878917694091797, -0.0033797025680541992, -0.0028715133666992188, -0.0023633241653442383, -0.0018551349639892578, -0.0013469457626342773, -0.0008387565612792969, -0.0003305673599243164, 0.00017762184143066406, 0.0006858110427856445, 0.001194000244140625, 0.0017021894454956055, 0.002210378646850586, 0.0027185678482055664, 0.003226757049560547, 0.0037349462509155273, 0.004243135452270508, 0.004751324653625488, 0.005259513854980469, 0.005767703056335449, 0.00627589225769043, 0.00678408145904541, 0.007292270660400391, 0.007800459861755371, 0.008308649063110352, 0.008816838264465332, 0.009325027465820312, 0.009833216667175293, 0.010341405868530273, 0.010849595069885254, 0.011357784271240234, 0.011865973472595215, 0.012374162673950195, 0.012882351875305176, 0.013390541076660156, 0.013898730278015137, 0.014406919479370117, 0.014915108680725098, 0.015423297882080078, 0.01593148708343506, 0.01643967628479004, 0.01694786548614502, 0.0174560546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 10.0, 22.0, 18.0, 36.0, 53.0, 115.0, 204.0, 399.0, 789.0, 2034.0, 6380.0, 27249.0, 175548.0, 723357.0, 88889.0, 16484.0, 4289.0, 1400.0, 586.0, 288.0, 148.0, 87.0, 55.0, 37.0, 24.0, 11.0, 10.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04412841796875, -0.042571067810058594, -0.04101371765136719, -0.03945636749267578, -0.037899017333984375, -0.03634166717529297, -0.03478431701660156, -0.033226966857910156, -0.03166961669921875, -0.030112266540527344, -0.028554916381835938, -0.02699756622314453, -0.025440216064453125, -0.02388286590576172, -0.022325515747070312, -0.020768165588378906, -0.0192108154296875, -0.017653465270996094, -0.016096115112304688, -0.014538764953613281, -0.012981414794921875, -0.011424064636230469, -0.009866714477539062, -0.008309364318847656, -0.00675201416015625, -0.005194664001464844, -0.0036373138427734375, -0.0020799636840820312, -0.000522613525390625, 0.0010347366333007812, 0.0025920867919921875, 0.004149436950683594, 0.005706787109375, 0.007264137268066406, 0.008821487426757812, 0.010378837585449219, 0.011936187744140625, 0.013493537902832031, 0.015050888061523438, 0.016608238220214844, 0.01816558837890625, 0.019722938537597656, 0.021280288696289062, 0.02283763885498047, 0.024394989013671875, 0.02595233917236328, 0.027509689331054688, 0.029067039489746094, 0.0306243896484375, 0.032181739807128906, 0.03373908996582031, 0.03529644012451172, 0.036853790283203125, 0.03841114044189453, 0.03996849060058594, 0.041525840759277344, 0.04308319091796875, 0.044640541076660156, 0.04619789123535156, 0.04775524139404297, 0.049312591552734375, 0.05086994171142578, 0.05242729187011719, 0.053984642028808594, 0.0555419921875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 6.0, 7.0, 12.0, 16.0, 12.0, 13.0, 15.0, 20.0, 29.0, 31.0, 35.0, 47.0, 43.0, 42.0, 43.0, 54.0, 45.0, 60.0, 56.0, 51.0, 51.0, 51.0, 36.0, 43.0, 27.0, 22.0, 26.0, 19.0, 13.0, 17.0, 13.0, 11.0, 6.0, 11.0, 5.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.044189453125, -0.04262685775756836, -0.04106426239013672, -0.03950166702270508, -0.03793907165527344, -0.0363764762878418, -0.034813880920410156, -0.033251285552978516, -0.031688690185546875, -0.030126094818115234, -0.028563499450683594, -0.027000904083251953, -0.025438308715820312, -0.023875713348388672, -0.02231311798095703, -0.02075052261352539, -0.01918792724609375, -0.01762533187866211, -0.01606273651123047, -0.014500141143798828, -0.012937545776367188, -0.011374950408935547, -0.009812355041503906, -0.008249759674072266, -0.006687164306640625, -0.005124568939208984, -0.0035619735717773438, -0.001999378204345703, -0.0004367828369140625, 0.0011258125305175781, 0.0026884078979492188, 0.004251003265380859, 0.0058135986328125, 0.007376194000244141, 0.008938789367675781, 0.010501384735107422, 0.012063980102539062, 0.013626575469970703, 0.015189170837402344, 0.016751766204833984, 0.018314361572265625, 0.019876956939697266, 0.021439552307128906, 0.023002147674560547, 0.024564743041992188, 0.026127338409423828, 0.02768993377685547, 0.02925252914428711, 0.03081512451171875, 0.03237771987915039, 0.03394031524658203, 0.03550291061401367, 0.03706550598144531, 0.03862810134887695, 0.040190696716308594, 0.041753292083740234, 0.043315887451171875, 0.044878482818603516, 0.046441078186035156, 0.0480036735534668, 0.04956626892089844, 0.05112886428833008, 0.05269145965576172, 0.05425405502319336, 0.055816650390625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 6.0, 16.0, 15.0, 20.0, 47.0, 42.0, 56.0, 97.0, 123.0, 215.0, 333.0, 488.0, 775.0, 1374.0, 2317.0, 4386.0, 8798.0, 23552.0, 168660.0, 766351.0, 44576.0, 12897.0, 5857.0, 3083.0, 1681.0, 1019.0, 640.0, 388.0, 230.0, 149.0, 120.0, 80.0, 36.0, 31.0, 27.0, 13.0, 11.0, 12.0, 6.0, 5.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.031036376953125, -0.030179500579833984, -0.02932262420654297, -0.028465747833251953, -0.027608871459960938, -0.026751995086669922, -0.025895118713378906, -0.02503824234008789, -0.024181365966796875, -0.02332448959350586, -0.022467613220214844, -0.021610736846923828, -0.020753860473632812, -0.019896984100341797, -0.01904010772705078, -0.018183231353759766, -0.01732635498046875, -0.016469478607177734, -0.015612602233886719, -0.014755725860595703, -0.013898849487304688, -0.013041973114013672, -0.012185096740722656, -0.01132822036743164, -0.010471343994140625, -0.00961446762084961, -0.008757591247558594, -0.007900714874267578, -0.0070438385009765625, -0.006186962127685547, -0.005330085754394531, -0.004473209381103516, -0.0036163330078125, -0.0027594566345214844, -0.0019025802612304688, -0.0010457038879394531, -0.0001888275146484375, 0.0006680488586425781, 0.0015249252319335938, 0.0023818016052246094, 0.003238677978515625, 0.004095554351806641, 0.004952430725097656, 0.005809307098388672, 0.0066661834716796875, 0.007523059844970703, 0.008379936218261719, 0.009236812591552734, 0.01009368896484375, 0.010950565338134766, 0.011807441711425781, 0.012664318084716797, 0.013521194458007812, 0.014378070831298828, 0.015234947204589844, 0.01609182357788086, 0.016948699951171875, 0.01780557632446289, 0.018662452697753906, 0.019519329071044922, 0.020376205444335938, 0.021233081817626953, 0.02208995819091797, 0.022946834564208984, 0.0238037109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 6.0, 3.0, 6.0, 11.0, 17.0, 20.0, 46.0, 56.0, 55.0, 89.0, 108.0, 84.0, 126.0, 91.0, 79.0, 47.0, 43.0, 29.0, 23.0, 15.0, 9.0, 7.0, 10.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.557868957519531e-05, -7.35679641366005e-05, -7.155723869800568e-05, -6.954651325941086e-05, -6.753578782081604e-05, -6.552506238222122e-05, -6.35143369436264e-05, -6.150361150503159e-05, -5.949288606643677e-05, -5.748216062784195e-05, -5.547143518924713e-05, -5.346070975065231e-05, -5.1449984312057495e-05, -4.943925887346268e-05, -4.742853343486786e-05, -4.541780799627304e-05, -4.340708255767822e-05, -4.1396357119083405e-05, -3.9385631680488586e-05, -3.737490624189377e-05, -3.536418080329895e-05, -3.335345536470413e-05, -3.1342729926109314e-05, -2.9332004487514496e-05, -2.7321279048919678e-05, -2.531055361032486e-05, -2.329982817173004e-05, -2.1289102733135223e-05, -1.9278377294540405e-05, -1.7267651855945587e-05, -1.5256926417350769e-05, -1.3246200978755951e-05, -1.1235475540161133e-05, -9.224750101566315e-06, -7.214024662971497e-06, -5.2032992243766785e-06, -3.1925737857818604e-06, -1.1818483471870422e-06, 8.288770914077759e-07, 2.839602530002594e-06, 4.850327968597412e-06, 6.86105340719223e-06, 8.871778845787048e-06, 1.0882504284381866e-05, 1.2893229722976685e-05, 1.4903955161571503e-05, 1.691468060016632e-05, 1.892540603876114e-05, 2.0936131477355957e-05, 2.2946856915950775e-05, 2.4957582354545593e-05, 2.696830779314041e-05, 2.897903323173523e-05, 3.098975867033005e-05, 3.3000484108924866e-05, 3.5011209547519684e-05, 3.70219349861145e-05, 3.903266042470932e-05, 4.104338586330414e-05, 4.3054111301898956e-05, 4.5064836740493774e-05, 4.707556217908859e-05, 4.908628761768341e-05, 5.109701305627823e-05, 5.310773849487305e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 10.0, 12.0, 10.0, 30.0, 45.0, 65.0, 95.0, 193.0, 366.0, 827.0, 2082.0, 6565.0, 29529.0, 881879.0, 108380.0, 12440.0, 3531.0, 1283.0, 594.0, 274.0, 127.0, 92.0, 42.0, 33.0, 15.0, 11.0, 8.0, 2.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045806884765625, -0.044316768646240234, -0.04282665252685547, -0.0413365364074707, -0.03984642028808594, -0.03835630416870117, -0.036866188049316406, -0.03537607192993164, -0.033885955810546875, -0.03239583969116211, -0.030905723571777344, -0.029415607452392578, -0.027925491333007812, -0.026435375213623047, -0.02494525909423828, -0.023455142974853516, -0.02196502685546875, -0.020474910736083984, -0.01898479461669922, -0.017494678497314453, -0.016004562377929688, -0.014514446258544922, -0.013024330139160156, -0.01153421401977539, -0.010044097900390625, -0.00855398178100586, -0.007063865661621094, -0.005573749542236328, -0.0040836334228515625, -0.002593517303466797, -0.0011034011840820312, 0.0003867149353027344, 0.0018768310546875, 0.0033669471740722656, 0.004857063293457031, 0.006347179412841797, 0.007837295532226562, 0.009327411651611328, 0.010817527770996094, 0.01230764389038086, 0.013797760009765625, 0.01528787612915039, 0.016777992248535156, 0.018268108367919922, 0.019758224487304688, 0.021248340606689453, 0.02273845672607422, 0.024228572845458984, 0.02571868896484375, 0.027208805084228516, 0.02869892120361328, 0.030189037322998047, 0.03167915344238281, 0.03316926956176758, 0.034659385681152344, 0.03614950180053711, 0.037639617919921875, 0.03912973403930664, 0.040619850158691406, 0.04210996627807617, 0.04360008239746094, 0.0450901985168457, 0.04658031463623047, 0.048070430755615234, 0.049560546875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 6.0, 4.0, 11.0, 10.0, 29.0, 72.0, 127.0, 224.0, 191.0, 139.0, 61.0, 23.0, 26.0, 9.0, 8.0, 8.0, 4.0, 5.0, 5.0, 4.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0262451171875, -0.025341033935546875, -0.02443695068359375, -0.023532867431640625, -0.0226287841796875, -0.021724700927734375, -0.02082061767578125, -0.019916534423828125, -0.019012451171875, -0.018108367919921875, -0.01720428466796875, -0.016300201416015625, -0.0153961181640625, -0.014492034912109375, -0.01358795166015625, -0.012683868408203125, -0.01177978515625, -0.010875701904296875, -0.00997161865234375, -0.009067535400390625, -0.0081634521484375, -0.007259368896484375, -0.00635528564453125, -0.005451202392578125, -0.004547119140625, -0.003643035888671875, -0.00273895263671875, -0.001834869384765625, -0.0009307861328125, -2.6702880859375e-05, 0.00087738037109375, 0.001781463623046875, 0.002685546875, 0.003589630126953125, 0.00449371337890625, 0.005397796630859375, 0.0063018798828125, 0.007205963134765625, 0.00811004638671875, 0.009014129638671875, 0.009918212890625, 0.010822296142578125, 0.01172637939453125, 0.012630462646484375, 0.0135345458984375, 0.014438629150390625, 0.01534271240234375, 0.016246795654296875, 0.01715087890625, 0.018054962158203125, 0.01895904541015625, 0.019863128662109375, 0.0207672119140625, 0.021671295166015625, 0.02257537841796875, 0.023479461669921875, 0.024383544921875, 0.025287628173828125, 0.02619171142578125, 0.027095794677734375, 0.0279998779296875, 0.028903961181640625, 0.02980804443359375, 0.030712127685546875, 0.0316162109375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 5.0, 17.0, 23.0, 40.0, 59.0, 98.0, 136.0, 255.0, 151.0, 69.0, 62.0, 30.0, 15.0, 4.0, 9.0, 3.0, 1.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39762502908706665, -0.38466352224349976, -0.37170201539993286, -0.35874050855636597, -0.3457790017127991, -0.3328174948692322, -0.31985601782798767, -0.3068945109844208, -0.2939330041408539, -0.280971497297287, -0.2680099904537201, -0.2550484836101532, -0.2420869916677475, -0.2291254848241806, -0.2161639928817749, -0.203202486038208, -0.1902409791946411, -0.17727947235107422, -0.16431796550750732, -0.15135647356510162, -0.13839496672153473, -0.12543345987796783, -0.11247196048498154, -0.09951046109199524, -0.08654895424842834, -0.07358744740486145, -0.06062594801187515, -0.047664444893598557, -0.03470294177532196, -0.021741434931755066, -0.008779935538768768, 0.004181563854217529, 0.017143070697784424, 0.03010457381606102, 0.043066076934337616, 0.05602758005261421, 0.06898908317089081, 0.0819505900144577, 0.094912089407444, 0.1078735888004303, 0.12083509564399719, 0.1337966024875641, 0.14675810933113098, 0.15971960127353668, 0.17268110811710358, 0.18564261496067047, 0.19860410690307617, 0.21156561374664307, 0.22452712059020996, 0.23748862743377686, 0.25045013427734375, 0.26341164112091064, 0.27637314796447754, 0.28933465480804443, 0.30229613184928894, 0.31525763869285583, 0.32821914553642273, 0.3411806523799896, 0.3541421592235565, 0.3671036660671234, 0.3800651431083679, 0.3930266499519348, 0.4059881567955017, 0.4189496636390686, 0.4319111704826355]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 9.0, 1.0, 10.0, 14.0, 15.0, 22.0, 17.0, 25.0, 19.0, 32.0, 11.0, 24.0, 32.0, 37.0, 38.0, 39.0, 68.0, 76.0, 62.0, 61.0, 50.0, 45.0, 31.0, 35.0, 27.0, 21.0, 15.0, 27.0, 12.0, 19.0, 28.0, 12.0, 10.0, 10.0, 8.0, 9.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19505393505096436, -0.18864333629608154, -0.18223273754119873, -0.1758221536874771, -0.1694115549325943, -0.1630009561777115, -0.15659037232398987, -0.15017977356910706, -0.14376917481422424, -0.13735857605934143, -0.13094797730445862, -0.124537393450737, -0.11812679469585419, -0.11171619594097137, -0.10530560463666916, -0.09889501333236694, -0.09248441457748413, -0.08607381582260132, -0.0796632245182991, -0.07325263321399689, -0.06684203445911407, -0.06043143942952156, -0.05402084439992905, -0.04761024937033653, -0.04119965434074402, -0.034789059311151505, -0.02837846428155899, -0.021967869251966476, -0.015557274222373962, -0.009146679192781448, -0.0027360841631889343, 0.0036745108664035797, 0.010085105895996094, 0.016495700925588608, 0.022906295955181122, 0.029316890984773636, 0.03572748601436615, 0.042138081043958664, 0.04854867607355118, 0.05495927110314369, 0.061369866132736206, 0.06778046488761902, 0.07419105619192123, 0.08060164749622345, 0.08701224625110626, 0.09342284500598907, 0.09983343631029129, 0.1062440276145935, 0.11265462636947632, 0.11906522512435913, 0.12547582387924194, 0.13188640773296356, 0.13829700648784637, 0.1447076052427292, 0.1511181890964508, 0.15752878785133362, 0.16393938660621643, 0.17034998536109924, 0.17676058411598206, 0.18317116796970367, 0.1895817667245865, 0.1959923654794693, 0.20240294933319092, 0.20881354808807373, 0.21522414684295654]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 9.0, 8.0, 13.0, 16.0, 27.0, 36.0, 50.0, 77.0, 119.0, 169.0, 297.0, 477.0, 946.0, 2077.0, 4773.0, 13224.0, 55148.0, 806576.0, 3113775.0, 158819.0, 23790.0, 7572.0, 3038.0, 1420.0, 729.0, 401.0, 234.0, 149.0, 94.0, 79.0, 45.0, 25.0, 18.0, 17.0, 12.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.03082275390625, -0.029995203018188477, -0.029167652130126953, -0.02834010124206543, -0.027512550354003906, -0.026684999465942383, -0.02585744857788086, -0.025029897689819336, -0.024202346801757812, -0.02337479591369629, -0.022547245025634766, -0.021719694137573242, -0.02089214324951172, -0.020064592361450195, -0.019237041473388672, -0.01840949058532715, -0.017581939697265625, -0.0167543888092041, -0.015926837921142578, -0.015099287033081055, -0.014271736145019531, -0.013444185256958008, -0.012616634368896484, -0.011789083480834961, -0.010961532592773438, -0.010133981704711914, -0.00930643081665039, -0.008478879928588867, -0.007651329040527344, -0.00682377815246582, -0.005996227264404297, -0.0051686763763427734, -0.00434112548828125, -0.0035135746002197266, -0.002686023712158203, -0.0018584728240966797, -0.0010309219360351562, -0.0002033710479736328, 0.0006241798400878906, 0.001451730728149414, 0.0022792816162109375, 0.003106832504272461, 0.003934383392333984, 0.004761934280395508, 0.005589485168457031, 0.006417036056518555, 0.007244586944580078, 0.008072137832641602, 0.008899688720703125, 0.009727239608764648, 0.010554790496826172, 0.011382341384887695, 0.012209892272949219, 0.013037443161010742, 0.013864994049072266, 0.014692544937133789, 0.015520095825195312, 0.016347646713256836, 0.01717519760131836, 0.018002748489379883, 0.018830299377441406, 0.01965785026550293, 0.020485401153564453, 0.021312952041625977, 0.0221405029296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 9.0, 13.0, 13.0, 20.0, 24.0, 25.0, 42.0, 39.0, 43.0, 54.0, 53.0, 63.0, 70.0, 51.0, 57.0, 69.0, 75.0, 58.0, 52.0, 39.0, 27.0, 24.0, 15.0, 13.0, 13.0, 9.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0147552490234375, -0.014284849166870117, -0.013814449310302734, -0.013344049453735352, -0.012873649597167969, -0.012403249740600586, -0.011932849884033203, -0.01146245002746582, -0.010992050170898438, -0.010521650314331055, -0.010051250457763672, -0.009580850601196289, -0.009110450744628906, -0.008640050888061523, -0.00816965103149414, -0.007699251174926758, -0.007228851318359375, -0.006758451461791992, -0.006288051605224609, -0.0058176517486572266, -0.005347251892089844, -0.004876852035522461, -0.004406452178955078, -0.003936052322387695, -0.0034656524658203125, -0.0029952526092529297, -0.002524852752685547, -0.002054452896118164, -0.0015840530395507812, -0.0011136531829833984, -0.0006432533264160156, -0.0001728534698486328, 0.00029754638671875, 0.0007679462432861328, 0.0012383460998535156, 0.0017087459564208984, 0.0021791458129882812, 0.002649545669555664, 0.003119945526123047, 0.0035903453826904297, 0.0040607452392578125, 0.004531145095825195, 0.005001544952392578, 0.005471944808959961, 0.005942344665527344, 0.0064127445220947266, 0.006883144378662109, 0.007353544235229492, 0.007823944091796875, 0.008294343948364258, 0.00876474380493164, 0.009235143661499023, 0.009705543518066406, 0.010175943374633789, 0.010646343231201172, 0.011116743087768555, 0.011587142944335938, 0.01205754280090332, 0.012527942657470703, 0.012998342514038086, 0.013468742370605469, 0.013939142227172852, 0.014409542083740234, 0.014879941940307617, 0.015350341796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 7.0, 10.0, 13.0, 22.0, 12.0, 21.0, 36.0, 45.0, 57.0, 92.0, 146.0, 282.0, 714.0, 4648.0, 417992.0, 3759640.0, 8650.0, 978.0, 395.0, 188.0, 102.0, 63.0, 38.0, 33.0, 16.0, 22.0, 15.0, 8.0, 11.0, 5.0, 6.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.095458984375, -0.09193801879882812, -0.08841705322265625, -0.08489608764648438, -0.0813751220703125, -0.07785415649414062, -0.07433319091796875, -0.07081222534179688, -0.067291259765625, -0.06377029418945312, -0.06024932861328125, -0.056728363037109375, -0.0532073974609375, -0.049686431884765625, -0.04616546630859375, -0.042644500732421875, -0.03912353515625, -0.035602569580078125, -0.03208160400390625, -0.028560638427734375, -0.0250396728515625, -0.021518707275390625, -0.01799774169921875, -0.014476776123046875, -0.010955810546875, -0.007434844970703125, -0.00391387939453125, -0.000392913818359375, 0.0031280517578125, 0.006649017333984375, 0.01016998291015625, 0.013690948486328125, 0.0172119140625, 0.020732879638671875, 0.02425384521484375, 0.027774810791015625, 0.0312957763671875, 0.034816741943359375, 0.03833770751953125, 0.041858673095703125, 0.045379638671875, 0.048900604248046875, 0.05242156982421875, 0.055942535400390625, 0.0594635009765625, 0.06298446655273438, 0.06650543212890625, 0.07002639770507812, 0.07354736328125, 0.07706832885742188, 0.08058929443359375, 0.08411026000976562, 0.0876312255859375, 0.09115219116210938, 0.09467315673828125, 0.09819412231445312, 0.101715087890625, 0.10523605346679688, 0.10875701904296875, 0.11227798461914062, 0.1157989501953125, 0.11931991577148438, 0.12284088134765625, 0.12636184692382812, 0.1298828125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 12.0, 16.0, 27.0, 32.0, 51.0, 74.0, 138.0, 342.0, 953.0, 1362.0, 598.0, 192.0, 93.0, 65.0, 45.0, 21.0, 13.0, 10.0, 3.0, 9.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036834716796875, -0.03548479080200195, -0.034134864807128906, -0.03278493881225586, -0.03143501281738281, -0.030085086822509766, -0.02873516082763672, -0.027385234832763672, -0.026035308837890625, -0.024685382843017578, -0.02333545684814453, -0.021985530853271484, -0.020635604858398438, -0.01928567886352539, -0.017935752868652344, -0.016585826873779297, -0.01523590087890625, -0.013885974884033203, -0.012536048889160156, -0.01118612289428711, -0.009836196899414062, -0.008486270904541016, -0.007136344909667969, -0.005786418914794922, -0.004436492919921875, -0.003086566925048828, -0.0017366409301757812, -0.0003867149353027344, 0.0009632110595703125, 0.0023131370544433594, 0.0036630630493164062, 0.005012989044189453, 0.0063629150390625, 0.007712841033935547, 0.009062767028808594, 0.01041269302368164, 0.011762619018554688, 0.013112545013427734, 0.014462471008300781, 0.015812397003173828, 0.017162322998046875, 0.018512248992919922, 0.01986217498779297, 0.021212100982666016, 0.022562026977539062, 0.02391195297241211, 0.025261878967285156, 0.026611804962158203, 0.02796173095703125, 0.029311656951904297, 0.030661582946777344, 0.03201150894165039, 0.03336143493652344, 0.034711360931396484, 0.03606128692626953, 0.03741121292114258, 0.038761138916015625, 0.04011106491088867, 0.04146099090576172, 0.042810916900634766, 0.04416084289550781, 0.04551076889038086, 0.046860694885253906, 0.04821062088012695, 0.049560546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 5.0, 8.0, 19.0, 36.0, 76.0, 195.0, 326.0, 212.0, 71.0, 29.0, 12.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5154139995574951, -0.49460044503211975, -0.4737868905067444, -0.452973335981369, -0.43215978145599365, -0.4113462567329407, -0.3905327022075653, -0.36971914768218994, -0.3489055931568146, -0.3280920386314392, -0.30727848410606384, -0.2864649295806885, -0.2656514048576355, -0.24483783543109894, -0.22402429580688477, -0.2032107412815094, -0.18239718675613403, -0.16158363223075867, -0.1407700777053833, -0.11995653808116913, -0.09914298355579376, -0.0783294290304184, -0.05751588195562363, -0.03670233488082886, -0.01588878035545349, 0.0049247704446315765, 0.025738321244716644, 0.04655187204480171, 0.06736542284488678, 0.08817897737026215, 0.10899252444505692, 0.12980607151985168, 0.15061962604522705, 0.17143318057060242, 0.19224673509597778, 0.21306027472019196, 0.23387382924556732, 0.2546873688697815, 0.27550092339515686, 0.2963144779205322, 0.3171280324459076, 0.33794158697128296, 0.3587551414966583, 0.3795686960220337, 0.40038222074508667, 0.4211958050727844, 0.4420093297958374, 0.46282288432121277, 0.48363643884658813, 0.5044499635696411, 0.5252635478973389, 0.5460770726203918, 0.5668906569480896, 0.5877041816711426, 0.6085177659988403, 0.6293312907218933, 0.6501448154449463, 0.6709583401679993, 0.691771924495697, 0.71258544921875, 0.7333990335464478, 0.7542125582695007, 0.7750261425971985, 0.7958396673202515, 0.8166532516479492]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 11.0, 6.0, 12.0, 16.0, 15.0, 28.0, 27.0, 41.0, 29.0, 58.0, 49.0, 68.0, 53.0, 74.0, 72.0, 66.0, 73.0, 63.0, 33.0, 39.0, 45.0, 34.0, 18.0, 16.0, 18.0, 15.0, 8.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18904048204421997, -0.1836414635181427, -0.17824243009090424, -0.17284341156482697, -0.1674443781375885, -0.16204535961151123, -0.15664634108543396, -0.1512473225593567, -0.14584828913211823, -0.14044927060604095, -0.1350502371788025, -0.12965121865272522, -0.12425219267606735, -0.11885316669940948, -0.11345414817333221, -0.10805512219667435, -0.10265609622001648, -0.09725707024335861, -0.09185804426670074, -0.08645902574062347, -0.0810599997639656, -0.07566097378730774, -0.07026195526123047, -0.0648629292845726, -0.059463903307914734, -0.054064877331256866, -0.0486658550798893, -0.04326683282852173, -0.03786780685186386, -0.032468780875205994, -0.027069758623838425, -0.021670736372470856, -0.01627171039581299, -0.01087268628180027, -0.005473662167787552, -7.463805377483368e-05, 0.0053243860602378845, 0.010723410174250603, 0.01612243428826332, 0.02152145653963089, 0.026920482516288757, 0.032319508492946625, 0.037718530744314194, 0.04311755299568176, 0.04851657897233963, 0.0539156049489975, 0.059314627200365067, 0.06471364945173264, 0.0701126754283905, 0.07551170140504837, 0.08091072738170624, 0.08630974590778351, 0.09170877188444138, 0.09710779786109924, 0.10250681638717651, 0.10790584236383438, 0.11330486834049225, 0.11870389431715012, 0.12410292029380798, 0.12950193881988525, 0.13490095734596252, 0.140299990773201, 0.14569900929927826, 0.15109804272651672, 0.156497061252594]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 15.0, 12.0, 16.0, 23.0, 36.0, 47.0, 84.0, 95.0, 182.0, 228.0, 354.0, 603.0, 878.0, 1329.0, 2336.0, 3816.0, 6800.0, 12473.0, 24208.0, 50953.0, 112633.0, 253025.0, 301524.0, 146214.0, 64654.0, 30488.0, 15563.0, 8266.0, 4578.0, 2644.0, 1645.0, 973.0, 613.0, 386.0, 294.0, 182.0, 115.0, 68.0, 63.0, 42.0, 27.0, 17.0, 14.0, 15.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0218353271484375, -0.02121424674987793, -0.02059316635131836, -0.01997208595275879, -0.01935100555419922, -0.01872992515563965, -0.018108844757080078, -0.017487764358520508, -0.016866683959960938, -0.016245603561401367, -0.015624523162841797, -0.015003442764282227, -0.014382362365722656, -0.013761281967163086, -0.013140201568603516, -0.012519121170043945, -0.011898040771484375, -0.011276960372924805, -0.010655879974365234, -0.010034799575805664, -0.009413719177246094, -0.008792638778686523, -0.008171558380126953, -0.007550477981567383, -0.0069293975830078125, -0.006308317184448242, -0.005687236785888672, -0.0050661563873291016, -0.004445075988769531, -0.003823995590209961, -0.0032029151916503906, -0.0025818347930908203, -0.00196075439453125, -0.0013396739959716797, -0.0007185935974121094, -9.751319885253906e-05, 0.0005235671997070312, 0.0011446475982666016, 0.0017657279968261719, 0.002386808395385742, 0.0030078887939453125, 0.003628969192504883, 0.004250049591064453, 0.0048711299896240234, 0.005492210388183594, 0.006113290786743164, 0.006734371185302734, 0.007355451583862305, 0.007976531982421875, 0.008597612380981445, 0.009218692779541016, 0.009839773178100586, 0.010460853576660156, 0.011081933975219727, 0.011703014373779297, 0.012324094772338867, 0.012945175170898438, 0.013566255569458008, 0.014187335968017578, 0.014808416366577148, 0.015429496765136719, 0.01605057716369629, 0.01667165756225586, 0.01729273796081543, 0.017913818359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 11.0, 17.0, 20.0, 26.0, 24.0, 38.0, 43.0, 38.0, 48.0, 67.0, 59.0, 60.0, 75.0, 73.0, 55.0, 58.0, 45.0, 40.0, 50.0, 30.0, 22.0, 23.0, 19.0, 11.0, 14.0, 5.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0147705078125, -0.014300346374511719, -0.013830184936523438, -0.013360023498535156, -0.012889862060546875, -0.012419700622558594, -0.011949539184570312, -0.011479377746582031, -0.01100921630859375, -0.010539054870605469, -0.010068893432617188, -0.009598731994628906, -0.009128570556640625, -0.008658409118652344, -0.008188247680664062, -0.007718086242675781, -0.0072479248046875, -0.006777763366699219, -0.0063076019287109375, -0.005837440490722656, -0.005367279052734375, -0.004897117614746094, -0.0044269561767578125, -0.003956794738769531, -0.00348663330078125, -0.0030164718627929688, -0.0025463104248046875, -0.0020761489868164062, -0.001605987548828125, -0.0011358261108398438, -0.0006656646728515625, -0.00019550323486328125, 0.000274658203125, 0.0007448196411132812, 0.0012149810791015625, 0.0016851425170898438, 0.002155303955078125, 0.0026254653930664062, 0.0030956268310546875, 0.0035657882690429688, 0.00403594970703125, 0.004506111145019531, 0.0049762725830078125, 0.005446434020996094, 0.005916595458984375, 0.006386756896972656, 0.0068569183349609375, 0.007327079772949219, 0.0077972412109375, 0.008267402648925781, 0.008737564086914062, 0.009207725524902344, 0.009677886962890625, 0.010148048400878906, 0.010618209838867188, 0.011088371276855469, 0.01155853271484375, 0.012028694152832031, 0.012498855590820312, 0.012969017028808594, 0.013439178466796875, 0.013909339904785156, 0.014379501342773438, 0.014849662780761719, 0.01531982421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 7.0, 18.0, 22.0, 25.0, 37.0, 66.0, 100.0, 159.0, 266.0, 560.0, 1159.0, 2679.0, 6483.0, 17832.0, 58122.0, 233257.0, 570757.0, 108865.0, 30417.0, 10286.0, 3963.0, 1769.0, 754.0, 374.0, 192.0, 124.0, 85.0, 50.0, 40.0, 20.0, 16.0, 12.0, 11.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0325927734375, -0.031477928161621094, -0.030363082885742188, -0.02924823760986328, -0.028133392333984375, -0.02701854705810547, -0.025903701782226562, -0.024788856506347656, -0.02367401123046875, -0.022559165954589844, -0.021444320678710938, -0.02032947540283203, -0.019214630126953125, -0.01809978485107422, -0.016984939575195312, -0.015870094299316406, -0.0147552490234375, -0.013640403747558594, -0.012525558471679688, -0.011410713195800781, -0.010295867919921875, -0.009181022644042969, -0.008066177368164062, -0.006951332092285156, -0.00583648681640625, -0.004721641540527344, -0.0036067962646484375, -0.0024919509887695312, -0.001377105712890625, -0.00026226043701171875, 0.0008525848388671875, 0.0019674301147460938, 0.003082275390625, 0.004197120666503906, 0.0053119659423828125, 0.006426811218261719, 0.007541656494140625, 0.008656501770019531, 0.009771347045898438, 0.010886192321777344, 0.01200103759765625, 0.013115882873535156, 0.014230728149414062, 0.015345573425292969, 0.016460418701171875, 0.01757526397705078, 0.018690109252929688, 0.019804954528808594, 0.0209197998046875, 0.022034645080566406, 0.023149490356445312, 0.02426433563232422, 0.025379180908203125, 0.02649402618408203, 0.027608871459960938, 0.028723716735839844, 0.02983856201171875, 0.030953407287597656, 0.03206825256347656, 0.03318309783935547, 0.034297943115234375, 0.03541278839111328, 0.03652763366699219, 0.037642478942871094, 0.03875732421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 6.0, 10.0, 10.0, 14.0, 14.0, 7.0, 21.0, 32.0, 34.0, 39.0, 26.0, 26.0, 43.0, 44.0, 50.0, 36.0, 42.0, 50.0, 45.0, 48.0, 34.0, 40.0, 28.0, 50.0, 33.0, 27.0, 16.0, 22.0, 17.0, 18.0, 20.0, 9.0, 5.0, 11.0, 8.0, 6.0, 6.0, 5.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.031768798828125, -0.03062152862548828, -0.029474258422851562, -0.028326988220214844, -0.027179718017578125, -0.026032447814941406, -0.024885177612304688, -0.02373790740966797, -0.02259063720703125, -0.02144336700439453, -0.020296096801757812, -0.019148826599121094, -0.018001556396484375, -0.016854286193847656, -0.015707015991210938, -0.014559745788574219, -0.0134124755859375, -0.012265205383300781, -0.011117935180664062, -0.009970664978027344, -0.008823394775390625, -0.007676124572753906, -0.0065288543701171875, -0.005381584167480469, -0.00423431396484375, -0.0030870437622070312, -0.0019397735595703125, -0.0007925033569335938, 0.000354766845703125, 0.0015020370483398438, 0.0026493072509765625, 0.0037965774536132812, 0.00494384765625, 0.006091117858886719, 0.0072383880615234375, 0.008385658264160156, 0.009532928466796875, 0.010680198669433594, 0.011827468872070312, 0.012974739074707031, 0.01412200927734375, 0.015269279479980469, 0.016416549682617188, 0.017563819885253906, 0.018711090087890625, 0.019858360290527344, 0.021005630493164062, 0.02215290069580078, 0.0233001708984375, 0.02444744110107422, 0.025594711303710938, 0.026741981506347656, 0.027889251708984375, 0.029036521911621094, 0.030183792114257812, 0.03133106231689453, 0.03247833251953125, 0.03362560272216797, 0.03477287292480469, 0.035920143127441406, 0.037067413330078125, 0.038214683532714844, 0.03936195373535156, 0.04050922393798828, 0.041656494140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 9.0, 16.0, 16.0, 23.0, 42.0, 40.0, 62.0, 125.0, 167.0, 284.0, 409.0, 686.0, 1179.0, 1929.0, 3573.0, 7090.0, 15757.0, 47097.0, 297274.0, 580932.0, 56876.0, 18059.0, 7721.0, 3868.0, 2045.0, 1252.0, 701.0, 461.0, 279.0, 175.0, 107.0, 78.0, 59.0, 44.0, 41.0, 21.0, 16.0, 11.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.023956298828125, -0.023209333419799805, -0.02246236801147461, -0.021715402603149414, -0.02096843719482422, -0.020221471786499023, -0.019474506378173828, -0.018727540969848633, -0.017980575561523438, -0.017233610153198242, -0.016486644744873047, -0.01573967933654785, -0.014992713928222656, -0.014245748519897461, -0.013498783111572266, -0.01275181770324707, -0.012004852294921875, -0.01125788688659668, -0.010510921478271484, -0.009763956069946289, -0.009016990661621094, -0.008270025253295898, -0.007523059844970703, -0.006776094436645508, -0.0060291290283203125, -0.005282163619995117, -0.004535198211669922, -0.0037882328033447266, -0.0030412673950195312, -0.002294301986694336, -0.0015473365783691406, -0.0008003711700439453, -5.340576171875e-05, 0.0006935596466064453, 0.0014405250549316406, 0.002187490463256836, 0.0029344558715820312, 0.0036814212799072266, 0.004428386688232422, 0.005175352096557617, 0.0059223175048828125, 0.006669282913208008, 0.007416248321533203, 0.008163213729858398, 0.008910179138183594, 0.009657144546508789, 0.010404109954833984, 0.01115107536315918, 0.011898040771484375, 0.01264500617980957, 0.013391971588134766, 0.014138936996459961, 0.014885902404785156, 0.01563286781311035, 0.016379833221435547, 0.017126798629760742, 0.017873764038085938, 0.018620729446411133, 0.019367694854736328, 0.020114660263061523, 0.02086162567138672, 0.021608591079711914, 0.02235555648803711, 0.023102521896362305, 0.0238494873046875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 4.0, 7.0, 6.0, 17.0, 19.0, 23.0, 25.0, 31.0, 56.0, 63.0, 102.0, 103.0, 95.0, 123.0, 88.0, 56.0, 46.0, 38.0, 23.0, 27.0, 12.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.02467155456543e-05, -4.828162491321564e-05, -4.631653428077698e-05, -4.435144364833832e-05, -4.238635301589966e-05, -4.0421262383461e-05, -3.845617175102234e-05, -3.649108111858368e-05, -3.452599048614502e-05, -3.256089985370636e-05, -3.05958092212677e-05, -2.863071858882904e-05, -2.666562795639038e-05, -2.470053732395172e-05, -2.273544669151306e-05, -2.0770356059074402e-05, -1.8805265426635742e-05, -1.6840174794197083e-05, -1.4875084161758423e-05, -1.2909993529319763e-05, -1.0944902896881104e-05, -8.979812264442444e-06, -7.014721632003784e-06, -5.0496309995651245e-06, -3.084540367126465e-06, -1.1194497346878052e-06, 8.456408977508545e-07, 2.810731530189514e-06, 4.775822162628174e-06, 6.7409127950668335e-06, 8.706003427505493e-06, 1.0671094059944153e-05, 1.2636184692382812e-05, 1.4601275324821472e-05, 1.6566365957260132e-05, 1.853145658969879e-05, 2.049654722213745e-05, 2.246163785457611e-05, 2.442672848701477e-05, 2.639181911945343e-05, 2.835690975189209e-05, 3.032200038433075e-05, 3.228709101676941e-05, 3.425218164920807e-05, 3.621727228164673e-05, 3.818236291408539e-05, 4.014745354652405e-05, 4.211254417896271e-05, 4.407763481140137e-05, 4.604272544384003e-05, 4.8007816076278687e-05, 4.9972906708717346e-05, 5.1937997341156006e-05, 5.3903087973594666e-05, 5.5868178606033325e-05, 5.7833269238471985e-05, 5.9798359870910645e-05, 6.17634505033493e-05, 6.372854113578796e-05, 6.569363176822662e-05, 6.765872240066528e-05, 6.962381303310394e-05, 7.15889036655426e-05, 7.355399429798126e-05, 7.551908493041992e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 13.0, 12.0, 34.0, 45.0, 68.0, 120.0, 245.0, 436.0, 879.0, 2005.0, 4875.0, 14064.0, 59714.0, 741106.0, 183963.0, 27111.0, 8135.0, 3023.0, 1332.0, 637.0, 307.0, 199.0, 91.0, 53.0, 28.0, 19.0, 16.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0254974365234375, -0.02450728416442871, -0.023517131805419922, -0.022526979446411133, -0.021536827087402344, -0.020546674728393555, -0.019556522369384766, -0.018566370010375977, -0.017576217651367188, -0.0165860652923584, -0.01559591293334961, -0.01460576057434082, -0.013615608215332031, -0.012625455856323242, -0.011635303497314453, -0.010645151138305664, -0.009654998779296875, -0.008664846420288086, -0.007674694061279297, -0.006684541702270508, -0.005694389343261719, -0.00470423698425293, -0.0037140846252441406, -0.0027239322662353516, -0.0017337799072265625, -0.0007436275482177734, 0.0002465248107910156, 0.0012366771697998047, 0.0022268295288085938, 0.003216981887817383, 0.004207134246826172, 0.005197286605834961, 0.00618743896484375, 0.007177591323852539, 0.008167743682861328, 0.009157896041870117, 0.010148048400878906, 0.011138200759887695, 0.012128353118896484, 0.013118505477905273, 0.014108657836914062, 0.015098810195922852, 0.01608896255493164, 0.01707911491394043, 0.01806926727294922, 0.019059419631958008, 0.020049571990966797, 0.021039724349975586, 0.022029876708984375, 0.023020029067993164, 0.024010181427001953, 0.025000333786010742, 0.02599048614501953, 0.02698063850402832, 0.02797079086303711, 0.0289609432220459, 0.029951095581054688, 0.030941247940063477, 0.031931400299072266, 0.032921552658081055, 0.033911705017089844, 0.03490185737609863, 0.03589200973510742, 0.03688216209411621, 0.037872314453125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 5.0, 7.0, 15.0, 22.0, 35.0, 50.0, 101.0, 154.0, 195.0, 156.0, 95.0, 47.0, 31.0, 24.0, 14.0, 6.0, 9.0, 7.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033599853515625, -0.03270125389099121, -0.03180265426635742, -0.030904054641723633, -0.030005455017089844, -0.029106855392456055, -0.028208255767822266, -0.027309656143188477, -0.026411056518554688, -0.0255124568939209, -0.02461385726928711, -0.02371525764465332, -0.02281665802001953, -0.021918058395385742, -0.021019458770751953, -0.020120859146118164, -0.019222259521484375, -0.018323659896850586, -0.017425060272216797, -0.016526460647583008, -0.01562786102294922, -0.01472926139831543, -0.01383066177368164, -0.012932062149047852, -0.012033462524414062, -0.011134862899780273, -0.010236263275146484, -0.009337663650512695, -0.008439064025878906, -0.007540464401245117, -0.006641864776611328, -0.005743265151977539, -0.00484466552734375, -0.003946065902709961, -0.003047466278076172, -0.002148866653442383, -0.0012502670288085938, -0.0003516674041748047, 0.0005469322204589844, 0.0014455318450927734, 0.0023441314697265625, 0.0032427310943603516, 0.004141330718994141, 0.00503993034362793, 0.005938529968261719, 0.006837129592895508, 0.007735729217529297, 0.008634328842163086, 0.009532928466796875, 0.010431528091430664, 0.011330127716064453, 0.012228727340698242, 0.013127326965332031, 0.01402592658996582, 0.01492452621459961, 0.0158231258392334, 0.016721725463867188, 0.017620325088500977, 0.018518924713134766, 0.019417524337768555, 0.020316123962402344, 0.021214723587036133, 0.022113323211669922, 0.02301192283630371, 0.0239105224609375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 6.0, 13.0, 26.0, 73.0, 153.0, 409.0, 204.0, 68.0, 24.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8900133371353149, -0.8636792898178101, -0.8373452425003052, -0.8110111951828003, -0.7846771478652954, -0.7583431005477905, -0.7320090532302856, -0.7056750059127808, -0.6793409585952759, -0.653006911277771, -0.6266728639602661, -0.6003388166427612, -0.5740047693252563, -0.5476707220077515, -0.5213366746902466, -0.4950026273727417, -0.4686685800552368, -0.44233453273773193, -0.41600048542022705, -0.38966643810272217, -0.3633323907852173, -0.3369983434677124, -0.3106642961502075, -0.28433024883270264, -0.25799620151519775, -0.23166215419769287, -0.205328106880188, -0.1789940595626831, -0.15266001224517822, -0.12632596492767334, -0.09999191761016846, -0.07365787029266357, -0.04732388257980347, -0.020989835262298584, 0.005344212055206299, 0.03167825937271118, 0.058012306690216064, 0.08434635400772095, 0.11068040132522583, 0.1370144486427307, 0.1633484959602356, 0.18968254327774048, 0.21601659059524536, 0.24235063791275024, 0.2686846852302551, 0.29501873254776, 0.3213527798652649, 0.3476868271827698, 0.37402087450027466, 0.40035492181777954, 0.4266889691352844, 0.4530230164527893, 0.4793570637702942, 0.5056911110877991, 0.532025158405304, 0.5583592057228088, 0.5846932530403137, 0.6110273003578186, 0.6373613476753235, 0.6636953949928284, 0.6900294423103333, 0.7163634896278381, 0.742697536945343, 0.7690315842628479, 0.7953656315803528]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 9.0, 6.0, 8.0, 10.0, 10.0, 18.0, 13.0, 18.0, 29.0, 22.0, 33.0, 30.0, 31.0, 29.0, 52.0, 47.0, 64.0, 102.0, 71.0, 36.0, 39.0, 42.0, 34.0, 28.0, 25.0, 30.0, 23.0, 18.0, 22.0, 18.0, 20.0, 10.0, 6.0, 11.0, 4.0, 7.0, 4.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.19877541065216064, -0.19333045184612274, -0.18788549304008484, -0.18244054913520813, -0.17699559032917023, -0.17155063152313232, -0.16610568761825562, -0.1606607288122177, -0.1552157700061798, -0.1497708112001419, -0.144325852394104, -0.1388809084892273, -0.1334359496831894, -0.1279909908771515, -0.12254603952169418, -0.11710108816623688, -0.11165612936019897, -0.10621117055416107, -0.10076621919870377, -0.09532126784324646, -0.08987630903720856, -0.08443135023117065, -0.07898639887571335, -0.07354144752025604, -0.06809648871421814, -0.06265152990818024, -0.05720657855272293, -0.05176162347197533, -0.04631666839122772, -0.04087171331048012, -0.03542675822973251, -0.02998180314898491, -0.024536848068237305, -0.0190918929874897, -0.013646937906742096, -0.008201982825994492, -0.002757027745246887, 0.002687927335500717, 0.008132882416248322, 0.013577837496995926, 0.01902279257774353, 0.024467747658491135, 0.02991270273923874, 0.03535765781998634, 0.04080261290073395, 0.04624756798148155, 0.051692523062229156, 0.05713747814297676, 0.06258243322372437, 0.06802739202976227, 0.07347234338521957, 0.07891729474067688, 0.08436225354671478, 0.08980721235275269, 0.09525216370820999, 0.1006971150636673, 0.1061420738697052, 0.1115870326757431, 0.11703198403120041, 0.12247693538665771, 0.12792189419269562, 0.13336685299873352, 0.13881179690361023, 0.14425675570964813, 0.14970171451568604]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 12.0, 12.0, 19.0, 31.0, 44.0, 61.0, 107.0, 167.0, 248.0, 478.0, 764.0, 1379.0, 2557.0, 5726.0, 15952.0, 95472.0, 2379714.0, 1594299.0, 72640.0, 13828.0, 5181.0, 2437.0, 1237.0, 715.0, 420.0, 261.0, 185.0, 115.0, 58.0, 49.0, 30.0, 18.0, 25.0, 11.0, 3.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0241241455078125, -0.0233919620513916, -0.022659778594970703, -0.021927595138549805, -0.021195411682128906, -0.020463228225708008, -0.01973104476928711, -0.01899886131286621, -0.018266677856445312, -0.017534494400024414, -0.016802310943603516, -0.016070127487182617, -0.015337944030761719, -0.01460576057434082, -0.013873577117919922, -0.013141393661499023, -0.012409210205078125, -0.011677026748657227, -0.010944843292236328, -0.01021265983581543, -0.009480476379394531, -0.008748292922973633, -0.008016109466552734, -0.007283926010131836, -0.0065517425537109375, -0.005819559097290039, -0.005087375640869141, -0.004355192184448242, -0.0036230087280273438, -0.0028908252716064453, -0.002158641815185547, -0.0014264583587646484, -0.00069427490234375, 3.790855407714844e-05, 0.0007700920104980469, 0.0015022754669189453, 0.0022344589233398438, 0.002966642379760742, 0.0036988258361816406, 0.004431009292602539, 0.0051631927490234375, 0.005895376205444336, 0.006627559661865234, 0.007359743118286133, 0.008091926574707031, 0.00882411003112793, 0.009556293487548828, 0.010288476943969727, 0.011020660400390625, 0.011752843856811523, 0.012485027313232422, 0.01321721076965332, 0.013949394226074219, 0.014681577682495117, 0.015413761138916016, 0.016145944595336914, 0.016878128051757812, 0.01761031150817871, 0.01834249496459961, 0.019074678421020508, 0.019806861877441406, 0.020539045333862305, 0.021271228790283203, 0.0220034122467041, 0.022735595703125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 10.0, 8.0, 9.0, 10.0, 21.0, 29.0, 38.0, 43.0, 53.0, 53.0, 57.0, 66.0, 59.0, 71.0, 78.0, 54.0, 49.0, 56.0, 42.0, 38.0, 26.0, 22.0, 19.0, 16.0, 11.0, 11.0, 12.0, 12.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.015716552734375, -0.015274763107299805, -0.01483297348022461, -0.014391183853149414, -0.013949394226074219, -0.013507604598999023, -0.013065814971923828, -0.012624025344848633, -0.012182235717773438, -0.011740446090698242, -0.011298656463623047, -0.010856866836547852, -0.010415077209472656, -0.009973287582397461, -0.009531497955322266, -0.00908970832824707, -0.008647918701171875, -0.00820612907409668, -0.007764339447021484, -0.007322549819946289, -0.006880760192871094, -0.0064389705657958984, -0.005997180938720703, -0.005555391311645508, -0.0051136016845703125, -0.004671812057495117, -0.004230022430419922, -0.0037882328033447266, -0.0033464431762695312, -0.002904653549194336, -0.0024628639221191406, -0.0020210742950439453, -0.00157928466796875, -0.0011374950408935547, -0.0006957054138183594, -0.00025391578674316406, 0.00018787384033203125, 0.0006296634674072266, 0.0010714530944824219, 0.0015132427215576172, 0.0019550323486328125, 0.002396821975708008, 0.002838611602783203, 0.0032804012298583984, 0.0037221908569335938, 0.004163980484008789, 0.004605770111083984, 0.00504755973815918, 0.005489349365234375, 0.00593113899230957, 0.006372928619384766, 0.006814718246459961, 0.007256507873535156, 0.0076982975006103516, 0.008140087127685547, 0.008581876754760742, 0.009023666381835938, 0.009465456008911133, 0.009907245635986328, 0.010349035263061523, 0.010790824890136719, 0.011232614517211914, 0.01167440414428711, 0.012116193771362305, 0.0125579833984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 7.0, 10.0, 10.0, 22.0, 25.0, 40.0, 62.0, 75.0, 127.0, 448.0, 4356.0, 3484205.0, 700659.0, 3371.0, 375.0, 147.0, 93.0, 76.0, 49.0, 30.0, 30.0, 20.0, 9.0, 10.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.184326171875, -0.1795940399169922, -0.17486190795898438, -0.17012977600097656, -0.16539764404296875, -0.16066551208496094, -0.15593338012695312, -0.1512012481689453, -0.1464691162109375, -0.1417369842529297, -0.13700485229492188, -0.13227272033691406, -0.12754058837890625, -0.12280845642089844, -0.11807632446289062, -0.11334419250488281, -0.108612060546875, -0.10387992858886719, -0.09914779663085938, -0.09441566467285156, -0.08968353271484375, -0.08495140075683594, -0.08021926879882812, -0.07548713684082031, -0.0707550048828125, -0.06602287292480469, -0.061290740966796875, -0.05655860900878906, -0.05182647705078125, -0.04709434509277344, -0.042362213134765625, -0.03763008117675781, -0.03289794921875, -0.028165817260742188, -0.023433685302734375, -0.018701553344726562, -0.01396942138671875, -0.009237289428710938, -0.004505157470703125, 0.0002269744873046875, 0.0049591064453125, 0.009691238403320312, 0.014423370361328125, 0.019155502319335938, 0.02388763427734375, 0.028619766235351562, 0.033351898193359375, 0.03808403015136719, 0.042816162109375, 0.04754829406738281, 0.052280426025390625, 0.05701255798339844, 0.06174468994140625, 0.06647682189941406, 0.07120895385742188, 0.07594108581542969, 0.0806732177734375, 0.08540534973144531, 0.09013748168945312, 0.09486961364746094, 0.09960174560546875, 0.10433387756347656, 0.10906600952148438, 0.11379814147949219, 0.1185302734375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 18.0, 23.0, 46.0, 152.0, 1236.0, 2195.0, 258.0, 79.0, 47.0, 11.0, 7.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040008544921875, -0.03718423843383789, -0.03435993194580078, -0.03153562545776367, -0.028711318969726562, -0.025887012481689453, -0.023062705993652344, -0.020238399505615234, -0.017414093017578125, -0.014589786529541016, -0.011765480041503906, -0.008941173553466797, -0.0061168670654296875, -0.003292560577392578, -0.00046825408935546875, 0.0023560523986816406, 0.00518035888671875, 0.00800466537475586, 0.010828971862792969, 0.013653278350830078, 0.016477584838867188, 0.019301891326904297, 0.022126197814941406, 0.024950504302978516, 0.027774810791015625, 0.030599117279052734, 0.033423423767089844, 0.03624773025512695, 0.03907203674316406, 0.04189634323120117, 0.04472064971923828, 0.04754495620727539, 0.0503692626953125, 0.05319356918334961, 0.05601787567138672, 0.05884218215942383, 0.06166648864746094, 0.06449079513549805, 0.06731510162353516, 0.07013940811157227, 0.07296371459960938, 0.07578802108764648, 0.0786123275756836, 0.0814366340637207, 0.08426094055175781, 0.08708524703979492, 0.08990955352783203, 0.09273386001586914, 0.09555816650390625, 0.09838247299194336, 0.10120677947998047, 0.10403108596801758, 0.10685539245605469, 0.1096796989440918, 0.1125040054321289, 0.11532831192016602, 0.11815261840820312, 0.12097692489624023, 0.12380123138427734, 0.12662553787231445, 0.12944984436035156, 0.13227415084838867, 0.13509845733642578, 0.1379227638244629, 0.1407470703125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 7.0, 12.0, 21.0, 30.0, 41.0, 80.0, 105.0, 150.0, 149.0, 131.0, 84.0, 67.0, 45.0, 26.0, 20.0, 9.0, 7.0, 3.0, 5.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20781758427619934, -0.19840659201145172, -0.1889955997467041, -0.17958460748195648, -0.17017361521720886, -0.16076262295246124, -0.15135163068771362, -0.141940638422966, -0.13252964615821838, -0.12311865389347076, -0.11370766162872314, -0.10429666936397552, -0.0948856770992279, -0.08547468483448029, -0.07606369256973267, -0.06665270030498505, -0.05724170804023743, -0.04783071577548981, -0.03841972351074219, -0.029008731245994568, -0.019597738981246948, -0.010186746716499329, -0.000775754451751709, 0.00863523781299591, 0.01804623007774353, 0.02745722234249115, 0.03686821460723877, 0.04627920687198639, 0.05569019913673401, 0.06510119140148163, 0.07451218366622925, 0.08392317593097687, 0.09333419799804688, 0.1027451902627945, 0.11215618252754211, 0.12156717479228973, 0.13097816705703735, 0.14038915932178497, 0.1498001515865326, 0.1592111438512802, 0.16862213611602783, 0.17803312838077545, 0.18744412064552307, 0.1968551129102707, 0.2062661051750183, 0.21567709743976593, 0.22508808970451355, 0.23449908196926117, 0.2439100742340088, 0.2533210515975952, 0.26273205876350403, 0.27214306592941284, 0.28155404329299927, 0.2909650206565857, 0.3003760278224945, 0.3097870349884033, 0.31919801235198975, 0.32860898971557617, 0.338019996881485, 0.3474310040473938, 0.3568419814109802, 0.36625295877456665, 0.37566396594047546, 0.3850749731063843, 0.3944859504699707]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 7.0, 4.0, 8.0, 9.0, 11.0, 14.0, 14.0, 19.0, 24.0, 30.0, 26.0, 43.0, 41.0, 41.0, 63.0, 34.0, 52.0, 52.0, 54.0, 55.0, 42.0, 45.0, 46.0, 31.0, 44.0, 38.0, 28.0, 33.0, 19.0, 17.0, 16.0, 8.0, 6.0, 2.0, 10.0, 6.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.18049389123916626, -0.17510296404361725, -0.16971203684806824, -0.16432110965251923, -0.15893018245697021, -0.15353924036026, -0.148148313164711, -0.142757385969162, -0.13736645877361298, -0.13197553157806396, -0.12658460438251495, -0.12119366973638535, -0.11580274254083633, -0.11041181534528732, -0.10502088069915771, -0.0996299535036087, -0.09423902630805969, -0.08884809911251068, -0.08345717191696167, -0.07806623727083206, -0.07267531007528305, -0.06728438287973404, -0.06189345195889473, -0.05650252103805542, -0.05111159384250641, -0.0457206666469574, -0.04032973572611809, -0.03493880480527878, -0.029547877609729767, -0.024156948551535606, -0.018766019493341446, -0.013375088572502136, -0.007984161376953125, -0.0025932323187589645, 0.002797696739435196, 0.008188625797629356, 0.013579554855823517, 0.018970483914017677, 0.024361412972211838, 0.029752343893051147, 0.03514327108860016, 0.04053419828414917, 0.04592512920498848, 0.05131606012582779, 0.0567069873213768, 0.06209791451692581, 0.06748884916305542, 0.07287977635860443, 0.07827070355415344, 0.08366163074970245, 0.08905255794525146, 0.09444349259138107, 0.09983441978693008, 0.1052253469824791, 0.1106162816286087, 0.11600720882415771, 0.12139813601970673, 0.12678906321525574, 0.13217999041080475, 0.13757091760635376, 0.14296185970306396, 0.14835278689861298, 0.153743714094162, 0.159134641289711, 0.16452556848526]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 12.0, 15.0, 13.0, 33.0, 50.0, 91.0, 128.0, 201.0, 307.0, 501.0, 766.0, 1326.0, 2253.0, 4161.0, 7972.0, 16474.0, 38009.0, 108706.0, 378643.0, 329766.0, 93974.0, 33950.0, 14989.0, 7233.0, 3773.0, 2068.0, 1183.0, 697.0, 432.0, 278.0, 171.0, 124.0, 73.0, 69.0, 29.0, 18.0, 17.0, 15.0, 7.0, 10.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0299530029296875, -0.029015064239501953, -0.028077125549316406, -0.02713918685913086, -0.026201248168945312, -0.025263309478759766, -0.02432537078857422, -0.023387432098388672, -0.022449493408203125, -0.021511554718017578, -0.02057361602783203, -0.019635677337646484, -0.018697738647460938, -0.01775979995727539, -0.016821861267089844, -0.015883922576904297, -0.01494598388671875, -0.014008045196533203, -0.013070106506347656, -0.01213216781616211, -0.011194229125976562, -0.010256290435791016, -0.009318351745605469, -0.008380413055419922, -0.007442474365234375, -0.006504535675048828, -0.005566596984863281, -0.004628658294677734, -0.0036907196044921875, -0.0027527809143066406, -0.0018148422241210938, -0.0008769035339355469, 6.103515625e-05, 0.0009989738464355469, 0.0019369125366210938, 0.0028748512268066406, 0.0038127899169921875, 0.004750728607177734, 0.005688667297363281, 0.006626605987548828, 0.007564544677734375, 0.008502483367919922, 0.009440422058105469, 0.010378360748291016, 0.011316299438476562, 0.01225423812866211, 0.013192176818847656, 0.014130115509033203, 0.01506805419921875, 0.016005992889404297, 0.016943931579589844, 0.01788187026977539, 0.018819808959960938, 0.019757747650146484, 0.02069568634033203, 0.021633625030517578, 0.022571563720703125, 0.023509502410888672, 0.02444744110107422, 0.025385379791259766, 0.026323318481445312, 0.02726125717163086, 0.028199195861816406, 0.029137134552001953, 0.0300750732421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 7.0, 5.0, 1.0, 8.0, 13.0, 7.0, 13.0, 17.0, 13.0, 27.0, 22.0, 37.0, 48.0, 41.0, 59.0, 53.0, 52.0, 58.0, 60.0, 64.0, 59.0, 51.0, 41.0, 41.0, 33.0, 23.0, 24.0, 18.0, 24.0, 18.0, 14.0, 14.0, 12.0, 6.0, 6.0, 9.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0151824951171875, -0.01474153995513916, -0.01430058479309082, -0.01385962963104248, -0.01341867446899414, -0.0129777193069458, -0.012536764144897461, -0.012095808982849121, -0.011654853820800781, -0.011213898658752441, -0.010772943496704102, -0.010331988334655762, -0.009891033172607422, -0.009450078010559082, -0.009009122848510742, -0.008568167686462402, -0.008127212524414062, -0.007686257362365723, -0.007245302200317383, -0.006804347038269043, -0.006363391876220703, -0.005922436714172363, -0.0054814815521240234, -0.005040526390075684, -0.004599571228027344, -0.004158616065979004, -0.003717660903930664, -0.0032767057418823242, -0.0028357505798339844, -0.0023947954177856445, -0.0019538402557373047, -0.0015128850936889648, -0.001071929931640625, -0.0006309747695922852, -0.0001900196075439453, 0.00025093555450439453, 0.0006918907165527344, 0.0011328458786010742, 0.001573801040649414, 0.002014756202697754, 0.0024557113647460938, 0.0028966665267944336, 0.0033376216888427734, 0.0037785768508911133, 0.004219532012939453, 0.004660487174987793, 0.005101442337036133, 0.005542397499084473, 0.0059833526611328125, 0.006424307823181152, 0.006865262985229492, 0.007306218147277832, 0.007747173309326172, 0.008188128471374512, 0.008629083633422852, 0.009070038795471191, 0.009510993957519531, 0.009951949119567871, 0.010392904281616211, 0.01083385944366455, 0.01127481460571289, 0.01171576976776123, 0.01215672492980957, 0.01259768009185791, 0.01303863525390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 11.0, 9.0, 15.0, 20.0, 23.0, 36.0, 68.0, 85.0, 115.0, 172.0, 248.0, 424.0, 662.0, 1215.0, 2300.0, 4546.0, 10390.0, 28975.0, 102582.0, 625719.0, 194943.0, 46918.0, 15789.0, 6399.0, 3004.0, 1560.0, 872.0, 508.0, 311.0, 200.0, 120.0, 97.0, 62.0, 46.0, 24.0, 20.0, 21.0, 15.0, 9.0, 3.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.033782958984375, -0.03264570236206055, -0.031508445739746094, -0.03037118911743164, -0.029233932495117188, -0.028096675872802734, -0.02695941925048828, -0.025822162628173828, -0.024684906005859375, -0.023547649383544922, -0.02241039276123047, -0.021273136138916016, -0.020135879516601562, -0.01899862289428711, -0.017861366271972656, -0.016724109649658203, -0.01558685302734375, -0.014449596405029297, -0.013312339782714844, -0.01217508316040039, -0.011037826538085938, -0.009900569915771484, -0.008763313293457031, -0.007626056671142578, -0.006488800048828125, -0.005351543426513672, -0.004214286804199219, -0.0030770301818847656, -0.0019397735595703125, -0.0008025169372558594, 0.00033473968505859375, 0.0014719963073730469, 0.0026092529296875, 0.003746509552001953, 0.004883766174316406, 0.006021022796630859, 0.0071582794189453125, 0.008295536041259766, 0.009432792663574219, 0.010570049285888672, 0.011707305908203125, 0.012844562530517578, 0.013981819152832031, 0.015119075775146484, 0.016256332397460938, 0.01739358901977539, 0.018530845642089844, 0.019668102264404297, 0.02080535888671875, 0.021942615509033203, 0.023079872131347656, 0.02421712875366211, 0.025354385375976562, 0.026491641998291016, 0.02762889862060547, 0.028766155242919922, 0.029903411865234375, 0.031040668487548828, 0.03217792510986328, 0.033315181732177734, 0.03445243835449219, 0.03558969497680664, 0.036726951599121094, 0.03786420822143555, 0.03900146484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 4.0, 9.0, 8.0, 4.0, 11.0, 7.0, 14.0, 14.0, 30.0, 25.0, 32.0, 36.0, 39.0, 36.0, 58.0, 34.0, 62.0, 56.0, 51.0, 44.0, 54.0, 51.0, 52.0, 34.0, 40.0, 40.0, 23.0, 29.0, 20.0, 21.0, 16.0, 10.0, 11.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0552978515625, -0.05356597900390625, -0.0518341064453125, -0.05010223388671875, -0.048370361328125, -0.04663848876953125, -0.0449066162109375, -0.04317474365234375, -0.04144287109375, -0.03971099853515625, -0.0379791259765625, -0.03624725341796875, -0.034515380859375, -0.03278350830078125, -0.0310516357421875, -0.02931976318359375, -0.027587890625, -0.02585601806640625, -0.0241241455078125, -0.02239227294921875, -0.020660400390625, -0.01892852783203125, -0.0171966552734375, -0.01546478271484375, -0.01373291015625, -0.01200103759765625, -0.0102691650390625, -0.00853729248046875, -0.006805419921875, -0.00507354736328125, -0.0033416748046875, -0.00160980224609375, 0.0001220703125, 0.00185394287109375, 0.0035858154296875, 0.00531768798828125, 0.007049560546875, 0.00878143310546875, 0.0105133056640625, 0.01224517822265625, 0.01397705078125, 0.01570892333984375, 0.0174407958984375, 0.01917266845703125, 0.020904541015625, 0.02263641357421875, 0.0243682861328125, 0.02610015869140625, 0.02783203125, 0.02956390380859375, 0.0312957763671875, 0.03302764892578125, 0.034759521484375, 0.03649139404296875, 0.0382232666015625, 0.03995513916015625, 0.04168701171875, 0.04341888427734375, 0.0451507568359375, 0.04688262939453125, 0.048614501953125, 0.05034637451171875, 0.0520782470703125, 0.05381011962890625, 0.0555419921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 10.0, 2.0, 12.0, 11.0, 22.0, 21.0, 35.0, 34.0, 70.0, 85.0, 162.0, 296.0, 568.0, 1313.0, 3792.0, 15394.0, 136521.0, 838731.0, 39619.0, 7649.0, 2307.0, 876.0, 424.0, 214.0, 120.0, 75.0, 64.0, 35.0, 18.0, 16.0, 10.0, 17.0, 6.0, 8.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.040740966796875, -0.03958559036254883, -0.038430213928222656, -0.037274837493896484, -0.03611946105957031, -0.03496408462524414, -0.03380870819091797, -0.0326533317565918, -0.031497955322265625, -0.030342578887939453, -0.02918720245361328, -0.02803182601928711, -0.026876449584960938, -0.025721073150634766, -0.024565696716308594, -0.023410320281982422, -0.02225494384765625, -0.021099567413330078, -0.019944190979003906, -0.018788814544677734, -0.017633438110351562, -0.01647806167602539, -0.015322685241699219, -0.014167308807373047, -0.013011932373046875, -0.011856555938720703, -0.010701179504394531, -0.00954580307006836, -0.008390426635742188, -0.007235050201416016, -0.006079673767089844, -0.004924297332763672, -0.0037689208984375, -0.002613544464111328, -0.0014581680297851562, -0.0003027915954589844, 0.0008525848388671875, 0.0020079612731933594, 0.0031633377075195312, 0.004318714141845703, 0.005474090576171875, 0.006629467010498047, 0.007784843444824219, 0.00894021987915039, 0.010095596313476562, 0.011250972747802734, 0.012406349182128906, 0.013561725616455078, 0.01471710205078125, 0.015872478485107422, 0.017027854919433594, 0.018183231353759766, 0.019338607788085938, 0.02049398422241211, 0.02164936065673828, 0.022804737091064453, 0.023960113525390625, 0.025115489959716797, 0.02627086639404297, 0.02742624282836914, 0.028581619262695312, 0.029736995697021484, 0.030892372131347656, 0.03204774856567383, 0.033203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 8.0, 11.0, 23.0, 46.0, 101.0, 150.0, 232.0, 206.0, 95.0, 58.0, 29.0, 16.0, 11.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013327598571777344, -0.00012918561697006226, -0.00012509524822235107, -0.00012100487947463989, -0.00011691451072692871, -0.00011282414197921753, -0.00010873377323150635, -0.00010464340448379517, -0.00010055303573608398, -9.64626669883728e-05, -9.237229824066162e-05, -8.828192949295044e-05, -8.419156074523926e-05, -8.010119199752808e-05, -7.60108232498169e-05, -7.192045450210571e-05, -6.783008575439453e-05, -6.373971700668335e-05, -5.964934825897217e-05, -5.5558979511260986e-05, -5.1468610763549805e-05, -4.737824201583862e-05, -4.328787326812744e-05, -3.919750452041626e-05, -3.510713577270508e-05, -3.1016767024993896e-05, -2.6926398277282715e-05, -2.2836029529571533e-05, -1.874566078186035e-05, -1.465529203414917e-05, -1.0564923286437988e-05, -6.474554538726807e-06, -2.384185791015625e-06, 1.7061829566955566e-06, 5.796551704406738e-06, 9.88692045211792e-06, 1.3977289199829102e-05, 1.8067657947540283e-05, 2.2158026695251465e-05, 2.6248395442962646e-05, 3.0338764190673828e-05, 3.442913293838501e-05, 3.851950168609619e-05, 4.260987043380737e-05, 4.6700239181518555e-05, 5.0790607929229736e-05, 5.488097667694092e-05, 5.89713454246521e-05, 6.306171417236328e-05, 6.715208292007446e-05, 7.124245166778564e-05, 7.533282041549683e-05, 7.942318916320801e-05, 8.351355791091919e-05, 8.760392665863037e-05, 9.169429540634155e-05, 9.578466415405273e-05, 9.987503290176392e-05, 0.0001039654016494751, 0.00010805577039718628, 0.00011214613914489746, 0.00011623650789260864, 0.00012032687664031982, 0.000124417245388031, 0.0001285076141357422]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 8.0, 8.0, 8.0, 15.0, 16.0, 25.0, 29.0, 39.0, 71.0, 87.0, 147.0, 224.0, 394.0, 775.0, 1585.0, 3983.0, 14239.0, 99316.0, 851896.0, 58889.0, 10376.0, 3302.0, 1444.0, 690.0, 363.0, 188.0, 136.0, 92.0, 69.0, 42.0, 27.0, 20.0, 8.0, 7.0, 7.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028594970703125, -0.027587890625, -0.026580810546875, -0.02557373046875, -0.024566650390625, -0.0235595703125, -0.022552490234375, -0.02154541015625, -0.020538330078125, -0.01953125, -0.018524169921875, -0.01751708984375, -0.016510009765625, -0.0155029296875, -0.014495849609375, -0.01348876953125, -0.012481689453125, -0.011474609375, -0.010467529296875, -0.00946044921875, -0.008453369140625, -0.0074462890625, -0.006439208984375, -0.00543212890625, -0.004425048828125, -0.00341796875, -0.002410888671875, -0.00140380859375, -0.000396728515625, 0.0006103515625, 0.001617431640625, 0.00262451171875, 0.003631591796875, 0.004638671875, 0.005645751953125, 0.00665283203125, 0.007659912109375, 0.0086669921875, 0.009674072265625, 0.01068115234375, 0.011688232421875, 0.0126953125, 0.013702392578125, 0.01470947265625, 0.015716552734375, 0.0167236328125, 0.017730712890625, 0.01873779296875, 0.019744873046875, 0.020751953125, 0.021759033203125, 0.02276611328125, 0.023773193359375, 0.0247802734375, 0.025787353515625, 0.02679443359375, 0.027801513671875, 0.02880859375, 0.029815673828125, 0.03082275390625, 0.031829833984375, 0.0328369140625, 0.033843994140625, 0.03485107421875, 0.035858154296875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 2.0, 4.0, 6.0, 10.0, 19.0, 29.0, 39.0, 56.0, 82.0, 126.0, 189.0, 149.0, 95.0, 57.0, 40.0, 33.0, 22.0, 5.0, 9.0, 9.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.035888671875, -0.035117506980895996, -0.03434634208679199, -0.03357517719268799, -0.032804012298583984, -0.03203284740447998, -0.03126168251037598, -0.030490517616271973, -0.02971935272216797, -0.028948187828063965, -0.02817702293395996, -0.027405858039855957, -0.026634693145751953, -0.02586352825164795, -0.025092363357543945, -0.02432119846343994, -0.023550033569335938, -0.022778868675231934, -0.02200770378112793, -0.021236538887023926, -0.020465373992919922, -0.019694209098815918, -0.018923044204711914, -0.01815187931060791, -0.017380714416503906, -0.016609549522399902, -0.0158383846282959, -0.015067219734191895, -0.01429605484008789, -0.013524889945983887, -0.012753725051879883, -0.011982560157775879, -0.011211395263671875, -0.010440230369567871, -0.009669065475463867, -0.008897900581359863, -0.00812673568725586, -0.0073555707931518555, -0.0065844058990478516, -0.005813241004943848, -0.005042076110839844, -0.00427091121673584, -0.003499746322631836, -0.002728581428527832, -0.001957416534423828, -0.0011862516403198242, -0.0004150867462158203, 0.0003560781478881836, 0.0011272430419921875, 0.0018984079360961914, 0.0026695728302001953, 0.0034407377243041992, 0.004211902618408203, 0.004983067512512207, 0.005754232406616211, 0.006525397300720215, 0.007296562194824219, 0.008067727088928223, 0.008838891983032227, 0.00961005687713623, 0.010381221771240234, 0.011152386665344238, 0.011923551559448242, 0.012694716453552246, 0.01346588134765625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 14.0, 21.0, 32.0, 49.0, 78.0, 170.0, 365.0, 150.0, 72.0, 26.0, 16.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5270462036132812, -0.5084968209266663, -0.48994749784469604, -0.47139811515808105, -0.45284876227378845, -0.43429940938949585, -0.41575002670288086, -0.39720067381858826, -0.37865132093429565, -0.36010196805000305, -0.34155261516571045, -0.32300323247909546, -0.30445387959480286, -0.28590452671051025, -0.26735514402389526, -0.24880579113960266, -0.23025643825531006, -0.21170708537101746, -0.19315771758556366, -0.17460834980010986, -0.15605899691581726, -0.13750964403152466, -0.11896027624607086, -0.10041090846061707, -0.08186155557632446, -0.06331219524145126, -0.044762834906578064, -0.026213474571704865, -0.007664114236831665, 0.010885246098041534, 0.029434606432914734, 0.04798397421836853, 0.06653332710266113, 0.08508268743753433, 0.10363204777240753, 0.12218140810728073, 0.14073076844215393, 0.15928012132644653, 0.17782948911190033, 0.19637885689735413, 0.21492820978164673, 0.23347756266593933, 0.25202691555023193, 0.2705762982368469, 0.2891256511211395, 0.30767500400543213, 0.3262243866920471, 0.3447737395763397, 0.3633230924606323, 0.3818724453449249, 0.40042179822921753, 0.4189711809158325, 0.4375205338001251, 0.4560698866844177, 0.4746192693710327, 0.4931686222553253, 0.5117179751396179, 0.5302673578262329, 0.5488166809082031, 0.5673660635948181, 0.5859154462814331, 0.6044647693634033, 0.6230141520500183, 0.6415635347366333, 0.6601128578186035]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 4.0, 10.0, 8.0, 8.0, 12.0, 16.0, 8.0, 13.0, 15.0, 24.0, 22.0, 22.0, 32.0, 33.0, 30.0, 51.0, 64.0, 114.0, 98.0, 60.0, 50.0, 53.0, 31.0, 33.0, 27.0, 27.0, 13.0, 15.0, 15.0, 14.0, 5.0, 15.0, 16.0, 12.0, 8.0, 7.0, 6.0, 1.0, 4.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2553887367248535, -0.24745464324951172, -0.23952054977416992, -0.23158645629882812, -0.22365237772464752, -0.21571828424930573, -0.20778419077396393, -0.19985009729862213, -0.19191601872444153, -0.18398192524909973, -0.17604783177375793, -0.16811373829841614, -0.16017965972423553, -0.15224556624889374, -0.14431147277355194, -0.13637737929821014, -0.12844328582286835, -0.12050919234752655, -0.11257510632276535, -0.10464101284742355, -0.09670692682266235, -0.08877283334732056, -0.08083873987197876, -0.07290464639663696, -0.06497056037187576, -0.057036470621824265, -0.049102380871772766, -0.04116828739643097, -0.03323419764637947, -0.025300107896327972, -0.017366014420986176, -0.009431924670934677, -0.0014978349208831787, 0.006436255760490894, 0.014370346441864967, 0.022304438054561615, 0.030238527804613113, 0.03817261755466461, 0.04610671103000641, 0.05404080078005791, 0.061974890530109406, 0.0699089840054512, 0.0778430700302124, 0.0857771635055542, 0.093711256980896, 0.1016453430056572, 0.10957943648099899, 0.11751352250576019, 0.125447615981102, 0.1333817094564438, 0.14131580293178558, 0.1492498815059662, 0.15718397498130798, 0.16511806845664978, 0.17305216193199158, 0.18098625540733337, 0.18892034888267517, 0.19685444235801697, 0.20478853583335876, 0.21272262930870056, 0.22065670788288116, 0.22859080135822296, 0.23652489483356476, 0.24445898830890656, 0.25239306688308716]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 10.0, 7.0, 7.0, 19.0, 22.0, 21.0, 32.0, 51.0, 66.0, 105.0, 128.0, 176.0, 224.0, 300.0, 443.0, 824.0, 1628.0, 4864.0, 23428.0, 745697.0, 3354164.0, 49361.0, 7617.0, 2326.0, 933.0, 525.0, 348.0, 249.0, 187.0, 126.0, 95.0, 63.0, 55.0, 42.0, 33.0, 20.0, 21.0, 12.0, 13.0, 9.0, 8.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.067138671875, -0.06498432159423828, -0.06282997131347656, -0.060675621032714844, -0.058521270751953125, -0.056366920471191406, -0.05421257019042969, -0.05205821990966797, -0.04990386962890625, -0.04774951934814453, -0.04559516906738281, -0.043440818786621094, -0.041286468505859375, -0.039132118225097656, -0.03697776794433594, -0.03482341766357422, -0.0326690673828125, -0.03051471710205078, -0.028360366821289062, -0.026206016540527344, -0.024051666259765625, -0.021897315979003906, -0.019742965698242188, -0.01758861541748047, -0.01543426513671875, -0.013279914855957031, -0.011125564575195312, -0.008971214294433594, -0.006816864013671875, -0.004662513732910156, -0.0025081634521484375, -0.00035381317138671875, 0.001800537109375, 0.003954887390136719, 0.0061092376708984375, 0.008263587951660156, 0.010417938232421875, 0.012572288513183594, 0.014726638793945312, 0.01688098907470703, 0.01903533935546875, 0.02118968963623047, 0.023344039916992188, 0.025498390197753906, 0.027652740478515625, 0.029807090759277344, 0.03196144104003906, 0.03411579132080078, 0.0362701416015625, 0.03842449188232422, 0.04057884216308594, 0.042733192443847656, 0.044887542724609375, 0.047041893005371094, 0.04919624328613281, 0.05135059356689453, 0.05350494384765625, 0.05565929412841797, 0.05781364440917969, 0.059967994689941406, 0.062122344970703125, 0.06427669525146484, 0.06643104553222656, 0.06858539581298828, 0.07073974609375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 3.0, 6.0, 11.0, 6.0, 10.0, 13.0, 19.0, 18.0, 31.0, 40.0, 39.0, 47.0, 65.0, 52.0, 62.0, 69.0, 58.0, 64.0, 59.0, 49.0, 55.0, 35.0, 34.0, 23.0, 21.0, 17.0, 16.0, 10.0, 14.0, 15.0, 2.0, 6.0, 5.0, 1.0, 5.0, 1.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01580810546875, -0.015344977378845215, -0.01488184928894043, -0.014418721199035645, -0.01395559310913086, -0.013492465019226074, -0.013029336929321289, -0.012566208839416504, -0.012103080749511719, -0.011639952659606934, -0.011176824569702148, -0.010713696479797363, -0.010250568389892578, -0.009787440299987793, -0.009324312210083008, -0.008861184120178223, -0.008398056030273438, -0.007934927940368652, -0.007471799850463867, -0.007008671760559082, -0.006545543670654297, -0.006082415580749512, -0.0056192874908447266, -0.005156159400939941, -0.004693031311035156, -0.004229903221130371, -0.003766775131225586, -0.0033036470413208008, -0.0028405189514160156, -0.0023773908615112305, -0.0019142627716064453, -0.0014511346817016602, -0.000988006591796875, -0.0005248785018920898, -6.175041198730469e-05, 0.00040137767791748047, 0.0008645057678222656, 0.0013276338577270508, 0.001790761947631836, 0.002253890037536621, 0.0027170181274414062, 0.0031801462173461914, 0.0036432743072509766, 0.004106402397155762, 0.004569530487060547, 0.005032658576965332, 0.005495786666870117, 0.005958914756774902, 0.0064220428466796875, 0.006885170936584473, 0.007348299026489258, 0.007811427116394043, 0.008274555206298828, 0.008737683296203613, 0.009200811386108398, 0.009663939476013184, 0.010127067565917969, 0.010590195655822754, 0.011053323745727539, 0.011516451835632324, 0.01197957992553711, 0.012442708015441895, 0.01290583610534668, 0.013368964195251465, 0.01383209228515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 6.0, 14.0, 24.0, 41.0, 65.0, 148.0, 188.0, 383.0, 834.0, 2551.0, 48906.0, 4111047.0, 26448.0, 1996.0, 759.0, 394.0, 210.0, 121.0, 68.0, 34.0, 24.0, 7.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.108154296875, -0.10258674621582031, -0.09701919555664062, -0.09145164489746094, -0.08588409423828125, -0.08031654357910156, -0.07474899291992188, -0.06918144226074219, -0.0636138916015625, -0.05804634094238281, -0.052478790283203125, -0.04691123962402344, -0.04134368896484375, -0.03577613830566406, -0.030208587646484375, -0.024641036987304688, -0.019073486328125, -0.013505935668945312, -0.007938385009765625, -0.0023708343505859375, 0.00319671630859375, 0.008764266967773438, 0.014331817626953125, 0.019899368286132812, 0.0254669189453125, 0.031034469604492188, 0.036602020263671875, 0.04216957092285156, 0.04773712158203125, 0.05330467224121094, 0.058872222900390625, 0.06443977355957031, 0.07000732421875, 0.07557487487792969, 0.08114242553710938, 0.08670997619628906, 0.09227752685546875, 0.09784507751464844, 0.10341262817382812, 0.10898017883300781, 0.1145477294921875, 0.12011528015136719, 0.12568283081054688, 0.13125038146972656, 0.13681793212890625, 0.14238548278808594, 0.14795303344726562, 0.1535205841064453, 0.159088134765625, 0.1646556854248047, 0.17022323608398438, 0.17579078674316406, 0.18135833740234375, 0.18692588806152344, 0.19249343872070312, 0.1980609893798828, 0.2036285400390625, 0.2091960906982422, 0.21476364135742188, 0.22033119201660156, 0.22589874267578125, 0.23146629333496094, 0.23703384399414062, 0.2426013946533203, 0.2481689453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 12.0, 33.0, 48.0, 131.0, 425.0, 1677.0, 1249.0, 272.0, 116.0, 41.0, 28.0, 13.0, 8.0, 9.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1024169921875, -0.09898185729980469, -0.09554672241210938, -0.09211158752441406, -0.08867645263671875, -0.08524131774902344, -0.08180618286132812, -0.07837104797363281, -0.0749359130859375, -0.07150077819824219, -0.06806564331054688, -0.06463050842285156, -0.06119537353515625, -0.05776023864746094, -0.054325103759765625, -0.05088996887207031, -0.047454833984375, -0.04401969909667969, -0.040584564208984375, -0.03714942932128906, -0.03371429443359375, -0.030279159545898438, -0.026844024658203125, -0.023408889770507812, -0.0199737548828125, -0.016538619995117188, -0.013103485107421875, -0.009668350219726562, -0.00623321533203125, -0.0027980804443359375, 0.000637054443359375, 0.0040721893310546875, 0.00750732421875, 0.010942459106445312, 0.014377593994140625, 0.017812728881835938, 0.02124786376953125, 0.024682998657226562, 0.028118133544921875, 0.03155326843261719, 0.0349884033203125, 0.03842353820800781, 0.041858673095703125, 0.04529380798339844, 0.04872894287109375, 0.05216407775878906, 0.055599212646484375, 0.05903434753417969, 0.062469482421875, 0.06590461730957031, 0.06933975219726562, 0.07277488708496094, 0.07621002197265625, 0.07964515686035156, 0.08308029174804688, 0.08651542663574219, 0.0899505615234375, 0.09338569641113281, 0.09682083129882812, 0.10025596618652344, 0.10369110107421875, 0.10712623596191406, 0.11056137084960938, 0.11399650573730469, 0.117431640625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 14.0, 26.0, 50.0, 107.0, 244.0, 256.0, 150.0, 70.0, 34.0, 16.0, 15.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4478585422039032, -0.4181429445743561, -0.3884273171424866, -0.35871171951293945, -0.32899612188339233, -0.2992805242538452, -0.2695649266242981, -0.2398492991924286, -0.21013370156288147, -0.18041810393333435, -0.15070249140262604, -0.12098688632249832, -0.0912712812423706, -0.061555683612823486, -0.03184007108211517, -0.0021244585514068604, 0.02759113907814026, 0.057306744158267975, 0.08702234923839569, 0.11673795431852341, 0.14645355939865112, 0.17616915702819824, 0.20588476955890656, 0.23560038208961487, 0.265315979719162, 0.2950315773487091, 0.3247472047805786, 0.35446280241012573, 0.38417840003967285, 0.41389399766921997, 0.4436095952987671, 0.4733252227306366, 0.5030407905578613, 0.5327563881874084, 0.5624719858169556, 0.5921875834465027, 0.6219031810760498, 0.6516188383102417, 0.6813344359397888, 0.7110500335693359, 0.7407656311988831, 0.7704812288284302, 0.8001968264579773, 0.8299124240875244, 0.8596280813217163, 0.8893436193466187, 0.9190592765808105, 0.9487748742103577, 0.9784904718399048, 1.0082061290740967, 1.037921667098999, 1.067637324333191, 1.0973528623580933, 1.1270685195922852, 1.1567840576171875, 1.1864997148513794, 1.2162153720855713, 1.2459310293197632, 1.2756465673446655, 1.3053622245788574, 1.3350777626037598, 1.3647934198379517, 1.394508957862854, 1.424224615097046, 1.4539401531219482]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 12.0, 8.0, 8.0, 12.0, 12.0, 14.0, 27.0, 33.0, 27.0, 52.0, 45.0, 45.0, 59.0, 43.0, 48.0, 44.0, 50.0, 45.0, 38.0, 32.0, 57.0, 47.0, 33.0, 38.0, 47.0, 20.0, 25.0, 18.0, 16.0, 14.0, 13.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.3338594436645508, -0.32600292563438416, -0.31814640760421753, -0.3102899193763733, -0.30243340134620667, -0.29457688331604004, -0.2867203652858734, -0.2788638472557068, -0.27100732922554016, -0.26315081119537354, -0.2552942931652069, -0.24743779003620148, -0.23958127200603485, -0.23172476887702942, -0.2238682508468628, -0.21601173281669617, -0.20815522968769073, -0.2002987116575241, -0.19244220852851868, -0.18458569049835205, -0.17672917246818542, -0.1688726544380188, -0.16101615130901337, -0.15315963327884674, -0.1453031301498413, -0.13744661211967468, -0.12959010899066925, -0.12173359096050262, -0.113877072930336, -0.10602056235074997, -0.09816405177116394, -0.09030753374099731, -0.08245101571083069, -0.07459450513124466, -0.06673798710107803, -0.058881476521492004, -0.05102496221661568, -0.04316844791173935, -0.03531193733215332, -0.027455423027276993, -0.019598908722400665, -0.011742395348846912, -0.0038858819752931595, 0.003970630466938019, 0.011827144771814346, 0.019683659076690674, 0.027540169656276703, 0.03539668396115303, 0.04325319826602936, 0.051109712570905685, 0.05896622687578201, 0.06682273745536804, 0.07467925548553467, 0.0825357660651207, 0.09039227664470673, 0.09824879467487335, 0.10610530525445938, 0.11396181583404541, 0.12181833386421204, 0.12967485189437866, 0.1375313550233841, 0.14538787305355072, 0.15324437618255615, 0.16110089421272278, 0.1689574122428894]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 4.0, 9.0, 4.0, 8.0, 9.0, 12.0, 18.0, 19.0, 31.0, 44.0, 66.0, 90.0, 143.0, 178.0, 275.0, 408.0, 596.0, 935.0, 1522.0, 2705.0, 4572.0, 8516.0, 15962.0, 31530.0, 66145.0, 150707.0, 328890.0, 239764.0, 100170.0, 45453.0, 22480.0, 11778.0, 6401.0, 3460.0, 2054.0, 1257.0, 741.0, 490.0, 328.0, 237.0, 139.0, 100.0, 88.0, 70.0, 38.0, 34.0, 19.0, 18.0, 15.0, 13.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0240325927734375, -0.02325129508972168, -0.02246999740600586, -0.02168869972229004, -0.02090740203857422, -0.0201261043548584, -0.019344806671142578, -0.018563508987426758, -0.017782211303710938, -0.017000913619995117, -0.016219615936279297, -0.015438318252563477, -0.014657020568847656, -0.013875722885131836, -0.013094425201416016, -0.012313127517700195, -0.011531829833984375, -0.010750532150268555, -0.009969234466552734, -0.009187936782836914, -0.008406639099121094, -0.0076253414154052734, -0.006844043731689453, -0.006062746047973633, -0.0052814483642578125, -0.004500150680541992, -0.003718852996826172, -0.0029375553131103516, -0.0021562576293945312, -0.001374959945678711, -0.0005936622619628906, 0.0001876354217529297, 0.00096893310546875, 0.0017502307891845703, 0.0025315284729003906, 0.003312826156616211, 0.004094123840332031, 0.0048754215240478516, 0.005656719207763672, 0.006438016891479492, 0.0072193145751953125, 0.008000612258911133, 0.008781909942626953, 0.009563207626342773, 0.010344505310058594, 0.011125802993774414, 0.011907100677490234, 0.012688398361206055, 0.013469696044921875, 0.014250993728637695, 0.015032291412353516, 0.015813589096069336, 0.016594886779785156, 0.017376184463500977, 0.018157482147216797, 0.018938779830932617, 0.019720077514648438, 0.020501375198364258, 0.021282672882080078, 0.0220639705657959, 0.02284526824951172, 0.02362656593322754, 0.02440786361694336, 0.02518916130065918, 0.025970458984375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 2.0, 4.0, 5.0, 4.0, 11.0, 8.0, 12.0, 13.0, 22.0, 16.0, 25.0, 27.0, 46.0, 52.0, 37.0, 49.0, 50.0, 51.0, 61.0, 49.0, 71.0, 51.0, 43.0, 44.0, 36.0, 34.0, 36.0, 26.0, 29.0, 15.0, 19.0, 11.0, 14.0, 9.0, 6.0, 4.0, 6.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0178070068359375, -0.01725172996520996, -0.016696453094482422, -0.016141176223754883, -0.015585899353027344, -0.015030622482299805, -0.014475345611572266, -0.013920068740844727, -0.013364791870117188, -0.012809514999389648, -0.01225423812866211, -0.01169896125793457, -0.011143684387207031, -0.010588407516479492, -0.010033130645751953, -0.009477853775024414, -0.008922576904296875, -0.008367300033569336, -0.007812023162841797, -0.007256746292114258, -0.006701469421386719, -0.00614619255065918, -0.005590915679931641, -0.0050356388092041016, -0.0044803619384765625, -0.0039250850677490234, -0.0033698081970214844, -0.0028145313262939453, -0.0022592544555664062, -0.0017039775848388672, -0.0011487007141113281, -0.0005934238433837891, -3.814697265625e-05, 0.0005171298980712891, 0.0010724067687988281, 0.0016276836395263672, 0.0021829605102539062, 0.0027382373809814453, 0.0032935142517089844, 0.0038487911224365234, 0.0044040679931640625, 0.0049593448638916016, 0.005514621734619141, 0.00606989860534668, 0.006625175476074219, 0.007180452346801758, 0.007735729217529297, 0.008291006088256836, 0.008846282958984375, 0.009401559829711914, 0.009956836700439453, 0.010512113571166992, 0.011067390441894531, 0.01162266731262207, 0.01217794418334961, 0.012733221054077148, 0.013288497924804688, 0.013843774795532227, 0.014399051666259766, 0.014954328536987305, 0.015509605407714844, 0.016064882278442383, 0.016620159149169922, 0.01717543601989746, 0.017730712890625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 8.0, 16.0, 17.0, 31.0, 35.0, 52.0, 72.0, 116.0, 160.0, 297.0, 478.0, 824.0, 1950.0, 6979.0, 55641.0, 841653.0, 123581.0, 11648.0, 2562.0, 977.0, 537.0, 296.0, 195.0, 124.0, 97.0, 67.0, 34.0, 24.0, 19.0, 12.0, 13.0, 6.0, 4.0, 8.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0714111328125, -0.06891822814941406, -0.06642532348632812, -0.06393241882324219, -0.06143951416015625, -0.05894660949707031, -0.056453704833984375, -0.05396080017089844, -0.0514678955078125, -0.04897499084472656, -0.046482086181640625, -0.04398918151855469, -0.04149627685546875, -0.03900337219238281, -0.036510467529296875, -0.03401756286621094, -0.031524658203125, -0.029031753540039062, -0.026538848876953125, -0.024045944213867188, -0.02155303955078125, -0.019060134887695312, -0.016567230224609375, -0.014074325561523438, -0.0115814208984375, -0.009088516235351562, -0.006595611572265625, -0.0041027069091796875, -0.00160980224609375, 0.0008831024169921875, 0.003376007080078125, 0.0058689117431640625, 0.00836181640625, 0.010854721069335938, 0.013347625732421875, 0.015840530395507812, 0.01833343505859375, 0.020826339721679688, 0.023319244384765625, 0.025812149047851562, 0.0283050537109375, 0.030797958374023438, 0.033290863037109375, 0.03578376770019531, 0.03827667236328125, 0.04076957702636719, 0.043262481689453125, 0.04575538635253906, 0.048248291015625, 0.05074119567871094, 0.053234100341796875, 0.05572700500488281, 0.05821990966796875, 0.06071281433105469, 0.06320571899414062, 0.06569862365722656, 0.0681915283203125, 0.07068443298339844, 0.07317733764648438, 0.07567024230957031, 0.07816314697265625, 0.08065605163574219, 0.08314895629882812, 0.08564186096191406, 0.088134765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 4.0, 5.0, 10.0, 13.0, 16.0, 27.0, 19.0, 31.0, 35.0, 53.0, 60.0, 66.0, 84.0, 74.0, 82.0, 83.0, 61.0, 62.0, 50.0, 43.0, 30.0, 21.0, 26.0, 13.0, 14.0, 7.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1038818359375, -0.10082626342773438, -0.09777069091796875, -0.09471511840820312, -0.0916595458984375, -0.08860397338867188, -0.08554840087890625, -0.08249282836914062, -0.079437255859375, -0.07638168334960938, -0.07332611083984375, -0.07027053833007812, -0.0672149658203125, -0.06415939331054688, -0.06110382080078125, -0.058048248291015625, -0.05499267578125, -0.051937103271484375, -0.04888153076171875, -0.045825958251953125, -0.0427703857421875, -0.039714813232421875, -0.03665924072265625, -0.033603668212890625, -0.030548095703125, -0.027492523193359375, -0.02443695068359375, -0.021381378173828125, -0.0183258056640625, -0.015270233154296875, -0.01221466064453125, -0.009159088134765625, -0.006103515625, -0.003047943115234375, 7.62939453125e-06, 0.003063201904296875, 0.0061187744140625, 0.009174346923828125, 0.01222991943359375, 0.015285491943359375, 0.018341064453125, 0.021396636962890625, 0.02445220947265625, 0.027507781982421875, 0.0305633544921875, 0.033618927001953125, 0.03667449951171875, 0.039730072021484375, 0.04278564453125, 0.045841217041015625, 0.04889678955078125, 0.051952362060546875, 0.0550079345703125, 0.058063507080078125, 0.06111907958984375, 0.06417465209960938, 0.067230224609375, 0.07028579711914062, 0.07334136962890625, 0.07639694213867188, 0.0794525146484375, 0.08250808715820312, 0.08556365966796875, 0.08861923217773438, 0.0916748046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 8.0, 6.0, 6.0, 16.0, 13.0, 33.0, 32.0, 54.0, 86.0, 142.0, 276.0, 521.0, 1229.0, 3500.0, 13493.0, 76482.0, 784362.0, 139154.0, 20884.0, 5125.0, 1615.0, 700.0, 309.0, 176.0, 105.0, 74.0, 48.0, 24.0, 20.0, 18.0, 16.0, 6.0, 8.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.016448974609375, -0.0158538818359375, -0.0152587890625, -0.0146636962890625, -0.014068603515625, -0.0134735107421875, -0.01287841796875, -0.0122833251953125, -0.011688232421875, -0.0110931396484375, -0.010498046875, -0.0099029541015625, -0.009307861328125, -0.0087127685546875, -0.00811767578125, -0.0075225830078125, -0.006927490234375, -0.0063323974609375, -0.0057373046875, -0.0051422119140625, -0.004547119140625, -0.0039520263671875, -0.00335693359375, -0.0027618408203125, -0.002166748046875, -0.0015716552734375, -0.0009765625, -0.0003814697265625, 0.000213623046875, 0.0008087158203125, 0.00140380859375, 0.0019989013671875, 0.002593994140625, 0.0031890869140625, 0.0037841796875, 0.0043792724609375, 0.004974365234375, 0.0055694580078125, 0.00616455078125, 0.0067596435546875, 0.007354736328125, 0.0079498291015625, 0.008544921875, 0.0091400146484375, 0.009735107421875, 0.0103302001953125, 0.01092529296875, 0.0115203857421875, 0.012115478515625, 0.0127105712890625, 0.0133056640625, 0.0139007568359375, 0.014495849609375, 0.0150909423828125, 0.01568603515625, 0.0162811279296875, 0.016876220703125, 0.0174713134765625, 0.01806640625, 0.0186614990234375, 0.019256591796875, 0.0198516845703125, 0.02044677734375, 0.0210418701171875, 0.021636962890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 3.0, 9.0, 6.0, 8.0, 12.0, 7.0, 12.0, 21.0, 17.0, 23.0, 32.0, 39.0, 51.0, 55.0, 59.0, 82.0, 85.0, 82.0, 81.0, 54.0, 47.0, 52.0, 18.0, 28.0, 20.0, 14.0, 15.0, 7.0, 12.0, 8.0, 5.0, 6.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2557716369628906e-05, -4.120729863643646e-05, -3.985688090324402e-05, -3.8506463170051575e-05, -3.715604543685913e-05, -3.580562770366669e-05, -3.445520997047424e-05, -3.31047922372818e-05, -3.1754374504089355e-05, -3.040395677089691e-05, -2.9053539037704468e-05, -2.7703121304512024e-05, -2.635270357131958e-05, -2.5002285838127136e-05, -2.3651868104934692e-05, -2.230145037174225e-05, -2.0951032638549805e-05, -1.960061490535736e-05, -1.8250197172164917e-05, -1.6899779438972473e-05, -1.554936170578003e-05, -1.4198943972587585e-05, -1.2848526239395142e-05, -1.1498108506202698e-05, -1.0147690773010254e-05, -8.79727303981781e-06, -7.446855306625366e-06, -6.096437573432922e-06, -4.7460198402404785e-06, -3.3956021070480347e-06, -2.045184373855591e-06, -6.94766640663147e-07, 6.556510925292969e-07, 2.0060688257217407e-06, 3.3564865589141846e-06, 4.706904292106628e-06, 6.057322025299072e-06, 7.407739758491516e-06, 8.75815749168396e-06, 1.0108575224876404e-05, 1.1458992958068848e-05, 1.2809410691261292e-05, 1.4159828424453735e-05, 1.551024615764618e-05, 1.6860663890838623e-05, 1.8211081624031067e-05, 1.956149935722351e-05, 2.0911917090415955e-05, 2.22623348236084e-05, 2.3612752556800842e-05, 2.4963170289993286e-05, 2.631358802318573e-05, 2.7664005756378174e-05, 2.9014423489570618e-05, 3.036484122276306e-05, 3.1715258955955505e-05, 3.306567668914795e-05, 3.441609442234039e-05, 3.576651215553284e-05, 3.711692988872528e-05, 3.8467347621917725e-05, 3.981776535511017e-05, 4.116818308830261e-05, 4.2518600821495056e-05, 4.38690185546875e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 11.0, 9.0, 12.0, 19.0, 33.0, 48.0, 96.0, 136.0, 230.0, 414.0, 855.0, 1921.0, 5484.0, 23791.0, 188287.0, 753053.0, 58237.0, 10407.0, 3074.0, 1194.0, 553.0, 282.0, 158.0, 82.0, 48.0, 35.0, 25.0, 9.0, 21.0, 12.0, 5.0, 7.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.02362060546875, -0.022968769073486328, -0.022316932678222656, -0.021665096282958984, -0.021013259887695312, -0.02036142349243164, -0.01970958709716797, -0.019057750701904297, -0.018405914306640625, -0.017754077911376953, -0.01710224151611328, -0.01645040512084961, -0.015798568725585938, -0.015146732330322266, -0.014494895935058594, -0.013843059539794922, -0.01319122314453125, -0.012539386749267578, -0.011887550354003906, -0.011235713958740234, -0.010583877563476562, -0.00993204116821289, -0.009280204772949219, -0.008628368377685547, -0.007976531982421875, -0.007324695587158203, -0.006672859191894531, -0.006021022796630859, -0.0053691864013671875, -0.004717350006103516, -0.004065513610839844, -0.003413677215576172, -0.0027618408203125, -0.002110004425048828, -0.0014581680297851562, -0.0008063316345214844, -0.0001544952392578125, 0.0004973411560058594, 0.0011491775512695312, 0.0018010139465332031, 0.002452850341796875, 0.003104686737060547, 0.0037565231323242188, 0.004408359527587891, 0.0050601959228515625, 0.005712032318115234, 0.006363868713378906, 0.007015705108642578, 0.00766754150390625, 0.008319377899169922, 0.008971214294433594, 0.009623050689697266, 0.010274887084960938, 0.01092672348022461, 0.011578559875488281, 0.012230396270751953, 0.012882232666015625, 0.013534069061279297, 0.014185905456542969, 0.01483774185180664, 0.015489578247070312, 0.016141414642333984, 0.016793251037597656, 0.017445087432861328, 0.018096923828125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 9.0, 6.0, 12.0, 13.0, 20.0, 24.0, 33.0, 33.0, 42.0, 44.0, 67.0, 76.0, 70.0, 82.0, 93.0, 62.0, 49.0, 43.0, 44.0, 33.0, 35.0, 17.0, 15.0, 18.0, 8.0, 14.0, 9.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01261138916015625, -0.01219475269317627, -0.011778116226196289, -0.011361479759216309, -0.010944843292236328, -0.010528206825256348, -0.010111570358276367, -0.009694933891296387, -0.009278297424316406, -0.008861660957336426, -0.008445024490356445, -0.008028388023376465, -0.007611751556396484, -0.007195115089416504, -0.0067784786224365234, -0.006361842155456543, -0.0059452056884765625, -0.005528569221496582, -0.0051119327545166016, -0.004695296287536621, -0.004278659820556641, -0.00386202335357666, -0.0034453868865966797, -0.0030287504196166992, -0.0026121139526367188, -0.0021954774856567383, -0.0017788410186767578, -0.0013622045516967773, -0.0009455680847167969, -0.0005289316177368164, -0.00011229515075683594, 0.00030434131622314453, 0.000720977783203125, 0.0011376142501831055, 0.001554250717163086, 0.0019708871841430664, 0.002387523651123047, 0.0028041601181030273, 0.003220796585083008, 0.0036374330520629883, 0.004054069519042969, 0.004470705986022949, 0.00488734245300293, 0.00530397891998291, 0.005720615386962891, 0.006137251853942871, 0.0065538883209228516, 0.006970524787902832, 0.0073871612548828125, 0.007803797721862793, 0.008220434188842773, 0.008637070655822754, 0.009053707122802734, 0.009470343589782715, 0.009886980056762695, 0.010303616523742676, 0.010720252990722656, 0.011136889457702637, 0.011553525924682617, 0.011970162391662598, 0.012386798858642578, 0.012803435325622559, 0.013220071792602539, 0.01363670825958252, 0.0140533447265625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 9.0, 43.0, 176.0, 505.0, 189.0, 55.0, 14.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7443504929542542, -0.7126302123069763, -0.6809099316596985, -0.6491896510124207, -0.6174694299697876, -0.5857491493225098, -0.5540288686752319, -0.5223085880279541, -0.49058830738067627, -0.45886802673339844, -0.4271477460861206, -0.39542749524116516, -0.36370721459388733, -0.3319869339466095, -0.30026668310165405, -0.2685464024543762, -0.2368261218070984, -0.20510584115982056, -0.17338557541370392, -0.14166530966758728, -0.10994502902030945, -0.07822474837303162, -0.04650448262691498, -0.01478421688079834, 0.016936063766479492, 0.04865633696317673, 0.08037661015987396, 0.1120968833565712, 0.14381715655326843, 0.17553743720054626, 0.2072577029466629, 0.23897796869277954, 0.27069830894470215, 0.30241858959198, 0.3341388702392578, 0.36585912108421326, 0.3975794017314911, 0.4292996823787689, 0.46101993322372437, 0.4927402138710022, 0.52446049451828, 0.5561807751655579, 0.5879010558128357, 0.6196213364601135, 0.6513415575027466, 0.6830618381500244, 0.7147821187973022, 0.7465023994445801, 0.7782226800918579, 0.8099429607391357, 0.8416632413864136, 0.8733835220336914, 0.9051038026809692, 0.9368240833282471, 0.9685443043708801, 1.0002646446228027, 1.031984806060791, 1.0637050867080688, 1.0954253673553467, 1.1271456480026245, 1.1588659286499023, 1.1905862092971802, 1.222306489944458, 1.2540266513824463, 1.2857470512390137]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 6.0, 4.0, 6.0, 9.0, 9.0, 19.0, 11.0, 19.0, 18.0, 14.0, 21.0, 28.0, 27.0, 28.0, 33.0, 37.0, 66.0, 98.0, 104.0, 80.0, 38.0, 40.0, 39.0, 27.0, 21.0, 27.0, 16.0, 21.0, 9.0, 20.0, 14.0, 17.0, 15.0, 5.0, 10.0, 3.0, 5.0, 5.0, 1.0, 6.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2552034258842468, -0.24712397158145905, -0.23904451727867126, -0.23096506297588348, -0.2228856086730957, -0.21480615437030792, -0.20672670006752014, -0.19864724576473236, -0.19056779146194458, -0.1824883371591568, -0.17440888285636902, -0.16632942855358124, -0.15824997425079346, -0.15017051994800568, -0.1420910656452179, -0.13401161134243011, -0.12593215703964233, -0.11785270273685455, -0.10977324843406677, -0.10169379413127899, -0.09361433982849121, -0.08553488552570343, -0.07745543122291565, -0.06937597692012787, -0.06129652261734009, -0.05321706831455231, -0.045137614011764526, -0.037058159708976746, -0.028978705406188965, -0.020899251103401184, -0.012819796800613403, -0.0047403424978256226, 0.003339111804962158, 0.011418566107749939, 0.01949802041053772, 0.0275774747133255, 0.03565692901611328, 0.04373638331890106, 0.05181583762168884, 0.059895291924476624, 0.0679747462272644, 0.07605420053005219, 0.08413365483283997, 0.09221310913562775, 0.10029256343841553, 0.10837201774120331, 0.11645147204399109, 0.12453092634677887, 0.13261038064956665, 0.14068983495235443, 0.1487692892551422, 0.15684874355793, 0.16492819786071777, 0.17300765216350555, 0.18108710646629333, 0.18916656076908112, 0.1972460150718689, 0.20532546937465668, 0.21340492367744446, 0.22148437798023224, 0.22956383228302002, 0.2376432865858078, 0.24572274088859558, 0.25380218029022217, 0.26188164949417114]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 6.0, 10.0, 23.0, 23.0, 37.0, 51.0, 66.0, 80.0, 119.0, 151.0, 221.0, 307.0, 501.0, 704.0, 1130.0, 1765.0, 3085.0, 5376.0, 10459.0, 22498.0, 58488.0, 196725.0, 823680.0, 1942106.0, 821778.0, 198645.0, 58807.0, 22830.0, 10628.0, 5520.0, 3162.0, 1794.0, 1156.0, 729.0, 457.0, 332.0, 220.0, 171.0, 108.0, 90.0, 68.0, 54.0, 22.0, 18.0, 17.0, 14.0, 7.0, 11.0, 4.0, 7.0, 3.0, 6.0, 4.0], "bins": [-0.0250396728515625, -0.024313926696777344, -0.023588180541992188, -0.02286243438720703, -0.022136688232421875, -0.02141094207763672, -0.020685195922851562, -0.019959449768066406, -0.01923370361328125, -0.018507957458496094, -0.017782211303710938, -0.01705646514892578, -0.016330718994140625, -0.015604972839355469, -0.014879226684570312, -0.014153480529785156, -0.013427734375, -0.012701988220214844, -0.011976242065429688, -0.011250495910644531, -0.010524749755859375, -0.009799003601074219, -0.009073257446289062, -0.008347511291503906, -0.00762176513671875, -0.006896018981933594, -0.0061702728271484375, -0.005444526672363281, -0.004718780517578125, -0.003993034362792969, -0.0032672882080078125, -0.0025415420532226562, -0.0018157958984375, -0.0010900497436523438, -0.0003643035888671875, 0.00036144256591796875, 0.001087188720703125, 0.0018129348754882812, 0.0025386810302734375, 0.0032644271850585938, 0.00399017333984375, 0.004715919494628906, 0.0054416656494140625, 0.006167411804199219, 0.006893157958984375, 0.007618904113769531, 0.008344650268554688, 0.009070396423339844, 0.009796142578125, 0.010521888732910156, 0.011247634887695312, 0.011973381042480469, 0.012699127197265625, 0.013424873352050781, 0.014150619506835938, 0.014876365661621094, 0.01560211181640625, 0.016327857971191406, 0.017053604125976562, 0.01777935028076172, 0.018505096435546875, 0.01923084259033203, 0.019956588745117188, 0.020682334899902344, 0.0214080810546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 11.0, 11.0, 14.0, 12.0, 9.0, 24.0, 26.0, 37.0, 38.0, 49.0, 58.0, 58.0, 56.0, 68.0, 58.0, 60.0, 55.0, 48.0, 65.0, 44.0, 37.0, 28.0, 28.0, 23.0, 13.0, 19.0, 10.0, 7.0, 12.0, 5.0, 7.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0183258056640625, -0.017743587493896484, -0.01716136932373047, -0.016579151153564453, -0.015996932983398438, -0.015414714813232422, -0.014832496643066406, -0.01425027847290039, -0.013668060302734375, -0.01308584213256836, -0.012503623962402344, -0.011921405792236328, -0.011339187622070312, -0.010756969451904297, -0.010174751281738281, -0.009592533111572266, -0.00901031494140625, -0.008428096771240234, -0.007845878601074219, -0.007263660430908203, -0.0066814422607421875, -0.006099224090576172, -0.005517005920410156, -0.004934787750244141, -0.004352569580078125, -0.0037703514099121094, -0.0031881332397460938, -0.002605915069580078, -0.0020236968994140625, -0.0014414787292480469, -0.0008592605590820312, -0.0002770423889160156, 0.00030517578125, 0.0008873939514160156, 0.0014696121215820312, 0.002051830291748047, 0.0026340484619140625, 0.003216266632080078, 0.0037984848022460938, 0.004380702972412109, 0.004962921142578125, 0.005545139312744141, 0.006127357482910156, 0.006709575653076172, 0.0072917938232421875, 0.007874011993408203, 0.008456230163574219, 0.009038448333740234, 0.00962066650390625, 0.010202884674072266, 0.010785102844238281, 0.011367321014404297, 0.011949539184570312, 0.012531757354736328, 0.013113975524902344, 0.01369619369506836, 0.014278411865234375, 0.01486063003540039, 0.015442848205566406, 0.016025066375732422, 0.016607284545898438, 0.017189502716064453, 0.01777172088623047, 0.018353939056396484, 0.0189361572265625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 11.0, 15.0, 32.0, 65.0, 134.0, 264.0, 604.0, 1757.0, 12176.0, 3765459.0, 405779.0, 5903.0, 1229.0, 451.0, 202.0, 86.0, 50.0, 19.0, 17.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1339111328125, -0.1282978057861328, -0.12268447875976562, -0.11707115173339844, -0.11145782470703125, -0.10584449768066406, -0.10023117065429688, -0.09461784362792969, -0.0890045166015625, -0.08339118957519531, -0.07777786254882812, -0.07216453552246094, -0.06655120849609375, -0.06093788146972656, -0.055324554443359375, -0.04971122741699219, -0.044097900390625, -0.03848457336425781, -0.032871246337890625, -0.027257919311523438, -0.02164459228515625, -0.016031265258789062, -0.010417938232421875, -0.0048046112060546875, 0.0008087158203125, 0.0064220428466796875, 0.012035369873046875, 0.017648696899414062, 0.02326202392578125, 0.028875350952148438, 0.034488677978515625, 0.04010200500488281, 0.04571533203125, 0.05132865905761719, 0.056941986083984375, 0.06255531311035156, 0.06816864013671875, 0.07378196716308594, 0.07939529418945312, 0.08500862121582031, 0.0906219482421875, 0.09623527526855469, 0.10184860229492188, 0.10746192932128906, 0.11307525634765625, 0.11868858337402344, 0.12430191040039062, 0.1299152374267578, 0.135528564453125, 0.1411418914794922, 0.14675521850585938, 0.15236854553222656, 0.15798187255859375, 0.16359519958496094, 0.16920852661132812, 0.1748218536376953, 0.1804351806640625, 0.1860485076904297, 0.19166183471679688, 0.19727516174316406, 0.20288848876953125, 0.20850181579589844, 0.21411514282226562, 0.2197284698486328, 0.225341796875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 9.0, 9.0, 13.0, 27.0, 18.0, 45.0, 64.0, 68.0, 103.0, 166.0, 266.0, 369.0, 659.0, 753.0, 513.0, 301.0, 230.0, 126.0, 97.0, 55.0, 48.0, 33.0, 32.0, 16.0, 11.0, 8.0, 5.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.08489990234375, -0.08267498016357422, -0.08045005798339844, -0.07822513580322266, -0.07600021362304688, -0.0737752914428711, -0.07155036926269531, -0.06932544708251953, -0.06710052490234375, -0.06487560272216797, -0.06265068054199219, -0.060425758361816406, -0.058200836181640625, -0.055975914001464844, -0.05375099182128906, -0.05152606964111328, -0.0493011474609375, -0.04707622528076172, -0.04485130310058594, -0.042626380920410156, -0.040401458740234375, -0.038176536560058594, -0.03595161437988281, -0.03372669219970703, -0.03150177001953125, -0.02927684783935547, -0.027051925659179688, -0.024827003479003906, -0.022602081298828125, -0.020377159118652344, -0.018152236938476562, -0.01592731475830078, -0.013702392578125, -0.011477470397949219, -0.009252548217773438, -0.007027626037597656, -0.004802703857421875, -0.0025777816772460938, -0.0003528594970703125, 0.0018720626831054688, 0.00409698486328125, 0.006321907043457031, 0.008546829223632812, 0.010771751403808594, 0.012996673583984375, 0.015221595764160156, 0.017446517944335938, 0.01967144012451172, 0.0218963623046875, 0.02412128448486328, 0.026346206665039062, 0.028571128845214844, 0.030796051025390625, 0.033020973205566406, 0.03524589538574219, 0.03747081756591797, 0.03969573974609375, 0.04192066192626953, 0.04414558410644531, 0.046370506286621094, 0.048595428466796875, 0.050820350646972656, 0.05304527282714844, 0.05527019500732422, 0.0574951171875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 10.0, 16.0, 18.0, 39.0, 65.0, 133.0, 202.0, 229.0, 124.0, 72.0, 35.0, 19.0, 12.0, 14.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9246997237205505, -0.8966338038444519, -0.8685678243637085, -0.8405019044876099, -0.8124359846115112, -0.7843700051307678, -0.7563040852546692, -0.7282381057739258, -0.7001721858978271, -0.6721062660217285, -0.6440402865409851, -0.6159743666648865, -0.5879083871841431, -0.5598424673080444, -0.5317765474319458, -0.5037106275558472, -0.47564464807510376, -0.44757869839668274, -0.4195127487182617, -0.3914468288421631, -0.36338087916374207, -0.33531492948532104, -0.3072490096092224, -0.2791830599308014, -0.25111711025238037, -0.22305116057395935, -0.19498522579669952, -0.1669192910194397, -0.13885334134101868, -0.11078739166259766, -0.08272145688533783, -0.054655522108078, -0.026589512825012207, 0.0014764294028282166, 0.02954237163066864, 0.057608313858509064, 0.08567425608634949, 0.11374020576477051, 0.14180614054203033, 0.16987207531929016, 0.19793802499771118, 0.2260039746761322, 0.2540699243545532, 0.28213584423065186, 0.3102017939090729, 0.3382677435874939, 0.36633366346359253, 0.39439961314201355, 0.42246556282043457, 0.4505315124988556, 0.4785974621772766, 0.5066633820533752, 0.5347293615341187, 0.5627952814102173, 0.5908612012863159, 0.6189271211624146, 0.646993100643158, 0.6750590205192566, 0.703125, 0.7311909198760986, 0.7592568397521973, 0.7873228192329407, 0.8153887391090393, 0.8434547185897827, 0.8715206384658813]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 9.0, 14.0, 8.0, 11.0, 23.0, 23.0, 24.0, 18.0, 25.0, 32.0, 32.0, 43.0, 33.0, 42.0, 46.0, 60.0, 63.0, 63.0, 54.0, 58.0, 39.0, 47.0, 38.0, 36.0, 31.0, 20.0, 18.0, 19.0, 14.0, 5.0, 9.0, 8.0, 4.0, 4.0, 6.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4024389386177063, -0.39043498039245605, -0.3784310221672058, -0.36642709374427795, -0.3544231355190277, -0.34241917729377747, -0.3304152488708496, -0.31841129064559937, -0.3064073324203491, -0.2944033741950989, -0.28239941596984863, -0.2703954875469208, -0.25839152932167053, -0.2463875710964203, -0.23438362777233124, -0.2223796844482422, -0.21037572622299194, -0.1983717679977417, -0.18636782467365265, -0.1743638813495636, -0.16235992312431335, -0.1503559648990631, -0.13835202157497406, -0.126348078250885, -0.11434412002563477, -0.10234016925096512, -0.09033621847629547, -0.07833226770162582, -0.06632831692695618, -0.05432436615228653, -0.04232041537761688, -0.030316464602947235, -0.018312513828277588, -0.006308563053607941, 0.0056953877210617065, 0.017699338495731354, 0.029703289270401, 0.04170724004507065, 0.053711190819740295, 0.06571514159440994, 0.07771909236907959, 0.08972304314374924, 0.10172699391841888, 0.11373094469308853, 0.12573489546775818, 0.13773885369300842, 0.14974279701709747, 0.16174674034118652, 0.17375069856643677, 0.185754656791687, 0.19775860011577606, 0.2097625434398651, 0.22176650166511536, 0.2337704598903656, 0.24577440321445465, 0.2577783465385437, 0.26978230476379395, 0.2817862629890442, 0.29379022121429443, 0.3057941496372223, 0.31779810786247253, 0.3298020660877228, 0.34180599451065063, 0.3538099527359009, 0.3658139109611511]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 4.0, 14.0, 11.0, 31.0, 33.0, 39.0, 64.0, 109.0, 172.0, 266.0, 570.0, 1014.0, 2202.0, 4674.0, 12078.0, 39509.0, 201085.0, 649884.0, 97895.0, 23922.0, 8127.0, 3476.0, 1565.0, 745.0, 441.0, 223.0, 150.0, 91.0, 59.0, 26.0, 28.0, 17.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.042083740234375, -0.04089164733886719, -0.039699554443359375, -0.03850746154785156, -0.03731536865234375, -0.03612327575683594, -0.034931182861328125, -0.03373908996582031, -0.0325469970703125, -0.03135490417480469, -0.030162811279296875, -0.028970718383789062, -0.02777862548828125, -0.026586532592773438, -0.025394439697265625, -0.024202346801757812, -0.02301025390625, -0.021818161010742188, -0.020626068115234375, -0.019433975219726562, -0.01824188232421875, -0.017049789428710938, -0.015857696533203125, -0.014665603637695312, -0.0134735107421875, -0.012281417846679688, -0.011089324951171875, -0.009897232055664062, -0.00870513916015625, -0.0075130462646484375, -0.006320953369140625, -0.0051288604736328125, -0.003936767578125, -0.0027446746826171875, -0.001552581787109375, -0.0003604888916015625, 0.00083160400390625, 0.0020236968994140625, 0.003215789794921875, 0.0044078826904296875, 0.0055999755859375, 0.0067920684814453125, 0.007984161376953125, 0.009176254272460938, 0.01036834716796875, 0.011560440063476562, 0.012752532958984375, 0.013944625854492188, 0.01513671875, 0.016328811645507812, 0.017520904541015625, 0.018712997436523438, 0.01990509033203125, 0.021097183227539062, 0.022289276123046875, 0.023481369018554688, 0.0246734619140625, 0.025865554809570312, 0.027057647705078125, 0.028249740600585938, 0.02944183349609375, 0.030633926391601562, 0.031826019287109375, 0.03301811218261719, 0.034210205078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 10.0, 9.0, 7.0, 14.0, 17.0, 22.0, 22.0, 47.0, 51.0, 52.0, 70.0, 68.0, 61.0, 85.0, 81.0, 61.0, 65.0, 51.0, 51.0, 46.0, 24.0, 20.0, 15.0, 14.0, 10.0, 13.0, 5.0, 9.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03302001953125, -0.032064199447631836, -0.031108379364013672, -0.030152559280395508, -0.029196739196777344, -0.02824091911315918, -0.027285099029541016, -0.02632927894592285, -0.025373458862304688, -0.024417638778686523, -0.02346181869506836, -0.022505998611450195, -0.02155017852783203, -0.020594358444213867, -0.019638538360595703, -0.01868271827697754, -0.017726898193359375, -0.01677107810974121, -0.015815258026123047, -0.014859437942504883, -0.013903617858886719, -0.012947797775268555, -0.01199197769165039, -0.011036157608032227, -0.010080337524414062, -0.009124517440795898, -0.008168697357177734, -0.00721287727355957, -0.006257057189941406, -0.005301237106323242, -0.004345417022705078, -0.003389596939086914, -0.00243377685546875, -0.001477956771850586, -0.0005221366882324219, 0.0004336833953857422, 0.0013895034790039062, 0.0023453235626220703, 0.0033011436462402344, 0.0042569637298583984, 0.0052127838134765625, 0.0061686038970947266, 0.007124423980712891, 0.008080244064331055, 0.009036064147949219, 0.009991884231567383, 0.010947704315185547, 0.011903524398803711, 0.012859344482421875, 0.013815164566040039, 0.014770984649658203, 0.015726804733276367, 0.01668262481689453, 0.017638444900512695, 0.01859426498413086, 0.019550085067749023, 0.020505905151367188, 0.02146172523498535, 0.022417545318603516, 0.02337336540222168, 0.024329185485839844, 0.025285005569458008, 0.026240825653076172, 0.027196645736694336, 0.0281524658203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 5.0, 4.0, 8.0, 9.0, 15.0, 14.0, 36.0, 45.0, 76.0, 114.0, 155.0, 272.0, 588.0, 1455.0, 5383.0, 41575.0, 935879.0, 53666.0, 6136.0, 1654.0, 649.0, 299.0, 174.0, 100.0, 56.0, 59.0, 26.0, 26.0, 14.0, 15.0, 8.0, 9.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0654296875, -0.06341934204101562, -0.06140899658203125, -0.059398651123046875, -0.0573883056640625, -0.055377960205078125, -0.05336761474609375, -0.051357269287109375, -0.049346923828125, -0.047336578369140625, -0.04532623291015625, -0.043315887451171875, -0.0413055419921875, -0.039295196533203125, -0.03728485107421875, -0.035274505615234375, -0.03326416015625, -0.031253814697265625, -0.02924346923828125, -0.027233123779296875, -0.0252227783203125, -0.023212432861328125, -0.02120208740234375, -0.019191741943359375, -0.017181396484375, -0.015171051025390625, -0.01316070556640625, -0.011150360107421875, -0.0091400146484375, -0.007129669189453125, -0.00511932373046875, -0.003108978271484375, -0.0010986328125, 0.000911712646484375, 0.00292205810546875, 0.004932403564453125, 0.0069427490234375, 0.008953094482421875, 0.01096343994140625, 0.012973785400390625, 0.014984130859375, 0.016994476318359375, 0.01900482177734375, 0.021015167236328125, 0.0230255126953125, 0.025035858154296875, 0.02704620361328125, 0.029056549072265625, 0.03106689453125, 0.033077239990234375, 0.03508758544921875, 0.037097930908203125, 0.0391082763671875, 0.041118621826171875, 0.04312896728515625, 0.045139312744140625, 0.047149658203125, 0.049160003662109375, 0.05117034912109375, 0.053180694580078125, 0.0551910400390625, 0.057201385498046875, 0.05921173095703125, 0.061222076416015625, 0.063232421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 5.0, 7.0, 9.0, 8.0, 15.0, 14.0, 17.0, 19.0, 17.0, 30.0, 46.0, 34.0, 40.0, 53.0, 71.0, 79.0, 75.0, 61.0, 56.0, 53.0, 41.0, 43.0, 36.0, 32.0, 21.0, 14.0, 21.0, 19.0, 13.0, 14.0, 3.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.07904052734375, -0.07653427124023438, -0.07402801513671875, -0.07152175903320312, -0.0690155029296875, -0.06650924682617188, -0.06400299072265625, -0.061496734619140625, -0.058990478515625, -0.056484222412109375, -0.05397796630859375, -0.051471710205078125, -0.0489654541015625, -0.046459197998046875, -0.04395294189453125, -0.041446685791015625, -0.0389404296875, -0.036434173583984375, -0.03392791748046875, -0.031421661376953125, -0.0289154052734375, -0.026409149169921875, -0.02390289306640625, -0.021396636962890625, -0.018890380859375, -0.016384124755859375, -0.01387786865234375, -0.011371612548828125, -0.0088653564453125, -0.006359100341796875, -0.00385284423828125, -0.001346588134765625, 0.00115966796875, 0.003665924072265625, 0.00617218017578125, 0.008678436279296875, 0.0111846923828125, 0.013690948486328125, 0.01619720458984375, 0.018703460693359375, 0.021209716796875, 0.023715972900390625, 0.02622222900390625, 0.028728485107421875, 0.0312347412109375, 0.033740997314453125, 0.03624725341796875, 0.038753509521484375, 0.041259765625, 0.043766021728515625, 0.04627227783203125, 0.048778533935546875, 0.0512847900390625, 0.053791046142578125, 0.05629730224609375, 0.058803558349609375, 0.061309814453125, 0.06381607055664062, 0.06632232666015625, 0.06882858276367188, 0.0713348388671875, 0.07384109497070312, 0.07634735107421875, 0.07885360717773438, 0.08135986328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 4.0, 6.0, 10.0, 6.0, 8.0, 9.0, 22.0, 27.0, 20.0, 41.0, 52.0, 106.0, 150.0, 311.0, 516.0, 1345.0, 4490.0, 22859.0, 926044.0, 78894.0, 9502.0, 2375.0, 798.0, 372.0, 218.0, 105.0, 71.0, 53.0, 32.0, 32.0, 20.0, 7.0, 12.0, 9.0, 7.0, 4.0, 8.0, 5.0, 2.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0173492431640625, -0.016849994659423828, -0.016350746154785156, -0.015851497650146484, -0.015352249145507812, -0.01485300064086914, -0.014353752136230469, -0.013854503631591797, -0.013355255126953125, -0.012856006622314453, -0.012356758117675781, -0.01185750961303711, -0.011358261108398438, -0.010859012603759766, -0.010359764099121094, -0.009860515594482422, -0.00936126708984375, -0.008862018585205078, -0.008362770080566406, -0.007863521575927734, -0.0073642730712890625, -0.006865024566650391, -0.006365776062011719, -0.005866527557373047, -0.005367279052734375, -0.004868030548095703, -0.004368782043457031, -0.0038695335388183594, -0.0033702850341796875, -0.0028710365295410156, -0.0023717880249023438, -0.0018725395202636719, -0.001373291015625, -0.0008740425109863281, -0.00037479400634765625, 0.00012445449829101562, 0.0006237030029296875, 0.0011229515075683594, 0.0016222000122070312, 0.002121448516845703, 0.002620697021484375, 0.003119945526123047, 0.0036191940307617188, 0.004118442535400391, 0.0046176910400390625, 0.005116939544677734, 0.005616188049316406, 0.006115436553955078, 0.00661468505859375, 0.007113933563232422, 0.007613182067871094, 0.008112430572509766, 0.008611679077148438, 0.00911092758178711, 0.009610176086425781, 0.010109424591064453, 0.010608673095703125, 0.011107921600341797, 0.011607170104980469, 0.01210641860961914, 0.012605667114257812, 0.013104915618896484, 0.013604164123535156, 0.014103412628173828, 0.0146026611328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 8.0, 10.0, 7.0, 20.0, 21.0, 30.0, 28.0, 30.0, 51.0, 90.0, 99.0, 119.0, 106.0, 75.0, 51.0, 43.0, 36.0, 30.0, 27.0, 21.0, 13.0, 6.0, 11.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0], "bins": [-5.1975250244140625e-05, -5.0324946641922e-05, -4.867464303970337e-05, -4.702433943748474e-05, -4.537403583526611e-05, -4.3723732233047485e-05, -4.207342863082886e-05, -4.042312502861023e-05, -3.87728214263916e-05, -3.7122517824172974e-05, -3.5472214221954346e-05, -3.382191061973572e-05, -3.217160701751709e-05, -3.052130341529846e-05, -2.8870999813079834e-05, -2.7220696210861206e-05, -2.5570392608642578e-05, -2.392008900642395e-05, -2.2269785404205322e-05, -2.0619481801986694e-05, -1.8969178199768066e-05, -1.731887459754944e-05, -1.566857099533081e-05, -1.4018267393112183e-05, -1.2367963790893555e-05, -1.0717660188674927e-05, -9.067356586456299e-06, -7.417052984237671e-06, -5.766749382019043e-06, -4.116445779800415e-06, -2.466142177581787e-06, -8.158385753631592e-07, 8.344650268554688e-07, 2.4847686290740967e-06, 4.135072231292725e-06, 5.7853758335113525e-06, 7.4356794357299805e-06, 9.085983037948608e-06, 1.0736286640167236e-05, 1.2386590242385864e-05, 1.4036893844604492e-05, 1.568719744682312e-05, 1.7337501049041748e-05, 1.8987804651260376e-05, 2.0638108253479004e-05, 2.2288411855697632e-05, 2.393871545791626e-05, 2.5589019060134888e-05, 2.7239322662353516e-05, 2.8889626264572144e-05, 3.053992986679077e-05, 3.21902334690094e-05, 3.384053707122803e-05, 3.5490840673446655e-05, 3.714114427566528e-05, 3.879144787788391e-05, 4.044175148010254e-05, 4.209205508232117e-05, 4.3742358684539795e-05, 4.539266228675842e-05, 4.704296588897705e-05, 4.869326949119568e-05, 5.034357309341431e-05, 5.1993876695632935e-05, 5.364418029785156e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 4.0, 12.0, 12.0, 19.0, 29.0, 31.0, 45.0, 90.0, 137.0, 212.0, 331.0, 611.0, 1277.0, 2981.0, 8725.0, 42636.0, 916522.0, 57774.0, 10609.0, 3390.0, 1341.0, 712.0, 381.0, 230.0, 140.0, 86.0, 54.0, 49.0, 31.0, 15.0, 20.0, 10.0, 9.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.013275146484375, -0.012840867042541504, -0.012406587600708008, -0.011972308158874512, -0.011538028717041016, -0.01110374927520752, -0.010669469833374023, -0.010235190391540527, -0.009800910949707031, -0.009366631507873535, -0.008932352066040039, -0.008498072624206543, -0.008063793182373047, -0.007629513740539551, -0.007195234298706055, -0.006760954856872559, -0.0063266754150390625, -0.005892395973205566, -0.00545811653137207, -0.005023837089538574, -0.004589557647705078, -0.004155278205871582, -0.003720998764038086, -0.00328671932220459, -0.0028524398803710938, -0.0024181604385375977, -0.0019838809967041016, -0.0015496015548706055, -0.0011153221130371094, -0.0006810426712036133, -0.0002467632293701172, 0.0001875162124633789, 0.000621795654296875, 0.001056075096130371, 0.0014903545379638672, 0.0019246339797973633, 0.0023589134216308594, 0.0027931928634643555, 0.0032274723052978516, 0.0036617517471313477, 0.004096031188964844, 0.00453031063079834, 0.004964590072631836, 0.005398869514465332, 0.005833148956298828, 0.006267428398132324, 0.00670170783996582, 0.007135987281799316, 0.0075702667236328125, 0.008004546165466309, 0.008438825607299805, 0.0088731050491333, 0.009307384490966797, 0.009741663932800293, 0.010175943374633789, 0.010610222816467285, 0.011044502258300781, 0.011478781700134277, 0.011913061141967773, 0.01234734058380127, 0.012781620025634766, 0.013215899467468262, 0.013650178909301758, 0.014084458351135254, 0.01451873779296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 12.0, 3.0, 9.0, 10.0, 9.0, 14.0, 27.0, 48.0, 114.0, 256.0, 226.0, 107.0, 44.0, 28.0, 17.0, 15.0, 9.0, 9.0, 5.0, 9.0, 6.0, 5.0, 4.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01430511474609375, -0.013773798942565918, -0.013242483139038086, -0.012711167335510254, -0.012179851531982422, -0.01164853572845459, -0.011117219924926758, -0.010585904121398926, -0.010054588317871094, -0.009523272514343262, -0.00899195671081543, -0.008460640907287598, -0.007929325103759766, -0.007398009300231934, -0.0068666934967041016, -0.0063353776931762695, -0.0058040618896484375, -0.0052727460861206055, -0.0047414302825927734, -0.004210114479064941, -0.0036787986755371094, -0.0031474828720092773, -0.0026161670684814453, -0.0020848512649536133, -0.0015535354614257812, -0.0010222196578979492, -0.0004909038543701172, 4.0411949157714844e-05, 0.0005717277526855469, 0.001103043556213379, 0.001634359359741211, 0.002165675163269043, 0.002696990966796875, 0.003228306770324707, 0.003759622573852539, 0.004290938377380371, 0.004822254180908203, 0.005353569984436035, 0.005884885787963867, 0.006416201591491699, 0.006947517395019531, 0.007478833198547363, 0.008010149002075195, 0.008541464805603027, 0.00907278060913086, 0.009604096412658691, 0.010135412216186523, 0.010666728019714355, 0.011198043823242188, 0.01172935962677002, 0.012260675430297852, 0.012791991233825684, 0.013323307037353516, 0.013854622840881348, 0.01438593864440918, 0.014917254447937012, 0.015448570251464844, 0.015979886054992676, 0.016511201858520508, 0.01704251766204834, 0.017573833465576172, 0.018105149269104004, 0.018636465072631836, 0.019167780876159668, 0.0196990966796875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 10.0, 10.0, 40.0, 90.0, 528.0, 160.0, 76.0, 46.0, 17.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23220795392990112, -0.21643856167793274, -0.20066916942596436, -0.18489976227283478, -0.1691303700208664, -0.153360977768898, -0.13759157061576843, -0.12182217836380005, -0.10605278611183167, -0.09028339385986328, -0.0745139941573143, -0.05874459818005562, -0.042975202202796936, -0.027205809950828552, -0.011436410248279572, 0.004332989454269409, 0.020102381706237793, 0.035871777683496475, 0.05164117366075516, 0.06741057336330414, 0.08317996561527252, 0.0989493578672409, 0.11471875756978989, 0.13048815727233887, 0.14625754952430725, 0.16202694177627563, 0.17779633402824402, 0.1935657411813736, 0.20933513343334198, 0.22510452568531036, 0.24087393283843994, 0.2566433250904083, 0.27241265773773193, 0.2881820499897003, 0.3039514422416687, 0.3197208344936371, 0.33549022674560547, 0.35125964879989624, 0.3670290410518646, 0.382798433303833, 0.3985678255558014, 0.4143372178077698, 0.43010661005973816, 0.44587600231170654, 0.4616454243659973, 0.4774147868156433, 0.4931842088699341, 0.5089535713195801, 0.5247229933738708, 0.5404924154281616, 0.5562617778778076, 0.5720311999320984, 0.5878005623817444, 0.6035699844360352, 0.6193393468856812, 0.6351087689399719, 0.6508781909942627, 0.6666476130485535, 0.6824169754981995, 0.6981863975524902, 0.7139557600021362, 0.729725182056427, 0.745494544506073, 0.7612639665603638, 0.7770333290100098]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 6.0, 11.0, 11.0, 18.0, 15.0, 20.0, 23.0, 24.0, 22.0, 43.0, 39.0, 131.0, 313.0, 89.0, 34.0, 22.0, 33.0, 24.0, 21.0, 27.0, 19.0, 8.0, 16.0, 8.0, 2.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1979086995124817, -0.18863563239574432, -0.17936256527900696, -0.1700894981622696, -0.16081643104553223, -0.15154334902763367, -0.1422702819108963, -0.13299721479415894, -0.12372414767742157, -0.1144510805606842, -0.10517801344394684, -0.09590493887662888, -0.08663187175989151, -0.07735880464315414, -0.06808573007583618, -0.058812662959098816, -0.04953959584236145, -0.040266528725624084, -0.03099345788359642, -0.021720388904213905, -0.01244731992483139, -0.0031742528080940247, 0.0060988180339336395, 0.015371888875961304, 0.02464495599269867, 0.033918023109436035, 0.0431910939514637, 0.052464164793491364, 0.06173723191022873, 0.0710102990269661, 0.08028337359428406, 0.08955644071102142, 0.09882950782775879, 0.10810257494449615, 0.11737564206123352, 0.1266487091779709, 0.13592177629470825, 0.1451948583126068, 0.15446792542934418, 0.16374099254608154, 0.1730140596628189, 0.18228712677955627, 0.19156019389629364, 0.200833261013031, 0.21010634303092957, 0.21937939524650574, 0.2286524772644043, 0.23792554438114166, 0.24719861149787903, 0.2564716935157776, 0.26574474573135376, 0.2750178277492523, 0.2842908799648285, 0.29356396198272705, 0.3028370141983032, 0.3121100962162018, 0.32138317823410034, 0.3306562602519989, 0.3399293124675751, 0.34920239448547363, 0.3584754467010498, 0.36774852871894836, 0.37702158093452454, 0.3862946629524231, 0.39556771516799927]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 2.0, 8.0, 3.0, 6.0, 11.0, 13.0, 11.0, 15.0, 11.0, 23.0, 16.0, 15.0, 27.0, 22.0, 22.0, 36.0, 34.0, 95.0, 227.0, 92.0, 40.0, 35.0, 26.0, 30.0, 16.0, 20.0, 15.0, 21.0, 14.0, 11.0, 10.0, 11.0, 10.0, 3.0, 6.0, 7.0, 3.0, 5.0, 5.0, 4.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.0166778564453125, -0.01616644859313965, -0.015655040740966797, -0.015143632888793945, -0.014632225036621094, -0.014120817184448242, -0.01360940933227539, -0.013098001480102539, -0.012586593627929688, -0.012075185775756836, -0.011563777923583984, -0.011052370071411133, -0.010540962219238281, -0.01002955436706543, -0.009518146514892578, -0.009006738662719727, -0.008495330810546875, -0.007983922958374023, -0.007472515106201172, -0.00696110725402832, -0.006449699401855469, -0.005938291549682617, -0.005426883697509766, -0.004915475845336914, -0.0044040679931640625, -0.003892660140991211, -0.0033812522888183594, -0.002869844436645508, -0.0023584365844726562, -0.0018470287322998047, -0.0013356208801269531, -0.0008242130279541016, -0.00031280517578125, 0.00019860267639160156, 0.0007100105285644531, 0.0012214183807373047, 0.0017328262329101562, 0.002244234085083008, 0.0027556419372558594, 0.003267049789428711, 0.0037784576416015625, 0.004289865493774414, 0.004801273345947266, 0.005312681198120117, 0.005824089050292969, 0.00633549690246582, 0.006846904754638672, 0.0073583126068115234, 0.007869720458984375, 0.008381128311157227, 0.008892536163330078, 0.00940394401550293, 0.009915351867675781, 0.010426759719848633, 0.010938167572021484, 0.011449575424194336, 0.011960983276367188, 0.012472391128540039, 0.01298379898071289, 0.013495206832885742, 0.014006614685058594, 0.014518022537231445, 0.015029430389404297, 0.015540838241577148, 0.01605224609375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 1.0, 9.0, 16.0, 7.0, 16.0, 19.0, 46.0, 56.0, 166.0, 320.0, 818.0, 3056.0, 22070.0, 8347625.0, 11213.0, 2011.0, 648.0, 231.0, 99.0, 44.0, 35.0, 26.0, 24.0, 9.0, 4.0, 7.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2597764730453491, -0.25243186950683594, -0.24508728086948395, -0.23774269223213196, -0.23039808869361877, -0.22305350005626678, -0.2157088965177536, -0.2083643078804016, -0.20101970434188843, -0.19367511570453644, -0.18633051216602325, -0.17898592352867126, -0.17164131999015808, -0.1642967313528061, -0.1569521278142929, -0.14960753917694092, -0.14226293563842773, -0.13491834700107574, -0.12757374346256256, -0.12022914737462997, -0.11288455128669739, -0.1055399626493454, -0.09819535911083221, -0.09085077047348022, -0.08350618183612823, -0.07616158574819565, -0.06881698966026306, -0.061472393572330475, -0.05412779748439789, -0.0467832051217556, -0.03943860903382301, -0.03209401294589043, -0.02474941313266754, -0.017404817044734955, -0.010060221888124943, -0.0027156267315149307, 0.004628969356417656, 0.011973563581705093, 0.01931815966963768, 0.026662755757570267, 0.03400735184550285, 0.04135194793343544, 0.04869654402136803, 0.056041136384010315, 0.0633857324719429, 0.07073032855987549, 0.07807492464780807, 0.08541952073574066, 0.09276411682367325, 0.10010871291160583, 0.10745330899953842, 0.11479790508747101, 0.1221425011754036, 0.12948709726333618, 0.13683168590068817, 0.14417628943920135, 0.15152087807655334, 0.15886546671390533, 0.16621007025241852, 0.1735546588897705, 0.1808992624282837, 0.18824385106563568, 0.19558845460414886, 0.20293304324150085, 0.21027764678001404]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 7.0, 6.0, 1.0, 3.0, 3.0, 1.0, 6.0, 4.0, 6.0, 2.0, 6.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21082796156406403, -0.20547974109649658, -0.20013152062892914, -0.1947833001613617, -0.18943509459495544, -0.184086874127388, -0.17873865365982056, -0.1733904331922531, -0.16804221272468567, -0.16269399225711823, -0.15734577178955078, -0.15199756622314453, -0.1466493457555771, -0.14130112528800964, -0.1359529048204422, -0.13060468435287476, -0.1252564787864685, -0.11990825831890106, -0.11456004530191422, -0.10921182483434677, -0.10386361181735992, -0.09851539134979248, -0.09316717088222504, -0.08781895041465759, -0.08247073739767075, -0.0771225169301033, -0.07177430391311646, -0.06642608344554901, -0.061077866703271866, -0.05572964996099472, -0.05038142949342728, -0.04503321275115013, -0.03968498110771179, -0.03433676436543465, -0.028988545760512352, -0.023640327155590057, -0.018292110413312912, -0.012943893671035767, -0.007595673203468323, -0.0022474564611911774, 0.003100760281085968, 0.008448977954685688, 0.013797195628285408, 0.019145414233207703, 0.024493630975484848, 0.029841847717761993, 0.03519006818532944, 0.04053828492760658, 0.04588650166988373, 0.05123471841216087, 0.05658293515443802, 0.06193115562200546, 0.06727936863899231, 0.07262758910655975, 0.0779758095741272, 0.08332403004169464, 0.08867224305868149, 0.09402046352624893, 0.09936867654323578, 0.10471689701080322, 0.11006511747837067, 0.11541333049535751, 0.12076155096292496, 0.1261097639799118, 0.13145798444747925]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 6.0, 8.0, 18.0, 20.0, 23.0, 24.0, 54.0, 73.0, 115.0, 220.0, 335.0, 605.0, 1142.0, 2440.0, 5584.0, 14657.0, 42091.0, 137764.0, 206584.0, 73232.0, 23726.0, 8532.0, 3447.0, 1650.0, 800.0, 418.0, 242.0, 147.0, 95.0, 70.0, 39.0, 30.0, 22.0, 17.0, 13.0, 6.0, 3.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1739501953125, -0.1681957244873047, -0.16244125366210938, -0.15668678283691406, -0.15093231201171875, -0.14517784118652344, -0.13942337036132812, -0.1336688995361328, -0.1279144287109375, -0.12215995788574219, -0.11640548706054688, -0.11065101623535156, -0.10489654541015625, -0.09914207458496094, -0.09338760375976562, -0.08763313293457031, -0.081878662109375, -0.07612419128417969, -0.07036972045898438, -0.06461524963378906, -0.05886077880859375, -0.05310630798339844, -0.047351837158203125, -0.04159736633300781, -0.0358428955078125, -0.030088424682617188, -0.024333953857421875, -0.018579483032226562, -0.01282501220703125, -0.0070705413818359375, -0.001316070556640625, 0.0044384002685546875, 0.01019287109375, 0.015947341918945312, 0.021701812744140625, 0.027456283569335938, 0.03321075439453125, 0.03896522521972656, 0.044719696044921875, 0.05047416687011719, 0.0562286376953125, 0.06198310852050781, 0.06773757934570312, 0.07349205017089844, 0.07924652099609375, 0.08500099182128906, 0.09075546264648438, 0.09650993347167969, 0.102264404296875, 0.10801887512207031, 0.11377334594726562, 0.11952781677246094, 0.12528228759765625, 0.13103675842285156, 0.13679122924804688, 0.1425457000732422, 0.1483001708984375, 0.1540546417236328, 0.15980911254882812, 0.16556358337402344, 0.17131805419921875, 0.17707252502441406, 0.18282699584960938, 0.1885814666748047, 0.1943359375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 16.0, 15.0, 21.0, 28.0, 42.0, 56.0, 68.0, 79.0, 102.0, 106.0, 116.0, 93.0, 60.0, 50.0, 44.0, 24.0, 23.0, 12.0, 5.0, 17.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039459228515625, -0.03837132453918457, -0.03728342056274414, -0.03619551658630371, -0.03510761260986328, -0.03401970863342285, -0.03293180465698242, -0.03184390068054199, -0.030755996704101562, -0.029668092727661133, -0.028580188751220703, -0.027492284774780273, -0.026404380798339844, -0.025316476821899414, -0.024228572845458984, -0.023140668869018555, -0.022052764892578125, -0.020964860916137695, -0.019876956939697266, -0.018789052963256836, -0.017701148986816406, -0.016613245010375977, -0.015525341033935547, -0.014437437057495117, -0.013349533081054688, -0.012261629104614258, -0.011173725128173828, -0.010085821151733398, -0.008997917175292969, -0.007910013198852539, -0.006822109222412109, -0.00573420524597168, -0.00464630126953125, -0.0035583972930908203, -0.0024704933166503906, -0.001382589340209961, -0.00029468536376953125, 0.0007932186126708984, 0.0018811225891113281, 0.002969026565551758, 0.0040569305419921875, 0.005144834518432617, 0.006232738494873047, 0.0073206424713134766, 0.008408546447753906, 0.009496450424194336, 0.010584354400634766, 0.011672258377075195, 0.012760162353515625, 0.013848066329956055, 0.014935970306396484, 0.016023874282836914, 0.017111778259277344, 0.018199682235717773, 0.019287586212158203, 0.020375490188598633, 0.021463394165039062, 0.022551298141479492, 0.023639202117919922, 0.02472710609436035, 0.02581501007080078, 0.02690291404724121, 0.02799081802368164, 0.02907872200012207, 0.0301666259765625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 7.0, 9.0, 11.0, 21.0, 36.0, 77.0, 125.0, 86.0, 44.0, 22.0, 14.0, 5.0, 4.0, 3.0, 5.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24039745330810547, -0.23246397078037262, -0.22453050315380096, -0.21659702062606812, -0.20866355299949646, -0.2007300704717636, -0.19279658794403076, -0.1848631203174591, -0.17692965269088745, -0.1689961701631546, -0.16106270253658295, -0.1531292200088501, -0.14519575238227844, -0.1372622698545456, -0.12932878732681274, -0.12139531970024109, -0.11346183717250824, -0.10552836209535599, -0.09759488701820374, -0.08966140449047089, -0.08172793686389923, -0.07379445433616638, -0.06586097925901413, -0.05792750418186188, -0.049994029104709625, -0.04206055402755737, -0.03412707895040512, -0.02619360014796257, -0.018260125070810318, -0.010326649993658066, -0.002393171191215515, 0.005540303885936737, 0.01347377896308899, 0.02140725404024124, 0.029340730980038643, 0.037274207919836044, 0.045207682996988297, 0.05314115807414055, 0.0610746368765831, 0.06900811195373535, 0.0769415870308876, 0.08487506210803986, 0.09280853718519211, 0.10074201226234436, 0.10867549479007721, 0.11660896241664886, 0.12454244494438171, 0.13247591257095337, 0.14040939509868622, 0.14834287762641907, 0.15627634525299072, 0.16420982778072357, 0.17214329540729523, 0.18007677793502808, 0.18801024556159973, 0.19594372808933258, 0.20387721061706543, 0.21181069314479828, 0.21974416077136993, 0.22767764329910278, 0.23561111092567444, 0.2435445934534073, 0.25147807598114014, 0.2594115436077118, 0.26734501123428345]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 6.0, 4.0, 12.0, 16.0, 19.0, 57.0, 82.0, 93.0, 67.0, 35.0, 17.0, 7.0, 5.0, 4.0, 4.0, 6.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13171684741973877, -0.12739770114421844, -0.12307855486869812, -0.1187594085931778, -0.11444026231765747, -0.11012111604213715, -0.10580196976661682, -0.1014828234910965, -0.09716367721557617, -0.09284453094005585, -0.08852538466453552, -0.0842062383890152, -0.07988709211349487, -0.07556794583797455, -0.07124879956245422, -0.0669296532869339, -0.06261050701141357, -0.05829136073589325, -0.053972214460372925, -0.0496530681848526, -0.045333921909332275, -0.04101477563381195, -0.036695629358291626, -0.0323764830827713, -0.028057336807250977, -0.023738190531730652, -0.019419044256210327, -0.015099897980690002, -0.010780751705169678, -0.006461605429649353, -0.0021424591541290283, 0.0021766871213912964, 0.006495833396911621, 0.010814979672431946, 0.01513412594795227, 0.019453272223472595, 0.02377241849899292, 0.028091564774513245, 0.03241071105003357, 0.036729857325553894, 0.04104900360107422, 0.04536814987659454, 0.04968729615211487, 0.05400644242763519, 0.05832558870315552, 0.06264473497867584, 0.06696388125419617, 0.07128302752971649, 0.07560217380523682, 0.07992132008075714, 0.08424046635627747, 0.08855961263179779, 0.09287875890731812, 0.09719790518283844, 0.10151705145835876, 0.10583619773387909, 0.11015534400939941, 0.11447449028491974, 0.11879363656044006, 0.12311278283596039, 0.1274319291114807, 0.13175107538700104, 0.13607022166252136, 0.1403893679380417, 0.144708514213562]}, "train/train_runtime": 5167.9675, "train/train_samples_per_second": 5.522, "train/train_steps_per_second": 0.086, "train/total_flos": 0.0, "train/train_loss": 4.734800568610563, "eval/loss": 5.330791473388672, "eval/wer": 2.4313764379214597, "eval/runtime": 1116.9995, "eval/samples_per_second": 2.365, "eval/steps_per_second": 0.296} \ No newline at end of file +{"train/loss": 4.8899, "train/learning_rate": 0.0008900000000000001, "train/epoch": 1.0, "train/global_step": 446, "_runtime": 6619, "_timestamp": 1646293310, "_step": 447, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 78.0, 357.0, 439.0, 109.0, 16.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.88333511352539, -41.3859977722168, -36.88865661621094, -32.391319274902344, -27.893980026245117, -23.39664077758789, -18.899303436279297, -14.40196418762207, -9.904624938964844, -5.407286167144775, -0.909947395324707, 3.587390899658203, 8.08473014831543, 12.582069396972656, 17.07940673828125, 21.576745986938477, 26.074085235595703, 30.57142448425293, 35.068763732910156, 39.56610107421875, 44.063438415527344, 48.5607795715332, 53.0581169128418, 57.555458068847656, 62.05279541015625, 66.55013275146484, 71.04747009277344, 75.54481506347656, 80.04215240478516, 84.53948974609375, 89.03682708740234, 93.53416442871094, 98.03150939941406, 102.52884674072266, 107.02618408203125, 111.52352905273438, 116.02086639404297, 120.51820373535156, 125.01554107666016, 129.51287841796875, 134.01022338867188, 138.507568359375, 143.00489807128906, 147.5022430419922, 151.99957275390625, 156.49691772460938, 160.9942626953125, 165.49159240722656, 169.98892211914062, 174.48626708984375, 178.9835968017578, 183.48094177246094, 187.978271484375, 192.47561645507812, 196.97296142578125, 201.4702911376953, 205.96763610839844, 210.46498107910156, 214.96231079101562, 219.45965576171875, 223.9569854736328, 228.45433044433594, 232.95166015625, 237.44900512695312, 241.94635009765625]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 5.0, 5.0, 6.0, 4.0, 13.0, 15.0, 9.0, 19.0, 13.0, 18.0, 24.0, 32.0, 28.0, 30.0, 34.0, 30.0, 39.0, 52.0, 42.0, 51.0, 46.0, 47.0, 32.0, 44.0, 44.0, 39.0, 38.0, 33.0, 22.0, 35.0, 24.0, 21.0, 18.0, 16.0, 12.0, 20.0, 10.0, 8.0, 6.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.24918365478516, -62.14531326293945, -60.04144287109375, -57.93757247924805, -55.833702087402344, -53.729827880859375, -51.62595748901367, -49.52208709716797, -47.418216705322266, -45.31434631347656, -43.21047592163086, -41.106605529785156, -39.00273132324219, -36.89886474609375, -34.79499053955078, -32.69112014770508, -30.587249755859375, -28.483379364013672, -26.37950897216797, -24.275636672973633, -22.17176628112793, -20.067895889282227, -17.96402359008789, -15.860153198242188, -13.756282806396484, -11.652412414550781, -9.548541069030762, -7.4446702003479, -5.340799331665039, -3.236928939819336, -1.1330575942993164, 0.9708137512207031, 3.0746917724609375, 5.178562641143799, 7.28243350982666, 9.38630485534668, 11.490175247192383, 13.594045639038086, 15.697916984558105, 17.801788330078125, 19.905658721923828, 22.00952911376953, 24.113399505615234, 26.21727180480957, 28.321142196655273, 30.425012588500977, 32.52888488769531, 34.632755279541016, 36.73662567138672, 38.84049606323242, 40.944366455078125, 43.04823684692383, 45.15210723876953, 47.2559814453125, 49.3598518371582, 51.463722229003906, 53.56759262084961, 55.67146301269531, 57.775333404541016, 59.87920379638672, 61.98307800292969, 64.08694458007812, 66.1908187866211, 68.29469299316406, 70.3985595703125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 4.0, 5.0, 12.0, 9.0, 6.0, 15.0, 15.0, 22.0, 16.0, 27.0, 21.0, 36.0, 35.0, 33.0, 40.0, 38.0, 56.0, 56.0, 51.0, 45.0, 40.0, 51.0, 59.0, 53.0, 35.0, 32.0, 33.0, 22.0, 24.0, 27.0, 21.0, 19.0, 12.0, 8.0, 6.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.623046875, -1.576690673828125, -1.53033447265625, -1.483978271484375, -1.4376220703125, -1.391265869140625, -1.34490966796875, -1.298553466796875, -1.252197265625, -1.205841064453125, -1.15948486328125, -1.113128662109375, -1.0667724609375, -1.020416259765625, -0.97406005859375, -0.927703857421875, -0.88134765625, -0.834991455078125, -0.78863525390625, -0.742279052734375, -0.6959228515625, -0.649566650390625, -0.60321044921875, -0.556854248046875, -0.510498046875, -0.464141845703125, -0.41778564453125, -0.371429443359375, -0.3250732421875, -0.278717041015625, -0.23236083984375, -0.186004638671875, -0.1396484375, -0.093292236328125, -0.04693603515625, -0.000579833984375, 0.0457763671875, 0.092132568359375, 0.13848876953125, 0.184844970703125, 0.231201171875, 0.277557373046875, 0.32391357421875, 0.370269775390625, 0.4166259765625, 0.462982177734375, 0.50933837890625, 0.555694580078125, 0.60205078125, 0.648406982421875, 0.69476318359375, 0.741119384765625, 0.7874755859375, 0.833831787109375, 0.88018798828125, 0.926544189453125, 0.972900390625, 1.019256591796875, 1.06561279296875, 1.111968994140625, 1.1583251953125, 1.204681396484375, 1.25103759765625, 1.297393798828125, 1.34375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 8.0, 8.0, 14.0, 22.0, 23.0, 27.0, 35.0, 59.0, 87.0, 118.0, 153.0, 214.0, 327.0, 478.0, 749.0, 1145.0, 2014.0, 4292.0, 15400.0, 281478.0, 3816804.0, 54896.0, 8421.0, 2970.0, 1630.0, 1027.0, 609.0, 383.0, 259.0, 185.0, 139.0, 90.0, 68.0, 30.0, 39.0, 20.0, 17.0, 11.0, 8.0, 6.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.734375, -14.3046875, -13.875, -13.4453125, -13.015625, -12.5859375, -12.15625, -11.7265625, -11.296875, -10.8671875, -10.4375, -10.0078125, -9.578125, -9.1484375, -8.71875, -8.2890625, -7.859375, -7.4296875, -7.0, -6.5703125, -6.140625, -5.7109375, -5.28125, -4.8515625, -4.421875, -3.9921875, -3.5625, -3.1328125, -2.703125, -2.2734375, -1.84375, -1.4140625, -0.984375, -0.5546875, -0.125, 0.3046875, 0.734375, 1.1640625, 1.59375, 2.0234375, 2.453125, 2.8828125, 3.3125, 3.7421875, 4.171875, 4.6015625, 5.03125, 5.4609375, 5.890625, 6.3203125, 6.75, 7.1796875, 7.609375, 8.0390625, 8.46875, 8.8984375, 9.328125, 9.7578125, 10.1875, 10.6171875, 11.046875, 11.4765625, 11.90625, 12.3359375, 12.765625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 16.0, 33.0, 58.0, 145.0, 434.0, 1106.0, 1332.0, 520.0, 190.0, 116.0, 49.0, 28.0, 24.0, 14.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3203125, -9.9085693359375, -9.496826171875, -9.0850830078125, -8.67333984375, -8.2615966796875, -7.849853515625, -7.4381103515625, -7.0263671875, -6.6146240234375, -6.202880859375, -5.7911376953125, -5.37939453125, -4.9676513671875, -4.555908203125, -4.1441650390625, -3.732421875, -3.3206787109375, -2.908935546875, -2.4971923828125, -2.08544921875, -1.6737060546875, -1.261962890625, -0.8502197265625, -0.4384765625, -0.0267333984375, 0.385009765625, 0.7967529296875, 1.20849609375, 1.6202392578125, 2.031982421875, 2.4437255859375, 2.85546875, 3.2672119140625, 3.678955078125, 4.0906982421875, 4.50244140625, 4.9141845703125, 5.325927734375, 5.7376708984375, 6.1494140625, 6.5611572265625, 6.972900390625, 7.3846435546875, 7.79638671875, 8.2081298828125, 8.619873046875, 9.0316162109375, 9.443359375, 9.8551025390625, 10.266845703125, 10.6785888671875, 11.09033203125, 11.5020751953125, 11.913818359375, 12.3255615234375, 12.7373046875, 13.1490478515625, 13.560791015625, 13.9725341796875, 14.38427734375, 14.7960205078125, 15.207763671875, 15.6195068359375, 16.03125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 21.0, 46.0, 100.0, 222.0, 704.0, 4200.0, 3430448.0, 754313.0, 3127.0, 680.0, 208.0, 103.0, 59.0, 18.0, 9.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.09375, -39.845703125, -38.59765625, -37.349609375, -36.1015625, -34.853515625, -33.60546875, -32.357421875, -31.109375, -29.861328125, -28.61328125, -27.365234375, -26.1171875, -24.869140625, -23.62109375, -22.373046875, -21.125, -19.876953125, -18.62890625, -17.380859375, -16.1328125, -14.884765625, -13.63671875, -12.388671875, -11.140625, -9.892578125, -8.64453125, -7.396484375, -6.1484375, -4.900390625, -3.65234375, -2.404296875, -1.15625, 0.091796875, 1.33984375, 2.587890625, 3.8359375, 5.083984375, 6.33203125, 7.580078125, 8.828125, 10.076171875, 11.32421875, 12.572265625, 13.8203125, 15.068359375, 16.31640625, 17.564453125, 18.8125, 20.060546875, 21.30859375, 22.556640625, 23.8046875, 25.052734375, 26.30078125, 27.548828125, 28.796875, 30.044921875, 31.29296875, 32.541015625, 33.7890625, 35.037109375, 36.28515625, 37.533203125, 38.78125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 49.0, 579.0, 350.0, 31.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.93313598632812, -176.4544677734375, -172.97579956054688, -169.4971160888672, -166.01844787597656, -162.53977966308594, -159.0611114501953, -155.5824432373047, -152.103759765625, -148.62509155273438, -145.14642333984375, -141.66773986816406, -138.18907165527344, -134.7104034423828, -131.2317352294922, -127.75306701660156, -124.27439880371094, -120.79573059082031, -117.31705474853516, -113.83838653564453, -110.35971069335938, -106.88104248046875, -103.40237426757812, -99.9237060546875, -96.44503021240234, -92.96636199951172, -89.48768615722656, -86.00901794433594, -82.53034973144531, -79.05167388916016, -75.57300567626953, -72.09432983398438, -68.61566162109375, -65.13699340820312, -61.65831756591797, -58.179649353027344, -54.70097732543945, -51.22230529785156, -47.74363708496094, -44.26496505737305, -40.78628921508789, -37.3076171875, -33.828948974609375, -30.350276947021484, -26.871604919433594, -23.392932891845703, -19.914262771606445, -16.435592651367188, -12.956920623779297, -9.478249549865723, -5.999578475952148, -2.520907402038574, 0.957763671875, 4.436435699462891, 7.915105819702148, 11.393775939941406, 14.872447967529297, 18.351119995117188, 21.829790115356445, 25.308460235595703, 28.787132263183594, 32.265804290771484, 35.744476318359375, 39.22314453125, 42.70181655883789]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 13.0, 10.0, 12.0, 12.0, 18.0, 21.0, 27.0, 25.0, 33.0, 31.0, 45.0, 37.0, 47.0, 41.0, 51.0, 51.0, 50.0, 48.0, 38.0, 32.0, 46.0, 37.0, 41.0, 28.0, 25.0, 30.0, 25.0, 17.0, 18.0, 14.0, 17.0, 13.0, 5.0, 7.0, 8.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-32.39892578125, -31.52111053466797, -30.64329719543457, -29.76548194885254, -28.88766860961914, -28.00985336303711, -27.132038116455078, -26.254222869873047, -25.37640953063965, -24.498594284057617, -23.62078094482422, -22.742965698242188, -21.865150451660156, -20.987337112426758, -20.109521865844727, -19.231708526611328, -18.353893280029297, -17.476078033447266, -16.598264694213867, -15.720449447631836, -14.842635154724121, -13.964820861816406, -13.087005615234375, -12.20919132232666, -11.331377029418945, -10.45356273651123, -9.575748443603516, -8.697933197021484, -7.8201189041137695, -6.942304611206055, -6.064489841461182, -5.186675071716309, -4.308860778808594, -3.4310462474823, -2.553231716156006, -1.675417184829712, -0.797602653503418, 0.08021163940429688, 0.9580264091491699, 1.835841178894043, 2.713655471801758, 3.5914700031280518, 4.469284534454346, 5.347099304199219, 6.224913597106934, 7.102727890014648, 7.9805426597595215, 8.858357429504395, 9.73617172241211, 10.613986015319824, 11.491800308227539, 12.36961555480957, 13.247429847717285, 14.125244140625, 15.003059387207031, 15.880873680114746, 16.75868797302246, 17.636503219604492, 18.51431655883789, 19.392131805419922, 20.269947052001953, 21.14776039123535, 22.025575637817383, 22.90338897705078, 23.781204223632812]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 5.0, 10.0, 10.0, 11.0, 12.0, 17.0, 14.0, 21.0, 15.0, 22.0, 25.0, 24.0, 34.0, 28.0, 34.0, 47.0, 32.0, 43.0, 37.0, 45.0, 46.0, 43.0, 47.0, 33.0, 42.0, 41.0, 41.0, 30.0, 36.0, 16.0, 28.0, 22.0, 17.0, 6.0, 10.0, 15.0, 10.0, 7.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.263580322265625, -1.22247314453125, -1.181365966796875, -1.1402587890625, -1.099151611328125, -1.05804443359375, -1.016937255859375, -0.975830078125, -0.934722900390625, -0.89361572265625, -0.852508544921875, -0.8114013671875, -0.770294189453125, -0.72918701171875, -0.688079833984375, -0.64697265625, -0.605865478515625, -0.56475830078125, -0.523651123046875, -0.4825439453125, -0.441436767578125, -0.40032958984375, -0.359222412109375, -0.318115234375, -0.277008056640625, -0.23590087890625, -0.194793701171875, -0.1536865234375, -0.112579345703125, -0.07147216796875, -0.030364990234375, 0.0107421875, 0.051849365234375, 0.09295654296875, 0.134063720703125, 0.1751708984375, 0.216278076171875, 0.25738525390625, 0.298492431640625, 0.339599609375, 0.380706787109375, 0.42181396484375, 0.462921142578125, 0.5040283203125, 0.545135498046875, 0.58624267578125, 0.627349853515625, 0.66845703125, 0.709564208984375, 0.75067138671875, 0.791778564453125, 0.8328857421875, 0.873992919921875, 0.91510009765625, 0.956207275390625, 0.997314453125, 1.038421630859375, 1.07952880859375, 1.120635986328125, 1.1617431640625, 1.202850341796875, 1.24395751953125, 1.285064697265625, 1.326171875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 14.0, 15.0, 35.0, 42.0, 76.0, 103.0, 142.0, 196.0, 294.0, 365.0, 605.0, 749.0, 1160.0, 1664.0, 2315.0, 3193.0, 4615.0, 6763.0, 9570.0, 14080.0, 20448.0, 30487.0, 45823.0, 71224.0, 121589.0, 285192.0, 167951.0, 89186.0, 55384.0, 36603.0, 24311.0, 16765.0, 11318.0, 7985.0, 5487.0, 3838.0, 2670.0, 1879.0, 1309.0, 959.0, 616.0, 485.0, 329.0, 206.0, 170.0, 110.0, 72.0, 51.0, 47.0, 22.0, 17.0, 9.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.05267333984375, -0.05101299285888672, -0.04935264587402344, -0.047692298889160156, -0.046031951904296875, -0.044371604919433594, -0.04271125793457031, -0.04105091094970703, -0.03939056396484375, -0.03773021697998047, -0.03606986999511719, -0.034409523010253906, -0.032749176025390625, -0.031088829040527344, -0.029428482055664062, -0.02776813507080078, -0.0261077880859375, -0.02444744110107422, -0.022787094116210938, -0.021126747131347656, -0.019466400146484375, -0.017806053161621094, -0.016145706176757812, -0.014485359191894531, -0.01282501220703125, -0.011164665222167969, -0.009504318237304688, -0.007843971252441406, -0.006183624267578125, -0.004523277282714844, -0.0028629302978515625, -0.0012025833129882812, 0.000457763671875, 0.0021181106567382812, 0.0037784576416015625, 0.005438804626464844, 0.007099151611328125, 0.008759498596191406, 0.010419845581054688, 0.012080192565917969, 0.01374053955078125, 0.015400886535644531, 0.017061233520507812, 0.018721580505371094, 0.020381927490234375, 0.022042274475097656, 0.023702621459960938, 0.02536296844482422, 0.0270233154296875, 0.02868366241455078, 0.030344009399414062, 0.032004356384277344, 0.033664703369140625, 0.035325050354003906, 0.03698539733886719, 0.03864574432373047, 0.04030609130859375, 0.04196643829345703, 0.04362678527832031, 0.045287132263183594, 0.046947479248046875, 0.048607826232910156, 0.05026817321777344, 0.05192852020263672, 0.0535888671875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 6.0, 14.0, 6.0, 17.0, 15.0, 22.0, 14.0, 20.0, 26.0, 21.0, 22.0, 34.0, 28.0, 38.0, 38.0, 33.0, 37.0, 40.0, 37.0, 1059.0, 30.0, 37.0, 40.0, 46.0, 24.0, 45.0, 44.0, 21.0, 30.0, 23.0, 16.0, 17.0, 17.0, 22.0, 11.0, 18.0, 10.0, 13.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-1.1484375, -1.1159591674804688, -1.0834808349609375, -1.0510025024414062, -1.018524169921875, -0.9860458374023438, -0.9535675048828125, -0.9210891723632812, -0.88861083984375, -0.8561325073242188, -0.8236541748046875, -0.7911758422851562, -0.758697509765625, -0.7262191772460938, -0.6937408447265625, -0.6612625122070312, -0.6287841796875, -0.5963058471679688, -0.5638275146484375, -0.5313491821289062, -0.498870849609375, -0.46639251708984375, -0.4339141845703125, -0.40143585205078125, -0.36895751953125, -0.33647918701171875, -0.3040008544921875, -0.27152252197265625, -0.239044189453125, -0.20656585693359375, -0.1740875244140625, -0.14160919189453125, -0.109130859375, -0.07665252685546875, -0.0441741943359375, -0.01169586181640625, 0.020782470703125, 0.05326080322265625, 0.0857391357421875, 0.11821746826171875, 0.15069580078125, 0.18317413330078125, 0.2156524658203125, 0.24813079833984375, 0.280609130859375, 0.31308746337890625, 0.3455657958984375, 0.37804412841796875, 0.4105224609375, 0.44300079345703125, 0.4754791259765625, 0.5079574584960938, 0.540435791015625, 0.5729141235351562, 0.6053924560546875, 0.6378707885742188, 0.67034912109375, 0.7028274536132812, 0.7353057861328125, 0.7677841186523438, 0.800262451171875, 0.8327407836914062, 0.8652191162109375, 0.8976974487304688, 0.93017578125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 14.0, 12.0, 22.0, 28.0, 52.0, 74.0, 117.0, 174.0, 274.0, 397.0, 648.0, 959.0, 1443.0, 2241.0, 3181.0, 4811.0, 7156.0, 10479.0, 15665.0, 23829.0, 36829.0, 60243.0, 104412.0, 209741.0, 1314786.0, 116389.0, 66129.0, 40194.0, 25405.0, 16956.0, 11252.0, 7694.0, 5118.0, 3496.0, 2347.0, 1553.0, 1013.0, 686.0, 450.0, 268.0, 229.0, 120.0, 99.0, 51.0, 42.0, 21.0, 14.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031280517578125, -0.030274391174316406, -0.029268264770507812, -0.02826213836669922, -0.027256011962890625, -0.02624988555908203, -0.025243759155273438, -0.024237632751464844, -0.02323150634765625, -0.022225379943847656, -0.021219253540039062, -0.02021312713623047, -0.019207000732421875, -0.01820087432861328, -0.017194747924804688, -0.016188621520996094, -0.0151824951171875, -0.014176368713378906, -0.013170242309570312, -0.012164115905761719, -0.011157989501953125, -0.010151863098144531, -0.009145736694335938, -0.008139610290527344, -0.00713348388671875, -0.006127357482910156, -0.0051212310791015625, -0.004115104675292969, -0.003108978271484375, -0.0021028518676757812, -0.0010967254638671875, -9.059906005859375e-05, 0.00091552734375, 0.0019216537475585938, 0.0029277801513671875, 0.003933906555175781, 0.004940032958984375, 0.005946159362792969, 0.0069522857666015625, 0.007958412170410156, 0.00896453857421875, 0.009970664978027344, 0.010976791381835938, 0.011982917785644531, 0.012989044189453125, 0.013995170593261719, 0.015001296997070312, 0.016007423400878906, 0.0170135498046875, 0.018019676208496094, 0.019025802612304688, 0.02003192901611328, 0.021038055419921875, 0.02204418182373047, 0.023050308227539062, 0.024056434631347656, 0.02506256103515625, 0.026068687438964844, 0.027074813842773438, 0.02808094024658203, 0.029087066650390625, 0.03009319305419922, 0.031099319458007812, 0.032105445861816406, 0.033111572265625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 9.0, 4.0, 12.0, 15.0, 8.0, 0.0, 13.0, 16.0, 17.0, 29.0, 61.0, 69.0, 437.0, 94.0, 61.0, 34.0, 0.0, 17.0, 15.0, 15.0, 14.0, 5.0, 10.0, 6.0, 9.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.086162567138672e-06, -2.032145857810974e-06, -1.9781291484832764e-06, -1.9241124391555786e-06, -1.8700957298278809e-06, -1.816079020500183e-06, -1.7620623111724854e-06, -1.7080456018447876e-06, -1.6540288925170898e-06, -1.600012183189392e-06, -1.5459954738616943e-06, -1.4919787645339966e-06, -1.4379620552062988e-06, -1.383945345878601e-06, -1.3299286365509033e-06, -1.2759119272232056e-06, -1.2218952178955078e-06, -1.16787850856781e-06, -1.1138617992401123e-06, -1.0598450899124146e-06, -1.0058283805847168e-06, -9.51811671257019e-07, -8.977949619293213e-07, -8.437782526016235e-07, -7.897615432739258e-07, -7.35744833946228e-07, -6.817281246185303e-07, -6.277114152908325e-07, -5.736947059631348e-07, -5.19677996635437e-07, -4.6566128730773926e-07, -4.116445779800415e-07, -3.5762786865234375e-07, -3.03611159324646e-07, -2.4959444999694824e-07, -1.955777406692505e-07, -1.4156103134155273e-07, -8.754432201385498e-08, -3.3527612686157227e-08, 2.0489096641540527e-08, 7.450580596923828e-08, 1.2852251529693604e-07, 1.825392246246338e-07, 2.3655593395233154e-07, 2.905726432800293e-07, 3.4458935260772705e-07, 3.986060619354248e-07, 4.5262277126312256e-07, 5.066394805908203e-07, 5.606561899185181e-07, 6.146728992462158e-07, 6.686896085739136e-07, 7.227063179016113e-07, 7.767230272293091e-07, 8.307397365570068e-07, 8.847564458847046e-07, 9.387731552124023e-07, 9.927898645401e-07, 1.0468065738677979e-06, 1.1008232831954956e-06, 1.1548399925231934e-06, 1.2088567018508911e-06, 1.2628734111785889e-06, 1.3168901205062866e-06, 1.3709068298339844e-06]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 3.0, 4.0, 7.0, 5.0, 12.0, 12.0, 19.0, 31.0, 25.0, 33.0, 45.0, 47.0, 71.0, 84.0, 142.0, 356.0, 3177.0, 1042735.0, 949.0, 321.0, 121.0, 68.0, 59.0, 45.0, 26.0, 44.0, 19.0, 19.0, 15.0, 13.0, 9.0, 8.0, 4.0, 3.0, 7.0, 8.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1888484954833984e-05, -3.07643786072731e-05, -2.964027225971222e-05, -2.8516165912151337e-05, -2.7392059564590454e-05, -2.626795321702957e-05, -2.514384686946869e-05, -2.4019740521907806e-05, -2.2895634174346924e-05, -2.177152782678604e-05, -2.064742147922516e-05, -1.9523315131664276e-05, -1.8399208784103394e-05, -1.727510243654251e-05, -1.615099608898163e-05, -1.5026889741420746e-05, -1.3902783393859863e-05, -1.277867704629898e-05, -1.1654570698738098e-05, -1.0530464351177216e-05, -9.406358003616333e-06, -8.28225165605545e-06, -7.158145308494568e-06, -6.034038960933685e-06, -4.909932613372803e-06, -3.78582626581192e-06, -2.6617199182510376e-06, -1.537613570690155e-06, -4.1350722312927246e-07, 7.105991244316101e-07, 1.8347054719924927e-06, 2.9588118195533752e-06, 4.082918167114258e-06, 5.20702451467514e-06, 6.331130862236023e-06, 7.4552372097969055e-06, 8.579343557357788e-06, 9.70344990491867e-06, 1.0827556252479553e-05, 1.1951662600040436e-05, 1.3075768947601318e-05, 1.4199875295162201e-05, 1.5323981642723083e-05, 1.6448087990283966e-05, 1.757219433784485e-05, 1.869630068540573e-05, 1.9820407032966614e-05, 2.0944513380527496e-05, 2.206861972808838e-05, 2.319272607564926e-05, 2.4316832423210144e-05, 2.5440938770771027e-05, 2.656504511833191e-05, 2.7689151465892792e-05, 2.8813257813453674e-05, 2.9937364161014557e-05, 3.106147050857544e-05, 3.218557685613632e-05, 3.3309683203697205e-05, 3.443378955125809e-05, 3.555789589881897e-05, 3.668200224637985e-05, 3.7806108593940735e-05, 3.893021494150162e-05, 4.00543212890625e-05]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 69.0, 915.0, 34.0], "bins": [-5.084586973680416e-06, -5.0030935199174564e-06, -4.921600066154497e-06, -4.840106612391537e-06, -4.758613158628577e-06, -4.677119250118267e-06, -4.595625796355307e-06, -4.514132342592347e-06, -4.432638888829388e-06, -4.351145435066428e-06, -4.269651981303468e-06, -4.188158527540509e-06, -4.106665073777549e-06, -4.025171620014589e-06, -3.94367816625163e-06, -3.862184257741319e-06, -3.7806910313520348e-06, -3.699197577589075e-06, -3.6177041238261154e-06, -3.5362104426894803e-06, -3.4547169889265206e-06, -3.373223535163561e-06, -3.291730081400601e-06, -3.2102366276376415e-06, -3.128743173874682e-06, -3.047249720111722e-06, -2.9657562663487624e-06, -2.8842628125858027e-06, -2.8027691314491676e-06, -2.721275677686208e-06, -2.6397822239232482e-06, -2.5582887701602885e-06, -2.4767950890236534e-06, -2.3953016352606937e-06, -2.313808181497734e-06, -2.2323147277347744e-06, -2.1508210465981392e-06, -2.0693275928351795e-06, -1.98783413907222e-06, -1.9063406853092602e-06, -1.8248472315463005e-06, -1.7433537777833408e-06, -1.6618602103335434e-06, -1.5803667565705837e-06, -1.4988731891207863e-06, -1.4173797353578266e-06, -1.3358862815948669e-06, -1.2543928278319072e-06, -1.1728992603821098e-06, -1.09140580661915e-06, -1.0099122391693527e-06, -9.28418785406393e-07, -8.469252748000144e-07, -7.654317641936359e-07, -6.839383104306762e-07, -6.024447998242977e-07, -5.209512892179191e-07, -4.3945777861154056e-07, -3.5796429642687144e-07, -2.764708142422023e-07, -1.9497730363582377e-07, -1.1348379302944522e-07, -3.1990339266485535e-08, 4.9503171339893015e-08, 1.3099668194627156e-07]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 72.0, 0.0, 0.0, 0.0, 0.0, 137.0, 0.0, 0.0, 0.0, 0.0, 0.0, 522.0, 0.0, 0.0, 0.0, 0.0, 151.0, 0.0, 0.0, 0.0, 0.0, 67.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.46451997756958e-07, -3.3527612686157227e-07, -3.241002559661865e-07, -3.129243850708008e-07, -3.0174851417541504e-07, -2.905726432800293e-07, -2.7939677238464355e-07, -2.682209014892578e-07, -2.5704503059387207e-07, -2.4586915969848633e-07, -2.3469328880310059e-07, -2.2351741790771484e-07, -2.123415470123291e-07, -2.0116567611694336e-07, -1.8998980522155762e-07, -1.7881393432617188e-07, -1.6763806343078613e-07, -1.564621925354004e-07, -1.4528632164001465e-07, -1.341104507446289e-07, -1.2293457984924316e-07, -1.1175870895385742e-07, -1.0058283805847168e-07, -8.940696716308594e-08, -7.82310962677002e-08, -6.705522537231445e-08, -5.587935447692871e-08, -4.470348358154297e-08, -3.3527612686157227e-08, -2.2351741790771484e-08, -1.1175870895385742e-08, 0.0, 1.1175870895385742e-08, 2.2351741790771484e-08, 3.3527612686157227e-08, 4.470348358154297e-08, 5.587935447692871e-08, 6.705522537231445e-08, 7.82310962677002e-08, 8.940696716308594e-08, 1.0058283805847168e-07, 1.1175870895385742e-07, 1.2293457984924316e-07, 1.341104507446289e-07, 1.4528632164001465e-07, 1.564621925354004e-07, 1.6763806343078613e-07, 1.7881393432617188e-07, 1.8998980522155762e-07, 2.0116567611694336e-07, 2.123415470123291e-07, 2.2351741790771484e-07, 2.3469328880310059e-07, 2.4586915969848633e-07, 2.5704503059387207e-07, 2.682209014892578e-07, 2.7939677238464355e-07, 2.905726432800293e-07, 3.0174851417541504e-07, 3.129243850708008e-07, 3.241002559661865e-07, 3.3527612686157227e-07, 3.46451997756958e-07, 3.5762786865234375e-07]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 5.0, 10.0, 10.0, 11.0, 12.0, 17.0, 14.0, 21.0, 15.0, 22.0, 25.0, 24.0, 34.0, 28.0, 34.0, 47.0, 32.0, 43.0, 37.0, 45.0, 46.0, 43.0, 47.0, 33.0, 42.0, 41.0, 41.0, 30.0, 36.0, 16.0, 28.0, 22.0, 17.0, 6.0, 10.0, 15.0, 10.0, 7.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3046875, -1.263580322265625, -1.22247314453125, -1.181365966796875, -1.1402587890625, -1.099151611328125, -1.05804443359375, -1.016937255859375, -0.975830078125, -0.934722900390625, -0.89361572265625, -0.852508544921875, -0.8114013671875, -0.770294189453125, -0.72918701171875, -0.688079833984375, -0.64697265625, -0.605865478515625, -0.56475830078125, -0.523651123046875, -0.4825439453125, -0.441436767578125, -0.40032958984375, -0.359222412109375, -0.318115234375, -0.277008056640625, -0.23590087890625, -0.194793701171875, -0.1536865234375, -0.112579345703125, -0.07147216796875, -0.030364990234375, 0.0107421875, 0.051849365234375, 0.09295654296875, 0.134063720703125, 0.1751708984375, 0.216278076171875, 0.25738525390625, 0.298492431640625, 0.339599609375, 0.380706787109375, 0.42181396484375, 0.462921142578125, 0.5040283203125, 0.545135498046875, 0.58624267578125, 0.627349853515625, 0.66845703125, 0.709564208984375, 0.75067138671875, 0.791778564453125, 0.8328857421875, 0.873992919921875, 0.91510009765625, 0.956207275390625, 0.997314453125, 1.038421630859375, 1.07952880859375, 1.120635986328125, 1.1617431640625, 1.202850341796875, 1.24395751953125, 1.285064697265625, 1.326171875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 10.0, 7.0, 11.0, 16.0, 16.0, 35.0, 39.0, 40.0, 57.0, 102.0, 137.0, 151.0, 245.0, 315.0, 426.0, 582.0, 866.0, 1294.0, 2044.0, 3274.0, 6004.0, 12985.0, 37024.0, 141360.0, 492528.0, 249060.0, 61222.0, 18974.0, 8032.0, 4234.0, 2419.0, 1557.0, 996.0, 723.0, 496.0, 342.0, 247.0, 184.0, 133.0, 101.0, 75.0, 54.0, 33.0, 30.0, 27.0, 18.0, 12.0, 8.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.3515625, -6.1630859375, -5.974609375, -5.7861328125, -5.59765625, -5.4091796875, -5.220703125, -5.0322265625, -4.84375, -4.6552734375, -4.466796875, -4.2783203125, -4.08984375, -3.9013671875, -3.712890625, -3.5244140625, -3.3359375, -3.1474609375, -2.958984375, -2.7705078125, -2.58203125, -2.3935546875, -2.205078125, -2.0166015625, -1.828125, -1.6396484375, -1.451171875, -1.2626953125, -1.07421875, -0.8857421875, -0.697265625, -0.5087890625, -0.3203125, -0.1318359375, 0.056640625, 0.2451171875, 0.43359375, 0.6220703125, 0.810546875, 0.9990234375, 1.1875, 1.3759765625, 1.564453125, 1.7529296875, 1.94140625, 2.1298828125, 2.318359375, 2.5068359375, 2.6953125, 2.8837890625, 3.072265625, 3.2607421875, 3.44921875, 3.6376953125, 3.826171875, 4.0146484375, 4.203125, 4.3916015625, 4.580078125, 4.7685546875, 4.95703125, 5.1455078125, 5.333984375, 5.5224609375, 5.7109375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 7.0, 9.0, 12.0, 11.0, 14.0, 19.0, 17.0, 25.0, 26.0, 34.0, 28.0, 44.0, 52.0, 78.0, 112.0, 181.0, 876.0, 782.0, 178.0, 106.0, 80.0, 65.0, 53.0, 44.0, 33.0, 27.0, 26.0, 17.0, 25.0, 16.0, 6.0, 13.0, 4.0, 10.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.03125, -4.8740234375, -4.716796875, -4.5595703125, -4.40234375, -4.2451171875, -4.087890625, -3.9306640625, -3.7734375, -3.6162109375, -3.458984375, -3.3017578125, -3.14453125, -2.9873046875, -2.830078125, -2.6728515625, -2.515625, -2.3583984375, -2.201171875, -2.0439453125, -1.88671875, -1.7294921875, -1.572265625, -1.4150390625, -1.2578125, -1.1005859375, -0.943359375, -0.7861328125, -0.62890625, -0.4716796875, -0.314453125, -0.1572265625, 0.0, 0.1572265625, 0.314453125, 0.4716796875, 0.62890625, 0.7861328125, 0.943359375, 1.1005859375, 1.2578125, 1.4150390625, 1.572265625, 1.7294921875, 1.88671875, 2.0439453125, 2.201171875, 2.3583984375, 2.515625, 2.6728515625, 2.830078125, 2.9873046875, 3.14453125, 3.3017578125, 3.458984375, 3.6162109375, 3.7734375, 3.9306640625, 4.087890625, 4.2451171875, 4.40234375, 4.5595703125, 4.716796875, 4.8740234375, 5.03125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 9.0, 5.0, 6.0, 10.0, 15.0, 15.0, 18.0, 28.0, 34.0, 42.0, 40.0, 68.0, 124.0, 294.0, 1321.0, 275110.0, 2864907.0, 2791.0, 389.0, 139.0, 77.0, 60.0, 28.0, 36.0, 29.0, 13.0, 13.0, 20.0, 15.0, 13.0, 6.0, 10.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.921875, -23.177734375, -22.43359375, -21.689453125, -20.9453125, -20.201171875, -19.45703125, -18.712890625, -17.96875, -17.224609375, -16.48046875, -15.736328125, -14.9921875, -14.248046875, -13.50390625, -12.759765625, -12.015625, -11.271484375, -10.52734375, -9.783203125, -9.0390625, -8.294921875, -7.55078125, -6.806640625, -6.0625, -5.318359375, -4.57421875, -3.830078125, -3.0859375, -2.341796875, -1.59765625, -0.853515625, -0.109375, 0.634765625, 1.37890625, 2.123046875, 2.8671875, 3.611328125, 4.35546875, 5.099609375, 5.84375, 6.587890625, 7.33203125, 8.076171875, 8.8203125, 9.564453125, 10.30859375, 11.052734375, 11.796875, 12.541015625, 13.28515625, 14.029296875, 14.7734375, 15.517578125, 16.26171875, 17.005859375, 17.75, 18.494140625, 19.23828125, 19.982421875, 20.7265625, 21.470703125, 22.21484375, 22.958984375, 23.703125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [968.0, 47.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.007070064544678, 1.9058313369750977, 7.818732738494873, 13.731634140014648, 19.644535064697266, 25.557435989379883, 31.470338821411133, 37.38323974609375, 43.296142578125, 49.20904541015625, 55.121944427490234, 61.034847259521484, 66.94774627685547, 72.86064910888672, 78.77355194091797, 84.68644714355469, 90.59934997558594, 96.51225280761719, 102.42515563964844, 108.33805847167969, 114.2509536743164, 120.16385650634766, 126.0767593383789, 131.98965454101562, 137.90255737304688, 143.81546020507812, 149.72836303710938, 155.64126586914062, 161.55416870117188, 167.46707153320312, 173.37997436523438, 179.29286193847656, 185.2057647705078, 191.11866760253906, 197.0315704345703, 202.94447326660156, 208.8573760986328, 214.770263671875, 220.68316650390625, 226.5960693359375, 232.50897216796875, 238.421875, 244.33477783203125, 250.2476806640625, 256.16058349609375, 262.073486328125, 267.98638916015625, 273.8992919921875, 279.81219482421875, 285.72509765625, 291.63800048828125, 297.5509033203125, 303.46380615234375, 309.376708984375, 315.28961181640625, 321.2025146484375, 327.1153869628906, 333.0282897949219, 338.9411926269531, 344.8540954589844, 350.7669982910156, 356.6799011230469, 362.5928039550781, 368.5057067871094, 374.4186096191406]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 8.0, 12.0, 6.0, 18.0, 17.0, 18.0, 20.0, 19.0, 26.0, 27.0, 35.0, 32.0, 38.0, 37.0, 34.0, 46.0, 38.0, 41.0, 36.0, 40.0, 42.0, 44.0, 41.0, 38.0, 32.0, 30.0, 33.0, 22.0, 26.0, 25.0, 21.0, 14.0, 12.0, 11.0, 10.0, 10.0, 7.0, 12.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.260639190673828, -17.712726593017578, -17.164812088012695, -16.616899490356445, -16.068984985351562, -15.521072387695312, -14.973158836364746, -14.42524528503418, -13.877331733703613, -13.329418182373047, -12.78150463104248, -12.233591079711914, -11.685678482055664, -11.137763977050781, -10.589851379394531, -10.041937828063965, -9.494024276733398, -8.946110725402832, -8.398197174072266, -7.850284099578857, -7.302370548248291, -6.754456996917725, -6.206543922424316, -5.65863037109375, -5.110716819763184, -4.562803268432617, -4.014889717102051, -3.4669766426086426, -2.919063091278076, -2.3711495399475098, -1.8232362270355225, -1.2753229141235352, -0.7274112701416016, -0.1794978380203247, 0.36841559410095215, 0.916329026222229, 1.4642424583435059, 2.0121560096740723, 2.5600693225860596, 3.107982635498047, 3.6558961868286133, 4.20380973815918, 4.751723289489746, 5.299636363983154, 5.847549915313721, 6.395463466644287, 6.943376541137695, 7.491290092468262, 8.039203643798828, 8.587117195129395, 9.135030746459961, 9.682944297790527, 10.230857849121094, 10.778770446777344, 11.32668399810791, 11.874597549438477, 12.422511100769043, 12.97042465209961, 13.518338203430176, 14.066251754760742, 14.614164352416992, 15.162078857421875, 15.709991455078125, 16.257904052734375, 16.805818557739258]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 10.0, 7.0, 11.0, 8.0, 11.0, 19.0, 13.0, 18.0, 18.0, 26.0, 21.0, 23.0, 22.0, 29.0, 38.0, 36.0, 37.0, 37.0, 36.0, 41.0, 42.0, 44.0, 34.0, 47.0, 34.0, 31.0, 41.0, 33.0, 29.0, 31.0, 33.0, 21.0, 18.0, 15.0, 13.0, 10.0, 13.0, 6.0, 9.0, 10.0, 7.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.318359375, -1.2775726318359375, -1.236785888671875, -1.1959991455078125, -1.15521240234375, -1.1144256591796875, -1.073638916015625, -1.0328521728515625, -0.9920654296875, -0.9512786865234375, -0.910491943359375, -0.8697052001953125, -0.82891845703125, -0.7881317138671875, -0.747344970703125, -0.7065582275390625, -0.665771484375, -0.6249847412109375, -0.584197998046875, -0.5434112548828125, -0.50262451171875, -0.4618377685546875, -0.421051025390625, -0.3802642822265625, -0.3394775390625, -0.2986907958984375, -0.257904052734375, -0.2171173095703125, -0.17633056640625, -0.1355438232421875, -0.094757080078125, -0.0539703369140625, -0.01318359375, 0.0276031494140625, 0.068389892578125, 0.1091766357421875, 0.14996337890625, 0.1907501220703125, 0.231536865234375, 0.2723236083984375, 0.3131103515625, 0.3538970947265625, 0.394683837890625, 0.4354705810546875, 0.47625732421875, 0.5170440673828125, 0.557830810546875, 0.5986175537109375, 0.639404296875, 0.6801910400390625, 0.720977783203125, 0.7617645263671875, 0.80255126953125, 0.8433380126953125, 0.884124755859375, 0.9249114990234375, 0.9656982421875, 1.0064849853515625, 1.047271728515625, 1.0880584716796875, 1.12884521484375, 1.1696319580078125, 1.210418701171875, 1.2512054443359375, 1.2919921875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 4.0, 7.0, 9.0, 15.0, 15.0, 16.0, 34.0, 44.0, 46.0, 61.0, 93.0, 109.0, 160.0, 244.0, 322.0, 524.0, 1096.0, 3307.0, 20050.0, 430954.0, 3553585.0, 167514.0, 11330.0, 2331.0, 861.0, 439.0, 340.0, 205.0, 162.0, 85.0, 91.0, 67.0, 33.0, 33.0, 30.0, 19.0, 10.0, 8.0, 10.0, 3.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.6171875, -10.3170166015625, -10.016845703125, -9.7166748046875, -9.41650390625, -9.1163330078125, -8.816162109375, -8.5159912109375, -8.2158203125, -7.9156494140625, -7.615478515625, -7.3153076171875, -7.01513671875, -6.7149658203125, -6.414794921875, -6.1146240234375, -5.814453125, -5.5142822265625, -5.214111328125, -4.9139404296875, -4.61376953125, -4.3135986328125, -4.013427734375, -3.7132568359375, -3.4130859375, -3.1129150390625, -2.812744140625, -2.5125732421875, -2.21240234375, -1.9122314453125, -1.612060546875, -1.3118896484375, -1.01171875, -0.7115478515625, -0.411376953125, -0.1112060546875, 0.18896484375, 0.4891357421875, 0.789306640625, 1.0894775390625, 1.3896484375, 1.6898193359375, 1.989990234375, 2.2901611328125, 2.59033203125, 2.8905029296875, 3.190673828125, 3.4908447265625, 3.791015625, 4.0911865234375, 4.391357421875, 4.6915283203125, 4.99169921875, 5.2918701171875, 5.592041015625, 5.8922119140625, 6.1923828125, 6.4925537109375, 6.792724609375, 7.0928955078125, 7.39306640625, 7.6932373046875, 7.993408203125, 8.2935791015625, 8.59375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 11.0, 33.0, 42.0, 80.0, 157.0, 272.0, 579.0, 826.0, 872.0, 505.0, 328.0, 159.0, 95.0, 45.0, 24.0, 24.0, 7.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-12.3515625, -12.082763671875, -11.81396484375, -11.545166015625, -11.2763671875, -11.007568359375, -10.73876953125, -10.469970703125, -10.201171875, -9.932373046875, -9.66357421875, -9.394775390625, -9.1259765625, -8.857177734375, -8.58837890625, -8.319580078125, -8.05078125, -7.781982421875, -7.51318359375, -7.244384765625, -6.9755859375, -6.706787109375, -6.43798828125, -6.169189453125, -5.900390625, -5.631591796875, -5.36279296875, -5.093994140625, -4.8251953125, -4.556396484375, -4.28759765625, -4.018798828125, -3.75, -3.481201171875, -3.21240234375, -2.943603515625, -2.6748046875, -2.406005859375, -2.13720703125, -1.868408203125, -1.599609375, -1.330810546875, -1.06201171875, -0.793212890625, -0.5244140625, -0.255615234375, 0.01318359375, 0.281982421875, 0.55078125, 0.819580078125, 1.08837890625, 1.357177734375, 1.6259765625, 1.894775390625, 2.16357421875, 2.432373046875, 2.701171875, 2.969970703125, 3.23876953125, 3.507568359375, 3.7763671875, 4.045166015625, 4.31396484375, 4.582763671875, 4.8515625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 12.0, 11.0, 14.0, 31.0, 49.0, 94.0, 208.0, 410.0, 969.0, 3104.0, 15609.0, 303122.0, 3514074.0, 335446.0, 16152.0, 3120.0, 989.0, 422.0, 194.0, 108.0, 53.0, 29.0, 20.0, 11.0, 5.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.875, -16.412841796875, -15.95068359375, -15.488525390625, -15.0263671875, -14.564208984375, -14.10205078125, -13.639892578125, -13.177734375, -12.715576171875, -12.25341796875, -11.791259765625, -11.3291015625, -10.866943359375, -10.40478515625, -9.942626953125, -9.48046875, -9.018310546875, -8.55615234375, -8.093994140625, -7.6318359375, -7.169677734375, -6.70751953125, -6.245361328125, -5.783203125, -5.321044921875, -4.85888671875, -4.396728515625, -3.9345703125, -3.472412109375, -3.01025390625, -2.548095703125, -2.0859375, -1.623779296875, -1.16162109375, -0.699462890625, -0.2373046875, 0.224853515625, 0.68701171875, 1.149169921875, 1.611328125, 2.073486328125, 2.53564453125, 2.997802734375, 3.4599609375, 3.922119140625, 4.38427734375, 4.846435546875, 5.30859375, 5.770751953125, 6.23291015625, 6.695068359375, 7.1572265625, 7.619384765625, 8.08154296875, 8.543701171875, 9.005859375, 9.468017578125, 9.93017578125, 10.392333984375, 10.8544921875, 11.316650390625, 11.77880859375, 12.240966796875, 12.703125]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 31.0, 155.0, 305.0, 328.0, 154.0, 28.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.87224197387695, -43.86967086791992, -41.867095947265625, -39.864524841308594, -37.8619499206543, -35.859378814697266, -33.85680389404297, -31.854232788085938, -29.851659774780273, -27.84908676147461, -25.846513748168945, -23.84394073486328, -21.84136962890625, -19.838794708251953, -17.836223602294922, -15.833650588989258, -13.831077575683594, -11.82850456237793, -9.825931549072266, -7.823359489440918, -5.820786476135254, -3.81821346282959, -1.8156414031982422, 0.18693161010742188, 2.189504623413086, 4.19207763671875, 6.194650173187256, 8.197222709655762, 10.199795722961426, 12.20236873626709, 14.204940795898438, 16.2075138092041, 18.21009063720703, 20.212663650512695, 22.21523666381836, 24.21780776977539, 26.220382690429688, 28.22295379638672, 30.225526809692383, 32.22809982299805, 34.230674743652344, 36.233245849609375, 38.23582077026367, 40.2383918762207, 42.240966796875, 44.24353790283203, 46.24610900878906, 48.24868392944336, 50.25125503540039, 52.25382614135742, 54.25640106201172, 56.25897216796875, 58.26154708862305, 60.26411819458008, 62.266693115234375, 64.2692642211914, 66.27183532714844, 68.27440643310547, 70.2769775390625, 72.27955627441406, 74.2821273803711, 76.28469848632812, 78.28726959228516, 80.28984069824219, 82.29241943359375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 4.0, 4.0, 0.0, 3.0, 6.0, 6.0, 8.0, 9.0, 12.0, 20.0, 17.0, 13.0, 21.0, 26.0, 29.0, 28.0, 31.0, 29.0, 28.0, 46.0, 41.0, 44.0, 47.0, 34.0, 46.0, 33.0, 47.0, 33.0, 26.0, 28.0, 42.0, 31.0, 25.0, 21.0, 31.0, 21.0, 34.0, 14.0, 20.0, 9.0, 10.0, 6.0, 9.0, 3.0, 9.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.536693572998047, -12.05055046081543, -11.564407348632812, -11.078264236450195, -10.592121124267578, -10.105978012084961, -9.619834899902344, -9.13369083404541, -8.647547721862793, -8.161404609680176, -7.675261497497559, -7.189118385314941, -6.702974796295166, -6.216831684112549, -5.730688571929932, -5.244544982910156, -4.758402347564697, -4.27225923538208, -3.786115884780884, -3.2999727725982666, -2.8138294219970703, -2.327686309814453, -1.841543197631836, -1.3553998470306396, -0.8692567348480225, -0.3831135332584381, 0.10302966833114624, 0.5891728401184082, 1.075316071510315, 1.5614593029022217, 2.047602415084839, 2.533745765686035, 3.0198888778686523, 3.5060319900512695, 3.992175340652466, 4.478318214416504, 4.964461803436279, 5.4506049156188965, 5.936748027801514, 6.422891616821289, 6.909034729003906, 7.395177841186523, 7.881320953369141, 8.367464065551758, 8.853607177734375, 9.339750289916992, 9.82589340209961, 10.312037467956543, 10.798179626464844, 11.284322738647461, 11.770465850830078, 12.256608963012695, 12.742752075195312, 13.22889518737793, 13.715038299560547, 14.20118236541748, 14.687325477600098, 15.173468589782715, 15.659611701965332, 16.145755767822266, 16.631898880004883, 17.1180419921875, 17.604185104370117, 18.090328216552734, 18.57647132873535]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 2.0, 6.0, 8.0, 4.0, 13.0, 9.0, 12.0, 20.0, 13.0, 16.0, 16.0, 22.0, 25.0, 20.0, 25.0, 37.0, 37.0, 36.0, 37.0, 36.0, 35.0, 52.0, 45.0, 44.0, 43.0, 42.0, 44.0, 31.0, 34.0, 38.0, 22.0, 27.0, 25.0, 18.0, 15.0, 20.0, 11.0, 14.0, 10.0, 7.0, 7.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3359375, -1.2928619384765625, -1.249786376953125, -1.2067108154296875, -1.16363525390625, -1.1205596923828125, -1.077484130859375, -1.0344085693359375, -0.9913330078125, -0.9482574462890625, -0.905181884765625, -0.8621063232421875, -0.81903076171875, -0.7759552001953125, -0.732879638671875, -0.6898040771484375, -0.646728515625, -0.6036529541015625, -0.560577392578125, -0.5175018310546875, -0.47442626953125, -0.4313507080078125, -0.388275146484375, -0.3451995849609375, -0.3021240234375, -0.2590484619140625, -0.215972900390625, -0.1728973388671875, -0.12982177734375, -0.0867462158203125, -0.043670654296875, -0.0005950927734375, 0.04248046875, 0.0855560302734375, 0.128631591796875, 0.1717071533203125, 0.21478271484375, 0.2578582763671875, 0.300933837890625, 0.3440093994140625, 0.3870849609375, 0.4301605224609375, 0.473236083984375, 0.5163116455078125, 0.55938720703125, 0.6024627685546875, 0.645538330078125, 0.6886138916015625, 0.731689453125, 0.7747650146484375, 0.817840576171875, 0.8609161376953125, 0.90399169921875, 0.9470672607421875, 0.990142822265625, 1.0332183837890625, 1.0762939453125, 1.1193695068359375, 1.162445068359375, 1.2055206298828125, 1.24859619140625, 1.2916717529296875, 1.334747314453125, 1.3778228759765625, 1.4208984375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 13.0, 8.0, 22.0, 34.0, 44.0, 81.0, 124.0, 170.0, 262.0, 374.0, 600.0, 847.0, 1299.0, 1907.0, 2779.0, 4209.0, 6167.0, 9428.0, 14311.0, 22408.0, 35821.0, 59177.0, 104697.0, 244588.0, 267200.0, 107883.0, 60822.0, 36675.0, 22996.0, 14560.0, 9678.0, 6318.0, 4277.0, 2862.0, 1918.0, 1317.0, 869.0, 622.0, 382.0, 271.0, 182.0, 128.0, 72.0, 54.0, 36.0, 25.0, 18.0, 6.0, 7.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057281494140625, -0.0554351806640625, -0.0535888671875, -0.0517425537109375, -0.049896240234375, -0.0480499267578125, -0.04620361328125, -0.0443572998046875, -0.042510986328125, -0.0406646728515625, -0.038818359375, -0.0369720458984375, -0.035125732421875, -0.0332794189453125, -0.03143310546875, -0.0295867919921875, -0.027740478515625, -0.0258941650390625, -0.0240478515625, -0.0222015380859375, -0.020355224609375, -0.0185089111328125, -0.01666259765625, -0.0148162841796875, -0.012969970703125, -0.0111236572265625, -0.00927734375, -0.0074310302734375, -0.005584716796875, -0.0037384033203125, -0.00189208984375, -4.57763671875e-05, 0.001800537109375, 0.0036468505859375, 0.0054931640625, 0.0073394775390625, 0.009185791015625, 0.0110321044921875, 0.01287841796875, 0.0147247314453125, 0.016571044921875, 0.0184173583984375, 0.020263671875, 0.0221099853515625, 0.023956298828125, 0.0258026123046875, 0.02764892578125, 0.0294952392578125, 0.031341552734375, 0.0331878662109375, 0.0350341796875, 0.0368804931640625, 0.038726806640625, 0.0405731201171875, 0.04241943359375, 0.0442657470703125, 0.046112060546875, 0.0479583740234375, 0.0498046875, 0.0516510009765625, 0.053497314453125, 0.0553436279296875, 0.05718994140625, 0.0590362548828125, 0.060882568359375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 2.0, 6.0, 5.0, 13.0, 8.0, 12.0, 11.0, 14.0, 12.0, 22.0, 24.0, 20.0, 27.0, 30.0, 23.0, 46.0, 27.0, 41.0, 39.0, 46.0, 42.0, 1067.0, 33.0, 25.0, 31.0, 36.0, 46.0, 38.0, 31.0, 36.0, 32.0, 23.0, 18.0, 23.0, 26.0, 16.0, 10.0, 5.0, 11.0, 10.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.17578125, -1.1416778564453125, -1.107574462890625, -1.0734710693359375, -1.03936767578125, -1.0052642822265625, -0.971160888671875, -0.9370574951171875, -0.9029541015625, -0.8688507080078125, -0.834747314453125, -0.8006439208984375, -0.76654052734375, -0.7324371337890625, -0.698333740234375, -0.6642303466796875, -0.630126953125, -0.5960235595703125, -0.561920166015625, -0.5278167724609375, -0.49371337890625, -0.4596099853515625, -0.425506591796875, -0.3914031982421875, -0.3572998046875, -0.3231964111328125, -0.289093017578125, -0.2549896240234375, -0.22088623046875, -0.1867828369140625, -0.152679443359375, -0.1185760498046875, -0.08447265625, -0.0503692626953125, -0.016265869140625, 0.0178375244140625, 0.05194091796875, 0.0860443115234375, 0.120147705078125, 0.1542510986328125, 0.1883544921875, 0.2224578857421875, 0.256561279296875, 0.2906646728515625, 0.32476806640625, 0.3588714599609375, 0.392974853515625, 0.4270782470703125, 0.461181640625, 0.4952850341796875, 0.529388427734375, 0.5634918212890625, 0.59759521484375, 0.6316986083984375, 0.665802001953125, 0.6999053955078125, 0.7340087890625, 0.7681121826171875, 0.802215576171875, 0.8363189697265625, 0.87042236328125, 0.9045257568359375, 0.938629150390625, 0.9727325439453125, 1.0068359375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 5.0, 15.0, 19.0, 26.0, 46.0, 63.0, 102.0, 151.0, 235.0, 322.0, 490.0, 749.0, 1109.0, 1530.0, 2254.0, 3375.0, 4805.0, 6972.0, 10548.0, 15341.0, 23550.0, 36394.0, 59221.0, 100810.0, 200481.0, 1325062.0, 116858.0, 66706.0, 40883.0, 25893.0, 17302.0, 11260.0, 7711.0, 5313.0, 3634.0, 2483.0, 1736.0, 1169.0, 807.0, 560.0, 374.0, 259.0, 186.0, 116.0, 74.0, 49.0, 34.0, 22.0, 11.0, 9.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03204345703125, -0.031013965606689453, -0.029984474182128906, -0.02895498275756836, -0.027925491333007812, -0.026895999908447266, -0.02586650848388672, -0.024837017059326172, -0.023807525634765625, -0.022778034210205078, -0.02174854278564453, -0.020719051361083984, -0.019689559936523438, -0.01866006851196289, -0.017630577087402344, -0.016601085662841797, -0.01557159423828125, -0.014542102813720703, -0.013512611389160156, -0.01248311996459961, -0.011453628540039062, -0.010424137115478516, -0.009394645690917969, -0.008365154266357422, -0.007335662841796875, -0.006306171417236328, -0.005276679992675781, -0.004247188568115234, -0.0032176971435546875, -0.0021882057189941406, -0.0011587142944335938, -0.00012922286987304688, 0.0009002685546875, 0.0019297599792480469, 0.0029592514038085938, 0.003988742828369141, 0.0050182342529296875, 0.006047725677490234, 0.007077217102050781, 0.008106708526611328, 0.009136199951171875, 0.010165691375732422, 0.011195182800292969, 0.012224674224853516, 0.013254165649414062, 0.01428365707397461, 0.015313148498535156, 0.016342639923095703, 0.01737213134765625, 0.018401622772216797, 0.019431114196777344, 0.02046060562133789, 0.021490097045898438, 0.022519588470458984, 0.02354907989501953, 0.024578571319580078, 0.025608062744140625, 0.026637554168701172, 0.02766704559326172, 0.028696537017822266, 0.029726028442382812, 0.03075551986694336, 0.031785011291503906, 0.03281450271606445, 0.033843994140625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 8.0, 0.0, 6.0, 14.0, 0.0, 11.0, 33.0, 0.0, 43.0, 98.0, 565.0, 0.0, 90.0, 53.0, 0.0, 23.0, 22.0, 10.0, 0.0, 10.0, 4.0, 0.0, 5.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2097880244255066e-06, -1.16787850856781e-06, -1.1259689927101135e-06, -1.084059476852417e-06, -1.0421499609947205e-06, -1.000240445137024e-06, -9.583309292793274e-07, -9.164214134216309e-07, -8.745118975639343e-07, -8.326023817062378e-07, -7.906928658485413e-07, -7.487833499908447e-07, -7.068738341331482e-07, -6.649643182754517e-07, -6.230548024177551e-07, -5.811452865600586e-07, -5.392357707023621e-07, -4.973262548446655e-07, -4.55416738986969e-07, -4.1350722312927246e-07, -3.7159770727157593e-07, -3.296881914138794e-07, -2.8777867555618286e-07, -2.4586915969848633e-07, -2.039596438407898e-07, -1.6205012798309326e-07, -1.2014061212539673e-07, -7.82310962677002e-08, -3.632158041000366e-08, 5.587935447692871e-09, 4.7497451305389404e-08, 8.940696716308594e-08, 1.3131648302078247e-07, 1.73225998878479e-07, 2.1513551473617554e-07, 2.5704503059387207e-07, 2.989545464515686e-07, 3.4086406230926514e-07, 3.8277357816696167e-07, 4.246830940246582e-07, 4.6659260988235474e-07, 5.085021257400513e-07, 5.504116415977478e-07, 5.923211574554443e-07, 6.342306733131409e-07, 6.761401891708374e-07, 7.180497050285339e-07, 7.599592208862305e-07, 8.01868736743927e-07, 8.437782526016235e-07, 8.856877684593201e-07, 9.275972843170166e-07, 9.695068001747131e-07, 1.0114163160324097e-06, 1.0533258318901062e-06, 1.0952353477478027e-06, 1.1371448636054993e-06, 1.1790543794631958e-06, 1.2209638953208923e-06, 1.2628734111785889e-06, 1.3047829270362854e-06, 1.346692442893982e-06, 1.3886019587516785e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 8.0, 8.0, 1.0, 3.0, 3.0, 3.0, 11.0, 13.0, 11.0, 26.0, 32.0, 31.0, 59.0, 89.0, 187.0, 648.0, 72994.0, 972601.0, 1259.0, 200.0, 117.0, 60.0, 49.0, 30.0, 20.0, 21.0, 19.0, 4.0, 9.0, 5.0, 4.0, 7.0, 6.0, 4.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9371509552001953e-05, -1.87065452337265e-05, -1.804158091545105e-05, -1.7376616597175598e-05, -1.6711652278900146e-05, -1.6046687960624695e-05, -1.5381723642349243e-05, -1.4716759324073792e-05, -1.405179500579834e-05, -1.3386830687522888e-05, -1.2721866369247437e-05, -1.2056902050971985e-05, -1.1391937732696533e-05, -1.0726973414421082e-05, -1.006200909614563e-05, -9.397044777870178e-06, -8.732080459594727e-06, -8.067116141319275e-06, -7.402151823043823e-06, -6.737187504768372e-06, -6.07222318649292e-06, -5.407258868217468e-06, -4.742294549942017e-06, -4.077330231666565e-06, -3.4123659133911133e-06, -2.7474015951156616e-06, -2.08243727684021e-06, -1.4174729585647583e-06, -7.525086402893066e-07, -8.754432201385498e-08, 5.774199962615967e-07, 1.2423843145370483e-06, 1.9073486328125e-06, 2.5723129510879517e-06, 3.2372772693634033e-06, 3.902241587638855e-06, 4.567205905914307e-06, 5.232170224189758e-06, 5.89713454246521e-06, 6.562098860740662e-06, 7.227063179016113e-06, 7.892027497291565e-06, 8.556991815567017e-06, 9.221956133842468e-06, 9.88692045211792e-06, 1.0551884770393372e-05, 1.1216849088668823e-05, 1.1881813406944275e-05, 1.2546777725219727e-05, 1.3211742043495178e-05, 1.387670636177063e-05, 1.4541670680046082e-05, 1.5206634998321533e-05, 1.5871599316596985e-05, 1.6536563634872437e-05, 1.7201527953147888e-05, 1.786649227142334e-05, 1.853145658969879e-05, 1.9196420907974243e-05, 1.9861385226249695e-05, 2.0526349544525146e-05, 2.1191313862800598e-05, 2.185627818107605e-05, 2.25212424993515e-05, 2.3186206817626953e-05]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 15.0, 9.0, 12.0, 7.0, 7.0, 18.0, 14.0, 11.0, 805.0, 20.0, 15.0, 12.0, 14.0, 7.0, 7.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.351340443989102e-07, -1.303858283563386e-07, -1.2563761231376702e-07, -1.2088939627119544e-07, -1.1614118733405121e-07, -1.1139297129147963e-07, -1.066447623543354e-07, -1.0189654631176381e-07, -9.714833026919223e-08, -9.240011422662064e-08, -8.765189818404906e-08, -8.290368924690483e-08, -7.815547320433325e-08, -7.340725716176166e-08, -6.865904822461744e-08, -6.391083218204585e-08, -5.9162616139474267e-08, -5.441440009690268e-08, -4.9666187607044776e-08, -4.491797511718687e-08, -4.0169759074615285e-08, -3.54215430320437e-08, -3.0673330542185795e-08, -2.592511805232789e-08, -2.1176902009756304e-08, -1.642868774354156e-08, -1.1680473477326814e-08, -6.9322592111120684e-09, -2.184044944897323e-09, 2.564169321317422e-09, 7.3123835875321674e-09, 1.2060596077390073e-08, 1.6808812119961658e-08, 2.1557026386176403e-08, 2.630524065239115e-08, 3.1053453142249055e-08, 3.580166918482064e-08, 4.0549885227392224e-08, 4.529809771725013e-08, 5.0046310207108036e-08, 5.479452624967962e-08, 5.9542742292251205e-08, 6.429095833482279e-08, 6.903916727196702e-08, 7.37873833145386e-08, 7.853559935711019e-08, 8.328380829425441e-08, 8.8032024336826e-08, 9.278024037939758e-08, 9.752845642196917e-08, 1.0227667246454075e-07, 1.0702488140168498e-07, 1.1177309744425656e-07, 1.1652131348682815e-07, 1.2126952242397238e-07, 1.2601773846654396e-07, 1.3076595450911555e-07, 1.3551417055168713e-07, 1.4026238659425871e-07, 1.450106026368303e-07, 1.4975881867940188e-07, 1.5450702051111875e-07, 1.5925523655369034e-07, 1.6400345259626192e-07, 1.687516686388335e-07]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 83.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 815.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 2.0, 6.0, 8.0, 4.0, 13.0, 9.0, 12.0, 20.0, 13.0, 16.0, 16.0, 22.0, 25.0, 20.0, 25.0, 37.0, 37.0, 36.0, 37.0, 36.0, 35.0, 52.0, 45.0, 44.0, 43.0, 42.0, 44.0, 31.0, 34.0, 38.0, 22.0, 27.0, 25.0, 18.0, 15.0, 20.0, 11.0, 14.0, 10.0, 7.0, 7.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3359375, -1.2928619384765625, -1.249786376953125, -1.2067108154296875, -1.16363525390625, -1.1205596923828125, -1.077484130859375, -1.0344085693359375, -0.9913330078125, -0.9482574462890625, -0.905181884765625, -0.8621063232421875, -0.81903076171875, -0.7759552001953125, -0.732879638671875, -0.6898040771484375, -0.646728515625, -0.6036529541015625, -0.560577392578125, -0.5175018310546875, -0.47442626953125, -0.4313507080078125, -0.388275146484375, -0.3451995849609375, -0.3021240234375, -0.2590484619140625, -0.215972900390625, -0.1728973388671875, -0.12982177734375, -0.0867462158203125, -0.043670654296875, -0.0005950927734375, 0.04248046875, 0.0855560302734375, 0.128631591796875, 0.1717071533203125, 0.21478271484375, 0.2578582763671875, 0.300933837890625, 0.3440093994140625, 0.3870849609375, 0.4301605224609375, 0.473236083984375, 0.5163116455078125, 0.55938720703125, 0.6024627685546875, 0.645538330078125, 0.6886138916015625, 0.731689453125, 0.7747650146484375, 0.817840576171875, 0.8609161376953125, 0.90399169921875, 0.9470672607421875, 0.990142822265625, 1.0332183837890625, 1.0762939453125, 1.1193695068359375, 1.162445068359375, 1.2055206298828125, 1.24859619140625, 1.2916717529296875, 1.334747314453125, 1.3778228759765625, 1.4208984375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 9.0, 8.0, 30.0, 36.0, 70.0, 77.0, 121.0, 211.0, 263.0, 432.0, 682.0, 1033.0, 1595.0, 2490.0, 4184.0, 7699.0, 14349.0, 29584.0, 66354.0, 157552.0, 368903.0, 221806.0, 89549.0, 39856.0, 18386.0, 9696.0, 5271.0, 3071.0, 1835.0, 1149.0, 764.0, 479.0, 329.0, 225.0, 154.0, 94.0, 76.0, 33.0, 30.0, 18.0, 13.0, 10.0, 9.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.974609375, -1.915985107421875, -1.85736083984375, -1.798736572265625, -1.7401123046875, -1.681488037109375, -1.62286376953125, -1.564239501953125, -1.505615234375, -1.446990966796875, -1.38836669921875, -1.329742431640625, -1.2711181640625, -1.212493896484375, -1.15386962890625, -1.095245361328125, -1.03662109375, -0.977996826171875, -0.91937255859375, -0.860748291015625, -0.8021240234375, -0.743499755859375, -0.68487548828125, -0.626251220703125, -0.567626953125, -0.509002685546875, -0.45037841796875, -0.391754150390625, -0.3331298828125, -0.274505615234375, -0.21588134765625, -0.157257080078125, -0.0986328125, -0.040008544921875, 0.01861572265625, 0.077239990234375, 0.1358642578125, 0.194488525390625, 0.25311279296875, 0.311737060546875, 0.370361328125, 0.428985595703125, 0.48760986328125, 0.546234130859375, 0.6048583984375, 0.663482666015625, 0.72210693359375, 0.780731201171875, 0.83935546875, 0.897979736328125, 0.95660400390625, 1.015228271484375, 1.0738525390625, 1.132476806640625, 1.19110107421875, 1.249725341796875, 1.308349609375, 1.366973876953125, 1.42559814453125, 1.484222412109375, 1.5428466796875, 1.601470947265625, 1.66009521484375, 1.718719482421875, 1.77734375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 2.0, 6.0, 4.0, 13.0, 11.0, 5.0, 17.0, 17.0, 39.0, 30.0, 30.0, 34.0, 46.0, 46.0, 54.0, 65.0, 110.0, 210.0, 1562.0, 212.0, 101.0, 74.0, 55.0, 48.0, 34.0, 52.0, 33.0, 27.0, 11.0, 27.0, 14.0, 9.0, 8.0, 14.0, 5.0, 2.0, 4.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.05078125, -4.8797607421875, -4.708740234375, -4.5377197265625, -4.36669921875, -4.1956787109375, -4.024658203125, -3.8536376953125, -3.6826171875, -3.5115966796875, -3.340576171875, -3.1695556640625, -2.99853515625, -2.8275146484375, -2.656494140625, -2.4854736328125, -2.314453125, -2.1434326171875, -1.972412109375, -1.8013916015625, -1.63037109375, -1.4593505859375, -1.288330078125, -1.1173095703125, -0.9462890625, -0.7752685546875, -0.604248046875, -0.4332275390625, -0.26220703125, -0.0911865234375, 0.079833984375, 0.2508544921875, 0.421875, 0.5928955078125, 0.763916015625, 0.9349365234375, 1.10595703125, 1.2769775390625, 1.447998046875, 1.6190185546875, 1.7900390625, 1.9610595703125, 2.132080078125, 2.3031005859375, 2.47412109375, 2.6451416015625, 2.816162109375, 2.9871826171875, 3.158203125, 3.3292236328125, 3.500244140625, 3.6712646484375, 3.84228515625, 4.0133056640625, 4.184326171875, 4.3553466796875, 4.5263671875, 4.6973876953125, 4.868408203125, 5.0394287109375, 5.21044921875, 5.3814697265625, 5.552490234375, 5.7235107421875, 5.89453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 3.0, 1.0, 6.0, 9.0, 6.0, 13.0, 11.0, 15.0, 18.0, 24.0, 45.0, 53.0, 53.0, 83.0, 181.0, 438.0, 1653.0, 35859.0, 2998039.0, 105260.0, 2801.0, 493.0, 219.0, 122.0, 76.0, 37.0, 43.0, 35.0, 25.0, 23.0, 13.0, 7.0, 12.0, 7.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.828125, -13.4285888671875, -13.029052734375, -12.6295166015625, -12.22998046875, -11.8304443359375, -11.430908203125, -11.0313720703125, -10.6318359375, -10.2322998046875, -9.832763671875, -9.4332275390625, -9.03369140625, -8.6341552734375, -8.234619140625, -7.8350830078125, -7.435546875, -7.0360107421875, -6.636474609375, -6.2369384765625, -5.83740234375, -5.4378662109375, -5.038330078125, -4.6387939453125, -4.2392578125, -3.8397216796875, -3.440185546875, -3.0406494140625, -2.64111328125, -2.2415771484375, -1.842041015625, -1.4425048828125, -1.04296875, -0.6434326171875, -0.243896484375, 0.1556396484375, 0.55517578125, 0.9547119140625, 1.354248046875, 1.7537841796875, 2.1533203125, 2.5528564453125, 2.952392578125, 3.3519287109375, 3.75146484375, 4.1510009765625, 4.550537109375, 4.9500732421875, 5.349609375, 5.7491455078125, 6.148681640625, 6.5482177734375, 6.94775390625, 7.3472900390625, 7.746826171875, 8.1463623046875, 8.5458984375, 8.9454345703125, 9.344970703125, 9.7445068359375, 10.14404296875, 10.5435791015625, 10.943115234375, 11.3426513671875, 11.7421875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 15.0, 26.0, 43.0, 95.0, 158.0, 206.0, 180.0, 121.0, 75.0, 48.0, 22.0, 10.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.23815155029297, -15.808196067810059, -15.378240585327148, -14.948284149169922, -14.518328666687012, -14.088373184204102, -13.658417701721191, -13.228462219238281, -12.798505783081055, -12.368550300598145, -11.938594818115234, -11.508638381958008, -11.078682899475098, -10.648727416992188, -10.218771934509277, -9.788816452026367, -9.358860969543457, -8.928905487060547, -8.498950004577637, -8.068994522094727, -7.6390380859375, -7.20908260345459, -6.77912712097168, -6.3491716384887695, -5.919215679168701, -5.489260196685791, -5.059304237365723, -4.6293487548828125, -4.199393272399902, -3.769437313079834, -3.339481830596924, -2.9095261096954346, -2.4795703887939453, -2.049614667892456, -1.6196590662002563, -1.1897034645080566, -0.7597477436065674, -0.3297920227050781, 0.10016345977783203, 0.5301191806793213, 0.9600749015808105, 1.3900306224822998, 1.8199862241744995, 2.249941825866699, 2.6798975467681885, 3.1098532676696777, 3.539808750152588, 3.969764471054077, 4.399720191955566, 4.829675674438477, 5.259631633758545, 5.689587116241455, 6.119543075561523, 6.549498558044434, 6.979454040527344, 7.409409523010254, 7.839365482330322, 8.26932144165039, 8.6992769241333, 9.129232406616211, 9.559187889099121, 9.989143371582031, 10.419099807739258, 10.849055290222168, 11.279010772705078]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 15.0, 10.0, 18.0, 19.0, 23.0, 22.0, 18.0, 14.0, 22.0, 23.0, 36.0, 35.0, 41.0, 40.0, 47.0, 42.0, 42.0, 51.0, 34.0, 42.0, 41.0, 41.0, 26.0, 43.0, 35.0, 30.0, 28.0, 25.0, 20.0, 24.0, 22.0, 13.0, 17.0, 12.0, 9.0, 5.0, 2.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.803150177001953, -16.246971130371094, -15.69079303741455, -15.134614944458008, -14.578435897827148, -14.022256851196289, -13.466078758239746, -12.909900665283203, -12.353721618652344, -11.797542572021484, -11.241364479064941, -10.685186386108398, -10.129007339477539, -9.57282829284668, -9.016650199890137, -8.460472106933594, -7.904293060302734, -7.348114490509033, -6.791935920715332, -6.235757350921631, -5.67957878112793, -5.1234002113342285, -4.567221641540527, -4.011043071746826, -3.454864501953125, -2.898685932159424, -2.3425073623657227, -1.7863287925720215, -1.2301502227783203, -0.6739716529846191, -0.11779308319091797, 0.4383854866027832, 0.9945621490478516, 1.5507407188415527, 2.106919288635254, 2.663097858428955, 3.2192764282226562, 3.7754549980163574, 4.331633567810059, 4.88781213760376, 5.443990707397461, 6.000169277191162, 6.556347846984863, 7.1125264167785645, 7.668704986572266, 8.224884033203125, 8.781062126159668, 9.337240219116211, 9.89341926574707, 10.44959831237793, 11.005776405334473, 11.561954498291016, 12.118133544921875, 12.674312591552734, 13.230490684509277, 13.78666877746582, 14.34284782409668, 14.899026870727539, 15.455204963684082, 16.011383056640625, 16.567562103271484, 17.123741149902344, 17.679920196533203, 18.23609733581543, 18.79227638244629]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 6.0, 11.0, 10.0, 17.0, 20.0, 10.0, 17.0, 17.0, 22.0, 23.0, 21.0, 25.0, 34.0, 37.0, 29.0, 42.0, 40.0, 41.0, 39.0, 41.0, 42.0, 51.0, 43.0, 35.0, 41.0, 42.0, 22.0, 25.0, 25.0, 22.0, 21.0, 24.0, 11.0, 15.0, 16.0, 9.0, 9.0, 7.0, 8.0, 9.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.302734375, -1.259521484375, -1.21630859375, -1.173095703125, -1.1298828125, -1.086669921875, -1.04345703125, -1.000244140625, -0.95703125, -0.913818359375, -0.87060546875, -0.827392578125, -0.7841796875, -0.740966796875, -0.69775390625, -0.654541015625, -0.611328125, -0.568115234375, -0.52490234375, -0.481689453125, -0.4384765625, -0.395263671875, -0.35205078125, -0.308837890625, -0.265625, -0.222412109375, -0.17919921875, -0.135986328125, -0.0927734375, -0.049560546875, -0.00634765625, 0.036865234375, 0.080078125, 0.123291015625, 0.16650390625, 0.209716796875, 0.2529296875, 0.296142578125, 0.33935546875, 0.382568359375, 0.42578125, 0.468994140625, 0.51220703125, 0.555419921875, 0.5986328125, 0.641845703125, 0.68505859375, 0.728271484375, 0.771484375, 0.814697265625, 0.85791015625, 0.901123046875, 0.9443359375, 0.987548828125, 1.03076171875, 1.073974609375, 1.1171875, 1.160400390625, 1.20361328125, 1.246826171875, 1.2900390625, 1.333251953125, 1.37646484375, 1.419677734375, 1.462890625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 11.0, 5.0, 8.0, 5.0, 14.0, 10.0, 14.0, 22.0, 23.0, 35.0, 30.0, 35.0, 41.0, 49.0, 60.0, 107.0, 140.0, 258.0, 521.0, 1206.0, 3735.0, 15942.0, 100318.0, 966413.0, 2725662.0, 326187.0, 41724.0, 7769.0, 2090.0, 722.0, 377.0, 191.0, 102.0, 87.0, 69.0, 61.0, 35.0, 29.0, 34.0, 31.0, 19.0, 14.0, 19.0, 17.0, 11.0, 15.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.32421875, -6.1341552734375, -5.944091796875, -5.7540283203125, -5.56396484375, -5.3739013671875, -5.183837890625, -4.9937744140625, -4.8037109375, -4.6136474609375, -4.423583984375, -4.2335205078125, -4.04345703125, -3.8533935546875, -3.663330078125, -3.4732666015625, -3.283203125, -3.0931396484375, -2.903076171875, -2.7130126953125, -2.52294921875, -2.3328857421875, -2.142822265625, -1.9527587890625, -1.7626953125, -1.5726318359375, -1.382568359375, -1.1925048828125, -1.00244140625, -0.8123779296875, -0.622314453125, -0.4322509765625, -0.2421875, -0.0521240234375, 0.137939453125, 0.3280029296875, 0.51806640625, 0.7081298828125, 0.898193359375, 1.0882568359375, 1.2783203125, 1.4683837890625, 1.658447265625, 1.8485107421875, 2.03857421875, 2.2286376953125, 2.418701171875, 2.6087646484375, 2.798828125, 2.9888916015625, 3.178955078125, 3.3690185546875, 3.55908203125, 3.7491455078125, 3.939208984375, 4.1292724609375, 4.3193359375, 4.5093994140625, 4.699462890625, 4.8895263671875, 5.07958984375, 5.2696533203125, 5.459716796875, 5.6497802734375, 5.83984375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 9.0, 18.0, 27.0, 25.0, 54.0, 80.0, 142.0, 208.0, 306.0, 466.0, 677.0, 667.0, 481.0, 328.0, 216.0, 155.0, 81.0, 52.0, 37.0, 17.0, 11.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.696533203125, -8.47900390625, -8.261474609375, -8.0439453125, -7.826416015625, -7.60888671875, -7.391357421875, -7.173828125, -6.956298828125, -6.73876953125, -6.521240234375, -6.3037109375, -6.086181640625, -5.86865234375, -5.651123046875, -5.43359375, -5.216064453125, -4.99853515625, -4.781005859375, -4.5634765625, -4.345947265625, -4.12841796875, -3.910888671875, -3.693359375, -3.475830078125, -3.25830078125, -3.040771484375, -2.8232421875, -2.605712890625, -2.38818359375, -2.170654296875, -1.953125, -1.735595703125, -1.51806640625, -1.300537109375, -1.0830078125, -0.865478515625, -0.64794921875, -0.430419921875, -0.212890625, 0.004638671875, 0.22216796875, 0.439697265625, 0.6572265625, 0.874755859375, 1.09228515625, 1.309814453125, 1.52734375, 1.744873046875, 1.96240234375, 2.179931640625, 2.3974609375, 2.614990234375, 2.83251953125, 3.050048828125, 3.267578125, 3.485107421875, 3.70263671875, 3.920166015625, 4.1376953125, 4.355224609375, 4.57275390625, 4.790283203125, 5.0078125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 10.0, 22.0, 30.0, 55.0, 97.0, 152.0, 290.0, 535.0, 1161.0, 2696.0, 9550.0, 55497.0, 497295.0, 2770106.0, 757435.0, 80811.0, 12502.0, 3316.0, 1325.0, 599.0, 346.0, 187.0, 104.0, 59.0, 32.0, 20.0, 13.0, 9.0, 10.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.40625, -9.08837890625, -8.7705078125, -8.45263671875, -8.134765625, -7.81689453125, -7.4990234375, -7.18115234375, -6.86328125, -6.54541015625, -6.2275390625, -5.90966796875, -5.591796875, -5.27392578125, -4.9560546875, -4.63818359375, -4.3203125, -4.00244140625, -3.6845703125, -3.36669921875, -3.048828125, -2.73095703125, -2.4130859375, -2.09521484375, -1.77734375, -1.45947265625, -1.1416015625, -0.82373046875, -0.505859375, -0.18798828125, 0.1298828125, 0.44775390625, 0.765625, 1.08349609375, 1.4013671875, 1.71923828125, 2.037109375, 2.35498046875, 2.6728515625, 2.99072265625, 3.30859375, 3.62646484375, 3.9443359375, 4.26220703125, 4.580078125, 4.89794921875, 5.2158203125, 5.53369140625, 5.8515625, 6.16943359375, 6.4873046875, 6.80517578125, 7.123046875, 7.44091796875, 7.7587890625, 8.07666015625, 8.39453125, 8.71240234375, 9.0302734375, 9.34814453125, 9.666015625, 9.98388671875, 10.3017578125, 10.61962890625, 10.9375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 18.0, 51.0, 119.0, 224.0, 255.0, 171.0, 105.0, 57.0, 11.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.57279205322266, -92.76798248291016, -90.96317291259766, -89.15836334228516, -87.35355377197266, -85.54873657226562, -83.74392700195312, -81.93911743164062, -80.13430786132812, -78.32949829101562, -76.52468872070312, -74.71987915039062, -72.91506958007812, -71.11026000976562, -69.3054428100586, -67.5006332397461, -65.6958236694336, -63.891014099121094, -62.086204528808594, -60.28139114379883, -58.47658157348633, -56.67177200317383, -54.86696243286133, -53.06214904785156, -51.25734329223633, -49.45253372192383, -47.64772415161133, -45.84291076660156, -44.03810119628906, -42.23329162597656, -40.42848205566406, -38.62367248535156, -36.81885528564453, -35.01404571533203, -33.20923614501953, -31.4044246673584, -29.599613189697266, -27.794803619384766, -25.989994049072266, -24.185182571411133, -22.380374908447266, -20.575565338134766, -18.770753860473633, -16.965944290161133, -15.1611328125, -13.3563232421875, -11.551512718200684, -9.746702194213867, -7.941890716552734, -6.137080192565918, -4.332269668579102, -2.5274596214294434, -0.722649097442627, 1.0821609497070312, 2.8869714736938477, 4.691781997680664, 6.4965925216674805, 8.301403045654297, 10.106213569641113, 11.91102409362793, 13.71583366394043, 15.520644187927246, 17.325454711914062, 19.130264282226562, 20.935075759887695]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 5.0, 3.0, 4.0, 7.0, 3.0, 15.0, 17.0, 19.0, 25.0, 23.0, 30.0, 27.0, 37.0, 49.0, 38.0, 51.0, 30.0, 48.0, 39.0, 43.0, 43.0, 39.0, 41.0, 34.0, 46.0, 36.0, 44.0, 27.0, 19.0, 29.0, 19.0, 15.0, 21.0, 21.0, 10.0, 13.0, 12.0, 7.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.511360168457031, -14.975646018981934, -14.439931869506836, -13.904217720031738, -13.36850357055664, -12.83279037475586, -12.297076225280762, -11.761362075805664, -11.225647926330566, -10.689933776855469, -10.154219627380371, -9.618505477905273, -9.082792282104492, -8.547077178955078, -8.011363983154297, -7.475649833679199, -6.939935684204102, -6.404221534729004, -5.868507385253906, -5.332793712615967, -4.797079563140869, -4.2613654136657715, -3.725651502609253, -3.1899375915527344, -2.6542234420776367, -2.118509292602539, -1.5827953815460205, -1.0470813512802124, -0.5113673210144043, 0.02434682846069336, 0.5600607395172119, 1.0957746505737305, 1.631490707397461, 2.1672048568725586, 2.702918767929077, 3.2386326789855957, 3.7743468284606934, 4.310060977935791, 4.8457746505737305, 5.381488800048828, 5.917202949523926, 6.452917098999023, 6.988631248474121, 7.5243449211120605, 8.06005859375, 8.595773696899414, 9.131486892700195, 9.667201042175293, 10.20291519165039, 10.738629341125488, 11.274343490600586, 11.810057640075684, 12.345771789550781, 12.881484985351562, 13.41719913482666, 13.952913284301758, 14.488627433776855, 15.024341583251953, 15.56005573272705, 16.09576988220215, 16.63148307800293, 17.167198181152344, 17.702911376953125, 18.238624572753906, 18.77433967590332]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 5.0, 1.0, 5.0, 8.0, 9.0, 7.0, 10.0, 16.0, 16.0, 18.0, 17.0, 18.0, 15.0, 20.0, 24.0, 22.0, 30.0, 37.0, 41.0, 31.0, 34.0, 42.0, 45.0, 50.0, 41.0, 31.0, 36.0, 37.0, 32.0, 37.0, 37.0, 22.0, 30.0, 23.0, 20.0, 25.0, 16.0, 26.0, 10.0, 11.0, 12.0, 7.0, 11.0, 6.0, 3.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2446746826171875, -1.201263427734375, -1.1578521728515625, -1.11444091796875, -1.0710296630859375, -1.027618408203125, -0.9842071533203125, -0.9407958984375, -0.8973846435546875, -0.853973388671875, -0.8105621337890625, -0.76715087890625, -0.7237396240234375, -0.680328369140625, -0.6369171142578125, -0.593505859375, -0.5500946044921875, -0.506683349609375, -0.4632720947265625, -0.41986083984375, -0.3764495849609375, -0.333038330078125, -0.2896270751953125, -0.2462158203125, -0.2028045654296875, -0.159393310546875, -0.1159820556640625, -0.07257080078125, -0.0291595458984375, 0.014251708984375, 0.0576629638671875, 0.10107421875, 0.1444854736328125, 0.187896728515625, 0.2313079833984375, 0.27471923828125, 0.3181304931640625, 0.361541748046875, 0.4049530029296875, 0.4483642578125, 0.4917755126953125, 0.535186767578125, 0.5785980224609375, 0.62200927734375, 0.6654205322265625, 0.708831787109375, 0.7522430419921875, 0.795654296875, 0.8390655517578125, 0.882476806640625, 0.9258880615234375, 0.96929931640625, 1.0127105712890625, 1.056121826171875, 1.0995330810546875, 1.1429443359375, 1.1863555908203125, 1.229766845703125, 1.2731781005859375, 1.31658935546875, 1.3600006103515625, 1.403411865234375, 1.4468231201171875, 1.490234375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 12.0, 14.0, 30.0, 46.0, 54.0, 80.0, 122.0, 193.0, 281.0, 408.0, 666.0, 970.0, 1472.0, 2155.0, 3313.0, 4941.0, 7601.0, 11340.0, 17061.0, 26755.0, 42617.0, 70110.0, 127787.0, 329288.0, 171468.0, 86725.0, 51588.0, 31743.0, 20413.0, 13183.0, 8743.0, 5836.0, 3852.0, 2608.0, 1724.0, 1119.0, 743.0, 523.0, 323.0, 204.0, 154.0, 97.0, 79.0, 41.0, 22.0, 15.0, 11.0, 11.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05242919921875, -0.05066347122192383, -0.048897743225097656, -0.047132015228271484, -0.04536628723144531, -0.04360055923461914, -0.04183483123779297, -0.0400691032409668, -0.038303375244140625, -0.03653764724731445, -0.03477191925048828, -0.03300619125366211, -0.031240463256835938, -0.029474735260009766, -0.027709007263183594, -0.025943279266357422, -0.02417755126953125, -0.022411823272705078, -0.020646095275878906, -0.018880367279052734, -0.017114639282226562, -0.01534891128540039, -0.013583183288574219, -0.011817455291748047, -0.010051727294921875, -0.008285999298095703, -0.006520271301269531, -0.004754543304443359, -0.0029888153076171875, -0.0012230873107910156, 0.0005426406860351562, 0.002308368682861328, 0.0040740966796875, 0.005839824676513672, 0.007605552673339844, 0.009371280670166016, 0.011137008666992188, 0.01290273666381836, 0.014668464660644531, 0.016434192657470703, 0.018199920654296875, 0.019965648651123047, 0.02173137664794922, 0.02349710464477539, 0.025262832641601562, 0.027028560638427734, 0.028794288635253906, 0.030560016632080078, 0.03232574462890625, 0.03409147262573242, 0.035857200622558594, 0.037622928619384766, 0.03938865661621094, 0.04115438461303711, 0.04292011260986328, 0.04468584060668945, 0.046451568603515625, 0.0482172966003418, 0.04998302459716797, 0.05174875259399414, 0.05351448059082031, 0.055280208587646484, 0.057045936584472656, 0.05881166458129883, 0.060577392578125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 3.0, 6.0, 3.0, 8.0, 8.0, 7.0, 3.0, 8.0, 4.0, 11.0, 16.0, 17.0, 22.0, 15.0, 21.0, 28.0, 32.0, 33.0, 31.0, 23.0, 36.0, 39.0, 33.0, 30.0, 39.0, 1052.0, 40.0, 32.0, 56.0, 28.0, 31.0, 27.0, 26.0, 24.0, 37.0, 31.0, 25.0, 27.0, 16.0, 13.0, 16.0, 11.0, 12.0, 8.0, 7.0, 5.0, 11.0, 5.0, 1.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0], "bins": [-1.0693359375, -1.0385665893554688, -1.0077972412109375, -0.9770278930664062, -0.946258544921875, -0.9154891967773438, -0.8847198486328125, -0.8539505004882812, -0.82318115234375, -0.7924118041992188, -0.7616424560546875, -0.7308731079101562, -0.700103759765625, -0.6693344116210938, -0.6385650634765625, -0.6077957153320312, -0.5770263671875, -0.5462570190429688, -0.5154876708984375, -0.48471832275390625, -0.453948974609375, -0.42317962646484375, -0.3924102783203125, -0.36164093017578125, -0.33087158203125, -0.30010223388671875, -0.2693328857421875, -0.23856353759765625, -0.207794189453125, -0.17702484130859375, -0.1462554931640625, -0.11548614501953125, -0.084716796875, -0.05394744873046875, -0.0231781005859375, 0.00759124755859375, 0.038360595703125, 0.06912994384765625, 0.0998992919921875, 0.13066864013671875, 0.16143798828125, 0.19220733642578125, 0.2229766845703125, 0.25374603271484375, 0.284515380859375, 0.31528472900390625, 0.3460540771484375, 0.37682342529296875, 0.4075927734375, 0.43836212158203125, 0.4691314697265625, 0.49990081787109375, 0.530670166015625, 0.5614395141601562, 0.5922088623046875, 0.6229782104492188, 0.65374755859375, 0.6845169067382812, 0.7152862548828125, 0.7460556030273438, 0.776824951171875, 0.8075942993164062, 0.8383636474609375, 0.8691329956054688, 0.89990234375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 5.0, 8.0, 9.0, 24.0, 31.0, 40.0, 76.0, 119.0, 164.0, 250.0, 341.0, 457.0, 699.0, 966.0, 1372.0, 1898.0, 2797.0, 3862.0, 5617.0, 7950.0, 11622.0, 17324.0, 25612.0, 38688.0, 60277.0, 101850.0, 205014.0, 1302357.0, 113214.0, 65740.0, 41555.0, 27662.0, 18295.0, 12567.0, 8662.0, 5941.0, 4074.0, 3000.0, 2061.0, 1578.0, 1004.0, 737.0, 517.0, 390.0, 228.0, 179.0, 113.0, 81.0, 39.0, 26.0, 18.0, 15.0, 9.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0291290283203125, -0.02819204330444336, -0.02725505828857422, -0.026318073272705078, -0.025381088256835938, -0.024444103240966797, -0.023507118225097656, -0.022570133209228516, -0.021633148193359375, -0.020696163177490234, -0.019759178161621094, -0.018822193145751953, -0.017885208129882812, -0.016948223114013672, -0.01601123809814453, -0.01507425308227539, -0.01413726806640625, -0.01320028305053711, -0.012263298034667969, -0.011326313018798828, -0.010389328002929688, -0.009452342987060547, -0.008515357971191406, -0.007578372955322266, -0.006641387939453125, -0.005704402923583984, -0.004767417907714844, -0.003830432891845703, -0.0028934478759765625, -0.001956462860107422, -0.0010194778442382812, -8.249282836914062e-05, 0.0008544921875, 0.0017914772033691406, 0.0027284622192382812, 0.003665447235107422, 0.0046024322509765625, 0.005539417266845703, 0.006476402282714844, 0.007413387298583984, 0.008350372314453125, 0.009287357330322266, 0.010224342346191406, 0.011161327362060547, 0.012098312377929688, 0.013035297393798828, 0.013972282409667969, 0.01490926742553711, 0.01584625244140625, 0.01678323745727539, 0.01772022247314453, 0.018657207489013672, 0.019594192504882812, 0.020531177520751953, 0.021468162536621094, 0.022405147552490234, 0.023342132568359375, 0.024279117584228516, 0.025216102600097656, 0.026153087615966797, 0.027090072631835938, 0.028027057647705078, 0.02896404266357422, 0.02990102767944336, 0.0308380126953125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 8.0, 0.0, 30.0, 0.0, 35.0, 0.0, 0.0, 108.0, 0.0, 635.0, 0.0, 105.0, 0.0, 0.0, 26.0, 0.0, 19.0, 0.0, 0.0, 11.0, 0.0, 5.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-8.940696716308594e-07, -8.689239621162415e-07, -8.437782526016235e-07, -8.186325430870056e-07, -7.934868335723877e-07, -7.683411240577698e-07, -7.431954145431519e-07, -7.180497050285339e-07, -6.92903995513916e-07, -6.677582859992981e-07, -6.426125764846802e-07, -6.174668669700623e-07, -5.923211574554443e-07, -5.671754479408264e-07, -5.420297384262085e-07, -5.168840289115906e-07, -4.917383193969727e-07, -4.6659260988235474e-07, -4.414469003677368e-07, -4.163011908531189e-07, -3.91155481338501e-07, -3.6600977182388306e-07, -3.4086406230926514e-07, -3.157183527946472e-07, -2.905726432800293e-07, -2.654269337654114e-07, -2.4028122425079346e-07, -2.1513551473617554e-07, -1.8998980522155762e-07, -1.648440957069397e-07, -1.3969838619232178e-07, -1.1455267667770386e-07, -8.940696716308594e-08, -6.426125764846802e-08, -3.91155481338501e-08, -1.3969838619232178e-08, 1.1175870895385742e-08, 3.632158041000366e-08, 6.146728992462158e-08, 8.66129994392395e-08, 1.1175870895385742e-07, 1.3690441846847534e-07, 1.6205012798309326e-07, 1.8719583749771118e-07, 2.123415470123291e-07, 2.3748725652694702e-07, 2.6263296604156494e-07, 2.8777867555618286e-07, 3.129243850708008e-07, 3.380700945854187e-07, 3.632158041000366e-07, 3.8836151361465454e-07, 4.1350722312927246e-07, 4.386529326438904e-07, 4.637986421585083e-07, 4.889443516731262e-07, 5.140900611877441e-07, 5.392357707023621e-07, 5.6438148021698e-07, 5.895271897315979e-07, 6.146728992462158e-07, 6.398186087608337e-07, 6.649643182754517e-07, 6.901100277900696e-07, 7.152557373046875e-07]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 11.0, 5.0, 4.0, 5.0, 10.0, 15.0, 8.0, 21.0, 21.0, 56.0, 35.0, 98.0, 88.0, 476.0, 4928.0, 883851.0, 156435.0, 1773.0, 370.0, 71.0, 72.0, 21.0, 56.0, 11.0, 22.0, 17.0, 18.0, 7.0, 2.0, 11.0, 6.0, 5.0, 3.0, 2.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.3470649719238281e-05, -1.3084150850772858e-05, -1.2697651982307434e-05, -1.231115311384201e-05, -1.1924654245376587e-05, -1.1538155376911163e-05, -1.115165650844574e-05, -1.0765157639980316e-05, -1.0378658771514893e-05, -9.992159903049469e-06, -9.605661034584045e-06, -9.219162166118622e-06, -8.832663297653198e-06, -8.446164429187775e-06, -8.059665560722351e-06, -7.673166692256927e-06, -7.286667823791504e-06, -6.90016895532608e-06, -6.513670086860657e-06, -6.127171218395233e-06, -5.7406723499298096e-06, -5.354173481464386e-06, -4.967674612998962e-06, -4.581175744533539e-06, -4.194676876068115e-06, -3.8081780076026917e-06, -3.421679139137268e-06, -3.0351802706718445e-06, -2.648681402206421e-06, -2.2621825337409973e-06, -1.8756836652755737e-06, -1.4891847968101501e-06, -1.1026859283447266e-06, -7.16187059879303e-07, -3.296881914138794e-07, 5.681067705154419e-08, 4.4330954551696777e-07, 8.298084139823914e-07, 1.216307282447815e-06, 1.6028061509132385e-06, 1.989305019378662e-06, 2.3758038878440857e-06, 2.7623027563095093e-06, 3.148801624774933e-06, 3.5353004932403564e-06, 3.92179936170578e-06, 4.308298230171204e-06, 4.694797098636627e-06, 5.081295967102051e-06, 5.467794835567474e-06, 5.854293704032898e-06, 6.2407925724983215e-06, 6.627291440963745e-06, 7.013790309429169e-06, 7.400289177894592e-06, 7.786788046360016e-06, 8.17328691482544e-06, 8.559785783290863e-06, 8.946284651756287e-06, 9.33278352022171e-06, 9.719282388687134e-06, 1.0105781257152557e-05, 1.0492280125617981e-05, 1.0878778994083405e-05, 1.1265277862548828e-05]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 1.0, 4.0, 2.0, 6.0, 932.0, 6.0, 3.0, 6.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7114422234953963e-07, -1.6711740613573056e-07, -1.6309057571106678e-07, -1.590637594972577e-07, -1.5503694328344864e-07, -1.5101011285878485e-07, -1.4698329664497578e-07, -1.429564804311667e-07, -1.3892965000650292e-07, -1.3490283379269385e-07, -1.3087600336803007e-07, -1.26849187154221e-07, -1.2282237094041193e-07, -1.1879554051574814e-07, -1.1476872430193907e-07, -1.1074190098270265e-07, -1.0671508476889358e-07, -1.0268826144965715e-07, -9.866144523584808e-08, -9.463462191661165e-08, -9.060779859737522e-08, -8.658098238356615e-08, -8.255415906432972e-08, -7.85273357450933e-08, -7.450051953128423e-08, -7.04736962120478e-08, -6.644687999823873e-08, -6.24200566790023e-08, -5.839323335976587e-08, -5.4366413593243124e-08, -5.0339593826720375e-08, -4.631277050748395e-08, -4.228594718824752e-08, -3.825912742172477e-08, -3.423230410248834e-08, -3.0205484335965593e-08, -2.6178662793086005e-08, -2.2151841250206417e-08, -1.8125021483683668e-08, -1.409819994080408e-08, -1.0071378397924491e-08, -6.044557299134112e-09, -2.017736200343734e-09, 2.009084454357435e-09, 6.035905997237023e-09, 1.0062727540116612e-08, 1.408954730663936e-08, 1.811636884951895e-08, 2.2143190392398537e-08, 2.6170011935278126e-08, 3.0196833478157714e-08, 3.422365324468046e-08, 3.825047656391689e-08, 4.227729633043964e-08, 4.630411609696239e-08, 5.0330939416198817e-08, 5.4357759182721566e-08, 5.8384578949244315e-08, 6.241140226848074e-08, 6.643821848228981e-08, 7.046504180152624e-08, 7.449186512076267e-08, 7.851868133457174e-08, 8.254550465380817e-08, 8.65723279730446e-08]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 39.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 934.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 47.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7881393432617188e-07, -1.7415732145309448e-07, -1.695007085800171e-07, -1.648440957069397e-07, -1.601874828338623e-07, -1.555308699607849e-07, -1.5087425708770752e-07, -1.4621764421463013e-07, -1.4156103134155273e-07, -1.3690441846847534e-07, -1.3224780559539795e-07, -1.2759119272232056e-07, -1.2293457984924316e-07, -1.1827796697616577e-07, -1.1362135410308838e-07, -1.0896474123001099e-07, -1.043081283569336e-07, -9.96515154838562e-08, -9.499490261077881e-08, -9.033828973770142e-08, -8.568167686462402e-08, -8.102506399154663e-08, -7.636845111846924e-08, -7.171183824539185e-08, -6.705522537231445e-08, -6.239861249923706e-08, -5.774199962615967e-08, -5.3085386753082275e-08, -4.842877388000488e-08, -4.377216100692749e-08, -3.91155481338501e-08, -3.4458935260772705e-08, -2.9802322387695312e-08, -2.514570951461792e-08, -2.0489096641540527e-08, -1.5832483768463135e-08, -1.1175870895385742e-08, -6.51925802230835e-09, -1.862645149230957e-09, 2.7939677238464355e-09, 7.450580596923828e-09, 1.210719347000122e-08, 1.6763806343078613e-08, 2.1420419216156006e-08, 2.60770320892334e-08, 3.073364496231079e-08, 3.5390257835388184e-08, 4.0046870708465576e-08, 4.470348358154297e-08, 4.936009645462036e-08, 5.4016709327697754e-08, 5.8673322200775146e-08, 6.332993507385254e-08, 6.798654794692993e-08, 7.264316082000732e-08, 7.729977369308472e-08, 8.195638656616211e-08, 8.66129994392395e-08, 9.12696123123169e-08, 9.592622518539429e-08, 1.0058283805847168e-07, 1.0523945093154907e-07, 1.0989606380462646e-07, 1.1455267667770386e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 5.0, 1.0, 5.0, 8.0, 9.0, 7.0, 10.0, 16.0, 16.0, 18.0, 17.0, 18.0, 15.0, 20.0, 24.0, 22.0, 30.0, 37.0, 41.0, 31.0, 34.0, 42.0, 45.0, 50.0, 41.0, 31.0, 36.0, 37.0, 32.0, 37.0, 37.0, 22.0, 30.0, 23.0, 20.0, 25.0, 16.0, 26.0, 10.0, 11.0, 12.0, 7.0, 11.0, 6.0, 3.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2446746826171875, -1.201263427734375, -1.1578521728515625, -1.11444091796875, -1.0710296630859375, -1.027618408203125, -0.9842071533203125, -0.9407958984375, -0.8973846435546875, -0.853973388671875, -0.8105621337890625, -0.76715087890625, -0.7237396240234375, -0.680328369140625, -0.6369171142578125, -0.593505859375, -0.5500946044921875, -0.506683349609375, -0.4632720947265625, -0.41986083984375, -0.3764495849609375, -0.333038330078125, -0.2896270751953125, -0.2462158203125, -0.2028045654296875, -0.159393310546875, -0.1159820556640625, -0.07257080078125, -0.0291595458984375, 0.014251708984375, 0.0576629638671875, 0.10107421875, 0.1444854736328125, 0.187896728515625, 0.2313079833984375, 0.27471923828125, 0.3181304931640625, 0.361541748046875, 0.4049530029296875, 0.4483642578125, 0.4917755126953125, 0.535186767578125, 0.5785980224609375, 0.62200927734375, 0.6654205322265625, 0.708831787109375, 0.7522430419921875, 0.795654296875, 0.8390655517578125, 0.882476806640625, 0.9258880615234375, 0.96929931640625, 1.0127105712890625, 1.056121826171875, 1.0995330810546875, 1.1429443359375, 1.1863555908203125, 1.229766845703125, 1.2731781005859375, 1.31658935546875, 1.3600006103515625, 1.403411865234375, 1.4468231201171875, 1.490234375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 7.0, 6.0, 14.0, 15.0, 24.0, 43.0, 69.0, 93.0, 146.0, 244.0, 358.0, 647.0, 1109.0, 1964.0, 3412.0, 6215.0, 12404.0, 25841.0, 64211.0, 194502.0, 476833.0, 159175.0, 54290.0, 22751.0, 11000.0, 5728.0, 3120.0, 1788.0, 1024.0, 574.0, 368.0, 204.0, 128.0, 89.0, 63.0, 39.0, 26.0, 9.0, 19.0, 8.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.53125, -2.45068359375, -2.3701171875, -2.28955078125, -2.208984375, -2.12841796875, -2.0478515625, -1.96728515625, -1.88671875, -1.80615234375, -1.7255859375, -1.64501953125, -1.564453125, -1.48388671875, -1.4033203125, -1.32275390625, -1.2421875, -1.16162109375, -1.0810546875, -1.00048828125, -0.919921875, -0.83935546875, -0.7587890625, -0.67822265625, -0.59765625, -0.51708984375, -0.4365234375, -0.35595703125, -0.275390625, -0.19482421875, -0.1142578125, -0.03369140625, 0.046875, 0.12744140625, 0.2080078125, 0.28857421875, 0.369140625, 0.44970703125, 0.5302734375, 0.61083984375, 0.69140625, 0.77197265625, 0.8525390625, 0.93310546875, 1.013671875, 1.09423828125, 1.1748046875, 1.25537109375, 1.3359375, 1.41650390625, 1.4970703125, 1.57763671875, 1.658203125, 1.73876953125, 1.8193359375, 1.89990234375, 1.98046875, 2.06103515625, 2.1416015625, 2.22216796875, 2.302734375, 2.38330078125, 2.4638671875, 2.54443359375, 2.625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 9.0, 9.0, 7.0, 5.0, 7.0, 21.0, 21.0, 36.0, 31.0, 32.0, 36.0, 34.0, 50.0, 62.0, 93.0, 181.0, 1555.0, 258.0, 116.0, 77.0, 59.0, 67.0, 42.0, 49.0, 40.0, 20.0, 21.0, 16.0, 22.0, 10.0, 18.0, 7.0, 11.0, 8.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08984375, -5.9095458984375, -5.729248046875, -5.5489501953125, -5.36865234375, -5.1883544921875, -5.008056640625, -4.8277587890625, -4.6474609375, -4.4671630859375, -4.286865234375, -4.1065673828125, -3.92626953125, -3.7459716796875, -3.565673828125, -3.3853759765625, -3.205078125, -3.0247802734375, -2.844482421875, -2.6641845703125, -2.48388671875, -2.3035888671875, -2.123291015625, -1.9429931640625, -1.7626953125, -1.5823974609375, -1.402099609375, -1.2218017578125, -1.04150390625, -0.8612060546875, -0.680908203125, -0.5006103515625, -0.3203125, -0.1400146484375, 0.040283203125, 0.2205810546875, 0.40087890625, 0.5811767578125, 0.761474609375, 0.9417724609375, 1.1220703125, 1.3023681640625, 1.482666015625, 1.6629638671875, 1.84326171875, 2.0235595703125, 2.203857421875, 2.3841552734375, 2.564453125, 2.7447509765625, 2.925048828125, 3.1053466796875, 3.28564453125, 3.4659423828125, 3.646240234375, 3.8265380859375, 4.0068359375, 4.1871337890625, 4.367431640625, 4.5477294921875, 4.72802734375, 4.9083251953125, 5.088623046875, 5.2689208984375, 5.44921875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 9.0, 6.0, 13.0, 16.0, 16.0, 29.0, 22.0, 45.0, 69.0, 89.0, 152.0, 329.0, 735.0, 2607.0, 18968.0, 462975.0, 2606537.0, 46316.0, 4714.0, 1088.0, 393.0, 195.0, 120.0, 68.0, 54.0, 35.0, 24.0, 17.0, 13.0, 13.0, 5.0, 4.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.296875, -8.978271484375, -8.65966796875, -8.341064453125, -8.0224609375, -7.703857421875, -7.38525390625, -7.066650390625, -6.748046875, -6.429443359375, -6.11083984375, -5.792236328125, -5.4736328125, -5.155029296875, -4.83642578125, -4.517822265625, -4.19921875, -3.880615234375, -3.56201171875, -3.243408203125, -2.9248046875, -2.606201171875, -2.28759765625, -1.968994140625, -1.650390625, -1.331787109375, -1.01318359375, -0.694580078125, -0.3759765625, -0.057373046875, 0.26123046875, 0.579833984375, 0.8984375, 1.217041015625, 1.53564453125, 1.854248046875, 2.1728515625, 2.491455078125, 2.81005859375, 3.128662109375, 3.447265625, 3.765869140625, 4.08447265625, 4.403076171875, 4.7216796875, 5.040283203125, 5.35888671875, 5.677490234375, 5.99609375, 6.314697265625, 6.63330078125, 6.951904296875, 7.2705078125, 7.589111328125, 7.90771484375, 8.226318359375, 8.544921875, 8.863525390625, 9.18212890625, 9.500732421875, 9.8193359375, 10.137939453125, 10.45654296875, 10.775146484375, 11.09375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 17.0, 102.0, 300.0, 348.0, 201.0, 38.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-54.88368606567383, -53.8116569519043, -52.739627838134766, -51.667598724365234, -50.5955696105957, -49.52354049682617, -48.45151138305664, -47.379478454589844, -46.30744934082031, -45.23542022705078, -44.16339111328125, -43.09136199951172, -42.01933288574219, -40.947303771972656, -39.875274658203125, -38.803245544433594, -37.73121643066406, -36.65918731689453, -35.587158203125, -34.51512908935547, -33.44309997558594, -32.371070861816406, -31.299039840698242, -30.22701072692871, -29.15498161315918, -28.08295249938965, -27.010923385620117, -25.938894271850586, -24.866863250732422, -23.79483413696289, -22.72280502319336, -21.650775909423828, -20.57874298095703, -19.5067138671875, -18.43468475341797, -17.362655639648438, -16.290626525878906, -15.218596458435059, -14.146566390991211, -13.07453727722168, -12.002509117126465, -10.930480003356934, -9.858449935913086, -8.786420822143555, -7.714391708374023, -6.642362594604492, -5.570333003997803, -4.498303413391113, -3.426274299621582, -2.3542449474334717, -1.2822155952453613, -0.21018624305725098, 0.8618431091308594, 1.9338722229003906, 3.00590181350708, 4.0779314041137695, 5.149960517883301, 6.221989631652832, 7.2940192222595215, 8.366048812866211, 9.438077926635742, 10.510107040405273, 11.582136154174805, 12.654166221618652, 13.726195335388184]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 5.0, 6.0, 4.0, 5.0, 11.0, 9.0, 14.0, 20.0, 27.0, 14.0, 25.0, 20.0, 22.0, 29.0, 26.0, 25.0, 34.0, 36.0, 38.0, 42.0, 47.0, 44.0, 38.0, 42.0, 33.0, 37.0, 36.0, 41.0, 38.0, 29.0, 26.0, 12.0, 23.0, 17.0, 26.0, 23.0, 16.0, 11.0, 12.0, 12.0, 7.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-17.735549926757812, -17.222135543823242, -16.708721160888672, -16.19530487060547, -15.681890487670898, -15.168476104736328, -14.655061721801758, -14.141646385192871, -13.628231048583984, -13.114816665649414, -12.601401329040527, -12.087986946105957, -11.57457160949707, -11.0611572265625, -10.54774284362793, -10.034327507019043, -9.520913124084473, -9.007498741149902, -8.494083404541016, -7.980669021606445, -7.467253684997559, -6.953839302062988, -6.44042444229126, -5.927009582519531, -5.413594722747803, -4.900179862976074, -4.386765003204346, -3.8733503818511963, -3.3599355220794678, -2.8465206623077393, -2.33310604095459, -1.8196911811828613, -1.3062763214111328, -0.7928615212440491, -0.27944672107696533, 0.23396801948547363, 0.7473828792572021, 1.2607977390289307, 1.77421236038208, 2.2876272201538086, 2.801042079925537, 3.3144569396972656, 3.827871799468994, 4.341286659240723, 4.854701042175293, 5.36811637878418, 5.88153076171875, 6.3949456214904785, 6.908360481262207, 7.4217753410339355, 7.935190200805664, 8.448604583740234, 8.962019920349121, 9.475434303283691, 9.988849639892578, 10.502264022827148, 11.015678405761719, 11.529092788696289, 12.042508125305176, 12.555922508239746, 13.069337844848633, 13.582752227783203, 14.096166610717773, 14.60958194732666, 15.122997283935547]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 6.0, 11.0, 11.0, 17.0, 16.0, 15.0, 18.0, 18.0, 16.0, 17.0, 24.0, 25.0, 29.0, 36.0, 35.0, 34.0, 33.0, 39.0, 46.0, 49.0, 47.0, 31.0, 43.0, 24.0, 30.0, 47.0, 27.0, 31.0, 33.0, 21.0, 17.0, 28.0, 25.0, 15.0, 18.0, 5.0, 12.0, 10.0, 9.0, 3.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.283203125, -1.2386016845703125, -1.194000244140625, -1.1493988037109375, -1.10479736328125, -1.0601959228515625, -1.015594482421875, -0.9709930419921875, -0.9263916015625, -0.8817901611328125, -0.837188720703125, -0.7925872802734375, -0.74798583984375, -0.7033843994140625, -0.658782958984375, -0.6141815185546875, -0.569580078125, -0.5249786376953125, -0.480377197265625, -0.4357757568359375, -0.39117431640625, -0.3465728759765625, -0.301971435546875, -0.2573699951171875, -0.2127685546875, -0.1681671142578125, -0.123565673828125, -0.0789642333984375, -0.03436279296875, 0.0102386474609375, 0.054840087890625, 0.0994415283203125, 0.14404296875, 0.1886444091796875, 0.233245849609375, 0.2778472900390625, 0.32244873046875, 0.3670501708984375, 0.411651611328125, 0.4562530517578125, 0.5008544921875, 0.5454559326171875, 0.590057373046875, 0.6346588134765625, 0.67926025390625, 0.7238616943359375, 0.768463134765625, 0.8130645751953125, 0.857666015625, 0.9022674560546875, 0.946868896484375, 0.9914703369140625, 1.03607177734375, 1.0806732177734375, 1.125274658203125, 1.1698760986328125, 1.2144775390625, 1.2590789794921875, 1.303680419921875, 1.3482818603515625, 1.39288330078125, 1.4374847412109375, 1.482086181640625, 1.5266876220703125, 1.5712890625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 5.0, 10.0, 11.0, 11.0, 18.0, 24.0, 28.0, 28.0, 41.0, 34.0, 55.0, 93.0, 105.0, 161.0, 325.0, 610.0, 1527.0, 4838.0, 21829.0, 138991.0, 1233791.0, 2429474.0, 307142.0, 42762.0, 8086.0, 2251.0, 836.0, 428.0, 230.0, 138.0, 95.0, 59.0, 50.0, 47.0, 36.0, 23.0, 27.0, 7.0, 18.0, 10.0, 10.0, 7.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.87890625, -5.7017822265625, -5.524658203125, -5.3475341796875, -5.17041015625, -4.9932861328125, -4.816162109375, -4.6390380859375, -4.4619140625, -4.2847900390625, -4.107666015625, -3.9305419921875, -3.75341796875, -3.5762939453125, -3.399169921875, -3.2220458984375, -3.044921875, -2.8677978515625, -2.690673828125, -2.5135498046875, -2.33642578125, -2.1593017578125, -1.982177734375, -1.8050537109375, -1.6279296875, -1.4508056640625, -1.273681640625, -1.0965576171875, -0.91943359375, -0.7423095703125, -0.565185546875, -0.3880615234375, -0.2109375, -0.0338134765625, 0.143310546875, 0.3204345703125, 0.49755859375, 0.6746826171875, 0.851806640625, 1.0289306640625, 1.2060546875, 1.3831787109375, 1.560302734375, 1.7374267578125, 1.91455078125, 2.0916748046875, 2.268798828125, 2.4459228515625, 2.623046875, 2.8001708984375, 2.977294921875, 3.1544189453125, 3.33154296875, 3.5086669921875, 3.685791015625, 3.8629150390625, 4.0400390625, 4.2171630859375, 4.394287109375, 4.5714111328125, 4.74853515625, 4.9256591796875, 5.102783203125, 5.2799072265625, 5.45703125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 6.0, 1.0, 3.0, 10.0, 6.0, 10.0, 12.0, 26.0, 35.0, 43.0, 62.0, 105.0, 160.0, 198.0, 285.0, 428.0, 515.0, 515.0, 490.0, 360.0, 258.0, 158.0, 123.0, 85.0, 56.0, 34.0, 28.0, 17.0, 14.0, 8.0, 9.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.0777587890625, -3.909423828125, -3.7410888671875, -3.57275390625, -3.4044189453125, -3.236083984375, -3.0677490234375, -2.8994140625, -2.7310791015625, -2.562744140625, -2.3944091796875, -2.22607421875, -2.0577392578125, -1.889404296875, -1.7210693359375, -1.552734375, -1.3843994140625, -1.216064453125, -1.0477294921875, -0.87939453125, -0.7110595703125, -0.542724609375, -0.3743896484375, -0.2060546875, -0.0377197265625, 0.130615234375, 0.2989501953125, 0.46728515625, 0.6356201171875, 0.803955078125, 0.9722900390625, 1.140625, 1.3089599609375, 1.477294921875, 1.6456298828125, 1.81396484375, 1.9822998046875, 2.150634765625, 2.3189697265625, 2.4873046875, 2.6556396484375, 2.823974609375, 2.9923095703125, 3.16064453125, 3.3289794921875, 3.497314453125, 3.6656494140625, 3.833984375, 4.0023193359375, 4.170654296875, 4.3389892578125, 4.50732421875, 4.6756591796875, 4.843994140625, 5.0123291015625, 5.1806640625, 5.3489990234375, 5.517333984375, 5.6856689453125, 5.85400390625, 6.0223388671875, 6.190673828125, 6.3590087890625, 6.52734375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 5.0, 10.0, 20.0, 14.0, 33.0, 59.0, 114.0, 187.0, 399.0, 874.0, 2260.0, 7340.0, 47402.0, 545901.0, 2930673.0, 595923.0, 51098.0, 7936.0, 2189.0, 929.0, 426.0, 197.0, 114.0, 71.0, 27.0, 25.0, 14.0, 13.0, 5.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.28125, -12.92724609375, -12.5732421875, -12.21923828125, -11.865234375, -11.51123046875, -11.1572265625, -10.80322265625, -10.44921875, -10.09521484375, -9.7412109375, -9.38720703125, -9.033203125, -8.67919921875, -8.3251953125, -7.97119140625, -7.6171875, -7.26318359375, -6.9091796875, -6.55517578125, -6.201171875, -5.84716796875, -5.4931640625, -5.13916015625, -4.78515625, -4.43115234375, -4.0771484375, -3.72314453125, -3.369140625, -3.01513671875, -2.6611328125, -2.30712890625, -1.953125, -1.59912109375, -1.2451171875, -0.89111328125, -0.537109375, -0.18310546875, 0.1708984375, 0.52490234375, 0.87890625, 1.23291015625, 1.5869140625, 1.94091796875, 2.294921875, 2.64892578125, 3.0029296875, 3.35693359375, 3.7109375, 4.06494140625, 4.4189453125, 4.77294921875, 5.126953125, 5.48095703125, 5.8349609375, 6.18896484375, 6.54296875, 6.89697265625, 7.2509765625, 7.60498046875, 7.958984375, 8.31298828125, 8.6669921875, 9.02099609375, 9.375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 29.0, 60.0, 116.0, 172.0, 195.0, 195.0, 127.0, 66.0, 35.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.501319885253906, -18.86980438232422, -17.23828887939453, -15.606772422790527, -13.97525691986084, -12.343741416931152, -10.712224960327148, -9.080709457397461, -7.449193954467773, -5.817678451538086, -4.18616247177124, -2.5546464920043945, -0.923130989074707, 0.7083845138549805, 2.3399009704589844, 3.971416473388672, 5.602931976318359, 7.234447479248047, 8.865962982177734, 10.497479438781738, 12.128994941711426, 13.760510444641113, 15.392026901245117, 17.023542404174805, 18.655057907104492, 20.28657341003418, 21.918088912963867, 23.549606323242188, 25.181121826171875, 26.812637329101562, 28.44415283203125, 30.075668334960938, 31.707183837890625, 33.33869934082031, 34.97021484375, 36.60173034667969, 38.233245849609375, 39.86476135253906, 41.49627685546875, 43.12779235839844, 44.759307861328125, 46.39082336425781, 48.0223388671875, 49.65385437011719, 51.285369873046875, 52.91688537597656, 54.54840087890625, 56.17991638183594, 57.81143569946289, 59.44295120239258, 61.074466705322266, 62.70598220825195, 64.3375015258789, 65.9690170288086, 67.60053253173828, 69.23204803466797, 70.86356353759766, 72.49507904052734, 74.12659454345703, 75.75811004638672, 77.3896255493164, 79.0211410522461, 80.65265655517578, 82.28417205810547, 83.91568756103516]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 5.0, 4.0, 6.0, 9.0, 12.0, 10.0, 18.0, 18.0, 15.0, 31.0, 33.0, 39.0, 32.0, 43.0, 34.0, 43.0, 36.0, 57.0, 51.0, 36.0, 43.0, 55.0, 46.0, 47.0, 42.0, 50.0, 33.0, 23.0, 25.0, 18.0, 19.0, 14.0, 14.0, 15.0, 5.0, 12.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.6761474609375, -19.113943099975586, -18.551738739013672, -17.98953628540039, -17.427331924438477, -16.865127563476562, -16.30292320251465, -15.74071979522705, -15.178516387939453, -14.616312026977539, -14.054108619689941, -13.491904258728027, -12.92970085144043, -12.367496490478516, -11.805292129516602, -11.243088722229004, -10.68088436126709, -10.118680000305176, -9.556476593017578, -8.994272232055664, -8.432068824768066, -7.869864463806152, -7.3076605796813965, -6.745456695556641, -6.183252811431885, -5.621048927307129, -5.058845043182373, -4.496641159057617, -3.9344370365142822, -3.3722331523895264, -2.8100290298461914, -2.2478251457214355, -1.6856212615966797, -1.1234173774719238, -0.5612133741378784, 0.0009906291961669922, 0.5631945133209229, 1.1253983974456787, 1.6876025199890137, 2.2498064041137695, 2.8120102882385254, 3.3742141723632812, 3.936418056488037, 4.498621940612793, 5.060826301574707, 5.623029708862305, 6.185234069824219, 6.747437953948975, 7.3096418380737305, 7.871845722198486, 8.434049606323242, 8.996253967285156, 9.558457374572754, 10.120661735534668, 10.682865142822266, 11.24506950378418, 11.807273864746094, 12.369478225708008, 12.931681632995605, 13.49388599395752, 14.056089401245117, 14.618293762207031, 15.180498123168945, 15.742701530456543, 16.30490493774414]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 6.0, 10.0, 12.0, 13.0, 10.0, 10.0, 8.0, 22.0, 21.0, 23.0, 23.0, 32.0, 19.0, 37.0, 27.0, 42.0, 42.0, 35.0, 49.0, 42.0, 34.0, 50.0, 32.0, 32.0, 45.0, 40.0, 32.0, 36.0, 25.0, 32.0, 27.0, 23.0, 19.0, 20.0, 12.0, 11.0, 9.0, 11.0, 6.0, 8.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4814453125, -1.43408203125, -1.38671875, -1.33935546875, -1.2919921875, -1.24462890625, -1.197265625, -1.14990234375, -1.1025390625, -1.05517578125, -1.0078125, -0.96044921875, -0.9130859375, -0.86572265625, -0.818359375, -0.77099609375, -0.7236328125, -0.67626953125, -0.62890625, -0.58154296875, -0.5341796875, -0.48681640625, -0.439453125, -0.39208984375, -0.3447265625, -0.29736328125, -0.25, -0.20263671875, -0.1552734375, -0.10791015625, -0.060546875, -0.01318359375, 0.0341796875, 0.08154296875, 0.12890625, 0.17626953125, 0.2236328125, 0.27099609375, 0.318359375, 0.36572265625, 0.4130859375, 0.46044921875, 0.5078125, 0.55517578125, 0.6025390625, 0.64990234375, 0.697265625, 0.74462890625, 0.7919921875, 0.83935546875, 0.88671875, 0.93408203125, 0.9814453125, 1.02880859375, 1.076171875, 1.12353515625, 1.1708984375, 1.21826171875, 1.265625, 1.31298828125, 1.3603515625, 1.40771484375, 1.455078125, 1.50244140625, 1.5498046875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 11.0, 21.0, 35.0, 44.0, 48.0, 106.0, 152.0, 182.0, 320.0, 429.0, 634.0, 903.0, 1419.0, 2168.0, 3210.0, 4762.0, 7137.0, 11067.0, 16886.0, 26647.0, 42740.0, 71202.0, 124937.0, 318715.0, 177901.0, 90630.0, 53568.0, 32721.0, 20625.0, 13295.0, 8719.0, 5739.0, 3736.0, 2652.0, 1711.0, 1153.0, 714.0, 507.0, 346.0, 220.0, 195.0, 109.0, 78.0, 47.0, 35.0, 15.0, 18.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.059967041015625, -0.05813455581665039, -0.05630207061767578, -0.05446958541870117, -0.05263710021972656, -0.05080461502075195, -0.048972129821777344, -0.047139644622802734, -0.045307159423828125, -0.043474674224853516, -0.041642189025878906, -0.0398097038269043, -0.03797721862792969, -0.03614473342895508, -0.03431224822998047, -0.03247976303100586, -0.03064727783203125, -0.02881479263305664, -0.02698230743408203, -0.025149822235107422, -0.023317337036132812, -0.021484851837158203, -0.019652366638183594, -0.017819881439208984, -0.015987396240234375, -0.014154911041259766, -0.012322425842285156, -0.010489940643310547, -0.008657455444335938, -0.006824970245361328, -0.004992485046386719, -0.0031599998474121094, -0.0013275146484375, 0.0005049705505371094, 0.0023374557495117188, 0.004169940948486328, 0.0060024261474609375, 0.007834911346435547, 0.009667396545410156, 0.011499881744384766, 0.013332366943359375, 0.015164852142333984, 0.016997337341308594, 0.018829822540283203, 0.020662307739257812, 0.022494792938232422, 0.02432727813720703, 0.02615976333618164, 0.02799224853515625, 0.02982473373413086, 0.03165721893310547, 0.03348970413208008, 0.03532218933105469, 0.0371546745300293, 0.038987159729003906, 0.040819644927978516, 0.042652130126953125, 0.044484615325927734, 0.046317100524902344, 0.04814958572387695, 0.04998207092285156, 0.05181455612182617, 0.05364704132080078, 0.05547952651977539, 0.05731201171875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 6.0, 13.0, 6.0, 15.0, 12.0, 12.0, 17.0, 18.0, 28.0, 25.0, 20.0, 29.0, 22.0, 22.0, 38.0, 45.0, 49.0, 43.0, 36.0, 1064.0, 41.0, 41.0, 34.0, 50.0, 32.0, 41.0, 30.0, 35.0, 28.0, 22.0, 17.0, 18.0, 10.0, 15.0, 13.0, 12.0, 16.0, 11.0, 12.0, 2.0, 7.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95947265625, -0.9250869750976562, -0.8907012939453125, -0.8563156127929688, -0.821929931640625, -0.7875442504882812, -0.7531585693359375, -0.7187728881835938, -0.68438720703125, -0.6500015258789062, -0.6156158447265625, -0.5812301635742188, -0.546844482421875, -0.5124588012695312, -0.4780731201171875, -0.44368743896484375, -0.4093017578125, -0.37491607666015625, -0.3405303955078125, -0.30614471435546875, -0.271759033203125, -0.23737335205078125, -0.2029876708984375, -0.16860198974609375, -0.13421630859375, -0.09983062744140625, -0.0654449462890625, -0.03105926513671875, 0.003326416015625, 0.03771209716796875, 0.0720977783203125, 0.10648345947265625, 0.140869140625, 0.17525482177734375, 0.2096405029296875, 0.24402618408203125, 0.278411865234375, 0.31279754638671875, 0.3471832275390625, 0.38156890869140625, 0.41595458984375, 0.45034027099609375, 0.4847259521484375, 0.5191116333007812, 0.553497314453125, 0.5878829956054688, 0.6222686767578125, 0.6566543579101562, 0.6910400390625, 0.7254257202148438, 0.7598114013671875, 0.7941970825195312, 0.828582763671875, 0.8629684448242188, 0.8973541259765625, 0.9317398071289062, 0.96612548828125, 1.0005111694335938, 1.0348968505859375, 1.0692825317382812, 1.103668212890625, 1.1380538940429688, 1.1724395751953125, 1.2068252563476562, 1.2412109375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 15.0, 24.0, 29.0, 45.0, 80.0, 121.0, 177.0, 266.0, 411.0, 638.0, 903.0, 1415.0, 2193.0, 3136.0, 4802.0, 7150.0, 10348.0, 15506.0, 23755.0, 37494.0, 63352.0, 117082.0, 1338607.0, 215182.0, 100321.0, 55855.0, 33641.0, 21484.0, 14361.0, 9456.0, 6399.0, 4297.0, 2902.0, 1870.0, 1309.0, 865.0, 556.0, 373.0, 240.0, 154.0, 92.0, 76.0, 43.0, 38.0, 18.0, 14.0, 14.0, 4.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0357666015625, -0.03467893600463867, -0.033591270446777344, -0.032503604888916016, -0.03141593933105469, -0.03032827377319336, -0.02924060821533203, -0.028152942657470703, -0.027065277099609375, -0.025977611541748047, -0.02488994598388672, -0.02380228042602539, -0.022714614868164062, -0.021626949310302734, -0.020539283752441406, -0.019451618194580078, -0.01836395263671875, -0.017276287078857422, -0.016188621520996094, -0.015100955963134766, -0.014013290405273438, -0.01292562484741211, -0.011837959289550781, -0.010750293731689453, -0.009662628173828125, -0.008574962615966797, -0.007487297058105469, -0.006399631500244141, -0.0053119659423828125, -0.004224300384521484, -0.0031366348266601562, -0.002048969268798828, -0.0009613037109375, 0.00012636184692382812, 0.0012140274047851562, 0.0023016929626464844, 0.0033893585205078125, 0.004477024078369141, 0.005564689636230469, 0.006652355194091797, 0.007740020751953125, 0.008827686309814453, 0.009915351867675781, 0.01100301742553711, 0.012090682983398438, 0.013178348541259766, 0.014266014099121094, 0.015353679656982422, 0.01644134521484375, 0.017529010772705078, 0.018616676330566406, 0.019704341888427734, 0.020792007446289062, 0.02187967300415039, 0.02296733856201172, 0.024055004119873047, 0.025142669677734375, 0.026230335235595703, 0.02731800079345703, 0.02840566635131836, 0.029493331909179688, 0.030580997467041016, 0.031668663024902344, 0.03275632858276367, 0.033843994140625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 8.0, 0.0, 14.0, 0.0, 0.0, 12.0, 0.0, 22.0, 0.0, 0.0, 39.0, 0.0, 93.0, 0.0, 660.0, 0.0, 0.0, 68.0, 0.0, 31.0, 0.0, 14.0, 0.0, 0.0, 11.0, 0.0, 9.0, 0.0, 0.0, 5.0, 0.0, 5.0, 0.0, 8.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.497146725654602e-07, -7.245689630508423e-07, -6.994232535362244e-07, -6.742775440216064e-07, -6.491318345069885e-07, -6.239861249923706e-07, -5.988404154777527e-07, -5.736947059631348e-07, -5.485489964485168e-07, -5.234032869338989e-07, -4.98257577419281e-07, -4.731118679046631e-07, -4.4796615839004517e-07, -4.2282044887542725e-07, -3.976747393608093e-07, -3.725290298461914e-07, -3.473833203315735e-07, -3.2223761081695557e-07, -2.9709190130233765e-07, -2.7194619178771973e-07, -2.468004822731018e-07, -2.2165477275848389e-07, -1.9650906324386597e-07, -1.7136335372924805e-07, -1.4621764421463013e-07, -1.210719347000122e-07, -9.592622518539429e-08, -7.078051567077637e-08, -4.563480615615845e-08, -2.0489096641540527e-08, 4.6566128730773926e-09, 2.9802322387695312e-08, 5.494803190231323e-08, 8.009374141693115e-08, 1.0523945093154907e-07, 1.30385160446167e-07, 1.555308699607849e-07, 1.8067657947540283e-07, 2.0582228899002075e-07, 2.3096799850463867e-07, 2.561137080192566e-07, 2.812594175338745e-07, 3.0640512704849243e-07, 3.3155083656311035e-07, 3.5669654607772827e-07, 3.818422555923462e-07, 4.069879651069641e-07, 4.3213367462158203e-07, 4.5727938413619995e-07, 4.824250936508179e-07, 5.075708031654358e-07, 5.327165126800537e-07, 5.578622221946716e-07, 5.830079317092896e-07, 6.081536412239075e-07, 6.332993507385254e-07, 6.584450602531433e-07, 6.835907697677612e-07, 7.087364792823792e-07, 7.338821887969971e-07, 7.59027898311615e-07, 7.841736078262329e-07, 8.093193173408508e-07, 8.344650268554688e-07]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 6.0, 6.0, 7.0, 4.0, 6.0, 4.0, 19.0, 9.0, 12.0, 24.0, 18.0, 20.0, 22.0, 27.0, 41.0, 70.0, 120.0, 265.0, 1235.0, 26455.0, 933804.0, 82270.0, 3215.0, 463.0, 83.0, 101.0, 43.0, 35.0, 21.0, 23.0, 23.0, 14.0, 16.0, 7.0, 5.0, 15.0, 11.0, 9.0, 7.0, 4.0, 5.0, 5.0, 0.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.0907649993896484e-05, -1.0583549737930298e-05, -1.0259449481964111e-05, -9.935349225997925e-06, -9.611248970031738e-06, -9.287148714065552e-06, -8.963048458099365e-06, -8.638948202133179e-06, -8.314847946166992e-06, -7.990747690200806e-06, -7.666647434234619e-06, -7.342547178268433e-06, -7.018446922302246e-06, -6.6943466663360596e-06, -6.370246410369873e-06, -6.0461461544036865e-06, -5.7220458984375e-06, -5.3979456424713135e-06, -5.073845386505127e-06, -4.7497451305389404e-06, -4.425644874572754e-06, -4.101544618606567e-06, -3.777444362640381e-06, -3.4533441066741943e-06, -3.129243850708008e-06, -2.8051435947418213e-06, -2.4810433387756348e-06, -2.1569430828094482e-06, -1.8328428268432617e-06, -1.5087425708770752e-06, -1.1846423149108887e-06, -8.605420589447021e-07, -5.364418029785156e-07, -2.123415470123291e-07, 1.1175870895385742e-07, 4.3585896492004395e-07, 7.599592208862305e-07, 1.084059476852417e-06, 1.4081597328186035e-06, 1.73225998878479e-06, 2.0563602447509766e-06, 2.380460500717163e-06, 2.7045607566833496e-06, 3.028661012649536e-06, 3.3527612686157227e-06, 3.676861524581909e-06, 4.000961780548096e-06, 4.325062036514282e-06, 4.649162292480469e-06, 4.973262548446655e-06, 5.297362804412842e-06, 5.621463060379028e-06, 5.945563316345215e-06, 6.269663572311401e-06, 6.593763828277588e-06, 6.917864084243774e-06, 7.241964340209961e-06, 7.5660645961761475e-06, 7.890164852142334e-06, 8.21426510810852e-06, 8.538365364074707e-06, 8.862465620040894e-06, 9.18656587600708e-06, 9.510666131973267e-06, 9.834766387939453e-06]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 4.0, 0.0, 1.0, 3.0, 4.0, 960.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.201703128117515e-07, -1.1653239084807865e-07, -1.1289446177897844e-07, -1.0925653981530559e-07, -1.0561861785163273e-07, -1.0198068878253252e-07, -9.834276681885967e-08, -9.470484485518682e-08, -9.106691578608661e-08, -8.742899382241376e-08, -8.379106475331355e-08, -8.01531427896407e-08, -7.651522082596784e-08, -7.287729175686763e-08, -6.923936979319478e-08, -6.560144072409457e-08, -6.196351876042172e-08, -5.832559324403519e-08, -5.468767128036234e-08, -5.104974576397581e-08, -4.7411820247589276e-08, -4.3773894731202745e-08, -4.013597276752989e-08, -3.649804725114336e-08, -3.286012884018419e-08, -2.9222205100154497e-08, -2.5584279583767966e-08, -2.1946355843738274e-08, -1.8308430327351743e-08, -1.4670506587322052e-08, -1.103258284729236e-08, -7.3946573309058294e-09, -3.7567318145192985e-09, -1.1880740835579218e-10, 3.519116997807714e-09, 7.1570411819266155e-09, 1.0794965810134727e-08, 1.4432890438342838e-08, 1.807081417837253e-08, 2.170873969475906e-08, 2.5346663434788752e-08, 2.8984587174818444e-08, 3.2622512691204975e-08, 3.6260438207591505e-08, 3.989836017126436e-08, 4.353628568765089e-08, 4.717421120403742e-08, 5.081213316771027e-08, 5.44500586840968e-08, 5.8087984200483334e-08, 6.172590616415619e-08, 6.53638352332564e-08, 6.900175719692925e-08, 7.26396791606021e-08, 7.627760112427495e-08, 7.991553019337516e-08, 8.355345215704801e-08, 8.719137412072087e-08, 9.082930318982108e-08, 9.446722515349393e-08, 9.810514711716678e-08, 1.0174307618626699e-07, 1.0538099814993984e-07, 1.0901892721904005e-07, 1.126568491827129e-07]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 960.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.1920928955078125e-07, -1.1548399925231934e-07, -1.1175870895385742e-07, -1.0803341865539551e-07, -1.043081283569336e-07, -1.0058283805847168e-07, -9.685754776000977e-08, -9.313225746154785e-08, -8.940696716308594e-08, -8.568167686462402e-08, -8.195638656616211e-08, -7.82310962677002e-08, -7.450580596923828e-08, -7.078051567077637e-08, -6.705522537231445e-08, -6.332993507385254e-08, -5.960464477539063e-08, -5.587935447692871e-08, -5.21540641784668e-08, -4.842877388000488e-08, -4.470348358154297e-08, -4.0978193283081055e-08, -3.725290298461914e-08, -3.3527612686157227e-08, -2.9802322387695312e-08, -2.60770320892334e-08, -2.2351741790771484e-08, -1.862645149230957e-08, -1.4901161193847656e-08, -1.1175870895385742e-08, -7.450580596923828e-09, -3.725290298461914e-09, 0.0, 3.725290298461914e-09, 7.450580596923828e-09, 1.1175870895385742e-08, 1.4901161193847656e-08, 1.862645149230957e-08, 2.2351741790771484e-08, 2.60770320892334e-08, 2.9802322387695312e-08, 3.3527612686157227e-08, 3.725290298461914e-08, 4.0978193283081055e-08, 4.470348358154297e-08, 4.842877388000488e-08, 5.21540641784668e-08, 5.587935447692871e-08, 5.960464477539063e-08, 6.332993507385254e-08, 6.705522537231445e-08, 7.078051567077637e-08, 7.450580596923828e-08, 7.82310962677002e-08, 8.195638656616211e-08, 8.568167686462402e-08, 8.940696716308594e-08, 9.313225746154785e-08, 9.685754776000977e-08, 1.0058283805847168e-07, 1.043081283569336e-07, 1.0803341865539551e-07, 1.1175870895385742e-07, 1.1548399925231934e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 6.0, 10.0, 12.0, 13.0, 10.0, 10.0, 8.0, 22.0, 21.0, 23.0, 23.0, 32.0, 19.0, 37.0, 27.0, 42.0, 42.0, 35.0, 49.0, 42.0, 34.0, 50.0, 32.0, 32.0, 45.0, 40.0, 32.0, 36.0, 25.0, 32.0, 27.0, 23.0, 19.0, 20.0, 12.0, 11.0, 9.0, 11.0, 6.0, 8.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4814453125, -1.43408203125, -1.38671875, -1.33935546875, -1.2919921875, -1.24462890625, -1.197265625, -1.14990234375, -1.1025390625, -1.05517578125, -1.0078125, -0.96044921875, -0.9130859375, -0.86572265625, -0.818359375, -0.77099609375, -0.7236328125, -0.67626953125, -0.62890625, -0.58154296875, -0.5341796875, -0.48681640625, -0.439453125, -0.39208984375, -0.3447265625, -0.29736328125, -0.25, -0.20263671875, -0.1552734375, -0.10791015625, -0.060546875, -0.01318359375, 0.0341796875, 0.08154296875, 0.12890625, 0.17626953125, 0.2236328125, 0.27099609375, 0.318359375, 0.36572265625, 0.4130859375, 0.46044921875, 0.5078125, 0.55517578125, 0.6025390625, 0.64990234375, 0.697265625, 0.74462890625, 0.7919921875, 0.83935546875, 0.88671875, 0.93408203125, 0.9814453125, 1.02880859375, 1.076171875, 1.12353515625, 1.1708984375, 1.21826171875, 1.265625, 1.31298828125, 1.3603515625, 1.40771484375, 1.455078125, 1.50244140625, 1.5498046875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 7.0, 9.0, 15.0, 28.0, 30.0, 38.0, 49.0, 87.0, 145.0, 166.0, 262.0, 400.0, 607.0, 1061.0, 1541.0, 2446.0, 4109.0, 6926.0, 11650.0, 20730.0, 38468.0, 77977.0, 172716.0, 315083.0, 203008.0, 90613.0, 44450.0, 23185.0, 13077.0, 7461.0, 4490.0, 2779.0, 1708.0, 1064.0, 725.0, 477.0, 309.0, 207.0, 139.0, 94.0, 63.0, 43.0, 33.0, 15.0, 11.0, 17.0, 7.0, 7.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.8125, -1.7551422119140625, -1.697784423828125, -1.6404266357421875, -1.58306884765625, -1.5257110595703125, -1.468353271484375, -1.4109954833984375, -1.3536376953125, -1.2962799072265625, -1.238922119140625, -1.1815643310546875, -1.12420654296875, -1.0668487548828125, -1.009490966796875, -0.9521331787109375, -0.894775390625, -0.8374176025390625, -0.780059814453125, -0.7227020263671875, -0.66534423828125, -0.6079864501953125, -0.550628662109375, -0.4932708740234375, -0.4359130859375, -0.3785552978515625, -0.321197509765625, -0.2638397216796875, -0.20648193359375, -0.1491241455078125, -0.091766357421875, -0.0344085693359375, 0.02294921875, 0.0803070068359375, 0.137664794921875, 0.1950225830078125, 0.25238037109375, 0.3097381591796875, 0.367095947265625, 0.4244537353515625, 0.4818115234375, 0.5391693115234375, 0.596527099609375, 0.6538848876953125, 0.71124267578125, 0.7686004638671875, 0.825958251953125, 0.8833160400390625, 0.940673828125, 0.9980316162109375, 1.055389404296875, 1.1127471923828125, 1.17010498046875, 1.2274627685546875, 1.284820556640625, 1.3421783447265625, 1.3995361328125, 1.4568939208984375, 1.514251708984375, 1.5716094970703125, 1.62896728515625, 1.6863250732421875, 1.743682861328125, 1.8010406494140625, 1.8583984375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 6.0, 10.0, 11.0, 15.0, 28.0, 37.0, 37.0, 41.0, 54.0, 58.0, 74.0, 121.0, 288.0, 1618.0, 171.0, 88.0, 59.0, 73.0, 57.0, 54.0, 36.0, 30.0, 18.0, 14.0, 14.0, 7.0, 5.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.640625, -8.40240478515625, -8.1641845703125, -7.92596435546875, -7.687744140625, -7.44952392578125, -7.2113037109375, -6.97308349609375, -6.73486328125, -6.49664306640625, -6.2584228515625, -6.02020263671875, -5.781982421875, -5.54376220703125, -5.3055419921875, -5.06732177734375, -4.8291015625, -4.59088134765625, -4.3526611328125, -4.11444091796875, -3.876220703125, -3.63800048828125, -3.3997802734375, -3.16156005859375, -2.92333984375, -2.68511962890625, -2.4468994140625, -2.20867919921875, -1.970458984375, -1.73223876953125, -1.4940185546875, -1.25579833984375, -1.017578125, -0.77935791015625, -0.5411376953125, -0.30291748046875, -0.064697265625, 0.17352294921875, 0.4117431640625, 0.64996337890625, 0.88818359375, 1.12640380859375, 1.3646240234375, 1.60284423828125, 1.841064453125, 2.07928466796875, 2.3175048828125, 2.55572509765625, 2.7939453125, 3.03216552734375, 3.2703857421875, 3.50860595703125, 3.746826171875, 3.98504638671875, 4.2232666015625, 4.46148681640625, 4.69970703125, 4.93792724609375, 5.1761474609375, 5.41436767578125, 5.652587890625, 5.89080810546875, 6.1290283203125, 6.36724853515625, 6.60546875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 6.0, 2.0, 11.0, 9.0, 7.0, 22.0, 32.0, 35.0, 55.0, 80.0, 156.0, 364.0, 1128.0, 5759.0, 48052.0, 2373578.0, 685991.0, 25445.0, 3592.0, 722.0, 284.0, 132.0, 82.0, 49.0, 22.0, 32.0, 17.0, 12.0, 8.0, 8.0, 4.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390625, -8.0662841796875, -7.741943359375, -7.4176025390625, -7.09326171875, -6.7689208984375, -6.444580078125, -6.1202392578125, -5.7958984375, -5.4715576171875, -5.147216796875, -4.8228759765625, -4.49853515625, -4.1741943359375, -3.849853515625, -3.5255126953125, -3.201171875, -2.8768310546875, -2.552490234375, -2.2281494140625, -1.90380859375, -1.5794677734375, -1.255126953125, -0.9307861328125, -0.6064453125, -0.2821044921875, 0.042236328125, 0.3665771484375, 0.69091796875, 1.0152587890625, 1.339599609375, 1.6639404296875, 1.98828125, 2.3126220703125, 2.636962890625, 2.9613037109375, 3.28564453125, 3.6099853515625, 3.934326171875, 4.2586669921875, 4.5830078125, 4.9073486328125, 5.231689453125, 5.5560302734375, 5.88037109375, 6.2047119140625, 6.529052734375, 6.8533935546875, 7.177734375, 7.5020751953125, 7.826416015625, 8.1507568359375, 8.47509765625, 8.7994384765625, 9.123779296875, 9.4481201171875, 9.7724609375, 10.0968017578125, 10.421142578125, 10.7454833984375, 11.06982421875, 11.3941650390625, 11.718505859375, 12.0428466796875, 12.3671875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [5.0, 37.0, 331.0, 473.0, 151.0, 19.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.411599159240723, -4.450282096862793, -2.4889652729034424, -0.5276484489440918, 1.433668613433838, 3.3949851989746094, 5.356302261352539, 7.317619323730469, 9.278936386108398, 11.240253448486328, 13.201570510864258, 15.162887573242188, 17.124204635620117, 19.085521697998047, 21.046836853027344, 23.008155822753906, 24.969470977783203, 26.930788040161133, 28.892105102539062, 30.853422164916992, 32.81473922729492, 34.77605438232422, 36.73737335205078, 38.69868850708008, 40.66000747680664, 42.62132263183594, 44.5826416015625, 46.5439567565918, 48.50527572631836, 50.466590881347656, 52.42790985107422, 54.389225006103516, 56.35054397583008, 58.311859130859375, 60.27317810058594, 62.234493255615234, 64.19580841064453, 66.1571273803711, 68.11844635009766, 70.07976531982422, 72.04107666015625, 74.00239562988281, 75.96370697021484, 77.9250259399414, 79.88634490966797, 81.84766387939453, 83.80897521972656, 85.77029418945312, 87.73161315917969, 89.69293212890625, 91.65424346923828, 93.61556243896484, 95.5768814086914, 97.53820037841797, 99.49951171875, 101.46083068847656, 103.42214965820312, 105.38346862792969, 107.34477996826172, 109.30609893798828, 111.26741790771484, 113.2287368774414, 115.19004821777344, 117.1513671875, 119.11268615722656]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 6.0, 7.0, 10.0, 12.0, 11.0, 13.0, 20.0, 25.0, 14.0, 18.0, 22.0, 40.0, 37.0, 38.0, 44.0, 29.0, 53.0, 44.0, 58.0, 43.0, 43.0, 45.0, 36.0, 25.0, 36.0, 31.0, 31.0, 30.0, 25.0, 32.0, 14.0, 19.0, 19.0, 12.0, 15.0, 11.0, 7.0, 5.0, 4.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.878488540649414, -17.288463592529297, -16.698440551757812, -16.108415603637695, -15.518391609191895, -14.928367614746094, -14.338342666625977, -13.748318672180176, -13.158294677734375, -12.568270683288574, -11.978246688842773, -11.388221740722656, -10.798197746276855, -10.208173751831055, -9.618148803710938, -9.028124809265137, -8.438100814819336, -7.848076820373535, -7.258052349090576, -6.668027877807617, -6.078003883361816, -5.487979888916016, -4.897955417633057, -4.307930946350098, -3.717906951904297, -3.127882719039917, -2.537858486175537, -1.9478342533111572, -1.3578100204467773, -0.7677857875823975, -0.17776155471801758, 0.4122629165649414, 1.002288818359375, 1.5923130512237549, 2.1823372840881348, 2.7723615169525146, 3.3623857498168945, 3.9524099826812744, 4.542434215545654, 5.132458686828613, 5.722482681274414, 6.312506675720215, 6.902531147003174, 7.492555618286133, 8.082579612731934, 8.672603607177734, 9.262628555297852, 9.852652549743652, 10.442676544189453, 11.032700538635254, 11.622724533081055, 12.212749481201172, 12.802773475646973, 13.392797470092773, 13.98282241821289, 14.572846412658691, 15.162870407104492, 15.752894401550293, 16.342918395996094, 16.93294334411621, 17.522968292236328, 18.112991333007812, 18.70301628112793, 19.293041229248047, 19.88306427001953]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 11.0, 10.0, 12.0, 11.0, 8.0, 22.0, 21.0, 20.0, 27.0, 24.0, 27.0, 30.0, 31.0, 41.0, 51.0, 45.0, 34.0, 49.0, 41.0, 34.0, 37.0, 45.0, 37.0, 38.0, 34.0, 30.0, 29.0, 30.0, 24.0, 22.0, 20.0, 19.0, 13.0, 14.0, 9.0, 8.0, 5.0, 10.0, 2.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5283203125, -1.479248046875, -1.43017578125, -1.381103515625, -1.33203125, -1.282958984375, -1.23388671875, -1.184814453125, -1.1357421875, -1.086669921875, -1.03759765625, -0.988525390625, -0.939453125, -0.890380859375, -0.84130859375, -0.792236328125, -0.7431640625, -0.694091796875, -0.64501953125, -0.595947265625, -0.546875, -0.497802734375, -0.44873046875, -0.399658203125, -0.3505859375, -0.301513671875, -0.25244140625, -0.203369140625, -0.154296875, -0.105224609375, -0.05615234375, -0.007080078125, 0.0419921875, 0.091064453125, 0.14013671875, 0.189208984375, 0.23828125, 0.287353515625, 0.33642578125, 0.385498046875, 0.4345703125, 0.483642578125, 0.53271484375, 0.581787109375, 0.630859375, 0.679931640625, 0.72900390625, 0.778076171875, 0.8271484375, 0.876220703125, 0.92529296875, 0.974365234375, 1.0234375, 1.072509765625, 1.12158203125, 1.170654296875, 1.2197265625, 1.268798828125, 1.31787109375, 1.366943359375, 1.416015625, 1.465087890625, 1.51416015625, 1.563232421875, 1.6123046875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 5.0, 4.0, 15.0, 14.0, 20.0, 22.0, 43.0, 59.0, 89.0, 147.0, 213.0, 284.0, 647.0, 1194.0, 2726.0, 6595.0, 18126.0, 52425.0, 159298.0, 517650.0, 1582487.0, 1276113.0, 389440.0, 121719.0, 40566.0, 14326.0, 5406.0, 2214.0, 1058.0, 520.0, 287.0, 170.0, 101.0, 89.0, 52.0, 42.0, 23.0, 15.0, 14.0, 15.0, 8.0, 8.0, 10.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.3515625, -3.2496337890625, -3.147705078125, -3.0457763671875, -2.94384765625, -2.8419189453125, -2.739990234375, -2.6380615234375, -2.5361328125, -2.4342041015625, -2.332275390625, -2.2303466796875, -2.12841796875, -2.0264892578125, -1.924560546875, -1.8226318359375, -1.720703125, -1.6187744140625, -1.516845703125, -1.4149169921875, -1.31298828125, -1.2110595703125, -1.109130859375, -1.0072021484375, -0.9052734375, -0.8033447265625, -0.701416015625, -0.5994873046875, -0.49755859375, -0.3956298828125, -0.293701171875, -0.1917724609375, -0.08984375, 0.0120849609375, 0.114013671875, 0.2159423828125, 0.31787109375, 0.4197998046875, 0.521728515625, 0.6236572265625, 0.7255859375, 0.8275146484375, 0.929443359375, 1.0313720703125, 1.13330078125, 1.2352294921875, 1.337158203125, 1.4390869140625, 1.541015625, 1.6429443359375, 1.744873046875, 1.8468017578125, 1.94873046875, 2.0506591796875, 2.152587890625, 2.2545166015625, 2.3564453125, 2.4583740234375, 2.560302734375, 2.6622314453125, 2.76416015625, 2.8660888671875, 2.968017578125, 3.0699462890625, 3.171875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 3.0, 5.0, 7.0, 17.0, 28.0, 43.0, 53.0, 77.0, 137.0, 239.0, 311.0, 463.0, 631.0, 574.0, 510.0, 304.0, 201.0, 165.0, 114.0, 65.0, 61.0, 21.0, 15.0, 12.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.125, -8.91754150390625, -8.7100830078125, -8.50262451171875, -8.295166015625, -8.08770751953125, -7.8802490234375, -7.67279052734375, -7.46533203125, -7.25787353515625, -7.0504150390625, -6.84295654296875, -6.635498046875, -6.42803955078125, -6.2205810546875, -6.01312255859375, -5.8056640625, -5.59820556640625, -5.3907470703125, -5.18328857421875, -4.975830078125, -4.76837158203125, -4.5609130859375, -4.35345458984375, -4.14599609375, -3.93853759765625, -3.7310791015625, -3.52362060546875, -3.316162109375, -3.10870361328125, -2.9012451171875, -2.69378662109375, -2.486328125, -2.27886962890625, -2.0714111328125, -1.86395263671875, -1.656494140625, -1.44903564453125, -1.2415771484375, -1.03411865234375, -0.82666015625, -0.61920166015625, -0.4117431640625, -0.20428466796875, 0.003173828125, 0.21063232421875, 0.4180908203125, 0.62554931640625, 0.8330078125, 1.04046630859375, 1.2479248046875, 1.45538330078125, 1.662841796875, 1.87030029296875, 2.0777587890625, 2.28521728515625, 2.49267578125, 2.70013427734375, 2.9075927734375, 3.11505126953125, 3.322509765625, 3.52996826171875, 3.7374267578125, 3.94488525390625, 4.15234375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 2.0, 3.0, 8.0, 6.0, 18.0, 18.0, 39.0, 67.0, 83.0, 152.0, 275.0, 479.0, 966.0, 2158.0, 6373.0, 27254.0, 165921.0, 1086521.0, 2302544.0, 504634.0, 75638.0, 14087.0, 3915.0, 1467.0, 747.0, 385.0, 199.0, 121.0, 77.0, 60.0, 27.0, 15.0, 9.0, 4.0, 7.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.27734375, -7.00054931640625, -6.7237548828125, -6.44696044921875, -6.170166015625, -5.89337158203125, -5.6165771484375, -5.33978271484375, -5.06298828125, -4.78619384765625, -4.5093994140625, -4.23260498046875, -3.955810546875, -3.67901611328125, -3.4022216796875, -3.12542724609375, -2.8486328125, -2.57183837890625, -2.2950439453125, -2.01824951171875, -1.741455078125, -1.46466064453125, -1.1878662109375, -0.91107177734375, -0.63427734375, -0.35748291015625, -0.0806884765625, 0.19610595703125, 0.472900390625, 0.74969482421875, 1.0264892578125, 1.30328369140625, 1.580078125, 1.85687255859375, 2.1336669921875, 2.41046142578125, 2.687255859375, 2.96405029296875, 3.2408447265625, 3.51763916015625, 3.79443359375, 4.07122802734375, 4.3480224609375, 4.62481689453125, 4.901611328125, 5.17840576171875, 5.4552001953125, 5.73199462890625, 6.0087890625, 6.28558349609375, 6.5623779296875, 6.83917236328125, 7.115966796875, 7.39276123046875, 7.6695556640625, 7.94635009765625, 8.22314453125, 8.49993896484375, 8.7767333984375, 9.05352783203125, 9.330322265625, 9.60711669921875, 9.8839111328125, 10.16070556640625, 10.4375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 15.0, 27.0, 41.0, 50.0, 85.0, 81.0, 109.0, 96.0, 115.0, 101.0, 76.0, 67.0, 51.0, 36.0, 24.0, 12.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.560035705566406, -31.597412109375, -30.634788513183594, -29.672164916992188, -28.70954132080078, -27.746917724609375, -26.78429412841797, -25.82166862487793, -24.859045028686523, -23.896421432495117, -22.93379783630371, -21.971174240112305, -21.0085506439209, -20.04592514038086, -19.083301544189453, -18.120677947998047, -17.15805435180664, -16.195430755615234, -15.232807159423828, -14.270183563232422, -13.3075590133667, -12.344935417175293, -11.382311820983887, -10.419687271118164, -9.45706558227539, -8.494441986083984, -7.53181791305542, -6.569194316864014, -5.606570243835449, -4.643946647644043, -3.6813230514526367, -2.7186989784240723, -1.7560749053955078, -0.7934511303901672, 0.16917264461517334, 1.1317963600158691, 2.0944201946258545, 3.05704402923584, 4.019667625427246, 4.9822916984558105, 5.944915294647217, 6.907538890838623, 7.8701629638671875, 8.832786560058594, 9.79541015625, 10.758033752441406, 11.720657348632812, 12.683281898498535, 13.645905494689941, 14.608529090881348, 15.571152687072754, 16.533777236938477, 17.496400833129883, 18.45902442932129, 19.421648025512695, 20.3842716217041, 21.346895217895508, 22.309518814086914, 23.27214241027832, 24.234766006469727, 25.197389602661133, 26.160015106201172, 27.122638702392578, 28.085262298583984, 29.04788589477539]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 9.0, 9.0, 9.0, 11.0, 6.0, 15.0, 17.0, 20.0, 25.0, 22.0, 42.0, 38.0, 41.0, 36.0, 25.0, 39.0, 53.0, 41.0, 45.0, 47.0, 40.0, 43.0, 36.0, 44.0, 34.0, 21.0, 33.0, 25.0, 22.0, 23.0, 11.0, 28.0, 12.0, 11.0, 10.0, 8.0, 10.0, 12.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.71459197998047, -16.211467742919922, -15.708341598510742, -15.205217361450195, -14.702092170715332, -14.198966979980469, -13.695842742919922, -13.192717552185059, -12.689592361450195, -12.186467170715332, -11.683341979980469, -11.180217742919922, -10.677092552185059, -10.173967361450195, -9.670843124389648, -9.167717933654785, -8.664592742919922, -8.161467552185059, -7.6583428382873535, -7.155218124389648, -6.652092933654785, -6.148967742919922, -5.645843029022217, -5.142718315124512, -4.639593124389648, -4.136467933654785, -3.63334321975708, -3.130218267440796, -2.6270933151245117, -2.1239683628082275, -1.6208434104919434, -1.1177184581756592, -0.614593505859375, -0.11146855354309082, 0.39165639877319336, 0.8947813510894775, 1.3979063034057617, 1.901031255722046, 2.40415620803833, 2.9072811603546143, 3.4104061126708984, 3.9135310649871826, 4.416656017303467, 4.919780731201172, 5.422905921936035, 5.926031112670898, 6.4291558265686035, 6.932280540466309, 7.435405731201172, 7.938530921936035, 8.441656112670898, 8.944780349731445, 9.447905540466309, 9.951030731201172, 10.454154968261719, 10.957280158996582, 11.460405349731445, 11.963530540466309, 12.466655731201172, 12.969779968261719, 13.472905158996582, 13.976030349731445, 14.479154586791992, 14.982279777526855, 15.485404968261719]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 3.0, 5.0, 8.0, 1.0, 11.0, 12.0, 12.0, 13.0, 12.0, 16.0, 17.0, 26.0, 23.0, 34.0, 22.0, 25.0, 40.0, 35.0, 44.0, 41.0, 42.0, 34.0, 35.0, 47.0, 39.0, 38.0, 37.0, 30.0, 34.0, 33.0, 25.0, 34.0, 27.0, 20.0, 22.0, 23.0, 15.0, 11.0, 16.0, 11.0, 11.0, 9.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4697265625, -1.4201812744140625, -1.370635986328125, -1.3210906982421875, -1.27154541015625, -1.2220001220703125, -1.172454833984375, -1.1229095458984375, -1.0733642578125, -1.0238189697265625, -0.974273681640625, -0.9247283935546875, -0.87518310546875, -0.8256378173828125, -0.776092529296875, -0.7265472412109375, -0.677001953125, -0.6274566650390625, -0.577911376953125, -0.5283660888671875, -0.47882080078125, -0.4292755126953125, -0.379730224609375, -0.3301849365234375, -0.2806396484375, -0.2310943603515625, -0.181549072265625, -0.1320037841796875, -0.08245849609375, -0.0329132080078125, 0.016632080078125, 0.0661773681640625, 0.11572265625, 0.1652679443359375, 0.214813232421875, 0.2643585205078125, 0.31390380859375, 0.3634490966796875, 0.412994384765625, 0.4625396728515625, 0.5120849609375, 0.5616302490234375, 0.611175537109375, 0.6607208251953125, 0.71026611328125, 0.7598114013671875, 0.809356689453125, 0.8589019775390625, 0.908447265625, 0.9579925537109375, 1.007537841796875, 1.0570831298828125, 1.10662841796875, 1.1561737060546875, 1.205718994140625, 1.2552642822265625, 1.3048095703125, 1.3543548583984375, 1.403900146484375, 1.4534454345703125, 1.50299072265625, 1.5525360107421875, 1.602081298828125, 1.6516265869140625, 1.701171875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 8.0, 6.0, 8.0, 12.0, 31.0, 26.0, 47.0, 105.0, 111.0, 188.0, 287.0, 375.0, 601.0, 861.0, 1337.0, 1859.0, 2885.0, 4318.0, 6399.0, 9824.0, 14743.0, 22472.0, 34840.0, 55677.0, 95570.0, 188884.0, 290990.0, 124324.0, 70098.0, 42476.0, 26887.0, 17550.0, 11531.0, 7609.0, 5129.0, 3418.0, 2289.0, 1540.0, 1052.0, 748.0, 468.0, 356.0, 190.0, 140.0, 124.0, 59.0, 35.0, 34.0, 18.0, 11.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061309814453125, -0.05934572219848633, -0.057381629943847656, -0.055417537689208984, -0.05345344543457031, -0.05148935317993164, -0.04952526092529297, -0.0475611686706543, -0.045597076416015625, -0.04363298416137695, -0.04166889190673828, -0.03970479965209961, -0.03774070739746094, -0.035776615142822266, -0.033812522888183594, -0.03184843063354492, -0.02988433837890625, -0.027920246124267578, -0.025956153869628906, -0.023992061614990234, -0.022027969360351562, -0.02006387710571289, -0.01809978485107422, -0.016135692596435547, -0.014171600341796875, -0.012207508087158203, -0.010243415832519531, -0.00827932357788086, -0.0063152313232421875, -0.004351139068603516, -0.0023870468139648438, -0.0004229545593261719, 0.0015411376953125, 0.003505229949951172, 0.005469322204589844, 0.007433414459228516, 0.009397506713867188, 0.01136159896850586, 0.013325691223144531, 0.015289783477783203, 0.017253875732421875, 0.019217967987060547, 0.02118206024169922, 0.02314615249633789, 0.025110244750976562, 0.027074337005615234, 0.029038429260253906, 0.031002521514892578, 0.03296661376953125, 0.03493070602416992, 0.036894798278808594, 0.038858890533447266, 0.04082298278808594, 0.04278707504272461, 0.04475116729736328, 0.04671525955200195, 0.048679351806640625, 0.0506434440612793, 0.05260753631591797, 0.05457162857055664, 0.05653572082519531, 0.058499813079833984, 0.060463905334472656, 0.06242799758911133, 0.06439208984375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 7.0, 11.0, 6.0, 17.0, 9.0, 22.0, 16.0, 21.0, 23.0, 23.0, 28.0, 27.0, 41.0, 33.0, 32.0, 41.0, 33.0, 40.0, 41.0, 1070.0, 37.0, 39.0, 45.0, 41.0, 33.0, 39.0, 28.0, 27.0, 28.0, 23.0, 19.0, 28.0, 17.0, 15.0, 9.0, 7.0, 5.0, 9.0, 8.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0869140625, -1.051025390625, -1.01513671875, -0.979248046875, -0.943359375, -0.907470703125, -0.87158203125, -0.835693359375, -0.7998046875, -0.763916015625, -0.72802734375, -0.692138671875, -0.65625, -0.620361328125, -0.58447265625, -0.548583984375, -0.5126953125, -0.476806640625, -0.44091796875, -0.405029296875, -0.369140625, -0.333251953125, -0.29736328125, -0.261474609375, -0.2255859375, -0.189697265625, -0.15380859375, -0.117919921875, -0.08203125, -0.046142578125, -0.01025390625, 0.025634765625, 0.0615234375, 0.097412109375, 0.13330078125, 0.169189453125, 0.205078125, 0.240966796875, 0.27685546875, 0.312744140625, 0.3486328125, 0.384521484375, 0.42041015625, 0.456298828125, 0.4921875, 0.528076171875, 0.56396484375, 0.599853515625, 0.6357421875, 0.671630859375, 0.70751953125, 0.743408203125, 0.779296875, 0.815185546875, 0.85107421875, 0.886962890625, 0.9228515625, 0.958740234375, 0.99462890625, 1.030517578125, 1.06640625, 1.102294921875, 1.13818359375, 1.174072265625, 1.2099609375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 9.0, 11.0, 14.0, 24.0, 43.0, 44.0, 90.0, 115.0, 150.0, 245.0, 358.0, 508.0, 738.0, 1147.0, 1622.0, 2384.0, 3600.0, 5143.0, 7538.0, 11223.0, 16888.0, 25581.0, 39511.0, 65200.0, 114417.0, 1320174.0, 210756.0, 102100.0, 59030.0, 36829.0, 23480.0, 15463.0, 10489.0, 7125.0, 4889.0, 3247.0, 2184.0, 1475.0, 1008.0, 746.0, 519.0, 319.0, 223.0, 165.0, 111.0, 70.0, 44.0, 33.0, 18.0, 20.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0], "bins": [-0.03485107421875, -0.03379201889038086, -0.03273296356201172, -0.03167390823364258, -0.030614852905273438, -0.029555797576904297, -0.028496742248535156, -0.027437686920166016, -0.026378631591796875, -0.025319576263427734, -0.024260520935058594, -0.023201465606689453, -0.022142410278320312, -0.021083354949951172, -0.02002429962158203, -0.01896524429321289, -0.01790618896484375, -0.01684713363647461, -0.01578807830810547, -0.014729022979736328, -0.013669967651367188, -0.012610912322998047, -0.011551856994628906, -0.010492801666259766, -0.009433746337890625, -0.008374691009521484, -0.007315635681152344, -0.006256580352783203, -0.0051975250244140625, -0.004138469696044922, -0.0030794143676757812, -0.0020203590393066406, -0.0009613037109375, 9.775161743164062e-05, 0.0011568069458007812, 0.002215862274169922, 0.0032749176025390625, 0.004333972930908203, 0.005393028259277344, 0.006452083587646484, 0.007511138916015625, 0.008570194244384766, 0.009629249572753906, 0.010688304901123047, 0.011747360229492188, 0.012806415557861328, 0.013865470886230469, 0.01492452621459961, 0.01598358154296875, 0.01704263687133789, 0.01810169219970703, 0.019160747528076172, 0.020219802856445312, 0.021278858184814453, 0.022337913513183594, 0.023396968841552734, 0.024456024169921875, 0.025515079498291016, 0.026574134826660156, 0.027633190155029297, 0.028692245483398438, 0.029751300811767578, 0.03081035614013672, 0.03186941146850586, 0.032928466796875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 0.0, 13.0, 11.0, 10.0, 0.0, 14.0, 22.0, 33.0, 0.0, 77.0, 625.0, 90.0, 0.0, 27.0, 21.0, 10.0, 10.0, 0.0, 8.0, 11.0, 5.0, 0.0, 2.0, 1.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2060627341270447e-06, -1.1604279279708862e-06, -1.1147931218147278e-06, -1.0691583156585693e-06, -1.0235235095024109e-06, -9.778887033462524e-07, -9.32253897190094e-07, -8.866190910339355e-07, -8.409842848777771e-07, -7.953494787216187e-07, -7.497146725654602e-07, -7.040798664093018e-07, -6.584450602531433e-07, -6.128102540969849e-07, -5.671754479408264e-07, -5.21540641784668e-07, -4.759058356285095e-07, -4.302710294723511e-07, -3.8463622331619263e-07, -3.390014171600342e-07, -2.9336661100387573e-07, -2.477318048477173e-07, -2.0209699869155884e-07, -1.564621925354004e-07, -1.1082738637924194e-07, -6.51925802230835e-08, -1.955777406692505e-08, 2.60770320892334e-08, 7.171183824539185e-08, 1.1734664440155029e-07, 1.6298145055770874e-07, 2.086162567138672e-07, 2.5425106287002563e-07, 2.998858690261841e-07, 3.4552067518234253e-07, 3.91155481338501e-07, 4.367902874946594e-07, 4.824250936508179e-07, 5.280598998069763e-07, 5.736947059631348e-07, 6.193295121192932e-07, 6.649643182754517e-07, 7.105991244316101e-07, 7.562339305877686e-07, 8.01868736743927e-07, 8.475035429000854e-07, 8.931383490562439e-07, 9.387731552124023e-07, 9.844079613685608e-07, 1.0300427675247192e-06, 1.0756775736808777e-06, 1.1213123798370361e-06, 1.1669471859931946e-06, 1.212581992149353e-06, 1.2582167983055115e-06, 1.30385160446167e-06, 1.3494864106178284e-06, 1.3951212167739868e-06, 1.4407560229301453e-06, 1.4863908290863037e-06, 1.5320256352424622e-06, 1.5776604413986206e-06, 1.623295247554779e-06, 1.6689300537109375e-06]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 7.0, 2.0, 2.0, 4.0, 6.0, 10.0, 26.0, 32.0, 43.0, 46.0, 96.0, 262.0, 2313.0, 983330.0, 61176.0, 795.0, 176.0, 63.0, 37.0, 29.0, 23.0, 31.0, 12.0, 8.0, 9.0, 5.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.6881694793701172e-05, -2.6131048798561096e-05, -2.538040280342102e-05, -2.4629756808280945e-05, -2.387911081314087e-05, -2.3128464818000793e-05, -2.2377818822860718e-05, -2.1627172827720642e-05, -2.0876526832580566e-05, -2.012588083744049e-05, -1.9375234842300415e-05, -1.862458884716034e-05, -1.7873942852020264e-05, -1.7123296856880188e-05, -1.6372650861740112e-05, -1.5622004866600037e-05, -1.4871358871459961e-05, -1.4120712876319885e-05, -1.337006688117981e-05, -1.2619420886039734e-05, -1.1868774890899658e-05, -1.1118128895759583e-05, -1.0367482900619507e-05, -9.616836905479431e-06, -8.866190910339355e-06, -8.11554491519928e-06, -7.364898920059204e-06, -6.614252924919128e-06, -5.863606929779053e-06, -5.112960934638977e-06, -4.362314939498901e-06, -3.6116689443588257e-06, -2.86102294921875e-06, -2.1103769540786743e-06, -1.3597309589385986e-06, -6.09084963798523e-07, 1.4156103134155273e-07, 8.922070264816284e-07, 1.642853021621704e-06, 2.3934990167617798e-06, 3.1441450119018555e-06, 3.894791007041931e-06, 4.645437002182007e-06, 5.3960829973220825e-06, 6.146728992462158e-06, 6.897374987602234e-06, 7.64802098274231e-06, 8.398666977882385e-06, 9.149312973022461e-06, 9.899958968162537e-06, 1.0650604963302612e-05, 1.1401250958442688e-05, 1.2151896953582764e-05, 1.290254294872284e-05, 1.3653188943862915e-05, 1.440383493900299e-05, 1.5154480934143066e-05, 1.5905126929283142e-05, 1.6655772924423218e-05, 1.7406418919563293e-05, 1.815706491470337e-05, 1.8907710909843445e-05, 1.965835690498352e-05, 2.0409002900123596e-05, 2.1159648895263672e-05]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 10.0, 8.0, 13.0, 901.0, 9.0, 11.0, 17.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.6425776645264705e-07, -4.544414764495741e-07, -4.446252148682106e-07, -4.3480892486513767e-07, -4.2499263486206473e-07, -4.1517637328070123e-07, -4.053600832776283e-07, -3.9554379327455536e-07, -3.8572753169319185e-07, -3.759112416901189e-07, -3.660949801087554e-07, -3.5627869010568247e-07, -3.4646240010260954e-07, -3.3664613852124603e-07, -3.268298485181731e-07, -3.170135869368096e-07, -3.0719729693373665e-07, -2.973810069306637e-07, -2.875647453493002e-07, -2.777484553462273e-07, -2.6793216534315434e-07, -2.5811590376179083e-07, -2.482996137587179e-07, -2.3848332375564496e-07, -2.2866703375257202e-07, -2.188507579603538e-07, -2.0903446795728087e-07, -1.9921819216506265e-07, -1.8940191637284443e-07, -1.795856405806262e-07, -1.6976935057755327e-07, -1.5995307478533505e-07, -1.501367847822621e-07, -1.403205089900439e-07, -1.3050421898697095e-07, -1.2068794319475273e-07, -1.1087166740253451e-07, -1.0105538450488893e-07, -9.123910160724336e-08, -8.142282581502513e-08, -7.160654291737956e-08, -6.179026001973398e-08, -5.197398422751576e-08, -4.215770132987018e-08, -3.234142198493828e-08, -2.252514264000638e-08, -1.27088597423608e-08, -2.89258395014258e-09, 6.923698947502999e-09, 1.6739978292434898e-08, 2.6556259413723637e-08, 3.6372540535012376e-08, 4.6188819879944276e-08, 5.6005099224876176e-08, 6.582138212252175e-08, 7.563765791473998e-08, 8.545394081238555e-08, 9.527022371003113e-08, 1.0508649950224935e-07, 1.1490278239989493e-07, 1.247190652975405e-07, 1.3453534108975873e-07, 1.4435161688197695e-07, 1.541679068850499e-07, 1.639841826772681e-07]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 903.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 52.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.384185791015625e-07, -2.3189932107925415e-07, -2.253800630569458e-07, -2.1886080503463745e-07, -2.123415470123291e-07, -2.0582228899002075e-07, -1.993030309677124e-07, -1.9278377294540405e-07, -1.862645149230957e-07, -1.7974525690078735e-07, -1.73225998878479e-07, -1.6670674085617065e-07, -1.601874828338623e-07, -1.5366822481155396e-07, -1.471489667892456e-07, -1.4062970876693726e-07, -1.341104507446289e-07, -1.2759119272232056e-07, -1.210719347000122e-07, -1.1455267667770386e-07, -1.0803341865539551e-07, -1.0151416063308716e-07, -9.499490261077881e-08, -8.847564458847046e-08, -8.195638656616211e-08, -7.543712854385376e-08, -6.891787052154541e-08, -6.239861249923706e-08, -5.587935447692871e-08, -4.936009645462036e-08, -4.284083843231201e-08, -3.632158041000366e-08, -2.9802322387695312e-08, -2.3283064365386963e-08, -1.6763806343078613e-08, -1.0244548320770264e-08, -3.725290298461914e-09, 2.7939677238464355e-09, 9.313225746154785e-09, 1.5832483768463135e-08, 2.2351741790771484e-08, 2.8870999813079834e-08, 3.5390257835388184e-08, 4.190951585769653e-08, 4.842877388000488e-08, 5.494803190231323e-08, 6.146728992462158e-08, 6.798654794692993e-08, 7.450580596923828e-08, 8.102506399154663e-08, 8.754432201385498e-08, 9.406358003616333e-08, 1.0058283805847168e-07, 1.0710209608078003e-07, 1.1362135410308838e-07, 1.2014061212539673e-07, 1.2665987014770508e-07, 1.3317912817001343e-07, 1.3969838619232178e-07, 1.4621764421463013e-07, 1.5273690223693848e-07, 1.5925616025924683e-07, 1.6577541828155518e-07, 1.7229467630386353e-07, 1.7881393432617188e-07]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 3.0, 5.0, 8.0, 1.0, 11.0, 12.0, 12.0, 13.0, 12.0, 16.0, 17.0, 26.0, 23.0, 34.0, 22.0, 25.0, 40.0, 35.0, 44.0, 41.0, 42.0, 34.0, 35.0, 47.0, 39.0, 38.0, 37.0, 30.0, 34.0, 33.0, 25.0, 34.0, 27.0, 20.0, 22.0, 23.0, 15.0, 11.0, 16.0, 11.0, 11.0, 9.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4697265625, -1.4201812744140625, -1.370635986328125, -1.3210906982421875, -1.27154541015625, -1.2220001220703125, -1.172454833984375, -1.1229095458984375, -1.0733642578125, -1.0238189697265625, -0.974273681640625, -0.9247283935546875, -0.87518310546875, -0.8256378173828125, -0.776092529296875, -0.7265472412109375, -0.677001953125, -0.6274566650390625, -0.577911376953125, -0.5283660888671875, -0.47882080078125, -0.4292755126953125, -0.379730224609375, -0.3301849365234375, -0.2806396484375, -0.2310943603515625, -0.181549072265625, -0.1320037841796875, -0.08245849609375, -0.0329132080078125, 0.016632080078125, 0.0661773681640625, 0.11572265625, 0.1652679443359375, 0.214813232421875, 0.2643585205078125, 0.31390380859375, 0.3634490966796875, 0.412994384765625, 0.4625396728515625, 0.5120849609375, 0.5616302490234375, 0.611175537109375, 0.6607208251953125, 0.71026611328125, 0.7598114013671875, 0.809356689453125, 0.8589019775390625, 0.908447265625, 0.9579925537109375, 1.007537841796875, 1.0570831298828125, 1.10662841796875, 1.1561737060546875, 1.205718994140625, 1.2552642822265625, 1.3048095703125, 1.3543548583984375, 1.403900146484375, 1.4534454345703125, 1.50299072265625, 1.5525360107421875, 1.602081298828125, 1.6516265869140625, 1.701171875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 10.0, 11.0, 16.0, 25.0, 45.0, 50.0, 93.0, 126.0, 189.0, 287.0, 383.0, 591.0, 952.0, 1298.0, 2015.0, 2914.0, 4289.0, 6479.0, 9412.0, 14203.0, 21864.0, 36065.0, 59967.0, 101513.0, 177500.0, 233361.0, 150016.0, 86313.0, 50560.0, 30486.0, 19313.0, 12335.0, 8432.0, 5690.0, 3752.0, 2630.0, 1754.0, 1192.0, 784.0, 547.0, 372.0, 246.0, 154.0, 100.0, 82.0, 55.0, 33.0, 22.0, 15.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.607421875, -1.5577239990234375, -1.508026123046875, -1.4583282470703125, -1.40863037109375, -1.3589324951171875, -1.309234619140625, -1.2595367431640625, -1.2098388671875, -1.1601409912109375, -1.110443115234375, -1.0607452392578125, -1.01104736328125, -0.9613494873046875, -0.911651611328125, -0.8619537353515625, -0.812255859375, -0.7625579833984375, -0.712860107421875, -0.6631622314453125, -0.61346435546875, -0.5637664794921875, -0.514068603515625, -0.4643707275390625, -0.4146728515625, -0.3649749755859375, -0.315277099609375, -0.2655792236328125, -0.21588134765625, -0.1661834716796875, -0.116485595703125, -0.0667877197265625, -0.01708984375, 0.0326080322265625, 0.082305908203125, 0.1320037841796875, 0.18170166015625, 0.2313995361328125, 0.281097412109375, 0.3307952880859375, 0.3804931640625, 0.4301910400390625, 0.479888916015625, 0.5295867919921875, 0.57928466796875, 0.6289825439453125, 0.678680419921875, 0.7283782958984375, 0.778076171875, 0.8277740478515625, 0.877471923828125, 0.9271697998046875, 0.97686767578125, 1.0265655517578125, 1.076263427734375, 1.1259613037109375, 1.1756591796875, 1.2253570556640625, 1.275054931640625, 1.3247528076171875, 1.37445068359375, 1.4241485595703125, 1.473846435546875, 1.5235443115234375, 1.5732421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 6.0, 6.0, 7.0, 15.0, 17.0, 17.0, 10.0, 19.0, 36.0, 41.0, 33.0, 42.0, 40.0, 49.0, 73.0, 99.0, 137.0, 230.0, 1318.0, 192.0, 119.0, 77.0, 61.0, 57.0, 48.0, 32.0, 36.0, 31.0, 35.0, 21.0, 19.0, 20.0, 24.0, 22.0, 9.0, 13.0, 8.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.16015625, -5.98114013671875, -5.8021240234375, -5.62310791015625, -5.444091796875, -5.26507568359375, -5.0860595703125, -4.90704345703125, -4.72802734375, -4.54901123046875, -4.3699951171875, -4.19097900390625, -4.011962890625, -3.83294677734375, -3.6539306640625, -3.47491455078125, -3.2958984375, -3.11688232421875, -2.9378662109375, -2.75885009765625, -2.579833984375, -2.40081787109375, -2.2218017578125, -2.04278564453125, -1.86376953125, -1.68475341796875, -1.5057373046875, -1.32672119140625, -1.147705078125, -0.96868896484375, -0.7896728515625, -0.61065673828125, -0.431640625, -0.25262451171875, -0.0736083984375, 0.10540771484375, 0.284423828125, 0.46343994140625, 0.6424560546875, 0.82147216796875, 1.00048828125, 1.17950439453125, 1.3585205078125, 1.53753662109375, 1.716552734375, 1.89556884765625, 2.0745849609375, 2.25360107421875, 2.4326171875, 2.61163330078125, 2.7906494140625, 2.96966552734375, 3.148681640625, 3.32769775390625, 3.5067138671875, 3.68572998046875, 3.86474609375, 4.04376220703125, 4.2227783203125, 4.40179443359375, 4.580810546875, 4.75982666015625, 4.9388427734375, 5.11785888671875, 5.296875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 7.0, 18.0, 20.0, 23.0, 29.0, 18.0, 38.0, 53.0, 71.0, 98.0, 187.0, 372.0, 653.0, 1567.0, 4095.0, 13337.0, 59596.0, 477497.0, 2285788.0, 248488.0, 38658.0, 9551.0, 2929.0, 1264.0, 523.0, 275.0, 162.0, 108.0, 60.0, 54.0, 27.0, 26.0, 18.0, 20.0, 8.0, 13.0, 7.0, 5.0, 5.0, 4.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.64453125, -7.40081787109375, -7.1571044921875, -6.91339111328125, -6.669677734375, -6.42596435546875, -6.1822509765625, -5.93853759765625, -5.69482421875, -5.45111083984375, -5.2073974609375, -4.96368408203125, -4.719970703125, -4.47625732421875, -4.2325439453125, -3.98883056640625, -3.7451171875, -3.50140380859375, -3.2576904296875, -3.01397705078125, -2.770263671875, -2.52655029296875, -2.2828369140625, -2.03912353515625, -1.79541015625, -1.55169677734375, -1.3079833984375, -1.06427001953125, -0.820556640625, -0.57684326171875, -0.3331298828125, -0.08941650390625, 0.154296875, 0.39801025390625, 0.6417236328125, 0.88543701171875, 1.129150390625, 1.37286376953125, 1.6165771484375, 1.86029052734375, 2.10400390625, 2.34771728515625, 2.5914306640625, 2.83514404296875, 3.078857421875, 3.32257080078125, 3.5662841796875, 3.80999755859375, 4.0537109375, 4.29742431640625, 4.5411376953125, 4.78485107421875, 5.028564453125, 5.27227783203125, 5.5159912109375, 5.75970458984375, 6.00341796875, 6.24713134765625, 6.4908447265625, 6.73455810546875, 6.978271484375, 7.22198486328125, 7.4656982421875, 7.70941162109375, 7.953125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 104.0, 733.0, 174.0], "bins": [-305.97344970703125, -301.0771484375, -296.1808776855469, -291.2845764160156, -286.3883056640625, -281.49200439453125, -276.595703125, -271.6994323730469, -266.8031311035156, -261.9068298339844, -257.01055908203125, -252.1142578125, -247.2179718017578, -242.32168579101562, -237.42538452148438, -232.5290985107422, -227.6328125, -222.7365264892578, -217.84024047851562, -212.94393920898438, -208.0476531982422, -203.1513671875, -198.25506591796875, -193.35877990722656, -188.46249389648438, -183.5662078857422, -178.669921875, -173.77362060546875, -168.87733459472656, -163.98104858398438, -159.08474731445312, -154.18846130371094, -149.29217529296875, -144.39588928222656, -139.49960327148438, -134.60330200195312, -129.70701599121094, -124.81072998046875, -119.91443634033203, -115.01814270019531, -110.12186431884766, -105.22557067871094, -100.32928466796875, -95.43299865722656, -90.53670501708984, -85.64041137695312, -80.74412536621094, -75.84783935546875, -70.95154571533203, -66.05525207519531, -61.158966064453125, -56.26267623901367, -51.36638641357422, -46.470096588134766, -41.57380676269531, -36.67751693725586, -31.781227111816406, -26.884937286376953, -21.9886474609375, -17.092357635498047, -12.196067810058594, -7.299777984619141, -2.4034881591796875, 2.4928016662597656, 7.389091491699219]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 5.0, 1.0, 3.0, 4.0, 9.0, 8.0, 6.0, 7.0, 8.0, 18.0, 9.0, 22.0, 18.0, 25.0, 27.0, 28.0, 18.0, 21.0, 26.0, 32.0, 46.0, 31.0, 31.0, 41.0, 35.0, 34.0, 33.0, 44.0, 38.0, 28.0, 28.0, 38.0, 47.0, 34.0, 26.0, 19.0, 20.0, 26.0, 19.0, 12.0, 11.0, 15.0, 17.0, 10.0, 4.0, 5.0, 4.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.080780029296875, -17.523303985595703, -16.96582794189453, -16.40835189819336, -15.850875854492188, -15.293399810791016, -14.73592472076416, -14.178448677062988, -13.620972633361816, -13.063496589660645, -12.506020545959473, -11.9485445022583, -11.391069412231445, -10.833593368530273, -10.276117324829102, -9.71864128112793, -9.161165237426758, -8.603689193725586, -8.046213150024414, -7.4887375831604, -6.9312615394592285, -6.373785495758057, -5.816309928894043, -5.258833885192871, -4.701357841491699, -4.143881797790527, -3.5864059925079346, -3.028930187225342, -2.47145414352417, -1.913978099822998, -1.3565022945404053, -0.7990264892578125, -0.24155235290527344, 0.3159235715866089, 0.8733994960784912, 1.4308754205703735, 1.9883513450622559, 2.5458273887634277, 3.1033031940460205, 3.6607789993286133, 4.218255043029785, 4.775731086730957, 5.333207130432129, 5.890682697296143, 6.4481587409973145, 7.005634784698486, 7.5631103515625, 8.120586395263672, 8.678062438964844, 9.235538482666016, 9.793014526367188, 10.35049057006836, 10.907966613769531, 11.465442657470703, 12.022917747497559, 12.58039379119873, 13.137869834899902, 13.695345878601074, 14.252821922302246, 14.810297966003418, 15.367773056030273, 15.925249099731445, 16.482725143432617, 17.04020118713379, 17.59767723083496]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 4.0, 6.0, 9.0, 12.0, 14.0, 17.0, 23.0, 15.0, 23.0, 21.0, 26.0, 31.0, 36.0, 39.0, 27.0, 35.0, 44.0, 35.0, 34.0, 44.0, 40.0, 50.0, 36.0, 41.0, 40.0, 27.0, 33.0, 35.0, 23.0, 35.0, 16.0, 18.0, 14.0, 16.0, 20.0, 14.0, 9.0, 5.0, 10.0, 7.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.564453125, -1.5117340087890625, -1.459014892578125, -1.4062957763671875, -1.35357666015625, -1.3008575439453125, -1.248138427734375, -1.1954193115234375, -1.1427001953125, -1.0899810791015625, -1.037261962890625, -0.9845428466796875, -0.93182373046875, -0.8791046142578125, -0.826385498046875, -0.7736663818359375, -0.720947265625, -0.6682281494140625, -0.615509033203125, -0.5627899169921875, -0.51007080078125, -0.4573516845703125, -0.404632568359375, -0.3519134521484375, -0.2991943359375, -0.2464752197265625, -0.193756103515625, -0.1410369873046875, -0.08831787109375, -0.0355987548828125, 0.017120361328125, 0.0698394775390625, 0.12255859375, 0.1752777099609375, 0.227996826171875, 0.2807159423828125, 0.33343505859375, 0.3861541748046875, 0.438873291015625, 0.4915924072265625, 0.5443115234375, 0.5970306396484375, 0.649749755859375, 0.7024688720703125, 0.75518798828125, 0.8079071044921875, 0.860626220703125, 0.9133453369140625, 0.966064453125, 1.0187835693359375, 1.071502685546875, 1.1242218017578125, 1.17694091796875, 1.2296600341796875, 1.282379150390625, 1.3350982666015625, 1.3878173828125, 1.4405364990234375, 1.493255615234375, 1.5459747314453125, 1.59869384765625, 1.6514129638671875, 1.704132080078125, 1.7568511962890625, 1.8095703125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 4.0, 5.0, 5.0, 9.0, 20.0, 23.0, 31.0, 26.0, 40.0, 69.0, 106.0, 158.0, 217.0, 397.0, 793.0, 1655.0, 4103.0, 11153.0, 32910.0, 104434.0, 350830.0, 1208165.0, 1671940.0, 565953.0, 163577.0, 50294.0, 16553.0, 6082.0, 2352.0, 1017.0, 477.0, 272.0, 159.0, 121.0, 98.0, 53.0, 46.0, 33.0, 30.0, 17.0, 15.0, 13.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.654296875, -3.544189453125, -3.43408203125, -3.323974609375, -3.2138671875, -3.103759765625, -2.99365234375, -2.883544921875, -2.7734375, -2.663330078125, -2.55322265625, -2.443115234375, -2.3330078125, -2.222900390625, -2.11279296875, -2.002685546875, -1.892578125, -1.782470703125, -1.67236328125, -1.562255859375, -1.4521484375, -1.342041015625, -1.23193359375, -1.121826171875, -1.01171875, -0.901611328125, -0.79150390625, -0.681396484375, -0.5712890625, -0.461181640625, -0.35107421875, -0.240966796875, -0.130859375, -0.020751953125, 0.08935546875, 0.199462890625, 0.3095703125, 0.419677734375, 0.52978515625, 0.639892578125, 0.75, 0.860107421875, 0.97021484375, 1.080322265625, 1.1904296875, 1.300537109375, 1.41064453125, 1.520751953125, 1.630859375, 1.740966796875, 1.85107421875, 1.961181640625, 2.0712890625, 2.181396484375, 2.29150390625, 2.401611328125, 2.51171875, 2.621826171875, 2.73193359375, 2.842041015625, 2.9521484375, 3.062255859375, 3.17236328125, 3.282470703125, 3.392578125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 11.0, 20.0, 33.0, 46.0, 89.0, 150.0, 303.0, 454.0, 738.0, 839.0, 562.0, 381.0, 207.0, 112.0, 63.0, 33.0, 18.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.109375, -13.81671142578125, -13.5240478515625, -13.23138427734375, -12.938720703125, -12.64605712890625, -12.3533935546875, -12.06072998046875, -11.76806640625, -11.47540283203125, -11.1827392578125, -10.89007568359375, -10.597412109375, -10.30474853515625, -10.0120849609375, -9.71942138671875, -9.4267578125, -9.13409423828125, -8.8414306640625, -8.54876708984375, -8.256103515625, -7.96343994140625, -7.6707763671875, -7.37811279296875, -7.08544921875, -6.79278564453125, -6.5001220703125, -6.20745849609375, -5.914794921875, -5.62213134765625, -5.3294677734375, -5.03680419921875, -4.744140625, -4.45147705078125, -4.1588134765625, -3.86614990234375, -3.573486328125, -3.28082275390625, -2.9881591796875, -2.69549560546875, -2.40283203125, -2.11016845703125, -1.8175048828125, -1.52484130859375, -1.232177734375, -0.93951416015625, -0.6468505859375, -0.35418701171875, -0.0615234375, 0.23114013671875, 0.5238037109375, 0.81646728515625, 1.109130859375, 1.40179443359375, 1.6944580078125, 1.98712158203125, 2.27978515625, 2.57244873046875, 2.8651123046875, 3.15777587890625, 3.450439453125, 3.74310302734375, 4.0357666015625, 4.32843017578125, 4.62109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 9.0, 10.0, 30.0, 27.0, 43.0, 81.0, 139.0, 269.0, 586.0, 1531.0, 5640.0, 45226.0, 790046.0, 3010448.0, 313928.0, 20708.0, 3538.0, 1071.0, 444.0, 229.0, 105.0, 61.0, 37.0, 25.0, 18.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2265625, -9.7884521484375, -9.350341796875, -8.9122314453125, -8.47412109375, -8.0360107421875, -7.597900390625, -7.1597900390625, -6.7216796875, -6.2835693359375, -5.845458984375, -5.4073486328125, -4.96923828125, -4.5311279296875, -4.093017578125, -3.6549072265625, -3.216796875, -2.7786865234375, -2.340576171875, -1.9024658203125, -1.46435546875, -1.0262451171875, -0.588134765625, -0.1500244140625, 0.2880859375, 0.7261962890625, 1.164306640625, 1.6024169921875, 2.04052734375, 2.4786376953125, 2.916748046875, 3.3548583984375, 3.79296875, 4.2310791015625, 4.669189453125, 5.1072998046875, 5.54541015625, 5.9835205078125, 6.421630859375, 6.8597412109375, 7.2978515625, 7.7359619140625, 8.174072265625, 8.6121826171875, 9.05029296875, 9.4884033203125, 9.926513671875, 10.3646240234375, 10.802734375, 11.2408447265625, 11.678955078125, 12.1170654296875, 12.55517578125, 12.9932861328125, 13.431396484375, 13.8695068359375, 14.3076171875, 14.7457275390625, 15.183837890625, 15.6219482421875, 16.06005859375, 16.4981689453125, 16.936279296875, 17.3743896484375, 17.8125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 8.0, 24.0, 35.0, 46.0, 66.0, 79.0, 92.0, 104.0, 122.0, 117.0, 98.0, 71.0, 57.0, 44.0, 22.0, 10.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.606205940246582, -12.44528865814209, -11.284372329711914, -10.123455047607422, -8.96253776550293, -7.801621437072754, -6.640704154968262, -5.479787826538086, -4.318870544433594, -3.1579537391662598, -1.9970366954803467, -0.8361196517944336, 0.3247971534729004, 1.4857139587402344, 2.6466312408447266, 3.8075475692749023, 4.9684648513793945, 6.1293816566467285, 7.2902984619140625, 8.451215744018555, 9.612133026123047, 10.773049354553223, 11.933966636657715, 13.09488296508789, 14.255800247192383, 15.416717529296875, 16.577634811401367, 17.73855209350586, 18.89946746826172, 20.06038475036621, 21.221302032470703, 22.382217407226562, 23.543132781982422, 24.704050064086914, 25.864967346191406, 27.025882720947266, 28.186800003051758, 29.34771728515625, 30.508634567260742, 31.669551849365234, 32.830467224121094, 33.99138259887695, 35.15230178833008, 36.31321716308594, 37.47413635253906, 38.63505172729492, 39.79596710205078, 40.956886291503906, 42.11780548095703, 43.27872085571289, 44.439640045166016, 45.600555419921875, 46.761474609375, 47.92238998413086, 49.08330535888672, 50.244224548339844, 51.4051399230957, 52.56605529785156, 53.72697448730469, 54.88788986206055, 56.04880905151367, 57.20972442626953, 58.370643615722656, 59.531558990478516, 60.692474365234375]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 7.0, 4.0, 10.0, 8.0, 12.0, 10.0, 16.0, 22.0, 15.0, 15.0, 14.0, 29.0, 33.0, 34.0, 29.0, 29.0, 33.0, 39.0, 42.0, 42.0, 42.0, 28.0, 53.0, 29.0, 47.0, 29.0, 38.0, 41.0, 30.0, 33.0, 31.0, 24.0, 15.0, 15.0, 24.0, 20.0, 12.0, 13.0, 8.0, 11.0, 7.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.288288116455078, -19.717477798461914, -19.14666748046875, -18.575857162475586, -18.005046844482422, -17.434236526489258, -16.863426208496094, -16.292617797851562, -15.721806526184082, -15.150996208190918, -14.580185890197754, -14.00937557220459, -13.438566207885742, -12.867755889892578, -12.296945571899414, -11.72613525390625, -11.155324935913086, -10.584514617919922, -10.013704299926758, -9.442893981933594, -8.87208366394043, -8.301273345947266, -7.730463981628418, -7.159653663635254, -6.58884334564209, -6.018033027648926, -5.447222709655762, -4.876412868499756, -4.305602550506592, -3.7347922325134277, -3.1639821529388428, -2.593172073364258, -2.022359848022461, -1.4515496492385864, -0.8807394504547119, -0.3099292516708374, 0.2608809471130371, 0.8316912651062012, 1.4025013446807861, 1.973311424255371, 2.544121742248535, 3.114932060241699, 3.685742139816284, 4.256552219390869, 4.827362537384033, 5.398172855377197, 5.968982696533203, 6.539793014526367, 7.110603332519531, 7.681413650512695, 8.25222396850586, 8.823034286499023, 9.393844604492188, 9.964654922485352, 10.5354642868042, 11.106274604797363, 11.677084922790527, 12.247895240783691, 12.818705558776855, 13.38951587677002, 13.960325241088867, 14.531135559082031, 15.101945877075195, 15.67275619506836, 16.243566513061523]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 5.0, 7.0, 6.0, 9.0, 11.0, 16.0, 13.0, 20.0, 15.0, 19.0, 20.0, 27.0, 30.0, 32.0, 35.0, 35.0, 39.0, 28.0, 36.0, 36.0, 38.0, 47.0, 36.0, 42.0, 38.0, 35.0, 35.0, 37.0, 41.0, 29.0, 25.0, 20.0, 19.0, 19.0, 19.0, 18.0, 19.0, 11.0, 6.0, 7.0, 8.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.564453125, -1.5109100341796875, -1.457366943359375, -1.4038238525390625, -1.35028076171875, -1.2967376708984375, -1.243194580078125, -1.1896514892578125, -1.1361083984375, -1.0825653076171875, -1.029022216796875, -0.9754791259765625, -0.92193603515625, -0.8683929443359375, -0.814849853515625, -0.7613067626953125, -0.707763671875, -0.6542205810546875, -0.600677490234375, -0.5471343994140625, -0.49359130859375, -0.4400482177734375, -0.386505126953125, -0.3329620361328125, -0.2794189453125, -0.2258758544921875, -0.172332763671875, -0.1187896728515625, -0.06524658203125, -0.0117034912109375, 0.041839599609375, 0.0953826904296875, 0.14892578125, 0.2024688720703125, 0.256011962890625, 0.3095550537109375, 0.36309814453125, 0.4166412353515625, 0.470184326171875, 0.5237274169921875, 0.5772705078125, 0.6308135986328125, 0.684356689453125, 0.7378997802734375, 0.79144287109375, 0.8449859619140625, 0.898529052734375, 0.9520721435546875, 1.005615234375, 1.0591583251953125, 1.112701416015625, 1.1662445068359375, 1.21978759765625, 1.2733306884765625, 1.326873779296875, 1.3804168701171875, 1.4339599609375, 1.4875030517578125, 1.541046142578125, 1.5945892333984375, 1.64813232421875, 1.7016754150390625, 1.755218505859375, 1.8087615966796875, 1.8623046875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 5.0, 7.0, 21.0, 40.0, 49.0, 82.0, 121.0, 159.0, 248.0, 380.0, 566.0, 829.0, 1263.0, 1942.0, 2813.0, 4250.0, 6156.0, 9181.0, 13057.0, 19126.0, 28905.0, 43510.0, 67465.0, 113367.0, 276722.0, 187533.0, 94989.0, 58593.0, 38069.0, 25442.0, 17209.0, 11710.0, 7952.0, 5531.0, 3651.0, 2564.0, 1678.0, 1154.0, 785.0, 501.0, 313.0, 206.0, 147.0, 97.0, 50.0, 38.0, 34.0, 15.0, 9.0, 10.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.062255859375, -0.06030082702636719, -0.058345794677734375, -0.05639076232910156, -0.05443572998046875, -0.05248069763183594, -0.050525665283203125, -0.04857063293457031, -0.0466156005859375, -0.04466056823730469, -0.042705535888671875, -0.04075050354003906, -0.03879547119140625, -0.03684043884277344, -0.034885406494140625, -0.03293037414550781, -0.030975341796875, -0.029020309448242188, -0.027065277099609375, -0.025110244750976562, -0.02315521240234375, -0.021200180053710938, -0.019245147705078125, -0.017290115356445312, -0.0153350830078125, -0.013380050659179688, -0.011425018310546875, -0.009469985961914062, -0.00751495361328125, -0.0055599212646484375, -0.003604888916015625, -0.0016498565673828125, 0.00030517578125, 0.0022602081298828125, 0.004215240478515625, 0.0061702728271484375, 0.00812530517578125, 0.010080337524414062, 0.012035369873046875, 0.013990402221679688, 0.0159454345703125, 0.017900466918945312, 0.019855499267578125, 0.021810531616210938, 0.02376556396484375, 0.025720596313476562, 0.027675628662109375, 0.029630661010742188, 0.031585693359375, 0.03354072570800781, 0.035495758056640625, 0.03745079040527344, 0.03940582275390625, 0.04136085510253906, 0.043315887451171875, 0.04527091979980469, 0.0472259521484375, 0.04918098449707031, 0.051136016845703125, 0.05309104919433594, 0.05504608154296875, 0.05700111389160156, 0.058956146240234375, 0.06091117858886719, 0.0628662109375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 4.0, 9.0, 11.0, 7.0, 18.0, 21.0, 31.0, 32.0, 29.0, 29.0, 23.0, 34.0, 35.0, 43.0, 40.0, 45.0, 32.0, 34.0, 1051.0, 42.0, 45.0, 45.0, 44.0, 40.0, 39.0, 34.0, 35.0, 31.0, 23.0, 14.0, 16.0, 12.0, 10.0, 12.0, 8.0, 12.0, 5.0, 10.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1787109375, -1.1368255615234375, -1.094940185546875, -1.0530548095703125, -1.01116943359375, -0.9692840576171875, -0.927398681640625, -0.8855133056640625, -0.8436279296875, -0.8017425537109375, -0.759857177734375, -0.7179718017578125, -0.67608642578125, -0.6342010498046875, -0.592315673828125, -0.5504302978515625, -0.508544921875, -0.4666595458984375, -0.424774169921875, -0.3828887939453125, -0.34100341796875, -0.2991180419921875, -0.257232666015625, -0.2153472900390625, -0.1734619140625, -0.1315765380859375, -0.089691162109375, -0.0478057861328125, -0.00592041015625, 0.0359649658203125, 0.077850341796875, 0.1197357177734375, 0.16162109375, 0.2035064697265625, 0.245391845703125, 0.2872772216796875, 0.32916259765625, 0.3710479736328125, 0.412933349609375, 0.4548187255859375, 0.4967041015625, 0.5385894775390625, 0.580474853515625, 0.6223602294921875, 0.66424560546875, 0.7061309814453125, 0.748016357421875, 0.7899017333984375, 0.831787109375, 0.8736724853515625, 0.915557861328125, 0.9574432373046875, 0.99932861328125, 1.0412139892578125, 1.083099365234375, 1.1249847412109375, 1.1668701171875, 1.2087554931640625, 1.250640869140625, 1.2925262451171875, 1.33441162109375, 1.3762969970703125, 1.418182373046875, 1.4600677490234375, 1.501953125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 4.0, 9.0, 11.0, 23.0, 29.0, 54.0, 75.0, 114.0, 181.0, 286.0, 429.0, 629.0, 1027.0, 1530.0, 2538.0, 3924.0, 5983.0, 9213.0, 14361.0, 23212.0, 37727.0, 63487.0, 117915.0, 1313134.0, 232604.0, 110295.0, 61028.0, 35987.0, 22170.0, 14305.0, 8912.0, 5676.0, 3580.0, 2363.0, 1520.0, 995.0, 646.0, 438.0, 251.0, 166.0, 93.0, 71.0, 44.0, 23.0, 21.0, 13.0, 12.0, 11.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.043182373046875, -0.04187202453613281, -0.040561676025390625, -0.03925132751464844, -0.03794097900390625, -0.03663063049316406, -0.035320281982421875, -0.03400993347167969, -0.0326995849609375, -0.03138923645019531, -0.030078887939453125, -0.028768539428710938, -0.02745819091796875, -0.026147842407226562, -0.024837493896484375, -0.023527145385742188, -0.022216796875, -0.020906448364257812, -0.019596099853515625, -0.018285751342773438, -0.01697540283203125, -0.015665054321289062, -0.014354705810546875, -0.013044357299804688, -0.0117340087890625, -0.010423660278320312, -0.009113311767578125, -0.0078029632568359375, -0.00649261474609375, -0.0051822662353515625, -0.003871917724609375, -0.0025615692138671875, -0.001251220703125, 5.91278076171875e-05, 0.001369476318359375, 0.0026798248291015625, 0.00399017333984375, 0.0053005218505859375, 0.006610870361328125, 0.007921218872070312, 0.0092315673828125, 0.010541915893554688, 0.011852264404296875, 0.013162612915039062, 0.01447296142578125, 0.015783309936523438, 0.017093658447265625, 0.018404006958007812, 0.01971435546875, 0.021024703979492188, 0.022335052490234375, 0.023645401000976562, 0.02495574951171875, 0.026266098022460938, 0.027576446533203125, 0.028886795043945312, 0.0301971435546875, 0.03150749206542969, 0.032817840576171875, 0.03412818908691406, 0.03543853759765625, 0.03674888610839844, 0.038059234619140625, 0.03936958312988281, 0.040679931640625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 0.0, 10.0, 6.0, 14.0, 13.0, 0.0, 13.0, 36.0, 52.0, 88.0, 0.0, 527.0, 102.0, 57.0, 0.0, 28.0, 10.0, 12.0, 6.0, 0.0, 6.0, 4.0, 3.0, 0.0, 7.0, 0.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.9203871488571167e-06, -1.8738210201263428e-06, -1.8272548913955688e-06, -1.780688762664795e-06, -1.734122633934021e-06, -1.687556505203247e-06, -1.6409903764724731e-06, -1.5944242477416992e-06, -1.5478581190109253e-06, -1.5012919902801514e-06, -1.4547258615493774e-06, -1.4081597328186035e-06, -1.3615936040878296e-06, -1.3150274753570557e-06, -1.2684613466262817e-06, -1.2218952178955078e-06, -1.1753290891647339e-06, -1.12876296043396e-06, -1.082196831703186e-06, -1.0356307029724121e-06, -9.890645742416382e-07, -9.424984455108643e-07, -8.959323167800903e-07, -8.493661880493164e-07, -8.028000593185425e-07, -7.562339305877686e-07, -7.096678018569946e-07, -6.631016731262207e-07, -6.165355443954468e-07, -5.699694156646729e-07, -5.234032869338989e-07, -4.76837158203125e-07, -4.302710294723511e-07, -3.8370490074157715e-07, -3.371387720108032e-07, -2.905726432800293e-07, -2.4400651454925537e-07, -1.9744038581848145e-07, -1.5087425708770752e-07, -1.043081283569336e-07, -5.774199962615967e-08, -1.1175870895385742e-08, 3.5390257835388184e-08, 8.195638656616211e-08, 1.2852251529693604e-07, 1.7508864402770996e-07, 2.2165477275848389e-07, 2.682209014892578e-07, 3.1478703022003174e-07, 3.6135315895080566e-07, 4.079192876815796e-07, 4.544854164123535e-07, 5.010515451431274e-07, 5.476176738739014e-07, 5.941838026046753e-07, 6.407499313354492e-07, 6.873160600662231e-07, 7.338821887969971e-07, 7.80448317527771e-07, 8.270144462585449e-07, 8.735805749893188e-07, 9.201467037200928e-07, 9.667128324508667e-07, 1.0132789611816406e-06]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 3.0, 4.0, 7.0, 7.0, 13.0, 9.0, 30.0, 44.0, 74.0, 129.0, 372.0, 15033.0, 1021847.0, 10387.0, 305.0, 93.0, 48.0, 46.0, 29.0, 24.0, 20.0, 17.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9550323486328125e-05, -1.8716789782047272e-05, -1.788325607776642e-05, -1.7049722373485565e-05, -1.6216188669204712e-05, -1.538265496492386e-05, -1.4549121260643005e-05, -1.3715587556362152e-05, -1.2882053852081299e-05, -1.2048520147800446e-05, -1.1214986443519592e-05, -1.0381452739238739e-05, -9.547919034957886e-06, -8.714385330677032e-06, -7.88085162639618e-06, -7.047317922115326e-06, -6.213784217834473e-06, -5.380250513553619e-06, -4.546716809272766e-06, -3.713183104991913e-06, -2.8796494007110596e-06, -2.0461156964302063e-06, -1.212581992149353e-06, -3.7904828786849976e-07, 4.544854164123535e-07, 1.2880191206932068e-06, 2.12155282497406e-06, 2.9550865292549133e-06, 3.7886202335357666e-06, 4.62215393781662e-06, 5.455687642097473e-06, 6.289221346378326e-06, 7.12275505065918e-06, 7.956288754940033e-06, 8.789822459220886e-06, 9.62335616350174e-06, 1.0456889867782593e-05, 1.1290423572063446e-05, 1.21239572763443e-05, 1.2957490980625153e-05, 1.3791024684906006e-05, 1.4624558389186859e-05, 1.5458092093467712e-05, 1.6291625797748566e-05, 1.712515950202942e-05, 1.7958693206310272e-05, 1.8792226910591125e-05, 1.962576061487198e-05, 2.0459294319152832e-05, 2.1292828023433685e-05, 2.212636172771454e-05, 2.2959895431995392e-05, 2.3793429136276245e-05, 2.46269628405571e-05, 2.546049654483795e-05, 2.6294030249118805e-05, 2.7127563953399658e-05, 2.796109765768051e-05, 2.8794631361961365e-05, 2.9628165066242218e-05, 3.046169877052307e-05, 3.1295232474803925e-05, 3.212876617908478e-05, 3.296229988336563e-05, 3.3795833587646484e-05]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 11.0, 16.0, 20.0, 31.0, 833.0, 31.0, 22.0, 21.0, 11.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.063435300049605e-07, -8.880516588760656e-07, -8.697597309037519e-07, -8.514678597748571e-07, -8.331759318025433e-07, -8.148840606736485e-07, -7.965921895447536e-07, -7.783002615724399e-07, -7.600083904435451e-07, -7.417165193146502e-07, -7.234245913423365e-07, -7.051327202134416e-07, -6.868407922411279e-07, -6.685489211122331e-07, -6.502569931399194e-07, -6.319651220110245e-07, -6.136732508821297e-07, -5.953813797532348e-07, -5.770894517809211e-07, -5.587975806520262e-07, -5.405056526797125e-07, -5.222137815508177e-07, -5.039219104219228e-07, -4.856299824496091e-07, -4.6733805447729537e-07, -4.490461549266911e-07, -4.307542553760868e-07, -4.1246238424719195e-07, -3.9417048469658766e-07, -3.758785851459834e-07, -3.575866855953791e-07, -3.392947860447748e-07, -3.210029433375894e-07, -3.027110437869851e-07, -2.844191442363808e-07, -2.6612724468577653e-07, -2.478353735568817e-07, -2.295434740062774e-07, -2.112515744556731e-07, -1.9295968911592354e-07, -1.7466778956531925e-07, -1.5637589001471497e-07, -1.380840046749654e-07, -1.1979210512436111e-07, -1.0150021267918419e-07, -8.320832023400726e-08, -6.491642068340298e-08, -4.6624535343653406e-08, -2.833263579304912e-08, -1.0040741571515355e-08, 8.251152650018412e-09, 2.6543048647909018e-08, 4.4834941093085945e-08, 6.312683353826287e-08, 8.141873308886716e-08, 9.971061842861673e-08, 1.1800251797922101e-07, 1.362944175298253e-07, 1.5458630286957487e-07, 1.7287820242017915e-07, 1.9117010197078343e-07, 2.09461987310533e-07, 2.277538868611373e-07, 2.4604577220088686e-07, 2.6433767175149114e-07]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 88.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 825.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 82.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0], "bins": [-1.7881393432617188e-07, -1.7415732145309448e-07, -1.695007085800171e-07, -1.648440957069397e-07, -1.601874828338623e-07, -1.555308699607849e-07, -1.5087425708770752e-07, -1.4621764421463013e-07, -1.4156103134155273e-07, -1.3690441846847534e-07, -1.3224780559539795e-07, -1.2759119272232056e-07, -1.2293457984924316e-07, -1.1827796697616577e-07, -1.1362135410308838e-07, -1.0896474123001099e-07, -1.043081283569336e-07, -9.96515154838562e-08, -9.499490261077881e-08, -9.033828973770142e-08, -8.568167686462402e-08, -8.102506399154663e-08, -7.636845111846924e-08, -7.171183824539185e-08, -6.705522537231445e-08, -6.239861249923706e-08, -5.774199962615967e-08, -5.3085386753082275e-08, -4.842877388000488e-08, -4.377216100692749e-08, -3.91155481338501e-08, -3.4458935260772705e-08, -2.9802322387695312e-08, -2.514570951461792e-08, -2.0489096641540527e-08, -1.5832483768463135e-08, -1.1175870895385742e-08, -6.51925802230835e-09, -1.862645149230957e-09, 2.7939677238464355e-09, 7.450580596923828e-09, 1.210719347000122e-08, 1.6763806343078613e-08, 2.1420419216156006e-08, 2.60770320892334e-08, 3.073364496231079e-08, 3.5390257835388184e-08, 4.0046870708465576e-08, 4.470348358154297e-08, 4.936009645462036e-08, 5.4016709327697754e-08, 5.8673322200775146e-08, 6.332993507385254e-08, 6.798654794692993e-08, 7.264316082000732e-08, 7.729977369308472e-08, 8.195638656616211e-08, 8.66129994392395e-08, 9.12696123123169e-08, 9.592622518539429e-08, 1.0058283805847168e-07, 1.0523945093154907e-07, 1.0989606380462646e-07, 1.1455267667770386e-07, 1.1920928955078125e-07]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 5.0, 7.0, 6.0, 9.0, 11.0, 16.0, 13.0, 20.0, 15.0, 19.0, 20.0, 27.0, 30.0, 32.0, 35.0, 35.0, 39.0, 28.0, 36.0, 36.0, 38.0, 47.0, 36.0, 42.0, 38.0, 35.0, 35.0, 37.0, 41.0, 29.0, 25.0, 20.0, 19.0, 19.0, 19.0, 18.0, 19.0, 11.0, 6.0, 7.0, 8.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.564453125, -1.5109100341796875, -1.457366943359375, -1.4038238525390625, -1.35028076171875, -1.2967376708984375, -1.243194580078125, -1.1896514892578125, -1.1361083984375, -1.0825653076171875, -1.029022216796875, -0.9754791259765625, -0.92193603515625, -0.8683929443359375, -0.814849853515625, -0.7613067626953125, -0.707763671875, -0.6542205810546875, -0.600677490234375, -0.5471343994140625, -0.49359130859375, -0.4400482177734375, -0.386505126953125, -0.3329620361328125, -0.2794189453125, -0.2258758544921875, -0.172332763671875, -0.1187896728515625, -0.06524658203125, -0.0117034912109375, 0.041839599609375, 0.0953826904296875, 0.14892578125, 0.2024688720703125, 0.256011962890625, 0.3095550537109375, 0.36309814453125, 0.4166412353515625, 0.470184326171875, 0.5237274169921875, 0.5772705078125, 0.6308135986328125, 0.684356689453125, 0.7378997802734375, 0.79144287109375, 0.8449859619140625, 0.898529052734375, 0.9520721435546875, 1.005615234375, 1.0591583251953125, 1.112701416015625, 1.1662445068359375, 1.21978759765625, 1.2733306884765625, 1.326873779296875, 1.3804168701171875, 1.4339599609375, 1.4875030517578125, 1.541046142578125, 1.5945892333984375, 1.64813232421875, 1.7016754150390625, 1.755218505859375, 1.8087615966796875, 1.8623046875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 13.0, 14.0, 17.0, 22.0, 34.0, 44.0, 68.0, 103.0, 153.0, 247.0, 364.0, 503.0, 840.0, 1266.0, 1894.0, 2788.0, 4445.0, 6991.0, 11094.0, 18522.0, 31781.0, 58669.0, 116746.0, 253323.0, 269789.0, 123177.0, 61579.0, 32891.0, 19021.0, 11456.0, 7303.0, 4625.0, 2956.0, 2011.0, 1236.0, 870.0, 584.0, 377.0, 272.0, 128.0, 116.0, 65.0, 52.0, 33.0, 26.0, 23.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.296875, -2.222869873046875, -2.14886474609375, -2.074859619140625, -2.0008544921875, -1.926849365234375, -1.85284423828125, -1.778839111328125, -1.704833984375, -1.630828857421875, -1.55682373046875, -1.482818603515625, -1.4088134765625, -1.334808349609375, -1.26080322265625, -1.186798095703125, -1.11279296875, -1.038787841796875, -0.96478271484375, -0.890777587890625, -0.8167724609375, -0.742767333984375, -0.66876220703125, -0.594757080078125, -0.520751953125, -0.446746826171875, -0.37274169921875, -0.298736572265625, -0.2247314453125, -0.150726318359375, -0.07672119140625, -0.002716064453125, 0.0712890625, 0.145294189453125, 0.21929931640625, 0.293304443359375, 0.3673095703125, 0.441314697265625, 0.51531982421875, 0.589324951171875, 0.663330078125, 0.737335205078125, 0.81134033203125, 0.885345458984375, 0.9593505859375, 1.033355712890625, 1.10736083984375, 1.181365966796875, 1.25537109375, 1.329376220703125, 1.40338134765625, 1.477386474609375, 1.5513916015625, 1.625396728515625, 1.69940185546875, 1.773406982421875, 1.847412109375, 1.921417236328125, 1.99542236328125, 2.069427490234375, 2.1434326171875, 2.217437744140625, 2.29144287109375, 2.365447998046875, 2.439453125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 15.0, 10.0, 17.0, 23.0, 28.0, 34.0, 33.0, 46.0, 53.0, 59.0, 91.0, 131.0, 202.0, 1456.0, 286.0, 128.0, 84.0, 67.0, 48.0, 42.0, 32.0, 30.0, 28.0, 21.0, 17.0, 23.0, 10.0, 7.0, 6.0, 5.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8203125, -9.5595703125, -9.298828125, -9.0380859375, -8.77734375, -8.5166015625, -8.255859375, -7.9951171875, -7.734375, -7.4736328125, -7.212890625, -6.9521484375, -6.69140625, -6.4306640625, -6.169921875, -5.9091796875, -5.6484375, -5.3876953125, -5.126953125, -4.8662109375, -4.60546875, -4.3447265625, -4.083984375, -3.8232421875, -3.5625, -3.3017578125, -3.041015625, -2.7802734375, -2.51953125, -2.2587890625, -1.998046875, -1.7373046875, -1.4765625, -1.2158203125, -0.955078125, -0.6943359375, -0.43359375, -0.1728515625, 0.087890625, 0.3486328125, 0.609375, 0.8701171875, 1.130859375, 1.3916015625, 1.65234375, 1.9130859375, 2.173828125, 2.4345703125, 2.6953125, 2.9560546875, 3.216796875, 3.4775390625, 3.73828125, 3.9990234375, 4.259765625, 4.5205078125, 4.78125, 5.0419921875, 5.302734375, 5.5634765625, 5.82421875, 6.0849609375, 6.345703125, 6.6064453125, 6.8671875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 6.0, 4.0, 17.0, 13.0, 11.0, 16.0, 21.0, 29.0, 37.0, 64.0, 85.0, 134.0, 199.0, 399.0, 1011.0, 3811.0, 20505.0, 203475.0, 2537584.0, 342049.0, 28859.0, 4915.0, 1247.0, 495.0, 237.0, 122.0, 101.0, 58.0, 56.0, 36.0, 28.0, 28.0, 14.0, 8.0, 8.0, 8.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.234375, -9.8997802734375, -9.565185546875, -9.2305908203125, -8.89599609375, -8.5614013671875, -8.226806640625, -7.8922119140625, -7.5576171875, -7.2230224609375, -6.888427734375, -6.5538330078125, -6.21923828125, -5.8846435546875, -5.550048828125, -5.2154541015625, -4.880859375, -4.5462646484375, -4.211669921875, -3.8770751953125, -3.54248046875, -3.2078857421875, -2.873291015625, -2.5386962890625, -2.2041015625, -1.8695068359375, -1.534912109375, -1.2003173828125, -0.86572265625, -0.5311279296875, -0.196533203125, 0.1380615234375, 0.47265625, 0.8072509765625, 1.141845703125, 1.4764404296875, 1.81103515625, 2.1456298828125, 2.480224609375, 2.8148193359375, 3.1494140625, 3.4840087890625, 3.818603515625, 4.1531982421875, 4.48779296875, 4.8223876953125, 5.156982421875, 5.4915771484375, 5.826171875, 6.1607666015625, 6.495361328125, 6.8299560546875, 7.16455078125, 7.4991455078125, 7.833740234375, 8.1683349609375, 8.5029296875, 8.8375244140625, 9.172119140625, 9.5067138671875, 9.84130859375, 10.1759033203125, 10.510498046875, 10.8450927734375, 11.1796875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [108.0, 871.0, 39.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.390555381774902, -2.889803886413574, 3.610947608947754, 10.111699104309082, 16.612449645996094, 23.113201141357422, 29.61395263671875, 36.11470413208008, 42.615455627441406, 49.116207122802734, 55.61695861816406, 62.11771011352539, 68.61846160888672, 75.11921691894531, 81.61996459960938, 88.12071228027344, 94.62146759033203, 101.12222290039062, 107.62297058105469, 114.12371826171875, 120.62447357177734, 127.12522888183594, 133.6259765625, 140.12672424316406, 146.6274871826172, 153.12823486328125, 159.62899780273438, 166.12974548339844, 172.6304931640625, 179.13124084472656, 185.63198852539062, 192.13275146484375, 198.63348388671875, 205.1342315673828, 211.63497924804688, 218.1357421875, 224.63648986816406, 231.13723754882812, 237.63800048828125, 244.1387481689453, 250.63949584960938, 257.1402587890625, 263.6409912109375, 270.1417541503906, 276.64251708984375, 283.14324951171875, 289.6440124511719, 296.1447448730469, 302.6455078125, 309.1462707519531, 315.6470031738281, 322.14776611328125, 328.64849853515625, 335.1492614746094, 341.6500244140625, 348.1507568359375, 354.6515197753906, 361.15228271484375, 367.65301513671875, 374.1537780761719, 380.654541015625, 387.1552734375, 393.6560363769531, 400.1567687988281, 406.65753173828125]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 5.0, 16.0, 9.0, 5.0, 9.0, 10.0, 17.0, 22.0, 22.0, 18.0, 27.0, 26.0, 31.0, 34.0, 39.0, 37.0, 30.0, 40.0, 33.0, 38.0, 40.0, 35.0, 48.0, 41.0, 43.0, 41.0, 26.0, 29.0, 26.0, 24.0, 26.0, 23.0, 14.0, 11.0, 20.0, 14.0, 11.0, 10.0, 12.0, 10.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0], "bins": [-22.254898071289062, -21.652996063232422, -21.05109405517578, -20.449193954467773, -19.847291946411133, -19.245389938354492, -18.643489837646484, -18.041587829589844, -17.439685821533203, -16.837783813476562, -16.235881805419922, -15.633981704711914, -15.032079696655273, -14.430177688598633, -13.828276634216309, -13.226375579833984, -12.624473571777344, -12.022571563720703, -11.420670509338379, -10.818769454956055, -10.216867446899414, -9.614965438842773, -9.01306438446045, -8.411163330078125, -7.809261322021484, -7.207359790802002, -6.6054582595825195, -6.003556728363037, -5.401655197143555, -4.799753665924072, -4.19785213470459, -3.5959506034851074, -2.994047164916992, -2.3921456336975098, -1.7902441024780273, -1.188342571258545, -0.5864410400390625, 0.015460491180419922, 0.6173620223999023, 1.2192635536193848, 1.8211650848388672, 2.4230666160583496, 3.024968147277832, 3.6268696784973145, 4.228771209716797, 4.830672740936279, 5.432574272155762, 6.034475803375244, 6.636377334594727, 7.238278865814209, 7.840180397033691, 8.442081451416016, 9.043983459472656, 9.645885467529297, 10.247786521911621, 10.849687576293945, 11.451589584350586, 12.053491592407227, 12.65539264678955, 13.257293701171875, 13.859195709228516, 14.461097717285156, 15.06299877166748, 15.664899826049805, 16.266801834106445]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 13.0, 10.0, 13.0, 14.0, 16.0, 18.0, 18.0, 17.0, 19.0, 23.0, 17.0, 27.0, 35.0, 34.0, 26.0, 30.0, 35.0, 39.0, 36.0, 36.0, 41.0, 29.0, 36.0, 44.0, 31.0, 28.0, 35.0, 34.0, 36.0, 31.0, 20.0, 15.0, 18.0, 18.0, 20.0, 15.0, 11.0, 8.0, 10.0, 7.0, 10.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5224609375, -1.469940185546875, -1.41741943359375, -1.364898681640625, -1.3123779296875, -1.259857177734375, -1.20733642578125, -1.154815673828125, -1.102294921875, -1.049774169921875, -0.99725341796875, -0.944732666015625, -0.8922119140625, -0.839691162109375, -0.78717041015625, -0.734649658203125, -0.68212890625, -0.629608154296875, -0.57708740234375, -0.524566650390625, -0.4720458984375, -0.419525146484375, -0.36700439453125, -0.314483642578125, -0.261962890625, -0.209442138671875, -0.15692138671875, -0.104400634765625, -0.0518798828125, 0.000640869140625, 0.05316162109375, 0.105682373046875, 0.158203125, 0.210723876953125, 0.26324462890625, 0.315765380859375, 0.3682861328125, 0.420806884765625, 0.47332763671875, 0.525848388671875, 0.578369140625, 0.630889892578125, 0.68341064453125, 0.735931396484375, 0.7884521484375, 0.840972900390625, 0.89349365234375, 0.946014404296875, 0.99853515625, 1.051055908203125, 1.10357666015625, 1.156097412109375, 1.2086181640625, 1.261138916015625, 1.31365966796875, 1.366180419921875, 1.418701171875, 1.471221923828125, 1.52374267578125, 1.576263427734375, 1.6287841796875, 1.681304931640625, 1.73382568359375, 1.786346435546875, 1.8388671875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 5.0, 12.0, 9.0, 11.0, 21.0, 24.0, 29.0, 62.0, 94.0, 130.0, 205.0, 326.0, 544.0, 952.0, 1785.0, 3436.0, 7031.0, 14621.0, 32495.0, 72687.0, 164995.0, 379036.0, 850934.0, 1282715.0, 772347.0, 340888.0, 147914.0, 64867.0, 29195.0, 13388.0, 6402.0, 3243.0, 1670.0, 861.0, 506.0, 286.0, 196.0, 126.0, 80.0, 47.0, 35.0, 25.0, 18.0, 8.0, 8.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.693359375, -2.615142822265625, -2.53692626953125, -2.458709716796875, -2.3804931640625, -2.302276611328125, -2.22406005859375, -2.145843505859375, -2.067626953125, -1.989410400390625, -1.91119384765625, -1.832977294921875, -1.7547607421875, -1.676544189453125, -1.59832763671875, -1.520111083984375, -1.44189453125, -1.363677978515625, -1.28546142578125, -1.207244873046875, -1.1290283203125, -1.050811767578125, -0.97259521484375, -0.894378662109375, -0.816162109375, -0.737945556640625, -0.65972900390625, -0.581512451171875, -0.5032958984375, -0.425079345703125, -0.34686279296875, -0.268646240234375, -0.1904296875, -0.112213134765625, -0.03399658203125, 0.044219970703125, 0.1224365234375, 0.200653076171875, 0.27886962890625, 0.357086181640625, 0.435302734375, 0.513519287109375, 0.59173583984375, 0.669952392578125, 0.7481689453125, 0.826385498046875, 0.90460205078125, 0.982818603515625, 1.06103515625, 1.139251708984375, 1.21746826171875, 1.295684814453125, 1.3739013671875, 1.452117919921875, 1.53033447265625, 1.608551025390625, 1.686767578125, 1.764984130859375, 1.84320068359375, 1.921417236328125, 1.9996337890625, 2.077850341796875, 2.15606689453125, 2.234283447265625, 2.3125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 7.0, 7.0, 11.0, 15.0, 19.0, 36.0, 61.0, 99.0, 137.0, 202.0, 284.0, 414.0, 538.0, 579.0, 471.0, 371.0, 274.0, 173.0, 140.0, 81.0, 56.0, 38.0, 26.0, 14.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4375, -9.219970703125, -9.00244140625, -8.784912109375, -8.5673828125, -8.349853515625, -8.13232421875, -7.914794921875, -7.697265625, -7.479736328125, -7.26220703125, -7.044677734375, -6.8271484375, -6.609619140625, -6.39208984375, -6.174560546875, -5.95703125, -5.739501953125, -5.52197265625, -5.304443359375, -5.0869140625, -4.869384765625, -4.65185546875, -4.434326171875, -4.216796875, -3.999267578125, -3.78173828125, -3.564208984375, -3.3466796875, -3.129150390625, -2.91162109375, -2.694091796875, -2.4765625, -2.259033203125, -2.04150390625, -1.823974609375, -1.6064453125, -1.388916015625, -1.17138671875, -0.953857421875, -0.736328125, -0.518798828125, -0.30126953125, -0.083740234375, 0.1337890625, 0.351318359375, 0.56884765625, 0.786376953125, 1.00390625, 1.221435546875, 1.43896484375, 1.656494140625, 1.8740234375, 2.091552734375, 2.30908203125, 2.526611328125, 2.744140625, 2.961669921875, 3.17919921875, 3.396728515625, 3.6142578125, 3.831787109375, 4.04931640625, 4.266845703125, 4.484375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 14.0, 28.0, 35.0, 65.0, 114.0, 178.0, 312.0, 633.0, 1579.0, 4872.0, 20391.0, 111309.0, 653333.0, 2231565.0, 960686.0, 169209.0, 29809.0, 6654.0, 1947.0, 714.0, 336.0, 185.0, 116.0, 59.0, 38.0, 32.0, 22.0, 15.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.13671875, -6.86859130859375, -6.6004638671875, -6.33233642578125, -6.064208984375, -5.79608154296875, -5.5279541015625, -5.25982666015625, -4.99169921875, -4.72357177734375, -4.4554443359375, -4.18731689453125, -3.919189453125, -3.65106201171875, -3.3829345703125, -3.11480712890625, -2.8466796875, -2.57855224609375, -2.3104248046875, -2.04229736328125, -1.774169921875, -1.50604248046875, -1.2379150390625, -0.96978759765625, -0.70166015625, -0.43353271484375, -0.1654052734375, 0.10272216796875, 0.370849609375, 0.63897705078125, 0.9071044921875, 1.17523193359375, 1.443359375, 1.71148681640625, 1.9796142578125, 2.24774169921875, 2.515869140625, 2.78399658203125, 3.0521240234375, 3.32025146484375, 3.58837890625, 3.85650634765625, 4.1246337890625, 4.39276123046875, 4.660888671875, 4.92901611328125, 5.1971435546875, 5.46527099609375, 5.7333984375, 6.00152587890625, 6.2696533203125, 6.53778076171875, 6.805908203125, 7.07403564453125, 7.3421630859375, 7.61029052734375, 7.87841796875, 8.14654541015625, 8.4146728515625, 8.68280029296875, 8.950927734375, 9.21905517578125, 9.4871826171875, 9.75531005859375, 10.0234375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 10.0, 30.0, 46.0, 124.0, 171.0, 174.0, 192.0, 156.0, 62.0, 30.0, 16.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.161182403564453, -15.189746856689453, -13.218311309814453, -11.24687671661377, -9.27544116973877, -7.3040056228637695, -5.332571029663086, -3.361135482788086, -1.389699935913086, 0.581735372543335, 2.553170680999756, 4.524605751037598, 6.496041297912598, 8.467476844787598, 10.438911437988281, 12.410346984863281, 14.381782531738281, 16.35321807861328, 18.32465362548828, 20.29608917236328, 22.26752471923828, 24.23896026611328, 26.21039390563965, 28.18182945251465, 30.15326499938965, 32.124698638916016, 34.096134185791016, 36.067569732666016, 38.039005279541016, 40.010440826416016, 41.981876373291016, 43.953311920166016, 45.92474365234375, 47.89617919921875, 49.86761474609375, 51.83905029296875, 53.81048583984375, 55.78192138671875, 57.75335693359375, 59.72479248046875, 61.69622802734375, 63.66766357421875, 65.63909912109375, 67.61053466796875, 69.58197021484375, 71.55340576171875, 73.52484130859375, 75.49627685546875, 77.46771240234375, 79.43914794921875, 81.41058349609375, 83.38201904296875, 85.35345458984375, 87.32489013671875, 89.29632568359375, 91.26776123046875, 93.23918914794922, 95.21062469482422, 97.18206024169922, 99.15349578857422, 101.12493133544922, 103.09636688232422, 105.06780242919922, 107.03923797607422, 109.01067352294922]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 6.0, 10.0, 8.0, 10.0, 14.0, 8.0, 19.0, 19.0, 17.0, 28.0, 20.0, 19.0, 24.0, 37.0, 35.0, 34.0, 31.0, 44.0, 31.0, 39.0, 44.0, 36.0, 41.0, 49.0, 38.0, 38.0, 39.0, 24.0, 24.0, 29.0, 32.0, 21.0, 22.0, 22.0, 13.0, 12.0, 13.0, 6.0, 10.0, 11.0, 6.0, 5.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-20.3746337890625, -19.805919647216797, -19.237205505371094, -18.668493270874023, -18.09977912902832, -17.531064987182617, -16.962352752685547, -16.393638610839844, -15.82492446899414, -15.256210327148438, -14.68749713897705, -14.118783950805664, -13.550069808959961, -12.981355667114258, -12.412642478942871, -11.843929290771484, -11.275215148925781, -10.706501007080078, -10.137787818908691, -9.569074630737305, -9.000360488891602, -8.431646347045898, -7.862933158874512, -7.294219493865967, -6.725505828857422, -6.156792163848877, -5.588078498840332, -5.019364833831787, -4.450651168823242, -3.8819375038146973, -3.3132238388061523, -2.7445101737976074, -2.1757965087890625, -1.6070828437805176, -1.0383691787719727, -0.46965551376342773, 0.09905815124511719, 0.6677718162536621, 1.236485481262207, 1.805199146270752, 2.373912811279297, 2.942626476287842, 3.5113401412963867, 4.080053806304932, 4.648767471313477, 5.2174811363220215, 5.786194801330566, 6.354908466339111, 6.923622131347656, 7.492335796356201, 8.061049461364746, 8.629762649536133, 9.198476791381836, 9.767190933227539, 10.335904121398926, 10.904617309570312, 11.473331451416016, 12.042045593261719, 12.610758781433105, 13.179471969604492, 13.748186111450195, 14.316900253295898, 14.885613441467285, 15.454326629638672, 16.023040771484375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 7.0, 8.0, 9.0, 6.0, 14.0, 16.0, 10.0, 15.0, 23.0, 19.0, 19.0, 25.0, 26.0, 24.0, 34.0, 44.0, 29.0, 34.0, 35.0, 35.0, 35.0, 36.0, 36.0, 35.0, 33.0, 38.0, 30.0, 35.0, 25.0, 31.0, 28.0, 24.0, 21.0, 23.0, 25.0, 12.0, 15.0, 18.0, 7.0, 12.0, 7.0, 10.0, 3.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.685546875, -1.6317291259765625, -1.577911376953125, -1.5240936279296875, -1.47027587890625, -1.4164581298828125, -1.362640380859375, -1.3088226318359375, -1.2550048828125, -1.2011871337890625, -1.147369384765625, -1.0935516357421875, -1.03973388671875, -0.9859161376953125, -0.932098388671875, -0.8782806396484375, -0.824462890625, -0.7706451416015625, -0.716827392578125, -0.6630096435546875, -0.60919189453125, -0.5553741455078125, -0.501556396484375, -0.4477386474609375, -0.3939208984375, -0.3401031494140625, -0.286285400390625, -0.2324676513671875, -0.17864990234375, -0.1248321533203125, -0.071014404296875, -0.0171966552734375, 0.03662109375, 0.0904388427734375, 0.144256591796875, 0.1980743408203125, 0.25189208984375, 0.3057098388671875, 0.359527587890625, 0.4133453369140625, 0.4671630859375, 0.5209808349609375, 0.574798583984375, 0.6286163330078125, 0.68243408203125, 0.7362518310546875, 0.790069580078125, 0.8438873291015625, 0.897705078125, 0.9515228271484375, 1.005340576171875, 1.0591583251953125, 1.11297607421875, 1.1667938232421875, 1.220611572265625, 1.2744293212890625, 1.3282470703125, 1.3820648193359375, 1.435882568359375, 1.4897003173828125, 1.54351806640625, 1.5973358154296875, 1.651153564453125, 1.7049713134765625, 1.7587890625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 13.0, 25.0, 34.0, 45.0, 87.0, 106.0, 138.0, 192.0, 328.0, 449.0, 660.0, 904.0, 1332.0, 1824.0, 2832.0, 4111.0, 6173.0, 8938.0, 13152.0, 19413.0, 28986.0, 43838.0, 71135.0, 125008.0, 298872.0, 172042.0, 88530.0, 53570.0, 34381.0, 22907.0, 15482.0, 10401.0, 7138.0, 4823.0, 3368.0, 2207.0, 1551.0, 1083.0, 759.0, 499.0, 372.0, 231.0, 172.0, 127.0, 87.0, 63.0, 41.0, 41.0, 24.0, 17.0, 9.0, 5.0, 2.0, 5.0, 2.0, 6.0], "bins": [-0.07025146484375, -0.06810379028320312, -0.06595611572265625, -0.06380844116210938, -0.0616607666015625, -0.059513092041015625, -0.05736541748046875, -0.055217742919921875, -0.053070068359375, -0.050922393798828125, -0.04877471923828125, -0.046627044677734375, -0.0444793701171875, -0.042331695556640625, -0.04018402099609375, -0.038036346435546875, -0.035888671875, -0.033740997314453125, -0.03159332275390625, -0.029445648193359375, -0.0272979736328125, -0.025150299072265625, -0.02300262451171875, -0.020854949951171875, -0.018707275390625, -0.016559600830078125, -0.01441192626953125, -0.012264251708984375, -0.0101165771484375, -0.007968902587890625, -0.00582122802734375, -0.003673553466796875, -0.00152587890625, 0.000621795654296875, 0.00276947021484375, 0.004917144775390625, 0.0070648193359375, 0.009212493896484375, 0.01136016845703125, 0.013507843017578125, 0.015655517578125, 0.017803192138671875, 0.01995086669921875, 0.022098541259765625, 0.0242462158203125, 0.026393890380859375, 0.02854156494140625, 0.030689239501953125, 0.0328369140625, 0.034984588623046875, 0.03713226318359375, 0.039279937744140625, 0.0414276123046875, 0.043575286865234375, 0.04572296142578125, 0.047870635986328125, 0.050018310546875, 0.052165985107421875, 0.05431365966796875, 0.056461334228515625, 0.0586090087890625, 0.060756683349609375, 0.06290435791015625, 0.06505203247070312, 0.06719970703125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 2.0, 7.0, 7.0, 8.0, 14.0, 11.0, 11.0, 18.0, 19.0, 22.0, 17.0, 18.0, 27.0, 21.0, 27.0, 26.0, 34.0, 33.0, 37.0, 47.0, 43.0, 1066.0, 51.0, 32.0, 36.0, 31.0, 43.0, 27.0, 34.0, 26.0, 23.0, 33.0, 20.0, 18.0, 17.0, 15.0, 15.0, 13.0, 14.0, 14.0, 9.0, 4.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-1.271484375, -1.232635498046875, -1.19378662109375, -1.154937744140625, -1.1160888671875, -1.077239990234375, -1.03839111328125, -0.999542236328125, -0.960693359375, -0.921844482421875, -0.88299560546875, -0.844146728515625, -0.8052978515625, -0.766448974609375, -0.72760009765625, -0.688751220703125, -0.64990234375, -0.611053466796875, -0.57220458984375, -0.533355712890625, -0.4945068359375, -0.455657958984375, -0.41680908203125, -0.377960205078125, -0.339111328125, -0.300262451171875, -0.26141357421875, -0.222564697265625, -0.1837158203125, -0.144866943359375, -0.10601806640625, -0.067169189453125, -0.0283203125, 0.010528564453125, 0.04937744140625, 0.088226318359375, 0.1270751953125, 0.165924072265625, 0.20477294921875, 0.243621826171875, 0.282470703125, 0.321319580078125, 0.36016845703125, 0.399017333984375, 0.4378662109375, 0.476715087890625, 0.51556396484375, 0.554412841796875, 0.59326171875, 0.632110595703125, 0.67095947265625, 0.709808349609375, 0.7486572265625, 0.787506103515625, 0.82635498046875, 0.865203857421875, 0.904052734375, 0.942901611328125, 0.98175048828125, 1.020599365234375, 1.0594482421875, 1.098297119140625, 1.13714599609375, 1.175994873046875, 1.21484375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 8.0, 12.0, 12.0, 33.0, 41.0, 61.0, 95.0, 117.0, 174.0, 239.0, 375.0, 519.0, 729.0, 1049.0, 1428.0, 2022.0, 2994.0, 4170.0, 5702.0, 8087.0, 11346.0, 16262.0, 23434.0, 34496.0, 53662.0, 87596.0, 168414.0, 1343804.0, 121226.0, 69158.0, 43926.0, 28786.0, 19636.0, 13880.0, 9726.0, 7000.0, 4979.0, 3379.0, 2558.0, 1732.0, 1295.0, 889.0, 649.0, 433.0, 327.0, 192.0, 152.0, 106.0, 75.0, 56.0, 33.0, 25.0, 13.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.03497314453125, -0.03385496139526367, -0.032736778259277344, -0.031618595123291016, -0.030500411987304688, -0.02938222885131836, -0.02826404571533203, -0.027145862579345703, -0.026027679443359375, -0.024909496307373047, -0.02379131317138672, -0.02267313003540039, -0.021554946899414062, -0.020436763763427734, -0.019318580627441406, -0.018200397491455078, -0.01708221435546875, -0.015964031219482422, -0.014845848083496094, -0.013727664947509766, -0.012609481811523438, -0.01149129867553711, -0.010373115539550781, -0.009254932403564453, -0.008136749267578125, -0.007018566131591797, -0.005900382995605469, -0.004782199859619141, -0.0036640167236328125, -0.0025458335876464844, -0.0014276504516601562, -0.0003094673156738281, 0.0008087158203125, 0.0019268989562988281, 0.0030450820922851562, 0.004163265228271484, 0.0052814483642578125, 0.006399631500244141, 0.007517814636230469, 0.008635997772216797, 0.009754180908203125, 0.010872364044189453, 0.011990547180175781, 0.01310873031616211, 0.014226913452148438, 0.015345096588134766, 0.016463279724121094, 0.017581462860107422, 0.01869964599609375, 0.019817829132080078, 0.020936012268066406, 0.022054195404052734, 0.023172378540039062, 0.02429056167602539, 0.02540874481201172, 0.026526927947998047, 0.027645111083984375, 0.028763294219970703, 0.02988147735595703, 0.03099966049194336, 0.03211784362792969, 0.033236026763916016, 0.034354209899902344, 0.03547239303588867, 0.036590576171875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 11.0, 0.0, 13.0, 0.0, 18.0, 0.0, 21.0, 0.0, 39.0, 0.0, 51.0, 0.0, 79.0, 0.0, 497.0, 0.0, 96.0, 63.0, 0.0, 43.0, 0.0, 26.0, 0.0, 18.0, 0.0, 9.0, 0.0, 7.0, 0.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.5367431640625e-07, -9.220093488693237e-07, -8.903443813323975e-07, -8.586794137954712e-07, -8.270144462585449e-07, -7.953494787216187e-07, -7.636845111846924e-07, -7.320195436477661e-07, -7.003545761108398e-07, -6.686896085739136e-07, -6.370246410369873e-07, -6.05359673500061e-07, -5.736947059631348e-07, -5.420297384262085e-07, -5.103647708892822e-07, -4.78699803352356e-07, -4.470348358154297e-07, -4.153698682785034e-07, -3.8370490074157715e-07, -3.520399332046509e-07, -3.203749656677246e-07, -2.8870999813079834e-07, -2.5704503059387207e-07, -2.253800630569458e-07, -1.9371509552001953e-07, -1.6205012798309326e-07, -1.30385160446167e-07, -9.872019290924072e-08, -6.705522537231445e-08, -3.5390257835388184e-08, -3.725290298461914e-09, 2.7939677238464355e-08, 5.960464477539063e-08, 9.12696123123169e-08, 1.2293457984924316e-07, 1.5459954738616943e-07, 1.862645149230957e-07, 2.1792948246002197e-07, 2.4959444999694824e-07, 2.812594175338745e-07, 3.129243850708008e-07, 3.4458935260772705e-07, 3.762543201446533e-07, 4.079192876815796e-07, 4.3958425521850586e-07, 4.7124922275543213e-07, 5.029141902923584e-07, 5.345791578292847e-07, 5.662441253662109e-07, 5.979090929031372e-07, 6.295740604400635e-07, 6.612390279769897e-07, 6.92903995513916e-07, 7.245689630508423e-07, 7.562339305877686e-07, 7.878988981246948e-07, 8.195638656616211e-07, 8.512288331985474e-07, 8.828938007354736e-07, 9.145587682723999e-07, 9.462237358093262e-07, 9.778887033462524e-07, 1.0095536708831787e-06, 1.041218638420105e-06, 1.0728836059570312e-06]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 10.0, 6.0, 3.0, 14.0, 7.0, 23.0, 22.0, 54.0, 93.0, 125.0, 238.0, 1810.0, 26416.0, 928662.0, 85400.0, 4858.0, 397.0, 135.0, 66.0, 52.0, 27.0, 35.0, 18.0, 16.0, 16.0, 9.0, 9.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.704692840576172e-05, -1.6555190086364746e-05, -1.6063451766967773e-05, -1.55717134475708e-05, -1.5079975128173828e-05, -1.4588236808776855e-05, -1.4096498489379883e-05, -1.360476016998291e-05, -1.3113021850585938e-05, -1.2621283531188965e-05, -1.2129545211791992e-05, -1.163780689239502e-05, -1.1146068572998047e-05, -1.0654330253601074e-05, -1.0162591934204102e-05, -9.670853614807129e-06, -9.179115295410156e-06, -8.687376976013184e-06, -8.195638656616211e-06, -7.703900337219238e-06, -7.212162017822266e-06, -6.720423698425293e-06, -6.22868537902832e-06, -5.736947059631348e-06, -5.245208740234375e-06, -4.753470420837402e-06, -4.26173210144043e-06, -3.769993782043457e-06, -3.2782554626464844e-06, -2.7865171432495117e-06, -2.294778823852539e-06, -1.8030405044555664e-06, -1.3113021850585938e-06, -8.195638656616211e-07, -3.2782554626464844e-07, 1.6391277313232422e-07, 6.556510925292969e-07, 1.1473894119262695e-06, 1.6391277313232422e-06, 2.130866050720215e-06, 2.6226043701171875e-06, 3.11434268951416e-06, 3.606081008911133e-06, 4.0978193283081055e-06, 4.589557647705078e-06, 5.081295967102051e-06, 5.5730342864990234e-06, 6.064772605895996e-06, 6.556510925292969e-06, 7.048249244689941e-06, 7.539987564086914e-06, 8.031725883483887e-06, 8.52346420288086e-06, 9.015202522277832e-06, 9.506940841674805e-06, 9.998679161071777e-06, 1.049041748046875e-05, 1.0982155799865723e-05, 1.1473894119262695e-05, 1.1965632438659668e-05, 1.245737075805664e-05, 1.2949109077453613e-05, 1.3440847396850586e-05, 1.3932585716247559e-05, 1.4424324035644531e-05]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 9.0, 8.0, 22.0, 19.0, 29.0, 29.0, 37.0, 645.0, 38.0, 36.0, 33.0, 27.0, 22.0, 11.0, 9.0, 12.0, 5.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.801639642617374e-07, -6.659624887106474e-07, -6.517609563161386e-07, -6.375594807650486e-07, -6.233580052139587e-07, -6.091564728194498e-07, -5.949549972683599e-07, -5.807535217172699e-07, -5.665519893227611e-07, -5.523505137716711e-07, -5.381489813771623e-07, -5.239475058260723e-07, -5.097460302749823e-07, -4.955445547238924e-07, -4.813430223293835e-07, -4.6714154677829356e-07, -4.529400712272036e-07, -4.387385672544042e-07, -4.245370917033142e-07, -4.103355877305148e-07, -3.9613411217942485e-07, -3.8193260820662545e-07, -3.6773110423382604e-07, -3.535296286827361e-07, -3.393281247099367e-07, -3.2512662073713727e-07, -3.109251451860473e-07, -2.967236412132479e-07, -2.825221372404485e-07, -2.6832066168935853e-07, -2.5411915771655913e-07, -2.3991765374375973e-07, -2.2571616398181504e-07, -2.1151467421987036e-07, -1.9731317024707096e-07, -1.8311168048512627e-07, -1.6891019072318159e-07, -1.547087009612369e-07, -1.4050721119929221e-07, -1.2630570722649281e-07, -1.1210421746454813e-07, -9.790272770260344e-08, -8.37012308352314e-08, -6.949973396785936e-08, -5.529824420591467e-08, -4.1096754443969985e-08, -2.6895257576597942e-08, -1.2693760709225899e-08, 1.507729052718787e-09, 1.570922236737715e-08, 2.9910715682035516e-08, 4.411220899669388e-08, 5.8313702311352245e-08, 7.251519207329693e-08, 8.671668894066897e-08, 1.0091818580804102e-07, 1.151196755699857e-07, 1.293211653319304e-07, 1.435226693047298e-07, 1.5772415906667447e-07, 1.7192564882861916e-07, 1.8612713859056385e-07, 2.0032862835250853e-07, 2.1453013232530793e-07, 2.2873162208725262e-07]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 35.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 143.0, 0.0, 0.0, 0.0, 0.0, 0.0, 651.0, 0.0, 0.0, 0.0, 0.0, 0.0, 139.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4831464290618896e-07, -3.390014171600342e-07, -3.296881914138794e-07, -3.203749656677246e-07, -3.110617399215698e-07, -3.0174851417541504e-07, -2.9243528842926025e-07, -2.8312206268310547e-07, -2.738088369369507e-07, -2.644956111907959e-07, -2.551823854446411e-07, -2.4586915969848633e-07, -2.3655593395233154e-07, -2.2724270820617676e-07, -2.1792948246002197e-07, -2.086162567138672e-07, -1.993030309677124e-07, -1.8998980522155762e-07, -1.8067657947540283e-07, -1.7136335372924805e-07, -1.6205012798309326e-07, -1.5273690223693848e-07, -1.434236764907837e-07, -1.341104507446289e-07, -1.2479722499847412e-07, -1.1548399925231934e-07, -1.0617077350616455e-07, -9.685754776000977e-08, -8.754432201385498e-08, -7.82310962677002e-08, -6.891787052154541e-08, -5.960464477539063e-08, -5.029141902923584e-08, -4.0978193283081055e-08, -3.166496753692627e-08, -2.2351741790771484e-08, -1.30385160446167e-08, -3.725290298461914e-09, 5.587935447692871e-09, 1.4901161193847656e-08, 2.421438694000244e-08, 3.3527612686157227e-08, 4.284083843231201e-08, 5.21540641784668e-08, 6.146728992462158e-08, 7.078051567077637e-08, 8.009374141693115e-08, 8.940696716308594e-08, 9.872019290924072e-08, 1.0803341865539551e-07, 1.1734664440155029e-07, 1.2665987014770508e-07, 1.3597309589385986e-07, 1.4528632164001465e-07, 1.5459954738616943e-07, 1.6391277313232422e-07, 1.73225998878479e-07, 1.825392246246338e-07, 1.9185245037078857e-07, 2.0116567611694336e-07, 2.1047890186309814e-07, 2.1979212760925293e-07, 2.2910535335540771e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 7.0, 8.0, 9.0, 6.0, 14.0, 16.0, 10.0, 15.0, 23.0, 19.0, 19.0, 25.0, 26.0, 24.0, 34.0, 44.0, 29.0, 34.0, 35.0, 35.0, 35.0, 36.0, 36.0, 35.0, 33.0, 38.0, 30.0, 35.0, 25.0, 31.0, 28.0, 24.0, 21.0, 23.0, 25.0, 12.0, 15.0, 18.0, 7.0, 12.0, 7.0, 10.0, 3.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.685546875, -1.6317291259765625, -1.577911376953125, -1.5240936279296875, -1.47027587890625, -1.4164581298828125, -1.362640380859375, -1.3088226318359375, -1.2550048828125, -1.2011871337890625, -1.147369384765625, -1.0935516357421875, -1.03973388671875, -0.9859161376953125, -0.932098388671875, -0.8782806396484375, -0.824462890625, -0.7706451416015625, -0.716827392578125, -0.6630096435546875, -0.60919189453125, -0.5553741455078125, -0.501556396484375, -0.4477386474609375, -0.3939208984375, -0.3401031494140625, -0.286285400390625, -0.2324676513671875, -0.17864990234375, -0.1248321533203125, -0.071014404296875, -0.0171966552734375, 0.03662109375, 0.0904388427734375, 0.144256591796875, 0.1980743408203125, 0.25189208984375, 0.3057098388671875, 0.359527587890625, 0.4133453369140625, 0.4671630859375, 0.5209808349609375, 0.574798583984375, 0.6286163330078125, 0.68243408203125, 0.7362518310546875, 0.790069580078125, 0.8438873291015625, 0.897705078125, 0.9515228271484375, 1.005340576171875, 1.0591583251953125, 1.11297607421875, 1.1667938232421875, 1.220611572265625, 1.2744293212890625, 1.3282470703125, 1.3820648193359375, 1.435882568359375, 1.4897003173828125, 1.54351806640625, 1.5973358154296875, 1.651153564453125, 1.7049713134765625, 1.7587890625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 11.0, 6.0, 20.0, 29.0, 34.0, 54.0, 69.0, 130.0, 168.0, 279.0, 396.0, 646.0, 1080.0, 1540.0, 2288.0, 3517.0, 5708.0, 8925.0, 14612.0, 25808.0, 52119.0, 123215.0, 268916.0, 281640.0, 133187.0, 56087.0, 27093.0, 15150.0, 9197.0, 5854.0, 3706.0, 2451.0, 1616.0, 999.0, 690.0, 436.0, 285.0, 208.0, 129.0, 88.0, 55.0, 36.0, 19.0, 22.0, 10.0, 17.0, 5.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.501953125, -2.421356201171875, -2.34075927734375, -2.260162353515625, -2.1795654296875, -2.098968505859375, -2.01837158203125, -1.937774658203125, -1.857177734375, -1.776580810546875, -1.69598388671875, -1.615386962890625, -1.5347900390625, -1.454193115234375, -1.37359619140625, -1.292999267578125, -1.21240234375, -1.131805419921875, -1.05120849609375, -0.970611572265625, -0.8900146484375, -0.809417724609375, -0.72882080078125, -0.648223876953125, -0.567626953125, -0.487030029296875, -0.40643310546875, -0.325836181640625, -0.2452392578125, -0.164642333984375, -0.08404541015625, -0.003448486328125, 0.0771484375, 0.157745361328125, 0.23834228515625, 0.318939208984375, 0.3995361328125, 0.480133056640625, 0.56072998046875, 0.641326904296875, 0.721923828125, 0.802520751953125, 0.88311767578125, 0.963714599609375, 1.0443115234375, 1.124908447265625, 1.20550537109375, 1.286102294921875, 1.36669921875, 1.447296142578125, 1.52789306640625, 1.608489990234375, 1.6890869140625, 1.769683837890625, 1.85028076171875, 1.930877685546875, 2.011474609375, 2.092071533203125, 2.17266845703125, 2.253265380859375, 2.3338623046875, 2.414459228515625, 2.49505615234375, 2.575653076171875, 2.65625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 7.0, 8.0, 7.0, 11.0, 18.0, 16.0, 20.0, 25.0, 25.0, 29.0, 38.0, 32.0, 61.0, 57.0, 79.0, 112.0, 178.0, 1358.0, 289.0, 146.0, 95.0, 74.0, 54.0, 50.0, 38.0, 42.0, 36.0, 24.0, 16.0, 14.0, 15.0, 16.0, 9.0, 8.0, 10.0, 8.0, 4.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.6484375, -7.42242431640625, -7.1964111328125, -6.97039794921875, -6.744384765625, -6.51837158203125, -6.2923583984375, -6.06634521484375, -5.84033203125, -5.61431884765625, -5.3883056640625, -5.16229248046875, -4.936279296875, -4.71026611328125, -4.4842529296875, -4.25823974609375, -4.0322265625, -3.80621337890625, -3.5802001953125, -3.35418701171875, -3.128173828125, -2.90216064453125, -2.6761474609375, -2.45013427734375, -2.22412109375, -1.99810791015625, -1.7720947265625, -1.54608154296875, -1.320068359375, -1.09405517578125, -0.8680419921875, -0.64202880859375, -0.416015625, -0.19000244140625, 0.0360107421875, 0.26202392578125, 0.488037109375, 0.71405029296875, 0.9400634765625, 1.16607666015625, 1.39208984375, 1.61810302734375, 1.8441162109375, 2.07012939453125, 2.296142578125, 2.52215576171875, 2.7481689453125, 2.97418212890625, 3.2001953125, 3.42620849609375, 3.6522216796875, 3.87823486328125, 4.104248046875, 4.33026123046875, 4.5562744140625, 4.78228759765625, 5.00830078125, 5.23431396484375, 5.4603271484375, 5.68634033203125, 5.912353515625, 6.13836669921875, 6.3643798828125, 6.59039306640625, 6.81640625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 10.0, 14.0, 14.0, 18.0, 14.0, 19.0, 31.0, 47.0, 64.0, 84.0, 133.0, 221.0, 356.0, 959.0, 4322.0, 30467.0, 716660.0, 2314853.0, 67022.0, 7705.0, 1476.0, 460.0, 230.0, 147.0, 105.0, 66.0, 49.0, 25.0, 25.0, 23.0, 15.0, 15.0, 7.0, 10.0, 7.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5390625, -12.123291015625, -11.70751953125, -11.291748046875, -10.8759765625, -10.460205078125, -10.04443359375, -9.628662109375, -9.212890625, -8.797119140625, -8.38134765625, -7.965576171875, -7.5498046875, -7.134033203125, -6.71826171875, -6.302490234375, -5.88671875, -5.470947265625, -5.05517578125, -4.639404296875, -4.2236328125, -3.807861328125, -3.39208984375, -2.976318359375, -2.560546875, -2.144775390625, -1.72900390625, -1.313232421875, -0.8974609375, -0.481689453125, -0.06591796875, 0.349853515625, 0.765625, 1.181396484375, 1.59716796875, 2.012939453125, 2.4287109375, 2.844482421875, 3.26025390625, 3.676025390625, 4.091796875, 4.507568359375, 4.92333984375, 5.339111328125, 5.7548828125, 6.170654296875, 6.58642578125, 7.002197265625, 7.41796875, 7.833740234375, 8.24951171875, 8.665283203125, 9.0810546875, 9.496826171875, 9.91259765625, 10.328369140625, 10.744140625, 11.159912109375, 11.57568359375, 11.991455078125, 12.4072265625, 12.822998046875, 13.23876953125, 13.654541015625, 14.0703125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 20.0, 67.0, 150.0, 261.0, 254.0, 166.0, 70.0, 14.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-78.20335388183594, -76.7536849975586, -75.30401611328125, -73.8543472290039, -72.40467834472656, -70.95500183105469, -69.50533294677734, -68.0556640625, -66.60599517822266, -65.15632629394531, -63.70665740966797, -62.25698471069336, -60.807315826416016, -59.35764694213867, -57.90797424316406, -56.45830535888672, -55.008636474609375, -53.55896759033203, -52.10929870605469, -50.65962600708008, -49.209957122802734, -47.76028823852539, -46.31061553955078, -44.86094665527344, -43.411277770996094, -41.96160888671875, -40.511940002441406, -39.0622673034668, -37.61259841918945, -36.16292953491211, -34.7132568359375, -33.263587951660156, -31.813915252685547, -30.364246368408203, -28.914575576782227, -27.46490478515625, -26.015235900878906, -24.565567016601562, -23.115896224975586, -21.66622543334961, -20.216556549072266, -18.766887664794922, -17.317216873168945, -15.867547035217285, -14.417877197265625, -12.968207359313965, -11.518537521362305, -10.068867683410645, -8.619197845458984, -7.169528007507324, -5.719858169555664, -4.270188331604004, -2.8205184936523438, -1.3708486557006836, 0.07882118225097656, 1.5284910202026367, 2.978160858154297, 4.427830696105957, 5.877500534057617, 7.327170372009277, 8.776840209960938, 10.226510047912598, 11.676179885864258, 13.125849723815918, 14.575519561767578]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 7.0, 5.0, 7.0, 13.0, 15.0, 10.0, 16.0, 30.0, 13.0, 14.0, 26.0, 32.0, 26.0, 26.0, 34.0, 28.0, 33.0, 45.0, 41.0, 41.0, 33.0, 39.0, 39.0, 41.0, 38.0, 35.0, 45.0, 45.0, 26.0, 36.0, 30.0, 23.0, 17.0, 21.0, 10.0, 11.0, 5.0, 4.0, 10.0, 4.0, 11.0, 6.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.197187423706055, -16.65139389038086, -16.10559844970703, -15.559804916381836, -15.01401138305664, -14.468217849731445, -13.922423362731934, -13.376628875732422, -12.830835342407227, -12.285041809082031, -11.73924732208252, -11.193452835083008, -10.647659301757812, -10.101865768432617, -9.556071281433105, -9.010276794433594, -8.464483261108398, -7.918689250946045, -7.372895240783691, -6.827101230621338, -6.281307220458984, -5.735513210296631, -5.189719200134277, -4.643925189971924, -4.09813117980957, -3.552337169647217, -3.0065431594848633, -2.4607491493225098, -1.9149551391601562, -1.3691611289978027, -0.8233671188354492, -0.2775731086730957, 0.2682209014892578, 0.8140149116516113, 1.3598089218139648, 1.9056029319763184, 2.451396942138672, 2.9971909523010254, 3.542984962463379, 4.088778972625732, 4.634572982788086, 5.1803669929504395, 5.726161003112793, 6.2719550132751465, 6.8177490234375, 7.3635430335998535, 7.909337043762207, 8.455131530761719, 9.000925064086914, 9.54671859741211, 10.092513084411621, 10.638307571411133, 11.184101104736328, 11.729894638061523, 12.275689125061035, 12.821483612060547, 13.367277145385742, 13.913070678710938, 14.45886516571045, 15.004659652709961, 15.550453186035156, 16.09624671936035, 16.642040252685547, 17.187835693359375, 17.73362922668457]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 6.0, 5.0, 7.0, 8.0, 9.0, 10.0, 5.0, 17.0, 13.0, 14.0, 17.0, 16.0, 19.0, 29.0, 20.0, 29.0, 31.0, 32.0, 36.0, 31.0, 36.0, 32.0, 28.0, 42.0, 41.0, 33.0, 35.0, 32.0, 31.0, 36.0, 35.0, 28.0, 21.0, 31.0, 35.0, 24.0, 16.0, 17.0, 7.0, 20.0, 11.0, 10.0, 13.0, 11.0, 8.0, 4.0, 7.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.8583984375, -1.802276611328125, -1.74615478515625, -1.690032958984375, -1.6339111328125, -1.577789306640625, -1.52166748046875, -1.465545654296875, -1.409423828125, -1.353302001953125, -1.29718017578125, -1.241058349609375, -1.1849365234375, -1.128814697265625, -1.07269287109375, -1.016571044921875, -0.96044921875, -0.904327392578125, -0.84820556640625, -0.792083740234375, -0.7359619140625, -0.679840087890625, -0.62371826171875, -0.567596435546875, -0.511474609375, -0.455352783203125, -0.39923095703125, -0.343109130859375, -0.2869873046875, -0.230865478515625, -0.17474365234375, -0.118621826171875, -0.0625, -0.006378173828125, 0.04974365234375, 0.105865478515625, 0.1619873046875, 0.218109130859375, 0.27423095703125, 0.330352783203125, 0.386474609375, 0.442596435546875, 0.49871826171875, 0.554840087890625, 0.6109619140625, 0.667083740234375, 0.72320556640625, 0.779327392578125, 0.83544921875, 0.891571044921875, 0.94769287109375, 1.003814697265625, 1.0599365234375, 1.116058349609375, 1.17218017578125, 1.228302001953125, 1.284423828125, 1.340545654296875, 1.39666748046875, 1.452789306640625, 1.5089111328125, 1.565032958984375, 1.62115478515625, 1.677276611328125, 1.7333984375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 8.0, 10.0, 15.0, 7.0, 16.0, 14.0, 15.0, 24.0, 29.0, 54.0, 68.0, 85.0, 166.0, 280.0, 517.0, 1137.0, 3217.0, 10713.0, 40671.0, 167915.0, 708375.0, 1974642.0, 975722.0, 233447.0, 55778.0, 14308.0, 4163.0, 1422.0, 605.0, 282.0, 196.0, 100.0, 76.0, 48.0, 35.0, 34.0, 16.0, 17.0, 13.0, 13.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.04296875, -4.89727783203125, -4.7515869140625, -4.60589599609375, -4.460205078125, -4.31451416015625, -4.1688232421875, -4.02313232421875, -3.87744140625, -3.73175048828125, -3.5860595703125, -3.44036865234375, -3.294677734375, -3.14898681640625, -3.0032958984375, -2.85760498046875, -2.7119140625, -2.56622314453125, -2.4205322265625, -2.27484130859375, -2.129150390625, -1.98345947265625, -1.8377685546875, -1.69207763671875, -1.54638671875, -1.40069580078125, -1.2550048828125, -1.10931396484375, -0.963623046875, -0.81793212890625, -0.6722412109375, -0.52655029296875, -0.380859375, -0.23516845703125, -0.0894775390625, 0.05621337890625, 0.201904296875, 0.34759521484375, 0.4932861328125, 0.63897705078125, 0.78466796875, 0.93035888671875, 1.0760498046875, 1.22174072265625, 1.367431640625, 1.51312255859375, 1.6588134765625, 1.80450439453125, 1.9501953125, 2.09588623046875, 2.2415771484375, 2.38726806640625, 2.532958984375, 2.67864990234375, 2.8243408203125, 2.97003173828125, 3.11572265625, 3.26141357421875, 3.4071044921875, 3.55279541015625, 3.698486328125, 3.84417724609375, 3.9898681640625, 4.13555908203125, 4.28125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 10.0, 7.0, 18.0, 26.0, 36.0, 35.0, 61.0, 99.0, 170.0, 221.0, 292.0, 385.0, 490.0, 546.0, 447.0, 353.0, 265.0, 175.0, 152.0, 75.0, 72.0, 44.0, 31.0, 25.0, 14.0, 6.0, 9.0, 3.0, 1.0, 5.0, 5.0, 2.0, 1.0, 3.0], "bins": [-9.3515625, -9.135986328125, -8.92041015625, -8.704833984375, -8.4892578125, -8.273681640625, -8.05810546875, -7.842529296875, -7.626953125, -7.411376953125, -7.19580078125, -6.980224609375, -6.7646484375, -6.549072265625, -6.33349609375, -6.117919921875, -5.90234375, -5.686767578125, -5.47119140625, -5.255615234375, -5.0400390625, -4.824462890625, -4.60888671875, -4.393310546875, -4.177734375, -3.962158203125, -3.74658203125, -3.531005859375, -3.3154296875, -3.099853515625, -2.88427734375, -2.668701171875, -2.453125, -2.237548828125, -2.02197265625, -1.806396484375, -1.5908203125, -1.375244140625, -1.15966796875, -0.944091796875, -0.728515625, -0.512939453125, -0.29736328125, -0.081787109375, 0.1337890625, 0.349365234375, 0.56494140625, 0.780517578125, 0.99609375, 1.211669921875, 1.42724609375, 1.642822265625, 1.8583984375, 2.073974609375, 2.28955078125, 2.505126953125, 2.720703125, 2.936279296875, 3.15185546875, 3.367431640625, 3.5830078125, 3.798583984375, 4.01416015625, 4.229736328125, 4.4453125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 6.0, 6.0, 2.0, 3.0, 8.0, 12.0, 24.0, 38.0, 42.0, 74.0, 148.0, 291.0, 568.0, 2380.0, 25047.0, 719506.0, 3206773.0, 226929.0, 10115.0, 1422.0, 422.0, 200.0, 105.0, 62.0, 47.0, 31.0, 13.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4765625, -9.9346923828125, -9.392822265625, -8.8509521484375, -8.30908203125, -7.7672119140625, -7.225341796875, -6.6834716796875, -6.1416015625, -5.5997314453125, -5.057861328125, -4.5159912109375, -3.97412109375, -3.4322509765625, -2.890380859375, -2.3485107421875, -1.806640625, -1.2647705078125, -0.722900390625, -0.1810302734375, 0.36083984375, 0.9027099609375, 1.444580078125, 1.9864501953125, 2.5283203125, 3.0701904296875, 3.612060546875, 4.1539306640625, 4.69580078125, 5.2376708984375, 5.779541015625, 6.3214111328125, 6.86328125, 7.4051513671875, 7.947021484375, 8.4888916015625, 9.03076171875, 9.5726318359375, 10.114501953125, 10.6563720703125, 11.1982421875, 11.7401123046875, 12.281982421875, 12.8238525390625, 13.36572265625, 13.9075927734375, 14.449462890625, 14.9913330078125, 15.533203125, 16.0750732421875, 16.616943359375, 17.1588134765625, 17.70068359375, 18.2425537109375, 18.784423828125, 19.3262939453125, 19.8681640625, 20.4100341796875, 20.951904296875, 21.4937744140625, 22.03564453125, 22.5775146484375, 23.119384765625, 23.6612548828125, 24.203125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 13.0, 15.0, 29.0, 49.0, 63.0, 68.0, 96.0, 87.0, 117.0, 108.0, 96.0, 86.0, 67.0, 45.0, 35.0, 13.0, 7.0, 4.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.028179168701172, -24.881858825683594, -23.735536575317383, -22.589214324951172, -21.442893981933594, -20.296573638916016, -19.150251388549805, -18.003929138183594, -16.857608795166016, -15.711287498474121, -14.564966201782227, -13.418644905090332, -12.272323608398438, -11.126002311706543, -9.979681015014648, -8.833359718322754, -7.687038421630859, -6.540717124938965, -5.39439582824707, -4.248074531555176, -3.1017532348632812, -1.9554319381713867, -0.8091106414794922, 0.33721065521240234, 1.4835319519042969, 2.6298532485961914, 3.776174545288086, 4.9224958419799805, 6.068817138671875, 7.2151384353637695, 8.361459732055664, 9.507781028747559, 10.654098510742188, 11.800419807434082, 12.946741104125977, 14.093062400817871, 15.239383697509766, 16.385704040527344, 17.532026290893555, 18.678348541259766, 19.824668884277344, 20.970989227294922, 22.117311477661133, 23.263633728027344, 24.409954071044922, 25.5562744140625, 26.70259666442871, 27.848918914794922, 28.9952392578125, 30.141559600830078, 31.28788185119629, 32.4342041015625, 33.58052444458008, 34.726844787597656, 35.8731689453125, 37.01948928833008, 38.165809631347656, 39.312129974365234, 40.45845031738281, 41.604774475097656, 42.751094818115234, 43.89741516113281, 45.043739318847656, 46.190059661865234, 47.33638000488281]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 6.0, 12.0, 10.0, 13.0, 18.0, 20.0, 14.0, 21.0, 18.0, 23.0, 28.0, 34.0, 26.0, 33.0, 42.0, 34.0, 36.0, 32.0, 52.0, 42.0, 49.0, 44.0, 39.0, 49.0, 32.0, 33.0, 23.0, 25.0, 26.0, 24.0, 27.0, 13.0, 13.0, 18.0, 18.0, 14.0, 9.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-21.775001525878906, -21.15688705444336, -20.538774490356445, -19.9206600189209, -19.302547454833984, -18.684432983398438, -18.066320419311523, -17.448205947875977, -16.830093383789062, -16.211978912353516, -15.593866348266602, -14.975752830505371, -14.35763931274414, -13.739524841308594, -13.121411323547363, -12.503297805786133, -11.885183334350586, -11.267069816589355, -10.648956298828125, -10.030842781066895, -9.412729263305664, -8.794614791870117, -8.176501274108887, -7.558387756347656, -6.940274238586426, -6.322160720825195, -5.704047203063965, -5.085933208465576, -4.467819690704346, -3.8497061729431152, -3.2315924167633057, -2.613478660583496, -1.9953651428222656, -1.3772515058517456, -0.7591378688812256, -0.14102423191070557, 0.47708940505981445, 1.095202922821045, 1.7133166790008545, 2.331430435180664, 2.9495439529418945, 3.567657470703125, 4.1857709884643555, 4.803884983062744, 5.421998500823975, 6.040112018585205, 6.658226013183594, 7.276339530944824, 7.894453048706055, 8.512566566467285, 9.130680084228516, 9.748793601989746, 10.366907119750977, 10.985021591186523, 11.603135108947754, 12.221248626708984, 12.839362144470215, 13.457475662231445, 14.075589179992676, 14.693702697753906, 15.311817169189453, 15.929929733276367, 16.548044204711914, 17.166156768798828, 17.784271240234375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 11.0, 8.0, 10.0, 8.0, 8.0, 14.0, 15.0, 11.0, 18.0, 24.0, 29.0, 21.0, 31.0, 25.0, 29.0, 26.0, 31.0, 40.0, 33.0, 39.0, 32.0, 36.0, 36.0, 37.0, 39.0, 35.0, 42.0, 24.0, 33.0, 41.0, 27.0, 22.0, 21.0, 18.0, 22.0, 16.0, 13.0, 13.0, 12.0, 9.0, 6.0, 4.0, 8.0, 9.0, 4.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.8173828125, -1.7596282958984375, -1.701873779296875, -1.6441192626953125, -1.58636474609375, -1.5286102294921875, -1.470855712890625, -1.4131011962890625, -1.3553466796875, -1.2975921630859375, -1.239837646484375, -1.1820831298828125, -1.12432861328125, -1.0665740966796875, -1.008819580078125, -0.9510650634765625, -0.893310546875, -0.8355560302734375, -0.777801513671875, -0.7200469970703125, -0.66229248046875, -0.6045379638671875, -0.546783447265625, -0.4890289306640625, -0.4312744140625, -0.3735198974609375, -0.315765380859375, -0.2580108642578125, -0.20025634765625, -0.1425018310546875, -0.084747314453125, -0.0269927978515625, 0.03076171875, 0.0885162353515625, 0.146270751953125, 0.2040252685546875, 0.26177978515625, 0.3195343017578125, 0.377288818359375, 0.4350433349609375, 0.4927978515625, 0.5505523681640625, 0.608306884765625, 0.6660614013671875, 0.72381591796875, 0.7815704345703125, 0.839324951171875, 0.8970794677734375, 0.954833984375, 1.0125885009765625, 1.070343017578125, 1.1280975341796875, 1.18585205078125, 1.2436065673828125, 1.301361083984375, 1.3591156005859375, 1.4168701171875, 1.4746246337890625, 1.532379150390625, 1.5901336669921875, 1.64788818359375, 1.7056427001953125, 1.763397216796875, 1.8211517333984375, 1.87890625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 8.0, 8.0, 11.0, 14.0, 14.0, 28.0, 53.0, 75.0, 115.0, 183.0, 230.0, 290.0, 490.0, 725.0, 1103.0, 1463.0, 2072.0, 3017.0, 4341.0, 6356.0, 9373.0, 13587.0, 20342.0, 30490.0, 47931.0, 77663.0, 143831.0, 313786.0, 147528.0, 78888.0, 48554.0, 31030.0, 20913.0, 13800.0, 9374.0, 6422.0, 4530.0, 2986.0, 2124.0, 1481.0, 1074.0, 722.0, 473.0, 344.0, 247.0, 145.0, 129.0, 62.0, 44.0, 36.0, 25.0, 15.0, 6.0, 10.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.07568359375, -0.07328224182128906, -0.07088088989257812, -0.06847953796386719, -0.06607818603515625, -0.06367683410644531, -0.061275482177734375, -0.05887413024902344, -0.0564727783203125, -0.05407142639160156, -0.051670074462890625, -0.04926872253417969, -0.04686737060546875, -0.04446601867675781, -0.042064666748046875, -0.03966331481933594, -0.037261962890625, -0.03486061096191406, -0.032459259033203125, -0.030057907104492188, -0.02765655517578125, -0.025255203247070312, -0.022853851318359375, -0.020452499389648438, -0.0180511474609375, -0.015649795532226562, -0.013248443603515625, -0.010847091674804688, -0.00844573974609375, -0.0060443878173828125, -0.003643035888671875, -0.0012416839599609375, 0.00115966796875, 0.0035610198974609375, 0.005962371826171875, 0.008363723754882812, 0.01076507568359375, 0.013166427612304688, 0.015567779541015625, 0.017969131469726562, 0.0203704833984375, 0.022771835327148438, 0.025173187255859375, 0.027574539184570312, 0.02997589111328125, 0.03237724304199219, 0.034778594970703125, 0.03717994689941406, 0.039581298828125, 0.04198265075683594, 0.044384002685546875, 0.04678535461425781, 0.04918670654296875, 0.05158805847167969, 0.053989410400390625, 0.05639076232910156, 0.0587921142578125, 0.06119346618652344, 0.06359481811523438, 0.06599617004394531, 0.06839752197265625, 0.07079887390136719, 0.07320022583007812, 0.07560157775878906, 0.0780029296875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 9.0, 5.0, 7.0, 8.0, 15.0, 11.0, 14.0, 20.0, 19.0, 22.0, 26.0, 29.0, 34.0, 22.0, 34.0, 32.0, 29.0, 29.0, 47.0, 41.0, 1067.0, 43.0, 38.0, 46.0, 41.0, 35.0, 43.0, 35.0, 26.0, 27.0, 22.0, 22.0, 17.0, 17.0, 22.0, 15.0, 7.0, 7.0, 5.0, 6.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.29296875, -1.2514190673828125, -1.209869384765625, -1.1683197021484375, -1.12677001953125, -1.0852203369140625, -1.043670654296875, -1.0021209716796875, -0.9605712890625, -0.9190216064453125, -0.877471923828125, -0.8359222412109375, -0.79437255859375, -0.7528228759765625, -0.711273193359375, -0.6697235107421875, -0.628173828125, -0.5866241455078125, -0.545074462890625, -0.5035247802734375, -0.46197509765625, -0.4204254150390625, -0.378875732421875, -0.3373260498046875, -0.2957763671875, -0.2542266845703125, -0.212677001953125, -0.1711273193359375, -0.12957763671875, -0.0880279541015625, -0.046478271484375, -0.0049285888671875, 0.03662109375, 0.0781707763671875, 0.119720458984375, 0.1612701416015625, 0.20281982421875, 0.2443695068359375, 0.285919189453125, 0.3274688720703125, 0.3690185546875, 0.4105682373046875, 0.452117919921875, 0.4936676025390625, 0.53521728515625, 0.5767669677734375, 0.618316650390625, 0.6598663330078125, 0.701416015625, 0.7429656982421875, 0.784515380859375, 0.8260650634765625, 0.86761474609375, 0.9091644287109375, 0.950714111328125, 0.9922637939453125, 1.0338134765625, 1.0753631591796875, 1.116912841796875, 1.1584625244140625, 1.20001220703125, 1.2415618896484375, 1.283111572265625, 1.3246612548828125, 1.3662109375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 12.0, 13.0, 22.0, 27.0, 46.0, 58.0, 75.0, 129.0, 152.0, 220.0, 363.0, 473.0, 665.0, 895.0, 1292.0, 1976.0, 2694.0, 3913.0, 5638.0, 8338.0, 11982.0, 17870.0, 26685.0, 41625.0, 66261.0, 115370.0, 1323913.0, 198616.0, 97651.0, 57947.0, 36645.0, 23976.0, 16097.0, 10858.0, 7499.0, 5085.0, 3662.0, 2593.0, 1675.0, 1231.0, 898.0, 588.0, 440.0, 310.0, 200.0, 126.0, 107.0, 66.0, 49.0, 39.0, 24.0, 16.0, 11.0, 11.0, 6.0, 2.0, 2.0, 4.0], "bins": [-0.03936767578125, -0.03816986083984375, -0.0369720458984375, -0.03577423095703125, -0.034576416015625, -0.03337860107421875, -0.0321807861328125, -0.03098297119140625, -0.02978515625, -0.02858734130859375, -0.0273895263671875, -0.02619171142578125, -0.024993896484375, -0.02379608154296875, -0.0225982666015625, -0.02140045166015625, -0.02020263671875, -0.01900482177734375, -0.0178070068359375, -0.01660919189453125, -0.015411376953125, -0.01421356201171875, -0.0130157470703125, -0.01181793212890625, -0.0106201171875, -0.00942230224609375, -0.0082244873046875, -0.00702667236328125, -0.005828857421875, -0.00463104248046875, -0.0034332275390625, -0.00223541259765625, -0.00103759765625, 0.00016021728515625, 0.0013580322265625, 0.00255584716796875, 0.003753662109375, 0.00495147705078125, 0.0061492919921875, 0.00734710693359375, 0.008544921875, 0.00974273681640625, 0.0109405517578125, 0.01213836669921875, 0.013336181640625, 0.01453399658203125, 0.0157318115234375, 0.01692962646484375, 0.01812744140625, 0.01932525634765625, 0.0205230712890625, 0.02172088623046875, 0.022918701171875, 0.02411651611328125, 0.0253143310546875, 0.02651214599609375, 0.0277099609375, 0.02890777587890625, 0.0301055908203125, 0.03130340576171875, 0.032501220703125, 0.03369903564453125, 0.0348968505859375, 0.03609466552734375, 0.03729248046875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 0.0, 13.0, 19.0, 0.0, 23.0, 26.0, 33.0, 0.0, 39.0, 56.0, 0.0, 74.0, 431.0, 83.0, 0.0, 67.0, 37.0, 24.0, 0.0, 15.0, 14.0, 0.0, 16.0, 11.0, 10.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.387670636177063e-06, -1.344829797744751e-06, -1.301988959312439e-06, -1.259148120880127e-06, -1.216307282447815e-06, -1.173466444015503e-06, -1.130625605583191e-06, -1.087784767150879e-06, -1.044943928718567e-06, -1.0021030902862549e-06, -9.592622518539429e-07, -9.164214134216309e-07, -8.735805749893188e-07, -8.307397365570068e-07, -7.878988981246948e-07, -7.450580596923828e-07, -7.022172212600708e-07, -6.593763828277588e-07, -6.165355443954468e-07, -5.736947059631348e-07, -5.308538675308228e-07, -4.880130290985107e-07, -4.4517219066619873e-07, -4.023313522338867e-07, -3.594905138015747e-07, -3.166496753692627e-07, -2.738088369369507e-07, -2.3096799850463867e-07, -1.8812716007232666e-07, -1.4528632164001465e-07, -1.0244548320770264e-07, -5.960464477539063e-08, -1.6763806343078613e-08, 2.60770320892334e-08, 6.891787052154541e-08, 1.1175870895385742e-07, 1.5459954738616943e-07, 1.9744038581848145e-07, 2.4028122425079346e-07, 2.8312206268310547e-07, 3.259629011154175e-07, 3.688037395477295e-07, 4.116445779800415e-07, 4.544854164123535e-07, 4.973262548446655e-07, 5.401670932769775e-07, 5.830079317092896e-07, 6.258487701416016e-07, 6.686896085739136e-07, 7.115304470062256e-07, 7.543712854385376e-07, 7.972121238708496e-07, 8.400529623031616e-07, 8.828938007354736e-07, 9.257346391677856e-07, 9.685754776000977e-07, 1.0114163160324097e-06, 1.0542571544647217e-06, 1.0970979928970337e-06, 1.1399388313293457e-06, 1.1827796697616577e-06, 1.2256205081939697e-06, 1.2684613466262817e-06, 1.3113021850585938e-06]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 17.0, 12.0, 14.0, 23.0, 36.0, 63.0, 158.0, 519.0, 7513.0, 849605.0, 186500.0, 3480.0, 307.0, 128.0, 60.0, 33.0, 20.0, 16.0, 11.0, 10.0, 5.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.282857894897461e-05, -2.2009946405887604e-05, -2.1191313862800598e-05, -2.0372681319713593e-05, -1.9554048776626587e-05, -1.873541623353958e-05, -1.7916783690452576e-05, -1.709815114736557e-05, -1.6279518604278564e-05, -1.546088606119156e-05, -1.4642253518104553e-05, -1.3823620975017548e-05, -1.3004988431930542e-05, -1.2186355888843536e-05, -1.136772334575653e-05, -1.0549090802669525e-05, -9.73045825958252e-06, -8.911825716495514e-06, -8.093193173408508e-06, -7.274560630321503e-06, -6.455928087234497e-06, -5.6372955441474915e-06, -4.818663001060486e-06, -4.00003045797348e-06, -3.1813979148864746e-06, -2.362765371799469e-06, -1.5441328287124634e-06, -7.255002856254578e-07, 9.313225746154785e-08, 9.117648005485535e-07, 1.730397343635559e-06, 2.5490298867225647e-06, 3.3676624298095703e-06, 4.186294972896576e-06, 5.0049275159835815e-06, 5.823560059070587e-06, 6.642192602157593e-06, 7.460825145244598e-06, 8.279457688331604e-06, 9.09809023141861e-06, 9.916722774505615e-06, 1.0735355317592621e-05, 1.1553987860679626e-05, 1.2372620403766632e-05, 1.3191252946853638e-05, 1.4009885489940643e-05, 1.4828518033027649e-05, 1.5647150576114655e-05, 1.646578311920166e-05, 1.7284415662288666e-05, 1.810304820537567e-05, 1.8921680748462677e-05, 1.9740313291549683e-05, 2.0558945834636688e-05, 2.1377578377723694e-05, 2.21962109208107e-05, 2.3014843463897705e-05, 2.383347600698471e-05, 2.4652108550071716e-05, 2.5470741093158722e-05, 2.6289373636245728e-05, 2.7108006179332733e-05, 2.792663872241974e-05, 2.8745271265506744e-05, 2.956390380859375e-05]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 13.0, 24.0, 144.0, 653.0, 131.0, 39.0, 6.0, 5.0], "bins": [-4.811475719179725e-06, -4.730711225420237e-06, -4.649946276913397e-06, -4.569181783153908e-06, -4.488416834647069e-06, -4.40765234088758e-06, -4.326887847128091e-06, -4.246122898621252e-06, -4.165358404861763e-06, -4.0845939111022744e-06, -4.003828962595435e-06, -3.923064468835946e-06, -3.842299520329107e-06, -3.761535026569618e-06, -3.6807703054364538e-06, -3.6000055843032897e-06, -3.519241090543801e-06, -3.438476369410637e-06, -3.3577116482774727e-06, -3.276947154517984e-06, -3.19618243338482e-06, -3.1154177122516558e-06, -3.0346529911184916e-06, -2.9538882699853275e-06, -2.8731235488521634e-06, -2.7923588277189992e-06, -2.711594106585835e-06, -2.6308296128263464e-06, -2.5500648916931823e-06, -2.469300170560018e-06, -2.388535449426854e-06, -2.3077709556673653e-06, -2.2270064619078767e-06, -2.1462417407747125e-06, -2.0654770196415484e-06, -1.9847125258820597e-06, -1.9039478047488956e-06, -1.8231830836157314e-06, -1.7424183624825673e-06, -1.661653755036241e-06, -1.5808890339030768e-06, -1.5001243127699126e-06, -1.4193597053235862e-06, -1.3385949841904221e-06, -1.2578303767440957e-06, -1.1770656556109316e-06, -1.0963010481646052e-06, -1.015536327031441e-06, -9.347716627416958e-07, -8.540069984519505e-07, -7.732423341622052e-07, -6.9247766987246e-07, -6.117129487392958e-07, -5.309483412929694e-07, -4.501836201598053e-07, -3.6941895587006e-07, -2.8865429158031475e-07, -2.0788962729056948e-07, -1.271249487899695e-07, -4.636027028936951e-08, 3.440439400037576e-08, 1.1516905829012103e-07, 1.9593375100157573e-07, 2.76698415291321e-07, 3.5746307958106627e-07]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 60.0, 0.0, 0.0, 0.0, 168.0, 0.0, 0.0, 0.0, 440.0, 0.0, 0.0, 0.0, 154.0, 0.0, 0.0, 0.0, 57.0, 0.0, 0.0, 0.0, 33.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.6193599700927734e-07, -4.470348358154297e-07, -4.3213367462158203e-07, -4.172325134277344e-07, -4.023313522338867e-07, -3.8743019104003906e-07, -3.725290298461914e-07, -3.5762786865234375e-07, -3.427267074584961e-07, -3.2782554626464844e-07, -3.129243850708008e-07, -2.980232238769531e-07, -2.8312206268310547e-07, -2.682209014892578e-07, -2.5331974029541016e-07, -2.384185791015625e-07, -2.2351741790771484e-07, -2.086162567138672e-07, -1.9371509552001953e-07, -1.7881393432617188e-07, -1.6391277313232422e-07, -1.4901161193847656e-07, -1.341104507446289e-07, -1.1920928955078125e-07, -1.043081283569336e-07, -8.940696716308594e-08, -7.450580596923828e-08, -5.960464477539063e-08, -4.470348358154297e-08, -2.9802322387695312e-08, -1.4901161193847656e-08, 0.0, 1.4901161193847656e-08, 2.9802322387695312e-08, 4.470348358154297e-08, 5.960464477539063e-08, 7.450580596923828e-08, 8.940696716308594e-08, 1.043081283569336e-07, 1.1920928955078125e-07, 1.341104507446289e-07, 1.4901161193847656e-07, 1.6391277313232422e-07, 1.7881393432617188e-07, 1.9371509552001953e-07, 2.086162567138672e-07, 2.2351741790771484e-07, 2.384185791015625e-07, 2.5331974029541016e-07, 2.682209014892578e-07, 2.8312206268310547e-07, 2.980232238769531e-07, 3.129243850708008e-07, 3.2782554626464844e-07, 3.427267074584961e-07, 3.5762786865234375e-07, 3.725290298461914e-07, 3.8743019104003906e-07, 4.023313522338867e-07, 4.172325134277344e-07, 4.3213367462158203e-07, 4.470348358154297e-07, 4.6193599700927734e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 11.0, 8.0, 10.0, 8.0, 8.0, 14.0, 15.0, 11.0, 18.0, 24.0, 29.0, 21.0, 31.0, 25.0, 29.0, 26.0, 31.0, 40.0, 33.0, 39.0, 32.0, 36.0, 36.0, 37.0, 39.0, 35.0, 42.0, 24.0, 33.0, 41.0, 27.0, 22.0, 21.0, 18.0, 22.0, 16.0, 13.0, 13.0, 12.0, 9.0, 6.0, 4.0, 8.0, 9.0, 4.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.8173828125, -1.7596282958984375, -1.701873779296875, -1.6441192626953125, -1.58636474609375, -1.5286102294921875, -1.470855712890625, -1.4131011962890625, -1.3553466796875, -1.2975921630859375, -1.239837646484375, -1.1820831298828125, -1.12432861328125, -1.0665740966796875, -1.008819580078125, -0.9510650634765625, -0.893310546875, -0.8355560302734375, -0.777801513671875, -0.7200469970703125, -0.66229248046875, -0.6045379638671875, -0.546783447265625, -0.4890289306640625, -0.4312744140625, -0.3735198974609375, -0.315765380859375, -0.2580108642578125, -0.20025634765625, -0.1425018310546875, -0.084747314453125, -0.0269927978515625, 0.03076171875, 0.0885162353515625, 0.146270751953125, 0.2040252685546875, 0.26177978515625, 0.3195343017578125, 0.377288818359375, 0.4350433349609375, 0.4927978515625, 0.5505523681640625, 0.608306884765625, 0.6660614013671875, 0.72381591796875, 0.7815704345703125, 0.839324951171875, 0.8970794677734375, 0.954833984375, 1.0125885009765625, 1.070343017578125, 1.1280975341796875, 1.18585205078125, 1.2436065673828125, 1.301361083984375, 1.3591156005859375, 1.4168701171875, 1.4746246337890625, 1.532379150390625, 1.5901336669921875, 1.64788818359375, 1.7056427001953125, 1.763397216796875, 1.8211517333984375, 1.87890625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 8.0, 14.0, 20.0, 48.0, 79.0, 74.0, 142.0, 218.0, 341.0, 507.0, 785.0, 1213.0, 1755.0, 2639.0, 3932.0, 5562.0, 8218.0, 11854.0, 17133.0, 24847.0, 37919.0, 62379.0, 116096.0, 228205.0, 228663.0, 115949.0, 62585.0, 37992.0, 24805.0, 17097.0, 11841.0, 8150.0, 5708.0, 3908.0, 2595.0, 1840.0, 1148.0, 773.0, 499.0, 327.0, 236.0, 152.0, 115.0, 71.0, 28.0, 28.0, 19.0, 13.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0], "bins": [-2.32421875, -2.255859375, -2.1875, -2.119140625, -2.05078125, -1.982421875, -1.9140625, -1.845703125, -1.77734375, -1.708984375, -1.640625, -1.572265625, -1.50390625, -1.435546875, -1.3671875, -1.298828125, -1.23046875, -1.162109375, -1.09375, -1.025390625, -0.95703125, -0.888671875, -0.8203125, -0.751953125, -0.68359375, -0.615234375, -0.546875, -0.478515625, -0.41015625, -0.341796875, -0.2734375, -0.205078125, -0.13671875, -0.068359375, 0.0, 0.068359375, 0.13671875, 0.205078125, 0.2734375, 0.341796875, 0.41015625, 0.478515625, 0.546875, 0.615234375, 0.68359375, 0.751953125, 0.8203125, 0.888671875, 0.95703125, 1.025390625, 1.09375, 1.162109375, 1.23046875, 1.298828125, 1.3671875, 1.435546875, 1.50390625, 1.572265625, 1.640625, 1.708984375, 1.77734375, 1.845703125, 1.9140625, 1.982421875, 2.05078125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 8.0, 9.0, 3.0, 6.0, 13.0, 11.0, 14.0, 14.0, 13.0, 18.0, 22.0, 22.0, 36.0, 29.0, 37.0, 31.0, 39.0, 65.0, 76.0, 111.0, 182.0, 1367.0, 246.0, 137.0, 116.0, 64.0, 42.0, 45.0, 36.0, 33.0, 31.0, 30.0, 16.0, 20.0, 20.0, 19.0, 15.0, 12.0, 2.0, 7.0, 4.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-7.33984375, -7.11541748046875, -6.8909912109375, -6.66656494140625, -6.442138671875, -6.21771240234375, -5.9932861328125, -5.76885986328125, -5.54443359375, -5.32000732421875, -5.0955810546875, -4.87115478515625, -4.646728515625, -4.42230224609375, -4.1978759765625, -3.97344970703125, -3.7490234375, -3.52459716796875, -3.3001708984375, -3.07574462890625, -2.851318359375, -2.62689208984375, -2.4024658203125, -2.17803955078125, -1.95361328125, -1.72918701171875, -1.5047607421875, -1.28033447265625, -1.055908203125, -0.83148193359375, -0.6070556640625, -0.38262939453125, -0.158203125, 0.06622314453125, 0.2906494140625, 0.51507568359375, 0.739501953125, 0.96392822265625, 1.1883544921875, 1.41278076171875, 1.63720703125, 1.86163330078125, 2.0860595703125, 2.31048583984375, 2.534912109375, 2.75933837890625, 2.9837646484375, 3.20819091796875, 3.4326171875, 3.65704345703125, 3.8814697265625, 4.10589599609375, 4.330322265625, 4.55474853515625, 4.7791748046875, 5.00360107421875, 5.22802734375, 5.45245361328125, 5.6768798828125, 5.90130615234375, 6.125732421875, 6.35015869140625, 6.5745849609375, 6.79901123046875, 7.0234375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 9.0, 8.0, 4.0, 9.0, 12.0, 10.0, 14.0, 24.0, 24.0, 43.0, 44.0, 40.0, 89.0, 94.0, 137.0, 223.0, 377.0, 890.0, 3605.0, 20878.0, 199097.0, 2510886.0, 368389.0, 33140.0, 5130.0, 1192.0, 435.0, 227.0, 167.0, 137.0, 65.0, 73.0, 50.0, 35.0, 28.0, 21.0, 23.0, 14.0, 18.0, 8.0, 12.0, 6.0, 6.0, 8.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-12.6953125, -12.3060302734375, -11.916748046875, -11.5274658203125, -11.13818359375, -10.7489013671875, -10.359619140625, -9.9703369140625, -9.5810546875, -9.1917724609375, -8.802490234375, -8.4132080078125, -8.02392578125, -7.6346435546875, -7.245361328125, -6.8560791015625, -6.466796875, -6.0775146484375, -5.688232421875, -5.2989501953125, -4.90966796875, -4.5203857421875, -4.131103515625, -3.7418212890625, -3.3525390625, -2.9632568359375, -2.573974609375, -2.1846923828125, -1.79541015625, -1.4061279296875, -1.016845703125, -0.6275634765625, -0.23828125, 0.1510009765625, 0.540283203125, 0.9295654296875, 1.31884765625, 1.7081298828125, 2.097412109375, 2.4866943359375, 2.8759765625, 3.2652587890625, 3.654541015625, 4.0438232421875, 4.43310546875, 4.8223876953125, 5.211669921875, 5.6009521484375, 5.990234375, 6.3795166015625, 6.768798828125, 7.1580810546875, 7.54736328125, 7.9366455078125, 8.325927734375, 8.7152099609375, 9.1044921875, 9.4937744140625, 9.883056640625, 10.2723388671875, 10.66162109375, 11.0509033203125, 11.440185546875, 11.8294677734375, 12.21875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [169.0, 724.0, 126.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.981283664703369, -2.498626708984375, 2.984030246734619, 8.46668815612793, 13.949344635009766, 19.4320011138916, 24.91465950012207, 30.397314071655273, 35.87997055053711, 41.36262893676758, 46.84528350830078, 52.32794189453125, 57.81060028076172, 63.29325485229492, 68.77590942382812, 74.2585678100586, 79.74122619628906, 85.22388458251953, 90.70654296875, 96.18919372558594, 101.6718521118164, 107.15451049804688, 112.63716888427734, 118.11982727050781, 123.60248565673828, 129.08514404296875, 134.5677947998047, 140.0504608154297, 145.53311157226562, 151.01577758789062, 156.49842834472656, 161.9810791015625, 167.46372985839844, 172.94638061523438, 178.42904663085938, 183.9116973876953, 189.3943634033203, 194.87701416015625, 200.35968017578125, 205.8423309326172, 211.32498168945312, 216.80763244628906, 222.29029846191406, 227.77294921875, 233.255615234375, 238.73826599121094, 244.22091674804688, 249.70358276367188, 255.18624877929688, 260.6689147949219, 266.15155029296875, 271.63421630859375, 277.11688232421875, 282.59954833984375, 288.0821838378906, 293.5648498535156, 299.0474853515625, 304.5301513671875, 310.0127868652344, 315.4954528808594, 320.9781188964844, 326.46075439453125, 331.94342041015625, 337.42608642578125, 342.90875244140625]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 11.0, 7.0, 7.0, 11.0, 13.0, 16.0, 16.0, 23.0, 23.0, 24.0, 34.0, 33.0, 35.0, 30.0, 38.0, 43.0, 32.0, 40.0, 47.0, 40.0, 31.0, 37.0, 37.0, 37.0, 34.0, 33.0, 35.0, 20.0, 30.0, 25.0, 15.0, 28.0, 17.0, 20.0, 15.0, 15.0, 10.0, 9.0, 5.0, 6.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-25.10976791381836, -24.4102840423584, -23.710800170898438, -23.01131820678711, -22.31183433532715, -21.612350463867188, -20.912866592407227, -20.213382720947266, -19.513898849487305, -18.814414978027344, -18.114931106567383, -17.415447235107422, -16.715965270996094, -16.016481399536133, -15.316997528076172, -14.617513656616211, -13.918030738830566, -13.218546867370605, -12.519063949584961, -11.819580078125, -11.120096206665039, -10.420612335205078, -9.721129417419434, -9.021645545959473, -8.322162628173828, -7.622679233551025, -6.9231953620910645, -6.223711967468262, -5.524228096008301, -4.824744701385498, -4.125261306762695, -3.4257774353027344, -2.7262935638427734, -2.0268099308013916, -1.3273264169692993, -0.627842903137207, 0.0716407299041748, 0.7711243629455566, 1.4706077575683594, 2.1700916290283203, 2.869575023651123, 3.569058656692505, 4.268542289733887, 4.9680256843566895, 5.667509078979492, 6.366992950439453, 7.066476345062256, 7.765960216522217, 8.46544361114502, 9.16492748260498, 9.864410400390625, 10.563894271850586, 11.263378143310547, 11.962862014770508, 12.662344932556152, 13.361828804016113, 14.061311721801758, 14.760795593261719, 15.460278511047363, 16.15976333618164, 16.85924530029297, 17.55872917175293, 18.25821304321289, 18.95769691467285, 19.657180786132812]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 3.0, 4.0, 10.0, 10.0, 8.0, 9.0, 12.0, 14.0, 11.0, 26.0, 19.0, 26.0, 28.0, 23.0, 33.0, 29.0, 24.0, 28.0, 35.0, 31.0, 37.0, 32.0, 41.0, 38.0, 39.0, 36.0, 30.0, 35.0, 28.0, 33.0, 31.0, 28.0, 25.0, 16.0, 27.0, 15.0, 18.0, 16.0, 18.0, 10.0, 10.0, 11.0, 7.0, 7.0, 4.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8974609375, -1.8375091552734375, -1.777557373046875, -1.7176055908203125, -1.65765380859375, -1.5977020263671875, -1.537750244140625, -1.4777984619140625, -1.4178466796875, -1.3578948974609375, -1.297943115234375, -1.2379913330078125, -1.17803955078125, -1.1180877685546875, -1.058135986328125, -0.9981842041015625, -0.938232421875, -0.8782806396484375, -0.818328857421875, -0.7583770751953125, -0.69842529296875, -0.6384735107421875, -0.578521728515625, -0.5185699462890625, -0.4586181640625, -0.3986663818359375, -0.338714599609375, -0.2787628173828125, -0.21881103515625, -0.1588592529296875, -0.098907470703125, -0.0389556884765625, 0.02099609375, 0.0809478759765625, 0.140899658203125, 0.2008514404296875, 0.26080322265625, 0.3207550048828125, 0.380706787109375, 0.4406585693359375, 0.5006103515625, 0.5605621337890625, 0.620513916015625, 0.6804656982421875, 0.74041748046875, 0.8003692626953125, 0.860321044921875, 0.9202728271484375, 0.980224609375, 1.0401763916015625, 1.100128173828125, 1.1600799560546875, 1.22003173828125, 1.2799835205078125, 1.339935302734375, 1.3998870849609375, 1.4598388671875, 1.5197906494140625, 1.579742431640625, 1.6396942138671875, 1.69964599609375, 1.7595977783203125, 1.819549560546875, 1.8795013427734375, 1.939453125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 9.0, 10.0, 17.0, 21.0, 27.0, 37.0, 67.0, 89.0, 145.0, 229.0, 360.0, 661.0, 1015.0, 2018.0, 3998.0, 7737.0, 15886.0, 33125.0, 70958.0, 154516.0, 335830.0, 702827.0, 1143913.0, 886512.0, 447023.0, 206821.0, 94881.0, 43345.0, 20875.0, 10163.0, 5136.0, 2672.0, 1398.0, 753.0, 431.0, 278.0, 168.0, 120.0, 71.0, 40.0, 31.0, 33.0, 17.0, 12.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.76171875, -2.682098388671875, -2.60247802734375, -2.522857666015625, -2.4432373046875, -2.363616943359375, -2.28399658203125, -2.204376220703125, -2.124755859375, -2.045135498046875, -1.96551513671875, -1.885894775390625, -1.8062744140625, -1.726654052734375, -1.64703369140625, -1.567413330078125, -1.48779296875, -1.408172607421875, -1.32855224609375, -1.248931884765625, -1.1693115234375, -1.089691162109375, -1.01007080078125, -0.930450439453125, -0.850830078125, -0.771209716796875, -0.69158935546875, -0.611968994140625, -0.5323486328125, -0.452728271484375, -0.37310791015625, -0.293487548828125, -0.2138671875, -0.134246826171875, -0.05462646484375, 0.024993896484375, 0.1046142578125, 0.184234619140625, 0.26385498046875, 0.343475341796875, 0.423095703125, 0.502716064453125, 0.58233642578125, 0.661956787109375, 0.7415771484375, 0.821197509765625, 0.90081787109375, 0.980438232421875, 1.06005859375, 1.139678955078125, 1.21929931640625, 1.298919677734375, 1.3785400390625, 1.458160400390625, 1.53778076171875, 1.617401123046875, 1.697021484375, 1.776641845703125, 1.85626220703125, 1.935882568359375, 2.0155029296875, 2.095123291015625, 2.17474365234375, 2.254364013671875, 2.333984375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 15.0, 13.0, 18.0, 25.0, 38.0, 58.0, 74.0, 118.0, 203.0, 261.0, 380.0, 457.0, 540.0, 505.0, 387.0, 290.0, 217.0, 150.0, 110.0, 57.0, 56.0, 35.0, 24.0, 12.0, 15.0, 7.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.55078125, -7.33355712890625, -7.1163330078125, -6.89910888671875, -6.681884765625, -6.46466064453125, -6.2474365234375, -6.03021240234375, -5.81298828125, -5.59576416015625, -5.3785400390625, -5.16131591796875, -4.944091796875, -4.72686767578125, -4.5096435546875, -4.29241943359375, -4.0751953125, -3.85797119140625, -3.6407470703125, -3.42352294921875, -3.206298828125, -2.98907470703125, -2.7718505859375, -2.55462646484375, -2.33740234375, -2.12017822265625, -1.9029541015625, -1.68572998046875, -1.468505859375, -1.25128173828125, -1.0340576171875, -0.81683349609375, -0.599609375, -0.38238525390625, -0.1651611328125, 0.05206298828125, 0.269287109375, 0.48651123046875, 0.7037353515625, 0.92095947265625, 1.13818359375, 1.35540771484375, 1.5726318359375, 1.78985595703125, 2.007080078125, 2.22430419921875, 2.4415283203125, 2.65875244140625, 2.8759765625, 3.09320068359375, 3.3104248046875, 3.52764892578125, 3.744873046875, 3.96209716796875, 4.1793212890625, 4.39654541015625, 4.61376953125, 4.83099365234375, 5.0482177734375, 5.26544189453125, 5.482666015625, 5.69989013671875, 5.9171142578125, 6.13433837890625, 6.3515625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 6.0, 8.0, 29.0, 34.0, 54.0, 100.0, 137.0, 241.0, 510.0, 1479.0, 6751.0, 47447.0, 435092.0, 2453832.0, 1104208.0, 124735.0, 15322.0, 2772.0, 756.0, 324.0, 172.0, 95.0, 65.0, 35.0, 27.0, 21.0, 12.0, 7.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9296875, -9.5955810546875, -9.261474609375, -8.9273681640625, -8.59326171875, -8.2591552734375, -7.925048828125, -7.5909423828125, -7.2568359375, -6.9227294921875, -6.588623046875, -6.2545166015625, -5.92041015625, -5.5863037109375, -5.252197265625, -4.9180908203125, -4.583984375, -4.2498779296875, -3.915771484375, -3.5816650390625, -3.24755859375, -2.9134521484375, -2.579345703125, -2.2452392578125, -1.9111328125, -1.5770263671875, -1.242919921875, -0.9088134765625, -0.57470703125, -0.2406005859375, 0.093505859375, 0.4276123046875, 0.76171875, 1.0958251953125, 1.429931640625, 1.7640380859375, 2.09814453125, 2.4322509765625, 2.766357421875, 3.1004638671875, 3.4345703125, 3.7686767578125, 4.102783203125, 4.4368896484375, 4.77099609375, 5.1051025390625, 5.439208984375, 5.7733154296875, 6.107421875, 6.4415283203125, 6.775634765625, 7.1097412109375, 7.44384765625, 7.7779541015625, 8.112060546875, 8.4461669921875, 8.7802734375, 9.1143798828125, 9.448486328125, 9.7825927734375, 10.11669921875, 10.4508056640625, 10.784912109375, 11.1190185546875, 11.453125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 24.0, 60.0, 136.0, 204.0, 239.0, 174.0, 112.0, 49.0, 12.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.100248336791992, -26.759870529174805, -24.419490814208984, -22.079113006591797, -19.73873519897461, -17.398357391357422, -15.057978630065918, -12.717599868774414, -10.377222061157227, -8.036844253540039, -5.696465492248535, -3.3560872077941895, -1.0157089233398438, 1.3246688842773438, 3.6650476455688477, 6.005426406860352, 8.345804214477539, 10.686182022094727, 13.02656078338623, 15.366939544677734, 17.707317352294922, 20.04769515991211, 22.388072967529297, 24.728452682495117, 27.068830490112305, 29.409208297729492, 31.749588012695312, 34.0899658203125, 36.43034362792969, 38.770721435546875, 41.11109924316406, 43.45147705078125, 45.79186248779297, 48.132240295410156, 50.472618103027344, 52.81299591064453, 55.15337371826172, 57.493751525878906, 59.83413314819336, 62.17451095581055, 64.514892578125, 66.85527038574219, 69.19564819335938, 71.53602600097656, 73.87640380859375, 76.21678161621094, 78.55715942382812, 80.89753723144531, 83.2379150390625, 85.57829284667969, 87.91867065429688, 90.25904846191406, 92.59942626953125, 94.93980407714844, 97.28018188476562, 99.62055969238281, 101.9609375, 104.30131530761719, 106.64169311523438, 108.98207092285156, 111.32244873046875, 113.66282653808594, 116.00320434570312, 118.34358215332031, 120.68396759033203]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 3.0, 4.0, 5.0, 4.0, 7.0, 5.0, 15.0, 17.0, 16.0, 27.0, 23.0, 19.0, 23.0, 20.0, 26.0, 36.0, 37.0, 32.0, 39.0, 36.0, 35.0, 33.0, 38.0, 50.0, 57.0, 37.0, 34.0, 37.0, 30.0, 27.0, 32.0, 23.0, 19.0, 29.0, 25.0, 19.0, 10.0, 13.0, 9.0, 12.0, 8.0, 4.0, 8.0, 3.0, 3.0, 3.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.26940155029297, -16.721149444580078, -16.172897338867188, -15.62464714050293, -15.076395034790039, -14.528142929077148, -13.979891777038574, -13.431640625, -12.88338851928711, -12.335136413574219, -11.786885261535645, -11.23863410949707, -10.69038200378418, -10.142129898071289, -9.593878746032715, -9.04562759399414, -8.49737548828125, -7.949123859405518, -7.400872230529785, -6.852620601654053, -6.30436897277832, -5.756117343902588, -5.2078657150268555, -4.659614086151123, -4.111362457275391, -3.563110828399658, -3.014859199523926, -2.4666075706481934, -1.918355941772461, -1.3701043128967285, -0.8218526840209961, -0.27360105514526367, 0.27465057373046875, 0.8229022026062012, 1.3711538314819336, 1.919405460357666, 2.4676570892333984, 3.015908718109131, 3.5641603469848633, 4.112411975860596, 4.660663604736328, 5.2089152336120605, 5.757166862487793, 6.305418491363525, 6.853670120239258, 7.40192174911499, 7.950173377990723, 8.498424530029297, 9.046676635742188, 9.594928741455078, 10.143179893493652, 10.691431045532227, 11.239683151245117, 11.787935256958008, 12.336186408996582, 12.884437561035156, 13.432689666748047, 13.980941772460938, 14.529192924499512, 15.077444076538086, 15.625696182250977, 16.173948287963867, 16.722198486328125, 17.270450592041016, 17.818702697753906]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 11.0, 7.0, 11.0, 14.0, 12.0, 15.0, 16.0, 21.0, 18.0, 23.0, 25.0, 34.0, 27.0, 31.0, 33.0, 40.0, 42.0, 30.0, 49.0, 54.0, 30.0, 40.0, 40.0, 35.0, 26.0, 28.0, 32.0, 38.0, 25.0, 22.0, 24.0, 16.0, 24.0, 9.0, 17.0, 20.0, 12.0, 11.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.072265625, -2.00634765625, -1.9404296875, -1.87451171875, -1.80859375, -1.74267578125, -1.6767578125, -1.61083984375, -1.544921875, -1.47900390625, -1.4130859375, -1.34716796875, -1.28125, -1.21533203125, -1.1494140625, -1.08349609375, -1.017578125, -0.95166015625, -0.8857421875, -0.81982421875, -0.75390625, -0.68798828125, -0.6220703125, -0.55615234375, -0.490234375, -0.42431640625, -0.3583984375, -0.29248046875, -0.2265625, -0.16064453125, -0.0947265625, -0.02880859375, 0.037109375, 0.10302734375, 0.1689453125, 0.23486328125, 0.30078125, 0.36669921875, 0.4326171875, 0.49853515625, 0.564453125, 0.63037109375, 0.6962890625, 0.76220703125, 0.828125, 0.89404296875, 0.9599609375, 1.02587890625, 1.091796875, 1.15771484375, 1.2236328125, 1.28955078125, 1.35546875, 1.42138671875, 1.4873046875, 1.55322265625, 1.619140625, 1.68505859375, 1.7509765625, 1.81689453125, 1.8828125, 1.94873046875, 2.0146484375, 2.08056640625, 2.146484375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 7.0, 9.0, 14.0, 21.0, 23.0, 47.0, 54.0, 77.0, 137.0, 198.0, 299.0, 438.0, 745.0, 1102.0, 1668.0, 2617.0, 3993.0, 6076.0, 9705.0, 15772.0, 25883.0, 43908.0, 76297.0, 148867.0, 370524.0, 149874.0, 76786.0, 43931.0, 26185.0, 15853.0, 9816.0, 6272.0, 4066.0, 2568.0, 1598.0, 1096.0, 685.0, 451.0, 288.0, 226.0, 134.0, 84.0, 55.0, 30.0, 27.0, 18.0, 11.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.093017578125, -0.09006500244140625, -0.0871124267578125, -0.08415985107421875, -0.081207275390625, -0.07825469970703125, -0.0753021240234375, -0.07234954833984375, -0.06939697265625, -0.06644439697265625, -0.0634918212890625, -0.06053924560546875, -0.057586669921875, -0.05463409423828125, -0.0516815185546875, -0.04872894287109375, -0.0457763671875, -0.04282379150390625, -0.0398712158203125, -0.03691864013671875, -0.033966064453125, -0.03101348876953125, -0.0280609130859375, -0.02510833740234375, -0.02215576171875, -0.01920318603515625, -0.0162506103515625, -0.01329803466796875, -0.010345458984375, -0.00739288330078125, -0.0044403076171875, -0.00148773193359375, 0.00146484375, 0.00441741943359375, 0.0073699951171875, 0.01032257080078125, 0.013275146484375, 0.01622772216796875, 0.0191802978515625, 0.02213287353515625, 0.02508544921875, 0.02803802490234375, 0.0309906005859375, 0.03394317626953125, 0.036895751953125, 0.03984832763671875, 0.0428009033203125, 0.04575347900390625, 0.0487060546875, 0.05165863037109375, 0.0546112060546875, 0.05756378173828125, 0.060516357421875, 0.06346893310546875, 0.0664215087890625, 0.06937408447265625, 0.07232666015625, 0.07527923583984375, 0.0782318115234375, 0.08118438720703125, 0.084136962890625, 0.08708953857421875, 0.0900421142578125, 0.09299468994140625, 0.095947265625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 11.0, 14.0, 7.0, 6.0, 12.0, 31.0, 22.0, 22.0, 27.0, 26.0, 28.0, 26.0, 42.0, 35.0, 47.0, 47.0, 48.0, 1060.0, 43.0, 42.0, 33.0, 36.0, 37.0, 44.0, 28.0, 31.0, 28.0, 33.0, 23.0, 19.0, 18.0, 27.0, 8.0, 7.0, 8.0, 11.0, 9.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5654296875, -1.5162811279296875, -1.467132568359375, -1.4179840087890625, -1.36883544921875, -1.3196868896484375, -1.270538330078125, -1.2213897705078125, -1.1722412109375, -1.1230926513671875, -1.073944091796875, -1.0247955322265625, -0.97564697265625, -0.9264984130859375, -0.877349853515625, -0.8282012939453125, -0.779052734375, -0.7299041748046875, -0.680755615234375, -0.6316070556640625, -0.58245849609375, -0.5333099365234375, -0.484161376953125, -0.4350128173828125, -0.3858642578125, -0.3367156982421875, -0.287567138671875, -0.2384185791015625, -0.18927001953125, -0.1401214599609375, -0.090972900390625, -0.0418243408203125, 0.00732421875, 0.0564727783203125, 0.105621337890625, 0.1547698974609375, 0.20391845703125, 0.2530670166015625, 0.302215576171875, 0.3513641357421875, 0.4005126953125, 0.4496612548828125, 0.498809814453125, 0.5479583740234375, 0.59710693359375, 0.6462554931640625, 0.695404052734375, 0.7445526123046875, 0.793701171875, 0.8428497314453125, 0.891998291015625, 0.9411468505859375, 0.99029541015625, 1.0394439697265625, 1.088592529296875, 1.1377410888671875, 1.1868896484375, 1.2360382080078125, 1.285186767578125, 1.3343353271484375, 1.38348388671875, 1.4326324462890625, 1.481781005859375, 1.5309295654296875, 1.580078125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 10.0, 8.0, 23.0, 24.0, 40.0, 60.0, 80.0, 144.0, 173.0, 296.0, 448.0, 670.0, 953.0, 1395.0, 2103.0, 3056.0, 4670.0, 6718.0, 10288.0, 14993.0, 22845.0, 35240.0, 57156.0, 97527.0, 198989.0, 1333253.0, 119656.0, 66931.0, 40643.0, 26151.0, 17263.0, 11603.0, 7632.0, 5217.0, 3594.0, 2398.0, 1553.0, 1082.0, 773.0, 458.0, 343.0, 239.0, 144.0, 96.0, 60.0, 61.0, 18.0, 22.0, 13.0, 9.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.045562744140625, -0.044146060943603516, -0.04272937774658203, -0.04131269454956055, -0.03989601135253906, -0.03847932815551758, -0.037062644958496094, -0.03564596176147461, -0.034229278564453125, -0.03281259536743164, -0.031395912170410156, -0.029979228973388672, -0.028562545776367188, -0.027145862579345703, -0.02572917938232422, -0.024312496185302734, -0.02289581298828125, -0.021479129791259766, -0.02006244659423828, -0.018645763397216797, -0.017229080200195312, -0.015812397003173828, -0.014395713806152344, -0.01297903060913086, -0.011562347412109375, -0.01014566421508789, -0.008728981018066406, -0.007312297821044922, -0.0058956146240234375, -0.004478931427001953, -0.0030622482299804688, -0.0016455650329589844, -0.0002288818359375, 0.0011878013610839844, 0.0026044845581054688, 0.004021167755126953, 0.0054378509521484375, 0.006854534149169922, 0.008271217346191406, 0.00968790054321289, 0.011104583740234375, 0.01252126693725586, 0.013937950134277344, 0.015354633331298828, 0.016771316528320312, 0.018187999725341797, 0.01960468292236328, 0.021021366119384766, 0.02243804931640625, 0.023854732513427734, 0.02527141571044922, 0.026688098907470703, 0.028104782104492188, 0.029521465301513672, 0.030938148498535156, 0.03235483169555664, 0.033771514892578125, 0.03518819808959961, 0.036604881286621094, 0.03802156448364258, 0.03943824768066406, 0.04085493087768555, 0.04227161407470703, 0.043688297271728516, 0.04510498046875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 18.0, 0.0, 21.0, 0.0, 27.0, 0.0, 32.0, 0.0, 50.0, 89.0, 0.0, 500.0, 0.0, 87.0, 0.0, 53.0, 0.0, 45.0, 0.0, 28.0, 0.0, 13.0, 0.0, 14.0, 0.0, 9.0, 0.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0], "bins": [-1.0728836059570312e-06, -1.0421499609947205e-06, -1.0114163160324097e-06, -9.806826710700989e-07, -9.499490261077881e-07, -9.192153811454773e-07, -8.884817361831665e-07, -8.577480912208557e-07, -8.270144462585449e-07, -7.962808012962341e-07, -7.655471563339233e-07, -7.348135113716125e-07, -7.040798664093018e-07, -6.73346221446991e-07, -6.426125764846802e-07, -6.118789315223694e-07, -5.811452865600586e-07, -5.504116415977478e-07, -5.19677996635437e-07, -4.889443516731262e-07, -4.5821070671081543e-07, -4.2747706174850464e-07, -3.9674341678619385e-07, -3.6600977182388306e-07, -3.3527612686157227e-07, -3.045424818992615e-07, -2.738088369369507e-07, -2.430751919746399e-07, -2.123415470123291e-07, -1.816079020500183e-07, -1.5087425708770752e-07, -1.2014061212539673e-07, -8.940696716308594e-08, -5.8673322200775146e-08, -2.7939677238464355e-08, 2.7939677238464355e-09, 3.3527612686157227e-08, 6.426125764846802e-08, 9.499490261077881e-08, 1.257285475730896e-07, 1.564621925354004e-07, 1.8719583749771118e-07, 2.1792948246002197e-07, 2.4866312742233276e-07, 2.7939677238464355e-07, 3.1013041734695435e-07, 3.4086406230926514e-07, 3.7159770727157593e-07, 4.023313522338867e-07, 4.330649971961975e-07, 4.637986421585083e-07, 4.945322871208191e-07, 5.252659320831299e-07, 5.559995770454407e-07, 5.867332220077515e-07, 6.174668669700623e-07, 6.48200511932373e-07, 6.789341568946838e-07, 7.096678018569946e-07, 7.404014468193054e-07, 7.711350917816162e-07, 8.01868736743927e-07, 8.326023817062378e-07, 8.633360266685486e-07, 8.940696716308594e-07]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 3.0, 3.0, 6.0, 11.0, 7.0, 28.0, 42.0, 47.0, 68.0, 157.0, 1164.0, 35665.0, 959153.0, 50288.0, 1510.0, 160.0, 77.0, 49.0, 27.0, 24.0, 16.0, 8.0, 5.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.895427703857422e-05, -1.8312595784664154e-05, -1.767091453075409e-05, -1.7029233276844025e-05, -1.638755202293396e-05, -1.5745870769023895e-05, -1.510418951511383e-05, -1.4462508261203766e-05, -1.3820827007293701e-05, -1.3179145753383636e-05, -1.2537464499473572e-05, -1.1895783245563507e-05, -1.1254101991653442e-05, -1.0612420737743378e-05, -9.970739483833313e-06, -9.329058229923248e-06, -8.687376976013184e-06, -8.045695722103119e-06, -7.404014468193054e-06, -6.7623332142829895e-06, -6.120651960372925e-06, -5.47897070646286e-06, -4.837289452552795e-06, -4.195608198642731e-06, -3.553926944732666e-06, -2.9122456908226013e-06, -2.2705644369125366e-06, -1.628883183002472e-06, -9.872019290924072e-07, -3.4552067518234253e-07, 2.9616057872772217e-07, 9.378418326377869e-07, 1.5795230865478516e-06, 2.2212043404579163e-06, 2.862885594367981e-06, 3.5045668482780457e-06, 4.14624810218811e-06, 4.787929356098175e-06, 5.42961061000824e-06, 6.0712918639183044e-06, 6.712973117828369e-06, 7.354654371738434e-06, 7.996335625648499e-06, 8.638016879558563e-06, 9.279698133468628e-06, 9.921379387378693e-06, 1.0563060641288757e-05, 1.1204741895198822e-05, 1.1846423149108887e-05, 1.2488104403018951e-05, 1.3129785656929016e-05, 1.377146691083908e-05, 1.4413148164749146e-05, 1.505482941865921e-05, 1.5696510672569275e-05, 1.633819192647934e-05, 1.6979873180389404e-05, 1.762155443429947e-05, 1.8263235688209534e-05, 1.89049169421196e-05, 1.9546598196029663e-05, 2.0188279449939728e-05, 2.0829960703849792e-05, 2.1471641957759857e-05, 2.2113323211669922e-05]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 8.0, 10.0, 17.0, 24.0, 20.0, 15.0, 11.0, 17.0, 26.0, 647.0, 30.0, 22.0, 24.0, 16.0, 25.0, 16.0, 13.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.0980652354628546e-07, -3.018973870894115e-07, -2.939882222108281e-07, -2.860790573322447e-07, -2.7816992087537074e-07, -2.7026078441849677e-07, -2.6235161953991337e-07, -2.5444245466133e-07, -2.46533318204456e-07, -2.3862418174758204e-07, -2.3071501686899865e-07, -2.2280586620126996e-07, -2.1489671553354128e-07, -2.069875648658126e-07, -1.9907841419808392e-07, -1.9116926353035524e-07, -1.8326011286262656e-07, -1.7535096219489787e-07, -1.674418115271692e-07, -1.595326608594405e-07, -1.5162351019171183e-07, -1.4371435952398315e-07, -1.3580520885625447e-07, -1.2789605818852579e-07, -1.199869075207971e-07, -1.1207775685306842e-07, -1.0416860618533974e-07, -9.625945551761106e-08, -8.835030484988238e-08, -8.04411541821537e-08, -7.253200351442501e-08, -6.462285284669633e-08, -5.6713716389822366e-08, -4.8804565722093685e-08, -4.0895415054365e-08, -3.298626438663632e-08, -2.507711371890764e-08, -1.7167963051178958e-08, -9.258812383450277e-09, -1.349661715721595e-09, 6.5594889520070865e-09, 1.4468639619735768e-08, 2.237779028746445e-08, 3.028694095519313e-08, 3.819609162292181e-08, 4.6105242290650494e-08, 5.4014392958379176e-08, 6.192354362610786e-08, 6.983269429383654e-08, 7.774184496156522e-08, 8.56509956292939e-08, 9.356014629702258e-08, 1.0146929696475127e-07, 1.0937844763247995e-07, 1.1728759830020863e-07, 1.251967489679373e-07, 1.33105899635666e-07, 1.4101505030339467e-07, 1.4892420097112335e-07, 1.5683335163885204e-07, 1.6474250230658072e-07, 1.726516529743094e-07, 1.8056080364203808e-07, 1.8846995430976676e-07, 1.9637910497749544e-07]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 133.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 685.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 130.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 11.0, 7.0, 11.0, 14.0, 12.0, 15.0, 16.0, 21.0, 18.0, 23.0, 25.0, 34.0, 27.0, 31.0, 33.0, 40.0, 42.0, 30.0, 49.0, 54.0, 30.0, 40.0, 40.0, 35.0, 26.0, 28.0, 32.0, 38.0, 25.0, 22.0, 24.0, 16.0, 24.0, 9.0, 17.0, 20.0, 12.0, 11.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.072265625, -2.00634765625, -1.9404296875, -1.87451171875, -1.80859375, -1.74267578125, -1.6767578125, -1.61083984375, -1.544921875, -1.47900390625, -1.4130859375, -1.34716796875, -1.28125, -1.21533203125, -1.1494140625, -1.08349609375, -1.017578125, -0.95166015625, -0.8857421875, -0.81982421875, -0.75390625, -0.68798828125, -0.6220703125, -0.55615234375, -0.490234375, -0.42431640625, -0.3583984375, -0.29248046875, -0.2265625, -0.16064453125, -0.0947265625, -0.02880859375, 0.037109375, 0.10302734375, 0.1689453125, 0.23486328125, 0.30078125, 0.36669921875, 0.4326171875, 0.49853515625, 0.564453125, 0.63037109375, 0.6962890625, 0.76220703125, 0.828125, 0.89404296875, 0.9599609375, 1.02587890625, 1.091796875, 1.15771484375, 1.2236328125, 1.28955078125, 1.35546875, 1.42138671875, 1.4873046875, 1.55322265625, 1.619140625, 1.68505859375, 1.7509765625, 1.81689453125, 1.8828125, 1.94873046875, 2.0146484375, 2.08056640625, 2.146484375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 6.0, 23.0, 26.0, 40.0, 79.0, 159.0, 277.0, 484.0, 769.0, 1367.0, 2345.0, 4448.0, 8347.0, 16427.0, 34289.0, 74063.0, 185627.0, 376803.0, 195074.0, 76658.0, 35538.0, 17005.0, 8513.0, 4488.0, 2431.0, 1343.0, 802.0, 467.0, 277.0, 184.0, 78.0, 38.0, 29.0, 25.0, 8.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.015625, -3.89215087890625, -3.7686767578125, -3.64520263671875, -3.521728515625, -3.39825439453125, -3.2747802734375, -3.15130615234375, -3.02783203125, -2.90435791015625, -2.7808837890625, -2.65740966796875, -2.533935546875, -2.41046142578125, -2.2869873046875, -2.16351318359375, -2.0400390625, -1.91656494140625, -1.7930908203125, -1.66961669921875, -1.546142578125, -1.42266845703125, -1.2991943359375, -1.17572021484375, -1.05224609375, -0.92877197265625, -0.8052978515625, -0.68182373046875, -0.558349609375, -0.43487548828125, -0.3114013671875, -0.18792724609375, -0.064453125, 0.05902099609375, 0.1824951171875, 0.30596923828125, 0.429443359375, 0.55291748046875, 0.6763916015625, 0.79986572265625, 0.92333984375, 1.04681396484375, 1.1702880859375, 1.29376220703125, 1.417236328125, 1.54071044921875, 1.6641845703125, 1.78765869140625, 1.9111328125, 2.03460693359375, 2.1580810546875, 2.28155517578125, 2.405029296875, 2.52850341796875, 2.6519775390625, 2.77545166015625, 2.89892578125, 3.02239990234375, 3.1458740234375, 3.26934814453125, 3.392822265625, 3.51629638671875, 3.6397705078125, 3.76324462890625, 3.88671875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 5.0, 9.0, 8.0, 6.0, 10.0, 10.0, 10.0, 12.0, 7.0, 20.0, 24.0, 22.0, 36.0, 33.0, 39.0, 34.0, 72.0, 55.0, 91.0, 110.0, 220.0, 1321.0, 237.0, 147.0, 86.0, 66.0, 59.0, 43.0, 28.0, 41.0, 28.0, 30.0, 28.0, 29.0, 14.0, 11.0, 15.0, 10.0, 6.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.1171875, -7.84228515625, -7.5673828125, -7.29248046875, -7.017578125, -6.74267578125, -6.4677734375, -6.19287109375, -5.91796875, -5.64306640625, -5.3681640625, -5.09326171875, -4.818359375, -4.54345703125, -4.2685546875, -3.99365234375, -3.71875, -3.44384765625, -3.1689453125, -2.89404296875, -2.619140625, -2.34423828125, -2.0693359375, -1.79443359375, -1.51953125, -1.24462890625, -0.9697265625, -0.69482421875, -0.419921875, -0.14501953125, 0.1298828125, 0.40478515625, 0.6796875, 0.95458984375, 1.2294921875, 1.50439453125, 1.779296875, 2.05419921875, 2.3291015625, 2.60400390625, 2.87890625, 3.15380859375, 3.4287109375, 3.70361328125, 3.978515625, 4.25341796875, 4.5283203125, 4.80322265625, 5.078125, 5.35302734375, 5.6279296875, 5.90283203125, 6.177734375, 6.45263671875, 6.7275390625, 7.00244140625, 7.27734375, 7.55224609375, 7.8271484375, 8.10205078125, 8.376953125, 8.65185546875, 8.9267578125, 9.20166015625, 9.4765625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 8.0, 7.0, 10.0, 10.0, 29.0, 30.0, 44.0, 72.0, 89.0, 123.0, 163.0, 249.0, 579.0, 1799.0, 11116.0, 170299.0, 2767685.0, 178652.0, 11487.0, 1731.0, 612.0, 296.0, 149.0, 126.0, 81.0, 54.0, 43.0, 36.0, 34.0, 20.0, 16.0, 19.0, 9.0, 3.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.875, -17.2890625, -16.703125, -16.1171875, -15.53125, -14.9453125, -14.359375, -13.7734375, -13.1875, -12.6015625, -12.015625, -11.4296875, -10.84375, -10.2578125, -9.671875, -9.0859375, -8.5, -7.9140625, -7.328125, -6.7421875, -6.15625, -5.5703125, -4.984375, -4.3984375, -3.8125, -3.2265625, -2.640625, -2.0546875, -1.46875, -0.8828125, -0.296875, 0.2890625, 0.875, 1.4609375, 2.046875, 2.6328125, 3.21875, 3.8046875, 4.390625, 4.9765625, 5.5625, 6.1484375, 6.734375, 7.3203125, 7.90625, 8.4921875, 9.078125, 9.6640625, 10.25, 10.8359375, 11.421875, 12.0078125, 12.59375, 13.1796875, 13.765625, 14.3515625, 14.9375, 15.5234375, 16.109375, 16.6953125, 17.28125, 17.8671875, 18.453125, 19.0390625, 19.625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 151.0, 649.0, 196.0, 20.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.149761199951172, -18.923728942871094, -13.697694778442383, -8.471661567687988, -3.2456283569335938, 1.9804039001464844, 7.206438064575195, 12.432472229003906, 17.658504486083984, 22.884536743164062, 28.110570907592773, 33.336605072021484, 38.56263732910156, 43.78866958618164, 49.01470184326172, 54.24073791503906, 59.46677017211914, 64.69280242919922, 69.91883850097656, 75.14486694335938, 80.37090301513672, 85.59693908691406, 90.82296752929688, 96.04900360107422, 101.27503967285156, 106.5010757446289, 111.72710418701172, 116.95314025878906, 122.17916870117188, 127.40520477294922, 132.63124084472656, 137.85726928710938, 143.08331298828125, 148.30934143066406, 153.53538513183594, 158.76141357421875, 163.98744201660156, 169.21347045898438, 174.43951416015625, 179.66554260253906, 184.89157104492188, 190.1175994873047, 195.34364318847656, 200.56967163085938, 205.7957000732422, 211.021728515625, 216.24777221679688, 221.4738006591797, 226.69984436035156, 231.92587280273438, 237.15191650390625, 242.37794494628906, 247.60397338867188, 252.83001708984375, 258.0560302734375, 263.2820739746094, 268.50811767578125, 273.7341613769531, 278.9601745605469, 284.18621826171875, 289.4122619628906, 294.6382751464844, 299.86431884765625, 305.0903625488281, 310.3163757324219]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 3.0, 4.0, 3.0, 8.0, 16.0, 13.0, 12.0, 19.0, 19.0, 23.0, 28.0, 30.0, 37.0, 35.0, 43.0, 37.0, 37.0, 45.0, 42.0, 57.0, 48.0, 45.0, 39.0, 38.0, 36.0, 39.0, 28.0, 42.0, 34.0, 18.0, 17.0, 23.0, 9.0, 22.0, 9.0, 13.0, 11.0, 3.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.152633666992188, -25.332061767578125, -24.511489868164062, -23.69091796875, -22.870344161987305, -22.049772262573242, -21.22920036315918, -20.408628463745117, -19.588054656982422, -18.76748275756836, -17.946910858154297, -17.126338958740234, -16.30576515197754, -15.485193252563477, -14.664621353149414, -13.844049453735352, -13.023477554321289, -12.202905654907227, -11.382332801818848, -10.561760902404785, -9.741188049316406, -8.920616149902344, -8.100044250488281, -7.2794718742370605, -6.45889949798584, -5.638327121734619, -4.817754745483398, -3.997182846069336, -3.1766104698181152, -2.3560380935668945, -1.535466194152832, -0.7148938179016113, 0.10568046569824219, 0.9262527227401733, 1.7468249797821045, 2.567397117614746, 3.387969493865967, 4.2085418701171875, 5.02911376953125, 5.849686145782471, 6.670258522033691, 7.490830898284912, 8.311403274536133, 9.131975173950195, 9.952547073364258, 10.773119926452637, 11.5936918258667, 12.414264678955078, 13.23483657836914, 14.055408477783203, 14.875981330871582, 15.696553230285645, 16.517126083374023, 17.337697982788086, 18.15826988220215, 18.97884178161621, 19.799415588378906, 20.61998748779297, 21.44055938720703, 22.261131286621094, 23.08170509338379, 23.90227699279785, 24.722848892211914, 25.543420791625977, 26.36399269104004]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 12.0, 2.0, 5.0, 6.0, 5.0, 6.0, 6.0, 9.0, 9.0, 11.0, 18.0, 23.0, 19.0, 21.0, 23.0, 23.0, 33.0, 26.0, 27.0, 37.0, 22.0, 34.0, 38.0, 32.0, 39.0, 34.0, 42.0, 44.0, 34.0, 29.0, 40.0, 27.0, 24.0, 33.0, 30.0, 30.0, 20.0, 21.0, 22.0, 11.0, 11.0, 15.0, 10.0, 11.0, 5.0, 8.0, 5.0, 8.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-2.349609375, -2.278961181640625, -2.20831298828125, -2.137664794921875, -2.0670166015625, -1.996368408203125, -1.92572021484375, -1.855072021484375, -1.784423828125, -1.713775634765625, -1.64312744140625, -1.572479248046875, -1.5018310546875, -1.431182861328125, -1.36053466796875, -1.289886474609375, -1.21923828125, -1.148590087890625, -1.07794189453125, -1.007293701171875, -0.9366455078125, -0.865997314453125, -0.79534912109375, -0.724700927734375, -0.654052734375, -0.583404541015625, -0.51275634765625, -0.442108154296875, -0.3714599609375, -0.300811767578125, -0.23016357421875, -0.159515380859375, -0.0888671875, -0.018218994140625, 0.05242919921875, 0.123077392578125, 0.1937255859375, 0.264373779296875, 0.33502197265625, 0.405670166015625, 0.476318359375, 0.546966552734375, 0.61761474609375, 0.688262939453125, 0.7589111328125, 0.829559326171875, 0.90020751953125, 0.970855712890625, 1.04150390625, 1.112152099609375, 1.18280029296875, 1.253448486328125, 1.3240966796875, 1.394744873046875, 1.46539306640625, 1.536041259765625, 1.606689453125, 1.677337646484375, 1.74798583984375, 1.818634033203125, 1.8892822265625, 1.959930419921875, 2.03057861328125, 2.101226806640625, 2.171875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 4.0, 4.0, 9.0, 13.0, 15.0, 16.0, 30.0, 36.0, 32.0, 57.0, 123.0, 225.0, 440.0, 1431.0, 5812.0, 33569.0, 239599.0, 1616195.0, 1928951.0, 313863.0, 43641.0, 7374.0, 1704.0, 507.0, 233.0, 120.0, 62.0, 54.0, 27.0, 30.0, 16.0, 16.0, 8.0, 7.0, 12.0, 10.0, 7.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.859375, -7.6473388671875, -7.435302734375, -7.2232666015625, -7.01123046875, -6.7991943359375, -6.587158203125, -6.3751220703125, -6.1630859375, -5.9510498046875, -5.739013671875, -5.5269775390625, -5.31494140625, -5.1029052734375, -4.890869140625, -4.6788330078125, -4.466796875, -4.2547607421875, -4.042724609375, -3.8306884765625, -3.61865234375, -3.4066162109375, -3.194580078125, -2.9825439453125, -2.7705078125, -2.5584716796875, -2.346435546875, -2.1343994140625, -1.92236328125, -1.7103271484375, -1.498291015625, -1.2862548828125, -1.07421875, -0.8621826171875, -0.650146484375, -0.4381103515625, -0.22607421875, -0.0140380859375, 0.197998046875, 0.4100341796875, 0.6220703125, 0.8341064453125, 1.046142578125, 1.2581787109375, 1.47021484375, 1.6822509765625, 1.894287109375, 2.1063232421875, 2.318359375, 2.5303955078125, 2.742431640625, 2.9544677734375, 3.16650390625, 3.3785400390625, 3.590576171875, 3.8026123046875, 4.0146484375, 4.2266845703125, 4.438720703125, 4.6507568359375, 4.86279296875, 5.0748291015625, 5.286865234375, 5.4989013671875, 5.7109375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 16.0, 16.0, 22.0, 16.0, 45.0, 57.0, 59.0, 98.0, 137.0, 169.0, 239.0, 284.0, 406.0, 439.0, 440.0, 386.0, 321.0, 263.0, 194.0, 142.0, 91.0, 54.0, 41.0, 46.0, 22.0, 19.0, 16.0, 11.0, 12.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.409423828125, -4.21728515625, -4.025146484375, -3.8330078125, -3.640869140625, -3.44873046875, -3.256591796875, -3.064453125, -2.872314453125, -2.68017578125, -2.488037109375, -2.2958984375, -2.103759765625, -1.91162109375, -1.719482421875, -1.52734375, -1.335205078125, -1.14306640625, -0.950927734375, -0.7587890625, -0.566650390625, -0.37451171875, -0.182373046875, 0.009765625, 0.201904296875, 0.39404296875, 0.586181640625, 0.7783203125, 0.970458984375, 1.16259765625, 1.354736328125, 1.546875, 1.739013671875, 1.93115234375, 2.123291015625, 2.3154296875, 2.507568359375, 2.69970703125, 2.891845703125, 3.083984375, 3.276123046875, 3.46826171875, 3.660400390625, 3.8525390625, 4.044677734375, 4.23681640625, 4.428955078125, 4.62109375, 4.813232421875, 5.00537109375, 5.197509765625, 5.3896484375, 5.581787109375, 5.77392578125, 5.966064453125, 6.158203125, 6.350341796875, 6.54248046875, 6.734619140625, 6.9267578125, 7.118896484375, 7.31103515625, 7.503173828125, 7.6953125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 15.0, 11.0, 25.0, 32.0, 36.0, 52.0, 82.0, 145.0, 171.0, 297.0, 686.0, 2326.0, 13596.0, 142809.0, 1486894.0, 2252146.0, 265348.0, 24467.0, 3318.0, 830.0, 378.0, 216.0, 118.0, 87.0, 70.0, 33.0, 30.0, 16.0, 19.0, 11.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-14.5625, -14.1995849609375, -13.836669921875, -13.4737548828125, -13.11083984375, -12.7479248046875, -12.385009765625, -12.0220947265625, -11.6591796875, -11.2962646484375, -10.933349609375, -10.5704345703125, -10.20751953125, -9.8446044921875, -9.481689453125, -9.1187744140625, -8.755859375, -8.3929443359375, -8.030029296875, -7.6671142578125, -7.30419921875, -6.9412841796875, -6.578369140625, -6.2154541015625, -5.8525390625, -5.4896240234375, -5.126708984375, -4.7637939453125, -4.40087890625, -4.0379638671875, -3.675048828125, -3.3121337890625, -2.94921875, -2.5863037109375, -2.223388671875, -1.8604736328125, -1.49755859375, -1.1346435546875, -0.771728515625, -0.4088134765625, -0.0458984375, 0.3170166015625, 0.679931640625, 1.0428466796875, 1.40576171875, 1.7686767578125, 2.131591796875, 2.4945068359375, 2.857421875, 3.2203369140625, 3.583251953125, 3.9461669921875, 4.30908203125, 4.6719970703125, 5.034912109375, 5.3978271484375, 5.7607421875, 6.1236572265625, 6.486572265625, 6.8494873046875, 7.21240234375, 7.5753173828125, 7.938232421875, 8.3011474609375, 8.6640625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 22.0, 65.0, 125.0, 196.0, 211.0, 194.0, 129.0, 52.0, 19.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.29646873474121, -26.009565353393555, -23.72266387939453, -21.435760498046875, -19.14885711669922, -16.861953735351562, -14.575051307678223, -12.288148880004883, -10.001245498657227, -7.7143425941467285, -5.4274396896362305, -3.1405367851257324, -0.8536338806152344, 1.4332695007324219, 3.7201719284057617, 6.007074356079102, 8.293977737426758, 10.580881118774414, 12.867783546447754, 15.154685974121094, 17.44158935546875, 19.728492736816406, 22.015396118164062, 24.302297592163086, 26.589200973510742, 28.8761043548584, 31.163005828857422, 33.44990921020508, 35.736812591552734, 38.02371597290039, 40.31061935424805, 42.59751892089844, 44.884429931640625, 47.17133331298828, 49.45823669433594, 51.745140075683594, 54.03204345703125, 56.318946838378906, 58.6058464050293, 60.89274978637695, 63.17965316772461, 65.466552734375, 67.75345611572266, 70.04035949707031, 72.32726287841797, 74.61416625976562, 76.90106964111328, 79.18797302246094, 81.4748764038086, 83.76177978515625, 86.0486831665039, 88.33558654785156, 90.62248992919922, 92.90939331054688, 95.19629669189453, 97.48320007324219, 99.77009582519531, 102.05699920654297, 104.34390258789062, 106.63080596923828, 108.91770935058594, 111.2046127319336, 113.49151611328125, 115.77841186523438, 118.06532287597656]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 7.0, 6.0, 9.0, 14.0, 7.0, 16.0, 19.0, 16.0, 27.0, 28.0, 22.0, 23.0, 39.0, 41.0, 31.0, 41.0, 50.0, 38.0, 49.0, 51.0, 43.0, 42.0, 47.0, 40.0, 37.0, 35.0, 33.0, 35.0, 23.0, 18.0, 27.0, 19.0, 14.0, 15.0, 14.0, 8.0, 2.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.35489273071289, -18.71091651916504, -18.066940307617188, -17.422964096069336, -16.778987884521484, -16.135011672973633, -15.491035461425781, -14.84705924987793, -14.203083038330078, -13.559106826782227, -12.915130615234375, -12.271154403686523, -11.627178192138672, -10.98320198059082, -10.339225769042969, -9.695249557495117, -9.051274299621582, -8.40729808807373, -7.763321876525879, -7.119345664978027, -6.475369453430176, -5.831393241882324, -5.187417507171631, -4.543441295623779, -3.8994650840759277, -3.255488872528076, -2.6115126609802246, -1.9675366878509521, -1.3235604763031006, -0.679584264755249, -0.03560829162597656, 0.608367919921875, 1.2523441314697266, 1.8963203430175781, 2.5402965545654297, 3.184272527694702, 3.8282487392425537, 4.472225189208984, 5.116200923919678, 5.760177135467529, 6.404153347015381, 7.048129558563232, 7.692105770111084, 8.336081504821777, 8.980057716369629, 9.62403392791748, 10.268010139465332, 10.911986351013184, 11.555962562561035, 12.199938774108887, 12.843914985656738, 13.48789119720459, 14.131867408752441, 14.775843620300293, 15.419818878173828, 16.06379508972168, 16.70777130126953, 17.351747512817383, 17.995723724365234, 18.639699935913086, 19.283676147460938, 19.92765235900879, 20.57162857055664, 21.215604782104492, 21.859580993652344]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 4.0, 10.0, 7.0, 9.0, 12.0, 15.0, 19.0, 18.0, 17.0, 24.0, 24.0, 25.0, 37.0, 37.0, 29.0, 36.0, 41.0, 38.0, 43.0, 37.0, 49.0, 48.0, 41.0, 30.0, 41.0, 42.0, 32.0, 34.0, 27.0, 29.0, 21.0, 17.0, 13.0, 17.0, 12.0, 12.0, 11.0, 11.0, 3.0, 6.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.52734375, -2.4481201171875, -2.368896484375, -2.2896728515625, -2.21044921875, -2.1312255859375, -2.052001953125, -1.9727783203125, -1.8935546875, -1.8143310546875, -1.735107421875, -1.6558837890625, -1.57666015625, -1.4974365234375, -1.418212890625, -1.3389892578125, -1.259765625, -1.1805419921875, -1.101318359375, -1.0220947265625, -0.94287109375, -0.8636474609375, -0.784423828125, -0.7052001953125, -0.6259765625, -0.5467529296875, -0.467529296875, -0.3883056640625, -0.30908203125, -0.2298583984375, -0.150634765625, -0.0714111328125, 0.0078125, 0.0870361328125, 0.166259765625, 0.2454833984375, 0.32470703125, 0.4039306640625, 0.483154296875, 0.5623779296875, 0.6416015625, 0.7208251953125, 0.800048828125, 0.8792724609375, 0.95849609375, 1.0377197265625, 1.116943359375, 1.1961669921875, 1.275390625, 1.3546142578125, 1.433837890625, 1.5130615234375, 1.59228515625, 1.6715087890625, 1.750732421875, 1.8299560546875, 1.9091796875, 1.9884033203125, 2.067626953125, 2.1468505859375, 2.22607421875, 2.3052978515625, 2.384521484375, 2.4637451171875, 2.54296875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 7.0, 0.0, 3.0, 6.0, 11.0, 21.0, 24.0, 41.0, 57.0, 88.0, 107.0, 162.0, 202.0, 353.0, 470.0, 734.0, 1048.0, 1551.0, 2156.0, 3194.0, 4771.0, 7029.0, 10483.0, 15759.0, 24475.0, 38780.0, 64419.0, 113587.0, 296862.0, 208680.0, 97159.0, 56496.0, 34607.0, 21584.0, 14302.0, 9379.0, 6228.0, 4340.0, 2991.0, 2029.0, 1359.0, 911.0, 634.0, 458.0, 335.0, 223.0, 150.0, 94.0, 66.0, 45.0, 30.0, 23.0, 19.0, 13.0, 5.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0], "bins": [-0.09991455078125, -0.09677982330322266, -0.09364509582519531, -0.09051036834716797, -0.08737564086914062, -0.08424091339111328, -0.08110618591308594, -0.0779714584350586, -0.07483673095703125, -0.0717020034790039, -0.06856727600097656, -0.06543254852294922, -0.062297821044921875, -0.05916309356689453, -0.05602836608886719, -0.052893638610839844, -0.0497589111328125, -0.046624183654785156, -0.04348945617675781, -0.04035472869873047, -0.037220001220703125, -0.03408527374267578, -0.030950546264648438, -0.027815818786621094, -0.02468109130859375, -0.021546363830566406, -0.018411636352539062, -0.015276908874511719, -0.012142181396484375, -0.009007453918457031, -0.0058727264404296875, -0.0027379989624023438, 0.000396728515625, 0.0035314559936523438, 0.0066661834716796875, 0.009800910949707031, 0.012935638427734375, 0.01607036590576172, 0.019205093383789062, 0.022339820861816406, 0.02547454833984375, 0.028609275817871094, 0.03174400329589844, 0.03487873077392578, 0.038013458251953125, 0.04114818572998047, 0.04428291320800781, 0.047417640686035156, 0.0505523681640625, 0.053687095642089844, 0.05682182312011719, 0.05995655059814453, 0.06309127807617188, 0.06622600555419922, 0.06936073303222656, 0.0724954605102539, 0.07563018798828125, 0.0787649154663086, 0.08189964294433594, 0.08503437042236328, 0.08816909790039062, 0.09130382537841797, 0.09443855285644531, 0.09757328033447266, 0.1007080078125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 5.0, 7.0, 11.0, 8.0, 7.0, 13.0, 18.0, 16.0, 25.0, 21.0, 19.0, 28.0, 29.0, 26.0, 33.0, 30.0, 31.0, 34.0, 22.0, 40.0, 39.0, 31.0, 1062.0, 33.0, 31.0, 27.0, 25.0, 35.0, 33.0, 33.0, 28.0, 34.0, 25.0, 16.0, 20.0, 23.0, 15.0, 17.0, 9.0, 3.0, 7.0, 4.0, 6.0, 5.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.59375, -1.5457000732421875, -1.497650146484375, -1.4496002197265625, -1.40155029296875, -1.3535003662109375, -1.305450439453125, -1.2574005126953125, -1.2093505859375, -1.1613006591796875, -1.113250732421875, -1.0652008056640625, -1.01715087890625, -0.9691009521484375, -0.921051025390625, -0.8730010986328125, -0.824951171875, -0.7769012451171875, -0.728851318359375, -0.6808013916015625, -0.63275146484375, -0.5847015380859375, -0.536651611328125, -0.4886016845703125, -0.4405517578125, -0.3925018310546875, -0.344451904296875, -0.2964019775390625, -0.24835205078125, -0.2003021240234375, -0.152252197265625, -0.1042022705078125, -0.05615234375, -0.0081024169921875, 0.039947509765625, 0.0879974365234375, 0.13604736328125, 0.1840972900390625, 0.232147216796875, 0.2801971435546875, 0.3282470703125, 0.3762969970703125, 0.424346923828125, 0.4723968505859375, 0.52044677734375, 0.5684967041015625, 0.616546630859375, 0.6645965576171875, 0.712646484375, 0.7606964111328125, 0.808746337890625, 0.8567962646484375, 0.90484619140625, 0.9528961181640625, 1.000946044921875, 1.0489959716796875, 1.0970458984375, 1.1450958251953125, 1.193145751953125, 1.2411956787109375, 1.28924560546875, 1.3372955322265625, 1.385345458984375, 1.4333953857421875, 1.4814453125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 9.0, 17.0, 19.0, 36.0, 50.0, 93.0, 90.0, 135.0, 202.0, 274.0, 382.0, 507.0, 690.0, 1000.0, 1371.0, 1775.0, 2535.0, 3539.0, 4763.0, 6620.0, 9456.0, 13451.0, 19368.0, 28519.0, 41963.0, 64137.0, 102609.0, 203636.0, 1275199.0, 106690.0, 66196.0, 43408.0, 29470.0, 20184.0, 13918.0, 9846.0, 6958.0, 5050.0, 3555.0, 2616.0, 1843.0, 1357.0, 995.0, 749.0, 560.0, 377.0, 277.0, 203.0, 153.0, 83.0, 78.0, 45.0, 29.0, 22.0, 14.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.043212890625, -0.041820526123046875, -0.04042816162109375, -0.039035797119140625, -0.0376434326171875, -0.036251068115234375, -0.03485870361328125, -0.033466339111328125, -0.032073974609375, -0.030681610107421875, -0.02928924560546875, -0.027896881103515625, -0.0265045166015625, -0.025112152099609375, -0.02371978759765625, -0.022327423095703125, -0.02093505859375, -0.019542694091796875, -0.01815032958984375, -0.016757965087890625, -0.0153656005859375, -0.013973236083984375, -0.01258087158203125, -0.011188507080078125, -0.009796142578125, -0.008403778076171875, -0.00701141357421875, -0.005619049072265625, -0.0042266845703125, -0.002834320068359375, -0.00144195556640625, -4.9591064453125e-05, 0.0013427734375, 0.002735137939453125, 0.00412750244140625, 0.005519866943359375, 0.0069122314453125, 0.008304595947265625, 0.00969696044921875, 0.011089324951171875, 0.012481689453125, 0.013874053955078125, 0.01526641845703125, 0.016658782958984375, 0.0180511474609375, 0.019443511962890625, 0.02083587646484375, 0.022228240966796875, 0.02362060546875, 0.025012969970703125, 0.02640533447265625, 0.027797698974609375, 0.0291900634765625, 0.030582427978515625, 0.03197479248046875, 0.033367156982421875, 0.034759521484375, 0.036151885986328125, 0.03754425048828125, 0.038936614990234375, 0.0403289794921875, 0.041721343994140625, 0.04311370849609375, 0.044506072998046875, 0.0458984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 0.0, 6.0, 5.0, 0.0, 8.0, 13.0, 0.0, 7.0, 13.0, 0.0, 14.0, 18.0, 0.0, 33.0, 42.0, 0.0, 58.0, 74.0, 0.0, 407.0, 96.0, 0.0, 70.0, 41.0, 0.0, 20.0, 21.0, 0.0, 8.0, 8.0, 0.0, 12.0, 9.0, 0.0, 6.0, 6.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 0.0, 4.0, 0.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4500692486763e-06, -1.4100223779678345e-06, -1.369975507259369e-06, -1.3299286365509033e-06, -1.2898817658424377e-06, -1.2498348951339722e-06, -1.2097880244255066e-06, -1.169741153717041e-06, -1.1296942830085754e-06, -1.0896474123001099e-06, -1.0496005415916443e-06, -1.0095536708831787e-06, -9.695068001747131e-07, -9.294599294662476e-07, -8.89413058757782e-07, -8.493661880493164e-07, -8.093193173408508e-07, -7.692724466323853e-07, -7.292255759239197e-07, -6.891787052154541e-07, -6.491318345069885e-07, -6.09084963798523e-07, -5.690380930900574e-07, -5.289912223815918e-07, -4.889443516731262e-07, -4.4889748096466064e-07, -4.0885061025619507e-07, -3.688037395477295e-07, -3.287568688392639e-07, -2.8870999813079834e-07, -2.4866312742233276e-07, -2.086162567138672e-07, -1.685693860054016e-07, -1.2852251529693604e-07, -8.847564458847046e-08, -4.842877388000488e-08, -8.381903171539307e-09, 3.166496753692627e-08, 7.171183824539185e-08, 1.1175870895385742e-07, 1.51805579662323e-07, 1.9185245037078857e-07, 2.3189932107925415e-07, 2.7194619178771973e-07, 3.119930624961853e-07, 3.520399332046509e-07, 3.9208680391311646e-07, 4.3213367462158203e-07, 4.721805453300476e-07, 5.122274160385132e-07, 5.522742867469788e-07, 5.923211574554443e-07, 6.323680281639099e-07, 6.724148988723755e-07, 7.124617695808411e-07, 7.525086402893066e-07, 7.925555109977722e-07, 8.326023817062378e-07, 8.726492524147034e-07, 9.126961231231689e-07, 9.527429938316345e-07, 9.927898645401e-07, 1.0328367352485657e-06, 1.0728836059570312e-06]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 1.0, 6.0, 5.0, 4.0, 4.0, 13.0, 25.0, 39.0, 67.0, 70.0, 134.0, 464.0, 9927.0, 899641.0, 134032.0, 3501.0, 280.0, 123.0, 65.0, 43.0, 26.0, 21.0, 12.0, 8.0, 11.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2590160369873047e-05, -2.1778978407382965e-05, -2.0967796444892883e-05, -2.01566144824028e-05, -1.934543251991272e-05, -1.8534250557422638e-05, -1.7723068594932556e-05, -1.6911886632442474e-05, -1.6100704669952393e-05, -1.528952270746231e-05, -1.4478340744972229e-05, -1.3667158782482147e-05, -1.2855976819992065e-05, -1.2044794857501984e-05, -1.1233612895011902e-05, -1.042243093252182e-05, -9.611248970031738e-06, -8.800067007541656e-06, -7.988885045051575e-06, -7.177703082561493e-06, -6.366521120071411e-06, -5.555339157581329e-06, -4.7441571950912476e-06, -3.932975232601166e-06, -3.121793270111084e-06, -2.310611307621002e-06, -1.4994293451309204e-06, -6.882473826408386e-07, 1.2293457984924316e-07, 9.34116542339325e-07, 1.7452985048294067e-06, 2.5564804673194885e-06, 3.3676624298095703e-06, 4.178844392299652e-06, 4.990026354789734e-06, 5.801208317279816e-06, 6.6123902797698975e-06, 7.423572242259979e-06, 8.234754204750061e-06, 9.045936167240143e-06, 9.857118129730225e-06, 1.0668300092220306e-05, 1.1479482054710388e-05, 1.229066401720047e-05, 1.3101845979690552e-05, 1.3913027942180634e-05, 1.4724209904670715e-05, 1.5535391867160797e-05, 1.634657382965088e-05, 1.715775579214096e-05, 1.7968937754631042e-05, 1.8780119717121124e-05, 1.9591301679611206e-05, 2.0402483642101288e-05, 2.121366560459137e-05, 2.202484756708145e-05, 2.2836029529571533e-05, 2.3647211492061615e-05, 2.4458393454551697e-05, 2.526957541704178e-05, 2.608075737953186e-05, 2.6891939342021942e-05, 2.7703121304512024e-05, 2.8514303267002106e-05, 2.9325485229492188e-05]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 13.0, 26.0, 48.0, 88.0, 607.0, 97.0, 58.0, 33.0, 25.0, 9.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.8092907794198254e-06, -1.7743664102454204e-06, -1.7394421547578531e-06, -1.7045177855834481e-06, -1.6695935300958809e-06, -1.6346691609214759e-06, -1.5997447917470708e-06, -1.5648205362595036e-06, -1.5298961670850986e-06, -1.4949717979106936e-06, -1.4600475424231263e-06, -1.4251231732487213e-06, -1.390198917761154e-06, -1.355274548586749e-06, -1.3203502930991817e-06, -1.2854259239247767e-06, -1.2505015547503717e-06, -1.2155771855759667e-06, -1.1806529300883994e-06, -1.1457285609139944e-06, -1.1108043054264272e-06, -1.0758799362520222e-06, -1.0409555670776172e-06, -1.0060313115900499e-06, -9.711070561024826e-07, -9.361827437714965e-07, -9.012584314405103e-07, -8.663340622661053e-07, -8.314097499351192e-07, -7.96485437604133e-07, -7.615611252731469e-07, -7.266368129421608e-07, -6.917125574545935e-07, -6.567882451236073e-07, -6.218639327926212e-07, -5.869395636182162e-07, -5.520152512872301e-07, -5.170909389562439e-07, -4.821666266252578e-07, -4.472422858725622e-07, -4.1231794511986664e-07, -3.773936327888805e-07, -3.424692920361849e-07, -3.075449797051988e-07, -2.726206389525032e-07, -2.3769632662151707e-07, -2.0277201429053093e-07, -1.6784767353783536e-07, -1.3292336120684922e-07, -9.799903466500837e-08, -6.307471522859487e-08, -2.815039579218137e-08, 6.773930749659485e-09, 4.169825729150034e-08, 7.662256962248648e-08, 1.1154691037518205e-07, 1.464712227061682e-07, 1.8139554924800905e-07, 2.163198757898499e-07, 2.5124418812083604e-07, 2.861685288735316e-07, 3.2109284120451775e-07, 3.560171535355039e-07, 3.9094149428819946e-07, 4.258658066191856e-07]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 56.0, 0.0, 0.0, 0.0, 0.0, 147.0, 0.0, 0.0, 0.0, 0.0, 539.0, 0.0, 0.0, 0.0, 155.0, 0.0, 0.0, 0.0, 0.0, 47.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 4.0, 10.0, 7.0, 9.0, 12.0, 15.0, 19.0, 18.0, 17.0, 24.0, 24.0, 25.0, 37.0, 37.0, 29.0, 36.0, 41.0, 38.0, 43.0, 37.0, 49.0, 48.0, 41.0, 30.0, 41.0, 42.0, 32.0, 34.0, 27.0, 29.0, 21.0, 17.0, 13.0, 17.0, 12.0, 12.0, 11.0, 11.0, 3.0, 6.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.52734375, -2.4481201171875, -2.368896484375, -2.2896728515625, -2.21044921875, -2.1312255859375, -2.052001953125, -1.9727783203125, -1.8935546875, -1.8143310546875, -1.735107421875, -1.6558837890625, -1.57666015625, -1.4974365234375, -1.418212890625, -1.3389892578125, -1.259765625, -1.1805419921875, -1.101318359375, -1.0220947265625, -0.94287109375, -0.8636474609375, -0.784423828125, -0.7052001953125, -0.6259765625, -0.5467529296875, -0.467529296875, -0.3883056640625, -0.30908203125, -0.2298583984375, -0.150634765625, -0.0714111328125, 0.0078125, 0.0870361328125, 0.166259765625, 0.2454833984375, 0.32470703125, 0.4039306640625, 0.483154296875, 0.5623779296875, 0.6416015625, 0.7208251953125, 0.800048828125, 0.8792724609375, 0.95849609375, 1.0377197265625, 1.116943359375, 1.1961669921875, 1.275390625, 1.3546142578125, 1.433837890625, 1.5130615234375, 1.59228515625, 1.6715087890625, 1.750732421875, 1.8299560546875, 1.9091796875, 1.9884033203125, 2.067626953125, 2.1468505859375, 2.22607421875, 2.3052978515625, 2.384521484375, 2.4637451171875, 2.54296875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 3.0, 10.0, 16.0, 33.0, 47.0, 82.0, 138.0, 224.0, 352.0, 651.0, 1088.0, 1836.0, 3035.0, 5169.0, 8514.0, 13632.0, 23054.0, 38508.0, 65543.0, 116250.0, 230909.0, 246919.0, 122996.0, 68780.0, 40215.0, 23873.0, 14776.0, 8855.0, 5193.0, 3132.0, 1861.0, 1179.0, 684.0, 375.0, 251.0, 131.0, 73.0, 53.0, 34.0, 33.0, 13.0, 10.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.505859375, -2.41650390625, -2.3271484375, -2.23779296875, -2.1484375, -2.05908203125, -1.9697265625, -1.88037109375, -1.791015625, -1.70166015625, -1.6123046875, -1.52294921875, -1.43359375, -1.34423828125, -1.2548828125, -1.16552734375, -1.076171875, -0.98681640625, -0.8974609375, -0.80810546875, -0.71875, -0.62939453125, -0.5400390625, -0.45068359375, -0.361328125, -0.27197265625, -0.1826171875, -0.09326171875, -0.00390625, 0.08544921875, 0.1748046875, 0.26416015625, 0.353515625, 0.44287109375, 0.5322265625, 0.62158203125, 0.7109375, 0.80029296875, 0.8896484375, 0.97900390625, 1.068359375, 1.15771484375, 1.2470703125, 1.33642578125, 1.42578125, 1.51513671875, 1.6044921875, 1.69384765625, 1.783203125, 1.87255859375, 1.9619140625, 2.05126953125, 2.140625, 2.22998046875, 2.3193359375, 2.40869140625, 2.498046875, 2.58740234375, 2.6767578125, 2.76611328125, 2.85546875, 2.94482421875, 3.0341796875, 3.12353515625, 3.212890625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 8.0, 13.0, 11.0, 13.0, 9.0, 32.0, 16.0, 23.0, 31.0, 31.0, 36.0, 41.0, 58.0, 63.0, 92.0, 154.0, 278.0, 1394.0, 195.0, 115.0, 83.0, 67.0, 40.0, 38.0, 24.0, 31.0, 24.0, 23.0, 21.0, 16.0, 11.0, 13.0, 9.0, 3.0, 11.0, 1.0, 8.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.679931640625, -8.38330078125, -8.086669921875, -7.7900390625, -7.493408203125, -7.19677734375, -6.900146484375, -6.603515625, -6.306884765625, -6.01025390625, -5.713623046875, -5.4169921875, -5.120361328125, -4.82373046875, -4.527099609375, -4.23046875, -3.933837890625, -3.63720703125, -3.340576171875, -3.0439453125, -2.747314453125, -2.45068359375, -2.154052734375, -1.857421875, -1.560791015625, -1.26416015625, -0.967529296875, -0.6708984375, -0.374267578125, -0.07763671875, 0.218994140625, 0.515625, 0.812255859375, 1.10888671875, 1.405517578125, 1.7021484375, 1.998779296875, 2.29541015625, 2.592041015625, 2.888671875, 3.185302734375, 3.48193359375, 3.778564453125, 4.0751953125, 4.371826171875, 4.66845703125, 4.965087890625, 5.26171875, 5.558349609375, 5.85498046875, 6.151611328125, 6.4482421875, 6.744873046875, 7.04150390625, 7.338134765625, 7.634765625, 7.931396484375, 8.22802734375, 8.524658203125, 8.8212890625, 9.117919921875, 9.41455078125, 9.711181640625, 10.0078125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 10.0, 9.0, 9.0, 12.0, 16.0, 14.0, 35.0, 30.0, 57.0, 69.0, 95.0, 132.0, 194.0, 389.0, 1014.0, 7393.0, 201694.0, 2805734.0, 121446.0, 5386.0, 888.0, 326.0, 205.0, 136.0, 102.0, 81.0, 60.0, 33.0, 38.0, 20.0, 19.0, 13.0, 11.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.109375, -20.513671875, -19.91796875, -19.322265625, -18.7265625, -18.130859375, -17.53515625, -16.939453125, -16.34375, -15.748046875, -15.15234375, -14.556640625, -13.9609375, -13.365234375, -12.76953125, -12.173828125, -11.578125, -10.982421875, -10.38671875, -9.791015625, -9.1953125, -8.599609375, -8.00390625, -7.408203125, -6.8125, -6.216796875, -5.62109375, -5.025390625, -4.4296875, -3.833984375, -3.23828125, -2.642578125, -2.046875, -1.451171875, -0.85546875, -0.259765625, 0.3359375, 0.931640625, 1.52734375, 2.123046875, 2.71875, 3.314453125, 3.91015625, 4.505859375, 5.1015625, 5.697265625, 6.29296875, 6.888671875, 7.484375, 8.080078125, 8.67578125, 9.271484375, 9.8671875, 10.462890625, 11.05859375, 11.654296875, 12.25, 12.845703125, 13.44140625, 14.037109375, 14.6328125, 15.228515625, 15.82421875, 16.419921875, 17.015625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 12.0, 52.0, 125.0, 225.0, 278.0, 195.0, 81.0, 35.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.813081741333008, -16.073143005371094, -14.333202362060547, -12.593262672424316, -10.853322982788086, -9.113383293151855, -7.373443603515625, -5.6335039138793945, -3.893564224243164, -2.1536245346069336, -0.4136848449707031, 1.3262548446655273, 3.066194534301758, 4.806134223937988, 6.546073913574219, 8.28601360321045, 10.02595329284668, 11.76589298248291, 13.50583267211914, 15.245772361755371, 16.9857120513916, 18.725650787353516, 20.465591430664062, 22.20553207397461, 23.945470809936523, 25.685409545898438, 27.425350189208984, 29.16529083251953, 30.905229568481445, 32.64516830444336, 34.385108947753906, 36.12504959106445, 37.864990234375, 39.60493087768555, 41.344871520996094, 43.084808349609375, 44.82474899291992, 46.56468963623047, 48.30462646484375, 50.0445671081543, 51.784507751464844, 53.52444839477539, 55.26438903808594, 57.00432586669922, 58.744266510009766, 60.48420715332031, 62.224143981933594, 63.96408462524414, 65.70402526855469, 67.44396209716797, 69.18390655517578, 70.92384338378906, 72.66378784179688, 74.40372467041016, 76.14366149902344, 77.88360595703125, 79.62354278564453, 81.36347961425781, 83.10342407226562, 84.8433609008789, 86.58329772949219, 88.3232421875, 90.06317901611328, 91.8031234741211, 93.54306030273438]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 12.0, 14.0, 13.0, 7.0, 13.0, 24.0, 17.0, 21.0, 37.0, 33.0, 46.0, 44.0, 48.0, 48.0, 46.0, 44.0, 52.0, 44.0, 53.0, 40.0, 47.0, 44.0, 40.0, 32.0, 35.0, 30.0, 30.0, 22.0, 16.0, 8.0, 9.0, 13.0, 6.0, 1.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.407669067382812, -28.35000991821289, -27.29235076904297, -26.23469352722168, -25.177034378051758, -24.119375228881836, -23.061717987060547, -22.004058837890625, -20.946399688720703, -19.88874053955078, -18.83108139038086, -17.77342414855957, -16.71576499938965, -15.658105850219727, -14.600447654724121, -13.542789459228516, -12.485130310058594, -11.427471160888672, -10.369812965393066, -9.312154769897461, -8.254495620727539, -7.196836948394775, -6.139178276062012, -5.081519603729248, -4.023860931396484, -2.9662022590637207, -1.908543586730957, -0.8508849143981934, 0.2067737579345703, 1.264432430267334, 2.3220911026000977, 3.3797497749328613, 4.437412261962891, 5.495070934295654, 6.552729606628418, 7.610388278961182, 8.668046951293945, 9.725706100463867, 10.783364295959473, 11.841022491455078, 12.898681640625, 13.956340789794922, 15.013998985290527, 16.071657180786133, 17.129316329956055, 18.186975479125977, 19.244632720947266, 20.302291870117188, 21.35995101928711, 22.41761016845703, 23.475269317626953, 24.532926559448242, 25.590585708618164, 26.648244857788086, 27.705902099609375, 28.763561248779297, 29.82122039794922, 30.87887954711914, 31.936538696289062, 32.994197845458984, 34.051856994628906, 35.10951232910156, 36.167171478271484, 37.224830627441406, 38.28248977661133]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 6.0, 7.0, 10.0, 11.0, 18.0, 23.0, 11.0, 14.0, 17.0, 16.0, 38.0, 37.0, 30.0, 40.0, 34.0, 51.0, 38.0, 43.0, 36.0, 44.0, 50.0, 38.0, 43.0, 36.0, 34.0, 45.0, 30.0, 28.0, 23.0, 20.0, 13.0, 23.0, 13.0, 17.0, 12.0, 7.0, 7.0, 10.0, 4.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.923828125, -2.8353271484375, -2.746826171875, -2.6583251953125, -2.56982421875, -2.4813232421875, -2.392822265625, -2.3043212890625, -2.2158203125, -2.1273193359375, -2.038818359375, -1.9503173828125, -1.86181640625, -1.7733154296875, -1.684814453125, -1.5963134765625, -1.5078125, -1.4193115234375, -1.330810546875, -1.2423095703125, -1.15380859375, -1.0653076171875, -0.976806640625, -0.8883056640625, -0.7998046875, -0.7113037109375, -0.622802734375, -0.5343017578125, -0.44580078125, -0.3572998046875, -0.268798828125, -0.1802978515625, -0.091796875, -0.0032958984375, 0.085205078125, 0.1737060546875, 0.26220703125, 0.3507080078125, 0.439208984375, 0.5277099609375, 0.6162109375, 0.7047119140625, 0.793212890625, 0.8817138671875, 0.97021484375, 1.0587158203125, 1.147216796875, 1.2357177734375, 1.32421875, 1.4127197265625, 1.501220703125, 1.5897216796875, 1.67822265625, 1.7667236328125, 1.855224609375, 1.9437255859375, 2.0322265625, 2.1207275390625, 2.209228515625, 2.2977294921875, 2.38623046875, 2.4747314453125, 2.563232421875, 2.6517333984375, 2.740234375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 8.0, 19.0, 13.0, 14.0, 32.0, 25.0, 26.0, 39.0, 76.0, 112.0, 250.0, 651.0, 2075.0, 8952.0, 50167.0, 359580.0, 2010171.0, 1494789.0, 225136.0, 32996.0, 6388.0, 1593.0, 571.0, 218.0, 108.0, 72.0, 41.0, 36.0, 20.0, 15.0, 15.0, 5.0, 9.0, 9.0, 5.0, 12.0, 3.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80859375, -6.588134765625, -6.36767578125, -6.147216796875, -5.9267578125, -5.706298828125, -5.48583984375, -5.265380859375, -5.044921875, -4.824462890625, -4.60400390625, -4.383544921875, -4.1630859375, -3.942626953125, -3.72216796875, -3.501708984375, -3.28125, -3.060791015625, -2.84033203125, -2.619873046875, -2.3994140625, -2.178955078125, -1.95849609375, -1.738037109375, -1.517578125, -1.297119140625, -1.07666015625, -0.856201171875, -0.6357421875, -0.415283203125, -0.19482421875, 0.025634765625, 0.24609375, 0.466552734375, 0.68701171875, 0.907470703125, 1.1279296875, 1.348388671875, 1.56884765625, 1.789306640625, 2.009765625, 2.230224609375, 2.45068359375, 2.671142578125, 2.8916015625, 3.112060546875, 3.33251953125, 3.552978515625, 3.7734375, 3.993896484375, 4.21435546875, 4.434814453125, 4.6552734375, 4.875732421875, 5.09619140625, 5.316650390625, 5.537109375, 5.757568359375, 5.97802734375, 6.198486328125, 6.4189453125, 6.639404296875, 6.85986328125, 7.080322265625, 7.30078125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 6.0, 11.0, 15.0, 16.0, 36.0, 44.0, 72.0, 70.0, 138.0, 184.0, 236.0, 305.0, 409.0, 439.0, 494.0, 421.0, 298.0, 242.0, 174.0, 119.0, 104.0, 62.0, 47.0, 47.0, 29.0, 16.0, 12.0, 9.0, 8.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.85516357421875, -4.6439208984375, -4.43267822265625, -4.221435546875, -4.01019287109375, -3.7989501953125, -3.58770751953125, -3.37646484375, -3.16522216796875, -2.9539794921875, -2.74273681640625, -2.531494140625, -2.32025146484375, -2.1090087890625, -1.89776611328125, -1.6865234375, -1.47528076171875, -1.2640380859375, -1.05279541015625, -0.841552734375, -0.63031005859375, -0.4190673828125, -0.20782470703125, 0.00341796875, 0.21466064453125, 0.4259033203125, 0.63714599609375, 0.848388671875, 1.05963134765625, 1.2708740234375, 1.48211669921875, 1.693359375, 1.90460205078125, 2.1158447265625, 2.32708740234375, 2.538330078125, 2.74957275390625, 2.9608154296875, 3.17205810546875, 3.38330078125, 3.59454345703125, 3.8057861328125, 4.01702880859375, 4.228271484375, 4.43951416015625, 4.6507568359375, 4.86199951171875, 5.0732421875, 5.28448486328125, 5.4957275390625, 5.70697021484375, 5.918212890625, 6.12945556640625, 6.3406982421875, 6.55194091796875, 6.76318359375, 6.97442626953125, 7.1856689453125, 7.39691162109375, 7.608154296875, 7.81939697265625, 8.0306396484375, 8.24188232421875, 8.453125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 9.0, 9.0, 25.0, 26.0, 50.0, 59.0, 82.0, 121.0, 193.0, 324.0, 642.0, 4233.0, 254229.0, 3727098.0, 201952.0, 3774.0, 637.0, 321.0, 182.0, 98.0, 73.0, 51.0, 33.0, 17.0, 15.0, 11.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.15625, -26.450439453125, -25.74462890625, -25.038818359375, -24.3330078125, -23.627197265625, -22.92138671875, -22.215576171875, -21.509765625, -20.803955078125, -20.09814453125, -19.392333984375, -18.6865234375, -17.980712890625, -17.27490234375, -16.569091796875, -15.86328125, -15.157470703125, -14.45166015625, -13.745849609375, -13.0400390625, -12.334228515625, -11.62841796875, -10.922607421875, -10.216796875, -9.510986328125, -8.80517578125, -8.099365234375, -7.3935546875, -6.687744140625, -5.98193359375, -5.276123046875, -4.5703125, -3.864501953125, -3.15869140625, -2.452880859375, -1.7470703125, -1.041259765625, -0.33544921875, 0.370361328125, 1.076171875, 1.781982421875, 2.48779296875, 3.193603515625, 3.8994140625, 4.605224609375, 5.31103515625, 6.016845703125, 6.72265625, 7.428466796875, 8.13427734375, 8.840087890625, 9.5458984375, 10.251708984375, 10.95751953125, 11.663330078125, 12.369140625, 13.074951171875, 13.78076171875, 14.486572265625, 15.1923828125, 15.898193359375, 16.60400390625, 17.309814453125, 18.015625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 14.0, 68.0, 147.0, 227.0, 275.0, 171.0, 80.0, 24.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.93401336669922, -86.46440887451172, -83.99480438232422, -81.52519989013672, -79.05558776855469, -76.58598327636719, -74.11637878417969, -71.64677429199219, -69.17716979980469, -66.70756530761719, -64.23796081542969, -61.76835250854492, -59.29874801635742, -56.82914352416992, -54.359535217285156, -51.889930725097656, -49.420326232910156, -46.950721740722656, -44.481117248535156, -42.01150894165039, -39.54190444946289, -37.07229995727539, -34.602691650390625, -32.133087158203125, -29.663482666015625, -27.193878173828125, -24.724271774291992, -22.25466537475586, -19.78506088256836, -17.31545639038086, -14.845849990844727, -12.376243591308594, -9.906646728515625, -7.437041282653809, -4.967435836791992, -2.497830390930176, -0.028224945068359375, 2.441380500793457, 4.910985946655273, 7.380592346191406, 9.850196838378906, 12.319802284240723, 14.789407730102539, 17.259014129638672, 19.728618621826172, 22.198223114013672, 24.667829513549805, 27.137435913085938, 29.607040405273438, 32.07664489746094, 34.54624938964844, 37.0158576965332, 39.4854621887207, 41.9550666809082, 44.42467498779297, 46.89427947998047, 49.36388397216797, 51.83348846435547, 54.30309295654297, 56.772701263427734, 59.242305755615234, 61.711910247802734, 64.1815185546875, 66.651123046875, 69.1207275390625]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 11.0, 5.0, 5.0, 6.0, 20.0, 17.0, 18.0, 13.0, 25.0, 36.0, 29.0, 29.0, 35.0, 27.0, 29.0, 38.0, 48.0, 29.0, 41.0, 37.0, 48.0, 37.0, 42.0, 41.0, 39.0, 36.0, 37.0, 37.0, 16.0, 29.0, 8.0, 22.0, 22.0, 14.0, 14.0, 12.0, 16.0, 8.0, 8.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-22.92513656616211, -22.26451301574707, -21.6038875579834, -20.94326400756836, -20.28264045715332, -19.62201499938965, -18.96139144897461, -18.300765991210938, -17.6401424407959, -16.97951889038086, -16.318893432617188, -15.658269882202148, -14.997645378112793, -14.337020874023438, -13.676397323608398, -13.015772819519043, -12.355149269104004, -11.694524765014648, -11.03390121459961, -10.373276710510254, -9.712652206420898, -9.05202865600586, -8.391404151916504, -7.730779647827148, -7.070155620574951, -6.409531593322754, -5.748907089233398, -5.088283061981201, -4.427659034729004, -3.7670345306396484, -3.106410503387451, -2.4457859992980957, -1.7851619720458984, -1.124537706375122, -0.46391355991363525, 0.19671058654785156, 0.8573348522186279, 1.5179591178894043, 2.1785831451416016, 2.839207649230957, 3.4998316764831543, 4.160455703735352, 4.821080207824707, 5.481704235076904, 6.142328262329102, 6.802952766418457, 7.463576793670654, 8.124200820922852, 8.784825325012207, 9.445449829101562, 10.106073379516602, 10.766697883605957, 11.427322387695312, 12.087945938110352, 12.748570442199707, 13.409194946289062, 14.069818496704102, 14.730443000793457, 15.391066551208496, 16.05169105529785, 16.71231460571289, 17.372940063476562, 18.0335636138916, 18.69418716430664, 19.354812622070312]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 11.0, 8.0, 4.0, 12.0, 9.0, 10.0, 9.0, 18.0, 22.0, 18.0, 28.0, 28.0, 38.0, 37.0, 30.0, 32.0, 35.0, 43.0, 46.0, 47.0, 45.0, 42.0, 32.0, 43.0, 48.0, 43.0, 32.0, 31.0, 22.0, 24.0, 13.0, 31.0, 9.0, 18.0, 19.0, 19.0, 7.0, 8.0, 8.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.87890625, -2.792877197265625, -2.70684814453125, -2.620819091796875, -2.5347900390625, -2.448760986328125, -2.36273193359375, -2.276702880859375, -2.190673828125, -2.104644775390625, -2.01861572265625, -1.932586669921875, -1.8465576171875, -1.760528564453125, -1.67449951171875, -1.588470458984375, -1.50244140625, -1.416412353515625, -1.33038330078125, -1.244354248046875, -1.1583251953125, -1.072296142578125, -0.98626708984375, -0.900238037109375, -0.814208984375, -0.728179931640625, -0.64215087890625, -0.556121826171875, -0.4700927734375, -0.384063720703125, -0.29803466796875, -0.212005615234375, -0.1259765625, -0.039947509765625, 0.04608154296875, 0.132110595703125, 0.2181396484375, 0.304168701171875, 0.39019775390625, 0.476226806640625, 0.562255859375, 0.648284912109375, 0.73431396484375, 0.820343017578125, 0.9063720703125, 0.992401123046875, 1.07843017578125, 1.164459228515625, 1.25048828125, 1.336517333984375, 1.42254638671875, 1.508575439453125, 1.5946044921875, 1.680633544921875, 1.76666259765625, 1.852691650390625, 1.938720703125, 2.024749755859375, 2.11077880859375, 2.196807861328125, 2.2828369140625, 2.368865966796875, 2.45489501953125, 2.540924072265625, 2.626953125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 5.0, 6.0, 6.0, 6.0, 21.0, 23.0, 46.0, 50.0, 71.0, 120.0, 166.0, 225.0, 360.0, 475.0, 709.0, 963.0, 1454.0, 2035.0, 2816.0, 3928.0, 5860.0, 8089.0, 11934.0, 17284.0, 26051.0, 39701.0, 64555.0, 115776.0, 296585.0, 193705.0, 93628.0, 55043.0, 34104.0, 22847.0, 15279.0, 10433.0, 7150.0, 4966.0, 3624.0, 2547.0, 1699.0, 1281.0, 904.0, 656.0, 408.0, 294.0, 215.0, 149.0, 114.0, 54.0, 58.0, 25.0, 20.0, 15.0, 12.0, 4.0, 6.0, 5.0, 5.0, 1.0], "bins": [-0.1070556640625, -0.10379505157470703, -0.10053443908691406, -0.0972738265991211, -0.09401321411132812, -0.09075260162353516, -0.08749198913574219, -0.08423137664794922, -0.08097076416015625, -0.07771015167236328, -0.07444953918457031, -0.07118892669677734, -0.06792831420898438, -0.0646677017211914, -0.06140708923339844, -0.05814647674560547, -0.0548858642578125, -0.05162525177001953, -0.04836463928222656, -0.045104026794433594, -0.041843414306640625, -0.038582801818847656, -0.03532218933105469, -0.03206157684326172, -0.02880096435546875, -0.02554035186767578, -0.022279739379882812, -0.019019126892089844, -0.015758514404296875, -0.012497901916503906, -0.009237289428710938, -0.005976676940917969, -0.002716064453125, 0.0005445480346679688, 0.0038051605224609375, 0.007065773010253906, 0.010326385498046875, 0.013586997985839844, 0.016847610473632812, 0.02010822296142578, 0.02336883544921875, 0.02662944793701172, 0.029890060424804688, 0.033150672912597656, 0.036411285400390625, 0.039671897888183594, 0.04293251037597656, 0.04619312286376953, 0.0494537353515625, 0.05271434783935547, 0.05597496032714844, 0.059235572814941406, 0.062496185302734375, 0.06575679779052734, 0.06901741027832031, 0.07227802276611328, 0.07553863525390625, 0.07879924774169922, 0.08205986022949219, 0.08532047271728516, 0.08858108520507812, 0.0918416976928711, 0.09510231018066406, 0.09836292266845703, 0.10162353515625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 8.0, 6.0, 6.0, 6.0, 10.0, 6.0, 14.0, 13.0, 24.0, 23.0, 26.0, 23.0, 29.0, 37.0, 27.0, 36.0, 24.0, 35.0, 48.0, 43.0, 39.0, 1059.0, 32.0, 38.0, 31.0, 35.0, 27.0, 34.0, 21.0, 34.0, 34.0, 21.0, 33.0, 26.0, 25.0, 12.0, 10.0, 18.0, 9.0, 10.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.658203125, -1.60418701171875, -1.5501708984375, -1.49615478515625, -1.442138671875, -1.38812255859375, -1.3341064453125, -1.28009033203125, -1.22607421875, -1.17205810546875, -1.1180419921875, -1.06402587890625, -1.010009765625, -0.95599365234375, -0.9019775390625, -0.84796142578125, -0.7939453125, -0.73992919921875, -0.6859130859375, -0.63189697265625, -0.577880859375, -0.52386474609375, -0.4698486328125, -0.41583251953125, -0.36181640625, -0.30780029296875, -0.2537841796875, -0.19976806640625, -0.145751953125, -0.09173583984375, -0.0377197265625, 0.01629638671875, 0.0703125, 0.12432861328125, 0.1783447265625, 0.23236083984375, 0.286376953125, 0.34039306640625, 0.3944091796875, 0.44842529296875, 0.50244140625, 0.55645751953125, 0.6104736328125, 0.66448974609375, 0.718505859375, 0.77252197265625, 0.8265380859375, 0.88055419921875, 0.9345703125, 0.98858642578125, 1.0426025390625, 1.09661865234375, 1.150634765625, 1.20465087890625, 1.2586669921875, 1.31268310546875, 1.36669921875, 1.42071533203125, 1.4747314453125, 1.52874755859375, 1.582763671875, 1.63677978515625, 1.6907958984375, 1.74481201171875, 1.798828125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 17.0, 27.0, 38.0, 63.0, 78.0, 117.0, 179.0, 249.0, 353.0, 509.0, 721.0, 977.0, 1345.0, 1956.0, 2816.0, 4213.0, 5916.0, 8628.0, 12929.0, 19168.0, 28353.0, 42380.0, 66980.0, 113855.0, 1300745.0, 200822.0, 102220.0, 60510.0, 39323.0, 26096.0, 17580.0, 11866.0, 7999.0, 5475.0, 3807.0, 2656.0, 1789.0, 1318.0, 919.0, 597.0, 461.0, 300.0, 223.0, 156.0, 112.0, 95.0, 52.0, 53.0, 28.0, 21.0, 15.0, 7.0, 8.0, 2.0, 1.0, 2.0], "bins": [-0.05181884765625, -0.05024385452270508, -0.048668861389160156, -0.047093868255615234, -0.04551887512207031, -0.04394388198852539, -0.04236888885498047, -0.04079389572143555, -0.039218902587890625, -0.0376439094543457, -0.03606891632080078, -0.03449392318725586, -0.03291893005371094, -0.031343936920166016, -0.029768943786621094, -0.028193950653076172, -0.02661895751953125, -0.025043964385986328, -0.023468971252441406, -0.021893978118896484, -0.020318984985351562, -0.01874399185180664, -0.01716899871826172, -0.015594005584716797, -0.014019012451171875, -0.012444019317626953, -0.010869026184082031, -0.00929403305053711, -0.0077190399169921875, -0.006144046783447266, -0.004569053649902344, -0.002994060516357422, -0.0014190673828125, 0.00015592575073242188, 0.0017309188842773438, 0.0033059120178222656, 0.0048809051513671875, 0.006455898284912109, 0.008030891418457031, 0.009605884552001953, 0.011180877685546875, 0.012755870819091797, 0.014330863952636719, 0.01590585708618164, 0.017480850219726562, 0.019055843353271484, 0.020630836486816406, 0.022205829620361328, 0.02378082275390625, 0.025355815887451172, 0.026930809020996094, 0.028505802154541016, 0.030080795288085938, 0.03165578842163086, 0.03323078155517578, 0.0348057746887207, 0.036380767822265625, 0.03795576095581055, 0.03953075408935547, 0.04110574722290039, 0.04268074035644531, 0.044255733489990234, 0.045830726623535156, 0.04740571975708008, 0.048980712890625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 0.0, 5.0, 8.0, 7.0, 5.0, 5.0, 6.0, 13.0, 15.0, 13.0, 0.0, 22.0, 43.0, 62.0, 116.0, 353.0, 107.0, 67.0, 39.0, 15.0, 23.0, 0.0, 10.0, 9.0, 10.0, 14.0, 3.0, 2.0, 3.0, 1.0, 5.0, 3.0, 0.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9669532775878906e-06, -1.912936568260193e-06, -1.8589198589324951e-06, -1.8049031496047974e-06, -1.7508864402770996e-06, -1.6968697309494019e-06, -1.642853021621704e-06, -1.5888363122940063e-06, -1.5348196029663086e-06, -1.4808028936386108e-06, -1.426786184310913e-06, -1.3727694749832153e-06, -1.3187527656555176e-06, -1.2647360563278198e-06, -1.210719347000122e-06, -1.1567026376724243e-06, -1.1026859283447266e-06, -1.0486692190170288e-06, -9.94652509689331e-07, -9.406358003616333e-07, -8.866190910339355e-07, -8.326023817062378e-07, -7.7858567237854e-07, -7.245689630508423e-07, -6.705522537231445e-07, -6.165355443954468e-07, -5.62518835067749e-07, -5.085021257400513e-07, -4.544854164123535e-07, -4.0046870708465576e-07, -3.46451997756958e-07, -2.9243528842926025e-07, -2.384185791015625e-07, -1.8440186977386475e-07, -1.30385160446167e-07, -7.636845111846924e-08, -2.2351741790771484e-08, 3.166496753692627e-08, 8.568167686462402e-08, 1.3969838619232178e-07, 1.9371509552001953e-07, 2.477318048477173e-07, 3.0174851417541504e-07, 3.557652235031128e-07, 4.0978193283081055e-07, 4.637986421585083e-07, 5.178153514862061e-07, 5.718320608139038e-07, 6.258487701416016e-07, 6.798654794692993e-07, 7.338821887969971e-07, 7.878988981246948e-07, 8.419156074523926e-07, 8.959323167800903e-07, 9.499490261077881e-07, 1.0039657354354858e-06, 1.0579824447631836e-06, 1.1119991540908813e-06, 1.166015863418579e-06, 1.2200325727462769e-06, 1.2740492820739746e-06, 1.3280659914016724e-06, 1.3820827007293701e-06, 1.4360994100570679e-06, 1.4901161193847656e-06]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 6.0, 4.0, 6.0, 7.0, 16.0, 29.0, 49.0, 74.0, 177.0, 470.0, 23198.0, 1000592.0, 23045.0, 505.0, 137.0, 90.0, 48.0, 23.0, 8.0, 9.0, 4.0, 8.0, 5.0, 4.0, 4.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.147125244140625e-05, -3.0326656997203827e-05, -2.9182061553001404e-05, -2.803746610879898e-05, -2.6892870664596558e-05, -2.5748275220394135e-05, -2.460367977619171e-05, -2.345908433198929e-05, -2.2314488887786865e-05, -2.1169893443584442e-05, -2.002529799938202e-05, -1.8880702555179596e-05, -1.7736107110977173e-05, -1.659151166677475e-05, -1.5446916222572327e-05, -1.4302320778369904e-05, -1.315772533416748e-05, -1.2013129889965057e-05, -1.0868534445762634e-05, -9.723939001560211e-06, -8.579343557357788e-06, -7.434748113155365e-06, -6.290152668952942e-06, -5.145557224750519e-06, -4.000961780548096e-06, -2.8563663363456726e-06, -1.7117708921432495e-06, -5.671754479408264e-07, 5.774199962615967e-07, 1.7220154404640198e-06, 2.866610884666443e-06, 4.011206328868866e-06, 5.155801773071289e-06, 6.300397217273712e-06, 7.444992661476135e-06, 8.589588105678558e-06, 9.734183549880981e-06, 1.0878778994083405e-05, 1.2023374438285828e-05, 1.316796988248825e-05, 1.4312565326690674e-05, 1.5457160770893097e-05, 1.660175621509552e-05, 1.7746351659297943e-05, 1.8890947103500366e-05, 2.003554254770279e-05, 2.1180137991905212e-05, 2.2324733436107635e-05, 2.346932888031006e-05, 2.461392432451248e-05, 2.5758519768714905e-05, 2.6903115212917328e-05, 2.804771065711975e-05, 2.9192306101322174e-05, 3.0336901545524597e-05, 3.148149698972702e-05, 3.262609243392944e-05, 3.3770687878131866e-05, 3.491528332233429e-05, 3.605987876653671e-05, 3.7204474210739136e-05, 3.834906965494156e-05, 3.949366509914398e-05, 4.0638260543346405e-05, 4.178285598754883e-05]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 15.0, 36.0, 70.0, 103.0, 413.0, 153.0, 114.0, 47.0, 18.0, 16.0, 9.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2349764801911078e-06, -1.1975039342360105e-06, -1.1600313882809132e-06, -1.122558842325816e-06, -1.0850864100575563e-06, -1.047613864102459e-06, -1.0101413181473617e-06, -9.726687721922644e-07, -9.351962262371671e-07, -8.977236802820698e-07, -8.602511911703914e-07, -8.227786452152941e-07, -7.853060992601968e-07, -7.478336101485183e-07, -7.10361064193421e-07, -6.728885182383237e-07, -6.354160291266453e-07, -5.97943483171548e-07, -5.604709940598696e-07, -5.229984481047723e-07, -4.85525902149675e-07, -4.480533846162871e-07, -4.105808670828992e-07, -3.731083211278019e-07, -3.3563580359441403e-07, -2.9816328606102616e-07, -2.6069074010592885e-07, -2.2321822257254098e-07, -1.857456908282984e-07, -1.482731590840558e-07, -1.1080064155066793e-07, -7.332809559557063e-08, -3.585557806218276e-08, 1.6169501293461508e-09, 3.908947832087506e-08, 7.656200295969029e-08, 1.1403453470393288e-07, 1.5150706644817546e-07, 1.8897958398156334e-07, 2.2645212993666064e-07, 2.639246474700485e-07, 3.013971650034364e-07, 3.388697109585337e-07, 3.7634222849192156e-07, 4.1381474602530943e-07, 4.5128729198040674e-07, 4.88759837935504e-07, 5.262323838906013e-07, 5.637048730022798e-07, 6.011774189573771e-07, 6.386499080690555e-07, 6.761224540241528e-07, 7.135949999792501e-07, 7.510675459343474e-07, 7.885400350460259e-07, 8.260125810011232e-07, 8.634850701128016e-07, 9.009576160678989e-07, 9.384301051795774e-07, 9.759025942912558e-07, 1.0133751402463531e-06, 1.0508476862014504e-06, 1.0883202321565477e-06, 1.125792778111645e-06, 1.1632653240667423e-06]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 28.0, 0.0, 0.0, 0.0, 0.0, 66.0, 0.0, 0.0, 0.0, 210.0, 0.0, 0.0, 0.0, 0.0, 392.0, 0.0, 0.0, 0.0, 0.0, 183.0, 0.0, 0.0, 0.0, 79.0, 0.0, 0.0, 0.0, 0.0, 28.0, 0.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4458935260772705e-07, -3.3155083656311035e-07, -3.1851232051849365e-07, -3.0547380447387695e-07, -2.9243528842926025e-07, -2.7939677238464355e-07, -2.6635825634002686e-07, -2.5331974029541016e-07, -2.4028122425079346e-07, -2.2724270820617676e-07, -2.1420419216156006e-07, -2.0116567611694336e-07, -1.8812716007232666e-07, -1.7508864402770996e-07, -1.6205012798309326e-07, -1.4901161193847656e-07, -1.3597309589385986e-07, -1.2293457984924316e-07, -1.0989606380462646e-07, -9.685754776000977e-08, -8.381903171539307e-08, -7.078051567077637e-08, -5.774199962615967e-08, -4.470348358154297e-08, -3.166496753692627e-08, -1.862645149230957e-08, -5.587935447692871e-09, 7.450580596923828e-09, 2.0489096641540527e-08, 3.3527612686157227e-08, 4.6566128730773926e-08, 5.960464477539063e-08, 7.264316082000732e-08, 8.568167686462402e-08, 9.872019290924072e-08, 1.1175870895385742e-07, 1.2479722499847412e-07, 1.3783574104309082e-07, 1.5087425708770752e-07, 1.6391277313232422e-07, 1.7695128917694092e-07, 1.8998980522155762e-07, 2.0302832126617432e-07, 2.1606683731079102e-07, 2.2910535335540771e-07, 2.421438694000244e-07, 2.551823854446411e-07, 2.682209014892578e-07, 2.812594175338745e-07, 2.942979335784912e-07, 3.073364496231079e-07, 3.203749656677246e-07, 3.334134817123413e-07, 3.46451997756958e-07, 3.594905138015747e-07, 3.725290298461914e-07, 3.855675458908081e-07, 3.986060619354248e-07, 4.116445779800415e-07, 4.246830940246582e-07, 4.377216100692749e-07, 4.507601261138916e-07, 4.637986421585083e-07, 4.76837158203125e-07]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 11.0, 8.0, 4.0, 12.0, 9.0, 10.0, 9.0, 18.0, 22.0, 18.0, 28.0, 28.0, 38.0, 37.0, 30.0, 32.0, 35.0, 43.0, 46.0, 47.0, 45.0, 42.0, 32.0, 43.0, 48.0, 43.0, 32.0, 31.0, 22.0, 24.0, 13.0, 31.0, 9.0, 18.0, 19.0, 19.0, 7.0, 8.0, 8.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.87890625, -2.792877197265625, -2.70684814453125, -2.620819091796875, -2.5347900390625, -2.448760986328125, -2.36273193359375, -2.276702880859375, -2.190673828125, -2.104644775390625, -2.01861572265625, -1.932586669921875, -1.8465576171875, -1.760528564453125, -1.67449951171875, -1.588470458984375, -1.50244140625, -1.416412353515625, -1.33038330078125, -1.244354248046875, -1.1583251953125, -1.072296142578125, -0.98626708984375, -0.900238037109375, -0.814208984375, -0.728179931640625, -0.64215087890625, -0.556121826171875, -0.4700927734375, -0.384063720703125, -0.29803466796875, -0.212005615234375, -0.1259765625, -0.039947509765625, 0.04608154296875, 0.132110595703125, 0.2181396484375, 0.304168701171875, 0.39019775390625, 0.476226806640625, 0.562255859375, 0.648284912109375, 0.73431396484375, 0.820343017578125, 0.9063720703125, 0.992401123046875, 1.07843017578125, 1.164459228515625, 1.25048828125, 1.336517333984375, 1.42254638671875, 1.508575439453125, 1.5946044921875, 1.680633544921875, 1.76666259765625, 1.852691650390625, 1.938720703125, 2.024749755859375, 2.11077880859375, 2.196807861328125, 2.2828369140625, 2.368865966796875, 2.45489501953125, 2.540924072265625, 2.626953125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 7.0, 12.0, 17.0, 31.0, 43.0, 66.0, 108.0, 180.0, 287.0, 496.0, 879.0, 1389.0, 2297.0, 3850.0, 6529.0, 11177.0, 19051.0, 32704.0, 54841.0, 89988.0, 158137.0, 278440.0, 160794.0, 91846.0, 55448.0, 33136.0, 19273.0, 11353.0, 6640.0, 3856.0, 2263.0, 1327.0, 810.0, 508.0, 326.0, 167.0, 104.0, 83.0, 41.0, 17.0, 12.0, 14.0, 8.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94140625, -2.845001220703125, -2.74859619140625, -2.652191162109375, -2.5557861328125, -2.459381103515625, -2.36297607421875, -2.266571044921875, -2.170166015625, -2.073760986328125, -1.97735595703125, -1.880950927734375, -1.7845458984375, -1.688140869140625, -1.59173583984375, -1.495330810546875, -1.39892578125, -1.302520751953125, -1.20611572265625, -1.109710693359375, -1.0133056640625, -0.916900634765625, -0.82049560546875, -0.724090576171875, -0.627685546875, -0.531280517578125, -0.43487548828125, -0.338470458984375, -0.2420654296875, -0.145660400390625, -0.04925537109375, 0.047149658203125, 0.1435546875, 0.239959716796875, 0.33636474609375, 0.432769775390625, 0.5291748046875, 0.625579833984375, 0.72198486328125, 0.818389892578125, 0.914794921875, 1.011199951171875, 1.10760498046875, 1.204010009765625, 1.3004150390625, 1.396820068359375, 1.49322509765625, 1.589630126953125, 1.68603515625, 1.782440185546875, 1.87884521484375, 1.975250244140625, 2.0716552734375, 2.168060302734375, 2.26446533203125, 2.360870361328125, 2.457275390625, 2.553680419921875, 2.65008544921875, 2.746490478515625, 2.8428955078125, 2.939300537109375, 3.03570556640625, 3.132110595703125, 3.228515625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 14.0, 5.0, 13.0, 12.0, 16.0, 21.0, 16.0, 29.0, 27.0, 28.0, 30.0, 27.0, 43.0, 46.0, 66.0, 76.0, 120.0, 155.0, 1363.0, 259.0, 153.0, 91.0, 64.0, 45.0, 38.0, 41.0, 36.0, 31.0, 26.0, 19.0, 26.0, 11.0, 16.0, 8.0, 15.0, 9.0, 11.0, 3.0, 5.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 5.0], "bins": [-9.59375, -9.32568359375, -9.0576171875, -8.78955078125, -8.521484375, -8.25341796875, -7.9853515625, -7.71728515625, -7.44921875, -7.18115234375, -6.9130859375, -6.64501953125, -6.376953125, -6.10888671875, -5.8408203125, -5.57275390625, -5.3046875, -5.03662109375, -4.7685546875, -4.50048828125, -4.232421875, -3.96435546875, -3.6962890625, -3.42822265625, -3.16015625, -2.89208984375, -2.6240234375, -2.35595703125, -2.087890625, -1.81982421875, -1.5517578125, -1.28369140625, -1.015625, -0.74755859375, -0.4794921875, -0.21142578125, 0.056640625, 0.32470703125, 0.5927734375, 0.86083984375, 1.12890625, 1.39697265625, 1.6650390625, 1.93310546875, 2.201171875, 2.46923828125, 2.7373046875, 3.00537109375, 3.2734375, 3.54150390625, 3.8095703125, 4.07763671875, 4.345703125, 4.61376953125, 4.8818359375, 5.14990234375, 5.41796875, 5.68603515625, 5.9541015625, 6.22216796875, 6.490234375, 6.75830078125, 7.0263671875, 7.29443359375, 7.5625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 16.0, 17.0, 21.0, 33.0, 28.0, 51.0, 69.0, 73.0, 100.0, 120.0, 175.0, 242.0, 329.0, 782.0, 4538.0, 77112.0, 2629836.0, 415981.0, 13172.0, 1490.0, 447.0, 255.0, 197.0, 145.0, 123.0, 86.0, 62.0, 42.0, 44.0, 34.0, 19.0, 23.0, 8.0, 6.0, 6.0, 3.0, 7.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.359375, -16.794189453125, -16.22900390625, -15.663818359375, -15.0986328125, -14.533447265625, -13.96826171875, -13.403076171875, -12.837890625, -12.272705078125, -11.70751953125, -11.142333984375, -10.5771484375, -10.011962890625, -9.44677734375, -8.881591796875, -8.31640625, -7.751220703125, -7.18603515625, -6.620849609375, -6.0556640625, -5.490478515625, -4.92529296875, -4.360107421875, -3.794921875, -3.229736328125, -2.66455078125, -2.099365234375, -1.5341796875, -0.968994140625, -0.40380859375, 0.161376953125, 0.7265625, 1.291748046875, 1.85693359375, 2.422119140625, 2.9873046875, 3.552490234375, 4.11767578125, 4.682861328125, 5.248046875, 5.813232421875, 6.37841796875, 6.943603515625, 7.5087890625, 8.073974609375, 8.63916015625, 9.204345703125, 9.76953125, 10.334716796875, 10.89990234375, 11.465087890625, 12.0302734375, 12.595458984375, 13.16064453125, 13.725830078125, 14.291015625, 14.856201171875, 15.42138671875, 15.986572265625, 16.5517578125, 17.116943359375, 17.68212890625, 18.247314453125, 18.8125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 9.0, 47.0, 137.0, 250.0, 263.0, 180.0, 89.0, 30.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.159503936767578, -10.49328899383545, -8.82707405090332, -7.160858154296875, -5.494643211364746, -3.828428268432617, -2.162212371826172, -0.49599742889404297, 1.170217514038086, 2.836432695388794, 4.502647876739502, 6.168863296508789, 7.835078239440918, 9.501293182373047, 11.167509078979492, 12.833724021911621, 14.49993896484375, 16.166154861450195, 17.832368850708008, 19.498584747314453, 21.164798736572266, 22.83101463317871, 24.497230529785156, 26.16344451904297, 27.829660415649414, 29.49587631225586, 31.162090301513672, 32.82830810546875, 34.49452209472656, 36.160736083984375, 37.82695007324219, 39.493167877197266, 41.159385681152344, 42.825599670410156, 44.491817474365234, 46.15803146362305, 47.82424545288086, 49.49046325683594, 51.15667724609375, 52.82289123535156, 54.489105224609375, 56.15531921386719, 57.821537017822266, 59.48775100708008, 61.15396499633789, 62.82018280029297, 64.48639678955078, 66.1526107788086, 67.81883239746094, 69.48504638671875, 71.15126037597656, 72.81747436523438, 74.48369598388672, 76.14990997314453, 77.81612396240234, 79.48233795166016, 81.14855194091797, 82.81476593017578, 84.4809799194336, 86.14720153808594, 87.81341552734375, 89.47962951660156, 91.14584350585938, 92.81205749511719, 94.478271484375]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 7.0, 8.0, 8.0, 12.0, 13.0, 18.0, 8.0, 26.0, 24.0, 27.0, 28.0, 34.0, 36.0, 37.0, 32.0, 49.0, 49.0, 58.0, 40.0, 40.0, 46.0, 44.0, 37.0, 26.0, 38.0, 32.0, 26.0, 25.0, 26.0, 10.0, 27.0, 19.0, 12.0, 16.0, 14.0, 9.0, 7.0, 1.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-26.554752349853516, -25.73130226135254, -24.907854080200195, -24.08440399169922, -23.260953903198242, -22.437503814697266, -21.614055633544922, -20.790605545043945, -19.96715545654297, -19.143705368041992, -18.32025718688965, -17.496807098388672, -16.673357009887695, -15.849907875061035, -15.026458740234375, -14.203008651733398, -13.379559516906738, -12.556110382080078, -11.732660293579102, -10.909211158752441, -10.085761070251465, -9.262311935424805, -8.438861846923828, -7.615412712097168, -6.79196310043335, -5.968513488769531, -5.145063877105713, -4.3216142654418945, -3.4981648921966553, -2.674715518951416, -1.8512659072875977, -1.0278162956237793, -0.20436668395996094, 0.6190828680992126, 1.4425324201583862, 2.265981912612915, 3.0894315242767334, 3.9128808975219727, 4.736330509185791, 5.559780120849609, 6.383229732513428, 7.206679344177246, 8.030128479003906, 8.853578567504883, 9.677027702331543, 10.500476837158203, 11.32392692565918, 12.147377014160156, 12.970826148986816, 13.794275283813477, 14.617725372314453, 15.441174507141113, 16.264623641967773, 17.08807373046875, 17.911523818969727, 18.734973907470703, 19.558422088623047, 20.381872177124023, 21.205320358276367, 22.028770446777344, 22.85222053527832, 23.675670623779297, 24.49911880493164, 25.322568893432617, 26.146018981933594]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 11.0, 8.0, 15.0, 9.0, 14.0, 9.0, 16.0, 21.0, 31.0, 27.0, 30.0, 25.0, 39.0, 23.0, 50.0, 49.0, 41.0, 39.0, 36.0, 45.0, 40.0, 55.0, 35.0, 42.0, 32.0, 24.0, 29.0, 32.0, 26.0, 15.0, 17.0, 13.0, 25.0, 14.0, 8.0, 14.0, 8.0, 7.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0703125, -2.97705078125, -2.8837890625, -2.79052734375, -2.697265625, -2.60400390625, -2.5107421875, -2.41748046875, -2.32421875, -2.23095703125, -2.1376953125, -2.04443359375, -1.951171875, -1.85791015625, -1.7646484375, -1.67138671875, -1.578125, -1.48486328125, -1.3916015625, -1.29833984375, -1.205078125, -1.11181640625, -1.0185546875, -0.92529296875, -0.83203125, -0.73876953125, -0.6455078125, -0.55224609375, -0.458984375, -0.36572265625, -0.2724609375, -0.17919921875, -0.0859375, 0.00732421875, 0.1005859375, 0.19384765625, 0.287109375, 0.38037109375, 0.4736328125, 0.56689453125, 0.66015625, 0.75341796875, 0.8466796875, 0.93994140625, 1.033203125, 1.12646484375, 1.2197265625, 1.31298828125, 1.40625, 1.49951171875, 1.5927734375, 1.68603515625, 1.779296875, 1.87255859375, 1.9658203125, 2.05908203125, 2.15234375, 2.24560546875, 2.3388671875, 2.43212890625, 2.525390625, 2.61865234375, 2.7119140625, 2.80517578125, 2.8984375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 3.0, 8.0, 8.0, 14.0, 14.0, 29.0, 27.0, 35.0, 69.0, 111.0, 197.0, 409.0, 772.0, 1686.0, 4020.0, 11029.0, 31872.0, 100163.0, 325676.0, 978535.0, 1598475.0, 776152.0, 247982.0, 76750.0, 25023.0, 8715.0, 3480.0, 1424.0, 724.0, 355.0, 184.0, 118.0, 77.0, 35.0, 33.0, 25.0, 16.0, 13.0, 6.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.96331787109375, -3.8328857421875, -3.70245361328125, -3.572021484375, -3.44158935546875, -3.3111572265625, -3.18072509765625, -3.05029296875, -2.91986083984375, -2.7894287109375, -2.65899658203125, -2.528564453125, -2.39813232421875, -2.2677001953125, -2.13726806640625, -2.0068359375, -1.87640380859375, -1.7459716796875, -1.61553955078125, -1.485107421875, -1.35467529296875, -1.2242431640625, -1.09381103515625, -0.96337890625, -0.83294677734375, -0.7025146484375, -0.57208251953125, -0.441650390625, -0.31121826171875, -0.1807861328125, -0.05035400390625, 0.080078125, 0.21051025390625, 0.3409423828125, 0.47137451171875, 0.601806640625, 0.73223876953125, 0.8626708984375, 0.99310302734375, 1.12353515625, 1.25396728515625, 1.3843994140625, 1.51483154296875, 1.645263671875, 1.77569580078125, 1.9061279296875, 2.03656005859375, 2.1669921875, 2.29742431640625, 2.4278564453125, 2.55828857421875, 2.688720703125, 2.81915283203125, 2.9495849609375, 3.08001708984375, 3.21044921875, 3.34088134765625, 3.4713134765625, 3.60174560546875, 3.732177734375, 3.86260986328125, 3.9930419921875, 4.12347412109375, 4.25390625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 4.0, 8.0, 6.0, 10.0, 13.0, 13.0, 18.0, 36.0, 41.0, 64.0, 108.0, 117.0, 136.0, 192.0, 250.0, 303.0, 405.0, 398.0, 395.0, 368.0, 302.0, 231.0, 153.0, 119.0, 89.0, 79.0, 66.0, 44.0, 38.0, 25.0, 10.0, 14.0, 4.0, 9.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.90234375, -5.7318115234375, -5.561279296875, -5.3907470703125, -5.22021484375, -5.0496826171875, -4.879150390625, -4.7086181640625, -4.5380859375, -4.3675537109375, -4.197021484375, -4.0264892578125, -3.85595703125, -3.6854248046875, -3.514892578125, -3.3443603515625, -3.173828125, -3.0032958984375, -2.832763671875, -2.6622314453125, -2.49169921875, -2.3211669921875, -2.150634765625, -1.9801025390625, -1.8095703125, -1.6390380859375, -1.468505859375, -1.2979736328125, -1.12744140625, -0.9569091796875, -0.786376953125, -0.6158447265625, -0.4453125, -0.2747802734375, -0.104248046875, 0.0662841796875, 0.23681640625, 0.4073486328125, 0.577880859375, 0.7484130859375, 0.9189453125, 1.0894775390625, 1.260009765625, 1.4305419921875, 1.60107421875, 1.7716064453125, 1.942138671875, 2.1126708984375, 2.283203125, 2.4537353515625, 2.624267578125, 2.7947998046875, 2.96533203125, 3.1358642578125, 3.306396484375, 3.4769287109375, 3.6474609375, 3.8179931640625, 3.988525390625, 4.1590576171875, 4.32958984375, 4.5001220703125, 4.670654296875, 4.8411865234375, 5.01171875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 9.0, 5.0, 6.0, 12.0, 21.0, 26.0, 32.0, 61.0, 68.0, 116.0, 140.0, 181.0, 288.0, 534.0, 2111.0, 38822.0, 1345474.0, 2700141.0, 100544.0, 4095.0, 637.0, 290.0, 221.0, 137.0, 104.0, 56.0, 53.0, 28.0, 24.0, 15.0, 9.0, 9.0, 6.0, 9.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.65625, -15.118896484375, -14.58154296875, -14.044189453125, -13.5068359375, -12.969482421875, -12.43212890625, -11.894775390625, -11.357421875, -10.820068359375, -10.28271484375, -9.745361328125, -9.2080078125, -8.670654296875, -8.13330078125, -7.595947265625, -7.05859375, -6.521240234375, -5.98388671875, -5.446533203125, -4.9091796875, -4.371826171875, -3.83447265625, -3.297119140625, -2.759765625, -2.222412109375, -1.68505859375, -1.147705078125, -0.6103515625, -0.072998046875, 0.46435546875, 1.001708984375, 1.5390625, 2.076416015625, 2.61376953125, 3.151123046875, 3.6884765625, 4.225830078125, 4.76318359375, 5.300537109375, 5.837890625, 6.375244140625, 6.91259765625, 7.449951171875, 7.9873046875, 8.524658203125, 9.06201171875, 9.599365234375, 10.13671875, 10.674072265625, 11.21142578125, 11.748779296875, 12.2861328125, 12.823486328125, 13.36083984375, 13.898193359375, 14.435546875, 14.972900390625, 15.51025390625, 16.047607421875, 16.5849609375, 17.122314453125, 17.65966796875, 18.197021484375, 18.734375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 9.0, 8.0, 19.0, 29.0, 37.0, 47.0, 73.0, 95.0, 106.0, 106.0, 127.0, 109.0, 65.0, 64.0, 49.0, 31.0, 19.0, 13.0, 4.0, 6.0, 1.0], "bins": [-53.673614501953125, -52.65141677856445, -51.62921905517578, -50.60702133178711, -49.58482360839844, -48.562625885009766, -47.540428161621094, -46.51823043823242, -45.49603271484375, -44.47383499145508, -43.451637268066406, -42.429439544677734, -41.40724182128906, -40.38504409790039, -39.36284637451172, -38.34064865112305, -37.318450927734375, -36.2962532043457, -35.27405548095703, -34.25185775756836, -33.22966003417969, -32.207462310791016, -31.185264587402344, -30.163066864013672, -29.140872955322266, -28.118675231933594, -27.096477508544922, -26.07427978515625, -25.052082061767578, -24.029884338378906, -23.007686614990234, -21.985488891601562, -20.96329116821289, -19.94109344482422, -18.918895721435547, -17.896697998046875, -16.874500274658203, -15.852302551269531, -14.830105781555176, -13.807908058166504, -12.785710334777832, -11.76351261138916, -10.741314888000488, -9.719118118286133, -8.696920394897461, -7.674722194671631, -6.652524948120117, -5.630327224731445, -4.608129501342773, -3.5859317779541016, -2.563734292984009, -1.541536808013916, -0.5193390846252441, 0.5028586387634277, 1.5250558853149414, 2.5472536087036133, 3.569451332092285, 4.591649055480957, 5.613846778869629, 6.636044025421143, 7.6582417488098145, 8.680438995361328, 9.70263671875, 10.724834442138672, 11.747032165527344]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 6.0, 5.0, 11.0, 9.0, 15.0, 17.0, 20.0, 17.0, 27.0, 20.0, 28.0, 26.0, 33.0, 44.0, 49.0, 37.0, 60.0, 46.0, 41.0, 38.0, 39.0, 37.0, 33.0, 44.0, 38.0, 32.0, 47.0, 21.0, 25.0, 25.0, 23.0, 12.0, 13.0, 8.0, 15.0, 12.0, 5.0, 5.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.15804672241211, -20.55150032043457, -19.94495391845703, -19.33840560913086, -18.73185920715332, -18.12531280517578, -17.518766403198242, -16.912220001220703, -16.30567169189453, -15.699125289916992, -15.092577934265137, -14.486031532287598, -13.879484176635742, -13.272937774658203, -12.666391372680664, -12.059844017028809, -11.45329761505127, -10.84675121307373, -10.240203857421875, -9.633657455444336, -9.02711009979248, -8.420563697814941, -7.814016819000244, -7.207469940185547, -6.60092306137085, -5.994376182556152, -5.387829303741455, -4.781282424926758, -4.174736022949219, -3.5681889057159424, -2.961642265319824, -2.355095386505127, -1.7485485076904297, -1.1420016288757324, -0.5354548692703247, 0.07109189033508301, 0.6776387691497803, 1.2841856479644775, 1.8907322883605957, 2.497279167175293, 3.1038260459899902, 3.7103729248046875, 4.316919803619385, 4.923466682434082, 5.530013084411621, 6.136560440063477, 6.743106842041016, 7.349653720855713, 7.95620059967041, 8.56274700164795, 9.169294357299805, 9.775840759277344, 10.3823881149292, 10.988934516906738, 11.595481872558594, 12.202028274536133, 12.808574676513672, 13.415121078491211, 14.021668434143066, 14.628214836120605, 15.234762191772461, 15.84130859375, 16.44785499572754, 17.054401397705078, 17.66094970703125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 8.0, 9.0, 11.0, 11.0, 8.0, 18.0, 15.0, 31.0, 23.0, 32.0, 27.0, 26.0, 26.0, 43.0, 40.0, 48.0, 49.0, 35.0, 45.0, 37.0, 57.0, 22.0, 49.0, 41.0, 29.0, 37.0, 27.0, 24.0, 12.0, 13.0, 20.0, 15.0, 17.0, 15.0, 11.0, 16.0, 7.0, 7.0, 9.0, 4.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.033203125, -2.945037841796875, -2.85687255859375, -2.768707275390625, -2.6805419921875, -2.592376708984375, -2.50421142578125, -2.416046142578125, -2.327880859375, -2.239715576171875, -2.15155029296875, -2.063385009765625, -1.9752197265625, -1.887054443359375, -1.79888916015625, -1.710723876953125, -1.62255859375, -1.534393310546875, -1.44622802734375, -1.358062744140625, -1.2698974609375, -1.181732177734375, -1.09356689453125, -1.005401611328125, -0.917236328125, -0.829071044921875, -0.74090576171875, -0.652740478515625, -0.5645751953125, -0.476409912109375, -0.38824462890625, -0.300079345703125, -0.2119140625, -0.123748779296875, -0.03558349609375, 0.052581787109375, 0.1407470703125, 0.228912353515625, 0.31707763671875, 0.405242919921875, 0.493408203125, 0.581573486328125, 0.66973876953125, 0.757904052734375, 0.8460693359375, 0.934234619140625, 1.02239990234375, 1.110565185546875, 1.19873046875, 1.286895751953125, 1.37506103515625, 1.463226318359375, 1.5513916015625, 1.639556884765625, 1.72772216796875, 1.815887451171875, 1.904052734375, 1.992218017578125, 2.08038330078125, 2.168548583984375, 2.2567138671875, 2.344879150390625, 2.43304443359375, 2.521209716796875, 2.609375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 12.0, 8.0, 20.0, 28.0, 37.0, 57.0, 71.0, 118.0, 162.0, 246.0, 370.0, 465.0, 758.0, 1101.0, 1571.0, 2305.0, 3412.0, 5034.0, 7469.0, 11218.0, 17085.0, 26087.0, 41259.0, 72301.0, 139848.0, 350329.0, 160111.0, 78857.0, 45293.0, 28134.0, 17826.0, 11918.0, 8003.0, 5513.0, 3620.0, 2570.0, 1696.0, 1139.0, 796.0, 541.0, 364.0, 277.0, 161.0, 111.0, 90.0, 51.0, 37.0, 30.0, 15.0, 18.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.12322998046875, -0.11944770812988281, -0.11566543579101562, -0.11188316345214844, -0.10810089111328125, -0.10431861877441406, -0.10053634643554688, -0.09675407409667969, -0.0929718017578125, -0.08918952941894531, -0.08540725708007812, -0.08162498474121094, -0.07784271240234375, -0.07406044006347656, -0.07027816772460938, -0.06649589538574219, -0.062713623046875, -0.05893135070800781, -0.055149078369140625, -0.05136680603027344, -0.04758453369140625, -0.04380226135253906, -0.040019989013671875, -0.03623771667480469, -0.0324554443359375, -0.028673171997070312, -0.024890899658203125, -0.021108627319335938, -0.01732635498046875, -0.013544082641601562, -0.009761810302734375, -0.0059795379638671875, -0.002197265625, 0.0015850067138671875, 0.005367279052734375, 0.009149551391601562, 0.01293182373046875, 0.016714096069335938, 0.020496368408203125, 0.024278640747070312, 0.0280609130859375, 0.03184318542480469, 0.035625457763671875, 0.03940773010253906, 0.04319000244140625, 0.04697227478027344, 0.050754547119140625, 0.05453681945800781, 0.058319091796875, 0.06210136413574219, 0.06588363647460938, 0.06966590881347656, 0.07344818115234375, 0.07723045349121094, 0.08101272583007812, 0.08479499816894531, 0.0885772705078125, 0.09235954284667969, 0.09614181518554688, 0.09992408752441406, 0.10370635986328125, 0.10748863220214844, 0.11127090454101562, 0.11505317687988281, 0.11883544921875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 13.0, 9.0, 7.0, 8.0, 23.0, 22.0, 26.0, 22.0, 33.0, 38.0, 39.0, 27.0, 47.0, 34.0, 45.0, 42.0, 42.0, 1068.0, 48.0, 40.0, 37.0, 50.0, 43.0, 28.0, 28.0, 42.0, 22.0, 38.0, 14.0, 14.0, 25.0, 13.0, 15.0, 4.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.288116455078125, -2.21685791015625, -2.145599365234375, -2.0743408203125, -2.003082275390625, -1.93182373046875, -1.860565185546875, -1.789306640625, -1.718048095703125, -1.64678955078125, -1.575531005859375, -1.5042724609375, -1.433013916015625, -1.36175537109375, -1.290496826171875, -1.21923828125, -1.147979736328125, -1.07672119140625, -1.005462646484375, -0.9342041015625, -0.862945556640625, -0.79168701171875, -0.720428466796875, -0.649169921875, -0.577911376953125, -0.50665283203125, -0.435394287109375, -0.3641357421875, -0.292877197265625, -0.22161865234375, -0.150360107421875, -0.0791015625, -0.007843017578125, 0.06341552734375, 0.134674072265625, 0.2059326171875, 0.277191162109375, 0.34844970703125, 0.419708251953125, 0.490966796875, 0.562225341796875, 0.63348388671875, 0.704742431640625, 0.7760009765625, 0.847259521484375, 0.91851806640625, 0.989776611328125, 1.06103515625, 1.132293701171875, 1.20355224609375, 1.274810791015625, 1.3460693359375, 1.417327880859375, 1.48858642578125, 1.559844970703125, 1.631103515625, 1.702362060546875, 1.77362060546875, 1.844879150390625, 1.9161376953125, 1.987396240234375, 2.05865478515625, 2.129913330078125, 2.201171875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 11.0, 9.0, 9.0, 18.0, 31.0, 41.0, 62.0, 85.0, 158.0, 275.0, 346.0, 573.0, 960.0, 1464.0, 2338.0, 3605.0, 5698.0, 9294.0, 14173.0, 22523.0, 35957.0, 59899.0, 105374.0, 225419.0, 1325909.0, 114844.0, 64186.0, 38353.0, 24097.0, 15105.0, 9581.0, 6013.0, 3914.0, 2441.0, 1641.0, 924.0, 645.0, 431.0, 228.0, 169.0, 129.0, 73.0, 36.0, 32.0, 20.0, 14.0, 8.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06414794921875, -0.06208324432373047, -0.06001853942871094, -0.057953834533691406, -0.055889129638671875, -0.053824424743652344, -0.05175971984863281, -0.04969501495361328, -0.04763031005859375, -0.04556560516357422, -0.04350090026855469, -0.041436195373535156, -0.039371490478515625, -0.037306785583496094, -0.03524208068847656, -0.03317737579345703, -0.0311126708984375, -0.02904796600341797, -0.026983261108398438, -0.024918556213378906, -0.022853851318359375, -0.020789146423339844, -0.018724441528320312, -0.01665973663330078, -0.01459503173828125, -0.012530326843261719, -0.010465621948242188, -0.008400917053222656, -0.006336212158203125, -0.004271507263183594, -0.0022068023681640625, -0.00014209747314453125, 0.001922607421875, 0.003987312316894531, 0.0060520172119140625, 0.008116722106933594, 0.010181427001953125, 0.012246131896972656, 0.014310836791992188, 0.01637554168701172, 0.01844024658203125, 0.02050495147705078, 0.022569656372070312, 0.024634361267089844, 0.026699066162109375, 0.028763771057128906, 0.030828475952148438, 0.03289318084716797, 0.0349578857421875, 0.03702259063720703, 0.03908729553222656, 0.041152000427246094, 0.043216705322265625, 0.045281410217285156, 0.04734611511230469, 0.04941082000732422, 0.05147552490234375, 0.05354022979736328, 0.05560493469238281, 0.057669639587402344, 0.059734344482421875, 0.061799049377441406, 0.06386375427246094, 0.06592845916748047, 0.0679931640625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 1.0, 7.0, 3.0, 4.0, 6.0, 8.0, 7.0, 13.0, 6.0, 41.0, 17.0, 37.0, 29.0, 153.0, 352.0, 83.0, 84.0, 23.0, 40.0, 6.0, 15.0, 8.0, 13.0, 2.0, 10.0, 3.0, 4.0, 3.0, 12.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.682209014892578e-06, -2.594664692878723e-06, -2.507120370864868e-06, -2.419576048851013e-06, -2.332031726837158e-06, -2.2444874048233032e-06, -2.1569430828094482e-06, -2.0693987607955933e-06, -1.9818544387817383e-06, -1.8943101167678833e-06, -1.8067657947540283e-06, -1.7192214727401733e-06, -1.6316771507263184e-06, -1.5441328287124634e-06, -1.4565885066986084e-06, -1.3690441846847534e-06, -1.2814998626708984e-06, -1.1939555406570435e-06, -1.1064112186431885e-06, -1.0188668966293335e-06, -9.313225746154785e-07, -8.437782526016235e-07, -7.562339305877686e-07, -6.686896085739136e-07, -5.811452865600586e-07, -4.936009645462036e-07, -4.0605664253234863e-07, -3.1851232051849365e-07, -2.3096799850463867e-07, -1.434236764907837e-07, -5.587935447692871e-08, 3.166496753692627e-08, 1.1920928955078125e-07, 2.0675361156463623e-07, 2.942979335784912e-07, 3.818422555923462e-07, 4.6938657760620117e-07, 5.569308996200562e-07, 6.444752216339111e-07, 7.320195436477661e-07, 8.195638656616211e-07, 9.071081876754761e-07, 9.94652509689331e-07, 1.082196831703186e-06, 1.169741153717041e-06, 1.257285475730896e-06, 1.344829797744751e-06, 1.432374119758606e-06, 1.519918441772461e-06, 1.607462763786316e-06, 1.695007085800171e-06, 1.7825514078140259e-06, 1.8700957298278809e-06, 1.957640051841736e-06, 2.045184373855591e-06, 2.132728695869446e-06, 2.2202730178833008e-06, 2.3078173398971558e-06, 2.3953616619110107e-06, 2.4829059839248657e-06, 2.5704503059387207e-06, 2.6579946279525757e-06, 2.7455389499664307e-06, 2.8330832719802856e-06, 2.9206275939941406e-06]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 8.0, 5.0, 3.0, 8.0, 3.0, 10.0, 12.0, 10.0, 11.0, 33.0, 57.0, 117.0, 350.0, 11821.0, 1029994.0, 5530.0, 290.0, 107.0, 54.0, 35.0, 24.0, 13.0, 10.0, 6.0, 6.0, 9.0, 6.0, 0.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.109476089477539e-05, -5.926750600337982e-05, -5.744025111198425e-05, -5.5612996220588684e-05, -5.3785741329193115e-05, -5.1958486437797546e-05, -5.013123154640198e-05, -4.830397665500641e-05, -4.647672176361084e-05, -4.464946687221527e-05, -4.28222119808197e-05, -4.099495708942413e-05, -3.9167702198028564e-05, -3.7340447306632996e-05, -3.551319241523743e-05, -3.368593752384186e-05, -3.185868263244629e-05, -3.003142774105072e-05, -2.820417284965515e-05, -2.6376917958259583e-05, -2.4549663066864014e-05, -2.2722408175468445e-05, -2.0895153284072876e-05, -1.9067898392677307e-05, -1.7240643501281738e-05, -1.541338860988617e-05, -1.35861337184906e-05, -1.1758878827095032e-05, -9.931623935699463e-06, -8.104369044303894e-06, -6.277114152908325e-06, -4.449859261512756e-06, -2.6226043701171875e-06, -7.953494787216187e-07, 1.0319054126739502e-06, 2.859160304069519e-06, 4.686415195465088e-06, 6.513670086860657e-06, 8.340924978256226e-06, 1.0168179869651794e-05, 1.1995434761047363e-05, 1.3822689652442932e-05, 1.56499445438385e-05, 1.747719943523407e-05, 1.930445432662964e-05, 2.1131709218025208e-05, 2.2958964109420776e-05, 2.4786219000816345e-05, 2.6613473892211914e-05, 2.8440728783607483e-05, 3.0267983675003052e-05, 3.209523856639862e-05, 3.392249345779419e-05, 3.574974834918976e-05, 3.757700324058533e-05, 3.9404258131980896e-05, 4.1231513023376465e-05, 4.3058767914772034e-05, 4.48860228061676e-05, 4.671327769756317e-05, 4.854053258895874e-05, 5.036778748035431e-05, 5.219504237174988e-05, 5.402229726314545e-05, 5.5849552154541016e-05]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 29.0, 81.0, 486.0, 291.0, 80.0, 24.0, 14.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0188667804177385e-06, -1.9268757114332402e-06, -1.834884642448742e-06, -1.7428935734642437e-06, -1.6509025044797454e-06, -1.5589114354952471e-06, -1.4669204801975866e-06, -1.3749294112130883e-06, -1.28293834222859e-06, -1.1909472732440918e-06, -1.0989562042595935e-06, -1.006965248961933e-06, -9.149741231340158e-07, -8.229830541495176e-07, -7.309920420084381e-07, -6.390009730239399e-07, -5.470099040394416e-07, -4.5501883505494334e-07, -3.630277944921545e-07, -2.7103675392936566e-07, -1.790456849448674e-07, -8.705461596036912e-08, 4.93639618071029e-09, 9.692746516520856e-08, 1.8891853414970683e-07, 2.809096031342051e-07, 3.7290064369699394e-07, 4.648916842597828e-07, 5.56882753244281e-07, 6.488738222287793e-07, 7.408648343698587e-07, 8.32855903354357e-07, 9.248469723388553e-07, 1.0168380413233535e-06, 1.1088291103078518e-06, 1.20082017929235e-06, 1.2928112482768483e-06, 1.3848023172613466e-06, 1.4767932725590072e-06, 1.5687843415435054e-06, 1.6607754105280037e-06, 1.752766479512502e-06, 1.8447575484970002e-06, 1.936748503794661e-06, 2.028739572779159e-06, 2.1207306417636573e-06, 2.2127217107481556e-06, 2.304712779732654e-06, 2.396703848717152e-06, 2.4886949177016504e-06, 2.5806859866861487e-06, 2.672677055670647e-06, 2.7646681246551452e-06, 2.8566591936396435e-06, 2.9486500352504663e-06, 3.04064133160864e-06, 3.132632173219463e-06, 3.224623242203961e-06, 3.3166143111884594e-06, 3.4086053801729577e-06, 3.500596449157456e-06, 3.592587518141954e-06, 3.6845785871264525e-06, 3.7765694287372753e-06, 3.868560725095449e-06]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 5.0, 0.0, 6.0, 0.0, 8.0, 0.0, 0.0, 20.0, 0.0, 52.0, 0.0, 0.0, 87.0, 0.0, 160.0, 0.0, 315.0, 0.0, 0.0, 176.0, 0.0, 101.0, 0.0, 33.0, 0.0, 0.0, 22.0, 0.0, 17.0, 0.0, 0.0, 4.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.497146725654602e-07, -7.245689630508423e-07, -6.994232535362244e-07, -6.742775440216064e-07, -6.491318345069885e-07, -6.239861249923706e-07, -5.988404154777527e-07, -5.736947059631348e-07, -5.485489964485168e-07, -5.234032869338989e-07, -4.98257577419281e-07, -4.731118679046631e-07, -4.4796615839004517e-07, -4.2282044887542725e-07, -3.976747393608093e-07, -3.725290298461914e-07, -3.473833203315735e-07, -3.2223761081695557e-07, -2.9709190130233765e-07, -2.7194619178771973e-07, -2.468004822731018e-07, -2.2165477275848389e-07, -1.9650906324386597e-07, -1.7136335372924805e-07, -1.4621764421463013e-07, -1.210719347000122e-07, -9.592622518539429e-08, -7.078051567077637e-08, -4.563480615615845e-08, -2.0489096641540527e-08, 4.6566128730773926e-09, 2.9802322387695312e-08, 5.494803190231323e-08, 8.009374141693115e-08, 1.0523945093154907e-07, 1.30385160446167e-07, 1.555308699607849e-07, 1.8067657947540283e-07, 2.0582228899002075e-07, 2.3096799850463867e-07, 2.561137080192566e-07, 2.812594175338745e-07, 3.0640512704849243e-07, 3.3155083656311035e-07, 3.5669654607772827e-07, 3.818422555923462e-07, 4.069879651069641e-07, 4.3213367462158203e-07, 4.5727938413619995e-07, 4.824250936508179e-07, 5.075708031654358e-07, 5.327165126800537e-07, 5.578622221946716e-07, 5.830079317092896e-07, 6.081536412239075e-07, 6.332993507385254e-07, 6.584450602531433e-07, 6.835907697677612e-07, 7.087364792823792e-07, 7.338821887969971e-07, 7.59027898311615e-07, 7.841736078262329e-07, 8.093193173408508e-07, 8.344650268554688e-07]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 8.0, 9.0, 11.0, 11.0, 8.0, 18.0, 15.0, 31.0, 23.0, 32.0, 27.0, 26.0, 26.0, 43.0, 40.0, 48.0, 49.0, 35.0, 45.0, 37.0, 57.0, 22.0, 49.0, 41.0, 29.0, 37.0, 27.0, 24.0, 12.0, 13.0, 20.0, 15.0, 17.0, 15.0, 11.0, 16.0, 7.0, 7.0, 9.0, 4.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.033203125, -2.945037841796875, -2.85687255859375, -2.768707275390625, -2.6805419921875, -2.592376708984375, -2.50421142578125, -2.416046142578125, -2.327880859375, -2.239715576171875, -2.15155029296875, -2.063385009765625, -1.9752197265625, -1.887054443359375, -1.79888916015625, -1.710723876953125, -1.62255859375, -1.534393310546875, -1.44622802734375, -1.358062744140625, -1.2698974609375, -1.181732177734375, -1.09356689453125, -1.005401611328125, -0.917236328125, -0.829071044921875, -0.74090576171875, -0.652740478515625, -0.5645751953125, -0.476409912109375, -0.38824462890625, -0.300079345703125, -0.2119140625, -0.123748779296875, -0.03558349609375, 0.052581787109375, 0.1407470703125, 0.228912353515625, 0.31707763671875, 0.405242919921875, 0.493408203125, 0.581573486328125, 0.66973876953125, 0.757904052734375, 0.8460693359375, 0.934234619140625, 1.02239990234375, 1.110565185546875, 1.19873046875, 1.286895751953125, 1.37506103515625, 1.463226318359375, 1.5513916015625, 1.639556884765625, 1.72772216796875, 1.815887451171875, 1.904052734375, 1.992218017578125, 2.08038330078125, 2.168548583984375, 2.2567138671875, 2.344879150390625, 2.43304443359375, 2.521209716796875, 2.609375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 21.0, 17.0, 36.0, 54.0, 90.0, 157.0, 259.0, 453.0, 777.0, 1269.0, 2157.0, 3822.0, 6515.0, 11647.0, 21046.0, 40760.0, 82649.0, 175994.0, 330836.0, 187719.0, 88158.0, 43259.0, 22321.0, 12118.0, 6770.0, 4005.0, 2306.0, 1304.0, 798.0, 473.0, 290.0, 154.0, 115.0, 67.0, 47.0, 28.0, 15.0, 15.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.353515625, -3.2535400390625, -3.153564453125, -3.0535888671875, -2.95361328125, -2.8536376953125, -2.753662109375, -2.6536865234375, -2.5537109375, -2.4537353515625, -2.353759765625, -2.2537841796875, -2.15380859375, -2.0538330078125, -1.953857421875, -1.8538818359375, -1.75390625, -1.6539306640625, -1.553955078125, -1.4539794921875, -1.35400390625, -1.2540283203125, -1.154052734375, -1.0540771484375, -0.9541015625, -0.8541259765625, -0.754150390625, -0.6541748046875, -0.55419921875, -0.4542236328125, -0.354248046875, -0.2542724609375, -0.154296875, -0.0543212890625, 0.045654296875, 0.1456298828125, 0.24560546875, 0.3455810546875, 0.445556640625, 0.5455322265625, 0.6455078125, 0.7454833984375, 0.845458984375, 0.9454345703125, 1.04541015625, 1.1453857421875, 1.245361328125, 1.3453369140625, 1.4453125, 1.5452880859375, 1.645263671875, 1.7452392578125, 1.84521484375, 1.9451904296875, 2.045166015625, 2.1451416015625, 2.2451171875, 2.3450927734375, 2.445068359375, 2.5450439453125, 2.64501953125, 2.7449951171875, 2.844970703125, 2.9449462890625, 3.044921875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 8.0, 6.0, 9.0, 12.0, 17.0, 20.0, 16.0, 26.0, 22.0, 27.0, 35.0, 35.0, 37.0, 41.0, 41.0, 63.0, 112.0, 195.0, 1387.0, 259.0, 163.0, 98.0, 58.0, 51.0, 32.0, 28.0, 33.0, 30.0, 26.0, 16.0, 22.0, 18.0, 12.0, 15.0, 7.0, 12.0, 9.0, 7.0, 8.0, 4.0, 3.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.6015625, -9.30029296875, -8.9990234375, -8.69775390625, -8.396484375, -8.09521484375, -7.7939453125, -7.49267578125, -7.19140625, -6.89013671875, -6.5888671875, -6.28759765625, -5.986328125, -5.68505859375, -5.3837890625, -5.08251953125, -4.78125, -4.47998046875, -4.1787109375, -3.87744140625, -3.576171875, -3.27490234375, -2.9736328125, -2.67236328125, -2.37109375, -2.06982421875, -1.7685546875, -1.46728515625, -1.166015625, -0.86474609375, -0.5634765625, -0.26220703125, 0.0390625, 0.34033203125, 0.6416015625, 0.94287109375, 1.244140625, 1.54541015625, 1.8466796875, 2.14794921875, 2.44921875, 2.75048828125, 3.0517578125, 3.35302734375, 3.654296875, 3.95556640625, 4.2568359375, 4.55810546875, 4.859375, 5.16064453125, 5.4619140625, 5.76318359375, 6.064453125, 6.36572265625, 6.6669921875, 6.96826171875, 7.26953125, 7.57080078125, 7.8720703125, 8.17333984375, 8.474609375, 8.77587890625, 9.0771484375, 9.37841796875, 9.6796875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 5.0, 12.0, 12.0, 11.0, 23.0, 23.0, 35.0, 33.0, 44.0, 81.0, 95.0, 173.0, 229.0, 386.0, 803.0, 2377.0, 28051.0, 2202367.0, 892385.0, 14929.0, 1793.0, 714.0, 368.0, 218.0, 134.0, 87.0, 80.0, 59.0, 48.0, 23.0, 19.0, 19.0, 15.0, 7.0, 11.0, 4.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.875, -20.240478515625, -19.60595703125, -18.971435546875, -18.3369140625, -17.702392578125, -17.06787109375, -16.433349609375, -15.798828125, -15.164306640625, -14.52978515625, -13.895263671875, -13.2607421875, -12.626220703125, -11.99169921875, -11.357177734375, -10.72265625, -10.088134765625, -9.45361328125, -8.819091796875, -8.1845703125, -7.550048828125, -6.91552734375, -6.281005859375, -5.646484375, -5.011962890625, -4.37744140625, -3.742919921875, -3.1083984375, -2.473876953125, -1.83935546875, -1.204833984375, -0.5703125, 0.064208984375, 0.69873046875, 1.333251953125, 1.9677734375, 2.602294921875, 3.23681640625, 3.871337890625, 4.505859375, 5.140380859375, 5.77490234375, 6.409423828125, 7.0439453125, 7.678466796875, 8.31298828125, 8.947509765625, 9.58203125, 10.216552734375, 10.85107421875, 11.485595703125, 12.1201171875, 12.754638671875, 13.38916015625, 14.023681640625, 14.658203125, 15.292724609375, 15.92724609375, 16.561767578125, 17.1962890625, 17.830810546875, 18.46533203125, 19.099853515625, 19.734375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 12.0, 29.0, 64.0, 126.0, 170.0, 216.0, 152.0, 131.0, 75.0, 27.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.57356071472168, -22.415613174438477, -21.25766372680664, -20.099716186523438, -18.941768646240234, -17.7838191986084, -16.625871658325195, -15.467923164367676, -14.309974670410156, -13.152026176452637, -11.994077682495117, -10.836130142211914, -9.678181648254395, -8.520233154296875, -7.362285137176514, -6.204337120056152, -5.046388626098633, -3.8884403705596924, -2.730492115020752, -1.5725438594818115, -0.4145956039428711, 0.7433528900146484, 1.9013009071350098, 3.059248924255371, 4.217197418212891, 5.37514591217041, 6.5330939292907715, 7.691041946411133, 8.848990440368652, 10.006938934326172, 11.164886474609375, 12.322834968566895, 13.480781555175781, 14.6387300491333, 15.79667854309082, 16.954626083374023, 18.11257553100586, 19.270523071289062, 20.428470611572266, 21.58641815185547, 22.744367599487305, 23.902315139770508, 25.060264587402344, 26.218212127685547, 27.37615966796875, 28.534109115600586, 29.69205665588379, 30.850006103515625, 32.00795364379883, 33.16590118408203, 34.323848724365234, 35.4818000793457, 36.639747619628906, 37.79769515991211, 38.95564270019531, 40.113590240478516, 41.27153778076172, 42.42948532104492, 43.587432861328125, 44.745384216308594, 45.9033317565918, 47.061279296875, 48.2192268371582, 49.377174377441406, 50.535125732421875]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 9.0, 8.0, 10.0, 10.0, 13.0, 17.0, 20.0, 21.0, 19.0, 30.0, 30.0, 23.0, 20.0, 34.0, 47.0, 46.0, 40.0, 32.0, 47.0, 47.0, 51.0, 44.0, 48.0, 28.0, 41.0, 32.0, 45.0, 34.0, 28.0, 19.0, 18.0, 23.0, 8.0, 23.0, 13.0, 6.0, 12.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.353559494018555, -28.451400756835938, -27.549240112304688, -26.64708137512207, -25.744922637939453, -24.842763900756836, -23.94060516357422, -23.03844451904297, -22.13628578186035, -21.234127044677734, -20.331966400146484, -19.429807662963867, -18.52764892578125, -17.625490188598633, -16.723331451416016, -15.821170806884766, -14.919012069702148, -14.016853332519531, -13.114693641662598, -12.212533950805664, -11.310375213623047, -10.40821647644043, -9.506056785583496, -8.603897094726562, -7.701738357543945, -6.79957914352417, -5.8974199295043945, -4.995260715484619, -4.093101501464844, -3.1909422874450684, -2.288783073425293, -1.3866238594055176, -0.4844646453857422, 0.4176945686340332, 1.3198537826538086, 2.222012996673584, 3.1241722106933594, 4.026331424713135, 4.92849063873291, 5.8306498527526855, 6.732809066772461, 7.634968280792236, 8.537127494812012, 9.439287185668945, 10.341445922851562, 11.24360466003418, 12.145764350891113, 13.047924041748047, 13.950082778930664, 14.852241516113281, 15.754401206970215, 16.65656089782715, 17.558719635009766, 18.460878372192383, 19.363037109375, 20.26519775390625, 21.167356491088867, 22.069515228271484, 22.971675872802734, 23.87383460998535, 24.77599334716797, 25.678152084350586, 26.580310821533203, 27.482471466064453, 28.38463020324707]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 7.0, 8.0, 13.0, 12.0, 11.0, 18.0, 21.0, 21.0, 26.0, 31.0, 17.0, 24.0, 32.0, 36.0, 47.0, 39.0, 44.0, 63.0, 52.0, 42.0, 36.0, 38.0, 44.0, 48.0, 34.0, 36.0, 23.0, 15.0, 21.0, 29.0, 11.0, 15.0, 15.0, 13.0, 11.0, 12.0, 10.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.10546875, -3.00701904296875, -2.9085693359375, -2.81011962890625, -2.711669921875, -2.61322021484375, -2.5147705078125, -2.41632080078125, -2.31787109375, -2.21942138671875, -2.1209716796875, -2.02252197265625, -1.924072265625, -1.82562255859375, -1.7271728515625, -1.62872314453125, -1.5302734375, -1.43182373046875, -1.3333740234375, -1.23492431640625, -1.136474609375, -1.03802490234375, -0.9395751953125, -0.84112548828125, -0.74267578125, -0.64422607421875, -0.5457763671875, -0.44732666015625, -0.348876953125, -0.25042724609375, -0.1519775390625, -0.05352783203125, 0.044921875, 0.14337158203125, 0.2418212890625, 0.34027099609375, 0.438720703125, 0.53717041015625, 0.6356201171875, 0.73406982421875, 0.83251953125, 0.93096923828125, 1.0294189453125, 1.12786865234375, 1.226318359375, 1.32476806640625, 1.4232177734375, 1.52166748046875, 1.6201171875, 1.71856689453125, 1.8170166015625, 1.91546630859375, 2.013916015625, 2.11236572265625, 2.2108154296875, 2.30926513671875, 2.40771484375, 2.50616455078125, 2.6046142578125, 2.70306396484375, 2.801513671875, 2.89996337890625, 2.9984130859375, 3.09686279296875, 3.1953125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 8.0, 3.0, 14.0, 16.0, 16.0, 25.0, 47.0, 67.0, 112.0, 131.0, 230.0, 388.0, 662.0, 1211.0, 2189.0, 4294.0, 8731.0, 18511.0, 40893.0, 94883.0, 226362.0, 529672.0, 1065270.0, 1146336.0, 599137.0, 258908.0, 108450.0, 46675.0, 20921.0, 9790.0, 4760.0, 2371.0, 1287.0, 743.0, 442.0, 282.0, 174.0, 78.0, 63.0, 44.0, 31.0, 13.0, 17.0, 11.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.484375, -3.385040283203125, -3.28570556640625, -3.186370849609375, -3.0870361328125, -2.987701416015625, -2.88836669921875, -2.789031982421875, -2.689697265625, -2.590362548828125, -2.49102783203125, -2.391693115234375, -2.2923583984375, -2.193023681640625, -2.09368896484375, -1.994354248046875, -1.89501953125, -1.795684814453125, -1.69635009765625, -1.597015380859375, -1.4976806640625, -1.398345947265625, -1.29901123046875, -1.199676513671875, -1.100341796875, -1.001007080078125, -0.90167236328125, -0.802337646484375, -0.7030029296875, -0.603668212890625, -0.50433349609375, -0.404998779296875, -0.3056640625, -0.206329345703125, -0.10699462890625, -0.007659912109375, 0.0916748046875, 0.191009521484375, 0.29034423828125, 0.389678955078125, 0.489013671875, 0.588348388671875, 0.68768310546875, 0.787017822265625, 0.8863525390625, 0.985687255859375, 1.08502197265625, 1.184356689453125, 1.28369140625, 1.383026123046875, 1.48236083984375, 1.581695556640625, 1.6810302734375, 1.780364990234375, 1.87969970703125, 1.979034423828125, 2.078369140625, 2.177703857421875, 2.27703857421875, 2.376373291015625, 2.4757080078125, 2.575042724609375, 2.67437744140625, 2.773712158203125, 2.873046875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 8.0, 6.0, 8.0, 6.0, 8.0, 14.0, 12.0, 31.0, 44.0, 44.0, 72.0, 88.0, 122.0, 136.0, 193.0, 243.0, 291.0, 397.0, 391.0, 385.0, 381.0, 286.0, 226.0, 178.0, 119.0, 84.0, 78.0, 64.0, 41.0, 29.0, 22.0, 15.0, 19.0, 6.0, 4.0, 6.0, 10.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0], "bins": [-6.33984375, -6.17205810546875, -6.0042724609375, -5.83648681640625, -5.668701171875, -5.50091552734375, -5.3331298828125, -5.16534423828125, -4.99755859375, -4.82977294921875, -4.6619873046875, -4.49420166015625, -4.326416015625, -4.15863037109375, -3.9908447265625, -3.82305908203125, -3.6552734375, -3.48748779296875, -3.3197021484375, -3.15191650390625, -2.984130859375, -2.81634521484375, -2.6485595703125, -2.48077392578125, -2.31298828125, -2.14520263671875, -1.9774169921875, -1.80963134765625, -1.641845703125, -1.47406005859375, -1.3062744140625, -1.13848876953125, -0.970703125, -0.80291748046875, -0.6351318359375, -0.46734619140625, -0.299560546875, -0.13177490234375, 0.0360107421875, 0.20379638671875, 0.37158203125, 0.53936767578125, 0.7071533203125, 0.87493896484375, 1.042724609375, 1.21051025390625, 1.3782958984375, 1.54608154296875, 1.7138671875, 1.88165283203125, 2.0494384765625, 2.21722412109375, 2.385009765625, 2.55279541015625, 2.7205810546875, 2.88836669921875, 3.05615234375, 3.22393798828125, 3.3917236328125, 3.55950927734375, 3.727294921875, 3.89508056640625, 4.0628662109375, 4.23065185546875, 4.3984375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 8.0, 10.0, 6.0, 13.0, 16.0, 22.0, 34.0, 44.0, 65.0, 81.0, 108.0, 170.0, 228.0, 445.0, 1501.0, 45567.0, 3338150.0, 797831.0, 8169.0, 757.0, 310.0, 198.0, 134.0, 120.0, 84.0, 58.0, 44.0, 29.0, 20.0, 11.0, 8.0, 8.0, 8.0, 7.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.421875, -19.65966796875, -18.8974609375, -18.13525390625, -17.373046875, -16.61083984375, -15.8486328125, -15.08642578125, -14.32421875, -13.56201171875, -12.7998046875, -12.03759765625, -11.275390625, -10.51318359375, -9.7509765625, -8.98876953125, -8.2265625, -7.46435546875, -6.7021484375, -5.93994140625, -5.177734375, -4.41552734375, -3.6533203125, -2.89111328125, -2.12890625, -1.36669921875, -0.6044921875, 0.15771484375, 0.919921875, 1.68212890625, 2.4443359375, 3.20654296875, 3.96875, 4.73095703125, 5.4931640625, 6.25537109375, 7.017578125, 7.77978515625, 8.5419921875, 9.30419921875, 10.06640625, 10.82861328125, 11.5908203125, 12.35302734375, 13.115234375, 13.87744140625, 14.6396484375, 15.40185546875, 16.1640625, 16.92626953125, 17.6884765625, 18.45068359375, 19.212890625, 19.97509765625, 20.7373046875, 21.49951171875, 22.26171875, 23.02392578125, 23.7861328125, 24.54833984375, 25.310546875, 26.07275390625, 26.8349609375, 27.59716796875, 28.359375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 14.0, 26.0, 37.0, 69.0, 108.0, 157.0, 155.0, 170.0, 128.0, 80.0, 37.0, 18.0, 9.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.42382049560547, -26.81435203552246, -25.20488166809082, -23.595413208007812, -21.985942840576172, -20.376474380493164, -18.767005920410156, -17.157535552978516, -15.548067092895508, -13.938597679138184, -12.32912826538086, -10.719659805297852, -9.110190391540527, -7.500720977783203, -5.891252517700195, -4.281783103942871, -2.672313690185547, -1.0628445148468018, 0.5466246604919434, 2.1560935974121094, 3.7655630111694336, 5.375032424926758, 6.984500885009766, 8.59397029876709, 10.203439712524414, 11.812909126281738, 13.422378540039062, 15.03184700012207, 16.641315460205078, 18.25078582763672, 19.860254287719727, 21.469722747802734, 23.079193115234375, 24.688661575317383, 26.298131942749023, 27.90760040283203, 29.517070770263672, 31.12653923034668, 32.73600769042969, 34.34547805786133, 35.95494842529297, 37.56441879272461, 39.173885345458984, 40.783355712890625, 42.392826080322266, 44.002296447753906, 45.61176300048828, 47.22123336791992, 48.8306999206543, 50.44017028808594, 52.04963684082031, 53.65910720825195, 55.268577575683594, 56.87804412841797, 58.48751449584961, 60.09698486328125, 61.706451416015625, 63.315921783447266, 64.9253921508789, 66.53485870361328, 68.14432525634766, 69.75379943847656, 71.36326599121094, 72.97273254394531, 74.58220672607422]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 14.0, 5.0, 9.0, 9.0, 7.0, 9.0, 10.0, 11.0, 20.0, 13.0, 19.0, 24.0, 25.0, 27.0, 16.0, 32.0, 29.0, 23.0, 33.0, 36.0, 33.0, 38.0, 28.0, 37.0, 36.0, 26.0, 43.0, 29.0, 41.0, 25.0, 39.0, 25.0, 26.0, 27.0, 19.0, 23.0, 27.0, 17.0, 9.0, 11.0, 14.0, 9.0, 8.0, 8.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-15.946121215820312, -15.441732406616211, -14.937342643737793, -14.432952880859375, -13.928564071655273, -13.424175262451172, -12.919785499572754, -12.415395736694336, -11.911006927490234, -11.406618118286133, -10.902228355407715, -10.397838592529297, -9.893449783325195, -9.389060974121094, -8.884671211242676, -8.380281448364258, -7.875892639160156, -7.3715033531188965, -6.867114067077637, -6.362724781036377, -5.858335494995117, -5.353946208953857, -4.849556922912598, -4.345167636871338, -3.840778350830078, -3.3363890647888184, -2.8319997787475586, -2.327610492706299, -1.823221206665039, -1.3188319206237793, -0.8144426345825195, -0.31005334854125977, 0.1943359375, 0.6987252235412598, 1.2031145095825195, 1.7075037956237793, 2.211893081665039, 2.716282367706299, 3.2206716537475586, 3.7250609397888184, 4.229450225830078, 4.733839511871338, 5.238228797912598, 5.742618083953857, 6.247007369995117, 6.751396656036377, 7.255785942077637, 7.7601752281188965, 8.264564514160156, 8.768953323364258, 9.273343086242676, 9.777732849121094, 10.282121658325195, 10.786510467529297, 11.290900230407715, 11.795289993286133, 12.299678802490234, 12.804067611694336, 13.308457374572754, 13.812847137451172, 14.317235946655273, 14.821624755859375, 15.326014518737793, 15.830404281616211, 16.334793090820312]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 10.0, 9.0, 9.0, 18.0, 18.0, 14.0, 19.0, 20.0, 28.0, 26.0, 26.0, 44.0, 30.0, 29.0, 45.0, 44.0, 54.0, 45.0, 39.0, 52.0, 32.0, 36.0, 38.0, 42.0, 32.0, 33.0, 17.0, 19.0, 18.0, 26.0, 9.0, 8.0, 20.0, 19.0, 17.0, 8.0, 4.0, 7.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.099609375, -3.008575439453125, -2.91754150390625, -2.826507568359375, -2.7354736328125, -2.644439697265625, -2.55340576171875, -2.462371826171875, -2.371337890625, -2.280303955078125, -2.18927001953125, -2.098236083984375, -2.0072021484375, -1.916168212890625, -1.82513427734375, -1.734100341796875, -1.64306640625, -1.552032470703125, -1.46099853515625, -1.369964599609375, -1.2789306640625, -1.187896728515625, -1.09686279296875, -1.005828857421875, -0.914794921875, -0.823760986328125, -0.73272705078125, -0.641693115234375, -0.5506591796875, -0.459625244140625, -0.36859130859375, -0.277557373046875, -0.1865234375, -0.095489501953125, -0.00445556640625, 0.086578369140625, 0.1776123046875, 0.268646240234375, 0.35968017578125, 0.450714111328125, 0.541748046875, 0.632781982421875, 0.72381591796875, 0.814849853515625, 0.9058837890625, 0.996917724609375, 1.08795166015625, 1.178985595703125, 1.27001953125, 1.361053466796875, 1.45208740234375, 1.543121337890625, 1.6341552734375, 1.725189208984375, 1.81622314453125, 1.907257080078125, 1.998291015625, 2.089324951171875, 2.18035888671875, 2.271392822265625, 2.3624267578125, 2.453460693359375, 2.54449462890625, 2.635528564453125, 2.7265625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 12.0, 15.0, 20.0, 29.0, 55.0, 61.0, 100.0, 149.0, 177.0, 286.0, 342.0, 540.0, 720.0, 1046.0, 1438.0, 1983.0, 2729.0, 3849.0, 5423.0, 7639.0, 11142.0, 16322.0, 24012.0, 37108.0, 59080.0, 104783.0, 275079.0, 230047.0, 97705.0, 56091.0, 35252.0, 22967.0, 15834.0, 10788.0, 7486.0, 5280.0, 3714.0, 2637.0, 1898.0, 1338.0, 994.0, 678.0, 520.0, 322.0, 256.0, 172.0, 120.0, 116.0, 56.0, 39.0, 46.0, 23.0, 19.0, 12.0, 4.0, 2.0, 2.0, 5.0], "bins": [-0.118896484375, -0.11528778076171875, -0.1116790771484375, -0.10807037353515625, -0.104461669921875, -0.10085296630859375, -0.0972442626953125, -0.09363555908203125, -0.09002685546875, -0.08641815185546875, -0.0828094482421875, -0.07920074462890625, -0.075592041015625, -0.07198333740234375, -0.0683746337890625, -0.06476593017578125, -0.0611572265625, -0.05754852294921875, -0.0539398193359375, -0.05033111572265625, -0.046722412109375, -0.04311370849609375, -0.0395050048828125, -0.03589630126953125, -0.03228759765625, -0.02867889404296875, -0.0250701904296875, -0.02146148681640625, -0.017852783203125, -0.01424407958984375, -0.0106353759765625, -0.00702667236328125, -0.00341796875, 0.00019073486328125, 0.0037994384765625, 0.00740814208984375, 0.011016845703125, 0.01462554931640625, 0.0182342529296875, 0.02184295654296875, 0.02545166015625, 0.02906036376953125, 0.0326690673828125, 0.03627777099609375, 0.039886474609375, 0.04349517822265625, 0.0471038818359375, 0.05071258544921875, 0.0543212890625, 0.05792999267578125, 0.0615386962890625, 0.06514739990234375, 0.068756103515625, 0.07236480712890625, 0.0759735107421875, 0.07958221435546875, 0.08319091796875, 0.08679962158203125, 0.0904083251953125, 0.09401702880859375, 0.097625732421875, 0.10123443603515625, 0.1048431396484375, 0.10845184326171875, 0.112060546875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 7.0, 6.0, 5.0, 10.0, 13.0, 16.0, 12.0, 13.0, 20.0, 20.0, 19.0, 22.0, 29.0, 34.0, 30.0, 37.0, 41.0, 46.0, 43.0, 35.0, 1050.0, 36.0, 28.0, 52.0, 34.0, 32.0, 41.0, 32.0, 25.0, 42.0, 28.0, 28.0, 24.0, 12.0, 10.0, 18.0, 11.0, 14.0, 12.0, 3.0, 12.0, 6.0, 3.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.056640625, -1.993927001953125, -1.93121337890625, -1.868499755859375, -1.8057861328125, -1.743072509765625, -1.68035888671875, -1.617645263671875, -1.554931640625, -1.492218017578125, -1.42950439453125, -1.366790771484375, -1.3040771484375, -1.241363525390625, -1.17864990234375, -1.115936279296875, -1.05322265625, -0.990509033203125, -0.92779541015625, -0.865081787109375, -0.8023681640625, -0.739654541015625, -0.67694091796875, -0.614227294921875, -0.551513671875, -0.488800048828125, -0.42608642578125, -0.363372802734375, -0.3006591796875, -0.237945556640625, -0.17523193359375, -0.112518310546875, -0.0498046875, 0.012908935546875, 0.07562255859375, 0.138336181640625, 0.2010498046875, 0.263763427734375, 0.32647705078125, 0.389190673828125, 0.451904296875, 0.514617919921875, 0.57733154296875, 0.640045166015625, 0.7027587890625, 0.765472412109375, 0.82818603515625, 0.890899658203125, 0.95361328125, 1.016326904296875, 1.07904052734375, 1.141754150390625, 1.2044677734375, 1.267181396484375, 1.32989501953125, 1.392608642578125, 1.455322265625, 1.518035888671875, 1.58074951171875, 1.643463134765625, 1.7061767578125, 1.768890380859375, 1.83160400390625, 1.894317626953125, 1.95703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 7.0, 12.0, 14.0, 21.0, 30.0, 37.0, 78.0, 98.0, 130.0, 200.0, 293.0, 424.0, 633.0, 871.0, 1340.0, 1835.0, 2620.0, 3663.0, 5370.0, 7477.0, 11049.0, 16329.0, 24141.0, 36563.0, 58421.0, 98813.0, 188288.0, 1312407.0, 124517.0, 70127.0, 43275.0, 27891.0, 18523.0, 12679.0, 8855.0, 6051.0, 4193.0, 2990.0, 2063.0, 1473.0, 975.0, 738.0, 511.0, 342.0, 244.0, 163.0, 126.0, 81.0, 59.0, 38.0, 22.0, 19.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.056365966796875, -0.054558753967285156, -0.05275154113769531, -0.05094432830810547, -0.049137115478515625, -0.04732990264892578, -0.04552268981933594, -0.043715476989746094, -0.04190826416015625, -0.040101051330566406, -0.03829383850097656, -0.03648662567138672, -0.034679412841796875, -0.03287220001220703, -0.031064987182617188, -0.029257774353027344, -0.0274505615234375, -0.025643348693847656, -0.023836135864257812, -0.02202892303466797, -0.020221710205078125, -0.01841449737548828, -0.016607284545898438, -0.014800071716308594, -0.01299285888671875, -0.011185646057128906, -0.009378433227539062, -0.007571220397949219, -0.005764007568359375, -0.003956794738769531, -0.0021495819091796875, -0.00034236907958984375, 0.00146484375, 0.0032720565795898438, 0.0050792694091796875, 0.006886482238769531, 0.008693695068359375, 0.010500907897949219, 0.012308120727539062, 0.014115333557128906, 0.01592254638671875, 0.017729759216308594, 0.019536972045898438, 0.02134418487548828, 0.023151397705078125, 0.02495861053466797, 0.026765823364257812, 0.028573036193847656, 0.0303802490234375, 0.032187461853027344, 0.03399467468261719, 0.03580188751220703, 0.037609100341796875, 0.03941631317138672, 0.04122352600097656, 0.043030738830566406, 0.04483795166015625, 0.046645164489746094, 0.04845237731933594, 0.05025959014892578, 0.052066802978515625, 0.05387401580810547, 0.05568122863769531, 0.057488441467285156, 0.059295654296875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 0.0, 5.0, 4.0, 4.0, 2.0, 4.0, 12.0, 10.0, 10.0, 11.0, 23.0, 24.0, 71.0, 54.0, 89.0, 427.0, 57.0, 48.0, 26.0, 46.0, 15.0, 13.0, 7.0, 13.0, 4.0, 5.0, 10.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-06, -1.7713755369186401e-06, -1.695007085800171e-06, -1.6186386346817017e-06, -1.5422701835632324e-06, -1.4659017324447632e-06, -1.389533281326294e-06, -1.3131648302078247e-06, -1.2367963790893555e-06, -1.1604279279708862e-06, -1.084059476852417e-06, -1.0076910257339478e-06, -9.313225746154785e-07, -8.549541234970093e-07, -7.7858567237854e-07, -7.022172212600708e-07, -6.258487701416016e-07, -5.494803190231323e-07, -4.731118679046631e-07, -3.9674341678619385e-07, -3.203749656677246e-07, -2.4400651454925537e-07, -1.6763806343078613e-07, -9.12696123123169e-08, -1.4901161193847656e-08, 6.146728992462158e-08, 1.3783574104309082e-07, 2.1420419216156006e-07, 2.905726432800293e-07, 3.6694109439849854e-07, 4.4330954551696777e-07, 5.19677996635437e-07, 5.960464477539062e-07, 6.724148988723755e-07, 7.487833499908447e-07, 8.25151801109314e-07, 9.015202522277832e-07, 9.778887033462524e-07, 1.0542571544647217e-06, 1.130625605583191e-06, 1.2069940567016602e-06, 1.2833625078201294e-06, 1.3597309589385986e-06, 1.4360994100570679e-06, 1.5124678611755371e-06, 1.5888363122940063e-06, 1.6652047634124756e-06, 1.7415732145309448e-06, 1.817941665649414e-06, 1.8943101167678833e-06, 1.9706785678863525e-06, 2.0470470190048218e-06, 2.123415470123291e-06, 2.1997839212417603e-06, 2.2761523723602295e-06, 2.3525208234786987e-06, 2.428889274597168e-06, 2.505257725715637e-06, 2.5816261768341064e-06, 2.6579946279525757e-06, 2.734363079071045e-06, 2.810731530189514e-06, 2.8870999813079834e-06, 2.9634684324264526e-06, 3.039836883544922e-06]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 6.0, 13.0, 7.0, 14.0, 28.0, 51.0, 78.0, 165.0, 1487.0, 865858.0, 179633.0, 841.0, 170.0, 75.0, 34.0, 22.0, 17.0, 8.0, 12.0, 8.0, 2.0, 1.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-6.872415542602539e-05, -6.700213998556137e-05, -6.528012454509735e-05, -6.355810910463333e-05, -6.183609366416931e-05, -6.011407822370529e-05, -5.839206278324127e-05, -5.667004734277725e-05, -5.494803190231323e-05, -5.322601646184921e-05, -5.150400102138519e-05, -4.978198558092117e-05, -4.805997014045715e-05, -4.6337954699993134e-05, -4.4615939259529114e-05, -4.2893923819065094e-05, -4.1171908378601074e-05, -3.9449892938137054e-05, -3.7727877497673035e-05, -3.6005862057209015e-05, -3.4283846616744995e-05, -3.2561831176280975e-05, -3.0839815735816956e-05, -2.9117800295352936e-05, -2.7395784854888916e-05, -2.5673769414424896e-05, -2.3951753973960876e-05, -2.2229738533496857e-05, -2.0507723093032837e-05, -1.8785707652568817e-05, -1.7063692212104797e-05, -1.5341676771640778e-05, -1.3619661331176758e-05, -1.1897645890712738e-05, -1.0175630450248718e-05, -8.453615009784698e-06, -6.731599569320679e-06, -5.009584128856659e-06, -3.287568688392639e-06, -1.5655532479286194e-06, 1.564621925354004e-07, 1.8784776329994202e-06, 3.60049307346344e-06, 5.32250851392746e-06, 7.0445239543914795e-06, 8.7665393948555e-06, 1.0488554835319519e-05, 1.2210570275783539e-05, 1.3932585716247559e-05, 1.565460115671158e-05, 1.7376616597175598e-05, 1.9098632037639618e-05, 2.0820647478103638e-05, 2.2542662918567657e-05, 2.4264678359031677e-05, 2.5986693799495697e-05, 2.7708709239959717e-05, 2.9430724680423737e-05, 3.1152740120887756e-05, 3.2874755561351776e-05, 3.4596771001815796e-05, 3.6318786442279816e-05, 3.8040801882743835e-05, 3.9762817323207855e-05, 4.1484832763671875e-05]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 8.0, 21.0, 27.0, 27.0, 41.0, 52.0, 62.0, 77.0, 95.0, 224.0, 91.0, 49.0, 54.0, 34.0, 32.0, 28.0, 12.0, 10.0, 11.0, 7.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.328449219632603e-07, -5.116322654430405e-07, -4.904196089228208e-07, -4.692069239808916e-07, -4.4799426746067184e-07, -4.267816109404521e-07, -4.055689259985229e-07, -3.8435626947830315e-07, -3.631436129580834e-07, -3.4193095643786364e-07, -3.207182999176439e-07, -2.995056149757147e-07, -2.7829295845549495e-07, -2.570803019352752e-07, -2.3586763120420073e-07, -2.1465496047312627e-07, -1.9344230395290651e-07, -1.7222964743268676e-07, -1.510169767016123e-07, -1.2980430597053783e-07, -1.0859164945031807e-07, -8.737898582467096e-08, -6.616632219902385e-08, -4.4953651467949385e-08, -2.3740994947729632e-08, -2.528331322082522e-09, 1.8684332303564588e-08, 3.98969959292117e-08, 6.110965955485881e-08, 8.232232318050592e-08, 1.0353498680615303e-07, 1.247476575372275e-07, 1.459603709008661e-07, 1.6717302742108586e-07, 1.8838569815216033e-07, 2.095983688832348e-07, 2.3081102540345455e-07, 2.520236819236743e-07, 2.732363668656035e-07, 2.9444902338582324e-07, 3.15661679906043e-07, 3.3687433642626274e-07, 3.580869929464825e-07, 3.792996778884117e-07, 4.0051233440863143e-07, 4.217249909288512e-07, 4.4293767587078037e-07, 4.641503323910001e-07, 4.853629889112199e-07, 5.065756454314396e-07, 5.277883019516594e-07, 5.490009584718791e-07, 5.702136149920989e-07, 5.914263283557375e-07, 6.126389848759572e-07, 6.33851641396177e-07, 6.550642979163968e-07, 6.762769544366165e-07, 6.974896109568363e-07, 7.18702267477056e-07, 7.399149808406946e-07, 7.611276373609144e-07, 7.823402938811341e-07, 8.035529504013539e-07, 8.247656069215736e-07]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 15.0, 0.0, 0.0, 29.0, 0.0, 0.0, 0.0, 49.0, 0.0, 0.0, 103.0, 0.0, 0.0, 155.0, 0.0, 0.0, 0.0, 242.0, 0.0, 0.0, 198.0, 0.0, 0.0, 0.0, 108.0, 0.0, 0.0, 58.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.364418029785156e-07, -5.187466740608215e-07, -5.010515451431274e-07, -4.833564162254333e-07, -4.6566128730773926e-07, -4.4796615839004517e-07, -4.302710294723511e-07, -4.12575900554657e-07, -3.948807716369629e-07, -3.771856427192688e-07, -3.594905138015747e-07, -3.417953848838806e-07, -3.241002559661865e-07, -3.0640512704849243e-07, -2.8870999813079834e-07, -2.7101486921310425e-07, -2.5331974029541016e-07, -2.3562461137771606e-07, -2.1792948246002197e-07, -2.0023435354232788e-07, -1.825392246246338e-07, -1.648440957069397e-07, -1.471489667892456e-07, -1.2945383787155151e-07, -1.1175870895385742e-07, -9.406358003616333e-08, -7.636845111846924e-08, -5.8673322200775146e-08, -4.0978193283081055e-08, -2.3283064365386963e-08, -5.587935447692871e-09, 1.210719347000122e-08, 2.9802322387695312e-08, 4.7497451305389404e-08, 6.51925802230835e-08, 8.288770914077759e-08, 1.0058283805847168e-07, 1.1827796697616577e-07, 1.3597309589385986e-07, 1.5366822481155396e-07, 1.7136335372924805e-07, 1.8905848264694214e-07, 2.0675361156463623e-07, 2.2444874048233032e-07, 2.421438694000244e-07, 2.598389983177185e-07, 2.775341272354126e-07, 2.952292561531067e-07, 3.129243850708008e-07, 3.3061951398849487e-07, 3.4831464290618896e-07, 3.6600977182388306e-07, 3.8370490074157715e-07, 4.0140002965927124e-07, 4.1909515857696533e-07, 4.367902874946594e-07, 4.544854164123535e-07, 4.721805453300476e-07, 4.898756742477417e-07, 5.075708031654358e-07, 5.252659320831299e-07, 5.42961061000824e-07, 5.606561899185181e-07, 5.783513188362122e-07, 5.960464477539062e-07]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 10.0, 9.0, 9.0, 18.0, 18.0, 14.0, 19.0, 20.0, 28.0, 26.0, 26.0, 44.0, 30.0, 29.0, 45.0, 44.0, 54.0, 45.0, 39.0, 52.0, 32.0, 36.0, 38.0, 42.0, 32.0, 33.0, 17.0, 19.0, 18.0, 26.0, 9.0, 8.0, 20.0, 19.0, 17.0, 8.0, 4.0, 7.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.099609375, -3.008575439453125, -2.91754150390625, -2.826507568359375, -2.7354736328125, -2.644439697265625, -2.55340576171875, -2.462371826171875, -2.371337890625, -2.280303955078125, -2.18927001953125, -2.098236083984375, -2.0072021484375, -1.916168212890625, -1.82513427734375, -1.734100341796875, -1.64306640625, -1.552032470703125, -1.46099853515625, -1.369964599609375, -1.2789306640625, -1.187896728515625, -1.09686279296875, -1.005828857421875, -0.914794921875, -0.823760986328125, -0.73272705078125, -0.641693115234375, -0.5506591796875, -0.459625244140625, -0.36859130859375, -0.277557373046875, -0.1865234375, -0.095489501953125, -0.00445556640625, 0.086578369140625, 0.1776123046875, 0.268646240234375, 0.35968017578125, 0.450714111328125, 0.541748046875, 0.632781982421875, 0.72381591796875, 0.814849853515625, 0.9058837890625, 0.996917724609375, 1.08795166015625, 1.178985595703125, 1.27001953125, 1.361053466796875, 1.45208740234375, 1.543121337890625, 1.6341552734375, 1.725189208984375, 1.81622314453125, 1.907257080078125, 1.998291015625, 2.089324951171875, 2.18035888671875, 2.271392822265625, 2.3624267578125, 2.453460693359375, 2.54449462890625, 2.635528564453125, 2.7265625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 11.0, 10.0, 16.0, 13.0, 37.0, 61.0, 104.0, 147.0, 257.0, 452.0, 722.0, 1252.0, 2019.0, 3418.0, 5677.0, 9520.0, 15660.0, 26898.0, 49979.0, 101519.0, 216342.0, 286241.0, 160830.0, 75009.0, 38592.0, 21762.0, 12745.0, 7596.0, 4635.0, 2860.0, 1728.0, 963.0, 592.0, 369.0, 198.0, 105.0, 68.0, 55.0, 36.0, 18.0, 11.0, 11.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.62890625, -3.523101806640625, -3.41729736328125, -3.311492919921875, -3.2056884765625, -3.099884033203125, -2.99407958984375, -2.888275146484375, -2.782470703125, -2.676666259765625, -2.57086181640625, -2.465057373046875, -2.3592529296875, -2.253448486328125, -2.14764404296875, -2.041839599609375, -1.93603515625, -1.830230712890625, -1.72442626953125, -1.618621826171875, -1.5128173828125, -1.407012939453125, -1.30120849609375, -1.195404052734375, -1.089599609375, -0.983795166015625, -0.87799072265625, -0.772186279296875, -0.6663818359375, -0.560577392578125, -0.45477294921875, -0.348968505859375, -0.2431640625, -0.137359619140625, -0.03155517578125, 0.074249267578125, 0.1800537109375, 0.285858154296875, 0.39166259765625, 0.497467041015625, 0.603271484375, 0.709075927734375, 0.81488037109375, 0.920684814453125, 1.0264892578125, 1.132293701171875, 1.23809814453125, 1.343902587890625, 1.44970703125, 1.555511474609375, 1.66131591796875, 1.767120361328125, 1.8729248046875, 1.978729248046875, 2.08453369140625, 2.190338134765625, 2.296142578125, 2.401947021484375, 2.50775146484375, 2.613555908203125, 2.7193603515625, 2.825164794921875, 2.93096923828125, 3.036773681640625, 3.142578125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 4.0, 8.0, 6.0, 11.0, 18.0, 19.0, 24.0, 18.0, 20.0, 29.0, 41.0, 37.0, 39.0, 22.0, 58.0, 67.0, 77.0, 128.0, 243.0, 1398.0, 197.0, 100.0, 75.0, 63.0, 59.0, 35.0, 36.0, 28.0, 21.0, 17.0, 23.0, 16.0, 19.0, 16.0, 10.0, 12.0, 7.0, 8.0, 3.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-9.890625, -9.5843505859375, -9.278076171875, -8.9718017578125, -8.66552734375, -8.3592529296875, -8.052978515625, -7.7467041015625, -7.4404296875, -7.1341552734375, -6.827880859375, -6.5216064453125, -6.21533203125, -5.9090576171875, -5.602783203125, -5.2965087890625, -4.990234375, -4.6839599609375, -4.377685546875, -4.0714111328125, -3.76513671875, -3.4588623046875, -3.152587890625, -2.8463134765625, -2.5400390625, -2.2337646484375, -1.927490234375, -1.6212158203125, -1.31494140625, -1.0086669921875, -0.702392578125, -0.3961181640625, -0.08984375, 0.2164306640625, 0.522705078125, 0.8289794921875, 1.13525390625, 1.4415283203125, 1.747802734375, 2.0540771484375, 2.3603515625, 2.6666259765625, 2.972900390625, 3.2791748046875, 3.58544921875, 3.8917236328125, 4.197998046875, 4.5042724609375, 4.810546875, 5.1168212890625, 5.423095703125, 5.7293701171875, 6.03564453125, 6.3419189453125, 6.648193359375, 6.9544677734375, 7.2607421875, 7.5670166015625, 7.873291015625, 8.1795654296875, 8.48583984375, 8.7921142578125, 9.098388671875, 9.4046630859375, 9.7109375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 9.0, 6.0, 8.0, 8.0, 19.0, 22.0, 28.0, 25.0, 40.0, 39.0, 66.0, 76.0, 108.0, 128.0, 212.0, 360.0, 1123.0, 11329.0, 475158.0, 2604916.0, 47794.0, 2628.0, 556.0, 283.0, 192.0, 131.0, 98.0, 91.0, 57.0, 31.0, 26.0, 27.0, 27.0, 19.0, 14.0, 8.0, 7.0, 8.0, 2.0, 9.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.078125, -19.43505859375, -18.7919921875, -18.14892578125, -17.505859375, -16.86279296875, -16.2197265625, -15.57666015625, -14.93359375, -14.29052734375, -13.6474609375, -13.00439453125, -12.361328125, -11.71826171875, -11.0751953125, -10.43212890625, -9.7890625, -9.14599609375, -8.5029296875, -7.85986328125, -7.216796875, -6.57373046875, -5.9306640625, -5.28759765625, -4.64453125, -4.00146484375, -3.3583984375, -2.71533203125, -2.072265625, -1.42919921875, -0.7861328125, -0.14306640625, 0.5, 1.14306640625, 1.7861328125, 2.42919921875, 3.072265625, 3.71533203125, 4.3583984375, 5.00146484375, 5.64453125, 6.28759765625, 6.9306640625, 7.57373046875, 8.216796875, 8.85986328125, 9.5029296875, 10.14599609375, 10.7890625, 11.43212890625, 12.0751953125, 12.71826171875, 13.361328125, 14.00439453125, 14.6474609375, 15.29052734375, 15.93359375, 16.57666015625, 17.2197265625, 17.86279296875, 18.505859375, 19.14892578125, 19.7919921875, 20.43505859375, 21.078125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 200.0, 817.0], "bins": [-514.3544921875, -506.2168273925781, -498.0791320800781, -489.94146728515625, -481.8038024902344, -473.6661376953125, -465.5284423828125, -457.3907775878906, -449.25311279296875, -441.1154479980469, -432.9777526855469, -424.840087890625, -416.7024230957031, -408.56475830078125, -400.42706298828125, -392.2893981933594, -384.1517028808594, -376.0140380859375, -367.8763427734375, -359.7386779785156, -351.60101318359375, -343.46331787109375, -335.3256530761719, -327.18798828125, -319.05029296875, -310.9126281738281, -302.7749328613281, -294.63726806640625, -286.4996032714844, -278.3619384765625, -270.2242431640625, -262.0865783691406, -253.9488983154297, -245.81121826171875, -237.67355346679688, -229.53587341308594, -221.398193359375, -213.26052856445312, -205.1228485107422, -196.98516845703125, -188.84750366210938, -180.70982360839844, -172.57215881347656, -164.43447875976562, -156.29681396484375, -148.1591339111328, -140.02145385742188, -131.8837890625, -123.7461166381836, -115.60844421386719, -107.47076416015625, -99.33309173583984, -91.19541931152344, -83.05774688720703, -74.92007446289062, -66.78239440917969, -58.644718170166016, -50.507041931152344, -42.36936950683594, -34.23169708251953, -26.09402084350586, -17.956348419189453, -9.818672180175781, -1.6809959411621094, 6.4566755294799805]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 13.0, 4.0, 12.0, 8.0, 20.0, 26.0, 10.0, 17.0, 16.0, 23.0, 30.0, 26.0, 22.0, 16.0, 26.0, 35.0, 41.0, 47.0, 55.0, 54.0, 45.0, 31.0, 40.0, 34.0, 41.0, 26.0, 37.0, 25.0, 23.0, 28.0, 25.0, 26.0, 18.0, 12.0, 12.0, 7.0, 13.0, 13.0, 8.0, 8.0, 6.0, 3.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.11357879638672, -24.307601928710938, -23.501625061035156, -22.695648193359375, -21.889673233032227, -21.083696365356445, -20.277719497680664, -19.471742630004883, -18.665767669677734, -17.859790802001953, -17.053813934326172, -16.24783706665039, -15.441862106323242, -14.635885238647461, -13.82990837097168, -13.023931503295898, -12.217954635620117, -11.411977767944336, -10.606001853942871, -9.80002498626709, -8.994049072265625, -8.188072204589844, -7.3820953369140625, -6.5761189460754395, -5.770142555236816, -4.964166164398193, -4.15818977355957, -3.352212905883789, -2.546236515045166, -1.740260124206543, -0.9342832565307617, -0.12830686569213867, 0.6776695251464844, 1.483646035194397, 2.2896225452423096, 3.0955991744995117, 3.9015755653381348, 4.707551956176758, 5.513528823852539, 6.319505214691162, 7.125481605529785, 7.931457996368408, 8.737434387207031, 9.543411254882812, 10.349388122558594, 11.155364036560059, 11.96134090423584, 12.767316818237305, 13.573293685913086, 14.379270553588867, 15.185246467590332, 15.991223335266113, 16.797199249267578, 17.60317611694336, 18.40915298461914, 19.215129852294922, 20.021106719970703, 20.827083587646484, 21.633060455322266, 22.439037322998047, 23.245012283325195, 24.050989151000977, 24.856966018676758, 25.66294288635254, 26.468917846679688]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 2.0, 9.0, 3.0, 11.0, 8.0, 14.0, 10.0, 15.0, 15.0, 23.0, 17.0, 26.0, 36.0, 31.0, 22.0, 41.0, 26.0, 38.0, 48.0, 48.0, 51.0, 37.0, 43.0, 45.0, 35.0, 32.0, 33.0, 39.0, 28.0, 26.0, 26.0, 19.0, 15.0, 19.0, 18.0, 16.0, 18.0, 10.0, 5.0, 8.0, 6.0, 6.0, 10.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.25, -3.155059814453125, -3.06011962890625, -2.965179443359375, -2.8702392578125, -2.775299072265625, -2.68035888671875, -2.585418701171875, -2.490478515625, -2.395538330078125, -2.30059814453125, -2.205657958984375, -2.1107177734375, -2.015777587890625, -1.92083740234375, -1.825897216796875, -1.73095703125, -1.636016845703125, -1.54107666015625, -1.446136474609375, -1.3511962890625, -1.256256103515625, -1.16131591796875, -1.066375732421875, -0.971435546875, -0.876495361328125, -0.78155517578125, -0.686614990234375, -0.5916748046875, -0.496734619140625, -0.40179443359375, -0.306854248046875, -0.2119140625, -0.116973876953125, -0.02203369140625, 0.072906494140625, 0.1678466796875, 0.262786865234375, 0.35772705078125, 0.452667236328125, 0.547607421875, 0.642547607421875, 0.73748779296875, 0.832427978515625, 0.9273681640625, 1.022308349609375, 1.11724853515625, 1.212188720703125, 1.30712890625, 1.402069091796875, 1.49700927734375, 1.591949462890625, 1.6868896484375, 1.781829833984375, 1.87677001953125, 1.971710205078125, 2.066650390625, 2.161590576171875, 2.25653076171875, 2.351470947265625, 2.4464111328125, 2.541351318359375, 2.63629150390625, 2.731231689453125, 2.826171875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 8.0, 10.0, 13.0, 5.0, 12.0, 22.0, 15.0, 16.0, 33.0, 35.0, 52.0, 74.0, 159.0, 406.0, 1027.0, 3178.0, 11297.0, 44860.0, 199892.0, 910458.0, 2057057.0, 751278.0, 163011.0, 37261.0, 9571.0, 2776.0, 970.0, 312.0, 166.0, 65.0, 38.0, 31.0, 22.0, 16.0, 15.0, 16.0, 12.0, 13.0, 17.0, 7.0, 8.0, 9.0, 4.0, 4.0, 8.0, 2.0, 1.0, 5.0, 1.0, 3.0], "bins": [-6.35546875, -6.1708984375, -5.986328125, -5.8017578125, -5.6171875, -5.4326171875, -5.248046875, -5.0634765625, -4.87890625, -4.6943359375, -4.509765625, -4.3251953125, -4.140625, -3.9560546875, -3.771484375, -3.5869140625, -3.40234375, -3.2177734375, -3.033203125, -2.8486328125, -2.6640625, -2.4794921875, -2.294921875, -2.1103515625, -1.92578125, -1.7412109375, -1.556640625, -1.3720703125, -1.1875, -1.0029296875, -0.818359375, -0.6337890625, -0.44921875, -0.2646484375, -0.080078125, 0.1044921875, 0.2890625, 0.4736328125, 0.658203125, 0.8427734375, 1.02734375, 1.2119140625, 1.396484375, 1.5810546875, 1.765625, 1.9501953125, 2.134765625, 2.3193359375, 2.50390625, 2.6884765625, 2.873046875, 3.0576171875, 3.2421875, 3.4267578125, 3.611328125, 3.7958984375, 3.98046875, 4.1650390625, 4.349609375, 4.5341796875, 4.71875, 4.9033203125, 5.087890625, 5.2724609375, 5.45703125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 9.0, 8.0, 10.0, 11.0, 17.0, 16.0, 17.0, 26.0, 36.0, 47.0, 61.0, 62.0, 106.0, 83.0, 119.0, 165.0, 181.0, 221.0, 290.0, 302.0, 337.0, 336.0, 297.0, 226.0, 210.0, 176.0, 136.0, 132.0, 93.0, 79.0, 50.0, 46.0, 34.0, 25.0, 22.0, 20.0, 10.0, 14.0, 8.0, 4.0, 8.0, 6.0, 5.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.09765625, -3.95989990234375, -3.8221435546875, -3.68438720703125, -3.546630859375, -3.40887451171875, -3.2711181640625, -3.13336181640625, -2.99560546875, -2.85784912109375, -2.7200927734375, -2.58233642578125, -2.444580078125, -2.30682373046875, -2.1690673828125, -2.03131103515625, -1.8935546875, -1.75579833984375, -1.6180419921875, -1.48028564453125, -1.342529296875, -1.20477294921875, -1.0670166015625, -0.92926025390625, -0.79150390625, -0.65374755859375, -0.5159912109375, -0.37823486328125, -0.240478515625, -0.10272216796875, 0.0350341796875, 0.17279052734375, 0.310546875, 0.44830322265625, 0.5860595703125, 0.72381591796875, 0.861572265625, 0.99932861328125, 1.1370849609375, 1.27484130859375, 1.41259765625, 1.55035400390625, 1.6881103515625, 1.82586669921875, 1.963623046875, 2.10137939453125, 2.2391357421875, 2.37689208984375, 2.5146484375, 2.65240478515625, 2.7901611328125, 2.92791748046875, 3.065673828125, 3.20343017578125, 3.3411865234375, 3.47894287109375, 3.61669921875, 3.75445556640625, 3.8922119140625, 4.02996826171875, 4.167724609375, 4.30548095703125, 4.4432373046875, 4.58099365234375, 4.71875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 3.0, 4.0, 4.0, 5.0, 9.0, 6.0, 12.0, 17.0, 9.0, 20.0, 23.0, 30.0, 42.0, 53.0, 67.0, 81.0, 106.0, 180.0, 190.0, 269.0, 479.0, 2127.0, 48822.0, 2063734.0, 2026478.0, 47790.0, 2118.0, 448.0, 275.0, 205.0, 136.0, 100.0, 106.0, 66.0, 62.0, 49.0, 34.0, 17.0, 28.0, 10.0, 13.0, 16.0, 10.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-20.890625, -20.293701171875, -19.69677734375, -19.099853515625, -18.5029296875, -17.906005859375, -17.30908203125, -16.712158203125, -16.115234375, -15.518310546875, -14.92138671875, -14.324462890625, -13.7275390625, -13.130615234375, -12.53369140625, -11.936767578125, -11.33984375, -10.742919921875, -10.14599609375, -9.549072265625, -8.9521484375, -8.355224609375, -7.75830078125, -7.161376953125, -6.564453125, -5.967529296875, -5.37060546875, -4.773681640625, -4.1767578125, -3.579833984375, -2.98291015625, -2.385986328125, -1.7890625, -1.192138671875, -0.59521484375, 0.001708984375, 0.5986328125, 1.195556640625, 1.79248046875, 2.389404296875, 2.986328125, 3.583251953125, 4.18017578125, 4.777099609375, 5.3740234375, 5.970947265625, 6.56787109375, 7.164794921875, 7.76171875, 8.358642578125, 8.95556640625, 9.552490234375, 10.1494140625, 10.746337890625, 11.34326171875, 11.940185546875, 12.537109375, 13.134033203125, 13.73095703125, 14.327880859375, 14.9248046875, 15.521728515625, 16.11865234375, 16.715576171875, 17.3125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 11.0, 12.0, 19.0, 29.0, 50.0, 52.0, 76.0, 95.0, 97.0, 97.0, 101.0, 81.0, 86.0, 58.0, 43.0, 41.0, 18.0, 19.0, 9.0, 8.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.57284927368164, -13.711023330688477, -12.849196434020996, -11.987370491027832, -11.125543594360352, -10.263717651367188, -9.401891708374023, -8.54006576538086, -7.678238868713379, -6.816412448883057, -5.954586029052734, -5.09276008605957, -4.230933666229248, -3.369107246398926, -2.5072813034057617, -1.6454548835754395, -0.7836284637451172, 0.07819783687591553, 0.9400241374969482, 1.8018503189086914, 2.6636767387390137, 3.525503158569336, 4.3873291015625, 5.249155521392822, 6.1109819412231445, 6.972808361053467, 7.834634780883789, 8.696460723876953, 9.558286666870117, 10.420113563537598, 11.281939506530762, 12.143766403198242, 13.005592346191406, 13.86741828918457, 14.72924518585205, 15.591071128845215, 16.452898025512695, 17.31472396850586, 18.176549911499023, 19.038375854492188, 19.900203704833984, 20.76202964782715, 21.623855590820312, 22.48568344116211, 23.347509384155273, 24.209335327148438, 25.0711612701416, 25.932987213134766, 26.79481315612793, 27.656639099121094, 28.518465042114258, 29.380290985107422, 30.24211883544922, 31.103944778442383, 31.965770721435547, 32.827598571777344, 33.689422607421875, 34.55125045776367, 35.4130744934082, 36.27490234375, 37.13672637939453, 37.99855422973633, 38.860382080078125, 39.722206115722656, 40.58403396606445]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 8.0, 13.0, 11.0, 13.0, 19.0, 16.0, 24.0, 31.0, 39.0, 28.0, 40.0, 34.0, 40.0, 29.0, 35.0, 39.0, 41.0, 45.0, 43.0, 36.0, 36.0, 36.0, 32.0, 37.0, 29.0, 30.0, 18.0, 26.0, 21.0, 23.0, 19.0, 19.0, 17.0, 13.0, 14.0, 11.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.84534454345703, -16.25760269165039, -15.669862747192383, -15.082121849060059, -14.494380950927734, -13.906639099121094, -13.31889820098877, -12.731157302856445, -12.143416404724121, -11.555675506591797, -10.967934608459473, -10.380193710327148, -9.792451858520508, -9.2047119140625, -8.61697006225586, -8.029229164123535, -7.441488265991211, -6.853747367858887, -6.2660064697265625, -5.67826509475708, -5.090524196624756, -4.502783298492432, -3.9150421619415283, -3.327301025390625, -2.739560127258301, -2.1518192291259766, -1.5640780925750732, -0.9763370752334595, -0.3885960578918457, 0.19914484024047852, 0.7868859767913818, 1.3746271133422852, 1.9623680114746094, 2.5501089096069336, 3.137850046157837, 3.7255911827087402, 4.3133320808410645, 4.901072978973389, 5.488814353942871, 6.076555252075195, 6.6642961502075195, 7.252037048339844, 7.839777946472168, 8.427518844604492, 9.015260696411133, 9.60300064086914, 10.190742492675781, 10.778483390808105, 11.36622428894043, 11.953965187072754, 12.541706085205078, 13.129446983337402, 13.717187881469727, 14.304929733276367, 14.892670631408691, 15.480411529541016, 16.068153381347656, 16.655895233154297, 17.243635177612305, 17.831377029418945, 18.419116973876953, 19.006858825683594, 19.5945987701416, 20.182340621948242, 20.77008056640625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 5.0, 5.0, 4.0, 6.0, 4.0, 15.0, 13.0, 9.0, 13.0, 21.0, 19.0, 21.0, 22.0, 28.0, 28.0, 29.0, 40.0, 41.0, 39.0, 34.0, 38.0, 36.0, 40.0, 52.0, 49.0, 30.0, 34.0, 41.0, 23.0, 43.0, 24.0, 27.0, 27.0, 20.0, 21.0, 21.0, 7.0, 15.0, 11.0, 11.0, 11.0, 4.0, 5.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.009765625, -2.917327880859375, -2.82489013671875, -2.732452392578125, -2.6400146484375, -2.547576904296875, -2.45513916015625, -2.362701416015625, -2.270263671875, -2.177825927734375, -2.08538818359375, -1.992950439453125, -1.9005126953125, -1.808074951171875, -1.71563720703125, -1.623199462890625, -1.53076171875, -1.438323974609375, -1.34588623046875, -1.253448486328125, -1.1610107421875, -1.068572998046875, -0.97613525390625, -0.883697509765625, -0.791259765625, -0.698822021484375, -0.60638427734375, -0.513946533203125, -0.4215087890625, -0.329071044921875, -0.23663330078125, -0.144195556640625, -0.0517578125, 0.040679931640625, 0.13311767578125, 0.225555419921875, 0.3179931640625, 0.410430908203125, 0.50286865234375, 0.595306396484375, 0.687744140625, 0.780181884765625, 0.87261962890625, 0.965057373046875, 1.0574951171875, 1.149932861328125, 1.24237060546875, 1.334808349609375, 1.42724609375, 1.519683837890625, 1.61212158203125, 1.704559326171875, 1.7969970703125, 1.889434814453125, 1.98187255859375, 2.074310302734375, 2.166748046875, 2.259185791015625, 2.35162353515625, 2.444061279296875, 2.5364990234375, 2.628936767578125, 2.72137451171875, 2.813812255859375, 2.90625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 8.0, 9.0, 15.0, 18.0, 28.0, 35.0, 46.0, 82.0, 100.0, 135.0, 169.0, 257.0, 367.0, 521.0, 711.0, 1027.0, 1399.0, 2039.0, 2880.0, 4206.0, 6170.0, 9056.0, 13300.0, 19858.0, 29832.0, 46297.0, 76004.0, 140500.0, 318096.0, 151202.0, 80029.0, 48319.0, 31165.0, 20645.0, 13750.0, 9312.0, 6396.0, 4379.0, 2987.0, 2135.0, 1449.0, 1062.0, 671.0, 566.0, 376.0, 258.0, 196.0, 139.0, 96.0, 80.0, 60.0, 42.0, 30.0, 16.0, 14.0, 11.0, 6.0, 3.0, 4.0, 2.0], "bins": [-0.1270751953125, -0.12317085266113281, -0.11926651000976562, -0.11536216735839844, -0.11145782470703125, -0.10755348205566406, -0.10364913940429688, -0.09974479675292969, -0.0958404541015625, -0.09193611145019531, -0.08803176879882812, -0.08412742614746094, -0.08022308349609375, -0.07631874084472656, -0.07241439819335938, -0.06851005554199219, -0.064605712890625, -0.06070137023925781, -0.056797027587890625, -0.05289268493652344, -0.04898834228515625, -0.04508399963378906, -0.041179656982421875, -0.03727531433105469, -0.0333709716796875, -0.029466629028320312, -0.025562286376953125, -0.021657943725585938, -0.01775360107421875, -0.013849258422851562, -0.009944915771484375, -0.0060405731201171875, -0.00213623046875, 0.0017681121826171875, 0.005672454833984375, 0.009576797485351562, 0.01348114013671875, 0.017385482788085938, 0.021289825439453125, 0.025194168090820312, 0.0290985107421875, 0.03300285339355469, 0.036907196044921875, 0.04081153869628906, 0.04471588134765625, 0.04862022399902344, 0.052524566650390625, 0.05642890930175781, 0.060333251953125, 0.06423759460449219, 0.06814193725585938, 0.07204627990722656, 0.07595062255859375, 0.07985496520996094, 0.08375930786132812, 0.08766365051269531, 0.0915679931640625, 0.09547233581542969, 0.09937667846679688, 0.10328102111816406, 0.10718536376953125, 0.11108970642089844, 0.11499404907226562, 0.11889839172363281, 0.122802734375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 8.0, 7.0, 11.0, 9.0, 17.0, 13.0, 6.0, 15.0, 29.0, 20.0, 20.0, 29.0, 39.0, 24.0, 29.0, 40.0, 35.0, 38.0, 43.0, 1067.0, 43.0, 44.0, 45.0, 41.0, 31.0, 43.0, 36.0, 31.0, 28.0, 30.0, 19.0, 21.0, 13.0, 16.0, 20.0, 10.0, 9.0, 9.0, 10.0, 9.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.15234375, -2.077606201171875, -2.00286865234375, -1.928131103515625, -1.8533935546875, -1.778656005859375, -1.70391845703125, -1.629180908203125, -1.554443359375, -1.479705810546875, -1.40496826171875, -1.330230712890625, -1.2554931640625, -1.180755615234375, -1.10601806640625, -1.031280517578125, -0.95654296875, -0.881805419921875, -0.80706787109375, -0.732330322265625, -0.6575927734375, -0.582855224609375, -0.50811767578125, -0.433380126953125, -0.358642578125, -0.283905029296875, -0.20916748046875, -0.134429931640625, -0.0596923828125, 0.015045166015625, 0.08978271484375, 0.164520263671875, 0.2392578125, 0.313995361328125, 0.38873291015625, 0.463470458984375, 0.5382080078125, 0.612945556640625, 0.68768310546875, 0.762420654296875, 0.837158203125, 0.911895751953125, 0.98663330078125, 1.061370849609375, 1.1361083984375, 1.210845947265625, 1.28558349609375, 1.360321044921875, 1.43505859375, 1.509796142578125, 1.58453369140625, 1.659271240234375, 1.7340087890625, 1.808746337890625, 1.88348388671875, 1.958221435546875, 2.032958984375, 2.107696533203125, 2.18243408203125, 2.257171630859375, 2.3319091796875, 2.406646728515625, 2.48138427734375, 2.556121826171875, 2.630859375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 18.0, 22.0, 45.0, 59.0, 123.0, 139.0, 274.0, 419.0, 586.0, 901.0, 1442.0, 2070.0, 3182.0, 4654.0, 6924.0, 10418.0, 15501.0, 24006.0, 38193.0, 62585.0, 112654.0, 1327267.0, 223824.0, 102073.0, 57916.0, 35462.0, 22266.0, 14770.0, 9567.0, 6591.0, 4403.0, 2931.0, 2032.0, 1295.0, 864.0, 601.0, 388.0, 237.0, 153.0, 103.0, 53.0, 29.0, 32.0, 15.0, 11.0, 10.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.07586669921875, -0.0735626220703125, -0.071258544921875, -0.0689544677734375, -0.066650390625, -0.0643463134765625, -0.062042236328125, -0.0597381591796875, -0.05743408203125, -0.0551300048828125, -0.052825927734375, -0.0505218505859375, -0.0482177734375, -0.0459136962890625, -0.043609619140625, -0.0413055419921875, -0.03900146484375, -0.0366973876953125, -0.034393310546875, -0.0320892333984375, -0.02978515625, -0.0274810791015625, -0.025177001953125, -0.0228729248046875, -0.02056884765625, -0.0182647705078125, -0.015960693359375, -0.0136566162109375, -0.0113525390625, -0.0090484619140625, -0.006744384765625, -0.0044403076171875, -0.00213623046875, 0.0001678466796875, 0.002471923828125, 0.0047760009765625, 0.007080078125, 0.0093841552734375, 0.011688232421875, 0.0139923095703125, 0.01629638671875, 0.0186004638671875, 0.020904541015625, 0.0232086181640625, 0.0255126953125, 0.0278167724609375, 0.030120849609375, 0.0324249267578125, 0.03472900390625, 0.0370330810546875, 0.039337158203125, 0.0416412353515625, 0.0439453125, 0.0462493896484375, 0.048553466796875, 0.0508575439453125, 0.05316162109375, 0.0554656982421875, 0.057769775390625, 0.0600738525390625, 0.0623779296875, 0.0646820068359375, 0.066986083984375, 0.0692901611328125, 0.07159423828125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 4.0, 7.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 19.0, 19.0, 0.0, 18.0, 27.0, 24.0, 46.0, 0.0, 56.0, 99.0, 303.0, 95.0, 80.0, 0.0, 41.0, 41.0, 23.0, 18.0, 0.0, 16.0, 10.0, 9.0, 6.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 0.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6689300537109375e-06, -1.6205012798309326e-06, -1.5720725059509277e-06, -1.5236437320709229e-06, -1.475214958190918e-06, -1.426786184310913e-06, -1.3783574104309082e-06, -1.3299286365509033e-06, -1.2814998626708984e-06, -1.2330710887908936e-06, -1.1846423149108887e-06, -1.1362135410308838e-06, -1.087784767150879e-06, -1.039355993270874e-06, -9.909272193908691e-07, -9.424984455108643e-07, -8.940696716308594e-07, -8.456408977508545e-07, -7.972121238708496e-07, -7.487833499908447e-07, -7.003545761108398e-07, -6.51925802230835e-07, -6.034970283508301e-07, -5.550682544708252e-07, -5.066394805908203e-07, -4.5821070671081543e-07, -4.0978193283081055e-07, -3.6135315895080566e-07, -3.129243850708008e-07, -2.644956111907959e-07, -2.1606683731079102e-07, -1.6763806343078613e-07, -1.1920928955078125e-07, -7.078051567077637e-08, -2.2351741790771484e-08, 2.60770320892334e-08, 7.450580596923828e-08, 1.2293457984924316e-07, 1.7136335372924805e-07, 2.1979212760925293e-07, 2.682209014892578e-07, 3.166496753692627e-07, 3.650784492492676e-07, 4.1350722312927246e-07, 4.6193599700927734e-07, 5.103647708892822e-07, 5.587935447692871e-07, 6.07222318649292e-07, 6.556510925292969e-07, 7.040798664093018e-07, 7.525086402893066e-07, 8.009374141693115e-07, 8.493661880493164e-07, 8.977949619293213e-07, 9.462237358093262e-07, 9.94652509689331e-07, 1.043081283569336e-06, 1.0915100574493408e-06, 1.1399388313293457e-06, 1.1883676052093506e-06, 1.2367963790893555e-06, 1.2852251529693604e-06, 1.3336539268493652e-06, 1.3820827007293701e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 2.0, 9.0, 11.0, 17.0, 19.0, 36.0, 42.0, 65.0, 117.0, 325.0, 2947.0, 173053.0, 864384.0, 6677.0, 420.0, 149.0, 83.0, 43.0, 21.0, 28.0, 24.0, 17.0, 13.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.962350845336914e-05, -2.8570182621479034e-05, -2.7516856789588928e-05, -2.6463530957698822e-05, -2.5410205125808716e-05, -2.435687929391861e-05, -2.3303553462028503e-05, -2.2250227630138397e-05, -2.119690179824829e-05, -2.0143575966358185e-05, -1.909025013446808e-05, -1.8036924302577972e-05, -1.6983598470687866e-05, -1.593027263879776e-05, -1.4876946806907654e-05, -1.3823620975017548e-05, -1.2770295143127441e-05, -1.1716969311237335e-05, -1.0663643479347229e-05, -9.610317647457123e-06, -8.556991815567017e-06, -7.50366598367691e-06, -6.450340151786804e-06, -5.397014319896698e-06, -4.343688488006592e-06, -3.2903626561164856e-06, -2.2370368242263794e-06, -1.1837109923362732e-06, -1.30385160446167e-07, 9.229406714439392e-07, 1.9762665033340454e-06, 3.0295923352241516e-06, 4.082918167114258e-06, 5.136243999004364e-06, 6.18956983089447e-06, 7.242895662784576e-06, 8.296221494674683e-06, 9.349547326564789e-06, 1.0402873158454895e-05, 1.1456198990345001e-05, 1.2509524822235107e-05, 1.3562850654125214e-05, 1.461617648601532e-05, 1.5669502317905426e-05, 1.6722828149795532e-05, 1.777615398168564e-05, 1.8829479813575745e-05, 1.988280564546585e-05, 2.0936131477355957e-05, 2.1989457309246063e-05, 2.304278314113617e-05, 2.4096108973026276e-05, 2.5149434804916382e-05, 2.6202760636806488e-05, 2.7256086468696594e-05, 2.83094123005867e-05, 2.9362738132476807e-05, 3.0416063964366913e-05, 3.146938979625702e-05, 3.2522715628147125e-05, 3.357604146003723e-05, 3.462936729192734e-05, 3.5682693123817444e-05, 3.673601895570755e-05, 3.7789344787597656e-05]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 13.0, 14.0, 25.0, 30.0, 44.0, 79.0, 89.0, 139.0, 246.0, 124.0, 66.0, 44.0, 28.0, 21.0, 19.0, 5.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.845655775578052e-07, -6.534622798426426e-07, -6.223590389708988e-07, -5.912557412557362e-07, -5.601524435405736e-07, -5.29049145825411e-07, -4.979458481102483e-07, -4.6684260723850457e-07, -4.3573930952334194e-07, -4.046360118081793e-07, -3.735327425147261e-07, -3.4242947322127293e-07, -3.113261755061103e-07, -2.802228777909477e-07, -2.491196084974945e-07, -2.1801632499318657e-07, -1.8691304148887866e-07, -1.5580975798457075e-07, -1.2470647448026284e-07, -9.360319097595493e-08, -6.249990747164702e-08, -3.139662396733911e-08, -2.9334046303119976e-10, 3.080994304127671e-08, 6.191322654558462e-08, 9.301651004989253e-08, 1.2411979355420044e-07, 1.5522307705850835e-07, 1.8632636056281626e-07, 2.1742964406712417e-07, 2.485329275714321e-07, 2.796361968648853e-07, 3.1073955142346676e-07, 3.418428491386294e-07, 3.729461184320826e-07, 4.040493877255358e-07, 4.351526854406984e-07, 4.6625598315586103e-07, 4.973592240276048e-07, 5.284625217427674e-07, 5.5956581945793e-07, 5.906691171730927e-07, 6.217724148882553e-07, 6.528756557599991e-07, 6.839789534751617e-07, 7.150822511903243e-07, 7.461854920620681e-07, 7.772887897772307e-07, 8.083920874923933e-07, 8.39495385207556e-07, 8.705986829227186e-07, 9.017019237944623e-07, 9.32805221509625e-07, 9.639085192247876e-07, 9.950117600965314e-07, 1.0261151146551128e-06, 1.0572183555268566e-06, 1.0883215963986004e-06, 1.1194249509571819e-06, 1.1505281918289256e-06, 1.1816314327006694e-06, 1.2127347872592509e-06, 1.2438380281309946e-06, 1.2749413826895761e-06, 1.30604462356132e-06]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 14.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 43.0, 0.0, 0.0, 86.0, 0.0, 0.0, 0.0, 201.0, 0.0, 0.0, 256.0, 0.0, 0.0, 0.0, 188.0, 0.0, 0.0, 107.0, 0.0, 0.0, 41.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 11.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.783513188362122e-07, -5.606561899185181e-07, -5.42961061000824e-07, -5.252659320831299e-07, -5.075708031654358e-07, -4.898756742477417e-07, -4.721805453300476e-07, -4.544854164123535e-07, -4.367902874946594e-07, -4.1909515857696533e-07, -4.0140002965927124e-07, -3.8370490074157715e-07, -3.6600977182388306e-07, -3.4831464290618896e-07, -3.3061951398849487e-07, -3.129243850708008e-07, -2.952292561531067e-07, -2.775341272354126e-07, -2.598389983177185e-07, -2.421438694000244e-07, -2.2444874048233032e-07, -2.0675361156463623e-07, -1.8905848264694214e-07, -1.7136335372924805e-07, -1.5366822481155396e-07, -1.3597309589385986e-07, -1.1827796697616577e-07, -1.0058283805847168e-07, -8.288770914077759e-08, -6.51925802230835e-08, -4.7497451305389404e-08, -2.9802322387695312e-08, -1.210719347000122e-08, 5.587935447692871e-09, 2.3283064365386963e-08, 4.0978193283081055e-08, 5.8673322200775146e-08, 7.636845111846924e-08, 9.406358003616333e-08, 1.1175870895385742e-07, 1.2945383787155151e-07, 1.471489667892456e-07, 1.648440957069397e-07, 1.825392246246338e-07, 2.0023435354232788e-07, 2.1792948246002197e-07, 2.3562461137771606e-07, 2.5331974029541016e-07, 2.7101486921310425e-07, 2.8870999813079834e-07, 3.0640512704849243e-07, 3.241002559661865e-07, 3.417953848838806e-07, 3.594905138015747e-07, 3.771856427192688e-07, 3.948807716369629e-07, 4.12575900554657e-07, 4.302710294723511e-07, 4.4796615839004517e-07, 4.6566128730773926e-07, 4.833564162254333e-07, 5.010515451431274e-07, 5.187466740608215e-07, 5.364418029785156e-07]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 5.0, 5.0, 4.0, 6.0, 4.0, 15.0, 13.0, 9.0, 13.0, 21.0, 19.0, 21.0, 22.0, 28.0, 28.0, 29.0, 40.0, 41.0, 39.0, 34.0, 38.0, 36.0, 40.0, 52.0, 49.0, 30.0, 34.0, 41.0, 23.0, 43.0, 24.0, 27.0, 27.0, 20.0, 21.0, 21.0, 7.0, 15.0, 11.0, 11.0, 11.0, 4.0, 5.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.009765625, -2.917327880859375, -2.82489013671875, -2.732452392578125, -2.6400146484375, -2.547576904296875, -2.45513916015625, -2.362701416015625, -2.270263671875, -2.177825927734375, -2.08538818359375, -1.992950439453125, -1.9005126953125, -1.808074951171875, -1.71563720703125, -1.623199462890625, -1.53076171875, -1.438323974609375, -1.34588623046875, -1.253448486328125, -1.1610107421875, -1.068572998046875, -0.97613525390625, -0.883697509765625, -0.791259765625, -0.698822021484375, -0.60638427734375, -0.513946533203125, -0.4215087890625, -0.329071044921875, -0.23663330078125, -0.144195556640625, -0.0517578125, 0.040679931640625, 0.13311767578125, 0.225555419921875, 0.3179931640625, 0.410430908203125, 0.50286865234375, 0.595306396484375, 0.687744140625, 0.780181884765625, 0.87261962890625, 0.965057373046875, 1.0574951171875, 1.149932861328125, 1.24237060546875, 1.334808349609375, 1.42724609375, 1.519683837890625, 1.61212158203125, 1.704559326171875, 1.7969970703125, 1.889434814453125, 1.98187255859375, 2.074310302734375, 2.166748046875, 2.259185791015625, 2.35162353515625, 2.444061279296875, 2.5364990234375, 2.628936767578125, 2.72137451171875, 2.813812255859375, 2.90625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 8.0, 15.0, 25.0, 41.0, 59.0, 78.0, 126.0, 204.0, 340.0, 516.0, 828.0, 1292.0, 2141.0, 3601.0, 5906.0, 9613.0, 17116.0, 31220.0, 59654.0, 118967.0, 242658.0, 271054.0, 134600.0, 67641.0, 34968.0, 18884.0, 10583.0, 6364.0, 3883.0, 2289.0, 1416.0, 947.0, 576.0, 353.0, 207.0, 142.0, 70.0, 58.0, 43.0, 25.0, 15.0, 9.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.66796875, -3.56036376953125, -3.4527587890625, -3.34515380859375, -3.237548828125, -3.12994384765625, -3.0223388671875, -2.91473388671875, -2.80712890625, -2.69952392578125, -2.5919189453125, -2.48431396484375, -2.376708984375, -2.26910400390625, -2.1614990234375, -2.05389404296875, -1.9462890625, -1.83868408203125, -1.7310791015625, -1.62347412109375, -1.515869140625, -1.40826416015625, -1.3006591796875, -1.19305419921875, -1.08544921875, -0.97784423828125, -0.8702392578125, -0.76263427734375, -0.655029296875, -0.54742431640625, -0.4398193359375, -0.33221435546875, -0.224609375, -0.11700439453125, -0.0093994140625, 0.09820556640625, 0.205810546875, 0.31341552734375, 0.4210205078125, 0.52862548828125, 0.63623046875, 0.74383544921875, 0.8514404296875, 0.95904541015625, 1.066650390625, 1.17425537109375, 1.2818603515625, 1.38946533203125, 1.4970703125, 1.60467529296875, 1.7122802734375, 1.81988525390625, 1.927490234375, 2.03509521484375, 2.1427001953125, 2.25030517578125, 2.35791015625, 2.46551513671875, 2.5731201171875, 2.68072509765625, 2.788330078125, 2.89593505859375, 3.0035400390625, 3.11114501953125, 3.21875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 7.0, 9.0, 9.0, 11.0, 20.0, 28.0, 16.0, 18.0, 26.0, 33.0, 35.0, 37.0, 33.0, 57.0, 64.0, 100.0, 102.0, 247.0, 1459.0, 236.0, 94.0, 69.0, 42.0, 62.0, 34.0, 30.0, 33.0, 28.0, 26.0, 16.0, 12.0, 8.0, 5.0, 5.0, 8.0, 10.0, 6.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.3515625, -10.031982421875, -9.71240234375, -9.392822265625, -9.0732421875, -8.753662109375, -8.43408203125, -8.114501953125, -7.794921875, -7.475341796875, -7.15576171875, -6.836181640625, -6.5166015625, -6.197021484375, -5.87744140625, -5.557861328125, -5.23828125, -4.918701171875, -4.59912109375, -4.279541015625, -3.9599609375, -3.640380859375, -3.32080078125, -3.001220703125, -2.681640625, -2.362060546875, -2.04248046875, -1.722900390625, -1.4033203125, -1.083740234375, -0.76416015625, -0.444580078125, -0.125, 0.194580078125, 0.51416015625, 0.833740234375, 1.1533203125, 1.472900390625, 1.79248046875, 2.112060546875, 2.431640625, 2.751220703125, 3.07080078125, 3.390380859375, 3.7099609375, 4.029541015625, 4.34912109375, 4.668701171875, 4.98828125, 5.307861328125, 5.62744140625, 5.947021484375, 6.2666015625, 6.586181640625, 6.90576171875, 7.225341796875, 7.544921875, 7.864501953125, 8.18408203125, 8.503662109375, 8.8232421875, 9.142822265625, 9.46240234375, 9.781982421875, 10.1015625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 12.0, 15.0, 16.0, 11.0, 23.0, 33.0, 55.0, 48.0, 78.0, 92.0, 151.0, 180.0, 339.0, 567.0, 1580.0, 9590.0, 176585.0, 2814374.0, 130781.0, 7943.0, 1446.0, 575.0, 336.0, 207.0, 149.0, 107.0, 80.0, 70.0, 52.0, 44.0, 25.0, 28.0, 23.0, 19.0, 10.0, 10.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-18.171875, -17.612060546875, -17.05224609375, -16.492431640625, -15.9326171875, -15.372802734375, -14.81298828125, -14.253173828125, -13.693359375, -13.133544921875, -12.57373046875, -12.013916015625, -11.4541015625, -10.894287109375, -10.33447265625, -9.774658203125, -9.21484375, -8.655029296875, -8.09521484375, -7.535400390625, -6.9755859375, -6.415771484375, -5.85595703125, -5.296142578125, -4.736328125, -4.176513671875, -3.61669921875, -3.056884765625, -2.4970703125, -1.937255859375, -1.37744140625, -0.817626953125, -0.2578125, 0.302001953125, 0.86181640625, 1.421630859375, 1.9814453125, 2.541259765625, 3.10107421875, 3.660888671875, 4.220703125, 4.780517578125, 5.34033203125, 5.900146484375, 6.4599609375, 7.019775390625, 7.57958984375, 8.139404296875, 8.69921875, 9.259033203125, 9.81884765625, 10.378662109375, 10.9384765625, 11.498291015625, 12.05810546875, 12.617919921875, 13.177734375, 13.737548828125, 14.29736328125, 14.857177734375, 15.4169921875, 15.976806640625, 16.53662109375, 17.096435546875, 17.65625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 26.0, 135.0, 303.0, 347.0, 159.0, 40.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.669567108154297, -15.727313995361328, -13.78506088256836, -11.84280776977539, -9.900554656982422, -7.958301544189453, -6.016048431396484, -4.073795318603516, -2.131542205810547, -0.18928909301757812, 1.7529640197753906, 3.6952171325683594, 5.637470245361328, 7.579723358154297, 9.521976470947266, 11.464229583740234, 13.406482696533203, 15.348735809326172, 17.29098892211914, 19.23324203491211, 21.175495147705078, 23.117748260498047, 25.060001373291016, 27.002254486083984, 28.944507598876953, 30.886760711669922, 32.82901382446289, 34.77126693725586, 36.71352005004883, 38.6557731628418, 40.598026275634766, 42.540279388427734, 44.48252868652344, 46.424781799316406, 48.367034912109375, 50.309288024902344, 52.25154113769531, 54.19379425048828, 56.13604736328125, 58.07830047607422, 60.02055358886719, 61.962806701660156, 63.905059814453125, 65.8473129272461, 67.78956604003906, 69.73181915283203, 71.674072265625, 73.61632537841797, 75.55857849121094, 77.5008316040039, 79.44308471679688, 81.38533782958984, 83.32759094238281, 85.26984405517578, 87.21209716796875, 89.15435028076172, 91.09660339355469, 93.03885650634766, 94.98110961914062, 96.9233627319336, 98.86561584472656, 100.80786895751953, 102.7501220703125, 104.69237518310547, 106.63462829589844]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 8.0, 3.0, 9.0, 11.0, 4.0, 10.0, 7.0, 12.0, 7.0, 19.0, 17.0, 19.0, 26.0, 18.0, 23.0, 19.0, 32.0, 32.0, 34.0, 32.0, 34.0, 28.0, 42.0, 31.0, 43.0, 33.0, 47.0, 37.0, 34.0, 41.0, 37.0, 28.0, 23.0, 27.0, 26.0, 21.0, 21.0, 20.0, 12.0, 8.0, 10.0, 9.0, 11.0, 8.0, 5.0, 8.0, 3.0, 7.0, 2.0, 1.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-23.31140899658203, -22.597003936767578, -21.882598876953125, -21.168193817138672, -20.45378875732422, -19.7393856048584, -19.024980545043945, -18.310575485229492, -17.59617042541504, -16.881765365600586, -16.167360305786133, -15.452956199645996, -14.738551139831543, -14.02414608001709, -13.309741973876953, -12.5953369140625, -11.880931854248047, -11.166526794433594, -10.45212173461914, -9.737717628479004, -9.02331256866455, -8.308907508850098, -7.594502925872803, -6.880098342895508, -6.165693283081055, -5.451288223266602, -4.736883640289307, -4.022479057312012, -3.3080739974975586, -2.5936691761016846, -1.8792643547058105, -1.1648597717285156, -0.4504566192626953, 0.2639482021331787, 0.9783530235290527, 1.6927578449249268, 2.407162666320801, 3.121567487716675, 3.835972309112549, 4.550376892089844, 5.264781951904297, 5.97918701171875, 6.693591594696045, 7.40799617767334, 8.122401237487793, 8.836806297302246, 9.551210403442383, 10.265615463256836, 10.980020523071289, 11.694425582885742, 12.408830642700195, 13.123234748840332, 13.837639808654785, 14.552044868469238, 15.266448974609375, 15.980854034423828, 16.69525909423828, 17.409664154052734, 18.124069213867188, 18.83847427368164, 19.552879333496094, 20.267282485961914, 20.981687545776367, 21.69609260559082, 22.410497665405273]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 2.0, 11.0, 10.0, 23.0, 15.0, 9.0, 19.0, 14.0, 25.0, 25.0, 28.0, 33.0, 30.0, 44.0, 28.0, 32.0, 42.0, 40.0, 40.0, 44.0, 39.0, 50.0, 45.0, 26.0, 33.0, 26.0, 31.0, 37.0, 28.0, 16.0, 25.0, 21.0, 17.0, 18.0, 7.0, 9.0, 9.0, 12.0, 6.0, 6.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.263671875, -3.16558837890625, -3.0675048828125, -2.96942138671875, -2.871337890625, -2.77325439453125, -2.6751708984375, -2.57708740234375, -2.47900390625, -2.38092041015625, -2.2828369140625, -2.18475341796875, -2.086669921875, -1.98858642578125, -1.8905029296875, -1.79241943359375, -1.6943359375, -1.59625244140625, -1.4981689453125, -1.40008544921875, -1.302001953125, -1.20391845703125, -1.1058349609375, -1.00775146484375, -0.90966796875, -0.81158447265625, -0.7135009765625, -0.61541748046875, -0.517333984375, -0.41925048828125, -0.3211669921875, -0.22308349609375, -0.125, -0.02691650390625, 0.0711669921875, 0.16925048828125, 0.267333984375, 0.36541748046875, 0.4635009765625, 0.56158447265625, 0.65966796875, 0.75775146484375, 0.8558349609375, 0.95391845703125, 1.052001953125, 1.15008544921875, 1.2481689453125, 1.34625244140625, 1.4443359375, 1.54241943359375, 1.6405029296875, 1.73858642578125, 1.836669921875, 1.93475341796875, 2.0328369140625, 2.13092041015625, 2.22900390625, 2.32708740234375, 2.4251708984375, 2.52325439453125, 2.621337890625, 2.71942138671875, 2.8175048828125, 2.91558837890625, 3.013671875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 1.0, 4.0, 4.0, 5.0, 6.0, 10.0, 15.0, 11.0, 18.0, 15.0, 21.0, 28.0, 32.0, 35.0, 69.0, 93.0, 219.0, 444.0, 1266.0, 4296.0, 17284.0, 75232.0, 357340.0, 1558397.0, 1678654.0, 392805.0, 81916.0, 18776.0, 4755.0, 1464.0, 469.0, 206.0, 121.0, 64.0, 31.0, 30.0, 27.0, 22.0, 16.0, 16.0, 12.0, 11.0, 9.0, 6.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.05859375, -5.86944580078125, -5.6802978515625, -5.49114990234375, -5.302001953125, -5.11285400390625, -4.9237060546875, -4.73455810546875, -4.54541015625, -4.35626220703125, -4.1671142578125, -3.97796630859375, -3.788818359375, -3.59967041015625, -3.4105224609375, -3.22137451171875, -3.0322265625, -2.84307861328125, -2.6539306640625, -2.46478271484375, -2.275634765625, -2.08648681640625, -1.8973388671875, -1.70819091796875, -1.51904296875, -1.32989501953125, -1.1407470703125, -0.95159912109375, -0.762451171875, -0.57330322265625, -0.3841552734375, -0.19500732421875, -0.005859375, 0.18328857421875, 0.3724365234375, 0.56158447265625, 0.750732421875, 0.93988037109375, 1.1290283203125, 1.31817626953125, 1.50732421875, 1.69647216796875, 1.8856201171875, 2.07476806640625, 2.263916015625, 2.45306396484375, 2.6422119140625, 2.83135986328125, 3.0205078125, 3.20965576171875, 3.3988037109375, 3.58795166015625, 3.777099609375, 3.96624755859375, 4.1553955078125, 4.34454345703125, 4.53369140625, 4.72283935546875, 4.9119873046875, 5.10113525390625, 5.290283203125, 5.47943115234375, 5.6685791015625, 5.85772705078125, 6.046875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 8.0, 3.0, 5.0, 8.0, 11.0, 16.0, 17.0, 35.0, 38.0, 52.0, 95.0, 94.0, 136.0, 162.0, 228.0, 309.0, 366.0, 435.0, 433.0, 353.0, 307.0, 222.0, 180.0, 134.0, 106.0, 83.0, 60.0, 51.0, 34.0, 18.0, 16.0, 14.0, 7.0, 9.0, 9.0, 10.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.256591796875, -5.08740234375, -4.918212890625, -4.7490234375, -4.579833984375, -4.41064453125, -4.241455078125, -4.072265625, -3.903076171875, -3.73388671875, -3.564697265625, -3.3955078125, -3.226318359375, -3.05712890625, -2.887939453125, -2.71875, -2.549560546875, -2.38037109375, -2.211181640625, -2.0419921875, -1.872802734375, -1.70361328125, -1.534423828125, -1.365234375, -1.196044921875, -1.02685546875, -0.857666015625, -0.6884765625, -0.519287109375, -0.35009765625, -0.180908203125, -0.01171875, 0.157470703125, 0.32666015625, 0.495849609375, 0.6650390625, 0.834228515625, 1.00341796875, 1.172607421875, 1.341796875, 1.510986328125, 1.68017578125, 1.849365234375, 2.0185546875, 2.187744140625, 2.35693359375, 2.526123046875, 2.6953125, 2.864501953125, 3.03369140625, 3.202880859375, 3.3720703125, 3.541259765625, 3.71044921875, 3.879638671875, 4.048828125, 4.218017578125, 4.38720703125, 4.556396484375, 4.7255859375, 4.894775390625, 5.06396484375, 5.233154296875, 5.40234375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 1.0, 11.0, 6.0, 10.0, 9.0, 14.0, 18.0, 18.0, 34.0, 46.0, 63.0, 98.0, 107.0, 149.0, 223.0, 379.0, 990.0, 27900.0, 3748230.0, 411894.0, 2638.0, 512.0, 277.0, 176.0, 117.0, 107.0, 78.0, 47.0, 30.0, 28.0, 19.0, 15.0, 10.0, 5.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.515625, -27.556396484375, -26.59716796875, -25.637939453125, -24.6787109375, -23.719482421875, -22.76025390625, -21.801025390625, -20.841796875, -19.882568359375, -18.92333984375, -17.964111328125, -17.0048828125, -16.045654296875, -15.08642578125, -14.127197265625, -13.16796875, -12.208740234375, -11.24951171875, -10.290283203125, -9.3310546875, -8.371826171875, -7.41259765625, -6.453369140625, -5.494140625, -4.534912109375, -3.57568359375, -2.616455078125, -1.6572265625, -0.697998046875, 0.26123046875, 1.220458984375, 2.1796875, 3.138916015625, 4.09814453125, 5.057373046875, 6.0166015625, 6.975830078125, 7.93505859375, 8.894287109375, 9.853515625, 10.812744140625, 11.77197265625, 12.731201171875, 13.6904296875, 14.649658203125, 15.60888671875, 16.568115234375, 17.52734375, 18.486572265625, 19.44580078125, 20.405029296875, 21.3642578125, 22.323486328125, 23.28271484375, 24.241943359375, 25.201171875, 26.160400390625, 27.11962890625, 28.078857421875, 29.0380859375, 29.997314453125, 30.95654296875, 31.915771484375, 32.875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 10.0, 29.0, 26.0, 50.0, 65.0, 98.0, 135.0, 123.0, 111.0, 104.0, 90.0, 59.0, 42.0, 28.0, 19.0, 9.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.44246482849121, -15.464035034179688, -14.485605239868164, -13.50717544555664, -12.528745651245117, -11.550315856933594, -10.571885108947754, -9.59345531463623, -8.615025520324707, -7.636595726013184, -6.65816593170166, -5.6797356605529785, -4.701305866241455, -3.7228760719299316, -2.74444580078125, -1.7660160064697266, -0.7875862121582031, 0.19084370136260986, 1.1692736148834229, 2.1477036476135254, 3.126133441925049, 4.104563236236572, 5.082993507385254, 6.061423301696777, 7.039853096008301, 8.018282890319824, 8.996712684631348, 9.975143432617188, 10.953573226928711, 11.932003021240234, 12.910432815551758, 13.888862609863281, 14.867294311523438, 15.845724105834961, 16.824153900146484, 17.802583694458008, 18.78101348876953, 19.759443283081055, 20.737873077392578, 21.716304779052734, 22.694732666015625, 23.67316246032715, 24.651592254638672, 25.630022048950195, 26.60845184326172, 27.586881637573242, 28.565311431884766, 29.543743133544922, 30.522172927856445, 31.50060272216797, 32.479034423828125, 33.457462310791016, 34.43589401245117, 35.41432189941406, 36.39275360107422, 37.37118148803711, 38.349613189697266, 39.32804489135742, 40.30647277832031, 41.28490447998047, 42.26333236694336, 43.241764068603516, 44.220191955566406, 45.19862365722656, 46.17705154418945]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 7.0, 7.0, 9.0, 16.0, 7.0, 8.0, 11.0, 17.0, 21.0, 25.0, 28.0, 36.0, 41.0, 39.0, 37.0, 51.0, 36.0, 43.0, 46.0, 40.0, 33.0, 34.0, 37.0, 43.0, 39.0, 41.0, 35.0, 29.0, 27.0, 29.0, 16.0, 19.0, 8.0, 17.0, 14.0, 15.0, 5.0, 9.0, 5.0, 3.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.608158111572266, -17.004281997680664, -16.400405883789062, -15.796528816223145, -15.192652702331543, -14.588775634765625, -13.984899520874023, -13.381023406982422, -12.77714729309082, -12.173271179199219, -11.5693941116333, -10.9655179977417, -10.361641883850098, -9.75776481628418, -9.153888702392578, -8.550012588500977, -7.946135520935059, -7.342258930206299, -6.738382816314697, -6.1345062255859375, -5.530630111694336, -4.926753520965576, -4.322876930236816, -3.719000816345215, -3.115124225616455, -2.5112478733062744, -1.9073714017868042, -1.303494930267334, -0.6996185779571533, -0.09574222564697266, 0.5081343650817871, 1.1120104789733887, 1.7158870697021484, 2.319763422012329, 2.9236397743225098, 3.5275163650512695, 4.131392478942871, 4.735269069671631, 5.339145660400391, 5.943021774291992, 6.546898365020752, 7.150774955749512, 7.754651069641113, 8.358528137207031, 8.962404251098633, 9.566280364990234, 10.170156478881836, 10.774032592773438, 11.377909660339355, 11.981785774230957, 12.585662841796875, 13.189538955688477, 13.793415069580078, 14.39729118347168, 15.001168251037598, 15.6050443649292, 16.208921432495117, 16.81279754638672, 17.41667366027832, 18.020549774169922, 18.624427795410156, 19.228303909301758, 19.83218002319336, 20.43605613708496, 21.039932250976562]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 12.0, 9.0, 6.0, 6.0, 14.0, 11.0, 17.0, 19.0, 22.0, 21.0, 29.0, 33.0, 37.0, 29.0, 46.0, 41.0, 36.0, 44.0, 41.0, 41.0, 44.0, 44.0, 36.0, 51.0, 46.0, 33.0, 28.0, 26.0, 29.0, 20.0, 27.0, 19.0, 16.0, 12.0, 12.0, 6.0, 13.0, 6.0, 2.0, 5.0, 3.0, 5.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.423828125, -3.318603515625, -3.21337890625, -3.108154296875, -3.0029296875, -2.897705078125, -2.79248046875, -2.687255859375, -2.58203125, -2.476806640625, -2.37158203125, -2.266357421875, -2.1611328125, -2.055908203125, -1.95068359375, -1.845458984375, -1.740234375, -1.635009765625, -1.52978515625, -1.424560546875, -1.3193359375, -1.214111328125, -1.10888671875, -1.003662109375, -0.8984375, -0.793212890625, -0.68798828125, -0.582763671875, -0.4775390625, -0.372314453125, -0.26708984375, -0.161865234375, -0.056640625, 0.048583984375, 0.15380859375, 0.259033203125, 0.3642578125, 0.469482421875, 0.57470703125, 0.679931640625, 0.78515625, 0.890380859375, 0.99560546875, 1.100830078125, 1.2060546875, 1.311279296875, 1.41650390625, 1.521728515625, 1.626953125, 1.732177734375, 1.83740234375, 1.942626953125, 2.0478515625, 2.153076171875, 2.25830078125, 2.363525390625, 2.46875, 2.573974609375, 2.67919921875, 2.784423828125, 2.8896484375, 2.994873046875, 3.10009765625, 3.205322265625, 3.310546875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 3.0, 6.0, 11.0, 13.0, 17.0, 34.0, 57.0, 80.0, 146.0, 217.0, 297.0, 492.0, 797.0, 1174.0, 1895.0, 3025.0, 4953.0, 8079.0, 13380.0, 23175.0, 41180.0, 77318.0, 162425.0, 390521.0, 151478.0, 72925.0, 39234.0, 22178.0, 13057.0, 7747.0, 4714.0, 2881.0, 1865.0, 1123.0, 702.0, 491.0, 323.0, 192.0, 128.0, 78.0, 55.0, 36.0, 30.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1668701171875, -0.16156578063964844, -0.15626144409179688, -0.1509571075439453, -0.14565277099609375, -0.1403484344482422, -0.13504409790039062, -0.12973976135253906, -0.1244354248046875, -0.11913108825683594, -0.11382675170898438, -0.10852241516113281, -0.10321807861328125, -0.09791374206542969, -0.09260940551757812, -0.08730506896972656, -0.082000732421875, -0.07669639587402344, -0.07139205932617188, -0.06608772277832031, -0.06078338623046875, -0.05547904968261719, -0.050174713134765625, -0.04487037658691406, -0.0395660400390625, -0.03426170349121094, -0.028957366943359375, -0.023653030395507812, -0.01834869384765625, -0.013044357299804688, -0.007740020751953125, -0.0024356842041015625, 0.00286865234375, 0.008172988891601562, 0.013477325439453125, 0.018781661987304688, 0.02408599853515625, 0.029390335083007812, 0.034694671630859375, 0.03999900817871094, 0.0453033447265625, 0.05060768127441406, 0.055912017822265625, 0.06121635437011719, 0.06652069091796875, 0.07182502746582031, 0.07712936401367188, 0.08243370056152344, 0.087738037109375, 0.09304237365722656, 0.09834671020507812, 0.10365104675292969, 0.10895538330078125, 0.11425971984863281, 0.11956405639648438, 0.12486839294433594, 0.1301727294921875, 0.13547706604003906, 0.14078140258789062, 0.1460857391357422, 0.15139007568359375, 0.1566944122314453, 0.16199874877929688, 0.16730308532714844, 0.172607421875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 10.0, 5.0, 14.0, 16.0, 20.0, 16.0, 16.0, 24.0, 26.0, 41.0, 24.0, 35.0, 25.0, 39.0, 43.0, 32.0, 35.0, 38.0, 1071.0, 58.0, 39.0, 30.0, 37.0, 35.0, 39.0, 33.0, 30.0, 21.0, 27.0, 21.0, 15.0, 24.0, 17.0, 13.0, 15.0, 11.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.321868896484375, -2.24530029296875, -2.168731689453125, -2.0921630859375, -2.015594482421875, -1.93902587890625, -1.862457275390625, -1.785888671875, -1.709320068359375, -1.63275146484375, -1.556182861328125, -1.4796142578125, -1.403045654296875, -1.32647705078125, -1.249908447265625, -1.17333984375, -1.096771240234375, -1.02020263671875, -0.943634033203125, -0.8670654296875, -0.790496826171875, -0.71392822265625, -0.637359619140625, -0.560791015625, -0.484222412109375, -0.40765380859375, -0.331085205078125, -0.2545166015625, -0.177947998046875, -0.10137939453125, -0.024810791015625, 0.0517578125, 0.128326416015625, 0.20489501953125, 0.281463623046875, 0.3580322265625, 0.434600830078125, 0.51116943359375, 0.587738037109375, 0.664306640625, 0.740875244140625, 0.81744384765625, 0.894012451171875, 0.9705810546875, 1.047149658203125, 1.12371826171875, 1.200286865234375, 1.27685546875, 1.353424072265625, 1.42999267578125, 1.506561279296875, 1.5831298828125, 1.659698486328125, 1.73626708984375, 1.812835693359375, 1.889404296875, 1.965972900390625, 2.04254150390625, 2.119110107421875, 2.1956787109375, 2.272247314453125, 2.34881591796875, 2.425384521484375, 2.501953125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 15.0, 11.0, 21.0, 29.0, 43.0, 82.0, 96.0, 162.0, 214.0, 316.0, 505.0, 757.0, 1124.0, 1721.0, 2512.0, 3885.0, 5842.0, 8522.0, 12767.0, 18938.0, 28907.0, 45055.0, 73164.0, 129309.0, 1355284.0, 166100.0, 88485.0, 53353.0, 33271.0, 22203.0, 14596.0, 9932.0, 6622.0, 4352.0, 2973.0, 1974.0, 1351.0, 935.0, 569.0, 395.0, 240.0, 165.0, 109.0, 80.0, 47.0, 35.0, 15.0, 22.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0721435546875, -0.06993579864501953, -0.06772804260253906, -0.0655202865600586, -0.06331253051757812, -0.061104774475097656, -0.05889701843261719, -0.05668926239013672, -0.05448150634765625, -0.05227375030517578, -0.05006599426269531, -0.047858238220214844, -0.045650482177734375, -0.043442726135253906, -0.04123497009277344, -0.03902721405029297, -0.0368194580078125, -0.03461170196533203, -0.03240394592285156, -0.030196189880371094, -0.027988433837890625, -0.025780677795410156, -0.023572921752929688, -0.02136516571044922, -0.01915740966796875, -0.01694965362548828, -0.014741897583007812, -0.012534141540527344, -0.010326385498046875, -0.008118629455566406, -0.0059108734130859375, -0.0037031173706054688, -0.001495361328125, 0.0007123947143554688, 0.0029201507568359375, 0.005127906799316406, 0.007335662841796875, 0.009543418884277344, 0.011751174926757812, 0.013958930969238281, 0.01616668701171875, 0.01837444305419922, 0.020582199096679688, 0.022789955139160156, 0.024997711181640625, 0.027205467224121094, 0.029413223266601562, 0.03162097930908203, 0.0338287353515625, 0.03603649139404297, 0.03824424743652344, 0.040452003479003906, 0.042659759521484375, 0.044867515563964844, 0.04707527160644531, 0.04928302764892578, 0.05149078369140625, 0.05369853973388672, 0.05590629577636719, 0.058114051818847656, 0.060321807861328125, 0.0625295639038086, 0.06473731994628906, 0.06694507598876953, 0.06915283203125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 4.0, 4.0, 9.0, 13.0, 14.0, 19.0, 19.0, 20.0, 19.0, 42.0, 38.0, 54.0, 104.0, 288.0, 0.0, 97.0, 61.0, 42.0, 26.0, 12.0, 19.0, 20.0, 14.0, 11.0, 8.0, 12.0, 10.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7881393432617188e-06, -1.730397343635559e-06, -1.6726553440093994e-06, -1.6149133443832397e-06, -1.55717134475708e-06, -1.4994293451309204e-06, -1.4416873455047607e-06, -1.383945345878601e-06, -1.3262033462524414e-06, -1.2684613466262817e-06, -1.210719347000122e-06, -1.1529773473739624e-06, -1.0952353477478027e-06, -1.037493348121643e-06, -9.797513484954834e-07, -9.220093488693237e-07, -8.642673492431641e-07, -8.065253496170044e-07, -7.487833499908447e-07, -6.910413503646851e-07, -6.332993507385254e-07, -5.755573511123657e-07, -5.178153514862061e-07, -4.600733518600464e-07, -4.023313522338867e-07, -3.4458935260772705e-07, -2.868473529815674e-07, -2.2910535335540771e-07, -1.7136335372924805e-07, -1.1362135410308838e-07, -5.587935447692871e-08, 1.862645149230957e-09, 5.960464477539063e-08, 1.1734664440155029e-07, 1.7508864402770996e-07, 2.3283064365386963e-07, 2.905726432800293e-07, 3.4831464290618896e-07, 4.0605664253234863e-07, 4.637986421585083e-07, 5.21540641784668e-07, 5.792826414108276e-07, 6.370246410369873e-07, 6.94766640663147e-07, 7.525086402893066e-07, 8.102506399154663e-07, 8.67992639541626e-07, 9.257346391677856e-07, 9.834766387939453e-07, 1.041218638420105e-06, 1.0989606380462646e-06, 1.1567026376724243e-06, 1.214444637298584e-06, 1.2721866369247437e-06, 1.3299286365509033e-06, 1.387670636177063e-06, 1.4454126358032227e-06, 1.5031546354293823e-06, 1.560896635055542e-06, 1.6186386346817017e-06, 1.6763806343078613e-06, 1.734122633934021e-06, 1.7918646335601807e-06, 1.8496066331863403e-06, 1.9073486328125e-06]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 11.0, 11.0, 7.0, 12.0, 25.0, 25.0, 26.0, 42.0, 107.0, 198.0, 915.0, 95491.0, 946601.0, 4428.0, 283.0, 128.0, 66.0, 38.0, 27.0, 26.0, 20.0, 13.0, 13.0, 11.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.309415817260742e-05, -4.1795894503593445e-05, -4.049763083457947e-05, -3.919936716556549e-05, -3.7901103496551514e-05, -3.660283982753754e-05, -3.530457615852356e-05, -3.400631248950958e-05, -3.2708048820495605e-05, -3.140978515148163e-05, -3.011152148246765e-05, -2.8813257813453674e-05, -2.7514994144439697e-05, -2.621673047542572e-05, -2.4918466806411743e-05, -2.3620203137397766e-05, -2.232193946838379e-05, -2.1023675799369812e-05, -1.9725412130355835e-05, -1.8427148461341858e-05, -1.712888479232788e-05, -1.5830621123313904e-05, -1.4532357454299927e-05, -1.323409378528595e-05, -1.1935830116271973e-05, -1.0637566447257996e-05, -9.339302778244019e-06, -8.041039109230042e-06, -6.7427754402160645e-06, -5.444511771202087e-06, -4.14624810218811e-06, -2.8479844331741333e-06, -1.5497207641601562e-06, -2.514570951461792e-07, 1.0468065738677979e-06, 2.345070242881775e-06, 3.643333911895752e-06, 4.941597580909729e-06, 6.239861249923706e-06, 7.538124918937683e-06, 8.83638858795166e-06, 1.0134652256965637e-05, 1.1432915925979614e-05, 1.2731179594993591e-05, 1.4029443264007568e-05, 1.5327706933021545e-05, 1.6625970602035522e-05, 1.79242342710495e-05, 1.9222497940063477e-05, 2.0520761609077454e-05, 2.181902527809143e-05, 2.3117288947105408e-05, 2.4415552616119385e-05, 2.5713816285133362e-05, 2.701207995414734e-05, 2.8310343623161316e-05, 2.9608607292175293e-05, 3.090687096118927e-05, 3.220513463020325e-05, 3.3503398299217224e-05, 3.48016619682312e-05, 3.609992563724518e-05, 3.7398189306259155e-05, 3.869645297527313e-05, 3.999471664428711e-05]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 25.0, 84.0, 299.0, 450.0, 101.0, 26.0, 16.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.428028998721857e-06, -5.329571649781428e-06, -5.231113846093649e-06, -5.132656497153221e-06, -5.0341986934654415e-06, -4.935741344525013e-06, -4.837283995584585e-06, -4.7388261918968055e-06, -4.640368842956377e-06, -4.541911494015949e-06, -4.44345369032817e-06, -4.344996341387741e-06, -4.246538992447313e-06, -4.148081188759534e-06, -4.049623839819105e-06, -3.951166036131326e-06, -3.852708687190898e-06, -3.754251110876794e-06, -3.65579353456269e-06, -3.557336185622262e-06, -3.458878609308158e-06, -3.3604210329940543e-06, -3.261963684053626e-06, -3.163506107739522e-06, -3.0650485314254183e-06, -2.9665909551113145e-06, -2.8681333787972108e-06, -2.7696760298567824e-06, -2.6712184535426786e-06, -2.572760877228575e-06, -2.4743035282881465e-06, -2.3758459519740427e-06, -2.277388375659939e-06, -2.178930799345835e-06, -2.0804732230317313e-06, -1.982015874091303e-06, -1.8835582977771992e-06, -1.7851007214630954e-06, -1.6866432588358293e-06, -1.5881857962085633e-06, -1.4897282198944595e-06, -1.3912706435803557e-06, -1.2928131809530896e-06, -1.1943557183258235e-06, -1.0958981420117198e-06, -9.97440565697616e-07, -8.989831030703499e-07, -8.00525583599665e-07, -7.0206806412898e-07, -6.036105446582951e-07, -5.051530251876102e-07, -4.0669550571692525e-07, -3.082379862462403e-07, -2.097804667755554e-07, -1.1132294730487047e-07, -1.2865427834185539e-08, 8.559209163649939e-08, 1.8404961110718432e-07, 2.8250713057786925e-07, 3.809646500485542e-07, 4.794221695192391e-07, 5.77879688989924e-07, 6.76337208460609e-07, 7.747947279312939e-07, 8.732522474019788e-07]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 10.0, 0.0, 0.0, 17.0, 0.0, 31.0, 0.0, 0.0, 63.0, 0.0, 0.0, 87.0, 0.0, 151.0, 0.0, 0.0, 249.0, 0.0, 172.0, 0.0, 0.0, 116.0, 0.0, 59.0, 0.0, 0.0, 31.0, 0.0, 16.0, 0.0, 0.0, 7.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.323680281639099e-07, -6.09084963798523e-07, -5.85801899433136e-07, -5.62518835067749e-07, -5.392357707023621e-07, -5.159527063369751e-07, -4.926696419715881e-07, -4.6938657760620117e-07, -4.461035132408142e-07, -4.2282044887542725e-07, -3.995373845100403e-07, -3.762543201446533e-07, -3.5297125577926636e-07, -3.296881914138794e-07, -3.0640512704849243e-07, -2.8312206268310547e-07, -2.598389983177185e-07, -2.3655593395233154e-07, -2.1327286958694458e-07, -1.8998980522155762e-07, -1.6670674085617065e-07, -1.434236764907837e-07, -1.2014061212539673e-07, -9.685754776000977e-08, -7.35744833946228e-08, -5.029141902923584e-08, -2.7008354663848877e-08, -3.725290298461914e-09, 1.955777406692505e-08, 4.284083843231201e-08, 6.612390279769897e-08, 8.940696716308594e-08, 1.126900315284729e-07, 1.3597309589385986e-07, 1.5925616025924683e-07, 1.825392246246338e-07, 2.0582228899002075e-07, 2.2910535335540771e-07, 2.523884177207947e-07, 2.7567148208618164e-07, 2.989545464515686e-07, 3.2223761081695557e-07, 3.4552067518234253e-07, 3.688037395477295e-07, 3.9208680391311646e-07, 4.153698682785034e-07, 4.386529326438904e-07, 4.6193599700927734e-07, 4.852190613746643e-07, 5.085021257400513e-07, 5.317851901054382e-07, 5.550682544708252e-07, 5.783513188362122e-07, 6.016343832015991e-07, 6.249174475669861e-07, 6.48200511932373e-07, 6.7148357629776e-07, 6.94766640663147e-07, 7.180497050285339e-07, 7.413327693939209e-07, 7.646158337593079e-07, 7.878988981246948e-07, 8.111819624900818e-07, 8.344650268554688e-07]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 12.0, 9.0, 6.0, 6.0, 14.0, 11.0, 17.0, 19.0, 22.0, 21.0, 29.0, 33.0, 37.0, 29.0, 46.0, 41.0, 36.0, 44.0, 41.0, 41.0, 44.0, 44.0, 36.0, 51.0, 46.0, 33.0, 28.0, 26.0, 29.0, 20.0, 27.0, 19.0, 16.0, 12.0, 12.0, 6.0, 13.0, 6.0, 2.0, 5.0, 3.0, 5.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.423828125, -3.318603515625, -3.21337890625, -3.108154296875, -3.0029296875, -2.897705078125, -2.79248046875, -2.687255859375, -2.58203125, -2.476806640625, -2.37158203125, -2.266357421875, -2.1611328125, -2.055908203125, -1.95068359375, -1.845458984375, -1.740234375, -1.635009765625, -1.52978515625, -1.424560546875, -1.3193359375, -1.214111328125, -1.10888671875, -1.003662109375, -0.8984375, -0.793212890625, -0.68798828125, -0.582763671875, -0.4775390625, -0.372314453125, -0.26708984375, -0.161865234375, -0.056640625, 0.048583984375, 0.15380859375, 0.259033203125, 0.3642578125, 0.469482421875, 0.57470703125, 0.679931640625, 0.78515625, 0.890380859375, 0.99560546875, 1.100830078125, 1.2060546875, 1.311279296875, 1.41650390625, 1.521728515625, 1.626953125, 1.732177734375, 1.83740234375, 1.942626953125, 2.0478515625, 2.153076171875, 2.25830078125, 2.363525390625, 2.46875, 2.573974609375, 2.67919921875, 2.784423828125, 2.8896484375, 2.994873046875, 3.10009765625, 3.205322265625, 3.310546875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 12.0, 11.0, 23.0, 29.0, 39.0, 89.0, 141.0, 250.0, 483.0, 892.0, 1678.0, 3225.0, 5868.0, 10711.0, 19818.0, 37530.0, 76320.0, 187263.0, 424203.0, 146922.0, 63672.0, 31860.0, 17197.0, 9187.0, 5142.0, 2787.0, 1472.0, 766.0, 425.0, 193.0, 120.0, 80.0, 47.0, 32.0, 13.0, 19.0, 7.0, 3.0, 2.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.62890625, -4.490234375, -4.3515625, -4.212890625, -4.07421875, -3.935546875, -3.796875, -3.658203125, -3.51953125, -3.380859375, -3.2421875, -3.103515625, -2.96484375, -2.826171875, -2.6875, -2.548828125, -2.41015625, -2.271484375, -2.1328125, -1.994140625, -1.85546875, -1.716796875, -1.578125, -1.439453125, -1.30078125, -1.162109375, -1.0234375, -0.884765625, -0.74609375, -0.607421875, -0.46875, -0.330078125, -0.19140625, -0.052734375, 0.0859375, 0.224609375, 0.36328125, 0.501953125, 0.640625, 0.779296875, 0.91796875, 1.056640625, 1.1953125, 1.333984375, 1.47265625, 1.611328125, 1.75, 1.888671875, 2.02734375, 2.166015625, 2.3046875, 2.443359375, 2.58203125, 2.720703125, 2.859375, 2.998046875, 3.13671875, 3.275390625, 3.4140625, 3.552734375, 3.69140625, 3.830078125, 3.96875, 4.107421875, 4.24609375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 14.0, 15.0, 15.0, 14.0, 27.0, 20.0, 27.0, 34.0, 42.0, 43.0, 58.0, 50.0, 82.0, 130.0, 231.0, 1528.0, 174.0, 103.0, 68.0, 59.0, 50.0, 34.0, 35.0, 32.0, 20.0, 21.0, 26.0, 19.0, 17.0, 10.0, 5.0, 8.0, 8.0, 2.0, 6.0, 3.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.4375, -10.06884765625, -9.7001953125, -9.33154296875, -8.962890625, -8.59423828125, -8.2255859375, -7.85693359375, -7.48828125, -7.11962890625, -6.7509765625, -6.38232421875, -6.013671875, -5.64501953125, -5.2763671875, -4.90771484375, -4.5390625, -4.17041015625, -3.8017578125, -3.43310546875, -3.064453125, -2.69580078125, -2.3271484375, -1.95849609375, -1.58984375, -1.22119140625, -0.8525390625, -0.48388671875, -0.115234375, 0.25341796875, 0.6220703125, 0.99072265625, 1.359375, 1.72802734375, 2.0966796875, 2.46533203125, 2.833984375, 3.20263671875, 3.5712890625, 3.93994140625, 4.30859375, 4.67724609375, 5.0458984375, 5.41455078125, 5.783203125, 6.15185546875, 6.5205078125, 6.88916015625, 7.2578125, 7.62646484375, 7.9951171875, 8.36376953125, 8.732421875, 9.10107421875, 9.4697265625, 9.83837890625, 10.20703125, 10.57568359375, 10.9443359375, 11.31298828125, 11.681640625, 12.05029296875, 12.4189453125, 12.78759765625, 13.15625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 12.0, 9.0, 11.0, 20.0, 21.0, 24.0, 39.0, 43.0, 54.0, 51.0, 104.0, 152.0, 244.0, 622.0, 3428.0, 81391.0, 2859049.0, 192283.0, 6425.0, 812.0, 281.0, 180.0, 114.0, 71.0, 55.0, 44.0, 25.0, 37.0, 21.0, 22.0, 21.0, 10.0, 4.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.203125, -27.4111328125, -26.619140625, -25.8271484375, -25.03515625, -24.2431640625, -23.451171875, -22.6591796875, -21.8671875, -21.0751953125, -20.283203125, -19.4912109375, -18.69921875, -17.9072265625, -17.115234375, -16.3232421875, -15.53125, -14.7392578125, -13.947265625, -13.1552734375, -12.36328125, -11.5712890625, -10.779296875, -9.9873046875, -9.1953125, -8.4033203125, -7.611328125, -6.8193359375, -6.02734375, -5.2353515625, -4.443359375, -3.6513671875, -2.859375, -2.0673828125, -1.275390625, -0.4833984375, 0.30859375, 1.1005859375, 1.892578125, 2.6845703125, 3.4765625, 4.2685546875, 5.060546875, 5.8525390625, 6.64453125, 7.4365234375, 8.228515625, 9.0205078125, 9.8125, 10.6044921875, 11.396484375, 12.1884765625, 12.98046875, 13.7724609375, 14.564453125, 15.3564453125, 16.1484375, 16.9404296875, 17.732421875, 18.5244140625, 19.31640625, 20.1083984375, 20.900390625, 21.6923828125, 22.484375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [2.0, 20.0, 63.0, 241.0, 362.0, 236.0, 83.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.559069633483887, -7.432194709777832, -5.305319309234619, -3.1784439086914062, -1.0515689849853516, 1.0753059387207031, 3.202181816101074, 5.329056739807129, 7.455931663513184, 9.582806587219238, 11.70968246459961, 13.836557388305664, 15.963432312011719, 18.090307235717773, 20.217182159423828, 22.344058990478516, 24.470932006835938, 26.597806930541992, 28.724681854248047, 30.851558685302734, 32.978431701660156, 35.105308532714844, 37.23218536376953, 39.35905838012695, 41.48593521118164, 43.61281204223633, 45.73968505859375, 47.86656188964844, 49.99343490600586, 52.12031173706055, 54.24718475341797, 56.374061584472656, 58.500938415527344, 60.62781524658203, 62.75468826293945, 64.88156127929688, 67.00843811035156, 69.13531494140625, 71.26219177246094, 73.38906860351562, 75.51593780517578, 77.64281463623047, 79.76969146728516, 81.89656066894531, 84.0234375, 86.15031433105469, 88.27719116210938, 90.40406799316406, 92.53094482421875, 94.65782165527344, 96.78469848632812, 98.91156768798828, 101.03844451904297, 103.16532135009766, 105.29219818115234, 107.4190673828125, 109.54594421386719, 111.67282104492188, 113.79969787597656, 115.92656707763672, 118.0534439086914, 120.1803207397461, 122.30719757080078, 124.43406677246094, 126.56094360351562]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 6.0, 13.0, 8.0, 8.0, 11.0, 25.0, 19.0, 33.0, 40.0, 31.0, 45.0, 42.0, 51.0, 50.0, 47.0, 47.0, 42.0, 54.0, 41.0, 49.0, 39.0, 58.0, 42.0, 41.0, 35.0, 14.0, 20.0, 20.0, 14.0, 9.0, 15.0, 11.0, 5.0, 4.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.96651077270508, -31.773164749145508, -30.579818725585938, -29.386472702026367, -28.193126678466797, -26.99978256225586, -25.80643653869629, -24.61309051513672, -23.41974449157715, -22.226398468017578, -21.033052444458008, -19.839706420898438, -18.6463623046875, -17.453014373779297, -16.25967025756836, -15.066324234008789, -13.872978210449219, -12.679632186889648, -11.486286163330078, -10.292941093444824, -9.099595069885254, -7.906249046325684, -6.7129034996032715, -5.519557952880859, -4.326211929321289, -3.132866144180298, -1.9395203590393066, -0.7461745738983154, 0.4471712112426758, 1.640517234802246, 2.833862781524658, 4.02720832824707, 5.220558166503906, 6.413904190063477, 7.607249736785889, 8.8005952835083, 9.993941307067871, 11.187287330627441, 12.380632400512695, 13.573978424072266, 14.767324447631836, 15.960670471191406, 17.154016494750977, 18.347362518310547, 19.540706634521484, 20.734054565429688, 21.927398681640625, 23.120744705200195, 24.314090728759766, 25.507436752319336, 26.700782775878906, 27.894128799438477, 29.087474822998047, 30.280818939208984, 31.474164962768555, 32.667510986328125, 33.86085510253906, 35.05419921875, 36.2475471496582, 37.44089126586914, 38.634239196777344, 39.82758331298828, 41.020931243896484, 42.21427536010742, 43.407623291015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 13.0, 6.0, 11.0, 9.0, 15.0, 19.0, 22.0, 16.0, 27.0, 20.0, 35.0, 28.0, 40.0, 32.0, 51.0, 34.0, 46.0, 46.0, 37.0, 44.0, 54.0, 42.0, 39.0, 40.0, 39.0, 20.0, 33.0, 25.0, 22.0, 19.0, 21.0, 13.0, 21.0, 8.0, 5.0, 10.0, 8.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.80859375, -3.694366455078125, -3.58013916015625, -3.465911865234375, -3.3516845703125, -3.237457275390625, -3.12322998046875, -3.009002685546875, -2.894775390625, -2.780548095703125, -2.66632080078125, -2.552093505859375, -2.4378662109375, -2.323638916015625, -2.20941162109375, -2.095184326171875, -1.98095703125, -1.866729736328125, -1.75250244140625, -1.638275146484375, -1.5240478515625, -1.409820556640625, -1.29559326171875, -1.181365966796875, -1.067138671875, -0.952911376953125, -0.83868408203125, -0.724456787109375, -0.6102294921875, -0.496002197265625, -0.38177490234375, -0.267547607421875, -0.1533203125, -0.039093017578125, 0.07513427734375, 0.189361572265625, 0.3035888671875, 0.417816162109375, 0.53204345703125, 0.646270751953125, 0.760498046875, 0.874725341796875, 0.98895263671875, 1.103179931640625, 1.2174072265625, 1.331634521484375, 1.44586181640625, 1.560089111328125, 1.67431640625, 1.788543701171875, 1.90277099609375, 2.016998291015625, 2.1312255859375, 2.245452880859375, 2.35968017578125, 2.473907470703125, 2.588134765625, 2.702362060546875, 2.81658935546875, 2.930816650390625, 3.0450439453125, 3.159271240234375, 3.27349853515625, 3.387725830078125, 3.501953125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 1.0, 2.0, 3.0, 5.0, 12.0, 24.0, 33.0, 46.0, 63.0, 107.0, 176.0, 262.0, 437.0, 712.0, 1151.0, 2016.0, 3609.0, 6309.0, 11640.0, 22134.0, 42380.0, 84015.0, 165869.0, 319769.0, 580139.0, 896443.0, 874474.0, 554312.0, 304811.0, 157052.0, 79355.0, 40402.0, 21117.0, 11306.0, 6004.0, 3351.0, 1881.0, 1142.0, 660.0, 390.0, 236.0, 169.0, 90.0, 61.0, 32.0, 25.0, 19.0, 16.0, 15.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.884765625, -2.7972412109375, -2.709716796875, -2.6221923828125, -2.53466796875, -2.4471435546875, -2.359619140625, -2.2720947265625, -2.1845703125, -2.0970458984375, -2.009521484375, -1.9219970703125, -1.83447265625, -1.7469482421875, -1.659423828125, -1.5718994140625, -1.484375, -1.3968505859375, -1.309326171875, -1.2218017578125, -1.13427734375, -1.0467529296875, -0.959228515625, -0.8717041015625, -0.7841796875, -0.6966552734375, -0.609130859375, -0.5216064453125, -0.43408203125, -0.3465576171875, -0.259033203125, -0.1715087890625, -0.083984375, 0.0035400390625, 0.091064453125, 0.1785888671875, 0.26611328125, 0.3536376953125, 0.441162109375, 0.5286865234375, 0.6162109375, 0.7037353515625, 0.791259765625, 0.8787841796875, 0.96630859375, 1.0538330078125, 1.141357421875, 1.2288818359375, 1.31640625, 1.4039306640625, 1.491455078125, 1.5789794921875, 1.66650390625, 1.7540283203125, 1.841552734375, 1.9290771484375, 2.0166015625, 2.1041259765625, 2.191650390625, 2.2791748046875, 2.36669921875, 2.4542236328125, 2.541748046875, 2.6292724609375, 2.716796875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 7.0, 7.0, 22.0, 16.0, 24.0, 36.0, 63.0, 77.0, 86.0, 128.0, 152.0, 228.0, 268.0, 341.0, 420.0, 464.0, 388.0, 316.0, 255.0, 172.0, 147.0, 101.0, 88.0, 74.0, 55.0, 29.0, 22.0, 24.0, 16.0, 5.0, 8.0, 6.0, 4.0, 5.0, 1.0, 6.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.79296875, -6.60552978515625, -6.4180908203125, -6.23065185546875, -6.043212890625, -5.85577392578125, -5.6683349609375, -5.48089599609375, -5.29345703125, -5.10601806640625, -4.9185791015625, -4.73114013671875, -4.543701171875, -4.35626220703125, -4.1688232421875, -3.98138427734375, -3.7939453125, -3.60650634765625, -3.4190673828125, -3.23162841796875, -3.044189453125, -2.85675048828125, -2.6693115234375, -2.48187255859375, -2.29443359375, -2.10699462890625, -1.9195556640625, -1.73211669921875, -1.544677734375, -1.35723876953125, -1.1697998046875, -0.98236083984375, -0.794921875, -0.60748291015625, -0.4200439453125, -0.23260498046875, -0.045166015625, 0.14227294921875, 0.3297119140625, 0.51715087890625, 0.70458984375, 0.89202880859375, 1.0794677734375, 1.26690673828125, 1.454345703125, 1.64178466796875, 1.8292236328125, 2.01666259765625, 2.2041015625, 2.39154052734375, 2.5789794921875, 2.76641845703125, 2.953857421875, 3.14129638671875, 3.3287353515625, 3.51617431640625, 3.70361328125, 3.89105224609375, 4.0784912109375, 4.26593017578125, 4.453369140625, 4.64080810546875, 4.8282470703125, 5.01568603515625, 5.203125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 7.0, 6.0, 5.0, 7.0, 19.0, 24.0, 18.0, 41.0, 75.0, 64.0, 94.0, 151.0, 210.0, 339.0, 657.0, 2930.0, 119523.0, 3659400.0, 402562.0, 6139.0, 807.0, 413.0, 232.0, 153.0, 109.0, 79.0, 71.0, 37.0, 28.0, 23.0, 16.0, 12.0, 3.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.095458984375, -18.37841796875, -17.661376953125, -16.9443359375, -16.227294921875, -15.51025390625, -14.793212890625, -14.076171875, -13.359130859375, -12.64208984375, -11.925048828125, -11.2080078125, -10.490966796875, -9.77392578125, -9.056884765625, -8.33984375, -7.622802734375, -6.90576171875, -6.188720703125, -5.4716796875, -4.754638671875, -4.03759765625, -3.320556640625, -2.603515625, -1.886474609375, -1.16943359375, -0.452392578125, 0.2646484375, 0.981689453125, 1.69873046875, 2.415771484375, 3.1328125, 3.849853515625, 4.56689453125, 5.283935546875, 6.0009765625, 6.718017578125, 7.43505859375, 8.152099609375, 8.869140625, 9.586181640625, 10.30322265625, 11.020263671875, 11.7373046875, 12.454345703125, 13.17138671875, 13.888427734375, 14.60546875, 15.322509765625, 16.03955078125, 16.756591796875, 17.4736328125, 18.190673828125, 18.90771484375, 19.624755859375, 20.341796875, 21.058837890625, 21.77587890625, 22.492919921875, 23.2099609375, 23.927001953125, 24.64404296875, 25.361083984375, 26.078125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 59.0, 275.0, 453.0, 194.0, 28.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.2837677001953, -136.19705200195312, -132.11033630371094, -128.02362060546875, -123.9369125366211, -119.8501968383789, -115.76348876953125, -111.67677307128906, -107.59005737304688, -103.50334167480469, -99.4166259765625, -95.32991790771484, -91.24320220947266, -87.15648651123047, -83.06977844238281, -78.98306274414062, -74.89634704589844, -70.80963134765625, -66.72291564941406, -62.636207580566406, -58.54949188232422, -54.46277618408203, -50.37606430053711, -46.28935241699219, -42.20263671875, -38.11592102050781, -34.02920913696289, -29.942495346069336, -25.85578155517578, -21.769067764282227, -17.682353973388672, -13.595640182495117, -9.508941650390625, -5.42222785949707, -1.3355140686035156, 2.751199722290039, 6.837913513183594, 10.924627304077148, 15.011341094970703, 19.098054885864258, 23.184768676757812, 27.271482467651367, 31.358196258544922, 35.444908142089844, 39.53162384033203, 43.61833953857422, 47.70505142211914, 51.79176330566406, 55.87847900390625, 59.96519470214844, 64.05191040039062, 68.13861846923828, 72.22533416748047, 76.31204986572266, 80.39875793457031, 84.4854736328125, 88.57218933105469, 92.65890502929688, 96.74562072753906, 100.83232879638672, 104.9190444946289, 109.0057601928711, 113.09246826171875, 117.17918395996094, 121.26589965820312]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 9.0, 6.0, 4.0, 9.0, 13.0, 5.0, 13.0, 20.0, 15.0, 33.0, 34.0, 34.0, 43.0, 42.0, 42.0, 37.0, 34.0, 51.0, 43.0, 48.0, 41.0, 44.0, 43.0, 42.0, 32.0, 52.0, 26.0, 24.0, 24.0, 19.0, 18.0, 24.0, 18.0, 18.0, 10.0, 13.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.325834274291992, -20.60890007019043, -19.891965866088867, -19.175031661987305, -18.458099365234375, -17.741165161132812, -17.02423095703125, -16.307296752929688, -15.590362548828125, -14.873428344726562, -14.156494140625, -13.439560890197754, -12.722626686096191, -12.005692481994629, -11.288759231567383, -10.57182502746582, -9.854890823364258, -9.137956619262695, -8.421022415161133, -7.704089164733887, -6.987154960632324, -6.270220756530762, -5.553287029266357, -4.836353302001953, -4.119419097900391, -3.4024851322174072, -2.685551166534424, -1.9686172008514404, -1.251683235168457, -0.5347492694854736, 0.18218469619750977, 0.8991184234619141, 1.6160507202148438, 2.332984685897827, 3.0499186515808105, 3.766852617263794, 4.483786582946777, 5.20072078704834, 5.917654514312744, 6.634588241577148, 7.351522445678711, 8.068456649780273, 8.785390853881836, 9.502324104309082, 10.219258308410645, 10.936192512512207, 11.653125762939453, 12.370059967041016, 13.086994171142578, 13.80392837524414, 14.520862579345703, 15.23779582977295, 15.954730033874512, 16.671663284301758, 17.38859748840332, 18.105531692504883, 18.822465896606445, 19.539400100708008, 20.25633430480957, 20.973268508911133, 21.690200805664062, 22.407135009765625, 23.124069213867188, 23.84100341796875, 24.557937622070312]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 15.0, 14.0, 14.0, 13.0, 17.0, 21.0, 17.0, 25.0, 36.0, 27.0, 24.0, 38.0, 38.0, 45.0, 44.0, 35.0, 40.0, 54.0, 40.0, 51.0, 46.0, 34.0, 35.0, 30.0, 26.0, 27.0, 20.0, 28.0, 21.0, 16.0, 12.0, 19.0, 7.0, 11.0, 10.0, 8.0, 1.0, 3.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.34906005859375, -3.2410888671875, -3.13311767578125, -3.025146484375, -2.91717529296875, -2.8092041015625, -2.70123291015625, -2.59326171875, -2.48529052734375, -2.3773193359375, -2.26934814453125, -2.161376953125, -2.05340576171875, -1.9454345703125, -1.83746337890625, -1.7294921875, -1.62152099609375, -1.5135498046875, -1.40557861328125, -1.297607421875, -1.18963623046875, -1.0816650390625, -0.97369384765625, -0.86572265625, -0.75775146484375, -0.6497802734375, -0.54180908203125, -0.433837890625, -0.32586669921875, -0.2178955078125, -0.10992431640625, -0.001953125, 0.10601806640625, 0.2139892578125, 0.32196044921875, 0.429931640625, 0.53790283203125, 0.6458740234375, 0.75384521484375, 0.86181640625, 0.96978759765625, 1.0777587890625, 1.18572998046875, 1.293701171875, 1.40167236328125, 1.5096435546875, 1.61761474609375, 1.7255859375, 1.83355712890625, 1.9415283203125, 2.04949951171875, 2.157470703125, 2.26544189453125, 2.3734130859375, 2.48138427734375, 2.58935546875, 2.69732666015625, 2.8052978515625, 2.91326904296875, 3.021240234375, 3.12921142578125, 3.2371826171875, 3.34515380859375, 3.453125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 9.0, 18.0, 27.0, 47.0, 69.0, 82.0, 146.0, 194.0, 301.0, 454.0, 622.0, 895.0, 1391.0, 2149.0, 3179.0, 4641.0, 6934.0, 10051.0, 15300.0, 23174.0, 35539.0, 58210.0, 105677.0, 288698.0, 237250.0, 97974.0, 55045.0, 33941.0, 21931.0, 14701.0, 9669.0, 6624.0, 4442.0, 2913.0, 2027.0, 1421.0, 911.0, 629.0, 427.0, 267.0, 217.0, 126.0, 92.0, 53.0, 30.0, 21.0, 13.0, 9.0, 11.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.141357421875, -0.136932373046875, -0.13250732421875, -0.128082275390625, -0.1236572265625, -0.119232177734375, -0.11480712890625, -0.110382080078125, -0.10595703125, -0.101531982421875, -0.09710693359375, -0.092681884765625, -0.0882568359375, -0.083831787109375, -0.07940673828125, -0.074981689453125, -0.070556640625, -0.066131591796875, -0.06170654296875, -0.057281494140625, -0.0528564453125, -0.048431396484375, -0.04400634765625, -0.039581298828125, -0.03515625, -0.030731201171875, -0.02630615234375, -0.021881103515625, -0.0174560546875, -0.013031005859375, -0.00860595703125, -0.004180908203125, 0.000244140625, 0.004669189453125, 0.00909423828125, 0.013519287109375, 0.0179443359375, 0.022369384765625, 0.02679443359375, 0.031219482421875, 0.03564453125, 0.040069580078125, 0.04449462890625, 0.048919677734375, 0.0533447265625, 0.057769775390625, 0.06219482421875, 0.066619873046875, 0.071044921875, 0.075469970703125, 0.07989501953125, 0.084320068359375, 0.0887451171875, 0.093170166015625, 0.09759521484375, 0.102020263671875, 0.1064453125, 0.110870361328125, 0.11529541015625, 0.119720458984375, 0.1241455078125, 0.128570556640625, 0.13299560546875, 0.137420654296875, 0.141845703125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 7.0, 5.0, 6.0, 7.0, 12.0, 12.0, 8.0, 17.0, 16.0, 25.0, 20.0, 30.0, 24.0, 30.0, 41.0, 37.0, 30.0, 35.0, 39.0, 35.0, 37.0, 39.0, 1066.0, 31.0, 37.0, 37.0, 30.0, 45.0, 32.0, 35.0, 25.0, 17.0, 17.0, 25.0, 21.0, 14.0, 15.0, 16.0, 12.0, 8.0, 4.0, 6.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.48828125, -2.41070556640625, -2.3331298828125, -2.25555419921875, -2.177978515625, -2.10040283203125, -2.0228271484375, -1.94525146484375, -1.86767578125, -1.79010009765625, -1.7125244140625, -1.63494873046875, -1.557373046875, -1.47979736328125, -1.4022216796875, -1.32464599609375, -1.2470703125, -1.16949462890625, -1.0919189453125, -1.01434326171875, -0.936767578125, -0.85919189453125, -0.7816162109375, -0.70404052734375, -0.62646484375, -0.54888916015625, -0.4713134765625, -0.39373779296875, -0.316162109375, -0.23858642578125, -0.1610107421875, -0.08343505859375, -0.005859375, 0.07171630859375, 0.1492919921875, 0.22686767578125, 0.304443359375, 0.38201904296875, 0.4595947265625, 0.53717041015625, 0.61474609375, 0.69232177734375, 0.7698974609375, 0.84747314453125, 0.925048828125, 1.00262451171875, 1.0802001953125, 1.15777587890625, 1.2353515625, 1.31292724609375, 1.3905029296875, 1.46807861328125, 1.545654296875, 1.62322998046875, 1.7008056640625, 1.77838134765625, 1.85595703125, 1.93353271484375, 2.0111083984375, 2.08868408203125, 2.166259765625, 2.24383544921875, 2.3214111328125, 2.39898681640625, 2.4765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 15.0, 13.0, 25.0, 38.0, 50.0, 83.0, 111.0, 187.0, 194.0, 369.0, 493.0, 675.0, 966.0, 1392.0, 1963.0, 2834.0, 4092.0, 5792.0, 8561.0, 12084.0, 18039.0, 26606.0, 41156.0, 65828.0, 111791.0, 1296079.0, 208871.0, 104925.0, 62922.0, 39422.0, 25770.0, 17186.0, 11915.0, 8081.0, 5618.0, 3856.0, 2804.0, 1932.0, 1305.0, 953.0, 625.0, 462.0, 332.0, 225.0, 148.0, 117.0, 70.0, 52.0, 43.0, 23.0, 16.0, 9.0, 9.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.0714111328125, -0.06917572021484375, -0.0669403076171875, -0.06470489501953125, -0.062469482421875, -0.06023406982421875, -0.0579986572265625, -0.05576324462890625, -0.05352783203125, -0.05129241943359375, -0.0490570068359375, -0.04682159423828125, -0.044586181640625, -0.04235076904296875, -0.0401153564453125, -0.03787994384765625, -0.03564453125, -0.03340911865234375, -0.0311737060546875, -0.02893829345703125, -0.026702880859375, -0.02446746826171875, -0.0222320556640625, -0.01999664306640625, -0.01776123046875, -0.01552581787109375, -0.0132904052734375, -0.01105499267578125, -0.008819580078125, -0.00658416748046875, -0.0043487548828125, -0.00211334228515625, 0.0001220703125, 0.00235748291015625, 0.0045928955078125, 0.00682830810546875, 0.009063720703125, 0.01129913330078125, 0.0135345458984375, 0.01576995849609375, 0.01800537109375, 0.02024078369140625, 0.0224761962890625, 0.02471160888671875, 0.026947021484375, 0.02918243408203125, 0.0314178466796875, 0.03365325927734375, 0.035888671875, 0.03812408447265625, 0.0403594970703125, 0.04259490966796875, 0.044830322265625, 0.04706573486328125, 0.0493011474609375, 0.05153656005859375, 0.05377197265625, 0.05600738525390625, 0.0582427978515625, 0.06047821044921875, 0.062713623046875, 0.06494903564453125, 0.0671844482421875, 0.06941986083984375, 0.0716552734375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 0.0, 7.0, 14.0, 9.0, 13.0, 16.0, 21.0, 19.0, 41.0, 36.0, 0.0, 28.0, 60.0, 72.0, 302.0, 84.0, 64.0, 37.0, 33.0, 30.0, 15.0, 0.0, 21.0, 10.0, 11.0, 13.0, 2.0, 3.0, 5.0, 7.0, 10.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9073486328125e-06, -1.8533319234848022e-06, -1.7993152141571045e-06, -1.7452985048294067e-06, -1.691281795501709e-06, -1.6372650861740112e-06, -1.5832483768463135e-06, -1.5292316675186157e-06, -1.475214958190918e-06, -1.4211982488632202e-06, -1.3671815395355225e-06, -1.3131648302078247e-06, -1.259148120880127e-06, -1.2051314115524292e-06, -1.1511147022247314e-06, -1.0970979928970337e-06, -1.043081283569336e-06, -9.890645742416382e-07, -9.350478649139404e-07, -8.810311555862427e-07, -8.270144462585449e-07, -7.729977369308472e-07, -7.189810276031494e-07, -6.649643182754517e-07, -6.109476089477539e-07, -5.569308996200562e-07, -5.029141902923584e-07, -4.4889748096466064e-07, -3.948807716369629e-07, -3.4086406230926514e-07, -2.868473529815674e-07, -2.3283064365386963e-07, -1.7881393432617188e-07, -1.2479722499847412e-07, -7.078051567077637e-08, -1.6763806343078613e-08, 3.725290298461914e-08, 9.12696123123169e-08, 1.4528632164001465e-07, 1.993030309677124e-07, 2.5331974029541016e-07, 3.073364496231079e-07, 3.6135315895080566e-07, 4.153698682785034e-07, 4.6938657760620117e-07, 5.234032869338989e-07, 5.774199962615967e-07, 6.314367055892944e-07, 6.854534149169922e-07, 7.394701242446899e-07, 7.934868335723877e-07, 8.475035429000854e-07, 9.015202522277832e-07, 9.55536961555481e-07, 1.0095536708831787e-06, 1.0635703802108765e-06, 1.1175870895385742e-06, 1.171603798866272e-06, 1.2256205081939697e-06, 1.2796372175216675e-06, 1.3336539268493652e-06, 1.387670636177063e-06, 1.4416873455047607e-06, 1.4957040548324585e-06, 1.5497207641601562e-06]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 5.0, 4.0, 2.0, 4.0, 4.0, 8.0, 8.0, 6.0, 13.0, 18.0, 20.0, 17.0, 37.0, 56.0, 93.0, 196.0, 762.0, 42307.0, 988610.0, 15447.0, 455.0, 149.0, 88.0, 56.0, 48.0, 30.0, 18.0, 14.0, 12.0, 14.0, 10.0, 7.0, 7.0, 8.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.403425216674805e-05, -3.287661820650101e-05, -3.171898424625397e-05, -3.056135028600693e-05, -2.9403716325759888e-05, -2.8246082365512848e-05, -2.7088448405265808e-05, -2.593081444501877e-05, -2.477318048477173e-05, -2.361554652452469e-05, -2.245791256427765e-05, -2.130027860403061e-05, -2.014264464378357e-05, -1.898501068353653e-05, -1.782737672328949e-05, -1.666974276304245e-05, -1.551210880279541e-05, -1.435447484254837e-05, -1.319684088230133e-05, -1.203920692205429e-05, -1.0881572961807251e-05, -9.723939001560211e-06, -8.566305041313171e-06, -7.408671081066132e-06, -6.251037120819092e-06, -5.093403160572052e-06, -3.935769200325012e-06, -2.7781352400779724e-06, -1.6205012798309326e-06, -4.628673195838928e-07, 6.94766640663147e-07, 1.8524006009101868e-06, 3.0100345611572266e-06, 4.167668521404266e-06, 5.325302481651306e-06, 6.482936441898346e-06, 7.640570402145386e-06, 8.798204362392426e-06, 9.955838322639465e-06, 1.1113472282886505e-05, 1.2271106243133545e-05, 1.3428740203380585e-05, 1.4586374163627625e-05, 1.5744008123874664e-05, 1.6901642084121704e-05, 1.8059276044368744e-05, 1.9216910004615784e-05, 2.0374543964862823e-05, 2.1532177925109863e-05, 2.2689811885356903e-05, 2.3847445845603943e-05, 2.5005079805850983e-05, 2.6162713766098022e-05, 2.7320347726345062e-05, 2.8477981686592102e-05, 2.9635615646839142e-05, 3.079324960708618e-05, 3.195088356733322e-05, 3.310851752758026e-05, 3.42661514878273e-05, 3.542378544807434e-05, 3.658141940832138e-05, 3.773905336856842e-05, 3.889668732881546e-05, 4.00543212890625e-05]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 27.0, 173.0, 648.0, 140.0, 24.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.361460459127557e-06, -8.202021490433253e-06, -8.04258252173895e-06, -7.883144462539349e-06, -7.723705493845046e-06, -7.564266525150742e-06, -7.404827556456439e-06, -7.245389042509487e-06, -7.085950073815184e-06, -6.9265111051208805e-06, -6.767072591173928e-06, -6.607633622479625e-06, -6.448195108532673e-06, -6.2887561398383696e-06, -6.129317625891417e-06, -5.969878657197114e-06, -5.810439688502811e-06, -5.651000719808508e-06, -5.491562205861555e-06, -5.332123237167252e-06, -5.1726847232203e-06, -5.013245754525997e-06, -4.8538067858316936e-06, -4.694368271884741e-06, -4.534929757937789e-06, -4.375490789243486e-06, -4.2160522752965335e-06, -4.05661330660223e-06, -3.897174792655278e-06, -3.737735823960975e-06, -3.578297082640347e-06, -3.4188583413197193e-06, -3.259419827372767e-06, -3.0999810860521393e-06, -2.9405423447315115e-06, -2.7811033760372084e-06, -2.6216646347165806e-06, -2.462225893395953e-06, -2.302787152075325e-06, -2.1433484107546974e-06, -1.9839094420603942e-06, -1.8244707007397665e-06, -1.665031845732301e-06, -1.5055931044116733e-06, -1.3461542494042078e-06, -1.18671550808358e-06, -1.0272767667629523e-06, -8.678379117554869e-07, -7.083991704348591e-07, -5.489603722708125e-07, -3.8952160252847534e-07, -2.3008283278613817e-07, -7.064403462209157e-08, 8.879476354195504e-08, 2.482335048625828e-07, 4.0767235987004824e-07, 5.67111101190676e-07, 7.265498993547226e-07, 8.859886975187692e-07, 1.045427438839397e-06, 1.2048662938468624e-06, 1.3643050351674901e-06, 1.5237437764881179e-06, 1.6831826314955833e-06, 1.842621372816211e-06]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 8.0, 0.0, 23.0, 0.0, 0.0, 35.0, 0.0, 0.0, 37.0, 0.0, 58.0, 0.0, 0.0, 100.0, 0.0, 0.0, 133.0, 0.0, 213.0, 0.0, 0.0, 141.0, 0.0, 0.0, 100.0, 0.0, 59.0, 0.0, 0.0, 45.0, 0.0, 0.0, 25.0, 0.0, 19.0, 0.0, 0.0, 9.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.736947059631348e-07, -5.513429641723633e-07, -5.289912223815918e-07, -5.066394805908203e-07, -4.842877388000488e-07, -4.6193599700927734e-07, -4.3958425521850586e-07, -4.172325134277344e-07, -3.948807716369629e-07, -3.725290298461914e-07, -3.501772880554199e-07, -3.2782554626464844e-07, -3.0547380447387695e-07, -2.8312206268310547e-07, -2.60770320892334e-07, -2.384185791015625e-07, -2.1606683731079102e-07, -1.9371509552001953e-07, -1.7136335372924805e-07, -1.4901161193847656e-07, -1.2665987014770508e-07, -1.043081283569336e-07, -8.195638656616211e-08, -5.960464477539063e-08, -3.725290298461914e-08, -1.4901161193847656e-08, 7.450580596923828e-09, 2.9802322387695312e-08, 5.21540641784668e-08, 7.450580596923828e-08, 9.685754776000977e-08, 1.1920928955078125e-07, 1.4156103134155273e-07, 1.6391277313232422e-07, 1.862645149230957e-07, 2.086162567138672e-07, 2.3096799850463867e-07, 2.5331974029541016e-07, 2.7567148208618164e-07, 2.980232238769531e-07, 3.203749656677246e-07, 3.427267074584961e-07, 3.650784492492676e-07, 3.8743019104003906e-07, 4.0978193283081055e-07, 4.3213367462158203e-07, 4.544854164123535e-07, 4.76837158203125e-07, 4.991888999938965e-07, 5.21540641784668e-07, 5.438923835754395e-07, 5.662441253662109e-07, 5.885958671569824e-07, 6.109476089477539e-07, 6.332993507385254e-07, 6.556510925292969e-07, 6.780028343200684e-07, 7.003545761108398e-07, 7.227063179016113e-07, 7.450580596923828e-07, 7.674098014831543e-07, 7.897615432739258e-07, 8.121132850646973e-07, 8.344650268554688e-07]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 15.0, 14.0, 14.0, 13.0, 17.0, 21.0, 17.0, 25.0, 36.0, 27.0, 24.0, 38.0, 38.0, 45.0, 44.0, 35.0, 40.0, 54.0, 40.0, 51.0, 46.0, 34.0, 35.0, 30.0, 26.0, 27.0, 20.0, 28.0, 21.0, 16.0, 12.0, 19.0, 7.0, 11.0, 10.0, 8.0, 1.0, 3.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.34906005859375, -3.2410888671875, -3.13311767578125, -3.025146484375, -2.91717529296875, -2.8092041015625, -2.70123291015625, -2.59326171875, -2.48529052734375, -2.3773193359375, -2.26934814453125, -2.161376953125, -2.05340576171875, -1.9454345703125, -1.83746337890625, -1.7294921875, -1.62152099609375, -1.5135498046875, -1.40557861328125, -1.297607421875, -1.18963623046875, -1.0816650390625, -0.97369384765625, -0.86572265625, -0.75775146484375, -0.6497802734375, -0.54180908203125, -0.433837890625, -0.32586669921875, -0.2178955078125, -0.10992431640625, -0.001953125, 0.10601806640625, 0.2139892578125, 0.32196044921875, 0.429931640625, 0.53790283203125, 0.6458740234375, 0.75384521484375, 0.86181640625, 0.96978759765625, 1.0777587890625, 1.18572998046875, 1.293701171875, 1.40167236328125, 1.5096435546875, 1.61761474609375, 1.7255859375, 1.83355712890625, 1.9415283203125, 2.04949951171875, 2.157470703125, 2.26544189453125, 2.3734130859375, 2.48138427734375, 2.58935546875, 2.69732666015625, 2.8052978515625, 2.91326904296875, 3.021240234375, 3.12921142578125, 3.2371826171875, 3.34515380859375, 3.453125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 1.0, 16.0, 21.0, 38.0, 57.0, 78.0, 139.0, 221.0, 379.0, 564.0, 900.0, 1397.0, 2229.0, 3318.0, 5267.0, 8345.0, 13267.0, 20919.0, 32738.0, 51572.0, 83765.0, 145224.0, 222967.0, 180989.0, 103525.0, 62437.0, 39167.0, 25178.0, 15868.0, 10160.0, 6524.0, 4057.0, 2593.0, 1669.0, 1075.0, 705.0, 426.0, 275.0, 205.0, 107.0, 71.0, 42.0, 21.0, 15.0, 10.0, 1.0, 9.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.984375, -2.887176513671875, -2.78997802734375, -2.692779541015625, -2.5955810546875, -2.498382568359375, -2.40118408203125, -2.303985595703125, -2.206787109375, -2.109588623046875, -2.01239013671875, -1.915191650390625, -1.8179931640625, -1.720794677734375, -1.62359619140625, -1.526397705078125, -1.42919921875, -1.332000732421875, -1.23480224609375, -1.137603759765625, -1.0404052734375, -0.943206787109375, -0.84600830078125, -0.748809814453125, -0.651611328125, -0.554412841796875, -0.45721435546875, -0.360015869140625, -0.2628173828125, -0.165618896484375, -0.06842041015625, 0.028778076171875, 0.1259765625, 0.223175048828125, 0.32037353515625, 0.417572021484375, 0.5147705078125, 0.611968994140625, 0.70916748046875, 0.806365966796875, 0.903564453125, 1.000762939453125, 1.09796142578125, 1.195159912109375, 1.2923583984375, 1.389556884765625, 1.48675537109375, 1.583953857421875, 1.68115234375, 1.778350830078125, 1.87554931640625, 1.972747802734375, 2.0699462890625, 2.167144775390625, 2.26434326171875, 2.361541748046875, 2.458740234375, 2.555938720703125, 2.65313720703125, 2.750335693359375, 2.8475341796875, 2.944732666015625, 3.04193115234375, 3.139129638671875, 3.236328125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 7.0, 4.0, 5.0, 6.0, 13.0, 10.0, 5.0, 16.0, 16.0, 20.0, 26.0, 23.0, 23.0, 30.0, 31.0, 39.0, 41.0, 64.0, 82.0, 134.0, 271.0, 1349.0, 227.0, 138.0, 75.0, 58.0, 45.0, 41.0, 38.0, 32.0, 32.0, 23.0, 24.0, 18.0, 10.0, 7.0, 13.0, 12.0, 10.0, 10.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.8125, -10.46728515625, -10.1220703125, -9.77685546875, -9.431640625, -9.08642578125, -8.7412109375, -8.39599609375, -8.05078125, -7.70556640625, -7.3603515625, -7.01513671875, -6.669921875, -6.32470703125, -5.9794921875, -5.63427734375, -5.2890625, -4.94384765625, -4.5986328125, -4.25341796875, -3.908203125, -3.56298828125, -3.2177734375, -2.87255859375, -2.52734375, -2.18212890625, -1.8369140625, -1.49169921875, -1.146484375, -0.80126953125, -0.4560546875, -0.11083984375, 0.234375, 0.57958984375, 0.9248046875, 1.27001953125, 1.615234375, 1.96044921875, 2.3056640625, 2.65087890625, 2.99609375, 3.34130859375, 3.6865234375, 4.03173828125, 4.376953125, 4.72216796875, 5.0673828125, 5.41259765625, 5.7578125, 6.10302734375, 6.4482421875, 6.79345703125, 7.138671875, 7.48388671875, 7.8291015625, 8.17431640625, 8.51953125, 8.86474609375, 9.2099609375, 9.55517578125, 9.900390625, 10.24560546875, 10.5908203125, 10.93603515625, 11.28125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 10.0, 9.0, 7.0, 12.0, 14.0, 14.0, 24.0, 37.0, 38.0, 56.0, 95.0, 96.0, 143.0, 214.0, 390.0, 1042.0, 5791.0, 61980.0, 1303586.0, 1686120.0, 76706.0, 7012.0, 1103.0, 371.0, 238.0, 154.0, 91.0, 93.0, 58.0, 41.0, 35.0, 30.0, 21.0, 14.0, 6.0, 16.0, 10.0, 6.0, 5.0, 4.0, 8.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.625, -15.166015625, -14.70703125, -14.248046875, -13.7890625, -13.330078125, -12.87109375, -12.412109375, -11.953125, -11.494140625, -11.03515625, -10.576171875, -10.1171875, -9.658203125, -9.19921875, -8.740234375, -8.28125, -7.822265625, -7.36328125, -6.904296875, -6.4453125, -5.986328125, -5.52734375, -5.068359375, -4.609375, -4.150390625, -3.69140625, -3.232421875, -2.7734375, -2.314453125, -1.85546875, -1.396484375, -0.9375, -0.478515625, -0.01953125, 0.439453125, 0.8984375, 1.357421875, 1.81640625, 2.275390625, 2.734375, 3.193359375, 3.65234375, 4.111328125, 4.5703125, 5.029296875, 5.48828125, 5.947265625, 6.40625, 6.865234375, 7.32421875, 7.783203125, 8.2421875, 8.701171875, 9.16015625, 9.619140625, 10.078125, 10.537109375, 10.99609375, 11.455078125, 11.9140625, 12.373046875, 12.83203125, 13.291015625, 13.75]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 16.0, 132.0, 470.0, 334.0, 59.0, 7.0], "bins": [-198.3383331298828, -195.07504272460938, -191.81173706054688, -188.54844665527344, -185.28514099121094, -182.0218505859375, -178.758544921875, -175.49525451660156, -172.23194885253906, -168.96865844726562, -165.70535278320312, -162.4420623779297, -159.1787567138672, -155.91546630859375, -152.65216064453125, -149.3888702392578, -146.12557983398438, -142.86228942871094, -139.59898376464844, -136.335693359375, -133.0723876953125, -129.80909729003906, -126.54579162597656, -123.28250122070312, -120.01919555664062, -116.75589752197266, -113.49259948730469, -110.22930145263672, -106.96600341796875, -103.70270538330078, -100.43940734863281, -97.17611694335938, -93.91280364990234, -90.64950561523438, -87.3862075805664, -84.12290954589844, -80.85961151123047, -77.5963134765625, -74.33302307128906, -71.06971740722656, -67.80642700195312, -64.54312896728516, -61.27983093261719, -58.01653289794922, -54.75323486328125, -51.48993682861328, -48.22664260864258, -44.96334457397461, -41.700042724609375, -38.436744689941406, -35.17344665527344, -31.9101505279541, -28.646852493286133, -25.383554458618164, -22.120258331298828, -18.85696029663086, -15.593664169311523, -12.330366134643555, -9.067069053649902, -5.80377197265625, -2.5404739379882812, 0.7228240966796875, 3.9861202239990234, 7.249418258666992, 10.512716293334961]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 4.0, 9.0, 5.0, 6.0, 17.0, 14.0, 13.0, 17.0, 27.0, 15.0, 25.0, 36.0, 26.0, 33.0, 25.0, 29.0, 34.0, 42.0, 32.0, 50.0, 37.0, 35.0, 43.0, 40.0, 35.0, 40.0, 43.0, 30.0, 36.0, 28.0, 27.0, 21.0, 19.0, 18.0, 13.0, 8.0, 11.0, 10.0, 10.0, 9.0, 10.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-31.950580596923828, -31.040042877197266, -30.129507064819336, -29.218969345092773, -28.308433532714844, -27.39789581298828, -26.48736000061035, -25.57682228088379, -24.66628646850586, -23.755748748779297, -22.845212936401367, -21.934675216674805, -21.024139404296875, -20.113601684570312, -19.203065872192383, -18.29252815246582, -17.38199234008789, -16.471454620361328, -15.560918807983398, -14.650382041931152, -13.739845275878906, -12.829307556152344, -11.918771743774414, -11.008234024047852, -10.097696304321289, -9.187159538269043, -8.276622772216797, -7.366086006164551, -6.455549240112305, -5.5450119972229, -4.634475231170654, -3.723938465118408, -2.8134021759033203, -1.9028654098510742, -0.9923285245895386, -0.08179163932800293, 0.8287451267242432, 1.7392821311950684, 2.6498188972473145, 3.5603556632995605, 4.470892429351807, 5.381429195404053, 6.291965961456299, 7.202503204345703, 8.11303997039795, 9.023576736450195, 9.934113502502441, 10.844650268554688, 11.755187034606934, 12.66572380065918, 13.576260566711426, 14.486797332763672, 15.397334098815918, 16.307870864868164, 17.218408584594727, 18.128944396972656, 19.03948211669922, 19.95001983642578, 20.86055564880371, 21.771093368530273, 22.681629180908203, 23.592166900634766, 24.502702713012695, 25.413240432739258, 26.323776245117188]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 10.0, 4.0, 8.0, 8.0, 9.0, 14.0, 19.0, 17.0, 18.0, 19.0, 24.0, 31.0, 35.0, 34.0, 46.0, 33.0, 45.0, 52.0, 37.0, 39.0, 50.0, 47.0, 37.0, 36.0, 32.0, 45.0, 33.0, 31.0, 29.0, 21.0, 29.0, 14.0, 15.0, 12.0, 16.0, 7.0, 12.0, 6.0, 4.0, 3.0, 3.0, 4.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-4.01953125, -3.90399169921875, -3.7884521484375, -3.67291259765625, -3.557373046875, -3.44183349609375, -3.3262939453125, -3.21075439453125, -3.09521484375, -2.97967529296875, -2.8641357421875, -2.74859619140625, -2.633056640625, -2.51751708984375, -2.4019775390625, -2.28643798828125, -2.1708984375, -2.05535888671875, -1.9398193359375, -1.82427978515625, -1.708740234375, -1.59320068359375, -1.4776611328125, -1.36212158203125, -1.24658203125, -1.13104248046875, -1.0155029296875, -0.89996337890625, -0.784423828125, -0.66888427734375, -0.5533447265625, -0.43780517578125, -0.322265625, -0.20672607421875, -0.0911865234375, 0.02435302734375, 0.139892578125, 0.25543212890625, 0.3709716796875, 0.48651123046875, 0.60205078125, 0.71759033203125, 0.8331298828125, 0.94866943359375, 1.064208984375, 1.17974853515625, 1.2952880859375, 1.41082763671875, 1.5263671875, 1.64190673828125, 1.7574462890625, 1.87298583984375, 1.988525390625, 2.10406494140625, 2.2196044921875, 2.33514404296875, 2.45068359375, 2.56622314453125, 2.6817626953125, 2.79730224609375, 2.912841796875, 3.02838134765625, 3.1439208984375, 3.25946044921875, 3.375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 8.0, 10.0, 10.0, 18.0, 11.0, 26.0, 15.0, 19.0, 25.0, 33.0, 46.0, 65.0, 171.0, 463.0, 2523.0, 15123.0, 116813.0, 1012029.0, 2530272.0, 454288.0, 53052.0, 7344.0, 1260.0, 293.0, 93.0, 51.0, 28.0, 32.0, 28.0, 26.0, 13.0, 13.0, 9.0, 13.0, 14.0, 8.0, 10.0, 8.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-10.4765625, -10.18804931640625, -9.8995361328125, -9.61102294921875, -9.322509765625, -9.03399658203125, -8.7454833984375, -8.45697021484375, -8.16845703125, -7.87994384765625, -7.5914306640625, -7.30291748046875, -7.014404296875, -6.72589111328125, -6.4373779296875, -6.14886474609375, -5.8603515625, -5.57183837890625, -5.2833251953125, -4.99481201171875, -4.706298828125, -4.41778564453125, -4.1292724609375, -3.84075927734375, -3.55224609375, -3.26373291015625, -2.9752197265625, -2.68670654296875, -2.398193359375, -2.10968017578125, -1.8211669921875, -1.53265380859375, -1.244140625, -0.95562744140625, -0.6671142578125, -0.37860107421875, -0.090087890625, 0.19842529296875, 0.4869384765625, 0.77545166015625, 1.06396484375, 1.35247802734375, 1.6409912109375, 1.92950439453125, 2.218017578125, 2.50653076171875, 2.7950439453125, 3.08355712890625, 3.3720703125, 3.66058349609375, 3.9490966796875, 4.23760986328125, 4.526123046875, 4.81463623046875, 5.1031494140625, 5.39166259765625, 5.68017578125, 5.96868896484375, 6.2572021484375, 6.54571533203125, 6.834228515625, 7.12274169921875, 7.4112548828125, 7.69976806640625, 7.98828125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 4.0, 11.0, 10.0, 16.0, 19.0, 26.0, 39.0, 34.0, 58.0, 75.0, 102.0, 122.0, 153.0, 212.0, 256.0, 356.0, 442.0, 404.0, 380.0, 302.0, 219.0, 205.0, 148.0, 115.0, 94.0, 71.0, 50.0, 31.0, 36.0, 24.0, 17.0, 11.0, 8.0, 5.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.98828125, -5.8135986328125, -5.638916015625, -5.4642333984375, -5.28955078125, -5.1148681640625, -4.940185546875, -4.7655029296875, -4.5908203125, -4.4161376953125, -4.241455078125, -4.0667724609375, -3.89208984375, -3.7174072265625, -3.542724609375, -3.3680419921875, -3.193359375, -3.0186767578125, -2.843994140625, -2.6693115234375, -2.49462890625, -2.3199462890625, -2.145263671875, -1.9705810546875, -1.7958984375, -1.6212158203125, -1.446533203125, -1.2718505859375, -1.09716796875, -0.9224853515625, -0.747802734375, -0.5731201171875, -0.3984375, -0.2237548828125, -0.049072265625, 0.1256103515625, 0.30029296875, 0.4749755859375, 0.649658203125, 0.8243408203125, 0.9990234375, 1.1737060546875, 1.348388671875, 1.5230712890625, 1.69775390625, 1.8724365234375, 2.047119140625, 2.2218017578125, 2.396484375, 2.5711669921875, 2.745849609375, 2.9205322265625, 3.09521484375, 3.2698974609375, 3.444580078125, 3.6192626953125, 3.7939453125, 3.9686279296875, 4.143310546875, 4.3179931640625, 4.49267578125, 4.6673583984375, 4.842041015625, 5.0167236328125, 5.19140625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 4.0, 7.0, 12.0, 16.0, 25.0, 26.0, 41.0, 55.0, 87.0, 105.0, 163.0, 224.0, 370.0, 696.0, 3412.0, 81409.0, 2751343.0, 1319863.0, 32870.0, 1981.0, 571.0, 303.0, 182.0, 142.0, 115.0, 63.0, 48.0, 42.0, 21.0, 22.0, 17.0, 14.0, 9.0, 6.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.348876953125, -17.71337890625, -17.077880859375, -16.4423828125, -15.806884765625, -15.17138671875, -14.535888671875, -13.900390625, -13.264892578125, -12.62939453125, -11.993896484375, -11.3583984375, -10.722900390625, -10.08740234375, -9.451904296875, -8.81640625, -8.180908203125, -7.54541015625, -6.909912109375, -6.2744140625, -5.638916015625, -5.00341796875, -4.367919921875, -3.732421875, -3.096923828125, -2.46142578125, -1.825927734375, -1.1904296875, -0.554931640625, 0.08056640625, 0.716064453125, 1.3515625, 1.987060546875, 2.62255859375, 3.258056640625, 3.8935546875, 4.529052734375, 5.16455078125, 5.800048828125, 6.435546875, 7.071044921875, 7.70654296875, 8.342041015625, 8.9775390625, 9.613037109375, 10.24853515625, 10.884033203125, 11.51953125, 12.155029296875, 12.79052734375, 13.426025390625, 14.0615234375, 14.697021484375, 15.33251953125, 15.968017578125, 16.603515625, 17.239013671875, 17.87451171875, 18.510009765625, 19.1455078125, 19.781005859375, 20.41650390625, 21.052001953125, 21.6875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 12.0, 76.0, 175.0, 360.0, 260.0, 108.0, 26.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.68100357055664, -15.911445617675781, -13.141887664794922, -10.372329711914062, -7.602771759033203, -4.833213806152344, -2.0636558532714844, 0.705902099609375, 3.4754600524902344, 6.245018005371094, 9.014575958251953, 11.784133911132812, 14.553691864013672, 17.32324981689453, 20.09280776977539, 22.86236572265625, 25.63192367553711, 28.40148162841797, 31.171039581298828, 33.94059753417969, 36.71015548706055, 39.479713439941406, 42.249271392822266, 45.018829345703125, 47.788387298583984, 50.557945251464844, 53.3275032043457, 56.09706115722656, 58.86661911010742, 61.63617706298828, 64.40573120117188, 67.17529296875, 69.94485473632812, 72.71441650390625, 75.48397064208984, 78.25352478027344, 81.02308654785156, 83.79264831542969, 86.56220245361328, 89.33175659179688, 92.101318359375, 94.87088012695312, 97.64043426513672, 100.40998840332031, 103.17955017089844, 105.94911193847656, 108.71866607666016, 111.48822021484375, 114.25778198242188, 117.02734375, 119.7968978881836, 122.56645202636719, 125.33601379394531, 128.10557556152344, 130.8751220703125, 133.64468383789062, 136.41424560546875, 139.18380737304688, 141.953369140625, 144.72291564941406, 147.4924774169922, 150.2620391845703, 153.03158569335938, 155.8011474609375, 158.57070922851562]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 12.0, 6.0, 7.0, 6.0, 12.0, 17.0, 19.0, 21.0, 18.0, 21.0, 24.0, 28.0, 25.0, 33.0, 41.0, 44.0, 40.0, 54.0, 52.0, 46.0, 31.0, 46.0, 48.0, 29.0, 42.0, 33.0, 41.0, 40.0, 29.0, 20.0, 23.0, 24.0, 13.0, 13.0, 11.0, 9.0, 10.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.800262451171875, -19.150474548339844, -18.50068473815918, -17.85089683532715, -17.201108932495117, -16.551321029663086, -15.901531219482422, -15.25174331665039, -14.60195541381836, -13.952166557312012, -13.30237865447998, -12.652589797973633, -12.002801895141602, -11.353013038635254, -10.703224182128906, -10.053436279296875, -9.403647422790527, -8.75385856628418, -8.104070663452148, -7.454281806945801, -6.8044939041137695, -6.154705047607422, -5.504916667938232, -4.855128288269043, -4.2053399085998535, -3.555551528930664, -2.9057631492614746, -2.255974531173706, -1.6061861515045166, -0.9563977718353271, -0.3066091537475586, 0.34317922592163086, 0.9929676055908203, 1.6427559852600098, 2.292544364929199, 2.9423329830169678, 3.5921213626861572, 4.241909980773926, 4.891698360443115, 5.541486740112305, 6.191275119781494, 6.841063499450684, 7.490851879119873, 8.140640258789062, 8.79042911529541, 9.440217018127441, 10.090005874633789, 10.73979377746582, 11.389582633972168, 12.039371490478516, 12.689159393310547, 13.338948249816895, 13.988736152648926, 14.638525009155273, 15.288312911987305, 15.938101768493652, 16.587890625, 17.23767852783203, 17.887468338012695, 18.537256240844727, 19.187044143676758, 19.83683204650879, 20.486621856689453, 21.136409759521484, 21.786197662353516]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 4.0, 10.0, 5.0, 12.0, 13.0, 11.0, 11.0, 16.0, 19.0, 27.0, 33.0, 27.0, 35.0, 37.0, 37.0, 34.0, 30.0, 36.0, 45.0, 54.0, 48.0, 40.0, 32.0, 36.0, 27.0, 39.0, 34.0, 22.0, 35.0, 31.0, 17.0, 21.0, 22.0, 15.0, 9.0, 16.0, 4.0, 7.0, 6.0, 8.0, 7.0, 7.0, 3.0, 5.0, 2.0, 1.0, 4.0, 4.0], "bins": [-4.0234375, -3.911712646484375, -3.79998779296875, -3.688262939453125, -3.5765380859375, -3.464813232421875, -3.35308837890625, -3.241363525390625, -3.129638671875, -3.017913818359375, -2.90618896484375, -2.794464111328125, -2.6827392578125, -2.571014404296875, -2.45928955078125, -2.347564697265625, -2.23583984375, -2.124114990234375, -2.01239013671875, -1.900665283203125, -1.7889404296875, -1.677215576171875, -1.56549072265625, -1.453765869140625, -1.342041015625, -1.230316162109375, -1.11859130859375, -1.006866455078125, -0.8951416015625, -0.783416748046875, -0.67169189453125, -0.559967041015625, -0.4482421875, -0.336517333984375, -0.22479248046875, -0.113067626953125, -0.0013427734375, 0.110382080078125, 0.22210693359375, 0.333831787109375, 0.445556640625, 0.557281494140625, 0.66900634765625, 0.780731201171875, 0.8924560546875, 1.004180908203125, 1.11590576171875, 1.227630615234375, 1.33935546875, 1.451080322265625, 1.56280517578125, 1.674530029296875, 1.7862548828125, 1.897979736328125, 2.00970458984375, 2.121429443359375, 2.233154296875, 2.344879150390625, 2.45660400390625, 2.568328857421875, 2.6800537109375, 2.791778564453125, 2.90350341796875, 3.015228271484375, 3.126953125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 5.0, 10.0, 19.0, 22.0, 32.0, 64.0, 80.0, 140.0, 183.0, 308.0, 525.0, 741.0, 1095.0, 1738.0, 2632.0, 3877.0, 6229.0, 9739.0, 15858.0, 26695.0, 45513.0, 81189.0, 155089.0, 356711.0, 148802.0, 78270.0, 44492.0, 26026.0, 15806.0, 9452.0, 6052.0, 3834.0, 2561.0, 1624.0, 1043.0, 697.0, 490.0, 278.0, 214.0, 126.0, 99.0, 62.0, 40.0, 32.0, 15.0, 12.0, 15.0, 5.0, 1.0, 3.0, 5.0, 2.0], "bins": [-0.195068359375, -0.18956947326660156, -0.18407058715820312, -0.1785717010498047, -0.17307281494140625, -0.1675739288330078, -0.16207504272460938, -0.15657615661621094, -0.1510772705078125, -0.14557838439941406, -0.14007949829101562, -0.1345806121826172, -0.12908172607421875, -0.12358283996582031, -0.11808395385742188, -0.11258506774902344, -0.107086181640625, -0.10158729553222656, -0.09608840942382812, -0.09058952331542969, -0.08509063720703125, -0.07959175109863281, -0.07409286499023438, -0.06859397888183594, -0.0630950927734375, -0.05759620666503906, -0.052097320556640625, -0.04659843444824219, -0.04109954833984375, -0.03560066223144531, -0.030101776123046875, -0.024602890014648438, -0.01910400390625, -0.013605117797851562, -0.008106231689453125, -0.0026073455810546875, 0.00289154052734375, 0.008390426635742188, 0.013889312744140625, 0.019388198852539062, 0.0248870849609375, 0.030385971069335938, 0.035884857177734375, 0.04138374328613281, 0.04688262939453125, 0.05238151550292969, 0.057880401611328125, 0.06337928771972656, 0.068878173828125, 0.07437705993652344, 0.07987594604492188, 0.08537483215332031, 0.09087371826171875, 0.09637260437011719, 0.10187149047851562, 0.10737037658691406, 0.1128692626953125, 0.11836814880371094, 0.12386703491210938, 0.1293659210205078, 0.13486480712890625, 0.1403636932373047, 0.14586257934570312, 0.15136146545410156, 0.1568603515625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 3.0, 2.0, 13.0, 13.0, 8.0, 10.0, 10.0, 7.0, 16.0, 14.0, 21.0, 20.0, 19.0, 30.0, 26.0, 32.0, 28.0, 37.0, 31.0, 37.0, 39.0, 48.0, 1059.0, 31.0, 49.0, 43.0, 40.0, 44.0, 21.0, 29.0, 38.0, 27.0, 23.0, 16.0, 22.0, 14.0, 17.0, 18.0, 14.0, 11.0, 4.0, 7.0, 9.0, 4.0, 3.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.4375, -2.3553466796875, -2.273193359375, -2.1910400390625, -2.10888671875, -2.0267333984375, -1.944580078125, -1.8624267578125, -1.7802734375, -1.6981201171875, -1.615966796875, -1.5338134765625, -1.45166015625, -1.3695068359375, -1.287353515625, -1.2052001953125, -1.123046875, -1.0408935546875, -0.958740234375, -0.8765869140625, -0.79443359375, -0.7122802734375, -0.630126953125, -0.5479736328125, -0.4658203125, -0.3836669921875, -0.301513671875, -0.2193603515625, -0.13720703125, -0.0550537109375, 0.027099609375, 0.1092529296875, 0.19140625, 0.2735595703125, 0.355712890625, 0.4378662109375, 0.52001953125, 0.6021728515625, 0.684326171875, 0.7664794921875, 0.8486328125, 0.9307861328125, 1.012939453125, 1.0950927734375, 1.17724609375, 1.2593994140625, 1.341552734375, 1.4237060546875, 1.505859375, 1.5880126953125, 1.670166015625, 1.7523193359375, 1.83447265625, 1.9166259765625, 1.998779296875, 2.0809326171875, 2.1630859375, 2.2452392578125, 2.327392578125, 2.4095458984375, 2.49169921875, 2.5738525390625, 2.656005859375, 2.7381591796875, 2.8203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 11.0, 17.0, 29.0, 33.0, 63.0, 99.0, 147.0, 226.0, 317.0, 526.0, 652.0, 1015.0, 1362.0, 2023.0, 2812.0, 4026.0, 5773.0, 8434.0, 11640.0, 17348.0, 25645.0, 39817.0, 63868.0, 112640.0, 1317746.0, 210712.0, 99598.0, 57886.0, 36423.0, 23782.0, 16019.0, 11127.0, 7396.0, 5399.0, 3875.0, 2602.0, 1928.0, 1261.0, 901.0, 619.0, 409.0, 290.0, 207.0, 153.0, 88.0, 65.0, 41.0, 30.0, 16.0, 14.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.08123779296875, -0.07876873016357422, -0.07629966735839844, -0.07383060455322266, -0.07136154174804688, -0.0688924789428711, -0.06642341613769531, -0.06395435333251953, -0.06148529052734375, -0.05901622772216797, -0.05654716491699219, -0.054078102111816406, -0.051609039306640625, -0.049139976501464844, -0.04667091369628906, -0.04420185089111328, -0.0417327880859375, -0.03926372528076172, -0.03679466247558594, -0.034325599670410156, -0.031856536865234375, -0.029387474060058594, -0.026918411254882812, -0.02444934844970703, -0.02198028564453125, -0.01951122283935547, -0.017042160034179688, -0.014573097229003906, -0.012104034423828125, -0.009634971618652344, -0.0071659088134765625, -0.004696846008300781, -0.002227783203125, 0.00024127960205078125, 0.0027103424072265625, 0.005179405212402344, 0.007648468017578125, 0.010117530822753906, 0.012586593627929688, 0.015055656433105469, 0.01752471923828125, 0.01999378204345703, 0.022462844848632812, 0.024931907653808594, 0.027400970458984375, 0.029870033264160156, 0.03233909606933594, 0.03480815887451172, 0.0372772216796875, 0.03974628448486328, 0.04221534729003906, 0.044684410095214844, 0.047153472900390625, 0.049622535705566406, 0.05209159851074219, 0.05456066131591797, 0.05702972412109375, 0.05949878692626953, 0.06196784973144531, 0.0644369125366211, 0.06690597534179688, 0.06937503814697266, 0.07184410095214844, 0.07431316375732422, 0.0767822265625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 9.0, 5.0, 11.0, 9.0, 18.0, 10.0, 7.0, 24.0, 39.0, 23.0, 54.0, 101.0, 73.0, 279.0, 49.0, 81.0, 56.0, 26.0, 43.0, 20.0, 9.0, 12.0, 13.0, 2.0, 8.0, 10.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.635883331298828e-06, -3.538094460964203e-06, -3.4403055906295776e-06, -3.3425167202949524e-06, -3.244727849960327e-06, -3.146938979625702e-06, -3.0491501092910767e-06, -2.9513612389564514e-06, -2.853572368621826e-06, -2.755783498287201e-06, -2.6579946279525757e-06, -2.5602057576179504e-06, -2.462416887283325e-06, -2.3646280169487e-06, -2.2668391466140747e-06, -2.1690502762794495e-06, -2.0712614059448242e-06, -1.973472535610199e-06, -1.8756836652755737e-06, -1.7778947949409485e-06, -1.6801059246063232e-06, -1.582317054271698e-06, -1.4845281839370728e-06, -1.3867393136024475e-06, -1.2889504432678223e-06, -1.191161572933197e-06, -1.0933727025985718e-06, -9.955838322639465e-07, -8.977949619293213e-07, -8.00006091594696e-07, -7.022172212600708e-07, -6.044283509254456e-07, -5.066394805908203e-07, -4.0885061025619507e-07, -3.110617399215698e-07, -2.1327286958694458e-07, -1.1548399925231934e-07, -1.7695128917694092e-08, 8.009374141693115e-08, 1.778826117515564e-07, 2.7567148208618164e-07, 3.734603524208069e-07, 4.7124922275543213e-07, 5.690380930900574e-07, 6.668269634246826e-07, 7.646158337593079e-07, 8.624047040939331e-07, 9.601935744285583e-07, 1.0579824447631836e-06, 1.1557713150978088e-06, 1.253560185432434e-06, 1.3513490557670593e-06, 1.4491379261016846e-06, 1.5469267964363098e-06, 1.644715666770935e-06, 1.7425045371055603e-06, 1.8402934074401855e-06, 1.938082277774811e-06, 2.035871148109436e-06, 2.1336600184440613e-06, 2.2314488887786865e-06, 2.3292377591133118e-06, 2.427026629447937e-06, 2.5248154997825623e-06, 2.6226043701171875e-06]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 7.0, 6.0, 6.0, 13.0, 12.0, 20.0, 29.0, 49.0, 96.0, 122.0, 269.0, 1234.0, 943055.0, 102459.0, 646.0, 215.0, 106.0, 63.0, 39.0, 19.0, 15.0, 12.0, 19.0, 9.0, 9.0, 6.0, 8.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6803226470947266e-05, -5.46872615814209e-05, -5.257129669189453e-05, -5.0455331802368164e-05, -4.83393669128418e-05, -4.622340202331543e-05, -4.410743713378906e-05, -4.1991472244262695e-05, -3.987550735473633e-05, -3.775954246520996e-05, -3.5643577575683594e-05, -3.3527612686157227e-05, -3.141164779663086e-05, -2.9295682907104492e-05, -2.7179718017578125e-05, -2.5063753128051758e-05, -2.294778823852539e-05, -2.0831823348999023e-05, -1.8715858459472656e-05, -1.659989356994629e-05, -1.4483928680419922e-05, -1.2367963790893555e-05, -1.0251998901367188e-05, -8.13603401184082e-06, -6.020069122314453e-06, -3.904104232788086e-06, -1.7881393432617188e-06, 3.2782554626464844e-07, 2.4437904357910156e-06, 4.559755325317383e-06, 6.67572021484375e-06, 8.791685104370117e-06, 1.0907649993896484e-05, 1.3023614883422852e-05, 1.5139579772949219e-05, 1.7255544662475586e-05, 1.9371509552001953e-05, 2.148747444152832e-05, 2.3603439331054688e-05, 2.5719404220581055e-05, 2.7835369110107422e-05, 2.995133399963379e-05, 3.2067298889160156e-05, 3.4183263778686523e-05, 3.629922866821289e-05, 3.841519355773926e-05, 4.0531158447265625e-05, 4.264712333679199e-05, 4.476308822631836e-05, 4.6879053115844727e-05, 4.8995018005371094e-05, 5.111098289489746e-05, 5.322694778442383e-05, 5.5342912673950195e-05, 5.745887756347656e-05, 5.957484245300293e-05, 6.16908073425293e-05, 6.380677223205566e-05, 6.592273712158203e-05, 6.80387020111084e-05, 7.015466690063477e-05, 7.227063179016113e-05, 7.43865966796875e-05, 7.650256156921387e-05, 7.861852645874023e-05]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 19.0, 66.0, 217.0, 396.0, 217.0, 57.0, 23.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2027502281125635e-06, -6.07735819357913e-06, -5.951965704298345e-06, -5.826573669764912e-06, -5.701181180484127e-06, -5.575789145950694e-06, -5.450396656669909e-06, -5.3250046221364755e-06, -5.199612132855691e-06, -5.074220098322257e-06, -4.948827609041473e-06, -4.823435574508039e-06, -4.698043085227255e-06, -4.572651050693821e-06, -4.447258561413037e-06, -4.321866526879603e-06, -4.1964740375988185e-06, -4.071082003065385e-06, -3.9456895137846e-06, -3.820297479251167e-06, -3.6949049899703823e-06, -3.5695127280632732e-06, -3.444120466156164e-06, -3.3187284316227306e-06, -3.193336397089297e-06, -3.067944135182188e-06, -2.942551873275079e-06, -2.8171596113679698e-06, -2.6917673494608607e-06, -2.5663750875537517e-06, -2.4409828256466426e-06, -2.315590791113209e-06, -2.1901987565797754e-06, -2.0648064946726663e-06, -1.9394142327655572e-06, -1.8140219708584482e-06, -1.6886297089513391e-06, -1.56323744704423e-06, -1.4378452988239587e-06, -1.3124530369168497e-06, -1.1870606613229029e-06, -1.0616683994157938e-06, -9.362761375086848e-07, -8.108839324449946e-07, -6.854916705378855e-07, -5.600994086307765e-07, -4.3470720356708625e-07, -3.093149416599772e-07, -1.8392267975286813e-07, -5.853043205661379e-08, 6.686181563964055e-08, 1.9225404912504018e-07, 3.1764631103214924e-07, 4.430385729392583e-07, 5.684307780029485e-07, 6.938230399100576e-07, 8.192153018171666e-07, 9.446075637242757e-07, 1.0699998256313847e-06, 1.1953920875384938e-06, 1.3207843494456029e-06, 1.446176611352712e-06, 1.5715687595729833e-06, 1.6969610214800923e-06, 1.8223532833872014e-06]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 0.0, 6.0, 7.0, 0.0, 8.0, 8.0, 0.0, 12.0, 18.0, 0.0, 23.0, 22.0, 0.0, 28.0, 42.0, 0.0, 60.0, 59.0, 0.0, 73.0, 83.0, 0.0, 97.0, 80.0, 0.0, 67.0, 54.0, 0.0, 54.0, 47.0, 0.0, 32.0, 16.0, 0.0, 29.0, 23.0, 0.0, 18.0, 11.0, 0.0, 14.0, 3.0, 0.0, 4.0, 3.0, 0.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2116506695747375e-06, -1.171603798866272e-06, -1.1315569281578064e-06, -1.0915100574493408e-06, -1.0514631867408752e-06, -1.0114163160324097e-06, -9.71369445323944e-07, -9.313225746154785e-07, -8.912757039070129e-07, -8.512288331985474e-07, -8.111819624900818e-07, -7.711350917816162e-07, -7.310882210731506e-07, -6.910413503646851e-07, -6.509944796562195e-07, -6.109476089477539e-07, -5.709007382392883e-07, -5.308538675308228e-07, -4.908069968223572e-07, -4.507601261138916e-07, -4.10713255405426e-07, -3.7066638469696045e-07, -3.3061951398849487e-07, -2.905726432800293e-07, -2.505257725715637e-07, -2.1047890186309814e-07, -1.7043203115463257e-07, -1.30385160446167e-07, -9.033828973770142e-08, -5.029141902923584e-08, -1.0244548320770264e-08, 2.9802322387695312e-08, 6.984919309616089e-08, 1.0989606380462646e-07, 1.4994293451309204e-07, 1.8998980522155762e-07, 2.300366759300232e-07, 2.7008354663848877e-07, 3.1013041734695435e-07, 3.501772880554199e-07, 3.902241587638855e-07, 4.302710294723511e-07, 4.7031790018081665e-07, 5.103647708892822e-07, 5.504116415977478e-07, 5.904585123062134e-07, 6.30505383014679e-07, 6.705522537231445e-07, 7.105991244316101e-07, 7.506459951400757e-07, 7.906928658485413e-07, 8.307397365570068e-07, 8.707866072654724e-07, 9.10833477973938e-07, 9.508803486824036e-07, 9.909272193908691e-07, 1.0309740900993347e-06, 1.0710209608078003e-06, 1.1110678315162659e-06, 1.1511147022247314e-06, 1.191161572933197e-06, 1.2312084436416626e-06, 1.2712553143501282e-06, 1.3113021850585938e-06]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 4.0, 10.0, 5.0, 12.0, 13.0, 11.0, 11.0, 16.0, 19.0, 27.0, 33.0, 27.0, 35.0, 37.0, 37.0, 34.0, 30.0, 36.0, 45.0, 54.0, 48.0, 40.0, 32.0, 36.0, 27.0, 39.0, 34.0, 22.0, 35.0, 31.0, 17.0, 21.0, 22.0, 15.0, 9.0, 16.0, 4.0, 7.0, 6.0, 8.0, 7.0, 7.0, 3.0, 5.0, 2.0, 1.0, 4.0, 4.0], "bins": [-4.0234375, -3.911712646484375, -3.79998779296875, -3.688262939453125, -3.5765380859375, -3.464813232421875, -3.35308837890625, -3.241363525390625, -3.129638671875, -3.017913818359375, -2.90618896484375, -2.794464111328125, -2.6827392578125, -2.571014404296875, -2.45928955078125, -2.347564697265625, -2.23583984375, -2.124114990234375, -2.01239013671875, -1.900665283203125, -1.7889404296875, -1.677215576171875, -1.56549072265625, -1.453765869140625, -1.342041015625, -1.230316162109375, -1.11859130859375, -1.006866455078125, -0.8951416015625, -0.783416748046875, -0.67169189453125, -0.559967041015625, -0.4482421875, -0.336517333984375, -0.22479248046875, -0.113067626953125, -0.0013427734375, 0.110382080078125, 0.22210693359375, 0.333831787109375, 0.445556640625, 0.557281494140625, 0.66900634765625, 0.780731201171875, 0.8924560546875, 1.004180908203125, 1.11590576171875, 1.227630615234375, 1.33935546875, 1.451080322265625, 1.56280517578125, 1.674530029296875, 1.7862548828125, 1.897979736328125, 2.00970458984375, 2.121429443359375, 2.233154296875, 2.344879150390625, 2.45660400390625, 2.568328857421875, 2.6800537109375, 2.791778564453125, 2.90350341796875, 3.015228271484375, 3.126953125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 3.0, 7.0, 9.0, 6.0, 9.0, 12.0, 21.0, 19.0, 29.0, 43.0, 57.0, 99.0, 165.0, 234.0, 532.0, 935.0, 1763.0, 3297.0, 6138.0, 11366.0, 23861.0, 54550.0, 132031.0, 280638.0, 288268.0, 137476.0, 56802.0, 24658.0, 11951.0, 6273.0, 3355.0, 1708.0, 926.0, 535.0, 288.0, 167.0, 77.0, 52.0, 40.0, 29.0, 30.0, 21.0, 15.0, 14.0, 11.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-5.11328125, -4.95843505859375, -4.8035888671875, -4.64874267578125, -4.493896484375, -4.33905029296875, -4.1842041015625, -4.02935791015625, -3.87451171875, -3.71966552734375, -3.5648193359375, -3.40997314453125, -3.255126953125, -3.10028076171875, -2.9454345703125, -2.79058837890625, -2.6357421875, -2.48089599609375, -2.3260498046875, -2.17120361328125, -2.016357421875, -1.86151123046875, -1.7066650390625, -1.55181884765625, -1.39697265625, -1.24212646484375, -1.0872802734375, -0.93243408203125, -0.777587890625, -0.62274169921875, -0.4678955078125, -0.31304931640625, -0.158203125, -0.00335693359375, 0.1514892578125, 0.30633544921875, 0.461181640625, 0.61602783203125, 0.7708740234375, 0.92572021484375, 1.08056640625, 1.23541259765625, 1.3902587890625, 1.54510498046875, 1.699951171875, 1.85479736328125, 2.0096435546875, 2.16448974609375, 2.3193359375, 2.47418212890625, 2.6290283203125, 2.78387451171875, 2.938720703125, 3.09356689453125, 3.2484130859375, 3.40325927734375, 3.55810546875, 3.71295166015625, 3.8677978515625, 4.02264404296875, 4.177490234375, 4.33233642578125, 4.4871826171875, 4.64202880859375, 4.796875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 4.0, 3.0, 7.0, 13.0, 8.0, 7.0, 15.0, 16.0, 15.0, 20.0, 24.0, 18.0, 24.0, 35.0, 39.0, 39.0, 31.0, 60.0, 80.0, 160.0, 243.0, 1391.0, 229.0, 114.0, 73.0, 55.0, 44.0, 38.0, 42.0, 33.0, 27.0, 25.0, 15.0, 27.0, 11.0, 11.0, 10.0, 5.0, 8.0, 5.0, 8.0, 6.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.28125, -11.8912353515625, -11.501220703125, -11.1112060546875, -10.72119140625, -10.3311767578125, -9.941162109375, -9.5511474609375, -9.1611328125, -8.7711181640625, -8.381103515625, -7.9910888671875, -7.60107421875, -7.2110595703125, -6.821044921875, -6.4310302734375, -6.041015625, -5.6510009765625, -5.260986328125, -4.8709716796875, -4.48095703125, -4.0909423828125, -3.700927734375, -3.3109130859375, -2.9208984375, -2.5308837890625, -2.140869140625, -1.7508544921875, -1.36083984375, -0.9708251953125, -0.580810546875, -0.1907958984375, 0.19921875, 0.5892333984375, 0.979248046875, 1.3692626953125, 1.75927734375, 2.1492919921875, 2.539306640625, 2.9293212890625, 3.3193359375, 3.7093505859375, 4.099365234375, 4.4893798828125, 4.87939453125, 5.2694091796875, 5.659423828125, 6.0494384765625, 6.439453125, 6.8294677734375, 7.219482421875, 7.6094970703125, 7.99951171875, 8.3895263671875, 8.779541015625, 9.1695556640625, 9.5595703125, 9.9495849609375, 10.339599609375, 10.7296142578125, 11.11962890625, 11.5096435546875, 11.899658203125, 12.2896728515625, 12.6796875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 10.0, 9.0, 7.0, 12.0, 13.0, 22.0, 25.0, 28.0, 46.0, 53.0, 55.0, 75.0, 123.0, 166.0, 319.0, 605.0, 1951.0, 10109.0, 98246.0, 2349596.0, 645430.0, 31861.0, 4540.0, 1104.0, 424.0, 227.0, 155.0, 107.0, 82.0, 55.0, 42.0, 28.0, 35.0, 18.0, 22.0, 17.0, 19.0, 6.0, 5.0, 13.0, 11.0, 5.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-16.5625, -16.041259765625, -15.52001953125, -14.998779296875, -14.4775390625, -13.956298828125, -13.43505859375, -12.913818359375, -12.392578125, -11.871337890625, -11.35009765625, -10.828857421875, -10.3076171875, -9.786376953125, -9.26513671875, -8.743896484375, -8.22265625, -7.701416015625, -7.18017578125, -6.658935546875, -6.1376953125, -5.616455078125, -5.09521484375, -4.573974609375, -4.052734375, -3.531494140625, -3.01025390625, -2.489013671875, -1.9677734375, -1.446533203125, -0.92529296875, -0.404052734375, 0.1171875, 0.638427734375, 1.15966796875, 1.680908203125, 2.2021484375, 2.723388671875, 3.24462890625, 3.765869140625, 4.287109375, 4.808349609375, 5.32958984375, 5.850830078125, 6.3720703125, 6.893310546875, 7.41455078125, 7.935791015625, 8.45703125, 8.978271484375, 9.49951171875, 10.020751953125, 10.5419921875, 11.063232421875, 11.58447265625, 12.105712890625, 12.626953125, 13.148193359375, 13.66943359375, 14.190673828125, 14.7119140625, 15.233154296875, 15.75439453125, 16.275634765625, 16.796875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [11.0, 98.0, 421.0, 387.0, 84.0, 16.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.581006050109863, -6.396378517150879, -3.2117505073547363, -0.02712249755859375, 3.1575050354003906, 6.342132568359375, 9.526761054992676, 12.71138858795166, 15.896016120910645, 19.080644607543945, 22.26527214050293, 25.449899673461914, 28.6345272064209, 31.819154739379883, 35.0037841796875, 38.188411712646484, 41.37303924560547, 44.55766677856445, 47.74229431152344, 50.92692184448242, 54.111549377441406, 57.29617691040039, 60.480804443359375, 63.665435791015625, 66.85005950927734, 70.0346908569336, 73.21931457519531, 76.40394592285156, 79.58856964111328, 82.77320098876953, 85.95782470703125, 89.1424560546875, 92.32707977294922, 95.51171112060547, 98.69633483886719, 101.88096618652344, 105.06558990478516, 108.2502212524414, 111.43484497070312, 114.61947631835938, 117.8041000366211, 120.98873138427734, 124.17335510253906, 127.35798645019531, 130.54261779785156, 133.72723388671875, 136.911865234375, 140.09649658203125, 143.2811279296875, 146.46575927734375, 149.650390625, 152.8350067138672, 156.01963806152344, 159.2042694091797, 162.38890075683594, 165.57351684570312, 168.75814819335938, 171.94277954101562, 175.12741088867188, 178.31202697753906, 181.4966583251953, 184.68128967285156, 187.8659210205078, 191.050537109375, 194.23516845703125]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 4.0, 7.0, 9.0, 13.0, 23.0, 22.0, 23.0, 19.0, 23.0, 27.0, 30.0, 39.0, 39.0, 24.0, 49.0, 37.0, 42.0, 44.0, 51.0, 43.0, 35.0, 47.0, 33.0, 30.0, 31.0, 29.0, 33.0, 29.0, 17.0, 32.0, 18.0, 20.0, 12.0, 11.0, 11.0, 8.0, 8.0, 2.0, 4.0, 3.0, 5.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-35.528907775878906, -34.39859390258789, -33.268280029296875, -32.137962341308594, -31.00765037536621, -29.877334594726562, -28.747020721435547, -27.61670684814453, -26.486392974853516, -25.3560791015625, -24.22576332092285, -23.095449447631836, -21.96513557434082, -20.834819793701172, -19.704505920410156, -18.57419204711914, -17.443876266479492, -16.313562393188477, -15.183247566223145, -14.052932739257812, -12.922618865966797, -11.792304039001465, -10.661989212036133, -9.531675338745117, -8.401360511779785, -7.271046161651611, -6.1407318115234375, -5.0104169845581055, -3.8801026344299316, -2.749788284301758, -1.6194734573364258, -0.48915910720825195, 0.6411552429199219, 1.7714697122573853, 2.9017841815948486, 4.032098770141602, 5.162413120269775, 6.292727470397949, 7.423042297363281, 8.553356170654297, 9.683670997619629, 10.813985824584961, 11.944299697875977, 13.074614524841309, 14.20492935180664, 15.335243225097656, 16.465557098388672, 17.59587287902832, 18.726186752319336, 19.85650062561035, 20.98681640625, 22.117130279541016, 23.24744415283203, 24.377758026123047, 25.508073806762695, 26.63838768005371, 27.76870346069336, 28.899017333984375, 30.029333114624023, 31.15964698791504, 32.28996276855469, 33.4202766418457, 34.55059051513672, 35.680904388427734, 36.81121826171875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 10.0, 12.0, 8.0, 15.0, 21.0, 15.0, 11.0, 34.0, 33.0, 37.0, 32.0, 22.0, 41.0, 27.0, 41.0, 41.0, 42.0, 45.0, 43.0, 53.0, 28.0, 38.0, 35.0, 37.0, 26.0, 30.0, 31.0, 22.0, 13.0, 33.0, 13.0, 17.0, 18.0, 4.0, 9.0, 13.0, 6.0, 5.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-4.265625, -4.14398193359375, -4.0223388671875, -3.90069580078125, -3.779052734375, -3.65740966796875, -3.5357666015625, -3.41412353515625, -3.29248046875, -3.17083740234375, -3.0491943359375, -2.92755126953125, -2.805908203125, -2.68426513671875, -2.5626220703125, -2.44097900390625, -2.3193359375, -2.19769287109375, -2.0760498046875, -1.95440673828125, -1.832763671875, -1.71112060546875, -1.5894775390625, -1.46783447265625, -1.34619140625, -1.22454833984375, -1.1029052734375, -0.98126220703125, -0.859619140625, -0.73797607421875, -0.6163330078125, -0.49468994140625, -0.373046875, -0.25140380859375, -0.1297607421875, -0.00811767578125, 0.113525390625, 0.23516845703125, 0.3568115234375, 0.47845458984375, 0.60009765625, 0.72174072265625, 0.8433837890625, 0.96502685546875, 1.086669921875, 1.20831298828125, 1.3299560546875, 1.45159912109375, 1.5732421875, 1.69488525390625, 1.8165283203125, 1.93817138671875, 2.059814453125, 2.18145751953125, 2.3031005859375, 2.42474365234375, 2.54638671875, 2.66802978515625, 2.7896728515625, 2.91131591796875, 3.032958984375, 3.15460205078125, 3.2762451171875, 3.39788818359375, 3.51953125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 9.0, 9.0, 7.0, 10.0, 6.0, 14.0, 15.0, 17.0, 26.0, 35.0, 66.0, 128.0, 282.0, 610.0, 1627.0, 4679.0, 14376.0, 48346.0, 182278.0, 702769.0, 1847594.0, 1018841.0, 270377.0, 71259.0, 20539.0, 6536.0, 2183.0, 856.0, 343.0, 169.0, 88.0, 45.0, 29.0, 22.0, 26.0, 18.0, 7.0, 13.0, 9.0, 4.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.10546875, -5.92401123046875, -5.7425537109375, -5.56109619140625, -5.379638671875, -5.19818115234375, -5.0167236328125, -4.83526611328125, -4.65380859375, -4.47235107421875, -4.2908935546875, -4.10943603515625, -3.927978515625, -3.74652099609375, -3.5650634765625, -3.38360595703125, -3.2021484375, -3.02069091796875, -2.8392333984375, -2.65777587890625, -2.476318359375, -2.29486083984375, -2.1134033203125, -1.93194580078125, -1.75048828125, -1.56903076171875, -1.3875732421875, -1.20611572265625, -1.024658203125, -0.84320068359375, -0.6617431640625, -0.48028564453125, -0.298828125, -0.11737060546875, 0.0640869140625, 0.24554443359375, 0.427001953125, 0.60845947265625, 0.7899169921875, 0.97137451171875, 1.15283203125, 1.33428955078125, 1.5157470703125, 1.69720458984375, 1.878662109375, 2.06011962890625, 2.2415771484375, 2.42303466796875, 2.6044921875, 2.78594970703125, 2.9674072265625, 3.14886474609375, 3.330322265625, 3.51177978515625, 3.6932373046875, 3.87469482421875, 4.05615234375, 4.23760986328125, 4.4190673828125, 4.60052490234375, 4.781982421875, 4.96343994140625, 5.1448974609375, 5.32635498046875, 5.5078125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 4.0, 7.0, 6.0, 16.0, 19.0, 36.0, 39.0, 71.0, 87.0, 150.0, 207.0, 293.0, 414.0, 541.0, 560.0, 486.0, 351.0, 294.0, 156.0, 97.0, 82.0, 49.0, 30.0, 24.0, 16.0, 13.0, 5.0, 9.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3203125, -6.0789794921875, -5.837646484375, -5.5963134765625, -5.35498046875, -5.1136474609375, -4.872314453125, -4.6309814453125, -4.3896484375, -4.1483154296875, -3.906982421875, -3.6656494140625, -3.42431640625, -3.1829833984375, -2.941650390625, -2.7003173828125, -2.458984375, -2.2176513671875, -1.976318359375, -1.7349853515625, -1.49365234375, -1.2523193359375, -1.010986328125, -0.7696533203125, -0.5283203125, -0.2869873046875, -0.045654296875, 0.1956787109375, 0.43701171875, 0.6783447265625, 0.919677734375, 1.1610107421875, 1.40234375, 1.6436767578125, 1.885009765625, 2.1263427734375, 2.36767578125, 2.6090087890625, 2.850341796875, 3.0916748046875, 3.3330078125, 3.5743408203125, 3.815673828125, 4.0570068359375, 4.29833984375, 4.5396728515625, 4.781005859375, 5.0223388671875, 5.263671875, 5.5050048828125, 5.746337890625, 5.9876708984375, 6.22900390625, 6.4703369140625, 6.711669921875, 6.9530029296875, 7.1943359375, 7.4356689453125, 7.677001953125, 7.9183349609375, 8.15966796875, 8.4010009765625, 8.642333984375, 8.8836669921875, 9.125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 8.0, 8.0, 21.0, 25.0, 34.0, 50.0, 93.0, 133.0, 220.0, 414.0, 905.0, 3533.0, 44253.0, 1317846.0, 2713932.0, 104273.0, 6188.0, 1153.0, 500.0, 243.0, 158.0, 102.0, 62.0, 40.0, 27.0, 16.0, 17.0, 9.0, 1.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.46875, -21.8795166015625, -21.290283203125, -20.7010498046875, -20.11181640625, -19.5225830078125, -18.933349609375, -18.3441162109375, -17.7548828125, -17.1656494140625, -16.576416015625, -15.9871826171875, -15.39794921875, -14.8087158203125, -14.219482421875, -13.6302490234375, -13.041015625, -12.4517822265625, -11.862548828125, -11.2733154296875, -10.68408203125, -10.0948486328125, -9.505615234375, -8.9163818359375, -8.3271484375, -7.7379150390625, -7.148681640625, -6.5594482421875, -5.97021484375, -5.3809814453125, -4.791748046875, -4.2025146484375, -3.61328125, -3.0240478515625, -2.434814453125, -1.8455810546875, -1.25634765625, -0.6671142578125, -0.077880859375, 0.5113525390625, 1.1005859375, 1.6898193359375, 2.279052734375, 2.8682861328125, 3.45751953125, 4.0467529296875, 4.635986328125, 5.2252197265625, 5.814453125, 6.4036865234375, 6.992919921875, 7.5821533203125, 8.17138671875, 8.7606201171875, 9.349853515625, 9.9390869140625, 10.5283203125, 11.1175537109375, 11.706787109375, 12.2960205078125, 12.88525390625, 13.4744873046875, 14.063720703125, 14.6529541015625, 15.2421875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 25.0, 96.0, 238.0, 276.0, 224.0, 109.0, 30.0, 10.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.45670700073242, -43.01179504394531, -40.5668830871582, -38.121971130371094, -35.67705535888672, -33.23214340209961, -30.7872314453125, -28.342317581176758, -25.89740562438965, -23.45249366760254, -21.007579803466797, -18.562667846679688, -16.117755889892578, -13.672842025756836, -11.227930068969727, -8.783016204833984, -6.338104248046875, -3.8931915760040283, -1.4482789039611816, 0.9966335296630859, 3.4415464401245117, 5.8864593505859375, 8.331371307373047, 10.776285171508789, 13.221197128295898, 15.666110038757324, 18.11102294921875, 20.55593490600586, 23.00084686279297, 25.44576072692871, 27.89067268371582, 30.335586547851562, 32.780494689941406, 35.225406646728516, 37.670318603515625, 40.115234375, 42.56014633178711, 45.00505828857422, 47.44997024536133, 49.89488220214844, 52.33979797363281, 54.78470993041992, 57.22962188720703, 59.674537658691406, 62.119449615478516, 64.56436157226562, 67.00927734375, 69.45418548583984, 71.89909362792969, 74.34400939941406, 76.7889175415039, 79.23383331298828, 81.67874145507812, 84.1236572265625, 86.56857299804688, 89.01348114013672, 91.4583969116211, 93.90331268310547, 96.34822082519531, 98.79313659667969, 101.23804473876953, 103.6829605102539, 106.12786865234375, 108.57278442382812, 111.0177001953125]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 1.0, 2.0, 4.0, 9.0, 9.0, 8.0, 10.0, 10.0, 9.0, 14.0, 9.0, 17.0, 14.0, 22.0, 30.0, 35.0, 28.0, 30.0, 32.0, 33.0, 36.0, 37.0, 38.0, 34.0, 33.0, 38.0, 45.0, 37.0, 40.0, 30.0, 36.0, 27.0, 20.0, 25.0, 21.0, 13.0, 27.0, 26.0, 21.0, 12.0, 15.0, 10.0, 10.0, 7.0, 11.0, 7.0, 6.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.797183990478516, -19.18671226501465, -18.576242446899414, -17.965770721435547, -17.35529899597168, -16.744827270507812, -16.134357452392578, -15.523885726928711, -14.913414001464844, -14.302943229675293, -13.692471504211426, -13.082000732421875, -12.471529006958008, -11.861058235168457, -11.250587463378906, -10.640115737915039, -10.029644966125488, -9.419174194335938, -8.80870246887207, -8.19823169708252, -7.587759971618652, -6.977289199829102, -6.366817951202393, -5.756346702575684, -5.145875453948975, -4.535404205322266, -3.9249329566955566, -3.3144619464874268, -2.7039906978607178, -2.093519449234009, -1.483048439025879, -0.8725771903991699, -0.26210594177246094, 0.34836524724960327, 0.9588364362716675, 1.569307565689087, 2.179778814315796, 2.790250062942505, 3.4007210731506348, 4.011192321777344, 4.621663570404053, 5.232134819030762, 5.842606067657471, 6.45307731628418, 7.0635480880737305, 7.674019813537598, 8.284490585327148, 8.894962310791016, 9.505433082580566, 10.115903854370117, 10.726375579833984, 11.336846351623535, 11.947318077087402, 12.557788848876953, 13.16826057434082, 13.778731346130371, 14.389202117919922, 14.999672889709473, 15.61014461517334, 16.22061538696289, 16.831087112426758, 17.441558837890625, 18.05202865600586, 18.662500381469727, 19.272972106933594]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 10.0, 11.0, 16.0, 16.0, 19.0, 22.0, 26.0, 32.0, 22.0, 38.0, 41.0, 39.0, 36.0, 31.0, 42.0, 51.0, 49.0, 43.0, 37.0, 30.0, 37.0, 33.0, 33.0, 35.0, 31.0, 33.0, 19.0, 22.0, 17.0, 15.0, 21.0, 15.0, 9.0, 8.0, 7.0, 6.0, 6.0, 4.0, 7.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.33203125, -4.207550048828125, -4.08306884765625, -3.958587646484375, -3.8341064453125, -3.709625244140625, -3.58514404296875, -3.460662841796875, -3.336181640625, -3.211700439453125, -3.08721923828125, -2.962738037109375, -2.8382568359375, -2.713775634765625, -2.58929443359375, -2.464813232421875, -2.34033203125, -2.215850830078125, -2.09136962890625, -1.966888427734375, -1.8424072265625, -1.717926025390625, -1.59344482421875, -1.468963623046875, -1.344482421875, -1.220001220703125, -1.09552001953125, -0.971038818359375, -0.8465576171875, -0.722076416015625, -0.59759521484375, -0.473114013671875, -0.3486328125, -0.224151611328125, -0.09967041015625, 0.024810791015625, 0.1492919921875, 0.273773193359375, 0.39825439453125, 0.522735595703125, 0.647216796875, 0.771697998046875, 0.89617919921875, 1.020660400390625, 1.1451416015625, 1.269622802734375, 1.39410400390625, 1.518585205078125, 1.64306640625, 1.767547607421875, 1.89202880859375, 2.016510009765625, 2.1409912109375, 2.265472412109375, 2.38995361328125, 2.514434814453125, 2.638916015625, 2.763397216796875, 2.88787841796875, 3.012359619140625, 3.1368408203125, 3.261322021484375, 3.38580322265625, 3.510284423828125, 3.634765625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 9.0, 7.0, 25.0, 35.0, 48.0, 92.0, 130.0, 216.0, 327.0, 511.0, 791.0, 1243.0, 1880.0, 3014.0, 4808.0, 7724.0, 12604.0, 21007.0, 35911.0, 64294.0, 123078.0, 349525.0, 204421.0, 92718.0, 50606.0, 28680.0, 17037.0, 10355.0, 6394.0, 4090.0, 2545.0, 1606.0, 1036.0, 656.0, 383.0, 262.0, 165.0, 109.0, 62.0, 53.0, 35.0, 18.0, 11.0, 14.0, 8.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.20654296875, -0.2006072998046875, -0.194671630859375, -0.1887359619140625, -0.18280029296875, -0.1768646240234375, -0.170928955078125, -0.1649932861328125, -0.1590576171875, -0.1531219482421875, -0.147186279296875, -0.1412506103515625, -0.13531494140625, -0.1293792724609375, -0.123443603515625, -0.1175079345703125, -0.111572265625, -0.1056365966796875, -0.099700927734375, -0.0937652587890625, -0.08782958984375, -0.0818939208984375, -0.075958251953125, -0.0700225830078125, -0.0640869140625, -0.0581512451171875, -0.052215576171875, -0.0462799072265625, -0.04034423828125, -0.0344085693359375, -0.028472900390625, -0.0225372314453125, -0.0166015625, -0.0106658935546875, -0.004730224609375, 0.0012054443359375, 0.00714111328125, 0.0130767822265625, 0.019012451171875, 0.0249481201171875, 0.0308837890625, 0.0368194580078125, 0.042755126953125, 0.0486907958984375, 0.05462646484375, 0.0605621337890625, 0.066497802734375, 0.0724334716796875, 0.078369140625, 0.0843048095703125, 0.090240478515625, 0.0961761474609375, 0.10211181640625, 0.1080474853515625, 0.113983154296875, 0.1199188232421875, 0.1258544921875, 0.1317901611328125, 0.137725830078125, 0.1436614990234375, 0.14959716796875, 0.1555328369140625, 0.161468505859375, 0.1674041748046875, 0.17333984375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 4.0, 14.0, 16.0, 15.0, 16.0, 19.0, 17.0, 28.0, 26.0, 21.0, 46.0, 28.0, 36.0, 30.0, 39.0, 42.0, 43.0, 42.0, 1065.0, 40.0, 53.0, 34.0, 37.0, 33.0, 31.0, 27.0, 26.0, 27.0, 23.0, 18.0, 24.0, 11.0, 15.0, 12.0, 9.0, 12.0, 9.0, 7.0, 4.0, 9.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.78125, -2.6929931640625, -2.604736328125, -2.5164794921875, -2.42822265625, -2.3399658203125, -2.251708984375, -2.1634521484375, -2.0751953125, -1.9869384765625, -1.898681640625, -1.8104248046875, -1.72216796875, -1.6339111328125, -1.545654296875, -1.4573974609375, -1.369140625, -1.2808837890625, -1.192626953125, -1.1043701171875, -1.01611328125, -0.9278564453125, -0.839599609375, -0.7513427734375, -0.6630859375, -0.5748291015625, -0.486572265625, -0.3983154296875, -0.31005859375, -0.2218017578125, -0.133544921875, -0.0452880859375, 0.04296875, 0.1312255859375, 0.219482421875, 0.3077392578125, 0.39599609375, 0.4842529296875, 0.572509765625, 0.6607666015625, 0.7490234375, 0.8372802734375, 0.925537109375, 1.0137939453125, 1.10205078125, 1.1903076171875, 1.278564453125, 1.3668212890625, 1.455078125, 1.5433349609375, 1.631591796875, 1.7198486328125, 1.80810546875, 1.8963623046875, 1.984619140625, 2.0728759765625, 2.1611328125, 2.2493896484375, 2.337646484375, 2.4259033203125, 2.51416015625, 2.6024169921875, 2.690673828125, 2.7789306640625, 2.8671875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 19.0, 23.0, 33.0, 47.0, 64.0, 97.0, 146.0, 201.0, 308.0, 472.0, 642.0, 955.0, 1507.0, 2073.0, 3018.0, 4486.0, 6296.0, 9379.0, 13904.0, 20435.0, 30686.0, 48242.0, 79338.0, 148734.0, 1357225.0, 147138.0, 79005.0, 48144.0, 30937.0, 20473.0, 13607.0, 9257.0, 6540.0, 4262.0, 2943.0, 2036.0, 1369.0, 988.0, 622.0, 491.0, 292.0, 229.0, 153.0, 88.0, 71.0, 52.0, 32.0, 23.0, 18.0, 11.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.0826416015625, -0.08009815216064453, -0.07755470275878906, -0.0750112533569336, -0.07246780395507812, -0.06992435455322266, -0.06738090515136719, -0.06483745574951172, -0.06229400634765625, -0.05975055694580078, -0.05720710754394531, -0.054663658142089844, -0.052120208740234375, -0.049576759338378906, -0.04703330993652344, -0.04448986053466797, -0.0419464111328125, -0.03940296173095703, -0.03685951232910156, -0.034316062927246094, -0.031772613525390625, -0.029229164123535156, -0.026685714721679688, -0.02414226531982422, -0.02159881591796875, -0.01905536651611328, -0.016511917114257812, -0.013968467712402344, -0.011425018310546875, -0.008881568908691406, -0.0063381195068359375, -0.0037946701049804688, -0.001251220703125, 0.0012922286987304688, 0.0038356781005859375, 0.006379127502441406, 0.008922576904296875, 0.011466026306152344, 0.014009475708007812, 0.01655292510986328, 0.01909637451171875, 0.02163982391357422, 0.024183273315429688, 0.026726722717285156, 0.029270172119140625, 0.031813621520996094, 0.03435707092285156, 0.03690052032470703, 0.0394439697265625, 0.04198741912841797, 0.04453086853027344, 0.047074317932128906, 0.049617767333984375, 0.052161216735839844, 0.05470466613769531, 0.05724811553955078, 0.05979156494140625, 0.06233501434326172, 0.06487846374511719, 0.06742191314697266, 0.06996536254882812, 0.0725088119506836, 0.07505226135253906, 0.07759571075439453, 0.08013916015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 1.0, 8.0, 7.0, 20.0, 8.0, 10.0, 13.0, 33.0, 20.0, 25.0, 20.0, 51.0, 38.0, 56.0, 62.0, 271.0, 37.0, 41.0, 35.0, 27.0, 34.0, 20.0, 17.0, 12.0, 26.0, 13.0, 11.0, 11.0, 8.0, 5.0, 6.0, 7.0, 8.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1457672119140625e-06, -2.0721927285194397e-06, -1.998618245124817e-06, -1.925043761730194e-06, -1.8514692783355713e-06, -1.7778947949409485e-06, -1.7043203115463257e-06, -1.6307458281517029e-06, -1.55717134475708e-06, -1.4835968613624573e-06, -1.4100223779678345e-06, -1.3364478945732117e-06, -1.2628734111785889e-06, -1.189298927783966e-06, -1.1157244443893433e-06, -1.0421499609947205e-06, -9.685754776000977e-07, -8.950009942054749e-07, -8.21426510810852e-07, -7.478520274162292e-07, -6.742775440216064e-07, -6.007030606269836e-07, -5.271285772323608e-07, -4.5355409383773804e-07, -3.7997961044311523e-07, -3.0640512704849243e-07, -2.3283064365386963e-07, -1.5925616025924683e-07, -8.568167686462402e-08, -1.210719347000122e-08, 6.146728992462158e-08, 1.3504177331924438e-07, 2.086162567138672e-07, 2.8219074010849e-07, 3.557652235031128e-07, 4.293397068977356e-07, 5.029141902923584e-07, 5.764886736869812e-07, 6.50063157081604e-07, 7.236376404762268e-07, 7.972121238708496e-07, 8.707866072654724e-07, 9.443610906600952e-07, 1.017935574054718e-06, 1.0915100574493408e-06, 1.1650845408439636e-06, 1.2386590242385864e-06, 1.3122335076332092e-06, 1.385807991027832e-06, 1.4593824744224548e-06, 1.5329569578170776e-06, 1.6065314412117004e-06, 1.6801059246063232e-06, 1.753680408000946e-06, 1.8272548913955688e-06, 1.9008293747901917e-06, 1.9744038581848145e-06, 2.0479783415794373e-06, 2.12155282497406e-06, 2.195127308368683e-06, 2.2687017917633057e-06, 2.3422762751579285e-06, 2.4158507585525513e-06, 2.489425241947174e-06, 2.562999725341797e-06]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 2.0, 9.0, 7.0, 7.0, 6.0, 21.0, 27.0, 18.0, 25.0, 39.0, 43.0, 73.0, 95.0, 191.0, 280.0, 865.0, 185019.0, 859306.0, 1621.0, 303.0, 163.0, 131.0, 54.0, 47.0, 38.0, 35.0, 18.0, 25.0, 13.0, 18.0, 7.0, 4.0, 1.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.716085433959961e-05, -5.553197115659714e-05, -5.3903087973594666e-05, -5.2274204790592194e-05, -5.064532160758972e-05, -4.901643842458725e-05, -4.738755524158478e-05, -4.5758672058582306e-05, -4.4129788875579834e-05, -4.250090569257736e-05, -4.087202250957489e-05, -3.924313932657242e-05, -3.7614256143569946e-05, -3.5985372960567474e-05, -3.4356489777565e-05, -3.272760659456253e-05, -3.109872341156006e-05, -2.9469840228557587e-05, -2.7840957045555115e-05, -2.6212073862552643e-05, -2.458319067955017e-05, -2.29543074965477e-05, -2.1325424313545227e-05, -1.9696541130542755e-05, -1.8067657947540283e-05, -1.643877476453781e-05, -1.480989158153534e-05, -1.3181008398532867e-05, -1.1552125215530396e-05, -9.923242032527924e-06, -8.294358849525452e-06, -6.66547566652298e-06, -5.036592483520508e-06, -3.407709300518036e-06, -1.778826117515564e-06, -1.4994293451309204e-07, 1.4789402484893799e-06, 3.107823431491852e-06, 4.736706614494324e-06, 6.365589797496796e-06, 7.994472980499268e-06, 9.62335616350174e-06, 1.1252239346504211e-05, 1.2881122529506683e-05, 1.4510005712509155e-05, 1.6138888895511627e-05, 1.77677720785141e-05, 1.939665526151657e-05, 2.1025538444519043e-05, 2.2654421627521515e-05, 2.4283304810523987e-05, 2.591218799352646e-05, 2.754107117652893e-05, 2.9169954359531403e-05, 3.0798837542533875e-05, 3.2427720725536346e-05, 3.405660390853882e-05, 3.568548709154129e-05, 3.731437027454376e-05, 3.8943253457546234e-05, 4.0572136640548706e-05, 4.220101982355118e-05, 4.382990300655365e-05, 4.545878618955612e-05, 4.7087669372558594e-05]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 25.0, 429.0, 537.0, 29.0], "bins": [-1.535175761091523e-05, -1.5104257727216464e-05, -1.4856757843517698e-05, -1.4609257959818933e-05, -1.4361758076120168e-05, -1.4114258192421403e-05, -1.3866758308722638e-05, -1.3619258425023872e-05, -1.3371758541325107e-05, -1.3124258657626342e-05, -1.2876758773927577e-05, -1.2629258890228812e-05, -1.2381759006530046e-05, -1.2134259122831281e-05, -1.1886759239132516e-05, -1.1639259355433751e-05, -1.1391759471734986e-05, -1.114425958803622e-05, -1.0896759704337455e-05, -1.064925982063869e-05, -1.0401759936939925e-05, -1.015426005324116e-05, -9.906760169542395e-06, -9.65926028584363e-06, -9.411759492650162e-06, -9.164259608951397e-06, -8.916759725252632e-06, -8.669259841553867e-06, -8.421759957855102e-06, -8.174260074156336e-06, -7.926760190457571e-06, -7.679260306758806e-06, -7.431760877807392e-06, -7.184260994108627e-06, -6.9367611104098614e-06, -6.689261226711096e-06, -6.441761343012331e-06, -6.194261459313566e-06, -5.94676112086745e-06, -5.699261237168685e-06, -5.45176180821727e-06, -5.204261924518505e-06, -4.95676204081974e-06, -4.709262157120975e-06, -4.4617622734222095e-06, -4.214262389723444e-06, -3.966762051277328e-06, -3.7192623949522385e-06, -3.471762283879798e-06, -3.2242624001810327e-06, -2.9767625164822675e-06, -2.7292626327835023e-06, -2.481762749084737e-06, -2.234262865385972e-06, -1.9867627543135313e-06, -1.7392628706147661e-06, -1.4917631006028387e-06, -1.2442632169040735e-06, -9.967632195184706e-07, -7.492633358197054e-07, -5.017634521209402e-07, -2.54263568422175e-07, -6.7635710365721025e-09, 2.407363126621931e-07, 4.882361963609583e-07]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 0.0, 9.0, 0.0, 11.0, 13.0, 0.0, 23.0, 24.0, 0.0, 38.0, 0.0, 52.0, 58.0, 0.0, 89.0, 0.0, 105.0, 130.0, 0.0, 118.0, 0.0, 79.0, 85.0, 0.0, 46.0, 0.0, 34.0, 23.0, 0.0, 29.0, 13.0, 0.0, 6.0, 0.0, 7.0, 10.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1557713150978088e-06, -1.1194497346878052e-06, -1.0831281542778015e-06, -1.0468065738677979e-06, -1.0104849934577942e-06, -9.741634130477905e-07, -9.378418326377869e-07, -9.015202522277832e-07, -8.651986718177795e-07, -8.288770914077759e-07, -7.925555109977722e-07, -7.562339305877686e-07, -7.199123501777649e-07, -6.835907697677612e-07, -6.472691893577576e-07, -6.109476089477539e-07, -5.746260285377502e-07, -5.383044481277466e-07, -5.019828677177429e-07, -4.6566128730773926e-07, -4.293397068977356e-07, -3.9301812648773193e-07, -3.5669654607772827e-07, -3.203749656677246e-07, -2.8405338525772095e-07, -2.477318048477173e-07, -2.1141022443771362e-07, -1.7508864402770996e-07, -1.387670636177063e-07, -1.0244548320770264e-07, -6.612390279769897e-08, -2.9802322387695312e-08, 6.51925802230835e-09, 4.284083843231201e-08, 7.916241884231567e-08, 1.1548399925231934e-07, 1.51805579662323e-07, 1.8812716007232666e-07, 2.2444874048233032e-07, 2.60770320892334e-07, 2.9709190130233765e-07, 3.334134817123413e-07, 3.6973506212234497e-07, 4.0605664253234863e-07, 4.423782229423523e-07, 4.78699803352356e-07, 5.150213837623596e-07, 5.513429641723633e-07, 5.876645445823669e-07, 6.239861249923706e-07, 6.603077054023743e-07, 6.966292858123779e-07, 7.329508662223816e-07, 7.692724466323853e-07, 8.055940270423889e-07, 8.419156074523926e-07, 8.782371878623962e-07, 9.145587682723999e-07, 9.508803486824036e-07, 9.872019290924072e-07, 1.0235235095024109e-06, 1.0598450899124146e-06, 1.0961666703224182e-06, 1.1324882507324219e-06]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 7.0, 10.0, 11.0, 16.0, 16.0, 19.0, 22.0, 26.0, 32.0, 22.0, 38.0, 41.0, 39.0, 36.0, 31.0, 42.0, 51.0, 49.0, 43.0, 37.0, 30.0, 37.0, 33.0, 33.0, 35.0, 31.0, 33.0, 19.0, 22.0, 17.0, 15.0, 21.0, 15.0, 9.0, 8.0, 7.0, 6.0, 6.0, 4.0, 7.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.33203125, -4.207550048828125, -4.08306884765625, -3.958587646484375, -3.8341064453125, -3.709625244140625, -3.58514404296875, -3.460662841796875, -3.336181640625, -3.211700439453125, -3.08721923828125, -2.962738037109375, -2.8382568359375, -2.713775634765625, -2.58929443359375, -2.464813232421875, -2.34033203125, -2.215850830078125, -2.09136962890625, -1.966888427734375, -1.8424072265625, -1.717926025390625, -1.59344482421875, -1.468963623046875, -1.344482421875, -1.220001220703125, -1.09552001953125, -0.971038818359375, -0.8465576171875, -0.722076416015625, -0.59759521484375, -0.473114013671875, -0.3486328125, -0.224151611328125, -0.09967041015625, 0.024810791015625, 0.1492919921875, 0.273773193359375, 0.39825439453125, 0.522735595703125, 0.647216796875, 0.771697998046875, 0.89617919921875, 1.020660400390625, 1.1451416015625, 1.269622802734375, 1.39410400390625, 1.518585205078125, 1.64306640625, 1.767547607421875, 1.89202880859375, 2.016510009765625, 2.1409912109375, 2.265472412109375, 2.38995361328125, 2.514434814453125, 2.638916015625, 2.763397216796875, 2.88787841796875, 3.012359619140625, 3.1368408203125, 3.261322021484375, 3.38580322265625, 3.510284423828125, 3.634765625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 5.0, 5.0, 9.0, 10.0, 16.0, 17.0, 21.0, 26.0, 37.0, 44.0, 59.0, 75.0, 120.0, 170.0, 307.0, 520.0, 1005.0, 1831.0, 3382.0, 6454.0, 12499.0, 26664.0, 65702.0, 252236.0, 486996.0, 113482.0, 40210.0, 17767.0, 8760.0, 4580.0, 2442.0, 1300.0, 723.0, 359.0, 187.0, 112.0, 88.0, 68.0, 60.0, 31.0, 40.0, 28.0, 22.0, 12.0, 17.0, 12.0, 12.0, 13.0, 8.0, 3.0, 6.0, 4.0, 1.0, 2.0], "bins": [-6.90234375, -6.70074462890625, -6.4991455078125, -6.29754638671875, -6.095947265625, -5.89434814453125, -5.6927490234375, -5.49114990234375, -5.28955078125, -5.08795166015625, -4.8863525390625, -4.68475341796875, -4.483154296875, -4.28155517578125, -4.0799560546875, -3.87835693359375, -3.6767578125, -3.47515869140625, -3.2735595703125, -3.07196044921875, -2.870361328125, -2.66876220703125, -2.4671630859375, -2.26556396484375, -2.06396484375, -1.86236572265625, -1.6607666015625, -1.45916748046875, -1.257568359375, -1.05596923828125, -0.8543701171875, -0.65277099609375, -0.451171875, -0.24957275390625, -0.0479736328125, 0.15362548828125, 0.355224609375, 0.55682373046875, 0.7584228515625, 0.96002197265625, 1.16162109375, 1.36322021484375, 1.5648193359375, 1.76641845703125, 1.968017578125, 2.16961669921875, 2.3712158203125, 2.57281494140625, 2.7744140625, 2.97601318359375, 3.1776123046875, 3.37921142578125, 3.580810546875, 3.78240966796875, 3.9840087890625, 4.18560791015625, 4.38720703125, 4.58880615234375, 4.7904052734375, 4.99200439453125, 5.193603515625, 5.39520263671875, 5.5968017578125, 5.79840087890625, 6.0]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 3.0, 3.0, 6.0, 6.0, 12.0, 12.0, 14.0, 11.0, 17.0, 13.0, 18.0, 16.0, 25.0, 24.0, 36.0, 37.0, 37.0, 42.0, 60.0, 65.0, 87.0, 203.0, 1413.0, 261.0, 128.0, 72.0, 64.0, 43.0, 44.0, 37.0, 26.0, 26.0, 32.0, 20.0, 17.0, 27.0, 9.0, 21.0, 6.0, 14.0, 10.0, 8.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2578125, -9.9127197265625, -9.567626953125, -9.2225341796875, -8.87744140625, -8.5323486328125, -8.187255859375, -7.8421630859375, -7.4970703125, -7.1519775390625, -6.806884765625, -6.4617919921875, -6.11669921875, -5.7716064453125, -5.426513671875, -5.0814208984375, -4.736328125, -4.3912353515625, -4.046142578125, -3.7010498046875, -3.35595703125, -3.0108642578125, -2.665771484375, -2.3206787109375, -1.9755859375, -1.6304931640625, -1.285400390625, -0.9403076171875, -0.59521484375, -0.2501220703125, 0.094970703125, 0.4400634765625, 0.78515625, 1.1302490234375, 1.475341796875, 1.8204345703125, 2.16552734375, 2.5106201171875, 2.855712890625, 3.2008056640625, 3.5458984375, 3.8909912109375, 4.236083984375, 4.5811767578125, 4.92626953125, 5.2713623046875, 5.616455078125, 5.9615478515625, 6.306640625, 6.6517333984375, 6.996826171875, 7.3419189453125, 7.68701171875, 8.0321044921875, 8.377197265625, 8.7222900390625, 9.0673828125, 9.4124755859375, 9.757568359375, 10.1026611328125, 10.44775390625, 10.7928466796875, 11.137939453125, 11.4830322265625, 11.828125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 7.0, 7.0, 9.0, 14.0, 14.0, 16.0, 22.0, 25.0, 28.0, 27.0, 38.0, 48.0, 72.0, 97.0, 161.0, 193.0, 301.0, 642.0, 2076.0, 9735.0, 66844.0, 2120473.0, 894012.0, 40770.0, 6914.0, 1635.0, 531.0, 268.0, 171.0, 116.0, 100.0, 69.0, 52.0, 43.0, 23.0, 15.0, 18.0, 21.0, 17.0, 19.0, 14.0, 9.0, 3.0, 8.0, 3.0, 4.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.8125, -16.3013916015625, -15.790283203125, -15.2791748046875, -14.76806640625, -14.2569580078125, -13.745849609375, -13.2347412109375, -12.7236328125, -12.2125244140625, -11.701416015625, -11.1903076171875, -10.67919921875, -10.1680908203125, -9.656982421875, -9.1458740234375, -8.634765625, -8.1236572265625, -7.612548828125, -7.1014404296875, -6.59033203125, -6.0792236328125, -5.568115234375, -5.0570068359375, -4.5458984375, -4.0347900390625, -3.523681640625, -3.0125732421875, -2.50146484375, -1.9903564453125, -1.479248046875, -0.9681396484375, -0.45703125, 0.0540771484375, 0.565185546875, 1.0762939453125, 1.58740234375, 2.0985107421875, 2.609619140625, 3.1207275390625, 3.6318359375, 4.1429443359375, 4.654052734375, 5.1651611328125, 5.67626953125, 6.1873779296875, 6.698486328125, 7.2095947265625, 7.720703125, 8.2318115234375, 8.742919921875, 9.2540283203125, 9.76513671875, 10.2762451171875, 10.787353515625, 11.2984619140625, 11.8095703125, 12.3206787109375, 12.831787109375, 13.3428955078125, 13.85400390625, 14.3651123046875, 14.876220703125, 15.3873291015625, 15.8984375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 14.0, 132.0, 414.0, 359.0, 88.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.984806060791016, -14.138572692871094, -11.292338371276855, -8.446104049682617, -5.599870681762695, -2.7536373138427734, 0.09259796142578125, 2.938831329345703, 5.785064697265625, 8.631298065185547, 11.477532386779785, 14.323766708374023, 17.170000076293945, 20.016233444213867, 22.862468719482422, 25.708702087402344, 28.554935455322266, 31.401168823242188, 34.24740219116211, 37.09363555908203, 39.93987274169922, 42.786102294921875, 45.63233947753906, 48.478572845458984, 51.324806213378906, 54.17103958129883, 57.01727294921875, 59.86351013183594, 62.709739685058594, 65.55597686767578, 68.40220642089844, 71.24844360351562, 74.09468078613281, 76.94091796875, 79.78714752197266, 82.63338470458984, 85.4796142578125, 88.32585144042969, 91.17208862304688, 94.01831817626953, 96.86454772949219, 99.71078491210938, 102.55701446533203, 105.40325164794922, 108.24948120117188, 111.09571838378906, 113.94195556640625, 116.7881851196289, 119.6344223022461, 122.48065948486328, 125.32688903808594, 128.17312622070312, 131.0193634033203, 133.86558532714844, 136.71182250976562, 139.5580596923828, 142.404296875, 145.2505340576172, 148.09677124023438, 150.9429931640625, 153.7892303466797, 156.63546752929688, 159.48170471191406, 162.32794189453125, 165.17416381835938]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 1.0, 2.0, 9.0, 7.0, 10.0, 10.0, 15.0, 13.0, 12.0, 17.0, 16.0, 22.0, 15.0, 24.0, 27.0, 42.0, 29.0, 35.0, 28.0, 40.0, 32.0, 49.0, 36.0, 46.0, 44.0, 57.0, 41.0, 30.0, 38.0, 33.0, 27.0, 26.0, 26.0, 21.0, 20.0, 20.0, 26.0, 17.0, 14.0, 1.0, 10.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.67845916748047, -34.64162063598633, -33.60478210449219, -32.56794357299805, -31.531105041503906, -30.494266510009766, -29.457429885864258, -28.420591354370117, -27.383752822875977, -26.346914291381836, -25.310075759887695, -24.273237228393555, -23.236400604248047, -22.199562072753906, -21.162723541259766, -20.125885009765625, -19.089046478271484, -18.052207946777344, -17.015369415283203, -15.978531837463379, -14.941693305969238, -13.904854774475098, -12.868017196655273, -11.831178665161133, -10.794340133666992, -9.757501602172852, -8.720663070678711, -7.683825492858887, -6.646986961364746, -5.6101484298706055, -4.573310375213623, -3.5364723205566406, -2.4996376037597656, -1.462799310684204, -0.4259610176086426, 0.610877275466919, 1.6477155685424805, 2.684554100036621, 3.7213921546936035, 4.758230209350586, 5.795068740844727, 6.831907272338867, 7.86874532699585, 8.905583381652832, 9.942421913146973, 10.979260444641113, 12.016098022460938, 13.052936553955078, 14.089775085449219, 15.12661361694336, 16.1634521484375, 17.20029067993164, 18.23712921142578, 19.273967742919922, 20.31080436706543, 21.34764289855957, 22.38448143005371, 23.42131996154785, 24.458158493041992, 25.494997024536133, 26.53183364868164, 27.56867218017578, 28.605510711669922, 29.642349243164062, 30.679187774658203]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 3.0, 5.0, 7.0, 10.0, 5.0, 13.0, 18.0, 15.0, 25.0, 15.0, 31.0, 20.0, 23.0, 33.0, 32.0, 32.0, 38.0, 43.0, 47.0, 41.0, 33.0, 32.0, 45.0, 36.0, 34.0, 26.0, 39.0, 36.0, 27.0, 27.0, 22.0, 22.0, 19.0, 18.0, 19.0, 16.0, 10.0, 15.0, 15.0, 9.0, 7.0, 9.0, 10.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 4.0], "bins": [-4.26171875, -4.137939453125, -4.01416015625, -3.890380859375, -3.7666015625, -3.642822265625, -3.51904296875, -3.395263671875, -3.271484375, -3.147705078125, -3.02392578125, -2.900146484375, -2.7763671875, -2.652587890625, -2.52880859375, -2.405029296875, -2.28125, -2.157470703125, -2.03369140625, -1.909912109375, -1.7861328125, -1.662353515625, -1.53857421875, -1.414794921875, -1.291015625, -1.167236328125, -1.04345703125, -0.919677734375, -0.7958984375, -0.672119140625, -0.54833984375, -0.424560546875, -0.30078125, -0.177001953125, -0.05322265625, 0.070556640625, 0.1943359375, 0.318115234375, 0.44189453125, 0.565673828125, 0.689453125, 0.813232421875, 0.93701171875, 1.060791015625, 1.1845703125, 1.308349609375, 1.43212890625, 1.555908203125, 1.6796875, 1.803466796875, 1.92724609375, 2.051025390625, 2.1748046875, 2.298583984375, 2.42236328125, 2.546142578125, 2.669921875, 2.793701171875, 2.91748046875, 3.041259765625, 3.1650390625, 3.288818359375, 3.41259765625, 3.536376953125, 3.66015625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 7.0, 14.0, 17.0, 20.0, 38.0, 53.0, 80.0, 154.0, 293.0, 688.0, 1453.0, 3631.0, 9231.0, 25157.0, 72570.0, 220079.0, 689725.0, 1631903.0, 1032633.0, 337620.0, 108799.0, 37463.0, 13474.0, 5151.0, 2079.0, 901.0, 486.0, 232.0, 116.0, 64.0, 46.0, 30.0, 19.0, 18.0, 12.0, 6.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.74609375, -5.5804443359375, -5.414794921875, -5.2491455078125, -5.08349609375, -4.9178466796875, -4.752197265625, -4.5865478515625, -4.4208984375, -4.2552490234375, -4.089599609375, -3.9239501953125, -3.75830078125, -3.5926513671875, -3.427001953125, -3.2613525390625, -3.095703125, -2.9300537109375, -2.764404296875, -2.5987548828125, -2.43310546875, -2.2674560546875, -2.101806640625, -1.9361572265625, -1.7705078125, -1.6048583984375, -1.439208984375, -1.2735595703125, -1.10791015625, -0.9422607421875, -0.776611328125, -0.6109619140625, -0.4453125, -0.2796630859375, -0.114013671875, 0.0516357421875, 0.21728515625, 0.3829345703125, 0.548583984375, 0.7142333984375, 0.8798828125, 1.0455322265625, 1.211181640625, 1.3768310546875, 1.54248046875, 1.7081298828125, 1.873779296875, 2.0394287109375, 2.205078125, 2.3707275390625, 2.536376953125, 2.7020263671875, 2.86767578125, 3.0333251953125, 3.198974609375, 3.3646240234375, 3.5302734375, 3.6959228515625, 3.861572265625, 4.0272216796875, 4.19287109375, 4.3585205078125, 4.524169921875, 4.6898193359375, 4.85546875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 12.0, 11.0, 14.0, 22.0, 11.0, 24.0, 47.0, 54.0, 52.0, 87.0, 101.0, 129.0, 197.0, 233.0, 326.0, 360.0, 401.0, 409.0, 359.0, 230.0, 222.0, 158.0, 152.0, 119.0, 76.0, 54.0, 52.0, 28.0, 28.0, 18.0, 21.0, 16.0, 11.0, 8.0, 8.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.4140625, -6.234375, -6.0546875, -5.875, -5.6953125, -5.515625, -5.3359375, -5.15625, -4.9765625, -4.796875, -4.6171875, -4.4375, -4.2578125, -4.078125, -3.8984375, -3.71875, -3.5390625, -3.359375, -3.1796875, -3.0, -2.8203125, -2.640625, -2.4609375, -2.28125, -2.1015625, -1.921875, -1.7421875, -1.5625, -1.3828125, -1.203125, -1.0234375, -0.84375, -0.6640625, -0.484375, -0.3046875, -0.125, 0.0546875, 0.234375, 0.4140625, 0.59375, 0.7734375, 0.953125, 1.1328125, 1.3125, 1.4921875, 1.671875, 1.8515625, 2.03125, 2.2109375, 2.390625, 2.5703125, 2.75, 2.9296875, 3.109375, 3.2890625, 3.46875, 3.6484375, 3.828125, 4.0078125, 4.1875, 4.3671875, 4.546875, 4.7265625, 4.90625, 5.0859375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 12.0, 12.0, 18.0, 30.0, 27.0, 41.0, 52.0, 69.0, 102.0, 156.0, 220.0, 329.0, 599.0, 1644.0, 8828.0, 89223.0, 1336119.0, 2544215.0, 191486.0, 16694.0, 2446.0, 751.0, 396.0, 221.0, 171.0, 117.0, 93.0, 59.0, 32.0, 27.0, 23.0, 20.0, 13.0, 10.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.984375, -14.4873046875, -13.990234375, -13.4931640625, -12.99609375, -12.4990234375, -12.001953125, -11.5048828125, -11.0078125, -10.5107421875, -10.013671875, -9.5166015625, -9.01953125, -8.5224609375, -8.025390625, -7.5283203125, -7.03125, -6.5341796875, -6.037109375, -5.5400390625, -5.04296875, -4.5458984375, -4.048828125, -3.5517578125, -3.0546875, -2.5576171875, -2.060546875, -1.5634765625, -1.06640625, -0.5693359375, -0.072265625, 0.4248046875, 0.921875, 1.4189453125, 1.916015625, 2.4130859375, 2.91015625, 3.4072265625, 3.904296875, 4.4013671875, 4.8984375, 5.3955078125, 5.892578125, 6.3896484375, 6.88671875, 7.3837890625, 7.880859375, 8.3779296875, 8.875, 9.3720703125, 9.869140625, 10.3662109375, 10.86328125, 11.3603515625, 11.857421875, 12.3544921875, 12.8515625, 13.3486328125, 13.845703125, 14.3427734375, 14.83984375, 15.3369140625, 15.833984375, 16.3310546875, 16.828125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 10.0, 10.0, 38.0, 47.0, 77.0, 105.0, 133.0, 153.0, 121.0, 120.0, 79.0, 59.0, 33.0, 21.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.97929382324219, -36.68626022338867, -35.393226623535156, -34.100189208984375, -32.80715560913086, -31.514122009277344, -30.221086502075195, -28.928050994873047, -27.63501739501953, -26.341983795166016, -25.048948287963867, -23.75591278076172, -22.462879180908203, -21.169845581054688, -19.87681007385254, -18.58377456665039, -17.290740966796875, -15.997706413269043, -14.704671859741211, -13.411637306213379, -12.118602752685547, -10.825568199157715, -9.532533645629883, -8.23949909210205, -6.946464538574219, -5.653429985046387, -4.360395431518555, -3.0673608779907227, -1.7743263244628906, -0.4812917709350586, 0.8117427825927734, 2.1047773361206055, 3.3978118896484375, 4.6908464431762695, 5.983880996704102, 7.276915550231934, 8.569950103759766, 9.862984657287598, 11.15601921081543, 12.449053764343262, 13.742088317871094, 15.035122871398926, 16.328157424926758, 17.621192932128906, 18.914226531982422, 20.207260131835938, 21.500295639038086, 22.793331146240234, 24.08636474609375, 25.379398345947266, 26.672433853149414, 27.965469360351562, 29.258502960205078, 30.551536560058594, 31.844572067260742, 33.13760757446289, 34.430641174316406, 35.72367477416992, 37.01670837402344, 38.30974578857422, 39.602779388427734, 40.89581298828125, 42.18885040283203, 43.48188400268555, 44.77491760253906]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 2.0, 8.0, 5.0, 9.0, 11.0, 17.0, 22.0, 19.0, 10.0, 29.0, 28.0, 20.0, 18.0, 22.0, 34.0, 32.0, 28.0, 41.0, 41.0, 38.0, 46.0, 34.0, 45.0, 41.0, 39.0, 35.0, 30.0, 35.0, 38.0, 32.0, 23.0, 18.0, 19.0, 16.0, 18.0, 15.0, 15.0, 8.0, 14.0, 4.0, 8.0, 5.0, 1.0, 3.0, 2.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.344802856445312, -19.695880889892578, -19.046960830688477, -18.398040771484375, -17.74911880493164, -17.100196838378906, -16.451276779174805, -15.802355766296387, -15.153434753417969, -14.50451374053955, -13.855592727661133, -13.206671714782715, -12.557750701904297, -11.908829689025879, -11.259908676147461, -10.610987663269043, -9.962066650390625, -9.313145637512207, -8.664224624633789, -8.015303611755371, -7.366382598876953, -6.717461585998535, -6.068540573120117, -5.419619560241699, -4.770698547363281, -4.121777534484863, -3.4728565216064453, -2.8239355087280273, -2.1750144958496094, -1.5260934829711914, -0.8771724700927734, -0.22825145721435547, 0.4206695556640625, 1.0695905685424805, 1.7185115814208984, 2.3674325942993164, 3.0163536071777344, 3.6652746200561523, 4.31419563293457, 4.963116645812988, 5.612037658691406, 6.260958671569824, 6.909879684448242, 7.55880069732666, 8.207721710205078, 8.856642723083496, 9.505563735961914, 10.154484748840332, 10.80340576171875, 11.452326774597168, 12.101247787475586, 12.750168800354004, 13.399089813232422, 14.04801082611084, 14.696931838989258, 15.345852851867676, 15.994773864746094, 16.643695831298828, 17.29261589050293, 17.94153594970703, 18.590457916259766, 19.2393798828125, 19.8882999420166, 20.537220001220703, 21.186141967773438]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 6.0, 12.0, 10.0, 13.0, 10.0, 16.0, 22.0, 24.0, 28.0, 28.0, 18.0, 40.0, 36.0, 30.0, 40.0, 34.0, 43.0, 43.0, 40.0, 43.0, 34.0, 35.0, 35.0, 30.0, 30.0, 27.0, 27.0, 23.0, 24.0, 22.0, 19.0, 23.0, 16.0, 21.0, 12.0, 16.0, 14.0, 10.0, 11.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.783203125, -3.661895751953125, -3.54058837890625, -3.419281005859375, -3.2979736328125, -3.176666259765625, -3.05535888671875, -2.934051513671875, -2.812744140625, -2.691436767578125, -2.57012939453125, -2.448822021484375, -2.3275146484375, -2.206207275390625, -2.08489990234375, -1.963592529296875, -1.84228515625, -1.720977783203125, -1.59967041015625, -1.478363037109375, -1.3570556640625, -1.235748291015625, -1.11444091796875, -0.993133544921875, -0.871826171875, -0.750518798828125, -0.62921142578125, -0.507904052734375, -0.3865966796875, -0.265289306640625, -0.14398193359375, -0.022674560546875, 0.0986328125, 0.219940185546875, 0.34124755859375, 0.462554931640625, 0.5838623046875, 0.705169677734375, 0.82647705078125, 0.947784423828125, 1.069091796875, 1.190399169921875, 1.31170654296875, 1.433013916015625, 1.5543212890625, 1.675628662109375, 1.79693603515625, 1.918243408203125, 2.03955078125, 2.160858154296875, 2.28216552734375, 2.403472900390625, 2.5247802734375, 2.646087646484375, 2.76739501953125, 2.888702392578125, 3.010009765625, 3.131317138671875, 3.25262451171875, 3.373931884765625, 3.4952392578125, 3.616546630859375, 3.73785400390625, 3.859161376953125, 3.98046875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 6.0, 7.0, 17.0, 26.0, 18.0, 45.0, 46.0, 74.0, 104.0, 133.0, 182.0, 258.0, 359.0, 490.0, 680.0, 948.0, 1349.0, 1891.0, 2601.0, 3517.0, 5228.0, 7441.0, 10979.0, 16035.0, 24126.0, 36938.0, 58071.0, 97313.0, 209561.0, 274511.0, 108944.0, 63652.0, 40408.0, 26065.0, 17617.0, 11761.0, 8053.0, 5593.0, 3897.0, 2794.0, 1891.0, 1379.0, 995.0, 732.0, 532.0, 343.0, 247.0, 189.0, 156.0, 104.0, 80.0, 53.0, 39.0, 24.0, 20.0, 21.0, 7.0, 7.0, 7.0, 2.0, 1.0], "bins": [-0.1422119140625, -0.13778114318847656, -0.13335037231445312, -0.1289196014404297, -0.12448883056640625, -0.12005805969238281, -0.11562728881835938, -0.11119651794433594, -0.1067657470703125, -0.10233497619628906, -0.09790420532226562, -0.09347343444824219, -0.08904266357421875, -0.08461189270019531, -0.08018112182617188, -0.07575035095214844, -0.071319580078125, -0.06688880920410156, -0.062458038330078125, -0.05802726745605469, -0.05359649658203125, -0.04916572570800781, -0.044734954833984375, -0.04030418395996094, -0.0358734130859375, -0.03144264221191406, -0.027011871337890625, -0.022581100463867188, -0.01815032958984375, -0.013719558715820312, -0.009288787841796875, -0.0048580169677734375, -0.00042724609375, 0.0040035247802734375, 0.008434295654296875, 0.012865066528320312, 0.01729583740234375, 0.021726608276367188, 0.026157379150390625, 0.030588150024414062, 0.0350189208984375, 0.03944969177246094, 0.043880462646484375, 0.04831123352050781, 0.05274200439453125, 0.05717277526855469, 0.061603546142578125, 0.06603431701660156, 0.070465087890625, 0.07489585876464844, 0.07932662963867188, 0.08375740051269531, 0.08818817138671875, 0.09261894226074219, 0.09704971313476562, 0.10148048400878906, 0.1059112548828125, 0.11034202575683594, 0.11477279663085938, 0.11920356750488281, 0.12363433837890625, 0.1280651092529297, 0.13249588012695312, 0.13692665100097656, 0.141357421875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 9.0, 8.0, 15.0, 20.0, 13.0, 10.0, 26.0, 14.0, 24.0, 29.0, 29.0, 37.0, 40.0, 26.0, 35.0, 49.0, 45.0, 1068.0, 38.0, 47.0, 35.0, 38.0, 43.0, 31.0, 38.0, 25.0, 26.0, 31.0, 29.0, 19.0, 21.0, 20.0, 14.0, 12.0, 7.0, 10.0, 11.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.822265625, -2.726593017578125, -2.63092041015625, -2.535247802734375, -2.4395751953125, -2.343902587890625, -2.24822998046875, -2.152557373046875, -2.056884765625, -1.961212158203125, -1.86553955078125, -1.769866943359375, -1.6741943359375, -1.578521728515625, -1.48284912109375, -1.387176513671875, -1.29150390625, -1.195831298828125, -1.10015869140625, -1.004486083984375, -0.9088134765625, -0.813140869140625, -0.71746826171875, -0.621795654296875, -0.526123046875, -0.430450439453125, -0.33477783203125, -0.239105224609375, -0.1434326171875, -0.047760009765625, 0.04791259765625, 0.143585205078125, 0.2392578125, 0.334930419921875, 0.43060302734375, 0.526275634765625, 0.6219482421875, 0.717620849609375, 0.81329345703125, 0.908966064453125, 1.004638671875, 1.100311279296875, 1.19598388671875, 1.291656494140625, 1.3873291015625, 1.483001708984375, 1.57867431640625, 1.674346923828125, 1.77001953125, 1.865692138671875, 1.96136474609375, 2.057037353515625, 2.1527099609375, 2.248382568359375, 2.34405517578125, 2.439727783203125, 2.535400390625, 2.631072998046875, 2.72674560546875, 2.822418212890625, 2.9180908203125, 3.013763427734375, 3.10943603515625, 3.205108642578125, 3.30078125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 14.0, 21.0, 25.0, 42.0, 70.0, 87.0, 133.0, 210.0, 269.0, 459.0, 640.0, 954.0, 1501.0, 2249.0, 3316.0, 4838.0, 7131.0, 10932.0, 16323.0, 24824.0, 38885.0, 63645.0, 112157.0, 1326286.0, 219127.0, 101159.0, 58154.0, 35687.0, 22535.0, 14929.0, 9946.0, 6810.0, 4409.0, 3068.0, 2004.0, 1351.0, 932.0, 664.0, 474.0, 278.0, 211.0, 133.0, 78.0, 54.0, 38.0, 29.0, 13.0, 18.0, 2.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.09515380859375, -0.09226322174072266, -0.08937263488769531, -0.08648204803466797, -0.08359146118164062, -0.08070087432861328, -0.07781028747558594, -0.0749197006225586, -0.07202911376953125, -0.0691385269165039, -0.06624794006347656, -0.06335735321044922, -0.060466766357421875, -0.05757617950439453, -0.05468559265136719, -0.051795005798339844, -0.0489044189453125, -0.046013832092285156, -0.04312324523925781, -0.04023265838623047, -0.037342071533203125, -0.03445148468017578, -0.03156089782714844, -0.028670310974121094, -0.02577972412109375, -0.022889137268066406, -0.019998550415039062, -0.01710796356201172, -0.014217376708984375, -0.011326789855957031, -0.008436203002929688, -0.005545616149902344, -0.002655029296875, 0.00023555755615234375, 0.0031261444091796875, 0.006016731262207031, 0.008907318115234375, 0.011797904968261719, 0.014688491821289062, 0.017579078674316406, 0.02046966552734375, 0.023360252380371094, 0.026250839233398438, 0.02914142608642578, 0.032032012939453125, 0.03492259979248047, 0.03781318664550781, 0.040703773498535156, 0.0435943603515625, 0.046484947204589844, 0.04937553405761719, 0.05226612091064453, 0.055156707763671875, 0.05804729461669922, 0.06093788146972656, 0.0638284683227539, 0.06671905517578125, 0.0696096420288086, 0.07250022888183594, 0.07539081573486328, 0.07828140258789062, 0.08117198944091797, 0.08406257629394531, 0.08695316314697266, 0.08984375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 16.0, 2.0, 3.0, 6.0, 14.0, 14.0, 13.0, 54.0, 29.0, 37.0, 48.0, 50.0, 83.0, 244.0, 130.0, 39.0, 23.0, 31.0, 18.0, 15.0, 19.0, 33.0, 5.0, 8.0, 1.0, 5.0, 4.0, 7.0, 15.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-2.3245811462402344e-06, -2.2565945982933044e-06, -2.1886080503463745e-06, -2.1206215023994446e-06, -2.0526349544525146e-06, -1.9846484065055847e-06, -1.9166618585586548e-06, -1.8486753106117249e-06, -1.780688762664795e-06, -1.712702214717865e-06, -1.644715666770935e-06, -1.5767291188240051e-06, -1.5087425708770752e-06, -1.4407560229301453e-06, -1.3727694749832153e-06, -1.3047829270362854e-06, -1.2367963790893555e-06, -1.1688098311424255e-06, -1.1008232831954956e-06, -1.0328367352485657e-06, -9.648501873016357e-07, -8.968636393547058e-07, -8.288770914077759e-07, -7.60890543460846e-07, -6.92903995513916e-07, -6.249174475669861e-07, -5.569308996200562e-07, -4.889443516731262e-07, -4.209578037261963e-07, -3.5297125577926636e-07, -2.849847078323364e-07, -2.169981598854065e-07, -1.4901161193847656e-07, -8.102506399154663e-08, -1.30385160446167e-08, 5.494803190231323e-08, 1.2293457984924316e-07, 1.909211277961731e-07, 2.5890767574310303e-07, 3.2689422369003296e-07, 3.948807716369629e-07, 4.628673195838928e-07, 5.308538675308228e-07, 5.988404154777527e-07, 6.668269634246826e-07, 7.348135113716125e-07, 8.028000593185425e-07, 8.707866072654724e-07, 9.387731552124023e-07, 1.0067597031593323e-06, 1.0747462511062622e-06, 1.1427327990531921e-06, 1.210719347000122e-06, 1.278705894947052e-06, 1.346692442893982e-06, 1.4146789908409119e-06, 1.4826655387878418e-06, 1.5506520867347717e-06, 1.6186386346817017e-06, 1.6866251826286316e-06, 1.7546117305755615e-06, 1.8225982785224915e-06, 1.8905848264694214e-06, 1.9585713744163513e-06, 2.0265579223632812e-06]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 5.0, 9.0, 8.0, 14.0, 16.0, 14.0, 14.0, 39.0, 41.0, 63.0, 85.0, 166.0, 271.0, 1062.0, 350210.0, 694749.0, 1027.0, 268.0, 152.0, 92.0, 67.0, 44.0, 37.0, 10.0, 19.0, 13.0, 17.0, 3.0, 7.0, 4.0, 0.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5239925384521484e-05, -4.3732114136219025e-05, -4.2224302887916565e-05, -4.0716491639614105e-05, -3.9208680391311646e-05, -3.7700869143009186e-05, -3.6193057894706726e-05, -3.4685246646404266e-05, -3.317743539810181e-05, -3.166962414979935e-05, -3.0161812901496887e-05, -2.8654001653194427e-05, -2.7146190404891968e-05, -2.5638379156589508e-05, -2.413056790828705e-05, -2.262275665998459e-05, -2.111494541168213e-05, -1.960713416337967e-05, -1.809932291507721e-05, -1.659151166677475e-05, -1.508370041847229e-05, -1.357588917016983e-05, -1.206807792186737e-05, -1.0560266673564911e-05, -9.052455425262451e-06, -7.5446441769599915e-06, -6.036832928657532e-06, -4.529021680355072e-06, -3.0212104320526123e-06, -1.5133991837501526e-06, -5.587935447692871e-09, 1.5022233128547668e-06, 3.0100345611572266e-06, 4.517845809459686e-06, 6.025657057762146e-06, 7.533468306064606e-06, 9.041279554367065e-06, 1.0549090802669525e-05, 1.2056902050971985e-05, 1.3564713299274445e-05, 1.5072524547576904e-05, 1.6580335795879364e-05, 1.8088147044181824e-05, 1.9595958292484283e-05, 2.1103769540786743e-05, 2.2611580789089203e-05, 2.4119392037391663e-05, 2.5627203285694122e-05, 2.7135014533996582e-05, 2.8642825782299042e-05, 3.01506370306015e-05, 3.165844827890396e-05, 3.316625952720642e-05, 3.467407077550888e-05, 3.618188202381134e-05, 3.76896932721138e-05, 3.919750452041626e-05, 4.070531576871872e-05, 4.221312701702118e-05, 4.372093826532364e-05, 4.52287495136261e-05, 4.673656076192856e-05, 4.824437201023102e-05, 4.975218325853348e-05, 5.125999450683594e-05]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 12.0, 40.0, 214.0, 507.0, 181.0, 41.0, 12.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3205189942673314e-06, -5.214945304032881e-06, -5.10937161379843e-06, -5.0037979235639796e-06, -4.89822468807688e-06, -4.792650997842429e-06, -4.687077307607979e-06, -4.581503617373528e-06, -4.475929927139077e-06, -4.370356236904627e-06, -4.264782546670176e-06, -4.159209311183076e-06, -4.053635620948626e-06, -3.948061930714175e-06, -3.8424882404797245e-06, -3.736914550245274e-06, -3.6313410873844987e-06, -3.525767397150048e-06, -3.420193934289273e-06, -3.3146202440548223e-06, -3.2090465538203716e-06, -3.103472863585921e-06, -2.997899400725146e-06, -2.892325710490695e-06, -2.78675224762992e-06, -2.6811785573954694e-06, -2.5756050945346942e-06, -2.4700314043002436e-06, -2.364457714065793e-06, -2.258884251205018e-06, -2.153310560970567e-06, -2.0477368707361165e-06, -1.942163180501666e-06, -1.836589603954053e-06, -1.7310159137196024e-06, -1.6254423371719895e-06, -1.5198686469375389e-06, -1.414295070389926e-06, -1.308721493842313e-06, -1.2031478036078624e-06, -1.0975741133734118e-06, -9.92000536825799e-07, -8.864268465913483e-07, -7.808532700437354e-07, -6.752796366527036e-07, -5.697060032616719e-07, -4.6413242671405897e-07, -3.585587933230272e-07, -2.5298515993199544e-07, -1.474115407518184e-07, -4.1837921571641346e-08, 6.373568339768099e-08, 1.6930931678871275e-07, 2.748829501797445e-07, 3.804565267273574e-07, 4.860301601183892e-07, 5.916037935094209e-07, 6.971774269004527e-07, 8.027510602914845e-07, 9.083246368390974e-07, 1.013898327073548e-06, 1.1194719036211609e-06, 1.2250454801687738e-06, 1.3306191704032244e-06, 1.4361927469508373e-06]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 11.0, 0.0, 7.0, 0.0, 15.0, 0.0, 20.0, 0.0, 0.0, 39.0, 0.0, 50.0, 0.0, 57.0, 0.0, 101.0, 0.0, 122.0, 0.0, 0.0, 158.0, 0.0, 134.0, 0.0, 90.0, 0.0, 71.0, 0.0, 44.0, 0.0, 0.0, 28.0, 0.0, 24.0, 0.0, 19.0, 0.0, 6.0, 0.0, 7.0, 0.0, 0.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.940696716308594e-07, -8.670613169670105e-07, -8.400529623031616e-07, -8.130446076393127e-07, -7.860362529754639e-07, -7.59027898311615e-07, -7.320195436477661e-07, -7.050111889839172e-07, -6.780028343200684e-07, -6.509944796562195e-07, -6.239861249923706e-07, -5.969777703285217e-07, -5.699694156646729e-07, -5.42961061000824e-07, -5.159527063369751e-07, -4.889443516731262e-07, -4.6193599700927734e-07, -4.3492764234542847e-07, -4.079192876815796e-07, -3.809109330177307e-07, -3.5390257835388184e-07, -3.2689422369003296e-07, -2.998858690261841e-07, -2.728775143623352e-07, -2.4586915969848633e-07, -2.1886080503463745e-07, -1.9185245037078857e-07, -1.648440957069397e-07, -1.3783574104309082e-07, -1.1082738637924194e-07, -8.381903171539307e-08, -5.681067705154419e-08, -2.9802322387695312e-08, -2.7939677238464355e-09, 2.421438694000244e-08, 5.122274160385132e-08, 7.82310962677002e-08, 1.0523945093154907e-07, 1.3224780559539795e-07, 1.5925616025924683e-07, 1.862645149230957e-07, 2.1327286958694458e-07, 2.4028122425079346e-07, 2.6728957891464233e-07, 2.942979335784912e-07, 3.213062882423401e-07, 3.4831464290618896e-07, 3.7532299757003784e-07, 4.023313522338867e-07, 4.293397068977356e-07, 4.5634806156158447e-07, 4.833564162254333e-07, 5.103647708892822e-07, 5.373731255531311e-07, 5.6438148021698e-07, 5.913898348808289e-07, 6.183981895446777e-07, 6.454065442085266e-07, 6.724148988723755e-07, 6.994232535362244e-07, 7.264316082000732e-07, 7.534399628639221e-07, 7.80448317527771e-07, 8.074566721916199e-07, 8.344650268554688e-07]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 6.0, 12.0, 10.0, 13.0, 10.0, 16.0, 22.0, 24.0, 28.0, 28.0, 18.0, 40.0, 36.0, 30.0, 40.0, 34.0, 43.0, 43.0, 40.0, 43.0, 34.0, 35.0, 35.0, 30.0, 30.0, 27.0, 27.0, 23.0, 24.0, 22.0, 19.0, 23.0, 16.0, 21.0, 12.0, 16.0, 14.0, 10.0, 11.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.783203125, -3.661895751953125, -3.54058837890625, -3.419281005859375, -3.2979736328125, -3.176666259765625, -3.05535888671875, -2.934051513671875, -2.812744140625, -2.691436767578125, -2.57012939453125, -2.448822021484375, -2.3275146484375, -2.206207275390625, -2.08489990234375, -1.963592529296875, -1.84228515625, -1.720977783203125, -1.59967041015625, -1.478363037109375, -1.3570556640625, -1.235748291015625, -1.11444091796875, -0.993133544921875, -0.871826171875, -0.750518798828125, -0.62921142578125, -0.507904052734375, -0.3865966796875, -0.265289306640625, -0.14398193359375, -0.022674560546875, 0.0986328125, 0.219940185546875, 0.34124755859375, 0.462554931640625, 0.5838623046875, 0.705169677734375, 0.82647705078125, 0.947784423828125, 1.069091796875, 1.190399169921875, 1.31170654296875, 1.433013916015625, 1.5543212890625, 1.675628662109375, 1.79693603515625, 1.918243408203125, 2.03955078125, 2.160858154296875, 2.28216552734375, 2.403472900390625, 2.5247802734375, 2.646087646484375, 2.76739501953125, 2.888702392578125, 3.010009765625, 3.131317138671875, 3.25262451171875, 3.373931884765625, 3.4952392578125, 3.616546630859375, 3.73785400390625, 3.859161376953125, 3.98046875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 10.0, 13.0, 21.0, 20.0, 33.0, 44.0, 53.0, 118.0, 161.0, 221.0, 437.0, 664.0, 1088.0, 1922.0, 3086.0, 4955.0, 8026.0, 12703.0, 20410.0, 32092.0, 50573.0, 81437.0, 146583.0, 251974.0, 179190.0, 95748.0, 58212.0, 36850.0, 23370.0, 14655.0, 9175.0, 5747.0, 3374.0, 2164.0, 1307.0, 813.0, 464.0, 282.0, 196.0, 120.0, 75.0, 62.0, 36.0, 24.0, 14.0, 9.0, 7.0, 2.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-4.421875, -4.28643798828125, -4.1510009765625, -4.01556396484375, -3.880126953125, -3.74468994140625, -3.6092529296875, -3.47381591796875, -3.33837890625, -3.20294189453125, -3.0675048828125, -2.93206787109375, -2.796630859375, -2.66119384765625, -2.5257568359375, -2.39031982421875, -2.2548828125, -2.11944580078125, -1.9840087890625, -1.84857177734375, -1.713134765625, -1.57769775390625, -1.4422607421875, -1.30682373046875, -1.17138671875, -1.03594970703125, -0.9005126953125, -0.76507568359375, -0.629638671875, -0.49420166015625, -0.3587646484375, -0.22332763671875, -0.087890625, 0.04754638671875, 0.1829833984375, 0.31842041015625, 0.453857421875, 0.58929443359375, 0.7247314453125, 0.86016845703125, 0.99560546875, 1.13104248046875, 1.2664794921875, 1.40191650390625, 1.537353515625, 1.67279052734375, 1.8082275390625, 1.94366455078125, 2.0791015625, 2.21453857421875, 2.3499755859375, 2.48541259765625, 2.620849609375, 2.75628662109375, 2.8917236328125, 3.02716064453125, 3.16259765625, 3.29803466796875, 3.4334716796875, 3.56890869140625, 3.704345703125, 3.83978271484375, 3.9752197265625, 4.11065673828125, 4.24609375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 6.0, 6.0, 8.0, 15.0, 20.0, 16.0, 24.0, 31.0, 35.0, 37.0, 46.0, 71.0, 81.0, 114.0, 197.0, 1373.0, 280.0, 145.0, 92.0, 87.0, 57.0, 57.0, 44.0, 19.0, 26.0, 29.0, 29.0, 11.0, 16.0, 16.0, 11.0, 12.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.1953125, -12.76708984375, -12.3388671875, -11.91064453125, -11.482421875, -11.05419921875, -10.6259765625, -10.19775390625, -9.76953125, -9.34130859375, -8.9130859375, -8.48486328125, -8.056640625, -7.62841796875, -7.2001953125, -6.77197265625, -6.34375, -5.91552734375, -5.4873046875, -5.05908203125, -4.630859375, -4.20263671875, -3.7744140625, -3.34619140625, -2.91796875, -2.48974609375, -2.0615234375, -1.63330078125, -1.205078125, -0.77685546875, -0.3486328125, 0.07958984375, 0.5078125, 0.93603515625, 1.3642578125, 1.79248046875, 2.220703125, 2.64892578125, 3.0771484375, 3.50537109375, 3.93359375, 4.36181640625, 4.7900390625, 5.21826171875, 5.646484375, 6.07470703125, 6.5029296875, 6.93115234375, 7.359375, 7.78759765625, 8.2158203125, 8.64404296875, 9.072265625, 9.50048828125, 9.9287109375, 10.35693359375, 10.78515625, 11.21337890625, 11.6416015625, 12.06982421875, 12.498046875, 12.92626953125, 13.3544921875, 13.78271484375, 14.2109375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 10.0, 15.0, 18.0, 23.0, 38.0, 50.0, 60.0, 83.0, 137.0, 220.0, 400.0, 872.0, 3666.0, 21627.0, 156123.0, 1889978.0, 964374.0, 90399.0, 13567.0, 2474.0, 653.0, 343.0, 184.0, 127.0, 89.0, 52.0, 40.0, 29.0, 21.0, 8.0, 9.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.78125, -15.3153076171875, -14.849365234375, -14.3834228515625, -13.91748046875, -13.4515380859375, -12.985595703125, -12.5196533203125, -12.0537109375, -11.5877685546875, -11.121826171875, -10.6558837890625, -10.18994140625, -9.7239990234375, -9.258056640625, -8.7921142578125, -8.326171875, -7.8602294921875, -7.394287109375, -6.9283447265625, -6.46240234375, -5.9964599609375, -5.530517578125, -5.0645751953125, -4.5986328125, -4.1326904296875, -3.666748046875, -3.2008056640625, -2.73486328125, -2.2689208984375, -1.802978515625, -1.3370361328125, -0.87109375, -0.4051513671875, 0.060791015625, 0.5267333984375, 0.99267578125, 1.4586181640625, 1.924560546875, 2.3905029296875, 2.8564453125, 3.3223876953125, 3.788330078125, 4.2542724609375, 4.72021484375, 5.1861572265625, 5.652099609375, 6.1180419921875, 6.583984375, 7.0499267578125, 7.515869140625, 7.9818115234375, 8.44775390625, 8.9136962890625, 9.379638671875, 9.8455810546875, 10.3115234375, 10.7774658203125, 11.243408203125, 11.7093505859375, 12.17529296875, 12.6412353515625, 13.107177734375, 13.5731201171875, 14.0390625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 31.0, 89.0, 230.0, 359.0, 217.0, 70.0, 17.0, 3.0, 1.0, 1.0], "bins": [-161.70558166503906, -158.8855743408203, -156.06558227539062, -153.24557495117188, -150.42556762695312, -147.60556030273438, -144.7855682373047, -141.96556091308594, -139.1455535888672, -136.32554626464844, -133.50555419921875, -130.685546875, -127.86553955078125, -125.04553985595703, -122.22554016113281, -119.40553283691406, -116.58554077148438, -113.76554107666016, -110.9455337524414, -108.12553405761719, -105.30552673339844, -102.48552703857422, -99.66552734375, -96.84552001953125, -94.0255126953125, -91.20551300048828, -88.38550567626953, -85.56550598144531, -82.74549865722656, -79.92549896240234, -77.10549926757812, -74.28549194335938, -71.46549224853516, -68.64549255371094, -65.82548522949219, -63.00548553466797, -60.185482025146484, -57.365478515625, -54.545475006103516, -51.72547149658203, -48.90546798706055, -46.08546447753906, -43.26546096801758, -40.445457458496094, -37.625457763671875, -34.80545425415039, -31.985450744628906, -29.165449142456055, -26.34544563293457, -23.525442123413086, -20.705440521240234, -17.88543701171875, -15.065434455871582, -12.245431900024414, -9.42542839050293, -6.605426788330078, -3.7854232788085938, -0.9654204845428467, 1.8545823097229004, 4.674585342407227, 7.4945878982543945, 10.314590454101562, 13.134593963623047, 15.954595565795898, 18.774599075317383]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 7.0, 8.0, 7.0, 13.0, 9.0, 14.0, 13.0, 15.0, 21.0, 16.0, 19.0, 25.0, 28.0, 26.0, 29.0, 34.0, 34.0, 35.0, 36.0, 44.0, 38.0, 45.0, 46.0, 33.0, 32.0, 36.0, 40.0, 41.0, 33.0, 30.0, 32.0, 21.0, 18.0, 21.0, 20.0, 13.0, 13.0, 12.0, 9.0, 10.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0], "bins": [-32.12983703613281, -31.19971466064453, -30.26959228515625, -29.33946990966797, -28.409347534179688, -27.479225158691406, -26.549102783203125, -25.618980407714844, -24.688858032226562, -23.75873565673828, -22.82861328125, -21.89849090576172, -20.968368530273438, -20.038246154785156, -19.108123779296875, -18.178001403808594, -17.247879028320312, -16.31775665283203, -15.38763427734375, -14.457511901855469, -13.527389526367188, -12.597267150878906, -11.667144775390625, -10.737022399902344, -9.806901931762695, -8.876779556274414, -7.946657180786133, -7.016534805297852, -6.08641242980957, -5.156290531158447, -4.226168155670166, -3.2960457801818848, -2.3659229278564453, -1.435800552368164, -0.5056782960891724, 0.42444396018981934, 1.3545663356781006, 2.2846884727478027, 3.214810848236084, 4.144933223724365, 5.0750555992126465, 6.005177974700928, 6.935300350189209, 7.865422248840332, 8.795544624328613, 9.725666999816895, 10.655789375305176, 11.585911750793457, 12.516034126281738, 13.44615650177002, 14.3762788772583, 15.306401252746582, 16.236522674560547, 17.166645050048828, 18.09676742553711, 19.02688980102539, 19.957012176513672, 20.887134552001953, 21.817256927490234, 22.747379302978516, 23.677501678466797, 24.607624053955078, 25.53774642944336, 26.46786880493164, 27.397991180419922]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 4.0, 3.0, 4.0, 13.0, 6.0, 5.0, 10.0, 13.0, 23.0, 17.0, 23.0, 14.0, 20.0, 22.0, 37.0, 24.0, 37.0, 36.0, 34.0, 42.0, 34.0, 34.0, 36.0, 38.0, 33.0, 41.0, 30.0, 39.0, 40.0, 31.0, 18.0, 19.0, 31.0, 17.0, 26.0, 23.0, 18.0, 11.0, 13.0, 20.0, 8.0, 9.0, 14.0, 11.0, 4.0, 2.0, 6.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.1484375, -4.0234375, -3.8984375, -3.7734375, -3.6484375, -3.5234375, -3.3984375, -3.2734375, -3.1484375, -3.0234375, -2.8984375, -2.7734375, -2.6484375, -2.5234375, -2.3984375, -2.2734375, -2.1484375, -2.0234375, -1.8984375, -1.7734375, -1.6484375, -1.5234375, -1.3984375, -1.2734375, -1.1484375, -1.0234375, -0.8984375, -0.7734375, -0.6484375, -0.5234375, -0.3984375, -0.2734375, -0.1484375, -0.0234375, 0.1015625, 0.2265625, 0.3515625, 0.4765625, 0.6015625, 0.7265625, 0.8515625, 0.9765625, 1.1015625, 1.2265625, 1.3515625, 1.4765625, 1.6015625, 1.7265625, 1.8515625, 1.9765625, 2.1015625, 2.2265625, 2.3515625, 2.4765625, 2.6015625, 2.7265625, 2.8515625, 2.9765625, 3.1015625, 3.2265625, 3.3515625, 3.4765625, 3.6015625, 3.7265625, 3.8515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 9.0, 8.0, 10.0, 12.0, 15.0, 27.0, 31.0, 56.0, 69.0, 105.0, 176.0, 270.0, 484.0, 877.0, 1765.0, 3776.0, 8605.0, 20398.0, 51788.0, 142085.0, 425659.0, 1279978.0, 1476426.0, 509274.0, 169275.0, 60762.0, 23780.0, 9764.0, 4292.0, 2025.0, 1023.0, 532.0, 318.0, 207.0, 119.0, 76.0, 41.0, 61.0, 29.0, 12.0, 11.0, 11.0, 16.0, 11.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.38671875, -5.21881103515625, -5.0509033203125, -4.88299560546875, -4.715087890625, -4.54718017578125, -4.3792724609375, -4.21136474609375, -4.04345703125, -3.87554931640625, -3.7076416015625, -3.53973388671875, -3.371826171875, -3.20391845703125, -3.0360107421875, -2.86810302734375, -2.7001953125, -2.53228759765625, -2.3643798828125, -2.19647216796875, -2.028564453125, -1.86065673828125, -1.6927490234375, -1.52484130859375, -1.35693359375, -1.18902587890625, -1.0211181640625, -0.85321044921875, -0.685302734375, -0.51739501953125, -0.3494873046875, -0.18157958984375, -0.013671875, 0.15423583984375, 0.3221435546875, 0.49005126953125, 0.657958984375, 0.82586669921875, 0.9937744140625, 1.16168212890625, 1.32958984375, 1.49749755859375, 1.6654052734375, 1.83331298828125, 2.001220703125, 2.16912841796875, 2.3370361328125, 2.50494384765625, 2.6728515625, 2.84075927734375, 3.0086669921875, 3.17657470703125, 3.344482421875, 3.51239013671875, 3.6802978515625, 3.84820556640625, 4.01611328125, 4.18402099609375, 4.3519287109375, 4.51983642578125, 4.687744140625, 4.85565185546875, 5.0235595703125, 5.19146728515625, 5.359375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 6.0, 8.0, 10.0, 10.0, 10.0, 17.0, 38.0, 25.0, 53.0, 47.0, 79.0, 105.0, 153.0, 193.0, 248.0, 348.0, 442.0, 474.0, 435.0, 346.0, 287.0, 178.0, 131.0, 130.0, 69.0, 66.0, 49.0, 29.0, 18.0, 13.0, 10.0, 13.0, 10.0, 7.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.3116455078125, -5.119384765625, -4.9271240234375, -4.73486328125, -4.5426025390625, -4.350341796875, -4.1580810546875, -3.9658203125, -3.7735595703125, -3.581298828125, -3.3890380859375, -3.19677734375, -3.0045166015625, -2.812255859375, -2.6199951171875, -2.427734375, -2.2354736328125, -2.043212890625, -1.8509521484375, -1.65869140625, -1.4664306640625, -1.274169921875, -1.0819091796875, -0.8896484375, -0.6973876953125, -0.505126953125, -0.3128662109375, -0.12060546875, 0.0716552734375, 0.263916015625, 0.4561767578125, 0.6484375, 0.8406982421875, 1.032958984375, 1.2252197265625, 1.41748046875, 1.6097412109375, 1.802001953125, 1.9942626953125, 2.1865234375, 2.3787841796875, 2.571044921875, 2.7633056640625, 2.95556640625, 3.1478271484375, 3.340087890625, 3.5323486328125, 3.724609375, 3.9168701171875, 4.109130859375, 4.3013916015625, 4.49365234375, 4.6859130859375, 4.878173828125, 5.0704345703125, 5.2626953125, 5.4549560546875, 5.647216796875, 5.8394775390625, 6.03173828125, 6.2239990234375, 6.416259765625, 6.6085205078125, 6.80078125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 11.0, 12.0, 16.0, 23.0, 26.0, 46.0, 58.0, 81.0, 125.0, 193.0, 362.0, 790.0, 1895.0, 5336.0, 19329.0, 86639.0, 464767.0, 2308076.0, 1068743.0, 185048.0, 37741.0, 9479.0, 2999.0, 1140.0, 536.0, 239.0, 168.0, 131.0, 59.0, 52.0, 44.0, 22.0, 16.0, 15.0, 13.0, 8.0, 5.0, 6.0, 4.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.84375, -9.5234375, -9.203125, -8.8828125, -8.5625, -8.2421875, -7.921875, -7.6015625, -7.28125, -6.9609375, -6.640625, -6.3203125, -6.0, -5.6796875, -5.359375, -5.0390625, -4.71875, -4.3984375, -4.078125, -3.7578125, -3.4375, -3.1171875, -2.796875, -2.4765625, -2.15625, -1.8359375, -1.515625, -1.1953125, -0.875, -0.5546875, -0.234375, 0.0859375, 0.40625, 0.7265625, 1.046875, 1.3671875, 1.6875, 2.0078125, 2.328125, 2.6484375, 2.96875, 3.2890625, 3.609375, 3.9296875, 4.25, 4.5703125, 4.890625, 5.2109375, 5.53125, 5.8515625, 6.171875, 6.4921875, 6.8125, 7.1328125, 7.453125, 7.7734375, 8.09375, 8.4140625, 8.734375, 9.0546875, 9.375, 9.6953125, 10.015625, 10.3359375, 10.65625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 50.0, 316.0, 463.0, 170.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.245723724365234, -27.861465454101562, -23.477209091186523, -19.092952728271484, -14.708694458007812, -10.32443618774414, -5.940179824829102, -1.5559234619140625, 2.8283348083496094, 7.212592124938965, 11.59684944152832, 15.981106758117676, 20.36536407470703, 24.749622344970703, 29.133878707885742, 33.51813507080078, 37.90239334106445, 42.286651611328125, 46.67090606689453, 51.0551643371582, 55.439422607421875, 59.82368087768555, 64.20793914794922, 68.59219360351562, 72.97645568847656, 77.36071014404297, 81.7449722290039, 86.12922668457031, 90.51348876953125, 94.89774322509766, 99.28199768066406, 103.666259765625, 108.05050659179688, 112.43476104736328, 116.81902313232422, 121.20327758789062, 125.58753967285156, 129.9718017578125, 134.35604858398438, 138.7403106689453, 143.12457275390625, 147.5088348388672, 151.89308166503906, 156.27734375, 160.66160583496094, 165.04586791992188, 169.43011474609375, 173.8143768310547, 178.19862365722656, 182.5828857421875, 186.96713256835938, 191.3513946533203, 195.73565673828125, 200.11990356445312, 204.50416564941406, 208.888427734375, 213.27267456054688, 217.6569366455078, 222.0411834716797, 226.42544555664062, 230.80970764160156, 235.1939697265625, 239.57821655273438, 243.9624786376953, 248.34674072265625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 4.0, 9.0, 12.0, 8.0, 9.0, 13.0, 15.0, 14.0, 19.0, 18.0, 18.0, 36.0, 33.0, 23.0, 33.0, 25.0, 38.0, 39.0, 35.0, 35.0, 41.0, 35.0, 31.0, 35.0, 51.0, 28.0, 43.0, 31.0, 27.0, 31.0, 30.0, 22.0, 20.0, 22.0, 14.0, 13.0, 9.0, 15.0, 12.0, 10.0, 5.0, 13.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0], "bins": [-19.534732818603516, -18.914165496826172, -18.293596267700195, -17.67302703857422, -17.052459716796875, -16.43189239501953, -15.811323165893555, -15.190754890441895, -14.570186614990234, -13.949618339538574, -13.329050064086914, -12.708481788635254, -12.087913513183594, -11.467345237731934, -10.846776962280273, -10.226208686828613, -9.605640411376953, -8.985072135925293, -8.364503860473633, -7.743935585021973, -7.1233673095703125, -6.502799034118652, -5.882230758666992, -5.261662483215332, -4.641094207763672, -4.020525932312012, -3.3999576568603516, -2.7793893814086914, -2.1588211059570312, -1.538252830505371, -0.9176845550537109, -0.2971162796020508, 0.3234519958496094, 0.9440202713012695, 1.5645885467529297, 2.18515682220459, 2.80572509765625, 3.42629337310791, 4.04686164855957, 4.6674299240112305, 5.287998199462891, 5.908566474914551, 6.529134750366211, 7.149703025817871, 7.770271301269531, 8.390839576721191, 9.011407852172852, 9.631976127624512, 10.252544403076172, 10.873112678527832, 11.493680953979492, 12.114249229431152, 12.734817504882812, 13.355385780334473, 13.975954055786133, 14.596522331237793, 15.217090606689453, 15.837658882141113, 16.458227157592773, 17.07879638671875, 17.699363708496094, 18.319931030273438, 18.940500259399414, 19.56106948852539, 20.181636810302734]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 6.0, 7.0, 6.0, 6.0, 5.0, 12.0, 13.0, 15.0, 18.0, 27.0, 19.0, 20.0, 27.0, 40.0, 31.0, 20.0, 32.0, 43.0, 59.0, 41.0, 43.0, 40.0, 28.0, 32.0, 45.0, 36.0, 30.0, 28.0, 32.0, 29.0, 29.0, 27.0, 23.0, 18.0, 15.0, 20.0, 12.0, 19.0, 9.0, 8.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.22265625, -4.0892333984375, -3.955810546875, -3.8223876953125, -3.68896484375, -3.5555419921875, -3.422119140625, -3.2886962890625, -3.1552734375, -3.0218505859375, -2.888427734375, -2.7550048828125, -2.62158203125, -2.4881591796875, -2.354736328125, -2.2213134765625, -2.087890625, -1.9544677734375, -1.821044921875, -1.6876220703125, -1.55419921875, -1.4207763671875, -1.287353515625, -1.1539306640625, -1.0205078125, -0.8870849609375, -0.753662109375, -0.6202392578125, -0.48681640625, -0.3533935546875, -0.219970703125, -0.0865478515625, 0.046875, 0.1802978515625, 0.313720703125, 0.4471435546875, 0.58056640625, 0.7139892578125, 0.847412109375, 0.9808349609375, 1.1142578125, 1.2476806640625, 1.381103515625, 1.5145263671875, 1.64794921875, 1.7813720703125, 1.914794921875, 2.0482177734375, 2.181640625, 2.3150634765625, 2.448486328125, 2.5819091796875, 2.71533203125, 2.8487548828125, 2.982177734375, 3.1156005859375, 3.2490234375, 3.3824462890625, 3.515869140625, 3.6492919921875, 3.78271484375, 3.9161376953125, 4.049560546875, 4.1829833984375, 4.31640625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 11.0, 14.0, 13.0, 28.0, 36.0, 50.0, 79.0, 103.0, 145.0, 209.0, 358.0, 483.0, 683.0, 1069.0, 1635.0, 2368.0, 3666.0, 5521.0, 8568.0, 13270.0, 20704.0, 32312.0, 51785.0, 89360.0, 180592.0, 319713.0, 129328.0, 69367.0, 41997.0, 26570.0, 16804.0, 10932.0, 7068.0, 4578.0, 3013.0, 2006.0, 1325.0, 931.0, 581.0, 402.0, 261.0, 194.0, 129.0, 83.0, 59.0, 50.0, 26.0, 22.0, 23.0, 9.0, 11.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.1617431640625, -0.15673255920410156, -0.15172195434570312, -0.1467113494873047, -0.14170074462890625, -0.1366901397705078, -0.13167953491210938, -0.12666893005371094, -0.1216583251953125, -0.11664772033691406, -0.11163711547851562, -0.10662651062011719, -0.10161590576171875, -0.09660530090332031, -0.09159469604492188, -0.08658409118652344, -0.081573486328125, -0.07656288146972656, -0.07155227661132812, -0.06654167175292969, -0.06153106689453125, -0.05652046203613281, -0.051509857177734375, -0.04649925231933594, -0.0414886474609375, -0.03647804260253906, -0.031467437744140625, -0.026456832885742188, -0.02144622802734375, -0.016435623168945312, -0.011425018310546875, -0.0064144134521484375, -0.00140380859375, 0.0036067962646484375, 0.008617401123046875, 0.013628005981445312, 0.01863861083984375, 0.023649215698242188, 0.028659820556640625, 0.03367042541503906, 0.0386810302734375, 0.04369163513183594, 0.048702239990234375, 0.05371284484863281, 0.05872344970703125, 0.06373405456542969, 0.06874465942382812, 0.07375526428222656, 0.078765869140625, 0.08377647399902344, 0.08878707885742188, 0.09379768371582031, 0.09880828857421875, 0.10381889343261719, 0.10882949829101562, 0.11384010314941406, 0.1188507080078125, 0.12386131286621094, 0.12887191772460938, 0.1338825225830078, 0.13889312744140625, 0.1439037322998047, 0.14891433715820312, 0.15392494201660156, 0.158935546875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 3.0, 5.0, 6.0, 9.0, 10.0, 6.0, 10.0, 15.0, 13.0, 18.0, 17.0, 24.0, 26.0, 35.0, 39.0, 38.0, 37.0, 40.0, 32.0, 42.0, 32.0, 44.0, 1055.0, 41.0, 46.0, 39.0, 33.0, 37.0, 32.0, 32.0, 26.0, 33.0, 18.0, 21.0, 13.0, 18.0, 12.0, 13.0, 10.0, 7.0, 11.0, 5.0, 2.0, 8.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.00390625, -2.910064697265625, -2.81622314453125, -2.722381591796875, -2.6285400390625, -2.534698486328125, -2.44085693359375, -2.347015380859375, -2.253173828125, -2.159332275390625, -2.06549072265625, -1.971649169921875, -1.8778076171875, -1.783966064453125, -1.69012451171875, -1.596282958984375, -1.50244140625, -1.408599853515625, -1.31475830078125, -1.220916748046875, -1.1270751953125, -1.033233642578125, -0.93939208984375, -0.845550537109375, -0.751708984375, -0.657867431640625, -0.56402587890625, -0.470184326171875, -0.3763427734375, -0.282501220703125, -0.18865966796875, -0.094818115234375, -0.0009765625, 0.092864990234375, 0.18670654296875, 0.280548095703125, 0.3743896484375, 0.468231201171875, 0.56207275390625, 0.655914306640625, 0.749755859375, 0.843597412109375, 0.93743896484375, 1.031280517578125, 1.1251220703125, 1.218963623046875, 1.31280517578125, 1.406646728515625, 1.50048828125, 1.594329833984375, 1.68817138671875, 1.782012939453125, 1.8758544921875, 1.969696044921875, 2.06353759765625, 2.157379150390625, 2.251220703125, 2.345062255859375, 2.43890380859375, 2.532745361328125, 2.6265869140625, 2.720428466796875, 2.81427001953125, 2.908111572265625, 3.001953125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 8.0, 18.0, 27.0, 42.0, 45.0, 73.0, 109.0, 151.0, 241.0, 331.0, 471.0, 679.0, 930.0, 1349.0, 1860.0, 2660.0, 3797.0, 5377.0, 7760.0, 11322.0, 16654.0, 25384.0, 39499.0, 63351.0, 109781.0, 1286668.0, 229544.0, 108409.0, 62973.0, 39184.0, 25119.0, 16508.0, 11167.0, 7642.0, 5241.0, 3849.0, 2583.0, 1890.0, 1336.0, 933.0, 622.0, 513.0, 297.0, 238.0, 158.0, 109.0, 74.0, 56.0, 32.0, 30.0, 20.0, 9.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.0865478515625, -0.08384227752685547, -0.08113670349121094, -0.0784311294555664, -0.07572555541992188, -0.07301998138427734, -0.07031440734863281, -0.06760883331298828, -0.06490325927734375, -0.06219768524169922, -0.05949211120605469, -0.056786537170410156, -0.054080963134765625, -0.051375389099121094, -0.04866981506347656, -0.04596424102783203, -0.0432586669921875, -0.04055309295654297, -0.03784751892089844, -0.035141944885253906, -0.032436370849609375, -0.029730796813964844, -0.027025222778320312, -0.02431964874267578, -0.02161407470703125, -0.01890850067138672, -0.016202926635742188, -0.013497352600097656, -0.010791778564453125, -0.008086204528808594, -0.0053806304931640625, -0.0026750564575195312, 3.0517578125e-05, 0.0027360916137695312, 0.0054416656494140625, 0.008147239685058594, 0.010852813720703125, 0.013558387756347656, 0.016263961791992188, 0.01896953582763672, 0.02167510986328125, 0.02438068389892578, 0.027086257934570312, 0.029791831970214844, 0.032497406005859375, 0.035202980041503906, 0.03790855407714844, 0.04061412811279297, 0.0433197021484375, 0.04602527618408203, 0.04873085021972656, 0.051436424255371094, 0.054141998291015625, 0.056847572326660156, 0.05955314636230469, 0.06225872039794922, 0.06496429443359375, 0.06766986846923828, 0.07037544250488281, 0.07308101654052734, 0.07578659057617188, 0.0784921646118164, 0.08119773864746094, 0.08390331268310547, 0.08660888671875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 5.0, 6.0, 9.0, 0.0, 7.0, 10.0, 8.0, 0.0, 18.0, 11.0, 26.0, 25.0, 0.0, 46.0, 50.0, 73.0, 0.0, 105.0, 224.0, 97.0, 69.0, 0.0, 58.0, 29.0, 32.0, 27.0, 0.0, 6.0, 14.0, 8.0, 0.0, 9.0, 9.0, 5.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5497207641601562e-06, -1.5031546354293823e-06, -1.4565885066986084e-06, -1.4100223779678345e-06, -1.3634562492370605e-06, -1.3168901205062866e-06, -1.2703239917755127e-06, -1.2237578630447388e-06, -1.1771917343139648e-06, -1.130625605583191e-06, -1.084059476852417e-06, -1.037493348121643e-06, -9.909272193908691e-07, -9.443610906600952e-07, -8.977949619293213e-07, -8.512288331985474e-07, -8.046627044677734e-07, -7.580965757369995e-07, -7.115304470062256e-07, -6.649643182754517e-07, -6.183981895446777e-07, -5.718320608139038e-07, -5.252659320831299e-07, -4.78699803352356e-07, -4.3213367462158203e-07, -3.855675458908081e-07, -3.390014171600342e-07, -2.9243528842926025e-07, -2.4586915969848633e-07, -1.993030309677124e-07, -1.5273690223693848e-07, -1.0617077350616455e-07, -5.960464477539063e-08, -1.30385160446167e-08, 3.3527612686157227e-08, 8.009374141693115e-08, 1.2665987014770508e-07, 1.73225998878479e-07, 2.1979212760925293e-07, 2.6635825634002686e-07, 3.129243850708008e-07, 3.594905138015747e-07, 4.0605664253234863e-07, 4.5262277126312256e-07, 4.991888999938965e-07, 5.457550287246704e-07, 5.923211574554443e-07, 6.388872861862183e-07, 6.854534149169922e-07, 7.320195436477661e-07, 7.7858567237854e-07, 8.25151801109314e-07, 8.717179298400879e-07, 9.182840585708618e-07, 9.648501873016357e-07, 1.0114163160324097e-06, 1.0579824447631836e-06, 1.1045485734939575e-06, 1.1511147022247314e-06, 1.1976808309555054e-06, 1.2442469596862793e-06, 1.2908130884170532e-06, 1.3373792171478271e-06, 1.383945345878601e-06, 1.430511474609375e-06]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 7.0, 10.0, 11.0, 10.0, 10.0, 19.0, 23.0, 16.0, 48.0, 59.0, 63.0, 114.0, 236.0, 612.0, 13989.0, 970979.0, 60445.0, 1099.0, 273.0, 163.0, 86.0, 61.0, 56.0, 39.0, 18.0, 19.0, 16.0, 12.0, 7.0, 8.0, 11.0, 9.0, 2.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.0159950256347656e-05, -2.9175542294979095e-05, -2.8191134333610535e-05, -2.7206726372241974e-05, -2.6222318410873413e-05, -2.5237910449504852e-05, -2.425350248813629e-05, -2.326909452676773e-05, -2.228468656539917e-05, -2.130027860403061e-05, -2.031587064266205e-05, -1.9331462681293488e-05, -1.8347054719924927e-05, -1.7362646758556366e-05, -1.6378238797187805e-05, -1.5393830835819244e-05, -1.4409422874450684e-05, -1.3425014913082123e-05, -1.2440606951713562e-05, -1.1456198990345001e-05, -1.047179102897644e-05, -9.48738306760788e-06, -8.502975106239319e-06, -7.518567144870758e-06, -6.534159183502197e-06, -5.5497512221336365e-06, -4.565343260765076e-06, -3.580935299396515e-06, -2.596527338027954e-06, -1.6121193766593933e-06, -6.277114152908325e-07, 3.5669654607772827e-07, 1.341104507446289e-06, 2.32551246881485e-06, 3.3099204301834106e-06, 4.2943283915519714e-06, 5.278736352920532e-06, 6.263144314289093e-06, 7.247552275657654e-06, 8.231960237026215e-06, 9.216368198394775e-06, 1.0200776159763336e-05, 1.1185184121131897e-05, 1.2169592082500458e-05, 1.3154000043869019e-05, 1.413840800523758e-05, 1.512281596660614e-05, 1.61072239279747e-05, 1.7091631889343262e-05, 1.8076039850711823e-05, 1.9060447812080383e-05, 2.0044855773448944e-05, 2.1029263734817505e-05, 2.2013671696186066e-05, 2.2998079657554626e-05, 2.3982487618923187e-05, 2.4966895580291748e-05, 2.595130354166031e-05, 2.693571150302887e-05, 2.792011946439743e-05, 2.890452742576599e-05, 2.9888935387134552e-05, 3.087334334850311e-05, 3.1857751309871674e-05, 3.2842159271240234e-05]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 14.0, 38.0, 96.0, 333.0, 366.0, 123.0, 33.0, 11.0], "bins": [-5.794078333565267e-06, -5.697569577023387e-06, -5.601061275228858e-06, -5.504552518686978e-06, -5.408043762145098e-06, -5.311535460350569e-06, -5.2150267038086895e-06, -5.11851794726681e-06, -5.022009645472281e-06, -4.925500888930401e-06, -4.828992587135872e-06, -4.732483830593992e-06, -4.635975074052112e-06, -4.539466772257583e-06, -4.442958015715703e-06, -4.3464492591738235e-06, -4.249940502631944e-06, -4.153431746090064e-06, -4.056923444295535e-06, -3.960414687753655e-06, -3.863905931211775e-06, -3.767397629417246e-06, -3.6708888728753664e-06, -3.574380343707162e-06, -3.4778718145389576e-06, -3.381363285370753e-06, -3.2848545288288733e-06, -3.188345999660669e-06, -3.0918374704924645e-06, -2.99532894132426e-06, -2.8988201847823802e-06, -2.802311655614176e-06, -2.7058031264459714e-06, -2.609294597277767e-06, -2.512785840735887e-06, -2.4162773115676828e-06, -2.3197687823994784e-06, -2.223260253231274e-06, -2.126751496689394e-06, -2.0302429675211897e-06, -1.9337344383529853e-06, -1.8372257954979432e-06, -1.7407172663297388e-06, -1.6442086234746967e-06, -1.5477000943064922e-06, -1.4511914514514501e-06, -1.354682808596408e-06, -1.2581742794282036e-06, -1.1616656365731615e-06, -1.0651569937181193e-06, -9.68648464549915e-07, -8.721398216948728e-07, -7.756312356832495e-07, -6.791226496716263e-07, -5.826140068165842e-07, -4.861054208049609e-07, -3.895968347933376e-07, -2.9308824878171436e-07, -1.9657963434838166e-07, -1.0007101991504896e-07, -3.562433903425699e-09, 9.294615210819757e-08, 1.894547949632397e-07, 2.8596338097486296e-07, 3.824719669864862e-07]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 11.0, 0.0, 0.0, 25.0, 0.0, 43.0, 0.0, 0.0, 50.0, 0.0, 0.0, 82.0, 0.0, 102.0, 0.0, 0.0, 105.0, 0.0, 129.0, 0.0, 0.0, 123.0, 0.0, 111.0, 0.0, 0.0, 70.0, 0.0, 60.0, 0.0, 0.0, 34.0, 0.0, 0.0, 32.0, 0.0, 20.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.919726729393005e-07, -6.686896085739136e-07, -6.454065442085266e-07, -6.221234798431396e-07, -5.988404154777527e-07, -5.755573511123657e-07, -5.522742867469788e-07, -5.289912223815918e-07, -5.057081580162048e-07, -4.824250936508179e-07, -4.591420292854309e-07, -4.3585896492004395e-07, -4.12575900554657e-07, -3.8929283618927e-07, -3.6600977182388306e-07, -3.427267074584961e-07, -3.1944364309310913e-07, -2.9616057872772217e-07, -2.728775143623352e-07, -2.4959444999694824e-07, -2.2631138563156128e-07, -2.0302832126617432e-07, -1.7974525690078735e-07, -1.564621925354004e-07, -1.3317912817001343e-07, -1.0989606380462646e-07, -8.66129994392395e-08, -6.332993507385254e-08, -4.0046870708465576e-08, -1.6763806343078613e-08, 6.51925802230835e-09, 2.9802322387695312e-08, 5.3085386753082275e-08, 7.636845111846924e-08, 9.96515154838562e-08, 1.2293457984924316e-07, 1.4621764421463013e-07, 1.695007085800171e-07, 1.9278377294540405e-07, 2.1606683731079102e-07, 2.39349901676178e-07, 2.6263296604156494e-07, 2.859160304069519e-07, 3.0919909477233887e-07, 3.3248215913772583e-07, 3.557652235031128e-07, 3.7904828786849976e-07, 4.023313522338867e-07, 4.256144165992737e-07, 4.4889748096466064e-07, 4.721805453300476e-07, 4.954636096954346e-07, 5.187466740608215e-07, 5.420297384262085e-07, 5.653128027915955e-07, 5.885958671569824e-07, 6.118789315223694e-07, 6.351619958877563e-07, 6.584450602531433e-07, 6.817281246185303e-07, 7.050111889839172e-07, 7.282942533493042e-07, 7.515773177146912e-07, 7.748603820800781e-07]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 6.0, 7.0, 6.0, 6.0, 5.0, 12.0, 13.0, 15.0, 18.0, 27.0, 19.0, 20.0, 27.0, 40.0, 31.0, 20.0, 32.0, 43.0, 59.0, 41.0, 43.0, 40.0, 28.0, 32.0, 45.0, 36.0, 30.0, 28.0, 32.0, 29.0, 29.0, 27.0, 23.0, 18.0, 15.0, 20.0, 12.0, 19.0, 9.0, 8.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.22265625, -4.0892333984375, -3.955810546875, -3.8223876953125, -3.68896484375, -3.5555419921875, -3.422119140625, -3.2886962890625, -3.1552734375, -3.0218505859375, -2.888427734375, -2.7550048828125, -2.62158203125, -2.4881591796875, -2.354736328125, -2.2213134765625, -2.087890625, -1.9544677734375, -1.821044921875, -1.6876220703125, -1.55419921875, -1.4207763671875, -1.287353515625, -1.1539306640625, -1.0205078125, -0.8870849609375, -0.753662109375, -0.6202392578125, -0.48681640625, -0.3533935546875, -0.219970703125, -0.0865478515625, 0.046875, 0.1802978515625, 0.313720703125, 0.4471435546875, 0.58056640625, 0.7139892578125, 0.847412109375, 0.9808349609375, 1.1142578125, 1.2476806640625, 1.381103515625, 1.5145263671875, 1.64794921875, 1.7813720703125, 1.914794921875, 2.0482177734375, 2.181640625, 2.3150634765625, 2.448486328125, 2.5819091796875, 2.71533203125, 2.8487548828125, 2.982177734375, 3.1156005859375, 3.2490234375, 3.3824462890625, 3.515869140625, 3.6492919921875, 3.78271484375, 3.9161376953125, 4.049560546875, 4.1829833984375, 4.31640625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 13.0, 11.0, 21.0, 23.0, 38.0, 65.0, 86.0, 189.0, 263.0, 453.0, 894.0, 1492.0, 2650.0, 4720.0, 7926.0, 13092.0, 21233.0, 33767.0, 52910.0, 83317.0, 151240.0, 288023.0, 157131.0, 85789.0, 54096.0, 34384.0, 21909.0, 13444.0, 8049.0, 4782.0, 2736.0, 1634.0, 883.0, 516.0, 305.0, 179.0, 102.0, 67.0, 34.0, 20.0, 18.0, 16.0, 10.0, 11.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4921875, -5.328369140625, -5.16455078125, -5.000732421875, -4.8369140625, -4.673095703125, -4.50927734375, -4.345458984375, -4.181640625, -4.017822265625, -3.85400390625, -3.690185546875, -3.5263671875, -3.362548828125, -3.19873046875, -3.034912109375, -2.87109375, -2.707275390625, -2.54345703125, -2.379638671875, -2.2158203125, -2.052001953125, -1.88818359375, -1.724365234375, -1.560546875, -1.396728515625, -1.23291015625, -1.069091796875, -0.9052734375, -0.741455078125, -0.57763671875, -0.413818359375, -0.25, -0.086181640625, 0.07763671875, 0.241455078125, 0.4052734375, 0.569091796875, 0.73291015625, 0.896728515625, 1.060546875, 1.224365234375, 1.38818359375, 1.552001953125, 1.7158203125, 1.879638671875, 2.04345703125, 2.207275390625, 2.37109375, 2.534912109375, 2.69873046875, 2.862548828125, 3.0263671875, 3.190185546875, 3.35400390625, 3.517822265625, 3.681640625, 3.845458984375, 4.00927734375, 4.173095703125, 4.3369140625, 4.500732421875, 4.66455078125, 4.828369140625, 4.9921875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 16.0, 17.0, 9.0, 12.0, 21.0, 29.0, 27.0, 31.0, 30.0, 47.0, 58.0, 65.0, 93.0, 138.0, 232.0, 1397.0, 216.0, 149.0, 110.0, 77.0, 43.0, 49.0, 31.0, 28.0, 30.0, 26.0, 19.0, 15.0, 10.0, 12.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6015625, -15.1505126953125, -14.699462890625, -14.2484130859375, -13.79736328125, -13.3463134765625, -12.895263671875, -12.4442138671875, -11.9931640625, -11.5421142578125, -11.091064453125, -10.6400146484375, -10.18896484375, -9.7379150390625, -9.286865234375, -8.8358154296875, -8.384765625, -7.9337158203125, -7.482666015625, -7.0316162109375, -6.58056640625, -6.1295166015625, -5.678466796875, -5.2274169921875, -4.7763671875, -4.3253173828125, -3.874267578125, -3.4232177734375, -2.97216796875, -2.5211181640625, -2.070068359375, -1.6190185546875, -1.16796875, -0.7169189453125, -0.265869140625, 0.1851806640625, 0.63623046875, 1.0872802734375, 1.538330078125, 1.9893798828125, 2.4404296875, 2.8914794921875, 3.342529296875, 3.7935791015625, 4.24462890625, 4.6956787109375, 5.146728515625, 5.5977783203125, 6.048828125, 6.4998779296875, 6.950927734375, 7.4019775390625, 7.85302734375, 8.3040771484375, 8.755126953125, 9.2061767578125, 9.6572265625, 10.1082763671875, 10.559326171875, 11.0103759765625, 11.46142578125, 11.9124755859375, 12.363525390625, 12.8145751953125, 13.265625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 7.0, 9.0, 17.0, 24.0, 29.0, 24.0, 48.0, 65.0, 88.0, 134.0, 208.0, 300.0, 495.0, 1149.0, 4606.0, 24348.0, 157044.0, 1916928.0, 928284.0, 91607.0, 15126.0, 2955.0, 888.0, 423.0, 244.0, 164.0, 138.0, 86.0, 62.0, 54.0, 43.0, 27.0, 20.0, 11.0, 12.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.125, -13.6673583984375, -13.209716796875, -12.7520751953125, -12.29443359375, -11.8367919921875, -11.379150390625, -10.9215087890625, -10.4638671875, -10.0062255859375, -9.548583984375, -9.0909423828125, -8.63330078125, -8.1756591796875, -7.718017578125, -7.2603759765625, -6.802734375, -6.3450927734375, -5.887451171875, -5.4298095703125, -4.97216796875, -4.5145263671875, -4.056884765625, -3.5992431640625, -3.1416015625, -2.6839599609375, -2.226318359375, -1.7686767578125, -1.31103515625, -0.8533935546875, -0.395751953125, 0.0618896484375, 0.51953125, 0.9771728515625, 1.434814453125, 1.8924560546875, 2.35009765625, 2.8077392578125, 3.265380859375, 3.7230224609375, 4.1806640625, 4.6383056640625, 5.095947265625, 5.5535888671875, 6.01123046875, 6.4688720703125, 6.926513671875, 7.3841552734375, 7.841796875, 8.2994384765625, 8.757080078125, 9.2147216796875, 9.67236328125, 10.1300048828125, 10.587646484375, 11.0452880859375, 11.5029296875, 11.9605712890625, 12.418212890625, 12.8758544921875, 13.33349609375, 13.7911376953125, 14.248779296875, 14.7064208984375, 15.1640625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 45.0, 178.0, 308.0, 298.0, 158.0, 16.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.47114562988281, -65.18412780761719, -61.89710998535156, -58.6100959777832, -55.32307815551758, -52.03606033325195, -48.749046325683594, -45.46202850341797, -42.175010681152344, -38.88799285888672, -35.600975036621094, -32.313961029052734, -29.02694320678711, -25.739925384521484, -22.452909469604492, -19.1658935546875, -15.878875732421875, -12.591858863830566, -9.304841995239258, -6.017825126647949, -2.7308082580566406, 0.5562095642089844, 3.8432254791259766, 7.130241394042969, 10.417259216308594, 13.704276084899902, 16.99129295349121, 20.278308868408203, 23.565326690673828, 26.852344512939453, 30.139360427856445, 33.42637634277344, 36.71339416503906, 40.00041198730469, 43.28742980957031, 46.57444381713867, 49.8614616394043, 53.14847946166992, 56.43549346923828, 59.722511291503906, 63.00952911376953, 66.29654693603516, 69.58356475830078, 72.8705825805664, 76.1575927734375, 79.44461059570312, 82.73162841796875, 86.01864624023438, 89.3056640625, 92.59268188476562, 95.87969970703125, 99.16671752929688, 102.4537353515625, 105.74075317382812, 109.02776336669922, 112.31478118896484, 115.60179901123047, 118.8888168334961, 122.17583465576172, 125.46285247802734, 128.74986267089844, 132.03688049316406, 135.3238983154297, 138.6109161376953, 141.89793395996094]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 10.0, 9.0, 12.0, 17.0, 20.0, 22.0, 16.0, 19.0, 25.0, 25.0, 28.0, 37.0, 33.0, 38.0, 35.0, 36.0, 44.0, 44.0, 41.0, 46.0, 46.0, 41.0, 28.0, 37.0, 40.0, 34.0, 28.0, 33.0, 23.0, 23.0, 14.0, 12.0, 14.0, 17.0, 11.0, 12.0, 7.0, 9.0, 3.0, 2.0, 2.0, 7.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.44413375854492, -34.48119354248047, -33.51824951171875, -32.5553092956543, -31.592369079589844, -30.629426956176758, -29.666484832763672, -28.70354461669922, -27.740602493286133, -26.777660369873047, -25.814720153808594, -24.851778030395508, -23.888837814331055, -22.92589569091797, -21.962955474853516, -21.00001335144043, -20.037071228027344, -19.074129104614258, -18.111188888549805, -17.14824676513672, -16.185306549072266, -15.22236442565918, -14.25942325592041, -13.29648208618164, -12.333541870117188, -11.370600700378418, -10.407659530639648, -9.444717407226562, -8.481776237487793, -7.518835067749023, -6.555893898010254, -5.592952251434326, -4.630010604858398, -3.66706919670105, -2.704127788543701, -1.7411866188049316, -0.778245210647583, 0.18469619750976562, 1.1476373672485352, 2.110579013824463, 3.0735201835632324, 4.036461353302002, 4.99940299987793, 5.962344169616699, 6.925285339355469, 7.8882269859313965, 8.851167678833008, 9.814109802246094, 10.777050971984863, 11.739992141723633, 12.702933311462402, 13.665874481201172, 14.628816604614258, 15.591757774353027, 16.554698944091797, 17.517641067504883, 18.480581283569336, 19.443523406982422, 20.406463623046875, 21.36940574645996, 22.332345962524414, 23.2952880859375, 24.258228302001953, 25.22117042541504, 26.184112548828125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 3.0, 7.0, 11.0, 13.0, 10.0, 17.0, 15.0, 17.0, 18.0, 28.0, 28.0, 29.0, 28.0, 29.0, 33.0, 33.0, 36.0, 40.0, 35.0, 57.0, 36.0, 38.0, 37.0, 26.0, 37.0, 35.0, 42.0, 37.0, 26.0, 31.0, 23.0, 20.0, 12.0, 20.0, 16.0, 14.0, 21.0, 9.0, 3.0, 6.0, 7.0, 3.0, 7.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.8125, -3.67413330078125, -3.5357666015625, -3.39739990234375, -3.259033203125, -3.12066650390625, -2.9822998046875, -2.84393310546875, -2.70556640625, -2.56719970703125, -2.4288330078125, -2.29046630859375, -2.152099609375, -2.01373291015625, -1.8753662109375, -1.73699951171875, -1.5986328125, -1.46026611328125, -1.3218994140625, -1.18353271484375, -1.045166015625, -0.90679931640625, -0.7684326171875, -0.63006591796875, -0.49169921875, -0.35333251953125, -0.2149658203125, -0.07659912109375, 0.061767578125, 0.20013427734375, 0.3385009765625, 0.47686767578125, 0.615234375, 0.75360107421875, 0.8919677734375, 1.03033447265625, 1.168701171875, 1.30706787109375, 1.4454345703125, 1.58380126953125, 1.72216796875, 1.86053466796875, 1.9989013671875, 2.13726806640625, 2.275634765625, 2.41400146484375, 2.5523681640625, 2.69073486328125, 2.8291015625, 2.96746826171875, 3.1058349609375, 3.24420166015625, 3.382568359375, 3.52093505859375, 3.6593017578125, 3.79766845703125, 3.93603515625, 4.07440185546875, 4.2127685546875, 4.35113525390625, 4.489501953125, 4.62786865234375, 4.7662353515625, 4.90460205078125, 5.04296875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 11.0, 15.0, 22.0, 26.0, 30.0, 35.0, 43.0, 57.0, 76.0, 105.0, 142.0, 207.0, 389.0, 822.0, 16796.0, 3973194.0, 199106.0, 1763.0, 464.0, 283.0, 159.0, 129.0, 93.0, 50.0, 47.0, 43.0, 26.0, 30.0, 20.0, 16.0, 16.0, 12.0, 8.0, 4.0, 4.0, 4.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.75, -39.4228515625, -38.095703125, -36.7685546875, -35.44140625, -34.1142578125, -32.787109375, -31.4599609375, -30.1328125, -28.8056640625, -27.478515625, -26.1513671875, -24.82421875, -23.4970703125, -22.169921875, -20.8427734375, -19.515625, -18.1884765625, -16.861328125, -15.5341796875, -14.20703125, -12.8798828125, -11.552734375, -10.2255859375, -8.8984375, -7.5712890625, -6.244140625, -4.9169921875, -3.58984375, -2.2626953125, -0.935546875, 0.3916015625, 1.71875, 3.0458984375, 4.373046875, 5.7001953125, 7.02734375, 8.3544921875, 9.681640625, 11.0087890625, 12.3359375, 13.6630859375, 14.990234375, 16.3173828125, 17.64453125, 18.9716796875, 20.298828125, 21.6259765625, 22.953125, 24.2802734375, 25.607421875, 26.9345703125, 28.26171875, 29.5888671875, 30.916015625, 32.2431640625, 33.5703125, 34.8974609375, 36.224609375, 37.5517578125, 38.87890625, 40.2060546875, 41.533203125, 42.8603515625, 44.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 8.0, 12.0, 14.0, 18.0, 14.0, 28.0, 51.0, 72.0, 90.0, 130.0, 187.0, 256.0, 389.0, 547.0, 655.0, 454.0, 329.0, 237.0, 155.0, 136.0, 68.0, 53.0, 42.0, 29.0, 25.0, 13.0, 16.0, 8.0, 11.0, 4.0, 2.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.828125, -7.59918212890625, -7.3702392578125, -7.14129638671875, -6.912353515625, -6.68341064453125, -6.4544677734375, -6.22552490234375, -5.99658203125, -5.76763916015625, -5.5386962890625, -5.30975341796875, -5.080810546875, -4.85186767578125, -4.6229248046875, -4.39398193359375, -4.1650390625, -3.93609619140625, -3.7071533203125, -3.47821044921875, -3.249267578125, -3.02032470703125, -2.7913818359375, -2.56243896484375, -2.33349609375, -2.10455322265625, -1.8756103515625, -1.64666748046875, -1.417724609375, -1.18878173828125, -0.9598388671875, -0.73089599609375, -0.501953125, -0.27301025390625, -0.0440673828125, 0.18487548828125, 0.413818359375, 0.64276123046875, 0.8717041015625, 1.10064697265625, 1.32958984375, 1.55853271484375, 1.7874755859375, 2.01641845703125, 2.245361328125, 2.47430419921875, 2.7032470703125, 2.93218994140625, 3.1611328125, 3.39007568359375, 3.6190185546875, 3.84796142578125, 4.076904296875, 4.30584716796875, 4.5347900390625, 4.76373291015625, 4.99267578125, 5.22161865234375, 5.4505615234375, 5.67950439453125, 5.908447265625, 6.13739013671875, 6.3663330078125, 6.59527587890625, 6.82421875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 8.0, 18.0, 13.0, 14.0, 22.0, 47.0, 44.0, 58.0, 80.0, 147.0, 247.0, 413.0, 1185.0, 3991.0, 21577.0, 199882.0, 2917172.0, 964462.0, 71279.0, 9792.0, 2205.0, 748.0, 307.0, 169.0, 105.0, 78.0, 43.0, 46.0, 26.0, 24.0, 15.0, 18.0, 12.0, 10.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.90625, -17.376220703125, -16.84619140625, -16.316162109375, -15.7861328125, -15.256103515625, -14.72607421875, -14.196044921875, -13.666015625, -13.135986328125, -12.60595703125, -12.075927734375, -11.5458984375, -11.015869140625, -10.48583984375, -9.955810546875, -9.42578125, -8.895751953125, -8.36572265625, -7.835693359375, -7.3056640625, -6.775634765625, -6.24560546875, -5.715576171875, -5.185546875, -4.655517578125, -4.12548828125, -3.595458984375, -3.0654296875, -2.535400390625, -2.00537109375, -1.475341796875, -0.9453125, -0.415283203125, 0.11474609375, 0.644775390625, 1.1748046875, 1.704833984375, 2.23486328125, 2.764892578125, 3.294921875, 3.824951171875, 4.35498046875, 4.885009765625, 5.4150390625, 5.945068359375, 6.47509765625, 7.005126953125, 7.53515625, 8.065185546875, 8.59521484375, 9.125244140625, 9.6552734375, 10.185302734375, 10.71533203125, 11.245361328125, 11.775390625, 12.305419921875, 12.83544921875, 13.365478515625, 13.8955078125, 14.425537109375, 14.95556640625, 15.485595703125, 16.015625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 37.0, 179.0, 302.0, 296.0, 129.0, 55.0, 7.0, 1.0, 2.0], "bins": [-172.10218811035156, -169.1282501220703, -166.15431213378906, -163.1803741455078, -160.20643615722656, -157.23251342773438, -154.25857543945312, -151.28463745117188, -148.31069946289062, -145.33676147460938, -142.36282348632812, -139.38888549804688, -136.41494750976562, -133.44100952148438, -130.46707153320312, -127.4931411743164, -124.51920318603516, -121.5452651977539, -118.57132720947266, -115.59739685058594, -112.62345886230469, -109.64952087402344, -106.67558288574219, -103.70164489746094, -100.72770690917969, -97.75376892089844, -94.77983093261719, -91.80589294433594, -88.83196258544922, -85.85802459716797, -82.88408660888672, -79.91014862060547, -76.93622589111328, -73.96228790283203, -70.98834991455078, -68.01441955566406, -65.04048156738281, -62.06654357910156, -59.09260559082031, -56.11866760253906, -53.14472961425781, -50.17079162597656, -47.19685745239258, -44.22291946411133, -41.248985290527344, -38.275047302246094, -35.301109313964844, -32.327171325683594, -29.353239059448242, -26.379302978515625, -23.405364990234375, -20.431428909301758, -17.45749282836914, -14.483556747436523, -11.509618759155273, -8.535682678222656, -5.561746597290039, -2.5878100395202637, 0.3861265182495117, 3.3600635528564453, 6.3339996337890625, 9.30793571472168, 12.28187370300293, 15.255809783935547, 18.229745864868164]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 9.0, 7.0, 12.0, 13.0, 14.0, 12.0, 20.0, 17.0, 23.0, 28.0, 33.0, 32.0, 51.0, 38.0, 35.0, 33.0, 47.0, 43.0, 39.0, 45.0, 35.0, 42.0, 36.0, 34.0, 34.0, 27.0, 23.0, 36.0, 26.0, 22.0, 22.0, 15.0, 17.0, 13.0, 10.0, 14.0, 6.0, 6.0, 8.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.676143646240234, -21.95744514465332, -21.238746643066406, -20.520048141479492, -19.801349639892578, -19.082651138305664, -18.36395263671875, -17.645254135131836, -16.926555633544922, -16.207857131958008, -15.489158630371094, -14.77046012878418, -14.051761627197266, -13.333063125610352, -12.614364624023438, -11.895666122436523, -11.176968574523926, -10.458270072937012, -9.739571571350098, -9.020873069763184, -8.30217456817627, -7.5834760665893555, -6.8647780418396, -6.1460795402526855, -5.4273810386657715, -4.708682537078857, -3.9899840354919434, -3.2712857723236084, -2.5525872707366943, -1.8338887691497803, -1.1151905059814453, -0.39649200439453125, 0.3222064971923828, 1.0409049987792969, 1.7596033811569214, 2.478301763534546, 3.19700026512146, 3.915698766708374, 4.634397029876709, 5.353095531463623, 6.071794033050537, 6.790492534637451, 7.509191036224365, 8.227889060974121, 8.946587562561035, 9.66528606414795, 10.383984565734863, 11.102683067321777, 11.821381568908691, 12.540080070495605, 13.25877857208252, 13.977477073669434, 14.696175575256348, 15.414874076843262, 16.13357162475586, 16.852270126342773, 17.570968627929688, 18.2896671295166, 19.008365631103516, 19.72706413269043, 20.445762634277344, 21.164461135864258, 21.883159637451172, 22.601858139038086, 23.320556640625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 7.0, 4.0, 7.0, 10.0, 15.0, 14.0, 14.0, 23.0, 25.0, 27.0, 21.0, 34.0, 32.0, 29.0, 38.0, 41.0, 43.0, 51.0, 50.0, 36.0, 38.0, 34.0, 33.0, 31.0, 36.0, 36.0, 29.0, 28.0, 28.0, 32.0, 16.0, 18.0, 19.0, 16.0, 15.0, 14.0, 5.0, 12.0, 4.0, 6.0, 4.0, 11.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.1484375, -4.00909423828125, -3.8697509765625, -3.73040771484375, -3.591064453125, -3.45172119140625, -3.3123779296875, -3.17303466796875, -3.03369140625, -2.89434814453125, -2.7550048828125, -2.61566162109375, -2.476318359375, -2.33697509765625, -2.1976318359375, -2.05828857421875, -1.9189453125, -1.77960205078125, -1.6402587890625, -1.50091552734375, -1.361572265625, -1.22222900390625, -1.0828857421875, -0.94354248046875, -0.80419921875, -0.66485595703125, -0.5255126953125, -0.38616943359375, -0.246826171875, -0.10748291015625, 0.0318603515625, 0.17120361328125, 0.310546875, 0.44989013671875, 0.5892333984375, 0.72857666015625, 0.867919921875, 1.00726318359375, 1.1466064453125, 1.28594970703125, 1.42529296875, 1.56463623046875, 1.7039794921875, 1.84332275390625, 1.982666015625, 2.12200927734375, 2.2613525390625, 2.40069580078125, 2.5400390625, 2.67938232421875, 2.8187255859375, 2.95806884765625, 3.097412109375, 3.23675537109375, 3.3760986328125, 3.51544189453125, 3.65478515625, 3.79412841796875, 3.9334716796875, 4.07281494140625, 4.212158203125, 4.35150146484375, 4.4908447265625, 4.63018798828125, 4.76953125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 8.0, 10.0, 33.0, 21.0, 31.0, 57.0, 93.0, 143.0, 220.0, 306.0, 463.0, 759.0, 1198.0, 1901.0, 2732.0, 4030.0, 6488.0, 9976.0, 15393.0, 24398.0, 38855.0, 64982.0, 120141.0, 317284.0, 201134.0, 93519.0, 53667.0, 32691.0, 20325.0, 13120.0, 8580.0, 5492.0, 3568.0, 2426.0, 1577.0, 1044.0, 626.0, 425.0, 299.0, 200.0, 119.0, 69.0, 48.0, 35.0, 23.0, 13.0, 15.0, 9.0, 10.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.1920166015625, -0.1863384246826172, -0.18066024780273438, -0.17498207092285156, -0.16930389404296875, -0.16362571716308594, -0.15794754028320312, -0.1522693634033203, -0.1465911865234375, -0.1409130096435547, -0.13523483276367188, -0.12955665588378906, -0.12387847900390625, -0.11820030212402344, -0.11252212524414062, -0.10684394836425781, -0.101165771484375, -0.09548759460449219, -0.08980941772460938, -0.08413124084472656, -0.07845306396484375, -0.07277488708496094, -0.06709671020507812, -0.06141853332519531, -0.0557403564453125, -0.05006217956542969, -0.044384002685546875, -0.03870582580566406, -0.03302764892578125, -0.027349472045898438, -0.021671295166015625, -0.015993118286132812, -0.01031494140625, -0.0046367645263671875, 0.001041412353515625, 0.0067195892333984375, 0.01239776611328125, 0.018075942993164062, 0.023754119873046875, 0.029432296752929688, 0.0351104736328125, 0.04078865051269531, 0.046466827392578125, 0.05214500427246094, 0.05782318115234375, 0.06350135803222656, 0.06917953491210938, 0.07485771179199219, 0.080535888671875, 0.08621406555175781, 0.09189224243164062, 0.09757041931152344, 0.10324859619140625, 0.10892677307128906, 0.11460494995117188, 0.12028312683105469, 0.1259613037109375, 0.1316394805908203, 0.13731765747070312, 0.14299583435058594, 0.14867401123046875, 0.15435218811035156, 0.16003036499023438, 0.1657085418701172, 0.17138671875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 3.0, 4.0, 10.0, 13.0, 15.0, 12.0, 17.0, 13.0, 27.0, 21.0, 26.0, 40.0, 28.0, 36.0, 47.0, 47.0, 41.0, 47.0, 46.0, 1066.0, 39.0, 35.0, 31.0, 39.0, 44.0, 26.0, 28.0, 37.0, 27.0, 18.0, 24.0, 15.0, 18.0, 19.0, 16.0, 7.0, 12.0, 10.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.369140625, -3.26409912109375, -3.1590576171875, -3.05401611328125, -2.948974609375, -2.84393310546875, -2.7388916015625, -2.63385009765625, -2.52880859375, -2.42376708984375, -2.3187255859375, -2.21368408203125, -2.108642578125, -2.00360107421875, -1.8985595703125, -1.79351806640625, -1.6884765625, -1.58343505859375, -1.4783935546875, -1.37335205078125, -1.268310546875, -1.16326904296875, -1.0582275390625, -0.95318603515625, -0.84814453125, -0.74310302734375, -0.6380615234375, -0.53302001953125, -0.427978515625, -0.32293701171875, -0.2178955078125, -0.11285400390625, -0.0078125, 0.09722900390625, 0.2022705078125, 0.30731201171875, 0.412353515625, 0.51739501953125, 0.6224365234375, 0.72747802734375, 0.83251953125, 0.93756103515625, 1.0426025390625, 1.14764404296875, 1.252685546875, 1.35772705078125, 1.4627685546875, 1.56781005859375, 1.6728515625, 1.77789306640625, 1.8829345703125, 1.98797607421875, 2.093017578125, 2.19805908203125, 2.3031005859375, 2.40814208984375, 2.51318359375, 2.61822509765625, 2.7232666015625, 2.82830810546875, 2.933349609375, 3.03839111328125, 3.1434326171875, 3.24847412109375, 3.353515625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 20.0, 19.0, 34.0, 44.0, 72.0, 99.0, 156.0, 197.0, 334.0, 454.0, 672.0, 983.0, 1572.0, 2237.0, 3381.0, 4945.0, 7392.0, 10949.0, 16328.0, 25086.0, 39127.0, 64457.0, 112763.0, 1319746.0, 218223.0, 102641.0, 59360.0, 36160.0, 22992.0, 15250.0, 10132.0, 6976.0, 4547.0, 3088.0, 2221.0, 1442.0, 981.0, 664.0, 460.0, 289.0, 231.0, 127.0, 80.0, 61.0, 43.0, 27.0, 26.0, 10.0, 12.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0965576171875, -0.09353256225585938, -0.09050750732421875, -0.08748245239257812, -0.0844573974609375, -0.08143234252929688, -0.07840728759765625, -0.07538223266601562, -0.072357177734375, -0.06933212280273438, -0.06630706787109375, -0.06328201293945312, -0.0602569580078125, -0.057231903076171875, -0.05420684814453125, -0.051181793212890625, -0.04815673828125, -0.045131683349609375, -0.04210662841796875, -0.039081573486328125, -0.0360565185546875, -0.033031463623046875, -0.03000640869140625, -0.026981353759765625, -0.023956298828125, -0.020931243896484375, -0.01790618896484375, -0.014881134033203125, -0.0118560791015625, -0.008831024169921875, -0.00580596923828125, -0.002780914306640625, 0.000244140625, 0.003269195556640625, 0.00629425048828125, 0.009319305419921875, 0.0123443603515625, 0.015369415283203125, 0.01839447021484375, 0.021419525146484375, 0.024444580078125, 0.027469635009765625, 0.03049468994140625, 0.033519744873046875, 0.0365447998046875, 0.039569854736328125, 0.04259490966796875, 0.045619964599609375, 0.04864501953125, 0.051670074462890625, 0.05469512939453125, 0.057720184326171875, 0.0607452392578125, 0.06377029418945312, 0.06679534912109375, 0.06982040405273438, 0.072845458984375, 0.07587051391601562, 0.07889556884765625, 0.08192062377929688, 0.0849456787109375, 0.08797073364257812, 0.09099578857421875, 0.09402084350585938, 0.0970458984375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 6.0, 4.0, 3.0, 5.0, 8.0, 8.0, 8.0, 10.0, 6.0, 9.0, 9.0, 13.0, 11.0, 17.0, 13.0, 20.0, 22.0, 17.0, 72.0, 57.0, 104.0, 219.0, 92.0, 55.0, 46.0, 18.0, 19.0, 18.0, 19.0, 22.0, 5.0, 8.0, 9.0, 6.0, 12.0, 5.0, 5.0, 4.0, 3.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5441328287124634e-06, -1.4789402484893799e-06, -1.4137476682662964e-06, -1.3485550880432129e-06, -1.2833625078201294e-06, -1.218169927597046e-06, -1.1529773473739624e-06, -1.087784767150879e-06, -1.0225921869277954e-06, -9.57399606704712e-07, -8.922070264816284e-07, -8.270144462585449e-07, -7.618218660354614e-07, -6.966292858123779e-07, -6.314367055892944e-07, -5.662441253662109e-07, -5.010515451431274e-07, -4.3585896492004395e-07, -3.7066638469696045e-07, -3.0547380447387695e-07, -2.4028122425079346e-07, -1.7508864402770996e-07, -1.0989606380462646e-07, -4.470348358154297e-08, 2.0489096641540527e-08, 8.568167686462402e-08, 1.5087425708770752e-07, 2.1606683731079102e-07, 2.812594175338745e-07, 3.46451997756958e-07, 4.116445779800415e-07, 4.76837158203125e-07, 5.420297384262085e-07, 6.07222318649292e-07, 6.724148988723755e-07, 7.37607479095459e-07, 8.028000593185425e-07, 8.67992639541626e-07, 9.331852197647095e-07, 9.98377799987793e-07, 1.0635703802108765e-06, 1.12876296043396e-06, 1.1939555406570435e-06, 1.259148120880127e-06, 1.3243407011032104e-06, 1.389533281326294e-06, 1.4547258615493774e-06, 1.519918441772461e-06, 1.5851110219955444e-06, 1.650303602218628e-06, 1.7154961824417114e-06, 1.780688762664795e-06, 1.8458813428878784e-06, 1.911073923110962e-06, 1.9762665033340454e-06, 2.041459083557129e-06, 2.1066516637802124e-06, 2.171844244003296e-06, 2.2370368242263794e-06, 2.302229404449463e-06, 2.3674219846725464e-06, 2.43261456489563e-06, 2.4978071451187134e-06, 2.562999725341797e-06]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 6.0, 5.0, 5.0, 5.0, 5.0, 13.0, 14.0, 19.0, 28.0, 43.0, 45.0, 45.0, 84.0, 136.0, 214.0, 469.0, 10905.0, 1007587.0, 27412.0, 689.0, 258.0, 144.0, 105.0, 69.0, 42.0, 40.0, 31.0, 25.0, 22.0, 12.0, 10.0, 4.0, 5.0, 7.0, 12.0, 5.0, 4.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0], "bins": [-5.352497100830078e-05, -5.2138231694698334e-05, -5.0751492381095886e-05, -4.936475306749344e-05, -4.797801375389099e-05, -4.6591274440288544e-05, -4.5204535126686096e-05, -4.381779581308365e-05, -4.24310564994812e-05, -4.1044317185878754e-05, -3.9657577872276306e-05, -3.827083855867386e-05, -3.688409924507141e-05, -3.5497359931468964e-05, -3.4110620617866516e-05, -3.272388130426407e-05, -3.133714199066162e-05, -2.9950402677059174e-05, -2.8563663363456726e-05, -2.717692404985428e-05, -2.579018473625183e-05, -2.4403445422649384e-05, -2.3016706109046936e-05, -2.162996679544449e-05, -2.024322748184204e-05, -1.8856488168239594e-05, -1.7469748854637146e-05, -1.60830095410347e-05, -1.4696270227432251e-05, -1.3309530913829803e-05, -1.1922791600227356e-05, -1.0536052286624908e-05, -9.149312973022461e-06, -7.762573659420013e-06, -6.375834345817566e-06, -4.989095032215118e-06, -3.602355718612671e-06, -2.2156164050102234e-06, -8.288770914077759e-07, 5.578622221946716e-07, 1.944601535797119e-06, 3.3313408493995667e-06, 4.718080163002014e-06, 6.104819476604462e-06, 7.491558790206909e-06, 8.878298103809357e-06, 1.0265037417411804e-05, 1.1651776731014252e-05, 1.30385160446167e-05, 1.4425255358219147e-05, 1.5811994671821594e-05, 1.7198733985424042e-05, 1.858547329902649e-05, 1.9972212612628937e-05, 2.1358951926231384e-05, 2.2745691239833832e-05, 2.413243055343628e-05, 2.5519169867038727e-05, 2.6905909180641174e-05, 2.8292648494243622e-05, 2.967938780784607e-05, 3.106612712144852e-05, 3.2452866435050964e-05, 3.383960574865341e-05, 3.522634506225586e-05]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 16.0, 60.0, 224.0, 462.0, 205.0, 39.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.366380595565715e-07, -7.908117822807981e-07, -6.449855618484435e-07, -4.9915928457267e-07, -3.5333300729689654e-07, -2.0750673002112308e-07, -6.168050958876847e-08, 8.414582453042385e-08, 2.2997204496277845e-07, 3.757983222385519e-07, 5.216245426709065e-07, 6.6745081994668e-07, 8.132770972224534e-07, 9.59103317654808e-07, 1.1049296517740004e-06, 1.2507559858931927e-06, 1.3965820926387096e-06, 1.5424083130710642e-06, 1.6882346471902565e-06, 1.8340608676226111e-06, 1.9798872017418034e-06, 2.1257133084873203e-06, 2.2715396426065126e-06, 2.417365976725705e-06, 2.5631923108448973e-06, 2.7090186449640896e-06, 2.8548447517096065e-06, 3.000671085828799e-06, 3.146497419947991e-06, 3.292323526693508e-06, 3.4381498608127004e-06, 3.5839761949318927e-06, 3.7298027564247604e-06, 3.875628863170277e-06, 4.021455424663145e-06, 4.167281531408662e-06, 4.313107638154179e-06, 4.458934199647047e-06, 4.6047603063925635e-06, 4.75058641313808e-06, 4.896412974630948e-06, 5.042239081376465e-06, 5.188065642869333e-06, 5.33389174961485e-06, 5.4797178563603666e-06, 5.625544417853234e-06, 5.771370524598751e-06, 5.917197086091619e-06, 6.063022738089785e-06, 6.208848844835302e-06, 6.35467540632817e-06, 6.5005015130736865e-06, 6.646327619819203e-06, 6.792154181312071e-06, 6.937980288057588e-06, 7.083806849550456e-06, 7.229632956295973e-06, 7.3754590630414896e-06, 7.521285624534357e-06, 7.667111276532523e-06, 7.812937838025391e-06, 7.958764399518259e-06, 8.104590961011127e-06, 8.250416613009293e-06, 8.39624317450216e-06]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 0.0, 5.0, 15.0, 0.0, 23.0, 0.0, 25.0, 0.0, 43.0, 72.0, 0.0, 118.0, 0.0, 132.0, 0.0, 131.0, 0.0, 106.0, 108.0, 0.0, 92.0, 0.0, 47.0, 0.0, 44.0, 17.0, 0.0, 10.0, 0.0, 12.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.797513484954834e-07, -9.462237358093262e-07, -9.126961231231689e-07, -8.791685104370117e-07, -8.456408977508545e-07, -8.121132850646973e-07, -7.7858567237854e-07, -7.450580596923828e-07, -7.115304470062256e-07, -6.780028343200684e-07, -6.444752216339111e-07, -6.109476089477539e-07, -5.774199962615967e-07, -5.438923835754395e-07, -5.103647708892822e-07, -4.76837158203125e-07, -4.4330954551696777e-07, -4.0978193283081055e-07, -3.762543201446533e-07, -3.427267074584961e-07, -3.0919909477233887e-07, -2.7567148208618164e-07, -2.421438694000244e-07, -2.086162567138672e-07, -1.7508864402770996e-07, -1.4156103134155273e-07, -1.0803341865539551e-07, -7.450580596923828e-08, -4.0978193283081055e-08, -7.450580596923828e-09, 2.60770320892334e-08, 5.960464477539063e-08, 9.313225746154785e-08, 1.2665987014770508e-07, 1.601874828338623e-07, 1.9371509552001953e-07, 2.2724270820617676e-07, 2.60770320892334e-07, 2.942979335784912e-07, 3.2782554626464844e-07, 3.6135315895080566e-07, 3.948807716369629e-07, 4.284083843231201e-07, 4.6193599700927734e-07, 4.954636096954346e-07, 5.289912223815918e-07, 5.62518835067749e-07, 5.960464477539062e-07, 6.295740604400635e-07, 6.631016731262207e-07, 6.966292858123779e-07, 7.301568984985352e-07, 7.636845111846924e-07, 7.972121238708496e-07, 8.307397365570068e-07, 8.642673492431641e-07, 8.977949619293213e-07, 9.313225746154785e-07, 9.648501873016357e-07, 9.98377799987793e-07, 1.0319054126739502e-06, 1.0654330253601074e-06, 1.0989606380462646e-06, 1.1324882507324219e-06]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 7.0, 4.0, 7.0, 10.0, 15.0, 14.0, 14.0, 23.0, 25.0, 27.0, 21.0, 34.0, 32.0, 29.0, 38.0, 41.0, 43.0, 51.0, 50.0, 36.0, 38.0, 34.0, 33.0, 31.0, 36.0, 36.0, 29.0, 28.0, 28.0, 32.0, 16.0, 18.0, 19.0, 16.0, 15.0, 14.0, 5.0, 12.0, 4.0, 6.0, 4.0, 11.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.1484375, -4.00909423828125, -3.8697509765625, -3.73040771484375, -3.591064453125, -3.45172119140625, -3.3123779296875, -3.17303466796875, -3.03369140625, -2.89434814453125, -2.7550048828125, -2.61566162109375, -2.476318359375, -2.33697509765625, -2.1976318359375, -2.05828857421875, -1.9189453125, -1.77960205078125, -1.6402587890625, -1.50091552734375, -1.361572265625, -1.22222900390625, -1.0828857421875, -0.94354248046875, -0.80419921875, -0.66485595703125, -0.5255126953125, -0.38616943359375, -0.246826171875, -0.10748291015625, 0.0318603515625, 0.17120361328125, 0.310546875, 0.44989013671875, 0.5892333984375, 0.72857666015625, 0.867919921875, 1.00726318359375, 1.1466064453125, 1.28594970703125, 1.42529296875, 1.56463623046875, 1.7039794921875, 1.84332275390625, 1.982666015625, 2.12200927734375, 2.2613525390625, 2.40069580078125, 2.5400390625, 2.67938232421875, 2.8187255859375, 2.95806884765625, 3.097412109375, 3.23675537109375, 3.3760986328125, 3.51544189453125, 3.65478515625, 3.79412841796875, 3.9334716796875, 4.07281494140625, 4.212158203125, 4.35150146484375, 4.4908447265625, 4.63018798828125, 4.76953125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 2.0, 9.0, 9.0, 7.0, 11.0, 18.0, 27.0, 38.0, 63.0, 92.0, 102.0, 187.0, 291.0, 477.0, 868.0, 1560.0, 3051.0, 6201.0, 11730.0, 22796.0, 45198.0, 87821.0, 165870.0, 264947.0, 206847.0, 111424.0, 58280.0, 29391.0, 14987.0, 7736.0, 3817.0, 2024.0, 1061.0, 615.0, 328.0, 217.0, 137.0, 102.0, 68.0, 40.0, 36.0, 15.0, 13.0, 16.0, 6.0, 12.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.33203125, -6.12567138671875, -5.9193115234375, -5.71295166015625, -5.506591796875, -5.30023193359375, -5.0938720703125, -4.88751220703125, -4.68115234375, -4.47479248046875, -4.2684326171875, -4.06207275390625, -3.855712890625, -3.64935302734375, -3.4429931640625, -3.23663330078125, -3.0302734375, -2.82391357421875, -2.6175537109375, -2.41119384765625, -2.204833984375, -1.99847412109375, -1.7921142578125, -1.58575439453125, -1.37939453125, -1.17303466796875, -0.9666748046875, -0.76031494140625, -0.553955078125, -0.34759521484375, -0.1412353515625, 0.06512451171875, 0.271484375, 0.47784423828125, 0.6842041015625, 0.89056396484375, 1.096923828125, 1.30328369140625, 1.5096435546875, 1.71600341796875, 1.92236328125, 2.12872314453125, 2.3350830078125, 2.54144287109375, 2.747802734375, 2.95416259765625, 3.1605224609375, 3.36688232421875, 3.5732421875, 3.77960205078125, 3.9859619140625, 4.19232177734375, 4.398681640625, 4.60504150390625, 4.8114013671875, 5.01776123046875, 5.22412109375, 5.43048095703125, 5.6368408203125, 5.84320068359375, 6.049560546875, 6.25592041015625, 6.4622802734375, 6.66864013671875, 6.875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 7.0, 6.0, 9.0, 14.0, 14.0, 21.0, 19.0, 27.0, 43.0, 39.0, 38.0, 65.0, 78.0, 135.0, 228.0, 1341.0, 265.0, 199.0, 110.0, 86.0, 56.0, 36.0, 31.0, 35.0, 21.0, 27.0, 16.0, 23.0, 15.0, 9.0, 12.0, 4.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.875, -10.454833984375, -10.03466796875, -9.614501953125, -9.1943359375, -8.774169921875, -8.35400390625, -7.933837890625, -7.513671875, -7.093505859375, -6.67333984375, -6.253173828125, -5.8330078125, -5.412841796875, -4.99267578125, -4.572509765625, -4.15234375, -3.732177734375, -3.31201171875, -2.891845703125, -2.4716796875, -2.051513671875, -1.63134765625, -1.211181640625, -0.791015625, -0.370849609375, 0.04931640625, 0.469482421875, 0.8896484375, 1.309814453125, 1.72998046875, 2.150146484375, 2.5703125, 2.990478515625, 3.41064453125, 3.830810546875, 4.2509765625, 4.671142578125, 5.09130859375, 5.511474609375, 5.931640625, 6.351806640625, 6.77197265625, 7.192138671875, 7.6123046875, 8.032470703125, 8.45263671875, 8.872802734375, 9.29296875, 9.713134765625, 10.13330078125, 10.553466796875, 10.9736328125, 11.393798828125, 11.81396484375, 12.234130859375, 12.654296875, 13.074462890625, 13.49462890625, 13.914794921875, 14.3349609375, 14.755126953125, 15.17529296875, 15.595458984375, 16.015625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 11.0, 8.0, 9.0, 20.0, 22.0, 27.0, 41.0, 69.0, 88.0, 128.0, 195.0, 406.0, 669.0, 1815.0, 75357.0, 3049194.0, 14881.0, 1316.0, 560.0, 292.0, 213.0, 133.0, 77.0, 46.0, 40.0, 27.0, 19.0, 15.0, 7.0, 4.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.84375, -51.46630859375, -50.0888671875, -48.71142578125, -47.333984375, -45.95654296875, -44.5791015625, -43.20166015625, -41.82421875, -40.44677734375, -39.0693359375, -37.69189453125, -36.314453125, -34.93701171875, -33.5595703125, -32.18212890625, -30.8046875, -29.42724609375, -28.0498046875, -26.67236328125, -25.294921875, -23.91748046875, -22.5400390625, -21.16259765625, -19.78515625, -18.40771484375, -17.0302734375, -15.65283203125, -14.275390625, -12.89794921875, -11.5205078125, -10.14306640625, -8.765625, -7.38818359375, -6.0107421875, -4.63330078125, -3.255859375, -1.87841796875, -0.5009765625, 0.87646484375, 2.25390625, 3.63134765625, 5.0087890625, 6.38623046875, 7.763671875, 9.14111328125, 10.5185546875, 11.89599609375, 13.2734375, 14.65087890625, 16.0283203125, 17.40576171875, 18.783203125, 20.16064453125, 21.5380859375, 22.91552734375, 24.29296875, 25.67041015625, 27.0478515625, 28.42529296875, 29.802734375, 31.18017578125, 32.5576171875, 33.93505859375, 35.3125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 27.0, 73.0, 178.0, 244.0, 248.0, 143.0, 75.0, 15.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.38157653808594, -36.541175842285156, -33.700775146484375, -30.860374450683594, -28.019973754882812, -25.17957305908203, -22.339170455932617, -19.498769760131836, -16.658369064331055, -13.817968368530273, -10.977567672729492, -8.137166023254395, -5.296765327453613, -2.456364631652832, 0.3840370178222656, 3.224437713623047, 6.064838409423828, 8.90523910522461, 11.74563980102539, 14.586041450500488, 17.426441192626953, 20.266841888427734, 23.10724449157715, 25.94764518737793, 28.78804588317871, 31.628446578979492, 34.468849182128906, 37.30924987792969, 40.14965057373047, 42.99005126953125, 45.83045196533203, 48.67085266113281, 51.511253356933594, 54.351654052734375, 57.192054748535156, 60.03245544433594, 62.87285614013672, 65.7132568359375, 68.55365753173828, 71.39405822753906, 74.23445892333984, 77.07485961914062, 79.9152603149414, 82.75566101074219, 85.59606170654297, 88.43646240234375, 91.27686309814453, 94.11726379394531, 96.95767211914062, 99.7980728149414, 102.63847351074219, 105.47887420654297, 108.31927490234375, 111.15967559814453, 114.00007629394531, 116.8404769897461, 119.68087768554688, 122.52127838134766, 125.36167907714844, 128.20208740234375, 131.04248046875, 133.8828887939453, 136.72328186035156, 139.56369018554688, 142.40408325195312]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 13.0, 8.0, 15.0, 18.0, 13.0, 23.0, 16.0, 16.0, 24.0, 29.0, 35.0, 41.0, 43.0, 44.0, 46.0, 49.0, 50.0, 46.0, 37.0, 60.0, 43.0, 38.0, 30.0, 28.0, 31.0, 28.0, 18.0, 21.0, 16.0, 12.0, 19.0, 16.0, 20.0, 13.0, 6.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.38334655761719, -36.24794006347656, -35.1125373840332, -33.97713088989258, -32.84172821044922, -31.706321716308594, -30.5709171295166, -29.43551254272461, -28.300107955932617, -27.164703369140625, -26.029298782348633, -24.89389419555664, -23.758487701416016, -22.623085021972656, -21.48767852783203, -20.35227394104004, -19.216869354248047, -18.081464767456055, -16.946060180664062, -15.810654640197754, -14.675250053405762, -13.53984546661377, -12.404439926147461, -11.269035339355469, -10.133630752563477, -8.998226165771484, -7.862821102142334, -6.727416038513184, -5.592011451721191, -4.456606864929199, -3.321201801300049, -2.1857967376708984, -1.0503921508789062, 0.08501267433166504, 1.2204174995422363, 2.3558223247528076, 3.491227149963379, 4.626631736755371, 5.7620368003845215, 6.897441864013672, 8.032846450805664, 9.168251037597656, 10.303655624389648, 11.439061164855957, 12.57446575164795, 13.709870338439941, 14.84527587890625, 15.980680465698242, 17.116085052490234, 18.251489639282227, 19.38689422607422, 20.52229881286621, 21.657703399658203, 22.793109893798828, 23.92851448059082, 25.063919067382812, 26.199323654174805, 27.334728240966797, 28.47013282775879, 29.60553741455078, 30.740943908691406, 31.876346588134766, 33.01175308227539, 34.14715576171875, 35.282562255859375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 10.0, 7.0, 10.0, 11.0, 17.0, 18.0, 11.0, 17.0, 22.0, 32.0, 34.0, 22.0, 28.0, 38.0, 42.0, 45.0, 51.0, 49.0, 41.0, 28.0, 39.0, 39.0, 32.0, 44.0, 24.0, 20.0, 39.0, 32.0, 23.0, 33.0, 16.0, 15.0, 17.0, 12.0, 12.0, 15.0, 8.0, 17.0, 7.0, 2.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.12109375, -3.98046875, -3.83984375, -3.69921875, -3.55859375, -3.41796875, -3.27734375, -3.13671875, -2.99609375, -2.85546875, -2.71484375, -2.57421875, -2.43359375, -2.29296875, -2.15234375, -2.01171875, -1.87109375, -1.73046875, -1.58984375, -1.44921875, -1.30859375, -1.16796875, -1.02734375, -0.88671875, -0.74609375, -0.60546875, -0.46484375, -0.32421875, -0.18359375, -0.04296875, 0.09765625, 0.23828125, 0.37890625, 0.51953125, 0.66015625, 0.80078125, 0.94140625, 1.08203125, 1.22265625, 1.36328125, 1.50390625, 1.64453125, 1.78515625, 1.92578125, 2.06640625, 2.20703125, 2.34765625, 2.48828125, 2.62890625, 2.76953125, 2.91015625, 3.05078125, 3.19140625, 3.33203125, 3.47265625, 3.61328125, 3.75390625, 3.89453125, 4.03515625, 4.17578125, 4.31640625, 4.45703125, 4.59765625, 4.73828125, 4.87890625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 5.0, 8.0, 13.0, 23.0, 53.0, 116.0, 387.0, 1482.0, 7013.0, 54494.0, 1591454.0, 2447779.0, 79336.0, 9422.0, 1903.0, 470.0, 169.0, 75.0, 31.0, 9.0, 10.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.75, -16.173828125, -15.59765625, -15.021484375, -14.4453125, -13.869140625, -13.29296875, -12.716796875, -12.140625, -11.564453125, -10.98828125, -10.412109375, -9.8359375, -9.259765625, -8.68359375, -8.107421875, -7.53125, -6.955078125, -6.37890625, -5.802734375, -5.2265625, -4.650390625, -4.07421875, -3.498046875, -2.921875, -2.345703125, -1.76953125, -1.193359375, -0.6171875, -0.041015625, 0.53515625, 1.111328125, 1.6875, 2.263671875, 2.83984375, 3.416015625, 3.9921875, 4.568359375, 5.14453125, 5.720703125, 6.296875, 6.873046875, 7.44921875, 8.025390625, 8.6015625, 9.177734375, 9.75390625, 10.330078125, 10.90625, 11.482421875, 12.05859375, 12.634765625, 13.2109375, 13.787109375, 14.36328125, 14.939453125, 15.515625, 16.091796875, 16.66796875, 17.244140625, 17.8203125, 18.396484375, 18.97265625, 19.548828125, 20.125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 13.0, 16.0, 27.0, 42.0, 71.0, 89.0, 146.0, 224.0, 348.0, 426.0, 655.0, 702.0, 429.0, 294.0, 189.0, 131.0, 82.0, 69.0, 46.0, 22.0, 18.0, 12.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.953125, -11.6607666015625, -11.368408203125, -11.0760498046875, -10.78369140625, -10.4913330078125, -10.198974609375, -9.9066162109375, -9.6142578125, -9.3218994140625, -9.029541015625, -8.7371826171875, -8.44482421875, -8.1524658203125, -7.860107421875, -7.5677490234375, -7.275390625, -6.9830322265625, -6.690673828125, -6.3983154296875, -6.10595703125, -5.8135986328125, -5.521240234375, -5.2288818359375, -4.9365234375, -4.6441650390625, -4.351806640625, -4.0594482421875, -3.76708984375, -3.4747314453125, -3.182373046875, -2.8900146484375, -2.59765625, -2.3052978515625, -2.012939453125, -1.7205810546875, -1.42822265625, -1.1358642578125, -0.843505859375, -0.5511474609375, -0.2587890625, 0.0335693359375, 0.325927734375, 0.6182861328125, 0.91064453125, 1.2030029296875, 1.495361328125, 1.7877197265625, 2.080078125, 2.3724365234375, 2.664794921875, 2.9571533203125, 3.24951171875, 3.5418701171875, 3.834228515625, 4.1265869140625, 4.4189453125, 4.7113037109375, 5.003662109375, 5.2960205078125, 5.58837890625, 5.8807373046875, 6.173095703125, 6.4654541015625, 6.7578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 9.0, 16.0, 34.0, 56.0, 78.0, 185.0, 387.0, 840.0, 2393.0, 11184.0, 147860.0, 3128461.0, 858170.0, 37377.0, 4794.0, 1350.0, 586.0, 224.0, 114.0, 63.0, 38.0, 25.0, 13.0, 9.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.90625, -19.36474609375, -18.8232421875, -18.28173828125, -17.740234375, -17.19873046875, -16.6572265625, -16.11572265625, -15.57421875, -15.03271484375, -14.4912109375, -13.94970703125, -13.408203125, -12.86669921875, -12.3251953125, -11.78369140625, -11.2421875, -10.70068359375, -10.1591796875, -9.61767578125, -9.076171875, -8.53466796875, -7.9931640625, -7.45166015625, -6.91015625, -6.36865234375, -5.8271484375, -5.28564453125, -4.744140625, -4.20263671875, -3.6611328125, -3.11962890625, -2.578125, -2.03662109375, -1.4951171875, -0.95361328125, -0.412109375, 0.12939453125, 0.6708984375, 1.21240234375, 1.75390625, 2.29541015625, 2.8369140625, 3.37841796875, 3.919921875, 4.46142578125, 5.0029296875, 5.54443359375, 6.0859375, 6.62744140625, 7.1689453125, 7.71044921875, 8.251953125, 8.79345703125, 9.3349609375, 9.87646484375, 10.41796875, 10.95947265625, 11.5009765625, 12.04248046875, 12.583984375, 13.12548828125, 13.6669921875, 14.20849609375, 14.75]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 30.0, 116.0, 280.0, 339.0, 176.0, 45.0, 17.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.49299621582031, -88.46482849121094, -85.43665313720703, -82.40848541259766, -79.38031768798828, -76.3521499633789, -73.323974609375, -70.29580688476562, -67.26763916015625, -64.23947143554688, -61.211299896240234, -58.183128356933594, -55.15496063232422, -52.12678909301758, -49.09861755371094, -46.07044982910156, -43.04227828979492, -40.01410675048828, -36.985939025878906, -33.957767486572266, -30.92959976196289, -27.90142822265625, -24.873258590698242, -21.845088958740234, -18.816919326782227, -15.788749694824219, -12.760580062866211, -9.732409477233887, -6.704239845275879, -3.676070213317871, -0.6478996276855469, 2.380270004272461, 5.408439636230469, 8.436609268188477, 11.464778900146484, 14.492949485778809, 17.5211181640625, 20.54928970336914, 23.57745933532715, 26.605628967285156, 29.633798599243164, 32.66196823120117, 35.69013977050781, 38.71830749511719, 41.74647903442383, 44.7746467590332, 47.802818298339844, 50.83098602294922, 53.85915756225586, 56.8873291015625, 59.915496826171875, 62.943668365478516, 65.97183990478516, 69.00000762939453, 72.0281753540039, 75.05635070800781, 78.08451843261719, 81.11268615722656, 84.14086151123047, 87.16902923583984, 90.19719696044922, 93.2253646850586, 96.2535400390625, 99.28170776367188, 102.30987548828125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 6.0, 11.0, 11.0, 14.0, 14.0, 16.0, 18.0, 12.0, 25.0, 31.0, 28.0, 32.0, 32.0, 41.0, 41.0, 44.0, 51.0, 31.0, 48.0, 33.0, 35.0, 47.0, 46.0, 29.0, 30.0, 31.0, 29.0, 27.0, 20.0, 24.0, 23.0, 15.0, 15.0, 11.0, 11.0, 15.0, 6.0, 11.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-24.68231964111328, -23.925870895385742, -23.169422149658203, -22.412975311279297, -21.656526565551758, -20.90007781982422, -20.14362907409668, -19.38718032836914, -18.630733489990234, -17.874284744262695, -17.117835998535156, -16.36138916015625, -15.604940414428711, -14.848491668701172, -14.092042922973633, -13.335594177246094, -12.579145431518555, -11.822696685791016, -11.066248893737793, -10.309800148010254, -9.553352355957031, -8.796903610229492, -8.040454864501953, -7.284006595611572, -6.527558326721191, -5.7711100578308105, -5.01466178894043, -4.258213043212891, -3.5017647743225098, -2.745316505432129, -1.9888677597045898, -1.232419490814209, -0.4759712219238281, 0.2804771661758423, 1.0369255542755127, 1.7933740615844727, 2.5498223304748535, 3.3062705993652344, 4.062719345092773, 4.819167613983154, 5.575615882873535, 6.332064151763916, 7.088512420654297, 7.844961166381836, 8.601409912109375, 9.357857704162598, 10.114306449890137, 10.87075424194336, 11.627202987670898, 12.383651733398438, 13.14009952545166, 13.8965482711792, 14.652996063232422, 15.409444808959961, 16.1658935546875, 16.92234230041504, 17.678791046142578, 18.435239791870117, 19.191688537597656, 19.948135375976562, 20.7045841217041, 21.46103286743164, 22.21748161315918, 22.97393035888672, 23.730377197265625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 8.0, 5.0, 9.0, 9.0, 8.0, 14.0, 12.0, 17.0, 10.0, 17.0, 23.0, 27.0, 32.0, 25.0, 34.0, 43.0, 37.0, 56.0, 39.0, 37.0, 43.0, 44.0, 40.0, 56.0, 26.0, 23.0, 18.0, 32.0, 28.0, 29.0, 31.0, 23.0, 22.0, 22.0, 18.0, 12.0, 16.0, 11.0, 7.0, 6.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.654296875, -3.528656005859375, -3.40301513671875, -3.277374267578125, -3.1517333984375, -3.026092529296875, -2.90045166015625, -2.774810791015625, -2.649169921875, -2.523529052734375, -2.39788818359375, -2.272247314453125, -2.1466064453125, -2.020965576171875, -1.89532470703125, -1.769683837890625, -1.64404296875, -1.518402099609375, -1.39276123046875, -1.267120361328125, -1.1414794921875, -1.015838623046875, -0.89019775390625, -0.764556884765625, -0.638916015625, -0.513275146484375, -0.38763427734375, -0.261993408203125, -0.1363525390625, -0.010711669921875, 0.11492919921875, 0.240570068359375, 0.3662109375, 0.491851806640625, 0.61749267578125, 0.743133544921875, 0.8687744140625, 0.994415283203125, 1.12005615234375, 1.245697021484375, 1.371337890625, 1.496978759765625, 1.62261962890625, 1.748260498046875, 1.8739013671875, 1.999542236328125, 2.12518310546875, 2.250823974609375, 2.37646484375, 2.502105712890625, 2.62774658203125, 2.753387451171875, 2.8790283203125, 3.004669189453125, 3.13031005859375, 3.255950927734375, 3.381591796875, 3.507232666015625, 3.63287353515625, 3.758514404296875, 3.8841552734375, 4.009796142578125, 4.13543701171875, 4.261077880859375, 4.38671875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 10.0, 10.0, 20.0, 36.0, 37.0, 65.0, 86.0, 140.0, 197.0, 295.0, 478.0, 660.0, 1059.0, 1548.0, 2227.0, 3275.0, 4860.0, 7208.0, 10906.0, 16493.0, 25493.0, 40611.0, 67468.0, 127368.0, 332440.0, 180472.0, 85907.0, 49801.0, 30735.0, 19746.0, 12722.0, 8498.0, 5729.0, 3858.0, 2669.0, 1779.0, 1258.0, 778.0, 543.0, 362.0, 240.0, 148.0, 108.0, 75.0, 50.0, 30.0, 16.0, 17.0, 9.0, 8.0, 8.0, 4.0, 1.0, 2.0], "bins": [-0.1800537109375, -0.17486572265625, -0.169677734375, -0.16448974609375, -0.1593017578125, -0.15411376953125, -0.14892578125, -0.14373779296875, -0.1385498046875, -0.13336181640625, -0.128173828125, -0.12298583984375, -0.1177978515625, -0.11260986328125, -0.107421875, -0.10223388671875, -0.0970458984375, -0.09185791015625, -0.086669921875, -0.08148193359375, -0.0762939453125, -0.07110595703125, -0.06591796875, -0.06072998046875, -0.0555419921875, -0.05035400390625, -0.045166015625, -0.03997802734375, -0.0347900390625, -0.02960205078125, -0.0244140625, -0.01922607421875, -0.0140380859375, -0.00885009765625, -0.003662109375, 0.00152587890625, 0.0067138671875, 0.01190185546875, 0.01708984375, 0.02227783203125, 0.0274658203125, 0.03265380859375, 0.037841796875, 0.04302978515625, 0.0482177734375, 0.05340576171875, 0.05859375, 0.06378173828125, 0.0689697265625, 0.07415771484375, 0.079345703125, 0.08453369140625, 0.0897216796875, 0.09490966796875, 0.10009765625, 0.10528564453125, 0.1104736328125, 0.11566162109375, 0.120849609375, 0.12603759765625, 0.1312255859375, 0.13641357421875, 0.1416015625, 0.14678955078125, 0.1519775390625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 4.0, 0.0, 7.0, 3.0, 4.0, 10.0, 8.0, 10.0, 14.0, 11.0, 14.0, 16.0, 23.0, 21.0, 30.0, 33.0, 29.0, 34.0, 42.0, 28.0, 38.0, 27.0, 42.0, 36.0, 1061.0, 39.0, 46.0, 40.0, 25.0, 35.0, 32.0, 42.0, 30.0, 28.0, 31.0, 27.0, 22.0, 11.0, 13.0, 14.0, 6.0, 5.0, 6.0, 7.0, 13.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.673828125, -2.587646484375, -2.50146484375, -2.415283203125, -2.3291015625, -2.242919921875, -2.15673828125, -2.070556640625, -1.984375, -1.898193359375, -1.81201171875, -1.725830078125, -1.6396484375, -1.553466796875, -1.46728515625, -1.381103515625, -1.294921875, -1.208740234375, -1.12255859375, -1.036376953125, -0.9501953125, -0.864013671875, -0.77783203125, -0.691650390625, -0.60546875, -0.519287109375, -0.43310546875, -0.346923828125, -0.2607421875, -0.174560546875, -0.08837890625, -0.002197265625, 0.083984375, 0.170166015625, 0.25634765625, 0.342529296875, 0.4287109375, 0.514892578125, 0.60107421875, 0.687255859375, 0.7734375, 0.859619140625, 0.94580078125, 1.031982421875, 1.1181640625, 1.204345703125, 1.29052734375, 1.376708984375, 1.462890625, 1.549072265625, 1.63525390625, 1.721435546875, 1.8076171875, 1.893798828125, 1.97998046875, 2.066162109375, 2.15234375, 2.238525390625, 2.32470703125, 2.410888671875, 2.4970703125, 2.583251953125, 2.66943359375, 2.755615234375, 2.841796875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 14.0, 14.0, 23.0, 38.0, 55.0, 88.0, 123.0, 175.0, 208.0, 344.0, 485.0, 605.0, 967.0, 1285.0, 1957.0, 2737.0, 3855.0, 5402.0, 8110.0, 11887.0, 17847.0, 26842.0, 41386.0, 65001.0, 111009.0, 1292457.0, 216208.0, 105453.0, 62251.0, 39749.0, 25969.0, 17151.0, 11516.0, 7762.0, 5559.0, 3762.0, 2567.0, 1854.0, 1315.0, 951.0, 701.0, 446.0, 329.0, 221.0, 161.0, 103.0, 68.0, 40.0, 28.0, 20.0, 13.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.0819091796875, -0.07942390441894531, -0.07693862915039062, -0.07445335388183594, -0.07196807861328125, -0.06948280334472656, -0.06699752807617188, -0.06451225280761719, -0.0620269775390625, -0.05954170227050781, -0.057056427001953125, -0.05457115173339844, -0.05208587646484375, -0.04960060119628906, -0.047115325927734375, -0.04463005065917969, -0.042144775390625, -0.03965950012207031, -0.037174224853515625, -0.03468894958496094, -0.03220367431640625, -0.029718399047851562, -0.027233123779296875, -0.024747848510742188, -0.0222625732421875, -0.019777297973632812, -0.017292022705078125, -0.014806747436523438, -0.01232147216796875, -0.009836196899414062, -0.007350921630859375, -0.0048656463623046875, -0.00238037109375, 0.0001049041748046875, 0.002590179443359375, 0.0050754547119140625, 0.00756072998046875, 0.010046005249023438, 0.012531280517578125, 0.015016555786132812, 0.0175018310546875, 0.019987106323242188, 0.022472381591796875, 0.024957656860351562, 0.02744293212890625, 0.029928207397460938, 0.032413482666015625, 0.03489875793457031, 0.037384033203125, 0.03986930847167969, 0.042354583740234375, 0.04483985900878906, 0.04732513427734375, 0.04981040954589844, 0.052295684814453125, 0.05478096008300781, 0.0572662353515625, 0.05975151062011719, 0.062236785888671875, 0.06472206115722656, 0.06720733642578125, 0.06969261169433594, 0.07217788696289062, 0.07466316223144531, 0.0771484375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 13.0, 11.0, 16.0, 6.0, 12.0, 31.0, 20.0, 21.0, 59.0, 46.0, 167.0, 198.0, 85.0, 90.0, 41.0, 27.0, 47.0, 17.0, 18.0, 15.0, 12.0, 18.0, 7.0, 4.0, 6.0, 2.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.5273690223693848e-06, -1.4454126358032227e-06, -1.3634562492370605e-06, -1.2814998626708984e-06, -1.1995434761047363e-06, -1.1175870895385742e-06, -1.0356307029724121e-06, -9.5367431640625e-07, -8.717179298400879e-07, -7.897615432739258e-07, -7.078051567077637e-07, -6.258487701416016e-07, -5.438923835754395e-07, -4.6193599700927734e-07, -3.7997961044311523e-07, -2.980232238769531e-07, -2.1606683731079102e-07, -1.341104507446289e-07, -5.21540641784668e-08, 2.9802322387695312e-08, 1.1175870895385742e-07, 1.9371509552001953e-07, 2.7567148208618164e-07, 3.5762786865234375e-07, 4.3958425521850586e-07, 5.21540641784668e-07, 6.034970283508301e-07, 6.854534149169922e-07, 7.674098014831543e-07, 8.493661880493164e-07, 9.313225746154785e-07, 1.0132789611816406e-06, 1.0952353477478027e-06, 1.1771917343139648e-06, 1.259148120880127e-06, 1.341104507446289e-06, 1.4230608940124512e-06, 1.5050172805786133e-06, 1.5869736671447754e-06, 1.6689300537109375e-06, 1.7508864402770996e-06, 1.8328428268432617e-06, 1.914799213409424e-06, 1.996755599975586e-06, 2.078711986541748e-06, 2.16066837310791e-06, 2.2426247596740723e-06, 2.3245811462402344e-06, 2.4065375328063965e-06, 2.4884939193725586e-06, 2.5704503059387207e-06, 2.652406692504883e-06, 2.734363079071045e-06, 2.816319465637207e-06, 2.898275852203369e-06, 2.9802322387695312e-06, 3.0621886253356934e-06, 3.1441450119018555e-06, 3.2261013984680176e-06, 3.3080577850341797e-06, 3.390014171600342e-06, 3.471970558166504e-06, 3.553926944732666e-06, 3.635883331298828e-06]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 12.0, 7.0, 23.0, 22.0, 25.0, 43.0, 42.0, 94.0, 124.0, 236.0, 658.0, 17711.0, 1021885.0, 6612.0, 523.0, 186.0, 92.0, 71.0, 57.0, 32.0, 25.0, 19.0, 11.0, 7.0, 8.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.081031799316406e-05, -6.914045661687851e-05, -6.747059524059296e-05, -6.58007338643074e-05, -6.413087248802185e-05, -6.24610111117363e-05, -6.0791149735450745e-05, -5.912128835916519e-05, -5.745142698287964e-05, -5.5781565606594086e-05, -5.411170423030853e-05, -5.244184285402298e-05, -5.077198147773743e-05, -4.9102120101451874e-05, -4.743225872516632e-05, -4.576239734888077e-05, -4.4092535972595215e-05, -4.242267459630966e-05, -4.075281322002411e-05, -3.9082951843738556e-05, -3.7413090467453e-05, -3.574322909116745e-05, -3.40733677148819e-05, -3.2403506338596344e-05, -3.073364496231079e-05, -2.9063783586025238e-05, -2.7393922209739685e-05, -2.5724060833454132e-05, -2.405419945716858e-05, -2.2384338080883026e-05, -2.0714476704597473e-05, -1.904461532831192e-05, -1.7374753952026367e-05, -1.5704892575740814e-05, -1.4035031199455261e-05, -1.2365169823169708e-05, -1.0695308446884155e-05, -9.025447070598602e-06, -7.355585694313049e-06, -5.685724318027496e-06, -4.015862941741943e-06, -2.3460015654563904e-06, -6.761401891708374e-07, 9.937211871147156e-07, 2.6635825634002686e-06, 4.3334439396858215e-06, 6.0033053159713745e-06, 7.673166692256927e-06, 9.34302806854248e-06, 1.1012889444828033e-05, 1.2682750821113586e-05, 1.435261219739914e-05, 1.6022473573684692e-05, 1.7692334949970245e-05, 1.93621963262558e-05, 2.103205770254135e-05, 2.2701919078826904e-05, 2.4371780455112457e-05, 2.604164183139801e-05, 2.7711503207683563e-05, 2.9381364583969116e-05, 3.105122596025467e-05, 3.272108733654022e-05, 3.4390948712825775e-05, 3.606081008911133e-05]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 20.0, 62.0, 135.0, 318.0, 291.0, 124.0, 36.0, 14.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.361519015423255e-06, -5.249654350336641e-06, -5.137789230502676e-06, -5.025924565416062e-06, -4.914059445582097e-06, -4.8021947804954834e-06, -4.6903296606615186e-06, -4.578464995574905e-06, -4.466600330488291e-06, -4.354735665401677e-06, -4.242870545567712e-06, -4.131005880481098e-06, -4.019140760647133e-06, -3.907276095560519e-06, -3.7954112031002296e-06, -3.68354631063994e-06, -3.571681418179651e-06, -3.4598165257193614e-06, -3.347951633259072e-06, -3.2360867407987826e-06, -3.1242220757121686e-06, -3.012357183251879e-06, -2.9004922907915898e-06, -2.7886273983313004e-06, -2.676762505871011e-06, -2.5648976134107215e-06, -2.453032720950432e-06, -2.341168055863818e-06, -2.2293031634035287e-06, -2.1174382709432393e-06, -2.00557337848295e-06, -1.8937084860226605e-06, -1.7818437072492088e-06, -1.6699788147889194e-06, -1.5581140360154677e-06, -1.4462491435551783e-06, -1.334384251094889e-06, -1.2225194723214372e-06, -1.1106545798611478e-06, -9.98789801087696e-07, -8.869249086274067e-07, -7.750600730105361e-07, -6.631952373936656e-07, -5.513303449333762e-07, -4.3946550931650563e-07, -3.276006736996351e-07, -2.1573578123934567e-07, -1.0387094562247512e-07, 7.993889994395431e-09, 1.198587398221207e-07, 2.3172358964984596e-07, 3.4358845368842594e-07, 4.554532893052965e-07, 5.67318124922167e-07, 6.791830173824565e-07, 7.91047852999327e-07, 9.029126886161976e-07, 1.014777581076487e-06, 1.1266423598499387e-06, 1.238507252310228e-06, 1.3503720310836798e-06, 1.4622369235439692e-06, 1.5741018160042586e-06, 1.685966708464548e-06, 1.7978314872379997e-06]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 13.0, 0.0, 11.0, 0.0, 14.0, 0.0, 0.0, 22.0, 0.0, 36.0, 0.0, 53.0, 0.0, 71.0, 0.0, 94.0, 0.0, 0.0, 124.0, 0.0, 104.0, 0.0, 133.0, 0.0, 83.0, 0.0, 84.0, 0.0, 0.0, 61.0, 0.0, 43.0, 0.0, 25.0, 0.0, 16.0, 0.0, 10.0, 0.0, 0.0, 10.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.5367431640625e-07, -9.266659617424011e-07, -8.996576070785522e-07, -8.726492524147034e-07, -8.456408977508545e-07, -8.186325430870056e-07, -7.916241884231567e-07, -7.646158337593079e-07, -7.37607479095459e-07, -7.105991244316101e-07, -6.835907697677612e-07, -6.565824151039124e-07, -6.295740604400635e-07, -6.025657057762146e-07, -5.755573511123657e-07, -5.485489964485168e-07, -5.21540641784668e-07, -4.945322871208191e-07, -4.675239324569702e-07, -4.4051557779312134e-07, -4.1350722312927246e-07, -3.864988684654236e-07, -3.594905138015747e-07, -3.3248215913772583e-07, -3.0547380447387695e-07, -2.784654498100281e-07, -2.514570951461792e-07, -2.2444874048233032e-07, -1.9744038581848145e-07, -1.7043203115463257e-07, -1.434236764907837e-07, -1.1641532182693481e-07, -8.940696716308594e-08, -6.239861249923706e-08, -3.5390257835388184e-08, -8.381903171539307e-09, 1.862645149230957e-08, 4.563480615615845e-08, 7.264316082000732e-08, 9.96515154838562e-08, 1.2665987014770508e-07, 1.5366822481155396e-07, 1.8067657947540283e-07, 2.076849341392517e-07, 2.3469328880310059e-07, 2.6170164346694946e-07, 2.8870999813079834e-07, 3.157183527946472e-07, 3.427267074584961e-07, 3.6973506212234497e-07, 3.9674341678619385e-07, 4.237517714500427e-07, 4.507601261138916e-07, 4.777684807777405e-07, 5.047768354415894e-07, 5.317851901054382e-07, 5.587935447692871e-07, 5.85801899433136e-07, 6.128102540969849e-07, 6.398186087608337e-07, 6.668269634246826e-07, 6.938353180885315e-07, 7.208436727523804e-07, 7.478520274162292e-07, 7.748603820800781e-07]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 8.0, 5.0, 9.0, 9.0, 8.0, 14.0, 12.0, 17.0, 10.0, 17.0, 23.0, 27.0, 32.0, 25.0, 34.0, 43.0, 37.0, 56.0, 39.0, 37.0, 43.0, 44.0, 40.0, 56.0, 26.0, 23.0, 18.0, 32.0, 28.0, 29.0, 31.0, 23.0, 22.0, 22.0, 18.0, 12.0, 16.0, 11.0, 7.0, 6.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.654296875, -3.528656005859375, -3.40301513671875, -3.277374267578125, -3.1517333984375, -3.026092529296875, -2.90045166015625, -2.774810791015625, -2.649169921875, -2.523529052734375, -2.39788818359375, -2.272247314453125, -2.1466064453125, -2.020965576171875, -1.89532470703125, -1.769683837890625, -1.64404296875, -1.518402099609375, -1.39276123046875, -1.267120361328125, -1.1414794921875, -1.015838623046875, -0.89019775390625, -0.764556884765625, -0.638916015625, -0.513275146484375, -0.38763427734375, -0.261993408203125, -0.1363525390625, -0.010711669921875, 0.11492919921875, 0.240570068359375, 0.3662109375, 0.491851806640625, 0.61749267578125, 0.743133544921875, 0.8687744140625, 0.994415283203125, 1.12005615234375, 1.245697021484375, 1.371337890625, 1.496978759765625, 1.62261962890625, 1.748260498046875, 1.8739013671875, 1.999542236328125, 2.12518310546875, 2.250823974609375, 2.37646484375, 2.502105712890625, 2.62774658203125, 2.753387451171875, 2.8790283203125, 3.004669189453125, 3.13031005859375, 3.255950927734375, 3.381591796875, 3.507232666015625, 3.63287353515625, 3.758514404296875, 3.8841552734375, 4.009796142578125, 4.13543701171875, 4.261077880859375, 4.38671875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 1.0, 6.0, 10.0, 13.0, 10.0, 18.0, 34.0, 44.0, 57.0, 91.0, 103.0, 146.0, 217.0, 337.0, 480.0, 715.0, 1183.0, 2228.0, 4173.0, 8952.0, 21336.0, 51591.0, 126904.0, 340414.0, 298556.0, 109878.0, 45011.0, 18889.0, 8164.0, 3688.0, 1979.0, 1124.0, 717.0, 436.0, 317.0, 213.0, 141.0, 107.0, 75.0, 52.0, 44.0, 34.0, 19.0, 13.0, 8.0, 6.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.5078125, -7.27264404296875, -7.0374755859375, -6.80230712890625, -6.567138671875, -6.33197021484375, -6.0968017578125, -5.86163330078125, -5.62646484375, -5.39129638671875, -5.1561279296875, -4.92095947265625, -4.685791015625, -4.45062255859375, -4.2154541015625, -3.98028564453125, -3.7451171875, -3.50994873046875, -3.2747802734375, -3.03961181640625, -2.804443359375, -2.56927490234375, -2.3341064453125, -2.09893798828125, -1.86376953125, -1.62860107421875, -1.3934326171875, -1.15826416015625, -0.923095703125, -0.68792724609375, -0.4527587890625, -0.21759033203125, 0.017578125, 0.25274658203125, 0.4879150390625, 0.72308349609375, 0.958251953125, 1.19342041015625, 1.4285888671875, 1.66375732421875, 1.89892578125, 2.13409423828125, 2.3692626953125, 2.60443115234375, 2.839599609375, 3.07476806640625, 3.3099365234375, 3.54510498046875, 3.7802734375, 4.01544189453125, 4.2506103515625, 4.48577880859375, 4.720947265625, 4.95611572265625, 5.1912841796875, 5.42645263671875, 5.66162109375, 5.89678955078125, 6.1319580078125, 6.36712646484375, 6.602294921875, 6.83746337890625, 7.0726318359375, 7.30780029296875, 7.54296875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 3.0, 9.0, 13.0, 7.0, 7.0, 15.0, 12.0, 16.0, 17.0, 29.0, 22.0, 24.0, 36.0, 40.0, 54.0, 69.0, 65.0, 128.0, 195.0, 752.0, 773.0, 162.0, 113.0, 89.0, 68.0, 48.0, 45.0, 27.0, 27.0, 27.0, 31.0, 12.0, 23.0, 13.0, 12.0, 10.0, 13.0, 7.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.2109375, -8.923095703125, -8.63525390625, -8.347412109375, -8.0595703125, -7.771728515625, -7.48388671875, -7.196044921875, -6.908203125, -6.620361328125, -6.33251953125, -6.044677734375, -5.7568359375, -5.468994140625, -5.18115234375, -4.893310546875, -4.60546875, -4.317626953125, -4.02978515625, -3.741943359375, -3.4541015625, -3.166259765625, -2.87841796875, -2.590576171875, -2.302734375, -2.014892578125, -1.72705078125, -1.439208984375, -1.1513671875, -0.863525390625, -0.57568359375, -0.287841796875, 0.0, 0.287841796875, 0.57568359375, 0.863525390625, 1.1513671875, 1.439208984375, 1.72705078125, 2.014892578125, 2.302734375, 2.590576171875, 2.87841796875, 3.166259765625, 3.4541015625, 3.741943359375, 4.02978515625, 4.317626953125, 4.60546875, 4.893310546875, 5.18115234375, 5.468994140625, 5.7568359375, 6.044677734375, 6.33251953125, 6.620361328125, 6.908203125, 7.196044921875, 7.48388671875, 7.771728515625, 8.0595703125, 8.347412109375, 8.63525390625, 8.923095703125, 9.2109375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 4.0, 11.0, 18.0, 17.0, 18.0, 21.0, 41.0, 47.0, 74.0, 90.0, 167.0, 212.0, 319.0, 533.0, 789.0, 1612.0, 5946.0, 581130.0, 2538619.0, 11270.0, 2093.0, 986.0, 521.0, 378.0, 224.0, 159.0, 100.0, 67.0, 58.0, 34.0, 26.0, 33.0, 15.0, 14.0, 10.0, 9.0, 3.0, 7.0, 8.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-27.515625, -26.684814453125, -25.85400390625, -25.023193359375, -24.1923828125, -23.361572265625, -22.53076171875, -21.699951171875, -20.869140625, -20.038330078125, -19.20751953125, -18.376708984375, -17.5458984375, -16.715087890625, -15.88427734375, -15.053466796875, -14.22265625, -13.391845703125, -12.56103515625, -11.730224609375, -10.8994140625, -10.068603515625, -9.23779296875, -8.406982421875, -7.576171875, -6.745361328125, -5.91455078125, -5.083740234375, -4.2529296875, -3.422119140625, -2.59130859375, -1.760498046875, -0.9296875, -0.098876953125, 0.73193359375, 1.562744140625, 2.3935546875, 3.224365234375, 4.05517578125, 4.885986328125, 5.716796875, 6.547607421875, 7.37841796875, 8.209228515625, 9.0400390625, 9.870849609375, 10.70166015625, 11.532470703125, 12.36328125, 13.194091796875, 14.02490234375, 14.855712890625, 15.6865234375, 16.517333984375, 17.34814453125, 18.178955078125, 19.009765625, 19.840576171875, 20.67138671875, 21.502197265625, 22.3330078125, 23.163818359375, 23.99462890625, 24.825439453125, 25.65625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 13.0, 59.0, 187.0, 320.0, 264.0, 135.0, 28.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-181.91429138183594, -178.2638397216797, -174.6134033203125, -170.96295166015625, -167.3125, -163.66204833984375, -160.01161193847656, -156.3611602783203, -152.71070861816406, -149.0602569580078, -145.40982055664062, -141.75936889648438, -138.10891723632812, -134.45846557617188, -130.8080291748047, -127.15757751464844, -123.50712585449219, -119.85668182373047, -116.20623016357422, -112.5557861328125, -108.90533447265625, -105.25489044189453, -101.60443878173828, -97.95399475097656, -94.30355072021484, -90.65310668945312, -87.00265502929688, -83.35221099853516, -79.7017593383789, -76.05131530761719, -72.40086364746094, -68.75041961669922, -65.09996795654297, -61.449520111083984, -57.799072265625, -54.148624420166016, -50.49817657470703, -46.84773254394531, -43.19728088378906, -39.546836853027344, -35.896385192871094, -32.24593734741211, -28.595489501953125, -24.94504165649414, -21.294593811035156, -17.644147872924805, -13.99370002746582, -10.343252182006836, -6.692806243896484, -3.042358636856079, 0.6080889701843262, 4.258536338806152, 7.908984184265137, 11.559431076049805, 15.209878921508789, 18.860326766967773, 22.510774612426758, 26.161222457885742, 29.811670303344727, 33.46211624145508, 37.11256408691406, 40.76301193237305, 44.41345977783203, 48.063907623291016, 51.71435546875]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 4.0, 10.0, 9.0, 16.0, 15.0, 17.0, 17.0, 19.0, 24.0, 27.0, 28.0, 22.0, 28.0, 30.0, 27.0, 39.0, 31.0, 46.0, 47.0, 39.0, 44.0, 48.0, 46.0, 35.0, 35.0, 37.0, 25.0, 26.0, 26.0, 26.0, 21.0, 15.0, 23.0, 18.0, 12.0, 11.0, 7.0, 9.0, 9.0, 5.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-34.04804229736328, -33.092899322509766, -32.13775634765625, -31.1826114654541, -30.227468490600586, -29.27232551574707, -28.317180633544922, -27.362037658691406, -26.40689468383789, -25.451751708984375, -24.49660873413086, -23.54146385192871, -22.586320877075195, -21.63117790222168, -20.67603302001953, -19.720890045166016, -18.7657470703125, -17.810604095458984, -16.85546112060547, -15.90031623840332, -14.945173263549805, -13.990030288696289, -13.034886360168457, -12.079742431640625, -11.12459945678711, -10.169456481933594, -9.214312553405762, -8.25916862487793, -7.304025650024414, -6.34888219833374, -5.393738746643066, -4.438595294952393, -3.4834518432617188, -2.528308391571045, -1.573164939880371, -0.6180214881896973, 0.33712196350097656, 1.2922654151916504, 2.247408866882324, 3.202552318572998, 4.157695770263672, 5.112839221954346, 6.0679826736450195, 7.023126125335693, 7.978269577026367, 8.933412551879883, 9.888556480407715, 10.843700408935547, 11.798843383789062, 12.753986358642578, 13.70913028717041, 14.664274215698242, 15.619417190551758, 16.574560165405273, 17.529705047607422, 18.484848022460938, 19.439990997314453, 20.39513397216797, 21.350276947021484, 22.305421829223633, 23.26056480407715, 24.215707778930664, 25.170852661132812, 26.125995635986328, 27.081138610839844]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 10.0, 13.0, 7.0, 17.0, 16.0, 18.0, 16.0, 24.0, 25.0, 21.0, 24.0, 26.0, 37.0, 30.0, 38.0, 37.0, 37.0, 43.0, 40.0, 34.0, 36.0, 35.0, 33.0, 36.0, 30.0, 29.0, 32.0, 37.0, 19.0, 28.0, 11.0, 27.0, 15.0, 19.0, 12.0, 14.0, 12.0, 11.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.05859375, -3.9326171875, -3.806640625, -3.6806640625, -3.5546875, -3.4287109375, -3.302734375, -3.1767578125, -3.05078125, -2.9248046875, -2.798828125, -2.6728515625, -2.546875, -2.4208984375, -2.294921875, -2.1689453125, -2.04296875, -1.9169921875, -1.791015625, -1.6650390625, -1.5390625, -1.4130859375, -1.287109375, -1.1611328125, -1.03515625, -0.9091796875, -0.783203125, -0.6572265625, -0.53125, -0.4052734375, -0.279296875, -0.1533203125, -0.02734375, 0.0986328125, 0.224609375, 0.3505859375, 0.4765625, 0.6025390625, 0.728515625, 0.8544921875, 0.98046875, 1.1064453125, 1.232421875, 1.3583984375, 1.484375, 1.6103515625, 1.736328125, 1.8623046875, 1.98828125, 2.1142578125, 2.240234375, 2.3662109375, 2.4921875, 2.6181640625, 2.744140625, 2.8701171875, 2.99609375, 3.1220703125, 3.248046875, 3.3740234375, 3.5, 3.6259765625, 3.751953125, 3.8779296875, 4.00390625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 14.0, 18.0, 13.0, 48.0, 76.0, 105.0, 222.0, 436.0, 771.0, 1688.0, 3947.0, 10297.0, 31213.0, 184602.0, 1972967.0, 1777305.0, 164526.0, 29111.0, 9685.0, 3852.0, 1655.0, 806.0, 389.0, 227.0, 125.0, 86.0, 34.0, 24.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.5, -11.140380859375, -10.78076171875, -10.421142578125, -10.0615234375, -9.701904296875, -9.34228515625, -8.982666015625, -8.623046875, -8.263427734375, -7.90380859375, -7.544189453125, -7.1845703125, -6.824951171875, -6.46533203125, -6.105712890625, -5.74609375, -5.386474609375, -5.02685546875, -4.667236328125, -4.3076171875, -3.947998046875, -3.58837890625, -3.228759765625, -2.869140625, -2.509521484375, -2.14990234375, -1.790283203125, -1.4306640625, -1.071044921875, -0.71142578125, -0.351806640625, 0.0078125, 0.367431640625, 0.72705078125, 1.086669921875, 1.4462890625, 1.805908203125, 2.16552734375, 2.525146484375, 2.884765625, 3.244384765625, 3.60400390625, 3.963623046875, 4.3232421875, 4.682861328125, 5.04248046875, 5.402099609375, 5.76171875, 6.121337890625, 6.48095703125, 6.840576171875, 7.2001953125, 7.559814453125, 7.91943359375, 8.279052734375, 8.638671875, 8.998291015625, 9.35791015625, 9.717529296875, 10.0771484375, 10.436767578125, 10.79638671875, 11.156005859375, 11.515625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 2.0, 4.0, 4.0, 9.0, 11.0, 9.0, 11.0, 28.0, 30.0, 29.0, 40.0, 62.0, 84.0, 95.0, 147.0, 144.0, 203.0, 250.0, 318.0, 381.0, 416.0, 402.0, 294.0, 249.0, 191.0, 149.0, 112.0, 89.0, 71.0, 47.0, 43.0, 35.0, 26.0, 19.0, 12.0, 11.0, 7.0, 6.0, 12.0, 4.0, 9.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.6484375, -5.48931884765625, -5.3302001953125, -5.17108154296875, -5.011962890625, -4.85284423828125, -4.6937255859375, -4.53460693359375, -4.37548828125, -4.21636962890625, -4.0572509765625, -3.89813232421875, -3.739013671875, -3.57989501953125, -3.4207763671875, -3.26165771484375, -3.1025390625, -2.94342041015625, -2.7843017578125, -2.62518310546875, -2.466064453125, -2.30694580078125, -2.1478271484375, -1.98870849609375, -1.82958984375, -1.67047119140625, -1.5113525390625, -1.35223388671875, -1.193115234375, -1.03399658203125, -0.8748779296875, -0.71575927734375, -0.556640625, -0.39752197265625, -0.2384033203125, -0.07928466796875, 0.079833984375, 0.23895263671875, 0.3980712890625, 0.55718994140625, 0.71630859375, 0.87542724609375, 1.0345458984375, 1.19366455078125, 1.352783203125, 1.51190185546875, 1.6710205078125, 1.83013916015625, 1.9892578125, 2.14837646484375, 2.3074951171875, 2.46661376953125, 2.625732421875, 2.78485107421875, 2.9439697265625, 3.10308837890625, 3.26220703125, 3.42132568359375, 3.5804443359375, 3.73956298828125, 3.898681640625, 4.05780029296875, 4.2169189453125, 4.37603759765625, 4.53515625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 7.0, 7.0, 11.0, 13.0, 6.0, 13.0, 16.0, 19.0, 44.0, 37.0, 50.0, 95.0, 118.0, 178.0, 293.0, 480.0, 1041.0, 2259.0, 7126.0, 30919.0, 234991.0, 2373074.0, 1381693.0, 132507.0, 20280.0, 5121.0, 1824.0, 777.0, 464.0, 251.0, 184.0, 98.0, 83.0, 46.0, 33.0, 28.0, 28.0, 17.0, 15.0, 7.0, 9.0, 7.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.6640625, -9.36083984375, -9.0576171875, -8.75439453125, -8.451171875, -8.14794921875, -7.8447265625, -7.54150390625, -7.23828125, -6.93505859375, -6.6318359375, -6.32861328125, -6.025390625, -5.72216796875, -5.4189453125, -5.11572265625, -4.8125, -4.50927734375, -4.2060546875, -3.90283203125, -3.599609375, -3.29638671875, -2.9931640625, -2.68994140625, -2.38671875, -2.08349609375, -1.7802734375, -1.47705078125, -1.173828125, -0.87060546875, -0.5673828125, -0.26416015625, 0.0390625, 0.34228515625, 0.6455078125, 0.94873046875, 1.251953125, 1.55517578125, 1.8583984375, 2.16162109375, 2.46484375, 2.76806640625, 3.0712890625, 3.37451171875, 3.677734375, 3.98095703125, 4.2841796875, 4.58740234375, 4.890625, 5.19384765625, 5.4970703125, 5.80029296875, 6.103515625, 6.40673828125, 6.7099609375, 7.01318359375, 7.31640625, 7.61962890625, 7.9228515625, 8.22607421875, 8.529296875, 8.83251953125, 9.1357421875, 9.43896484375, 9.7421875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 27.0, 47.0, 105.0, 151.0, 167.0, 179.0, 146.0, 103.0, 46.0, 17.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-65.17100524902344, -63.507144927978516, -61.843284606933594, -60.17942810058594, -58.515567779541016, -56.851707458496094, -55.18784713745117, -53.52398681640625, -51.860130310058594, -50.19626998901367, -48.53240966796875, -46.868553161621094, -45.20469284057617, -43.54083251953125, -41.87697219848633, -40.213111877441406, -38.549251556396484, -36.88539123535156, -35.22153091430664, -33.55767059326172, -31.893814086914062, -30.22995376586914, -28.56609344482422, -26.902233123779297, -25.238374710083008, -23.574514389038086, -21.910655975341797, -20.246795654296875, -18.582935333251953, -16.919076919555664, -15.255216598510742, -13.591357231140137, -11.927501678466797, -10.263642311096191, -8.599782943725586, -6.935922622680664, -5.272063255310059, -3.608203887939453, -1.9443435668945312, -0.2804841995239258, 1.3833751678466797, 3.0472347736358643, 4.711094379425049, 6.3749542236328125, 8.038813591003418, 9.702672958374023, 11.366533279418945, 13.03039264678955, 14.694252014160156, 16.358112335205078, 18.021970748901367, 19.68583106994629, 21.349689483642578, 23.0135498046875, 24.677410125732422, 26.341270446777344, 28.005128860473633, 29.668989181518555, 31.332847595214844, 32.996707916259766, 34.66056823730469, 36.324424743652344, 37.98828887939453, 39.65214538574219, 41.31600570678711]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 10.0, 9.0, 13.0, 7.0, 11.0, 11.0, 17.0, 13.0, 22.0, 19.0, 21.0, 28.0, 32.0, 43.0, 31.0, 41.0, 26.0, 49.0, 31.0, 40.0, 42.0, 35.0, 39.0, 35.0, 34.0, 37.0, 31.0, 31.0, 35.0, 22.0, 25.0, 25.0, 26.0, 14.0, 12.0, 17.0, 13.0, 13.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.790016174316406, -23.031953811645508, -22.27389144897461, -21.515830993652344, -20.757768630981445, -19.999706268310547, -19.24164390563965, -18.48358154296875, -17.725521087646484, -16.967458724975586, -16.209396362304688, -15.451334953308105, -14.693273544311523, -13.935211181640625, -13.177148818969727, -12.419086456298828, -11.66102409362793, -10.902961730957031, -10.14490032196045, -9.38683795928955, -8.628776550292969, -7.87071418762207, -7.112651824951172, -6.354589939117432, -5.596528053283691, -4.838466167449951, -4.080404281616211, -3.3223419189453125, -2.5642800331115723, -1.806218147277832, -1.0481557846069336, -0.29009389877319336, 0.4679679870605469, 1.2260299921035767, 1.9840919971466064, 2.742154121398926, 3.500216007232666, 4.258277893066406, 5.016340255737305, 5.774402141571045, 6.532464027404785, 7.290525913238525, 8.048587799072266, 8.806650161743164, 9.564712524414062, 10.322773933410645, 11.080836296081543, 11.838897705078125, 12.596960067749023, 13.355022430419922, 14.113083839416504, 14.871146202087402, 15.629207611083984, 16.387269973754883, 17.14533233642578, 17.90339469909668, 18.661457061767578, 19.419519424438477, 20.177581787109375, 20.93564224243164, 21.69370460510254, 22.451766967773438, 23.209829330444336, 23.967891693115234, 24.7259521484375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 1.0, 8.0, 3.0, 7.0, 9.0, 12.0, 8.0, 14.0, 17.0, 12.0, 26.0, 23.0, 26.0, 36.0, 30.0, 26.0, 35.0, 47.0, 40.0, 42.0, 44.0, 46.0, 40.0, 39.0, 41.0, 30.0, 29.0, 25.0, 35.0, 32.0, 29.0, 27.0, 24.0, 21.0, 24.0, 20.0, 12.0, 13.0, 13.0, 7.0, 8.0, 4.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.818359375, -3.690948486328125, -3.56353759765625, -3.436126708984375, -3.3087158203125, -3.181304931640625, -3.05389404296875, -2.926483154296875, -2.799072265625, -2.671661376953125, -2.54425048828125, -2.416839599609375, -2.2894287109375, -2.162017822265625, -2.03460693359375, -1.907196044921875, -1.77978515625, -1.652374267578125, -1.52496337890625, -1.397552490234375, -1.2701416015625, -1.142730712890625, -1.01531982421875, -0.887908935546875, -0.760498046875, -0.633087158203125, -0.50567626953125, -0.378265380859375, -0.2508544921875, -0.123443603515625, 0.00396728515625, 0.131378173828125, 0.2587890625, 0.386199951171875, 0.51361083984375, 0.641021728515625, 0.7684326171875, 0.895843505859375, 1.02325439453125, 1.150665283203125, 1.278076171875, 1.405487060546875, 1.53289794921875, 1.660308837890625, 1.7877197265625, 1.915130615234375, 2.04254150390625, 2.169952392578125, 2.29736328125, 2.424774169921875, 2.55218505859375, 2.679595947265625, 2.8070068359375, 2.934417724609375, 3.06182861328125, 3.189239501953125, 3.316650390625, 3.444061279296875, 3.57147216796875, 3.698883056640625, 3.8262939453125, 3.953704833984375, 4.08111572265625, 4.208526611328125, 4.3359375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 6.0, 8.0, 21.0, 14.0, 42.0, 64.0, 92.0, 132.0, 160.0, 259.0, 365.0, 556.0, 829.0, 1204.0, 1745.0, 2749.0, 4052.0, 6130.0, 9340.0, 14369.0, 22365.0, 35685.0, 57783.0, 102566.0, 261757.0, 263501.0, 104205.0, 58603.0, 35556.0, 22427.0, 14221.0, 9437.0, 6059.0, 4021.0, 2684.0, 1787.0, 1170.0, 875.0, 555.0, 359.0, 233.0, 186.0, 136.0, 91.0, 49.0, 42.0, 21.0, 18.0, 10.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.2052001953125, -0.19916534423828125, -0.1931304931640625, -0.18709564208984375, -0.181060791015625, -0.17502593994140625, -0.1689910888671875, -0.16295623779296875, -0.15692138671875, -0.15088653564453125, -0.1448516845703125, -0.13881683349609375, -0.132781982421875, -0.12674713134765625, -0.1207122802734375, -0.11467742919921875, -0.108642578125, -0.10260772705078125, -0.0965728759765625, -0.09053802490234375, -0.084503173828125, -0.07846832275390625, -0.0724334716796875, -0.06639862060546875, -0.06036376953125, -0.05432891845703125, -0.0482940673828125, -0.04225921630859375, -0.036224365234375, -0.03018951416015625, -0.0241546630859375, -0.01811981201171875, -0.0120849609375, -0.00605010986328125, -1.52587890625e-05, 0.00601959228515625, 0.012054443359375, 0.01808929443359375, 0.0241241455078125, 0.03015899658203125, 0.03619384765625, 0.04222869873046875, 0.0482635498046875, 0.05429840087890625, 0.060333251953125, 0.06636810302734375, 0.0724029541015625, 0.07843780517578125, 0.08447265625, 0.09050750732421875, 0.0965423583984375, 0.10257720947265625, 0.108612060546875, 0.11464691162109375, 0.1206817626953125, 0.12671661376953125, 0.13275146484375, 0.13878631591796875, 0.1448211669921875, 0.15085601806640625, 0.156890869140625, 0.16292572021484375, 0.1689605712890625, 0.17499542236328125, 0.1810302734375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 3.0, 7.0, 14.0, 17.0, 12.0, 17.0, 14.0, 18.0, 24.0, 29.0, 31.0, 20.0, 31.0, 29.0, 33.0, 38.0, 46.0, 32.0, 37.0, 46.0, 1058.0, 31.0, 35.0, 31.0, 36.0, 49.0, 28.0, 32.0, 31.0, 28.0, 18.0, 19.0, 26.0, 14.0, 10.0, 5.0, 9.0, 14.0, 9.0, 7.0, 9.0, 4.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.75390625, -2.66510009765625, -2.5762939453125, -2.48748779296875, -2.398681640625, -2.30987548828125, -2.2210693359375, -2.13226318359375, -2.04345703125, -1.95465087890625, -1.8658447265625, -1.77703857421875, -1.688232421875, -1.59942626953125, -1.5106201171875, -1.42181396484375, -1.3330078125, -1.24420166015625, -1.1553955078125, -1.06658935546875, -0.977783203125, -0.88897705078125, -0.8001708984375, -0.71136474609375, -0.62255859375, -0.53375244140625, -0.4449462890625, -0.35614013671875, -0.267333984375, -0.17852783203125, -0.0897216796875, -0.00091552734375, 0.087890625, 0.17669677734375, 0.2655029296875, 0.35430908203125, 0.443115234375, 0.53192138671875, 0.6207275390625, 0.70953369140625, 0.79833984375, 0.88714599609375, 0.9759521484375, 1.06475830078125, 1.153564453125, 1.24237060546875, 1.3311767578125, 1.41998291015625, 1.5087890625, 1.59759521484375, 1.6864013671875, 1.77520751953125, 1.864013671875, 1.95281982421875, 2.0416259765625, 2.13043212890625, 2.21923828125, 2.30804443359375, 2.3968505859375, 2.48565673828125, 2.574462890625, 2.66326904296875, 2.7520751953125, 2.84088134765625, 2.9296875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 10.0, 14.0, 17.0, 27.0, 43.0, 59.0, 81.0, 112.0, 168.0, 237.0, 374.0, 510.0, 730.0, 1075.0, 1548.0, 2103.0, 3088.0, 4361.0, 6041.0, 8705.0, 12807.0, 18115.0, 27530.0, 41765.0, 66909.0, 114096.0, 1304220.0, 199180.0, 102107.0, 60878.0, 38705.0, 25046.0, 17416.0, 11666.0, 8295.0, 5777.0, 3972.0, 2796.0, 1933.0, 1379.0, 947.0, 715.0, 479.0, 337.0, 235.0, 158.0, 122.0, 73.0, 51.0, 51.0, 25.0, 20.0, 12.0, 7.0, 5.0, 2.0, 3.0, 3.0], "bins": [-0.08447265625, -0.08190536499023438, -0.07933807373046875, -0.07677078247070312, -0.0742034912109375, -0.07163619995117188, -0.06906890869140625, -0.06650161743164062, -0.063934326171875, -0.061367034912109375, -0.05879974365234375, -0.056232452392578125, -0.0536651611328125, -0.051097869873046875, -0.04853057861328125, -0.045963287353515625, -0.04339599609375, -0.040828704833984375, -0.03826141357421875, -0.035694122314453125, -0.0331268310546875, -0.030559539794921875, -0.02799224853515625, -0.025424957275390625, -0.022857666015625, -0.020290374755859375, -0.01772308349609375, -0.015155792236328125, -0.0125885009765625, -0.010021209716796875, -0.00745391845703125, -0.004886627197265625, -0.0023193359375, 0.000247955322265625, 0.00281524658203125, 0.005382537841796875, 0.0079498291015625, 0.010517120361328125, 0.01308441162109375, 0.015651702880859375, 0.018218994140625, 0.020786285400390625, 0.02335357666015625, 0.025920867919921875, 0.0284881591796875, 0.031055450439453125, 0.03362274169921875, 0.036190032958984375, 0.03875732421875, 0.041324615478515625, 0.04389190673828125, 0.046459197998046875, 0.0490264892578125, 0.051593780517578125, 0.05416107177734375, 0.056728363037109375, 0.059295654296875, 0.061862945556640625, 0.06443023681640625, 0.06699752807617188, 0.0695648193359375, 0.07213211059570312, 0.07469940185546875, 0.07726669311523438, 0.079833984375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 6.0, 9.0, 11.0, 10.0, 12.0, 13.0, 16.0, 49.0, 29.0, 24.0, 31.0, 39.0, 50.0, 67.0, 83.0, 118.0, 84.0, 59.0, 48.0, 34.0, 37.0, 26.0, 32.0, 17.0, 19.0, 19.0, 12.0, 11.0, 16.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8477439880371094e-06, -1.7853453755378723e-06, -1.7229467630386353e-06, -1.6605481505393982e-06, -1.5981495380401611e-06, -1.535750925540924e-06, -1.473352313041687e-06, -1.41095370054245e-06, -1.3485550880432129e-06, -1.2861564755439758e-06, -1.2237578630447388e-06, -1.1613592505455017e-06, -1.0989606380462646e-06, -1.0365620255470276e-06, -9.741634130477905e-07, -9.117648005485535e-07, -8.493661880493164e-07, -7.869675755500793e-07, -7.245689630508423e-07, -6.621703505516052e-07, -5.997717380523682e-07, -5.373731255531311e-07, -4.7497451305389404e-07, -4.12575900554657e-07, -3.501772880554199e-07, -2.8777867555618286e-07, -2.253800630569458e-07, -1.6298145055770874e-07, -1.0058283805847168e-07, -3.818422555923462e-08, 2.421438694000244e-08, 8.66129994392395e-08, 1.4901161193847656e-07, 2.1141022443771362e-07, 2.738088369369507e-07, 3.3620744943618774e-07, 3.986060619354248e-07, 4.6100467443466187e-07, 5.234032869338989e-07, 5.85801899433136e-07, 6.48200511932373e-07, 7.105991244316101e-07, 7.729977369308472e-07, 8.353963494300842e-07, 8.977949619293213e-07, 9.601935744285583e-07, 1.0225921869277954e-06, 1.0849907994270325e-06, 1.1473894119262695e-06, 1.2097880244255066e-06, 1.2721866369247437e-06, 1.3345852494239807e-06, 1.3969838619232178e-06, 1.4593824744224548e-06, 1.521781086921692e-06, 1.584179699420929e-06, 1.646578311920166e-06, 1.708976924419403e-06, 1.7713755369186401e-06, 1.8337741494178772e-06, 1.8961727619171143e-06, 1.9585713744163513e-06, 2.0209699869155884e-06, 2.0833685994148254e-06, 2.1457672119140625e-06]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 9.0, 8.0, 7.0, 17.0, 26.0, 22.0, 34.0, 37.0, 60.0, 61.0, 108.0, 151.0, 187.0, 351.0, 936.0, 4102.0, 36720.0, 650106.0, 327137.0, 23737.0, 3007.0, 684.0, 323.0, 173.0, 123.0, 102.0, 67.0, 53.0, 41.0, 30.0, 22.0, 25.0, 19.0, 16.0, 7.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.212690353393555e-05, -3.117881715297699e-05, -3.0230730772018433e-05, -2.9282644391059875e-05, -2.833455801010132e-05, -2.738647162914276e-05, -2.6438385248184204e-05, -2.5490298867225647e-05, -2.454221248626709e-05, -2.3594126105308533e-05, -2.2646039724349976e-05, -2.169795334339142e-05, -2.074986696243286e-05, -1.9801780581474304e-05, -1.8853694200515747e-05, -1.790560781955719e-05, -1.6957521438598633e-05, -1.6009435057640076e-05, -1.5061348676681519e-05, -1.4113262295722961e-05, -1.3165175914764404e-05, -1.2217089533805847e-05, -1.126900315284729e-05, -1.0320916771888733e-05, -9.372830390930176e-06, -8.424744009971619e-06, -7.4766576290130615e-06, -6.528571248054504e-06, -5.580484867095947e-06, -4.63239848613739e-06, -3.684312105178833e-06, -2.736225724220276e-06, -1.7881393432617188e-06, -8.400529623031616e-07, 1.0803341865539551e-07, 1.0561197996139526e-06, 2.0042061805725098e-06, 2.952292561531067e-06, 3.900378942489624e-06, 4.848465323448181e-06, 5.796551704406738e-06, 6.744638085365295e-06, 7.692724466323853e-06, 8.64081084728241e-06, 9.588897228240967e-06, 1.0536983609199524e-05, 1.1485069990158081e-05, 1.2433156371116638e-05, 1.3381242752075195e-05, 1.4329329133033752e-05, 1.527741551399231e-05, 1.6225501894950867e-05, 1.7173588275909424e-05, 1.812167465686798e-05, 1.9069761037826538e-05, 2.0017847418785095e-05, 2.0965933799743652e-05, 2.191402018070221e-05, 2.2862106561660767e-05, 2.3810192942619324e-05, 2.475827932357788e-05, 2.5706365704536438e-05, 2.6654452085494995e-05, 2.7602538466453552e-05, 2.855062484741211e-05]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 10.0, 24.0, 51.0, 137.0, 275.0, 278.0, 143.0, 52.0, 23.0, 4.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0994086753489682e-06, -1.9088206499873195e-06, -1.7182326246256707e-06, -1.527644599264022e-06, -1.3370565739023732e-06, -1.1464685485407244e-06, -9.558806368659134e-07, -7.652926115042646e-07, -5.747045861426159e-07, -3.841165607809671e-07, -1.935285638410278e-07, -2.9405669010884594e-09, 1.876474584605603e-07, 3.7823548382220906e-07, 5.68823452340439e-07, 7.594114777020877e-07, 9.499995030637365e-07, 1.1405875284253852e-06, 1.331175553787034e-06, 1.5217635791486828e-06, 1.7123516045103315e-06, 1.9029396298719803e-06, 2.093527655233629e-06, 2.2841154532216024e-06, 2.4747037059569266e-06, 2.6652917313185753e-06, 2.855879756680224e-06, 3.046467782041873e-06, 3.2370558074035216e-06, 3.4276438327651704e-06, 3.618231858126819e-06, 3.8088196561147925e-06, 3.999407908850117e-06, 4.18999570683809e-06, 4.380583959573414e-06, 4.5711717575613875e-06, 4.761760010296712e-06, 4.952347808284685e-06, 5.142936061020009e-06, 5.3335238590079825e-06, 5.524112111743307e-06, 5.71469990973128e-06, 5.905288162466604e-06, 6.095875960454578e-06, 6.286464213189902e-06, 6.477052011177875e-06, 6.667640263913199e-06, 6.858228061901173e-06, 7.048815859889146e-06, 7.239403657877119e-06, 7.4299919106124435e-06, 7.620579708600417e-06, 7.811167961335741e-06, 8.001756214071065e-06, 8.192343557311688e-06, 8.382931810047012e-06, 8.573520062782336e-06, 8.76410831551766e-06, 8.954695658758283e-06, 9.145283911493607e-06, 9.335872164228931e-06, 9.526460416964255e-06, 9.717047760204878e-06, 9.907636012940202e-06, 1.0098224265675526e-05]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 8.0, 16.0, 20.0, 0.0, 24.0, 30.0, 35.0, 29.0, 40.0, 54.0, 65.0, 65.0, 62.0, 0.0, 72.0, 65.0, 50.0, 56.0, 48.0, 43.0, 37.0, 33.0, 36.0, 24.0, 0.0, 12.0, 15.0, 14.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7285346984863281e-06, -1.6745179891586304e-06, -1.6205012798309326e-06, -1.5664845705032349e-06, -1.5124678611755371e-06, -1.4584511518478394e-06, -1.4044344425201416e-06, -1.3504177331924438e-06, -1.296401023864746e-06, -1.2423843145370483e-06, -1.1883676052093506e-06, -1.1343508958816528e-06, -1.080334186553955e-06, -1.0263174772262573e-06, -9.723007678985596e-07, -9.182840585708618e-07, -8.642673492431641e-07, -8.102506399154663e-07, -7.562339305877686e-07, -7.022172212600708e-07, -6.48200511932373e-07, -5.941838026046753e-07, -5.401670932769775e-07, -4.861503839492798e-07, -4.3213367462158203e-07, -3.781169652938843e-07, -3.241002559661865e-07, -2.7008354663848877e-07, -2.1606683731079102e-07, -1.6205012798309326e-07, -1.0803341865539551e-07, -5.4016709327697754e-08, 0.0, 5.4016709327697754e-08, 1.0803341865539551e-07, 1.6205012798309326e-07, 2.1606683731079102e-07, 2.7008354663848877e-07, 3.241002559661865e-07, 3.781169652938843e-07, 4.3213367462158203e-07, 4.861503839492798e-07, 5.401670932769775e-07, 5.941838026046753e-07, 6.48200511932373e-07, 7.022172212600708e-07, 7.562339305877686e-07, 8.102506399154663e-07, 8.642673492431641e-07, 9.182840585708618e-07, 9.723007678985596e-07, 1.0263174772262573e-06, 1.080334186553955e-06, 1.1343508958816528e-06, 1.1883676052093506e-06, 1.2423843145370483e-06, 1.296401023864746e-06, 1.3504177331924438e-06, 1.4044344425201416e-06, 1.4584511518478394e-06, 1.5124678611755371e-06, 1.5664845705032349e-06, 1.6205012798309326e-06, 1.6745179891586304e-06, 1.7285346984863281e-06]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 1.0, 8.0, 3.0, 7.0, 9.0, 12.0, 8.0, 14.0, 17.0, 12.0, 26.0, 23.0, 26.0, 36.0, 30.0, 26.0, 35.0, 47.0, 40.0, 42.0, 44.0, 46.0, 40.0, 39.0, 41.0, 30.0, 29.0, 25.0, 35.0, 32.0, 29.0, 27.0, 24.0, 21.0, 24.0, 20.0, 12.0, 13.0, 13.0, 7.0, 8.0, 4.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.818359375, -3.690948486328125, -3.56353759765625, -3.436126708984375, -3.3087158203125, -3.181304931640625, -3.05389404296875, -2.926483154296875, -2.799072265625, -2.671661376953125, -2.54425048828125, -2.416839599609375, -2.2894287109375, -2.162017822265625, -2.03460693359375, -1.907196044921875, -1.77978515625, -1.652374267578125, -1.52496337890625, -1.397552490234375, -1.2701416015625, -1.142730712890625, -1.01531982421875, -0.887908935546875, -0.760498046875, -0.633087158203125, -0.50567626953125, -0.378265380859375, -0.2508544921875, -0.123443603515625, 0.00396728515625, 0.131378173828125, 0.2587890625, 0.386199951171875, 0.51361083984375, 0.641021728515625, 0.7684326171875, 0.895843505859375, 1.02325439453125, 1.150665283203125, 1.278076171875, 1.405487060546875, 1.53289794921875, 1.660308837890625, 1.7877197265625, 1.915130615234375, 2.04254150390625, 2.169952392578125, 2.29736328125, 2.424774169921875, 2.55218505859375, 2.679595947265625, 2.8070068359375, 2.934417724609375, 3.06182861328125, 3.189239501953125, 3.316650390625, 3.444061279296875, 3.57147216796875, 3.698883056640625, 3.8262939453125, 3.953704833984375, 4.08111572265625, 4.208526611328125, 4.3359375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 11.0, 22.0, 18.0, 29.0, 41.0, 45.0, 55.0, 74.0, 78.0, 117.0, 135.0, 206.0, 275.0, 378.0, 561.0, 908.0, 1538.0, 2909.0, 5663.0, 11737.0, 25716.0, 59516.0, 141002.0, 270446.0, 272416.0, 142819.0, 60882.0, 26043.0, 11649.0, 5670.0, 2963.0, 1612.0, 903.0, 592.0, 417.0, 247.0, 186.0, 150.0, 139.0, 83.0, 67.0, 65.0, 45.0, 32.0, 24.0, 15.0, 11.0, 12.0, 8.0, 7.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.9140625, -3.78363037109375, -3.6531982421875, -3.52276611328125, -3.392333984375, -3.26190185546875, -3.1314697265625, -3.00103759765625, -2.87060546875, -2.74017333984375, -2.6097412109375, -2.47930908203125, -2.348876953125, -2.21844482421875, -2.0880126953125, -1.95758056640625, -1.8271484375, -1.69671630859375, -1.5662841796875, -1.43585205078125, -1.305419921875, -1.17498779296875, -1.0445556640625, -0.91412353515625, -0.78369140625, -0.65325927734375, -0.5228271484375, -0.39239501953125, -0.261962890625, -0.13153076171875, -0.0010986328125, 0.12933349609375, 0.259765625, 0.39019775390625, 0.5206298828125, 0.65106201171875, 0.781494140625, 0.91192626953125, 1.0423583984375, 1.17279052734375, 1.30322265625, 1.43365478515625, 1.5640869140625, 1.69451904296875, 1.824951171875, 1.95538330078125, 2.0858154296875, 2.21624755859375, 2.3466796875, 2.47711181640625, 2.6075439453125, 2.73797607421875, 2.868408203125, 2.99884033203125, 3.1292724609375, 3.25970458984375, 3.39013671875, 3.52056884765625, 3.6510009765625, 3.78143310546875, 3.911865234375, 4.04229736328125, 4.1727294921875, 4.30316162109375, 4.43359375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 7.0, 11.0, 19.0, 17.0, 21.0, 16.0, 39.0, 37.0, 26.0, 40.0, 60.0, 62.0, 81.0, 184.0, 358.0, 1415.0, 178.0, 95.0, 57.0, 59.0, 42.0, 31.0, 35.0, 28.0, 33.0, 16.0, 20.0, 12.0, 3.0, 9.0, 5.0, 10.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9375, -11.5654296875, -11.193359375, -10.8212890625, -10.44921875, -10.0771484375, -9.705078125, -9.3330078125, -8.9609375, -8.5888671875, -8.216796875, -7.8447265625, -7.47265625, -7.1005859375, -6.728515625, -6.3564453125, -5.984375, -5.6123046875, -5.240234375, -4.8681640625, -4.49609375, -4.1240234375, -3.751953125, -3.3798828125, -3.0078125, -2.6357421875, -2.263671875, -1.8916015625, -1.51953125, -1.1474609375, -0.775390625, -0.4033203125, -0.03125, 0.3408203125, 0.712890625, 1.0849609375, 1.45703125, 1.8291015625, 2.201171875, 2.5732421875, 2.9453125, 3.3173828125, 3.689453125, 4.0615234375, 4.43359375, 4.8056640625, 5.177734375, 5.5498046875, 5.921875, 6.2939453125, 6.666015625, 7.0380859375, 7.41015625, 7.7822265625, 8.154296875, 8.5263671875, 8.8984375, 9.2705078125, 9.642578125, 10.0146484375, 10.38671875, 10.7587890625, 11.130859375, 11.5029296875, 11.875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 5.0, 7.0, 11.0, 13.0, 18.0, 30.0, 22.0, 43.0, 52.0, 47.0, 69.0, 104.0, 140.0, 210.0, 395.0, 719.0, 2516.0, 69428.0, 3012451.0, 55147.0, 2330.0, 748.0, 379.0, 231.0, 136.0, 118.0, 69.0, 55.0, 54.0, 27.0, 28.0, 28.0, 16.0, 14.0, 7.0, 9.0, 3.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.359375, -16.789794921875, -16.22021484375, -15.650634765625, -15.0810546875, -14.511474609375, -13.94189453125, -13.372314453125, -12.802734375, -12.233154296875, -11.66357421875, -11.093994140625, -10.5244140625, -9.954833984375, -9.38525390625, -8.815673828125, -8.24609375, -7.676513671875, -7.10693359375, -6.537353515625, -5.9677734375, -5.398193359375, -4.82861328125, -4.259033203125, -3.689453125, -3.119873046875, -2.55029296875, -1.980712890625, -1.4111328125, -0.841552734375, -0.27197265625, 0.297607421875, 0.8671875, 1.436767578125, 2.00634765625, 2.575927734375, 3.1455078125, 3.715087890625, 4.28466796875, 4.854248046875, 5.423828125, 5.993408203125, 6.56298828125, 7.132568359375, 7.7021484375, 8.271728515625, 8.84130859375, 9.410888671875, 9.98046875, 10.550048828125, 11.11962890625, 11.689208984375, 12.2587890625, 12.828369140625, 13.39794921875, 13.967529296875, 14.537109375, 15.106689453125, 15.67626953125, 16.245849609375, 16.8154296875, 17.385009765625, 17.95458984375, 18.524169921875, 19.09375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 44.0, 282.0, 482.0, 165.0, 31.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.62942886352539, -51.48860168457031, -48.347774505615234, -45.206947326660156, -42.06611633300781, -38.925289154052734, -35.784461975097656, -32.64363098144531, -29.502805709838867, -26.36197853088379, -23.221149444580078, -20.080322265625, -16.939495086669922, -13.798666000366211, -10.657838821411133, -7.517009735107422, -4.376182556152344, -1.2353546619415283, 1.905473232269287, 5.046300888061523, 8.187129020690918, 11.327957153320312, 14.46878433227539, 17.6096134185791, 20.75044059753418, 23.891267776489258, 27.03209686279297, 30.172924041748047, 33.313751220703125, 36.45458221435547, 39.59540557861328, 42.736236572265625, 45.87706756591797, 49.01789474487305, 52.158721923828125, 55.29955291748047, 58.44038009643555, 61.581207275390625, 64.72203063964844, 67.86286163330078, 71.00369262695312, 74.14452362060547, 77.28534698486328, 80.42617797851562, 83.56700134277344, 86.70783233642578, 89.84866333007812, 92.98948669433594, 96.13031005859375, 99.2711410522461, 102.4119644165039, 105.55279541015625, 108.69361877441406, 111.8344497680664, 114.97528076171875, 118.11610412597656, 121.2569351196289, 124.39776611328125, 127.53858947753906, 130.67941284179688, 133.82025146484375, 136.96107482910156, 140.10189819335938, 143.24273681640625, 146.38356018066406]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 8.0, 7.0, 3.0, 5.0, 8.0, 15.0, 19.0, 16.0, 27.0, 32.0, 21.0, 37.0, 48.0, 30.0, 56.0, 45.0, 54.0, 52.0, 51.0, 45.0, 41.0, 40.0, 44.0, 48.0, 33.0, 27.0, 33.0, 29.0, 30.0, 21.0, 17.0, 16.0, 9.0, 8.0, 16.0, 7.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.740962982177734, -39.63297653198242, -38.524993896484375, -37.41700744628906, -36.30902099609375, -35.2010383605957, -34.09305191040039, -32.985069274902344, -31.87708282470703, -30.76909828186035, -29.661113739013672, -28.55312728881836, -27.44514274597168, -26.337158203125, -25.229171752929688, -24.121187210083008, -23.013202667236328, -21.90521812438965, -20.79723358154297, -19.689247131347656, -18.581262588500977, -17.473278045654297, -16.365291595458984, -15.257307052612305, -14.149322509765625, -13.041337966918945, -11.93335247039795, -10.825366973876953, -9.717382431030273, -8.609397888183594, -7.501412391662598, -6.39342737197876, -5.285442352294922, -4.177457332611084, -3.069472312927246, -1.9614872932434082, -0.8535022735595703, 0.2544827461242676, 1.3624677658081055, 2.4704527854919434, 3.5784378051757812, 4.686422824859619, 5.794407844543457, 6.902392864227295, 8.010377883911133, 9.118362426757812, 10.226347923278809, 11.334333419799805, 12.442317962646484, 13.550302505493164, 14.65828800201416, 15.766273498535156, 16.874258041381836, 17.982242584228516, 19.090229034423828, 20.198213577270508, 21.306198120117188, 22.414182662963867, 23.522167205810547, 24.63015365600586, 25.73813819885254, 26.84612274169922, 27.95410919189453, 29.06209373474121, 30.17007827758789]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 4.0, 4.0, 2.0, 7.0, 5.0, 6.0, 6.0, 5.0, 11.0, 10.0, 15.0, 22.0, 16.0, 20.0, 23.0, 25.0, 33.0, 26.0, 30.0, 38.0, 27.0, 27.0, 41.0, 39.0, 54.0, 40.0, 31.0, 36.0, 33.0, 27.0, 35.0, 18.0, 31.0, 28.0, 21.0, 16.0, 25.0, 23.0, 24.0, 23.0, 10.0, 11.0, 13.0, 12.0, 11.0, 8.0, 8.0, 5.0, 8.0, 5.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0], "bins": [-4.33203125, -4.203399658203125, -4.07476806640625, -3.946136474609375, -3.8175048828125, -3.688873291015625, -3.56024169921875, -3.431610107421875, -3.302978515625, -3.174346923828125, -3.04571533203125, -2.917083740234375, -2.7884521484375, -2.659820556640625, -2.53118896484375, -2.402557373046875, -2.27392578125, -2.145294189453125, -2.01666259765625, -1.888031005859375, -1.7593994140625, -1.630767822265625, -1.50213623046875, -1.373504638671875, -1.244873046875, -1.116241455078125, -0.98760986328125, -0.858978271484375, -0.7303466796875, -0.601715087890625, -0.47308349609375, -0.344451904296875, -0.2158203125, -0.087188720703125, 0.04144287109375, 0.170074462890625, 0.2987060546875, 0.427337646484375, 0.55596923828125, 0.684600830078125, 0.813232421875, 0.941864013671875, 1.07049560546875, 1.199127197265625, 1.3277587890625, 1.456390380859375, 1.58502197265625, 1.713653564453125, 1.84228515625, 1.970916748046875, 2.09954833984375, 2.228179931640625, 2.3568115234375, 2.485443115234375, 2.61407470703125, 2.742706298828125, 2.871337890625, 2.999969482421875, 3.12860107421875, 3.257232666015625, 3.3858642578125, 3.514495849609375, 3.64312744140625, 3.771759033203125, 3.900390625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 8.0, 7.0, 7.0, 8.0, 7.0, 22.0, 16.0, 27.0, 26.0, 60.0, 71.0, 95.0, 118.0, 166.0, 219.0, 316.0, 425.0, 655.0, 1216.0, 2775.0, 11505.0, 114488.0, 2172891.0, 1783821.0, 90025.0, 9515.0, 2506.0, 1081.0, 633.0, 416.0, 289.0, 219.0, 160.0, 114.0, 100.0, 79.0, 45.0, 33.0, 31.0, 17.0, 20.0, 16.0, 4.0, 5.0, 3.0, 5.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0], "bins": [-24.484375, -23.783935546875, -23.08349609375, -22.383056640625, -21.6826171875, -20.982177734375, -20.28173828125, -19.581298828125, -18.880859375, -18.180419921875, -17.47998046875, -16.779541015625, -16.0791015625, -15.378662109375, -14.67822265625, -13.977783203125, -13.27734375, -12.576904296875, -11.87646484375, -11.176025390625, -10.4755859375, -9.775146484375, -9.07470703125, -8.374267578125, -7.673828125, -6.973388671875, -6.27294921875, -5.572509765625, -4.8720703125, -4.171630859375, -3.47119140625, -2.770751953125, -2.0703125, -1.369873046875, -0.66943359375, 0.031005859375, 0.7314453125, 1.431884765625, 2.13232421875, 2.832763671875, 3.533203125, 4.233642578125, 4.93408203125, 5.634521484375, 6.3349609375, 7.035400390625, 7.73583984375, 8.436279296875, 9.13671875, 9.837158203125, 10.53759765625, 11.238037109375, 11.9384765625, 12.638916015625, 13.33935546875, 14.039794921875, 14.740234375, 15.440673828125, 16.14111328125, 16.841552734375, 17.5419921875, 18.242431640625, 18.94287109375, 19.643310546875, 20.34375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 9.0, 6.0, 10.0, 11.0, 14.0, 20.0, 30.0, 49.0, 63.0, 107.0, 175.0, 211.0, 295.0, 353.0, 434.0, 477.0, 469.0, 393.0, 276.0, 186.0, 155.0, 102.0, 63.0, 46.0, 32.0, 21.0, 23.0, 10.0, 8.0, 4.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6640625, -9.3603515625, -9.056640625, -8.7529296875, -8.44921875, -8.1455078125, -7.841796875, -7.5380859375, -7.234375, -6.9306640625, -6.626953125, -6.3232421875, -6.01953125, -5.7158203125, -5.412109375, -5.1083984375, -4.8046875, -4.5009765625, -4.197265625, -3.8935546875, -3.58984375, -3.2861328125, -2.982421875, -2.6787109375, -2.375, -2.0712890625, -1.767578125, -1.4638671875, -1.16015625, -0.8564453125, -0.552734375, -0.2490234375, 0.0546875, 0.3583984375, 0.662109375, 0.9658203125, 1.26953125, 1.5732421875, 1.876953125, 2.1806640625, 2.484375, 2.7880859375, 3.091796875, 3.3955078125, 3.69921875, 4.0029296875, 4.306640625, 4.6103515625, 4.9140625, 5.2177734375, 5.521484375, 5.8251953125, 6.12890625, 6.4326171875, 6.736328125, 7.0400390625, 7.34375, 7.6474609375, 7.951171875, 8.2548828125, 8.55859375, 8.8623046875, 9.166015625, 9.4697265625, 9.7734375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 11.0, 12.0, 16.0, 46.0, 68.0, 154.0, 292.0, 712.0, 1845.0, 7132.0, 49782.0, 574114.0, 2890757.0, 606610.0, 52068.0, 7339.0, 1925.0, 732.0, 334.0, 146.0, 80.0, 39.0, 26.0, 7.0, 14.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.9296875, -12.4761962890625, -12.022705078125, -11.5692138671875, -11.11572265625, -10.6622314453125, -10.208740234375, -9.7552490234375, -9.3017578125, -8.8482666015625, -8.394775390625, -7.9412841796875, -7.48779296875, -7.0343017578125, -6.580810546875, -6.1273193359375, -5.673828125, -5.2203369140625, -4.766845703125, -4.3133544921875, -3.85986328125, -3.4063720703125, -2.952880859375, -2.4993896484375, -2.0458984375, -1.5924072265625, -1.138916015625, -0.6854248046875, -0.23193359375, 0.2215576171875, 0.675048828125, 1.1285400390625, 1.58203125, 2.0355224609375, 2.489013671875, 2.9425048828125, 3.39599609375, 3.8494873046875, 4.302978515625, 4.7564697265625, 5.2099609375, 5.6634521484375, 6.116943359375, 6.5704345703125, 7.02392578125, 7.4774169921875, 7.930908203125, 8.3843994140625, 8.837890625, 9.2913818359375, 9.744873046875, 10.1983642578125, 10.65185546875, 11.1053466796875, 11.558837890625, 12.0123291015625, 12.4658203125, 12.9193115234375, 13.372802734375, 13.8262939453125, 14.27978515625, 14.7332763671875, 15.186767578125, 15.6402587890625, 16.09375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 13.0, 22.0, 33.0, 54.0, 74.0, 100.0, 114.0, 118.0, 124.0, 121.0, 79.0, 54.0, 32.0, 22.0, 13.0, 11.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.53193664550781, -77.36991119384766, -74.2078857421875, -71.04585266113281, -67.88382720947266, -64.7218017578125, -61.559776306152344, -58.39774703979492, -55.2357177734375, -52.073692321777344, -48.91166305541992, -45.749637603759766, -42.587608337402344, -39.42558288574219, -36.26355743408203, -33.10152816772461, -29.939502716064453, -26.777475357055664, -23.615447998046875, -20.45342254638672, -17.291393280029297, -14.129366874694824, -10.967340469360352, -7.8053131103515625, -4.643285751342773, -1.4812586307525635, 1.6807684898376465, 4.842795372009277, 8.004822731018066, 11.166850090026855, 14.328876495361328, 17.490903854370117, 20.652931213378906, 23.814958572387695, 26.976985931396484, 30.13901138305664, 33.30104064941406, 36.46306610107422, 39.625091552734375, 42.7871208190918, 45.94915008544922, 49.111175537109375, 52.2732048034668, 55.43523025512695, 58.597259521484375, 61.75928497314453, 64.92131042480469, 68.08334350585938, 71.245361328125, 74.40738677978516, 77.56941223144531, 80.7314453125, 83.89347076416016, 87.05549621582031, 90.21752166748047, 93.37954711914062, 96.54158020019531, 99.70360565185547, 102.86563110351562, 106.02766418457031, 109.18968963623047, 112.35171508789062, 115.51374053955078, 118.67576599121094, 121.83779907226562]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 11.0, 14.0, 10.0, 10.0, 14.0, 19.0, 16.0, 29.0, 27.0, 24.0, 21.0, 31.0, 32.0, 31.0, 46.0, 30.0, 47.0, 32.0, 40.0, 42.0, 45.0, 31.0, 43.0, 42.0, 31.0, 36.0, 27.0, 23.0, 23.0, 18.0, 19.0, 16.0, 28.0, 20.0, 6.0, 11.0, 9.0, 10.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-45.17182159423828, -43.788028717041016, -42.404232025146484, -41.02043914794922, -39.63664245605469, -38.25284957885742, -36.869056701660156, -35.485260009765625, -34.101463317871094, -32.71767044067383, -31.333873748779297, -29.95008087158203, -28.5662841796875, -27.182491302490234, -25.798696517944336, -24.414901733398438, -23.031108856201172, -21.647314071655273, -20.263519287109375, -18.87972640991211, -17.495929718017578, -16.112136840820312, -14.728342056274414, -13.344547271728516, -11.960752487182617, -10.576957702636719, -9.19316291809082, -7.809369087219238, -6.42557430267334, -5.041779518127441, -3.6579856872558594, -2.274190902709961, -0.8903961181640625, 0.49339842796325684, 1.8771929740905762, 3.2609872817993164, 4.644782066345215, 6.028576850891113, 7.412370681762695, 8.796165466308594, 10.179960250854492, 11.56375503540039, 12.947549819946289, 14.331343650817871, 15.71513843536377, 17.098934173583984, 18.48272705078125, 19.86652183532715, 21.250316619873047, 22.634111404418945, 24.017906188964844, 25.40169906616211, 26.78549575805664, 28.169288635253906, 29.553083419799805, 30.936878204345703, 32.32067108154297, 33.704463958740234, 35.088260650634766, 36.47205352783203, 37.85585021972656, 39.23964309692383, 40.623435974121094, 42.007232666015625, 43.391029357910156]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 13.0, 8.0, 5.0, 13.0, 17.0, 21.0, 27.0, 24.0, 25.0, 30.0, 32.0, 38.0, 33.0, 34.0, 44.0, 46.0, 40.0, 44.0, 46.0, 37.0, 37.0, 48.0, 47.0, 36.0, 29.0, 29.0, 30.0, 26.0, 20.0, 24.0, 17.0, 22.0, 5.0, 10.0, 10.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-101.125, -97.84765625, -94.5703125, -91.29296875, -88.015625, -84.73828125, -81.4609375, -78.18359375, -74.90625, -71.62890625, -68.3515625, -65.07421875, -61.796875, -58.51953125, -55.2421875, -51.96484375, -48.6875, -45.41015625, -42.1328125, -38.85546875, -35.578125, -32.30078125, -29.0234375, -25.74609375, -22.46875, -19.19140625, -15.9140625, -12.63671875, -9.359375, -6.08203125, -2.8046875, 0.47265625, 3.75, 7.02734375, 10.3046875, 13.58203125, 16.859375, 20.13671875, 23.4140625, 26.69140625, 29.96875, 33.24609375, 36.5234375, 39.80078125, 43.078125, 46.35546875, 49.6328125, 52.91015625, 56.1875, 59.46484375, 62.7421875, 66.01953125, 69.296875, 72.57421875, 75.8515625, 79.12890625, 82.40625, 85.68359375, 88.9609375, 92.23828125, 95.515625, 98.79296875, 102.0703125, 105.34765625, 108.625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 19.0, 24.0, 30.0, 44.0, 78.0, 106.0, 159.0, 224.0, 367.0, 570.0, 885.0, 1286.0, 2097.0, 3218.0, 5266.0, 8036.0, 12892.0, 20736.0, 33053.0, 55151.0, 97546.0, 210835.0, 307353.0, 119870.0, 65136.0, 38911.0, 23650.0, 15039.0, 9360.0, 6001.0, 3753.0, 2431.0, 1497.0, 1027.0, 622.0, 411.0, 273.0, 196.0, 125.0, 75.0, 57.0, 44.0, 28.0, 22.0, 17.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.4765625, -4.341552734375, -4.20654296875, -4.071533203125, -3.9365234375, -3.801513671875, -3.66650390625, -3.531494140625, -3.396484375, -3.261474609375, -3.12646484375, -2.991455078125, -2.8564453125, -2.721435546875, -2.58642578125, -2.451416015625, -2.31640625, -2.181396484375, -2.04638671875, -1.911376953125, -1.7763671875, -1.641357421875, -1.50634765625, -1.371337890625, -1.236328125, -1.101318359375, -0.96630859375, -0.831298828125, -0.6962890625, -0.561279296875, -0.42626953125, -0.291259765625, -0.15625, -0.021240234375, 0.11376953125, 0.248779296875, 0.3837890625, 0.518798828125, 0.65380859375, 0.788818359375, 0.923828125, 1.058837890625, 1.19384765625, 1.328857421875, 1.4638671875, 1.598876953125, 1.73388671875, 1.868896484375, 2.00390625, 2.138916015625, 2.27392578125, 2.408935546875, 2.5439453125, 2.678955078125, 2.81396484375, 2.948974609375, 3.083984375, 3.218994140625, 3.35400390625, 3.489013671875, 3.6240234375, 3.759033203125, 3.89404296875, 4.029052734375, 4.1640625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 7.0, 10.0, 12.0, 5.0, 19.0, 11.0, 12.0, 19.0, 21.0, 23.0, 34.0, 30.0, 35.0, 30.0, 39.0, 36.0, 39.0, 33.0, 37.0, 1059.0, 39.0, 57.0, 47.0, 45.0, 37.0, 37.0, 29.0, 28.0, 33.0, 30.0, 26.0, 20.0, 16.0, 14.0, 8.0, 9.0, 12.0, 4.0, 3.0, 5.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.4375, -65.087890625, -62.73828125, -60.388671875, -58.0390625, -55.689453125, -53.33984375, -50.990234375, -48.640625, -46.291015625, -43.94140625, -41.591796875, -39.2421875, -36.892578125, -34.54296875, -32.193359375, -29.84375, -27.494140625, -25.14453125, -22.794921875, -20.4453125, -18.095703125, -15.74609375, -13.396484375, -11.046875, -8.697265625, -6.34765625, -3.998046875, -1.6484375, 0.701171875, 3.05078125, 5.400390625, 7.75, 10.099609375, 12.44921875, 14.798828125, 17.1484375, 19.498046875, 21.84765625, 24.197265625, 26.546875, 28.896484375, 31.24609375, 33.595703125, 35.9453125, 38.294921875, 40.64453125, 42.994140625, 45.34375, 47.693359375, 50.04296875, 52.392578125, 54.7421875, 57.091796875, 59.44140625, 61.791015625, 64.140625, 66.490234375, 68.83984375, 71.189453125, 73.5390625, 75.888671875, 78.23828125, 80.587890625, 82.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 13.0, 19.0, 35.0, 54.0, 66.0, 104.0, 195.0, 250.0, 377.0, 581.0, 875.0, 1257.0, 1843.0, 2775.0, 4029.0, 6481.0, 9632.0, 15090.0, 23662.0, 37691.0, 63651.0, 116625.0, 1328971.0, 223192.0, 104372.0, 57769.0, 35137.0, 21827.0, 13888.0, 9019.0, 5900.0, 4062.0, 2472.0, 1729.0, 1182.0, 722.0, 520.0, 337.0, 236.0, 156.0, 120.0, 68.0, 54.0, 28.0, 22.0, 15.0, 15.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.388671875, -2.31610107421875, -2.2435302734375, -2.17095947265625, -2.098388671875, -2.02581787109375, -1.9532470703125, -1.88067626953125, -1.80810546875, -1.73553466796875, -1.6629638671875, -1.59039306640625, -1.517822265625, -1.44525146484375, -1.3726806640625, -1.30010986328125, -1.2275390625, -1.15496826171875, -1.0823974609375, -1.00982666015625, -0.937255859375, -0.86468505859375, -0.7921142578125, -0.71954345703125, -0.64697265625, -0.57440185546875, -0.5018310546875, -0.42926025390625, -0.356689453125, -0.28411865234375, -0.2115478515625, -0.13897705078125, -0.06640625, 0.00616455078125, 0.0787353515625, 0.15130615234375, 0.223876953125, 0.29644775390625, 0.3690185546875, 0.44158935546875, 0.51416015625, 0.58673095703125, 0.6593017578125, 0.73187255859375, 0.804443359375, 0.87701416015625, 0.9495849609375, 1.02215576171875, 1.0947265625, 1.16729736328125, 1.2398681640625, 1.31243896484375, 1.385009765625, 1.45758056640625, 1.5301513671875, 1.60272216796875, 1.67529296875, 1.74786376953125, 1.8204345703125, 1.89300537109375, 1.965576171875, 2.03814697265625, 2.1107177734375, 2.18328857421875, 2.255859375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 6.0, 10.0, 9.0, 14.0, 12.0, 18.0, 19.0, 24.0, 31.0, 37.0, 51.0, 64.0, 87.0, 94.0, 110.0, 82.0, 62.0, 60.0, 51.0, 35.0, 27.0, 19.0, 16.0, 12.0, 10.0, 7.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0961971282958984e-05, -4.9219466745853424e-05, -4.7476962208747864e-05, -4.5734457671642303e-05, -4.399195313453674e-05, -4.224944859743118e-05, -4.050694406032562e-05, -3.876443952322006e-05, -3.70219349861145e-05, -3.527943044900894e-05, -3.353692591190338e-05, -3.179442137479782e-05, -3.005191683769226e-05, -2.83094123005867e-05, -2.656690776348114e-05, -2.482440322637558e-05, -2.308189868927002e-05, -2.133939415216446e-05, -1.95968896150589e-05, -1.785438507795334e-05, -1.611188054084778e-05, -1.4369376003742218e-05, -1.2626871466636658e-05, -1.0884366929531097e-05, -9.141862392425537e-06, -7.399357855319977e-06, -5.6568533182144165e-06, -3.914348781108856e-06, -2.171844244003296e-06, -4.293397068977356e-07, 1.3131648302078247e-06, 3.055669367313385e-06, 4.798173904418945e-06, 6.540678441524506e-06, 8.283182978630066e-06, 1.0025687515735626e-05, 1.1768192052841187e-05, 1.3510696589946747e-05, 1.5253201127052307e-05, 1.6995705664157867e-05, 1.8738210201263428e-05, 2.0480714738368988e-05, 2.222321927547455e-05, 2.396572381258011e-05, 2.570822834968567e-05, 2.745073288679123e-05, 2.919323742389679e-05, 3.093574196100235e-05, 3.267824649810791e-05, 3.442075103521347e-05, 3.616325557231903e-05, 3.790576010942459e-05, 3.964826464653015e-05, 4.139076918363571e-05, 4.313327372074127e-05, 4.487577825784683e-05, 4.661828279495239e-05, 4.836078733205795e-05, 5.010329186916351e-05, 5.1845796406269073e-05, 5.3588300943374634e-05, 5.5330805480480194e-05, 5.7073310017585754e-05, 5.8815814554691315e-05, 6.0558319091796875e-05]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 14.0, 8.0, 17.0, 27.0, 33.0, 56.0, 96.0, 138.0, 188.0, 320.0, 542.0, 984.0, 1764.0, 3517.0, 7526.0, 17231.0, 42015.0, 122735.0, 490472.0, 241510.0, 70852.0, 26365.0, 11354.0, 5125.0, 2497.0, 1279.0, 741.0, 394.0, 267.0, 153.0, 106.0, 65.0, 41.0, 36.0, 16.0, 16.0, 8.0, 8.0, 6.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002391338348388672, -0.00023204833269119263, -0.00022496283054351807, -0.0002178773283958435, -0.00021079182624816895, -0.00020370632410049438, -0.00019662082195281982, -0.00018953531980514526, -0.0001824498176574707, -0.00017536431550979614, -0.00016827881336212158, -0.00016119331121444702, -0.00015410780906677246, -0.0001470223069190979, -0.00013993680477142334, -0.00013285130262374878, -0.00012576580047607422, -0.00011868029832839966, -0.0001115947961807251, -0.00010450929403305054, -9.742379188537598e-05, -9.033828973770142e-05, -8.325278759002686e-05, -7.61672854423523e-05, -6.908178329467773e-05, -6.199628114700317e-05, -5.491077899932861e-05, -4.782527685165405e-05, -4.073977470397949e-05, -3.365427255630493e-05, -2.656877040863037e-05, -1.948326826095581e-05, -1.239776611328125e-05, -5.3122639656066895e-06, 1.773238182067871e-06, 8.858740329742432e-06, 1.5944242477416992e-05, 2.3029744625091553e-05, 3.0115246772766113e-05, 3.7200748920440674e-05, 4.4286251068115234e-05, 5.1371753215789795e-05, 5.8457255363464355e-05, 6.554275751113892e-05, 7.262825965881348e-05, 7.971376180648804e-05, 8.67992639541626e-05, 9.388476610183716e-05, 0.00010097026824951172, 0.00010805577039718628, 0.00011514127254486084, 0.0001222267746925354, 0.00012931227684020996, 0.00013639777898788452, 0.00014348328113555908, 0.00015056878328323364, 0.0001576542854309082, 0.00016473978757858276, 0.00017182528972625732, 0.00017891079187393188, 0.00018599629402160645, 0.000193081796169281, 0.00020016729831695557, 0.00020725280046463013, 0.0002143383026123047]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 12.0, 17.0, 26.0, 31.0, 55.0, 67.0, 98.0, 94.0, 109.0, 104.0, 82.0, 74.0, 53.0, 51.0, 27.0, 25.0, 16.0, 14.0, 8.0, 9.0, 3.0, 3.0, 1.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4051616239594296e-05, -3.2660464057698846e-05, -3.126930823782459e-05, -2.987815605592914e-05, -2.848700387403369e-05, -2.709585169213824e-05, -2.5704697691253386e-05, -2.4313543690368533e-05, -2.2922391508473083e-05, -2.1531239326577634e-05, -2.014008532569278e-05, -1.8748931324807927e-05, -1.7357779142912477e-05, -1.5966626961017027e-05, -1.4575472960132174e-05, -1.3184319868742023e-05, -1.1793166777351871e-05, -1.040201368596172e-05, -9.010860594571568e-06, -7.6197075031814165e-06, -6.228554411791265e-06, -4.8374013204011135e-06, -3.446248229010962e-06, -2.0550951376208104e-06, -6.639420462306589e-07, 7.272110451594926e-07, 2.118364136549644e-06, 3.5095172279397957e-06, 4.900670319329947e-06, 6.291823410720099e-06, 7.68297650211025e-06, 9.074129593500402e-06, 1.046528632286936e-05, 1.1856439414259512e-05, 1.3247592505649664e-05, 1.4638745597039815e-05, 1.6029898688429967e-05, 1.7421050870325416e-05, 1.881220487121027e-05, 2.0203358872095123e-05, 2.1594511053990573e-05, 2.2985663235886022e-05, 2.4376817236770876e-05, 2.576797123765573e-05, 2.715912341955118e-05, 2.855027560144663e-05, 2.9941429602331482e-05, 3.1332583603216335e-05, 3.2723735785111785e-05, 3.4114887967007235e-05, 3.5506040148902684e-05, 3.689719596877694e-05, 3.828834815067239e-05, 3.967950033256784e-05, 4.10706561524421e-05, 4.246180833433755e-05, 4.3852960516233e-05, 4.524411269812845e-05, 4.66352648800239e-05, 4.8026420699898154e-05, 4.94175728817936e-05, 5.080872506368905e-05, 5.219988088356331e-05, 5.359103306545876e-05, 5.498218524735421e-05]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 7.0, 5.0, 17.0, 8.0, 13.0, 10.0, 14.0, 18.0, 20.0, 18.0, 26.0, 31.0, 32.0, 30.0, 28.0, 23.0, 21.0, 42.0, 45.0, 37.0, 51.0, 36.0, 36.0, 43.0, 41.0, 37.0, 39.0, 30.0, 37.0, 27.0, 29.0, 18.0, 12.0, 15.0, 20.0, 19.0, 10.0, 10.0, 10.0, 9.0, 2.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.3245811462402344e-05, -2.2532418370246887e-05, -2.181902527809143e-05, -2.1105632185935974e-05, -2.0392239093780518e-05, -1.967884600162506e-05, -1.8965452909469604e-05, -1.8252059817314148e-05, -1.753866672515869e-05, -1.6825273633003235e-05, -1.611188054084778e-05, -1.5398487448692322e-05, -1.4685094356536865e-05, -1.3971701264381409e-05, -1.3258308172225952e-05, -1.2544915080070496e-05, -1.1831521987915039e-05, -1.1118128895759583e-05, -1.0404735803604126e-05, -9.69134271144867e-06, -8.977949619293213e-06, -8.264556527137756e-06, -7.5511634349823e-06, -6.837770342826843e-06, -6.124377250671387e-06, -5.41098415851593e-06, -4.697591066360474e-06, -3.984197974205017e-06, -3.2708048820495605e-06, -2.557411789894104e-06, -1.8440186977386475e-06, -1.130625605583191e-06, -4.172325134277344e-07, 2.9616057872772217e-07, 1.0095536708831787e-06, 1.7229467630386353e-06, 2.436339855194092e-06, 3.1497329473495483e-06, 3.863126039505005e-06, 4.5765191316604614e-06, 5.289912223815918e-06, 6.0033053159713745e-06, 6.716698408126831e-06, 7.430091500282288e-06, 8.143484592437744e-06, 8.8568776845932e-06, 9.570270776748657e-06, 1.0283663868904114e-05, 1.099705696105957e-05, 1.1710450053215027e-05, 1.2423843145370483e-05, 1.313723623752594e-05, 1.3850629329681396e-05, 1.4564022421836853e-05, 1.527741551399231e-05, 1.5990808606147766e-05, 1.6704201698303223e-05, 1.741759479045868e-05, 1.8130987882614136e-05, 1.8844380974769592e-05, 1.955777406692505e-05, 2.0271167159080505e-05, 2.0984560251235962e-05, 2.169795334339142e-05, 2.2411346435546875e-05]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 13.0, 8.0, 5.0, 13.0, 17.0, 21.0, 27.0, 24.0, 25.0, 30.0, 32.0, 38.0, 33.0, 34.0, 44.0, 46.0, 40.0, 44.0, 46.0, 37.0, 37.0, 48.0, 47.0, 36.0, 29.0, 29.0, 30.0, 26.0, 20.0, 24.0, 17.0, 22.0, 5.0, 10.0, 10.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-101.125, -97.84765625, -94.5703125, -91.29296875, -88.015625, -84.73828125, -81.4609375, -78.18359375, -74.90625, -71.62890625, -68.3515625, -65.07421875, -61.796875, -58.51953125, -55.2421875, -51.96484375, -48.6875, -45.41015625, -42.1328125, -38.85546875, -35.578125, -32.30078125, -29.0234375, -25.74609375, -22.46875, -19.19140625, -15.9140625, -12.63671875, -9.359375, -6.08203125, -2.8046875, 0.47265625, 3.75, 7.02734375, 10.3046875, 13.58203125, 16.859375, 20.13671875, 23.4140625, 26.69140625, 29.96875, 33.24609375, 36.5234375, 39.80078125, 43.078125, 46.35546875, 49.6328125, 52.91015625, 56.1875, 59.46484375, 62.7421875, 66.01953125, 69.296875, 72.57421875, 75.8515625, 79.12890625, 82.40625, 85.68359375, 88.9609375, 92.23828125, 95.515625, 98.79296875, 102.0703125, 105.34765625, 108.625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 8.0, 10.0, 9.0, 8.0, 17.0, 11.0, 22.0, 27.0, 24.0, 24.0, 41.0, 51.0, 82.0, 121.0, 346.0, 1056.0, 5678.0, 55293.0, 549378.0, 396796.0, 34065.0, 3995.0, 774.0, 264.0, 136.0, 65.0, 49.0, 32.0, 37.0, 21.0, 23.0, 18.0, 19.0, 11.0, 9.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.546875, -20.849609375, -20.15234375, -19.455078125, -18.7578125, -18.060546875, -17.36328125, -16.666015625, -15.96875, -15.271484375, -14.57421875, -13.876953125, -13.1796875, -12.482421875, -11.78515625, -11.087890625, -10.390625, -9.693359375, -8.99609375, -8.298828125, -7.6015625, -6.904296875, -6.20703125, -5.509765625, -4.8125, -4.115234375, -3.41796875, -2.720703125, -2.0234375, -1.326171875, -0.62890625, 0.068359375, 0.765625, 1.462890625, 2.16015625, 2.857421875, 3.5546875, 4.251953125, 4.94921875, 5.646484375, 6.34375, 7.041015625, 7.73828125, 8.435546875, 9.1328125, 9.830078125, 10.52734375, 11.224609375, 11.921875, 12.619140625, 13.31640625, 14.013671875, 14.7109375, 15.408203125, 16.10546875, 16.802734375, 17.5, 18.197265625, 18.89453125, 19.591796875, 20.2890625, 20.986328125, 21.68359375, 22.380859375, 23.078125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 7.0, 9.0, 13.0, 32.0, 41.0, 67.0, 111.0, 151.0, 2196.0, 131.0, 103.0, 92.0, 48.0, 25.0, 14.0, 9.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-506.75, -492.4453125, -478.140625, -463.8359375, -449.53125, -435.2265625, -420.921875, -406.6171875, -392.3125, -378.0078125, -363.703125, -349.3984375, -335.09375, -320.7890625, -306.484375, -292.1796875, -277.875, -263.5703125, -249.265625, -234.9609375, -220.65625, -206.3515625, -192.046875, -177.7421875, -163.4375, -149.1328125, -134.828125, -120.5234375, -106.21875, -91.9140625, -77.609375, -63.3046875, -49.0, -34.6953125, -20.390625, -6.0859375, 8.21875, 22.5234375, 36.828125, 51.1328125, 65.4375, 79.7421875, 94.046875, 108.3515625, 122.65625, 136.9609375, 151.265625, 165.5703125, 179.875, 194.1796875, 208.484375, 222.7890625, 237.09375, 251.3984375, 265.703125, 280.0078125, 294.3125, 308.6171875, 322.921875, 337.2265625, 351.53125, 365.8359375, 380.140625, 394.4453125, 408.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 8.0, 13.0, 17.0, 23.0, 33.0, 62.0, 104.0, 171.0, 329.0, 715.0, 1838.0, 7016.0, 72542.0, 2832490.0, 211946.0, 13746.0, 2736.0, 894.0, 460.0, 231.0, 125.0, 72.0, 47.0, 22.0, 23.0, 7.0, 13.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.578125, -17.005126953125, -16.43212890625, -15.859130859375, -15.2861328125, -14.713134765625, -14.14013671875, -13.567138671875, -12.994140625, -12.421142578125, -11.84814453125, -11.275146484375, -10.7021484375, -10.129150390625, -9.55615234375, -8.983154296875, -8.41015625, -7.837158203125, -7.26416015625, -6.691162109375, -6.1181640625, -5.545166015625, -4.97216796875, -4.399169921875, -3.826171875, -3.253173828125, -2.68017578125, -2.107177734375, -1.5341796875, -0.961181640625, -0.38818359375, 0.184814453125, 0.7578125, 1.330810546875, 1.90380859375, 2.476806640625, 3.0498046875, 3.622802734375, 4.19580078125, 4.768798828125, 5.341796875, 5.914794921875, 6.48779296875, 7.060791015625, 7.6337890625, 8.206787109375, 8.77978515625, 9.352783203125, 9.92578125, 10.498779296875, 11.07177734375, 11.644775390625, 12.2177734375, 12.790771484375, 13.36376953125, 13.936767578125, 14.509765625, 15.082763671875, 15.65576171875, 16.228759765625, 16.8017578125, 17.374755859375, 17.94775390625, 18.520751953125, 19.09375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 9.0, 13.0, 16.0, 29.0, 49.0, 112.0, 180.0, 201.0, 172.0, 94.0, 33.0, 25.0, 16.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-496.2736511230469, -485.98358154296875, -475.6935119628906, -465.4034423828125, -455.1133728027344, -444.82330322265625, -434.5332336425781, -424.2431640625, -413.9530944824219, -403.66302490234375, -393.3729553222656, -383.0828857421875, -372.7928161621094, -362.50274658203125, -352.2126770019531, -341.922607421875, -331.6325378417969, -321.34246826171875, -311.0523986816406, -300.7623291015625, -290.4722595214844, -280.18218994140625, -269.8921203613281, -259.60205078125, -249.31198120117188, -239.02191162109375, -228.73184204101562, -218.4417724609375, -208.15170288085938, -197.86163330078125, -187.57156372070312, -177.281494140625, -166.9914093017578, -156.7013397216797, -146.41127014160156, -136.12120056152344, -125.83113098144531, -115.54106140136719, -105.25099182128906, -94.96092224121094, -84.67085266113281, -74.38078308105469, -64.09071350097656, -53.80064392089844, -43.51057434082031, -33.22050476074219, -22.930435180664062, -12.640365600585938, -2.3502960205078125, 7.9397735595703125, 18.229843139648438, 28.519912719726562, 38.80998229980469, 49.10005187988281, 59.39012145996094, 69.68019104003906, 79.97026062011719, 90.26033020019531, 100.55039978027344, 110.84046936035156, 121.13053894042969, 131.4206085205078, 141.71067810058594, 152.00074768066406, 162.2908172607422]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 0.0, 7.0, 4.0, 7.0, 5.0, 7.0, 13.0, 12.0, 12.0, 9.0, 15.0, 9.0, 17.0, 22.0, 19.0, 32.0, 17.0, 27.0, 28.0, 44.0, 36.0, 33.0, 43.0, 38.0, 27.0, 38.0, 42.0, 29.0, 42.0, 37.0, 23.0, 39.0, 31.0, 28.0, 27.0, 22.0, 18.0, 20.0, 12.0, 17.0, 9.0, 15.0, 11.0, 9.0, 5.0, 9.0, 7.0, 8.0, 7.0, 2.0, 4.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-246.9398193359375, -239.129638671875, -231.31944274902344, -223.50926208496094, -215.69906616210938, -207.88888549804688, -200.07870483398438, -192.26852416992188, -184.4583282470703, -176.6481475830078, -168.83795166015625, -161.02777099609375, -153.21759033203125, -145.4073944091797, -137.5972137451172, -129.78701782226562, -121.97683715820312, -114.1666488647461, -106.35646057128906, -98.54627990722656, -90.73609161376953, -82.9259033203125, -75.11572265625, -67.30553436279297, -59.49534606933594, -51.685157775878906, -43.87497329711914, -36.064788818359375, -28.254600524902344, -20.444412231445312, -12.634227752685547, -4.824043273925781, 2.98614501953125, 10.796331405639648, 18.606517791748047, 26.416704177856445, 34.226890563964844, 42.037078857421875, 49.84726333618164, 57.657447814941406, 65.46763610839844, 73.27782440185547, 81.0880126953125, 88.898193359375, 96.70838165283203, 104.51856994628906, 112.32875061035156, 120.1389389038086, 127.94912719726562, 135.75930786132812, 143.5695037841797, 151.3796844482422, 159.18988037109375, 167.00006103515625, 174.81024169921875, 182.62042236328125, 190.4306182861328, 198.2407989501953, 206.05099487304688, 213.86117553710938, 221.67135620117188, 229.48155212402344, 237.29173278808594, 245.1019287109375, 252.912109375]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 8.0, 7.0, 13.0, 13.0, 18.0, 25.0, 48.0, 68.0, 96.0, 118.0, 139.0, 220.0, 317.0, 407.0, 533.0, 712.0, 973.0, 1404.0, 1811.0, 2395.0, 3095.0, 4102.0, 1018202.0, 3453.0, 2704.0, 1941.0, 1566.0, 1155.0, 796.0, 605.0, 443.0, 315.0, 254.0, 165.0, 144.0, 84.0, 58.0, 43.0, 35.0, 19.0, 11.0, 11.0, 13.0, 7.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-29.696792602539062, -28.773496627807617, -27.850200653076172, -26.92690658569336, -26.003610610961914, -25.08031463623047, -24.157020568847656, -23.23372459411621, -22.310428619384766, -21.38713264465332, -20.463836669921875, -19.540542602539062, -18.617246627807617, -17.693950653076172, -16.77065658569336, -15.847360610961914, -14.924064636230469, -14.000768661499023, -13.077473640441895, -12.154178619384766, -11.23088264465332, -10.307586669921875, -9.384291648864746, -8.460996627807617, -7.537700653076172, -6.614405155181885, -5.691109657287598, -4.7678141593933105, -3.8445186614990234, -2.9212231636047363, -1.9979276657104492, -1.074632167816162, -0.1513347625732422, 0.7719607353210449, 1.695256233215332, 2.618551731109619, 3.5418472290039062, 4.465142726898193, 5.3884382247924805, 6.311733722686768, 7.235029220581055, 8.1583251953125, 9.081620216369629, 10.004915237426758, 10.928211212158203, 11.851507186889648, 12.774802207946777, 13.698097229003906, 14.621393203735352, 15.544689178466797, 16.46798324584961, 17.391279220581055, 18.3145751953125, 19.237871170043945, 20.16116714477539, 21.084461212158203, 22.00775718688965, 22.931053161621094, 23.854347229003906, 24.77764320373535, 25.700939178466797, 26.624235153198242, 27.547531127929688, 28.4708251953125, 29.394121170043945]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 9.0, 8.0, 19.0, 25.0, 32.0, 48.0, 96.0, 211.0, 883.0, 86618.0, 51373864.0, 1062.0, 187.0, 92.0, 38.0, 30.0, 13.0, 15.0, 13.0, 13.0, 3.0, 4.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-759.0606079101562, -733.8005981445312, -708.54052734375, -683.280517578125, -658.0205078125, -632.760498046875, -607.50048828125, -582.2404174804688, -556.9804077148438, -531.7203979492188, -506.4603576660156, -481.2003173828125, -455.9403076171875, -430.6802978515625, -405.4202575683594, -380.16021728515625, -354.90020751953125, -329.64019775390625, -304.3801574707031, -279.1201171875, -253.860107421875, -228.60008239746094, -203.34005737304688, -178.0800323486328, -152.82000732421875, -127.55998229980469, -102.29995727539062, -77.03993225097656, -51.7799072265625, -26.519882202148438, -1.259857177734375, 24.000167846679688, 49.26019287109375, 74.52021789550781, 99.78024291992188, 125.04026794433594, 150.30029296875, 175.56031799316406, 200.82034301757812, 226.0803680419922, 251.34039306640625, 276.60040283203125, 301.8604431152344, 327.1204833984375, 352.3804931640625, 377.6405029296875, 402.9005432128906, 428.16058349609375, 453.42059326171875, 478.68060302734375, 503.9406433105469, 529.20068359375, 554.460693359375, 579.720703125, 604.980712890625, 630.2407836914062, 655.5007934570312, 680.7608032226562, 706.0208740234375, 731.2808837890625, 756.5408935546875, 781.8009033203125, 807.0609130859375, 832.3209838867188, 857.5809936523438]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [6.0, 6.0, 5.0, 7.0, 18.0, 22.0, 35.0, 63.0, 79.0, 105.0, 141.0, 216.0, 272.0, 456.0, 610.0, 837.0, 1231.0, 1868.0, 2521.0, 3890.0, 5640.0, 8126.0, 11999.0, 18024.0, 26831.0, 39866.0, 59988.0, 94146.0, 151209.0, 250762.0, 478640.0, 4099761.0, 414703.0, 227114.0, 136192.0, 86722.0, 55941.0, 36412.0, 24592.0, 16589.0, 11200.0, 7565.0, 5188.0, 3672.0, 2520.0, 1756.0, 1226.0, 860.0, 562.0, 405.0, 257.0, 200.0, 140.0, 93.0, 35.0, 37.0, 24.0, 27.0, 14.0, 17.0, 4.0, 0.0, 3.0, 6.0], "bins": [-0.888671875, -0.8603744506835938, -0.8320770263671875, -0.8037796020507812, -0.775482177734375, -0.7471847534179688, -0.7188873291015625, -0.6905899047851562, -0.66229248046875, -0.6339950561523438, -0.6056976318359375, -0.5774002075195312, -0.549102783203125, -0.5208053588867188, -0.4925079345703125, -0.46421051025390625, -0.4359130859375, -0.40761566162109375, -0.3793182373046875, -0.35102081298828125, -0.322723388671875, -0.29442596435546875, -0.2661285400390625, -0.23783111572265625, -0.20953369140625, -0.18123626708984375, -0.1529388427734375, -0.12464141845703125, -0.096343994140625, -0.06804656982421875, -0.0397491455078125, -0.01145172119140625, 0.016845703125, 0.04514312744140625, 0.0734405517578125, 0.10173797607421875, 0.130035400390625, 0.15833282470703125, 0.1866302490234375, 0.21492767333984375, 0.24322509765625, 0.27152252197265625, 0.2998199462890625, 0.32811737060546875, 0.356414794921875, 0.38471221923828125, 0.4130096435546875, 0.44130706787109375, 0.4696044921875, 0.49790191650390625, 0.5261993408203125, 0.5544967651367188, 0.582794189453125, 0.6110916137695312, 0.6393890380859375, 0.6676864624023438, 0.69598388671875, 0.7242813110351562, 0.7525787353515625, 0.7808761596679688, 0.809173583984375, 0.8374710083007812, 0.8657684326171875, 0.8940658569335938, 0.92236328125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 2.0, 7.0, 3.0, 14.0, 14.0, 8.0, 14.0, 19.0, 17.0, 25.0, 19.0, 17.0, 26.0, 18.0, 27.0, 34.0, 36.0, 30.0, 37.0, 29.0, 38.0, 52.0, 1043.0, 32.0, 29.0, 38.0, 29.0, 23.0, 32.0, 38.0, 27.0, 31.0, 27.0, 25.0, 15.0, 22.0, 18.0, 19.0, 13.0, 8.0, 8.0, 9.0, 8.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0], "bins": [-39.1875, -38.01318359375, -36.8388671875, -35.66455078125, -34.490234375, -33.31591796875, -32.1416015625, -30.96728515625, -29.79296875, -28.61865234375, -27.4443359375, -26.27001953125, -25.095703125, -23.92138671875, -22.7470703125, -21.57275390625, -20.3984375, -19.22412109375, -18.0498046875, -16.87548828125, -15.701171875, -14.52685546875, -13.3525390625, -12.17822265625, -11.00390625, -9.82958984375, -8.6552734375, -7.48095703125, -6.306640625, -5.13232421875, -3.9580078125, -2.78369140625, -1.609375, -0.43505859375, 0.7392578125, 1.91357421875, 3.087890625, 4.26220703125, 5.4365234375, 6.61083984375, 7.78515625, 8.95947265625, 10.1337890625, 11.30810546875, 12.482421875, 13.65673828125, 14.8310546875, 16.00537109375, 17.1796875, 18.35400390625, 19.5283203125, 20.70263671875, 21.876953125, 23.05126953125, 24.2255859375, 25.39990234375, 26.57421875, 27.74853515625, 28.9228515625, 30.09716796875, 31.271484375, 32.44580078125, 33.6201171875, 34.79443359375, 35.96875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 9.0, 9.0, 18.0, 21.0, 35.0, 39.0, 77.0, 135.0, 217.0, 301.0, 467.0, 747.0, 1110.0, 1752.0, 2648.0, 4036.0, 6502.0, 10398.0, 16323.0, 25993.0, 41434.0, 66259.0, 109983.0, 195848.0, 404109.0, 4279443.0, 542423.0, 243177.0, 130033.0, 77718.0, 48321.0, 30000.0, 18883.0, 12031.0, 7460.0, 4878.0, 3094.0, 1883.0, 1316.0, 833.0, 516.0, 297.0, 230.0, 133.0, 92.0, 73.0, 54.0, 34.0, 20.0, 22.0, 1.0, 6.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.3291015625, -1.2884063720703125, -1.247711181640625, -1.2070159912109375, -1.16632080078125, -1.1256256103515625, -1.084930419921875, -1.0442352294921875, -1.0035400390625, -0.9628448486328125, -0.922149658203125, -0.8814544677734375, -0.84075927734375, -0.8000640869140625, -0.759368896484375, -0.7186737060546875, -0.677978515625, -0.6372833251953125, -0.596588134765625, -0.5558929443359375, -0.51519775390625, -0.4745025634765625, -0.433807373046875, -0.3931121826171875, -0.3524169921875, -0.3117218017578125, -0.271026611328125, -0.2303314208984375, -0.18963623046875, -0.1489410400390625, -0.108245849609375, -0.0675506591796875, -0.02685546875, 0.0138397216796875, 0.054534912109375, 0.0952301025390625, 0.13592529296875, 0.1766204833984375, 0.217315673828125, 0.2580108642578125, 0.2987060546875, 0.3394012451171875, 0.380096435546875, 0.4207916259765625, 0.46148681640625, 0.5021820068359375, 0.542877197265625, 0.5835723876953125, 0.624267578125, 0.6649627685546875, 0.705657958984375, 0.7463531494140625, 0.78704833984375, 0.8277435302734375, 0.868438720703125, 0.9091339111328125, 0.9498291015625, 0.9905242919921875, 1.031219482421875, 1.0719146728515625, 1.11260986328125, 1.1533050537109375, 1.194000244140625, 1.2346954345703125, 1.275390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 11.0, 17.0, 12.0, 21.0, 16.0, 25.0, 17.0, 26.0, 27.0, 40.0, 32.0, 43.0, 62.0, 46.0, 44.0, 1059.0, 50.0, 47.0, 49.0, 48.0, 41.0, 40.0, 29.0, 27.0, 25.0, 32.0, 16.0, 19.0, 20.0, 11.0, 11.0, 7.0, 5.0, 6.0, 5.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.5, -65.435546875, -63.37109375, -61.306640625, -59.2421875, -57.177734375, -55.11328125, -53.048828125, -50.984375, -48.919921875, -46.85546875, -44.791015625, -42.7265625, -40.662109375, -38.59765625, -36.533203125, -34.46875, -32.404296875, -30.33984375, -28.275390625, -26.2109375, -24.146484375, -22.08203125, -20.017578125, -17.953125, -15.888671875, -13.82421875, -11.759765625, -9.6953125, -7.630859375, -5.56640625, -3.501953125, -1.4375, 0.626953125, 2.69140625, 4.755859375, 6.8203125, 8.884765625, 10.94921875, 13.013671875, 15.078125, 17.142578125, 19.20703125, 21.271484375, 23.3359375, 25.400390625, 27.46484375, 29.529296875, 31.59375, 33.658203125, 35.72265625, 37.787109375, 39.8515625, 41.916015625, 43.98046875, 46.044921875, 48.109375, 50.173828125, 52.23828125, 54.302734375, 56.3671875, 58.431640625, 60.49609375, 62.560546875, 64.625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 6.0, 3.0, 15.0, 24.0, 18.0, 16.0, 46.0, 42.0, 57.0, 81.0, 96.0, 175.0, 237.0, 260.0, 392.0, 553.0, 751.0, 1244.0, 1949.0, 3100.0, 4717.0, 7686.0, 13151.0, 25295.0, 59100.0, 305384.0, 5601290.0, 169957.0, 46109.0, 20584.0, 11055.0, 6524.0, 3939.0, 2417.0, 1619.0, 1020.0, 734.0, 409.0, 374.0, 268.0, 187.0, 111.0, 108.0, 89.0, 65.0, 31.0, 35.0, 55.0, 12.0, 14.0, 12.0, 9.0, 10.0, 9.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.275390625, -3.170989990234375, -3.06658935546875, -2.962188720703125, -2.8577880859375, -2.753387451171875, -2.64898681640625, -2.544586181640625, -2.440185546875, -2.335784912109375, -2.23138427734375, -2.126983642578125, -2.0225830078125, -1.918182373046875, -1.81378173828125, -1.709381103515625, -1.60498046875, -1.500579833984375, -1.39617919921875, -1.291778564453125, -1.1873779296875, -1.082977294921875, -0.97857666015625, -0.874176025390625, -0.769775390625, -0.665374755859375, -0.56097412109375, -0.456573486328125, -0.3521728515625, -0.247772216796875, -0.14337158203125, -0.038970947265625, 0.0654296875, 0.169830322265625, 0.27423095703125, 0.378631591796875, 0.4830322265625, 0.587432861328125, 0.69183349609375, 0.796234130859375, 0.900634765625, 1.005035400390625, 1.10943603515625, 1.213836669921875, 1.3182373046875, 1.422637939453125, 1.52703857421875, 1.631439208984375, 1.73583984375, 1.840240478515625, 1.94464111328125, 2.049041748046875, 2.1534423828125, 2.257843017578125, 2.36224365234375, 2.466644287109375, 2.571044921875, 2.675445556640625, 2.77984619140625, 2.884246826171875, 2.9886474609375, 3.093048095703125, 3.19744873046875, 3.301849365234375, 3.40625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 9.0, 10.0, 12.0, 8.0, 21.0, 18.0, 17.0, 18.0, 12.0, 26.0, 29.0, 37.0, 28.0, 32.0, 32.0, 42.0, 42.0, 35.0, 54.0, 44.0, 1052.0, 28.0, 44.0, 31.0, 57.0, 35.0, 31.0, 26.0, 24.0, 25.0, 20.0, 24.0, 17.0, 15.0, 11.0, 10.0, 12.0, 9.0, 5.0, 3.0, 1.0, 3.0, 8.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.46875, -59.36376953125, -57.2587890625, -55.15380859375, -53.048828125, -50.94384765625, -48.8388671875, -46.73388671875, -44.62890625, -42.52392578125, -40.4189453125, -38.31396484375, -36.208984375, -34.10400390625, -31.9990234375, -29.89404296875, -27.7890625, -25.68408203125, -23.5791015625, -21.47412109375, -19.369140625, -17.26416015625, -15.1591796875, -13.05419921875, -10.94921875, -8.84423828125, -6.7392578125, -4.63427734375, -2.529296875, -0.42431640625, 1.6806640625, 3.78564453125, 5.890625, 7.99560546875, 10.1005859375, 12.20556640625, 14.310546875, 16.41552734375, 18.5205078125, 20.62548828125, 22.73046875, 24.83544921875, 26.9404296875, 29.04541015625, 31.150390625, 33.25537109375, 35.3603515625, 37.46533203125, 39.5703125, 41.67529296875, 43.7802734375, 45.88525390625, 47.990234375, 50.09521484375, 52.2001953125, 54.30517578125, 56.41015625, 58.51513671875, 60.6201171875, 62.72509765625, 64.830078125, 66.93505859375, 69.0400390625, 71.14501953125, 73.25]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 11.0, 9.0, 13.0, 16.0, 14.0, 29.0, 46.0, 240.0, 419.0, 51.0, 26.0, 29.0, 19.0, 15.0, 8.0, 10.0, 6.0, 3.0, 9.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-326.4184875488281, -309.28857421875, -292.1586608886719, -275.02874755859375, -257.8988037109375, -240.76889038085938, -223.63897705078125, -206.50906372070312, -189.37913513183594, -172.2492218017578, -155.11929321289062, -137.9893798828125, -120.85945892333984, -103.72953796386719, -86.59962463378906, -69.4697036743164, -52.33978271484375, -35.209861755371094, -18.079944610595703, -0.9500274658203125, 16.179893493652344, 33.309814453125, 50.439727783203125, 67.56964874267578, 84.69956970214844, 101.8294906616211, 118.95941162109375, 136.08932495117188, 153.21923828125, 170.3491668701172, 187.4790802001953, 204.6090087890625, 221.7388916015625, 238.86880493164062, 255.9987335205078, 273.128662109375, 290.2585754394531, 307.38848876953125, 324.5184020996094, 341.6483154296875, 358.77825927734375, 375.9081726074219, 393.0380859375, 410.16802978515625, 427.2979431152344, 444.4278564453125, 461.5577697753906, 478.68768310546875, 495.8175964355469, 512.947509765625, 530.0774536132812, 547.2073364257812, 564.3372802734375, 581.4671630859375, 598.5971069335938, 615.72705078125, 632.85693359375, 649.9868774414062, 667.1167602539062, 684.2467041015625, 701.3765869140625, 718.5065307617188, 735.636474609375, 752.766357421875, 769.8963012695312]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 2.0, 8.0, 7.0, 8.0, 16.0, 16.0, 21.0, 16.0, 16.0, 17.0, 27.0, 22.0, 20.0, 30.0, 33.0, 23.0, 38.0, 44.0, 49.0, 41.0, 41.0, 39.0, 30.0, 37.0, 32.0, 35.0, 42.0, 37.0, 38.0, 26.0, 23.0, 31.0, 23.0, 21.0, 18.0, 17.0, 10.0, 10.0, 8.0, 5.0, 3.0, 8.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-238.36233520507812, -231.1828155517578, -224.0032958984375, -216.82379150390625, -209.64427185058594, -202.46475219726562, -195.28524780273438, -188.10572814941406, -180.92620849609375, -173.74668884277344, -166.56716918945312, -159.38766479492188, -152.20814514160156, -145.02862548828125, -137.84912109375, -130.6696014404297, -123.49008178710938, -116.31056213378906, -109.13105010986328, -101.9515380859375, -94.77201843261719, -87.59249877929688, -80.4129867553711, -73.23347473144531, -66.053955078125, -58.87443923950195, -51.694923400878906, -44.51540756225586, -37.33589172363281, -30.156375885009766, -22.97686004638672, -15.797344207763672, -8.617843627929688, -1.4383277893066406, 5.741188049316406, 12.920703887939453, 20.1002197265625, 27.279735565185547, 34.459251403808594, 41.63876724243164, 48.81828308105469, 55.997798919677734, 63.17731475830078, 70.35682678222656, 77.53634643554688, 84.71586608886719, 91.89537811279297, 99.07489013671875, 106.25440979003906, 113.43392944335938, 120.61344146728516, 127.79295349121094, 134.97247314453125, 142.15199279785156, 149.33151245117188, 156.51101684570312, 163.69053649902344, 170.87005615234375, 178.049560546875, 185.2290802001953, 192.40859985351562, 199.58811950683594, 206.76763916015625, 213.9471435546875, 221.1266632080078]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 7.0, 10.0, 16.0, 16.0, 21.0, 49.0, 58.0, 79.0, 143.0, 145.0, 201.0, 278.0, 364.0, 454.0, 505.0, 574.0, 676.0, 844.0, 1070.0, 1258.0, 1837.0, 3050.0, 4103.0, 7972.0, 4129380.0, 11858.0, 6935.0, 4431.0, 3256.0, 2545.0, 2005.0, 1730.0, 1458.0, 1266.0, 1053.0, 882.0, 712.0, 541.0, 479.0, 363.0, 306.0, 236.0, 222.0, 180.0, 143.0, 143.0, 113.0, 74.0, 59.0, 58.0, 35.0, 29.0, 18.0, 21.0, 11.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0], "bins": [-1.5078125, -1.4535980224609375, -1.399383544921875, -1.3451690673828125, -1.29095458984375, -1.2367401123046875, -1.182525634765625, -1.1283111572265625, -1.0740966796875, -1.0198822021484375, -0.965667724609375, -0.9114532470703125, -0.85723876953125, -0.8030242919921875, -0.748809814453125, -0.6945953369140625, -0.640380859375, -0.5861663818359375, -0.531951904296875, -0.4777374267578125, -0.42352294921875, -0.3693084716796875, -0.315093994140625, -0.2608795166015625, -0.2066650390625, -0.1524505615234375, -0.098236083984375, -0.0440216064453125, 0.01019287109375, 0.0644073486328125, 0.118621826171875, 0.1728363037109375, 0.22705078125, 0.2812652587890625, 0.335479736328125, 0.3896942138671875, 0.44390869140625, 0.4981231689453125, 0.552337646484375, 0.6065521240234375, 0.6607666015625, 0.7149810791015625, 0.769195556640625, 0.8234100341796875, 0.87762451171875, 0.9318389892578125, 0.986053466796875, 1.0402679443359375, 1.094482421875, 1.1486968994140625, 1.202911376953125, 1.2571258544921875, 1.31134033203125, 1.3655548095703125, 1.419769287109375, 1.4739837646484375, 1.5281982421875, 1.5824127197265625, 1.636627197265625, 1.6908416748046875, 1.74505615234375, 1.7992706298828125, 1.853485107421875, 1.9076995849609375, 1.9619140625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 8.0, 10.0, 7.0, 14.0, 50.0, 760.0, 20.0, 15.0, 15.0, 10.0, 5.0, 9.0, 4.0, 7.0, 5.0, 2.0, 5.0, 6.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0791015625, -0.07625770568847656, -0.07341384887695312, -0.07056999206542969, -0.06772613525390625, -0.06488227844238281, -0.062038421630859375, -0.05919456481933594, -0.0563507080078125, -0.05350685119628906, -0.050662994384765625, -0.04781913757324219, -0.04497528076171875, -0.04213142395019531, -0.039287567138671875, -0.03644371032714844, -0.033599853515625, -0.030755996704101562, -0.027912139892578125, -0.025068283081054688, -0.02222442626953125, -0.019380569458007812, -0.016536712646484375, -0.013692855834960938, -0.0108489990234375, -0.008005142211914062, -0.005161285400390625, -0.0023174285888671875, 0.00052642822265625, 0.0033702850341796875, 0.006214141845703125, 0.009057998657226562, 0.01190185546875, 0.014745712280273438, 0.017589569091796875, 0.020433425903320312, 0.02327728271484375, 0.026121139526367188, 0.028964996337890625, 0.03180885314941406, 0.0346527099609375, 0.03749656677246094, 0.040340423583984375, 0.04318428039550781, 0.04602813720703125, 0.04887199401855469, 0.051715850830078125, 0.05455970764160156, 0.057403564453125, 0.06024742126464844, 0.06309127807617188, 0.06593513488769531, 0.06877899169921875, 0.07162284851074219, 0.07446670532226562, 0.07731056213378906, 0.0801544189453125, 0.08299827575683594, 0.08584213256835938, 0.08868598937988281, 0.09152984619140625, 0.09437370300292969, 0.09721755981445312, 0.10006141662597656, 0.1029052734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 12.0, 7.0, 9.0, 12.0, 10.0, 21.0, 27.0, 51.0, 84.0, 98.0, 161.0, 262.0, 493.0, 832.0, 1525.0, 2884.0, 5775.0, 13045.0, 49897.0, 4072225.0, 26754.0, 9878.0, 4643.0, 2417.0, 1252.0, 749.0, 444.0, 231.0, 165.0, 107.0, 80.0, 30.0, 25.0, 22.0, 10.0, 15.0, 3.0, 9.0, 10.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.1083221435546875, -1.075042724609375, -1.0417633056640625, -1.00848388671875, -0.9752044677734375, -0.941925048828125, -0.9086456298828125, -0.8753662109375, -0.8420867919921875, -0.808807373046875, -0.7755279541015625, -0.74224853515625, -0.7089691162109375, -0.675689697265625, -0.6424102783203125, -0.609130859375, -0.5758514404296875, -0.542572021484375, -0.5092926025390625, -0.47601318359375, -0.4427337646484375, -0.409454345703125, -0.3761749267578125, -0.3428955078125, -0.3096160888671875, -0.276336669921875, -0.2430572509765625, -0.20977783203125, -0.1764984130859375, -0.143218994140625, -0.1099395751953125, -0.07666015625, -0.0433807373046875, -0.010101318359375, 0.0231781005859375, 0.05645751953125, 0.0897369384765625, 0.123016357421875, 0.1562957763671875, 0.1895751953125, 0.2228546142578125, 0.256134033203125, 0.2894134521484375, 0.32269287109375, 0.3559722900390625, 0.389251708984375, 0.4225311279296875, 0.455810546875, 0.4890899658203125, 0.522369384765625, 0.5556488037109375, 0.58892822265625, 0.6222076416015625, 0.655487060546875, 0.6887664794921875, 0.7220458984375, 0.7553253173828125, 0.788604736328125, 0.8218841552734375, 0.85516357421875, 0.8884429931640625, 0.921722412109375, 0.9550018310546875, 0.98828125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 3.0, 6.0, 6.0, 9.0, 1.0, 13.0, 16.0, 9.0, 19.0, 14.0, 29.0, 3725.0, 78.0, 25.0, 19.0, 14.0, 19.0, 8.0, 16.0, 9.0, 11.0, 8.0, 4.0, 1.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.235107421875, -0.22481536865234375, -0.2145233154296875, -0.20423126220703125, -0.193939208984375, -0.18364715576171875, -0.1733551025390625, -0.16306304931640625, -0.15277099609375, -0.14247894287109375, -0.1321868896484375, -0.12189483642578125, -0.111602783203125, -0.10131072998046875, -0.0910186767578125, -0.08072662353515625, -0.0704345703125, -0.06014251708984375, -0.0498504638671875, -0.03955841064453125, -0.029266357421875, -0.01897430419921875, -0.0086822509765625, 0.00160980224609375, 0.01190185546875, 0.02219390869140625, 0.0324859619140625, 0.04277801513671875, 0.053070068359375, 0.06336212158203125, 0.0736541748046875, 0.08394622802734375, 0.09423828125, 0.10453033447265625, 0.1148223876953125, 0.12511444091796875, 0.135406494140625, 0.14569854736328125, 0.1559906005859375, 0.16628265380859375, 0.17657470703125, 0.18686676025390625, 0.1971588134765625, 0.20745086669921875, 0.217742919921875, 0.22803497314453125, 0.2383270263671875, 0.24861907958984375, 0.2589111328125, 0.26920318603515625, 0.2794952392578125, 0.28978729248046875, 0.300079345703125, 0.31037139892578125, 0.3206634521484375, 0.33095550537109375, 0.34124755859375, 0.35153961181640625, 0.3618316650390625, 0.37212371826171875, 0.382415771484375, 0.39270782470703125, 0.4029998779296875, 0.41329193115234375, 0.423583984375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 3.0, 14.0, 59.0, 639.0, 195.0, 55.0, 20.0, 13.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3403024673461914, -0.2676445245742798, -0.19498655200004578, -0.12232859432697296, -0.049670636653900146, 0.022987306118011475, 0.09564527869224548, 0.1683032512664795, 0.2409611940383911, 0.31361913681030273, 0.38627710938453674, 0.45893508195877075, 0.5315930247306824, 0.604250967502594, 0.6769089698791504, 0.749566912651062, 0.8222248554229736, 0.8948827981948853, 0.9675407409667969, 1.0401986837387085, 1.1128566265106201, 1.1855146884918213, 1.258172631263733, 1.3308305740356445, 1.4034885168075562, 1.4761464595794678, 1.5488044023513794, 1.621462345123291, 1.6941204071044922, 1.7667782306671143, 1.8394362926483154, 1.912094235420227, 1.9847521781921387, 2.05741024017334, 2.130068063735962, 2.202726125717163, 2.275383949279785, 2.3480420112609863, 2.4206998348236084, 2.4933578968048096, 2.5660157203674316, 2.638673782348633, 2.711331605911255, 2.783989667892456, 2.856647491455078, 2.9293055534362793, 3.0019633769989014, 3.0746214389801025, 3.1472795009613037, 3.219937562942505, 3.292595386505127, 3.365253448486328, 3.43791127204895, 3.5105693340301514, 3.5832271575927734, 3.6558852195739746, 3.728543281555176, 3.801201343536377, 3.873859167098999, 3.9465172290802, 4.019175052642822, 4.091833114624023, 4.164491176605225, 4.237149238586426, 4.309806823730469]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 7.0, 5.0, 10.0, 11.0, 14.0, 11.0, 15.0, 27.0, 42.0, 64.0, 74.0, 89.0, 103.0, 110.0, 102.0, 79.0, 68.0, 33.0, 33.0, 27.0, 15.0, 7.0, 11.0, 6.0, 4.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9741743206977844, -0.941252589225769, -0.9083309173583984, -0.8754091858863831, -0.8424875140190125, -0.8095657825469971, -0.7766441106796265, -0.7437223792076111, -0.7108006477355957, -0.6778789162635803, -0.6449572443962097, -0.6120355129241943, -0.5791138410568237, -0.5461921095848083, -0.513270378112793, -0.48034870624542236, -0.44742703437805176, -0.41450533270835876, -0.38158363103866577, -0.3486618995666504, -0.3157402276992798, -0.2828184962272644, -0.2498967945575714, -0.21697509288787842, -0.18405339121818542, -0.15113168954849243, -0.11820998042821884, -0.08528827130794525, -0.05236656963825226, -0.019444867968559265, 0.013476848602294922, 0.046398550271987915, 0.07932019233703613, 0.11224189400672913, 0.14516359567642212, 0.1780853122472763, 0.2110070139169693, 0.2439287155866623, 0.2768504321575165, 0.3097721338272095, 0.34269383549690247, 0.37561553716659546, 0.40853723883628845, 0.44145894050598145, 0.4743806719779968, 0.5073023438453674, 0.5402240753173828, 0.5731457471847534, 0.6060674786567688, 0.6389892101287842, 0.6719108819961548, 0.7048326134681702, 0.7377542853355408, 0.7706760168075562, 0.8035976886749268, 0.8365194201469421, 0.8694411516189575, 0.9023628830909729, 0.9352845549583435, 0.9682062864303589, 1.0011279582977295, 1.0340496301651, 1.0669714212417603, 1.0998930931091309, 1.1328147649765015]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 15.0, 22.0, 25.0, 38.0, 49.0, 70.0, 99.0, 118.0, 165.0, 228.0, 323.0, 469.0, 609.0, 899.0, 1269.0, 1716.0, 2618.0, 3977.0, 6209.0, 10890.0, 24140.0, 867617.0, 87720.0, 15249.0, 8173.0, 4932.0, 3286.0, 2200.0, 1511.0, 1095.0, 747.0, 563.0, 387.0, 298.0, 220.0, 158.0, 121.0, 85.0, 59.0, 43.0, 36.0, 25.0, 17.0, 18.0, 13.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.52734375, -0.5112380981445312, -0.4951324462890625, -0.47902679443359375, -0.462921142578125, -0.44681549072265625, -0.4307098388671875, -0.41460418701171875, -0.39849853515625, -0.38239288330078125, -0.3662872314453125, -0.35018157958984375, -0.334075927734375, -0.31797027587890625, -0.3018646240234375, -0.28575897216796875, -0.2696533203125, -0.25354766845703125, -0.2374420166015625, -0.22133636474609375, -0.205230712890625, -0.18912506103515625, -0.1730194091796875, -0.15691375732421875, -0.14080810546875, -0.12470245361328125, -0.1085968017578125, -0.09249114990234375, -0.076385498046875, -0.06027984619140625, -0.0441741943359375, -0.02806854248046875, -0.011962890625, 0.00414276123046875, 0.0202484130859375, 0.03635406494140625, 0.052459716796875, 0.06856536865234375, 0.0846710205078125, 0.10077667236328125, 0.11688232421875, 0.13298797607421875, 0.1490936279296875, 0.16519927978515625, 0.181304931640625, 0.19741058349609375, 0.2135162353515625, 0.22962188720703125, 0.2457275390625, 0.26183319091796875, 0.2779388427734375, 0.29404449462890625, 0.310150146484375, 0.32625579833984375, 0.3423614501953125, 0.35846710205078125, 0.37457275390625, 0.39067840576171875, 0.4067840576171875, 0.42288970947265625, 0.438995361328125, 0.45510101318359375, 0.4712066650390625, 0.48731231689453125, 0.50341796875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0, 4.0, 5.0, 12.0, 7.0, 9.0, 13.0, 700.0, 115.0, 14.0, 18.0, 11.0, 9.0, 5.0, 7.0, 6.0, 6.0, 5.0, 2.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07440185546875, -0.07169723510742188, -0.06899261474609375, -0.06628799438476562, -0.0635833740234375, -0.060878753662109375, -0.05817413330078125, -0.055469512939453125, -0.052764892578125, -0.050060272216796875, -0.04735565185546875, -0.044651031494140625, -0.0419464111328125, -0.039241790771484375, -0.03653717041015625, -0.033832550048828125, -0.0311279296875, -0.028423309326171875, -0.02571868896484375, -0.023014068603515625, -0.0203094482421875, -0.017604827880859375, -0.01490020751953125, -0.012195587158203125, -0.009490966796875, -0.006786346435546875, -0.00408172607421875, -0.001377105712890625, 0.0013275146484375, 0.004032135009765625, 0.00673675537109375, 0.009441375732421875, 0.01214599609375, 0.014850616455078125, 0.01755523681640625, 0.020259857177734375, 0.0229644775390625, 0.025669097900390625, 0.02837371826171875, 0.031078338623046875, 0.033782958984375, 0.036487579345703125, 0.03919219970703125, 0.041896820068359375, 0.0446014404296875, 0.047306060791015625, 0.05001068115234375, 0.052715301513671875, 0.055419921875, 0.058124542236328125, 0.06082916259765625, 0.06353378295898438, 0.0662384033203125, 0.06894302368164062, 0.07164764404296875, 0.07435226440429688, 0.077056884765625, 0.07976150512695312, 0.08246612548828125, 0.08517074584960938, 0.0878753662109375, 0.09057998657226562, 0.09328460693359375, 0.09598922729492188, 0.09869384765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 16.0, 14.0, 22.0, 27.0, 49.0, 66.0, 82.0, 123.0, 202.0, 269.0, 459.0, 634.0, 1087.0, 1671.0, 2749.0, 4530.0, 7631.0, 13334.0, 24206.0, 47383.0, 135774.0, 602937.0, 110295.0, 42533.0, 21833.0, 12381.0, 7103.0, 4215.0, 2483.0, 1563.0, 984.0, 628.0, 409.0, 252.0, 173.0, 132.0, 74.0, 62.0, 38.0, 37.0, 19.0, 23.0, 7.0, 16.0, 7.0, 7.0, 3.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.32568359375, -0.3146171569824219, -0.30355072021484375, -0.2924842834472656, -0.2814178466796875, -0.2703514099121094, -0.25928497314453125, -0.24821853637695312, -0.237152099609375, -0.22608566284179688, -0.21501922607421875, -0.20395278930664062, -0.1928863525390625, -0.18181991577148438, -0.17075347900390625, -0.15968704223632812, -0.14862060546875, -0.13755416870117188, -0.12648773193359375, -0.11542129516601562, -0.1043548583984375, -0.09328842163085938, -0.08222198486328125, -0.07115554809570312, -0.060089111328125, -0.049022674560546875, -0.03795623779296875, -0.026889801025390625, -0.0158233642578125, -0.004756927490234375, 0.00630950927734375, 0.017375946044921875, 0.0284423828125, 0.039508819580078125, 0.05057525634765625, 0.061641693115234375, 0.0727081298828125, 0.08377456665039062, 0.09484100341796875, 0.10590744018554688, 0.116973876953125, 0.12804031372070312, 0.13910675048828125, 0.15017318725585938, 0.1612396240234375, 0.17230606079101562, 0.18337249755859375, 0.19443893432617188, 0.20550537109375, 0.21657180786132812, 0.22763824462890625, 0.23870468139648438, 0.2497711181640625, 0.2608375549316406, 0.27190399169921875, 0.2829704284667969, 0.294036865234375, 0.3051033020019531, 0.31616973876953125, 0.3272361755371094, 0.3383026123046875, 0.3493690490722656, 0.36043548583984375, 0.3715019226074219, 0.382568359375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 1.0, 9.0, 4.0, 9.0, 13.0, 10.0, 14.0, 21.0, 14.0, 21.0, 22.0, 24.0, 26.0, 33.0, 29.0, 39.0, 52.0, 30.0, 38.0, 35.0, 41.0, 40.0, 30.0, 36.0, 47.0, 35.0, 35.0, 25.0, 35.0, 28.0, 29.0, 29.0, 15.0, 25.0, 18.0, 21.0, 10.0, 9.0, 12.0, 8.0, 5.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.377685546875, -0.3667564392089844, -0.35582733154296875, -0.3448982238769531, -0.3339691162109375, -0.3230400085449219, -0.31211090087890625, -0.3011817932128906, -0.290252685546875, -0.2793235778808594, -0.26839447021484375, -0.2574653625488281, -0.2465362548828125, -0.23560714721679688, -0.22467803955078125, -0.21374893188476562, -0.20281982421875, -0.19189071655273438, -0.18096160888671875, -0.17003250122070312, -0.1591033935546875, -0.14817428588867188, -0.13724517822265625, -0.12631607055664062, -0.115386962890625, -0.10445785522460938, -0.09352874755859375, -0.08259963989257812, -0.0716705322265625, -0.060741424560546875, -0.04981231689453125, -0.038883209228515625, -0.0279541015625, -0.017024993896484375, -0.00609588623046875, 0.004833221435546875, 0.0157623291015625, 0.026691436767578125, 0.03762054443359375, 0.048549652099609375, 0.059478759765625, 0.07040786743164062, 0.08133697509765625, 0.09226608276367188, 0.1031951904296875, 0.11412429809570312, 0.12505340576171875, 0.13598251342773438, 0.14691162109375, 0.15784072875976562, 0.16876983642578125, 0.17969894409179688, 0.1906280517578125, 0.20155715942382812, 0.21248626708984375, 0.22341537475585938, 0.234344482421875, 0.24527359008789062, 0.25620269775390625, 0.2671318054199219, 0.2780609130859375, 0.2889900207519531, 0.29991912841796875, 0.3108482360839844, 0.32177734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 18.0, 24.0, 46.0, 94.0, 137.0, 418.0, 1956.0, 70982.0, 967608.0, 6070.0, 695.0, 246.0, 127.0, 59.0, 24.0, 14.0, 8.0, 9.0, 6.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032787322998046875, -0.003192901611328125, -0.0031070709228515625, -0.003021240234375, -0.0029354095458984375, -0.002849578857421875, -0.0027637481689453125, -0.00267791748046875, -0.0025920867919921875, -0.002506256103515625, -0.0024204254150390625, -0.0023345947265625, -0.0022487640380859375, -0.002162933349609375, -0.0020771026611328125, -0.00199127197265625, -0.0019054412841796875, -0.001819610595703125, -0.0017337799072265625, -0.00164794921875, -0.0015621185302734375, -0.001476287841796875, -0.0013904571533203125, -0.00130462646484375, -0.0012187957763671875, -0.001132965087890625, -0.0010471343994140625, -0.0009613037109375, -0.0008754730224609375, -0.000789642333984375, -0.0007038116455078125, -0.00061798095703125, -0.0005321502685546875, -0.000446319580078125, -0.0003604888916015625, -0.000274658203125, -0.0001888275146484375, -0.000102996826171875, -1.71661376953125e-05, 6.866455078125e-05, 0.0001544952392578125, 0.000240325927734375, 0.0003261566162109375, 0.0004119873046875, 0.0004978179931640625, 0.000583648681640625, 0.0006694793701171875, 0.00075531005859375, 0.0008411407470703125, 0.000926971435546875, 0.0010128021240234375, 0.0010986328125, 0.0011844635009765625, 0.001270294189453125, 0.0013561248779296875, 0.00144195556640625, 0.0015277862548828125, 0.001613616943359375, 0.0016994476318359375, 0.0017852783203125, 0.0018711090087890625, 0.001956939697265625, 0.0020427703857421875, 0.00212860107421875, 0.0022144317626953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 14.0, 12.0, 23.0, 26.0, 44.0, 76.0, 185.0, 274.0, 154.0, 73.0, 37.0, 31.0, 16.0, 9.0, 10.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006814002990722656, -0.0006631985306739807, -0.0006449967622756958, -0.0006267949938774109, -0.000608593225479126, -0.0005903914570808411, -0.0005721896886825562, -0.0005539879202842712, -0.0005357861518859863, -0.0005175843834877014, -0.0004993826150894165, -0.0004811808466911316, -0.0004629790782928467, -0.00044477730989456177, -0.00042657554149627686, -0.00040837377309799194, -0.00039017200469970703, -0.0003719702363014221, -0.0003537684679031372, -0.0003355666995048523, -0.0003173649311065674, -0.00029916316270828247, -0.00028096139430999756, -0.00026275962591171265, -0.00024455785751342773, -0.00022635608911514282, -0.0002081543207168579, -0.000189952552318573, -0.00017175078392028809, -0.00015354901552200317, -0.00013534724712371826, -0.00011714547872543335, -9.894371032714844e-05, -8.074194192886353e-05, -6.254017353057861e-05, -4.43384051322937e-05, -2.613663673400879e-05, -7.934868335723877e-06, 1.0266900062561035e-05, 2.8468668460845947e-05, 4.667043685913086e-05, 6.487220525741577e-05, 8.307397365570068e-05, 0.0001012757420539856, 0.00011947751045227051, 0.00013767927885055542, 0.00015588104724884033, 0.00017408281564712524, 0.00019228458404541016, 0.00021048635244369507, 0.00022868812084197998, 0.0002468898892402649, 0.0002650916576385498, 0.0002832934260368347, 0.00030149519443511963, 0.00031969696283340454, 0.00033789873123168945, 0.00035610049962997437, 0.0003743022680282593, 0.0003925040364265442, 0.0004107058048248291, 0.000428907573223114, 0.0004471093416213989, 0.00046531111001968384, 0.00048351287841796875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 9.0, 14.0, 11.0, 27.0, 24.0, 40.0, 58.0, 86.0, 99.0, 173.0, 258.0, 421.0, 655.0, 1067.0, 1795.0, 3222.0, 6617.0, 14964.0, 45895.0, 739457.0, 179243.0, 31226.0, 11254.0, 5193.0, 2687.0, 1518.0, 869.0, 549.0, 350.0, 235.0, 168.0, 107.0, 78.0, 56.0, 31.0, 33.0, 10.0, 14.0, 10.0, 4.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004382133483886719, -0.0004230216145515442, -0.0004078298807144165, -0.0003926381468772888, -0.00037744641304016113, -0.00036225467920303345, -0.00034706294536590576, -0.0003318712115287781, -0.0003166794776916504, -0.0003014877438545227, -0.000286296010017395, -0.00027110427618026733, -0.00025591254234313965, -0.00024072080850601196, -0.00022552907466888428, -0.0002103373408317566, -0.0001951456069946289, -0.00017995387315750122, -0.00016476213932037354, -0.00014957040548324585, -0.00013437867164611816, -0.00011918693780899048, -0.00010399520397186279, -8.880347013473511e-05, -7.361173629760742e-05, -5.8420002460479736e-05, -4.322826862335205e-05, -2.8036534786224365e-05, -1.284480094909668e-05, 2.346932888031006e-06, 1.753866672515869e-05, 3.273040056228638e-05, 4.792213439941406e-05, 6.311386823654175e-05, 7.830560207366943e-05, 9.349733591079712e-05, 0.0001086890697479248, 0.0001238808035850525, 0.00013907253742218018, 0.00015426427125930786, 0.00016945600509643555, 0.00018464773893356323, 0.00019983947277069092, 0.0002150312066078186, 0.0002302229404449463, 0.000245414674282074, 0.00026060640811920166, 0.00027579814195632935, 0.00029098987579345703, 0.0003061816096305847, 0.0003213733434677124, 0.0003365650773048401, 0.0003517568111419678, 0.00036694854497909546, 0.00038214027881622314, 0.00039733201265335083, 0.0004125237464904785, 0.0004277154803276062, 0.0004429072141647339, 0.00045809894800186157, 0.00047329068183898926, 0.0004884824156761169, 0.0005036741495132446, 0.0005188658833503723, 0.0005340576171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 5.0, 10.0, 5.0, 11.0, 19.0, 17.0, 36.0, 27.0, 43.0, 51.0, 68.0, 119.0, 189.0, 86.0, 68.0, 52.0, 41.0, 30.0, 21.0, 15.0, 23.0, 7.0, 8.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0005273818969726562, -0.0005123801529407501, -0.000497378408908844, -0.00048237666487693787, -0.00046737492084503174, -0.0004523731768131256, -0.0004373714327812195, -0.00042236968874931335, -0.0004073679447174072, -0.0003923662006855011, -0.00037736445665359497, -0.00036236271262168884, -0.0003473609685897827, -0.0003323592245578766, -0.00031735748052597046, -0.00030235573649406433, -0.0002873539924621582, -0.0002723522484302521, -0.00025735050439834595, -0.00024234876036643982, -0.0002273470163345337, -0.00021234527230262756, -0.00019734352827072144, -0.0001823417842388153, -0.00016734004020690918, -0.00015233829617500305, -0.00013733655214309692, -0.0001223348081111908, -0.00010733306407928467, -9.233132004737854e-05, -7.732957601547241e-05, -6.232783198356628e-05, -4.7326087951660156e-05, -3.232434391975403e-05, -1.73225998878479e-05, -2.3208558559417725e-06, 1.2680888175964355e-05, 2.7682632207870483e-05, 4.268437623977661e-05, 5.768612027168274e-05, 7.268786430358887e-05, 8.7689608335495e-05, 0.00010269135236740112, 0.00011769309639930725, 0.00013269484043121338, 0.0001476965844631195, 0.00016269832849502563, 0.00017770007252693176, 0.0001927018165588379, 0.00020770356059074402, 0.00022270530462265015, 0.00023770704865455627, 0.0002527087926864624, 0.00026771053671836853, 0.00028271228075027466, 0.0002977140247821808, 0.0003127157688140869, 0.00032771751284599304, 0.00034271925687789917, 0.0003577210009098053, 0.0003727227449417114, 0.00038772448897361755, 0.0004027262330055237, 0.0004177279770374298, 0.00043272972106933594]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 6.0, 4.0, 6.0, 2.0, 9.0, 8.0, 18.0, 26.0, 33.0, 49.0, 94.0, 414.0, 178.0, 61.0, 31.0, 22.0, 14.0, 11.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.104447364807129, -4.988015174865723, -4.871582508087158, -4.755150318145752, -4.638718128204346, -4.5222859382629395, -4.405853271484375, -4.289421081542969, -4.1729888916015625, -4.056556701660156, -3.940124273300171, -3.8236918449401855, -3.7072596549987793, -3.590827226638794, -3.4743950366973877, -3.3579626083374023, -3.241530418395996, -3.1250979900360107, -3.0086658000946045, -2.892233371734619, -2.775801181793213, -2.6593687534332275, -2.5429365634918213, -2.426504135131836, -2.3100717067718506, -2.1936392784118652, -2.077207088470459, -1.9607747793197632, -1.8443424701690674, -1.727910041809082, -1.6114778518676758, -1.4950454235076904, -1.3786132335662842, -1.2621809244155884, -1.1457486152648926, -1.0293163061141968, -0.912883996963501, -0.7964516282081604, -0.6800193190574646, -0.5635870099067688, -0.447154700756073, -0.3307223916053772, -0.2142900675535202, -0.09785774350166321, 0.018574565649032593, 0.13500690460205078, 0.2514392137527466, 0.3678715229034424, 0.4843038320541382, 0.600736141204834, 0.7171684503555298, 0.8336007595062256, 0.9500330686569214, 1.0664653778076172, 1.1828978061676025, 1.2993299961090088, 1.4157624244689941, 1.53219473361969, 1.6486270427703857, 1.7650593519210815, 1.8814916610717773, 1.9979240894317627, 2.114356279373169, 2.2307887077331543, 2.3472208976745605]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 7.0, 8.0, 5.0, 16.0, 14.0, 16.0, 18.0, 38.0, 75.0, 100.0, 153.0, 181.0, 135.0, 92.0, 56.0, 20.0, 20.0, 7.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.555797576904297, -8.305106163024902, -8.054415702819824, -7.80372428894043, -7.553033351898193, -7.302342414855957, -7.0516510009765625, -6.800960063934326, -6.55026912689209, -6.2995781898498535, -6.048886775970459, -5.798195838928223, -5.547504901885986, -5.29681396484375, -5.0461225509643555, -4.795431613922119, -4.544740200042725, -4.294049263000488, -4.043357849121094, -3.7926669120788574, -3.541975975036621, -3.2912847995758057, -3.0405936241149902, -2.789902687072754, -2.5392115116119385, -2.288520336151123, -2.0378293991088867, -1.7871382236480713, -1.5364471673965454, -1.2857561111450195, -1.035064935684204, -0.7843738794326782, -0.5336823463439941, -0.2829912602901459, -0.03230017423629761, 0.21839094161987305, 0.4690819978713989, 0.7197730541229248, 0.9704642295837402, 1.2211552858352661, 1.471846342086792, 1.7225373983383179, 1.9732284545898438, 2.223919630050659, 2.4746108055114746, 2.725301742553711, 2.9759929180145264, 3.226684093475342, 3.477375030517578, 3.7280662059783936, 3.97875714302063, 4.229448318481445, 4.480139255523682, 4.730830192565918, 4.9815216064453125, 5.232212543487549, 5.482903480529785, 5.7335944175720215, 5.984285831451416, 6.234976768493652, 6.485667705535889, 6.736358642578125, 6.9870500564575195, 7.237740993499756, 7.48843240737915]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 3.0, 8.0, 10.0, 13.0, 21.0, 35.0, 67.0, 134.0, 321.0, 744.0, 2063.0, 5571.0, 29780.0, 4129031.0, 15669.0, 6076.0, 2561.0, 1016.0, 537.0, 232.0, 127.0, 72.0, 45.0, 38.0, 19.0, 10.0, 13.0, 5.0, 12.0, 9.0, 5.0, 1.0, 3.0, 4.0, 4.0, 6.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-7.1953125, -6.9405517578125, -6.685791015625, -6.4310302734375, -6.17626953125, -5.9215087890625, -5.666748046875, -5.4119873046875, -5.1572265625, -4.9024658203125, -4.647705078125, -4.3929443359375, -4.13818359375, -3.8834228515625, -3.628662109375, -3.3739013671875, -3.119140625, -2.8643798828125, -2.609619140625, -2.3548583984375, -2.10009765625, -1.8453369140625, -1.590576171875, -1.3358154296875, -1.0810546875, -0.8262939453125, -0.571533203125, -0.3167724609375, -0.06201171875, 0.1927490234375, 0.447509765625, 0.7022705078125, 0.95703125, 1.2117919921875, 1.466552734375, 1.7213134765625, 1.97607421875, 2.2308349609375, 2.485595703125, 2.7403564453125, 2.9951171875, 3.2498779296875, 3.504638671875, 3.7593994140625, 4.01416015625, 4.2689208984375, 4.523681640625, 4.7784423828125, 5.033203125, 5.2879638671875, 5.542724609375, 5.7974853515625, 6.05224609375, 6.3070068359375, 6.561767578125, 6.8165283203125, 7.0712890625, 7.3260498046875, 7.580810546875, 7.8355712890625, 8.09033203125, 8.3450927734375, 8.599853515625, 8.8546142578125, 9.109375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 3.0, 5.0, 9.0, 6.0, 7.0, 12.0, 35.0, 743.0, 41.0, 14.0, 11.0, 10.0, 10.0, 7.0, 10.0, 3.0, 3.0, 5.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 7.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.061309814453125, -0.05913972854614258, -0.056969642639160156, -0.054799556732177734, -0.05262947082519531, -0.05045938491821289, -0.04828929901123047, -0.04611921310424805, -0.043949127197265625, -0.0417790412902832, -0.03960895538330078, -0.03743886947631836, -0.03526878356933594, -0.033098697662353516, -0.030928611755371094, -0.028758525848388672, -0.02658843994140625, -0.024418354034423828, -0.022248268127441406, -0.020078182220458984, -0.017908096313476562, -0.01573801040649414, -0.013567924499511719, -0.011397838592529297, -0.009227752685546875, -0.007057666778564453, -0.004887580871582031, -0.0027174949645996094, -0.0005474090576171875, 0.0016226768493652344, 0.0037927627563476562, 0.005962848663330078, 0.0081329345703125, 0.010303020477294922, 0.012473106384277344, 0.014643192291259766, 0.016813278198242188, 0.01898336410522461, 0.02115345001220703, 0.023323535919189453, 0.025493621826171875, 0.027663707733154297, 0.02983379364013672, 0.03200387954711914, 0.03417396545410156, 0.036344051361083984, 0.038514137268066406, 0.04068422317504883, 0.04285430908203125, 0.04502439498901367, 0.047194480895996094, 0.049364566802978516, 0.05153465270996094, 0.05370473861694336, 0.05587482452392578, 0.0580449104309082, 0.060214996337890625, 0.06238508224487305, 0.06455516815185547, 0.06672525405883789, 0.06889533996582031, 0.07106542587280273, 0.07323551177978516, 0.07540559768676758, 0.07757568359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 15.0, 15.0, 29.0, 34.0, 53.0, 103.0, 126.0, 227.0, 418.0, 805.0, 1400.0, 2772.0, 5711.0, 13052.0, 36308.0, 3877999.0, 197351.0, 33839.0, 12465.0, 5576.0, 2746.0, 1394.0, 741.0, 431.0, 260.0, 140.0, 99.0, 47.0, 33.0, 24.0, 19.0, 10.0, 6.0, 6.0, 7.0, 0.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.40234375, -1.3654098510742188, -1.3284759521484375, -1.2915420532226562, -1.254608154296875, -1.2176742553710938, -1.1807403564453125, -1.1438064575195312, -1.10687255859375, -1.0699386596679688, -1.0330047607421875, -0.9960708618164062, -0.959136962890625, -0.9222030639648438, -0.8852691650390625, -0.8483352661132812, -0.8114013671875, -0.7744674682617188, -0.7375335693359375, -0.7005996704101562, -0.663665771484375, -0.6267318725585938, -0.5897979736328125, -0.5528640747070312, -0.51593017578125, -0.47899627685546875, -0.4420623779296875, -0.40512847900390625, -0.368194580078125, -0.33126068115234375, -0.2943267822265625, -0.25739288330078125, -0.220458984375, -0.18352508544921875, -0.1465911865234375, -0.10965728759765625, -0.072723388671875, -0.03578948974609375, 0.0011444091796875, 0.03807830810546875, 0.07501220703125, 0.11194610595703125, 0.1488800048828125, 0.18581390380859375, 0.222747802734375, 0.25968170166015625, 0.2966156005859375, 0.33354949951171875, 0.3704833984375, 0.40741729736328125, 0.4443511962890625, 0.48128509521484375, 0.518218994140625, 0.5551528930664062, 0.5920867919921875, 0.6290206909179688, 0.66595458984375, 0.7028884887695312, 0.7398223876953125, 0.7767562866210938, 0.813690185546875, 0.8506240844726562, 0.8875579833984375, 0.9244918823242188, 0.96142578125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 9.0, 7.0, 9.0, 17.0, 20.0, 19.0, 17.0, 14.0, 29.0, 26.0, 23.0, 21.0, 44.0, 3561.0, 28.0, 20.0, 28.0, 15.0, 26.0, 17.0, 15.0, 17.0, 15.0, 12.0, 7.0, 10.0, 6.0, 6.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1300048828125, -0.12502098083496094, -0.12003707885742188, -0.11505317687988281, -0.11006927490234375, -0.10508537292480469, -0.10010147094726562, -0.09511756896972656, -0.0901336669921875, -0.08514976501464844, -0.08016586303710938, -0.07518196105957031, -0.07019805908203125, -0.06521415710449219, -0.060230255126953125, -0.05524635314941406, -0.050262451171875, -0.04527854919433594, -0.040294647216796875, -0.03531074523925781, -0.03032684326171875, -0.025342941284179688, -0.020359039306640625, -0.015375137329101562, -0.0103912353515625, -0.0054073333740234375, -0.000423431396484375, 0.0045604705810546875, 0.00954437255859375, 0.014528274536132812, 0.019512176513671875, 0.024496078491210938, 0.02947998046875, 0.03446388244628906, 0.039447784423828125, 0.04443168640136719, 0.04941558837890625, 0.05439949035644531, 0.059383392333984375, 0.06436729431152344, 0.0693511962890625, 0.07433509826660156, 0.07931900024414062, 0.08430290222167969, 0.08928680419921875, 0.09427070617675781, 0.09925460815429688, 0.10423851013183594, 0.109222412109375, 0.11420631408691406, 0.11919021606445312, 0.12417411804199219, 0.12915802001953125, 0.1341419219970703, 0.13912582397460938, 0.14410972595214844, 0.1490936279296875, 0.15407752990722656, 0.15906143188476562, 0.1640453338623047, 0.16902923583984375, 0.1740131378173828, 0.17899703979492188, 0.18398094177246094, 0.18896484375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 6.0, 10.0, 37.0, 236.0, 578.0, 87.0, 26.0, 17.0, 9.0, 4.0, 0.0, 2.0], "bins": [-2.3651981353759766, -2.323052167892456, -2.2809059619903564, -2.238759994506836, -2.1966140270233154, -2.154467821121216, -2.1123218536376953, -2.070175886154175, -2.028029680252075, -1.9858835935592651, -1.9437376260757446, -1.9015915393829346, -1.8594454526901245, -1.8172993659973145, -1.775153398513794, -1.7330073118209839, -1.6908613443374634, -1.6487152576446533, -1.6065692901611328, -1.5644232034683228, -1.5222771167755127, -1.4801311492919922, -1.4379850625991821, -1.395838975906372, -1.3536930084228516, -1.3115469217300415, -1.269400954246521, -1.227254867553711, -1.1851087808609009, -1.1429626941680908, -1.1008167266845703, -1.0586706399917603, -1.0165245532989502, -0.9743785262107849, -0.9322324395179749, -0.8900864124298096, -0.8479403257369995, -0.8057942986488342, -0.763648271560669, -0.7215021848678589, -0.6793560981750488, -0.6372100710868835, -0.5950639843940735, -0.5529179573059082, -0.5107718706130981, -0.46862584352493286, -0.4264798164367676, -0.3843337595462799, -0.34218770265579224, -0.30004164576530457, -0.2578955888748169, -0.2157495617866516, -0.17360350489616394, -0.13145744800567627, -0.08931142091751099, -0.047165364027023315, -0.0050193071365356445, 0.03712674230337143, 0.0792727917432785, 0.12141883373260498, 0.16356489062309265, 0.20571094751358032, 0.2478569746017456, 0.2900030314922333, 0.33214908838272095]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 5.0, 7.0, 9.0, 13.0, 13.0, 17.0, 29.0, 37.0, 70.0, 106.0, 87.0, 117.0, 104.0, 116.0, 72.0, 51.0, 41.0, 18.0, 17.0, 12.0, 4.0, 5.0, 6.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8739718794822693, -0.8499200940132141, -0.8258683085441589, -0.8018165826797485, -0.7777647972106934, -0.7537130117416382, -0.729661226272583, -0.7056094408035278, -0.6815576553344727, -0.6575058698654175, -0.6334540843963623, -0.6094022989273071, -0.5853505730628967, -0.5612987875938416, -0.5372470021247864, -0.5131952166557312, -0.4891434907913208, -0.4650917053222656, -0.44103994965553284, -0.41698816418647766, -0.3929364085197449, -0.3688846230506897, -0.3448328375816345, -0.32078105211257935, -0.29672929644584656, -0.2726775109767914, -0.2486257553100586, -0.22457396984100342, -0.20052219927310944, -0.17647042870521545, -0.15241864323616028, -0.1283668726682663, -0.10431504249572754, -0.08026327192783356, -0.05621149390935898, -0.0321597158908844, -0.008107945322990417, 0.015943825244903564, 0.03999561071395874, 0.06404738128185272, 0.0880991518497467, 0.11215092241764069, 0.13620269298553467, 0.16025447845458984, 0.18430624902248383, 0.2083580195903778, 0.23240980505943298, 0.25646156072616577, 0.28051334619522095, 0.3045651316642761, 0.3286168873310089, 0.3526686728000641, 0.3767204284667969, 0.40077221393585205, 0.4248239994049072, 0.4488757848739624, 0.4729275405406952, 0.49697932600975037, 0.5210310816764832, 0.5450828671455383, 0.5691346526145935, 0.5931863784790039, 0.6172381639480591, 0.6412899494171143, 0.6653417348861694]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 9.0, 9.0, 9.0, 22.0, 32.0, 45.0, 61.0, 93.0, 143.0, 235.0, 315.0, 470.0, 778.0, 1136.0, 1751.0, 2660.0, 4041.0, 6794.0, 12319.0, 32333.0, 879173.0, 68551.0, 15626.0, 8082.0, 4779.0, 3068.0, 1969.0, 1343.0, 909.0, 575.0, 394.0, 271.0, 173.0, 109.0, 81.0, 59.0, 37.0, 28.0, 25.0, 14.0, 10.0, 7.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.373046875, -0.35955810546875, -0.3460693359375, -0.33258056640625, -0.319091796875, -0.30560302734375, -0.2921142578125, -0.27862548828125, -0.26513671875, -0.25164794921875, -0.2381591796875, -0.22467041015625, -0.211181640625, -0.19769287109375, -0.1842041015625, -0.17071533203125, -0.1572265625, -0.14373779296875, -0.1302490234375, -0.11676025390625, -0.103271484375, -0.08978271484375, -0.0762939453125, -0.06280517578125, -0.04931640625, -0.03582763671875, -0.0223388671875, -0.00885009765625, 0.004638671875, 0.01812744140625, 0.0316162109375, 0.04510498046875, 0.05859375, 0.07208251953125, 0.0855712890625, 0.09906005859375, 0.112548828125, 0.12603759765625, 0.1395263671875, 0.15301513671875, 0.16650390625, 0.17999267578125, 0.1934814453125, 0.20697021484375, 0.220458984375, 0.23394775390625, 0.2474365234375, 0.26092529296875, 0.2744140625, 0.28790283203125, 0.3013916015625, 0.31488037109375, 0.328369140625, 0.34185791015625, 0.3553466796875, 0.36883544921875, 0.38232421875, 0.39581298828125, 0.4093017578125, 0.42279052734375, 0.436279296875, 0.44976806640625, 0.4632568359375, 0.47674560546875, 0.490234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 3.0, 4.0, 11.0, 3.0, 6.0, 10.0, 12.0, 107.0, 514.0, 175.0, 30.0, 12.0, 16.0, 5.0, 8.0, 5.0, 9.0, 2.0, 3.0, 5.0, 7.0, 3.0, 7.0, 6.0, 2.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048614501953125, -0.04676389694213867, -0.044913291931152344, -0.043062686920166016, -0.04121208190917969, -0.03936147689819336, -0.03751087188720703, -0.0356602668762207, -0.033809661865234375, -0.03195905685424805, -0.03010845184326172, -0.02825784683227539, -0.026407241821289062, -0.024556636810302734, -0.022706031799316406, -0.020855426788330078, -0.01900482177734375, -0.017154216766357422, -0.015303611755371094, -0.013453006744384766, -0.011602401733398438, -0.00975179672241211, -0.007901191711425781, -0.006050586700439453, -0.004199981689453125, -0.002349376678466797, -0.0004987716674804688, 0.0013518333435058594, 0.0032024383544921875, 0.005053043365478516, 0.006903648376464844, 0.008754253387451172, 0.0106048583984375, 0.012455463409423828, 0.014306068420410156, 0.016156673431396484, 0.018007278442382812, 0.01985788345336914, 0.02170848846435547, 0.023559093475341797, 0.025409698486328125, 0.027260303497314453, 0.02911090850830078, 0.03096151351928711, 0.03281211853027344, 0.034662723541259766, 0.036513328552246094, 0.03836393356323242, 0.04021453857421875, 0.04206514358520508, 0.043915748596191406, 0.045766353607177734, 0.04761695861816406, 0.04946756362915039, 0.05131816864013672, 0.05316877365112305, 0.055019378662109375, 0.0568699836730957, 0.05872058868408203, 0.06057119369506836, 0.06242179870605469, 0.06427240371704102, 0.06612300872802734, 0.06797361373901367, 0.06982421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 6.0, 7.0, 17.0, 21.0, 17.0, 27.0, 34.0, 40.0, 50.0, 68.0, 110.0, 211.0, 389.0, 871.0, 2474.0, 8966.0, 49075.0, 819639.0, 141846.0, 17947.0, 4178.0, 1255.0, 553.0, 249.0, 163.0, 87.0, 72.0, 41.0, 28.0, 23.0, 16.0, 13.0, 10.0, 10.0, 9.0, 2.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.70361328125, -0.6827392578125, -0.661865234375, -0.6409912109375, -0.6201171875, -0.5992431640625, -0.578369140625, -0.5574951171875, -0.53662109375, -0.5157470703125, -0.494873046875, -0.4739990234375, -0.453125, -0.4322509765625, -0.411376953125, -0.3905029296875, -0.36962890625, -0.3487548828125, -0.327880859375, -0.3070068359375, -0.2861328125, -0.2652587890625, -0.244384765625, -0.2235107421875, -0.20263671875, -0.1817626953125, -0.160888671875, -0.1400146484375, -0.119140625, -0.0982666015625, -0.077392578125, -0.0565185546875, -0.03564453125, -0.0147705078125, 0.006103515625, 0.0269775390625, 0.0478515625, 0.0687255859375, 0.089599609375, 0.1104736328125, 0.13134765625, 0.1522216796875, 0.173095703125, 0.1939697265625, 0.21484375, 0.2357177734375, 0.256591796875, 0.2774658203125, 0.29833984375, 0.3192138671875, 0.340087890625, 0.3609619140625, 0.3818359375, 0.4027099609375, 0.423583984375, 0.4444580078125, 0.46533203125, 0.4862060546875, 0.507080078125, 0.5279541015625, 0.548828125, 0.5697021484375, 0.590576171875, 0.6114501953125, 0.63232421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 9.0, 11.0, 6.0, 13.0, 18.0, 20.0, 19.0, 26.0, 22.0, 35.0, 31.0, 27.0, 41.0, 38.0, 35.0, 48.0, 49.0, 59.0, 46.0, 36.0, 45.0, 45.0, 37.0, 39.0, 25.0, 26.0, 21.0, 30.0, 27.0, 22.0, 15.0, 15.0, 18.0, 7.0, 5.0, 7.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18896484375, -0.18268775939941406, -0.17641067504882812, -0.1701335906982422, -0.16385650634765625, -0.1575794219970703, -0.15130233764648438, -0.14502525329589844, -0.1387481689453125, -0.13247108459472656, -0.12619400024414062, -0.11991691589355469, -0.11363983154296875, -0.10736274719238281, -0.10108566284179688, -0.09480857849121094, -0.088531494140625, -0.08225440979003906, -0.07597732543945312, -0.06970024108886719, -0.06342315673828125, -0.05714607238769531, -0.050868988037109375, -0.04459190368652344, -0.0383148193359375, -0.03203773498535156, -0.025760650634765625, -0.019483566284179688, -0.01320648193359375, -0.0069293975830078125, -0.000652313232421875, 0.0056247711181640625, 0.01190185546875, 0.018178939819335938, 0.024456024169921875, 0.030733108520507812, 0.03701019287109375, 0.04328727722167969, 0.049564361572265625, 0.05584144592285156, 0.0621185302734375, 0.06839561462402344, 0.07467269897460938, 0.08094978332519531, 0.08722686767578125, 0.09350395202636719, 0.09978103637695312, 0.10605812072753906, 0.112335205078125, 0.11861228942871094, 0.12488937377929688, 0.1311664581298828, 0.13744354248046875, 0.1437206268310547, 0.14999771118164062, 0.15627479553222656, 0.1625518798828125, 0.16882896423339844, 0.17510604858398438, 0.1813831329345703, 0.18766021728515625, 0.1939373016357422, 0.20021438598632812, 0.20649147033691406, 0.2127685546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 4.0, 5.0, 19.0, 22.0, 17.0, 37.0, 60.0, 269.0, 1793.0, 919620.0, 124843.0, 1434.0, 234.0, 74.0, 33.0, 24.0, 16.0, 18.0, 10.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0242462158203125, -0.023552417755126953, -0.022858619689941406, -0.02216482162475586, -0.021471023559570312, -0.020777225494384766, -0.02008342742919922, -0.019389629364013672, -0.018695831298828125, -0.018002033233642578, -0.01730823516845703, -0.016614437103271484, -0.015920639038085938, -0.01522684097290039, -0.014533042907714844, -0.013839244842529297, -0.01314544677734375, -0.012451648712158203, -0.011757850646972656, -0.01106405258178711, -0.010370254516601562, -0.009676456451416016, -0.008982658386230469, -0.008288860321044922, -0.007595062255859375, -0.006901264190673828, -0.006207466125488281, -0.005513668060302734, -0.0048198699951171875, -0.004126071929931641, -0.0034322738647460938, -0.002738475799560547, -0.002044677734375, -0.0013508796691894531, -0.0006570816040039062, 3.6716461181640625e-05, 0.0007305145263671875, 0.0014243125915527344, 0.0021181106567382812, 0.002811908721923828, 0.003505706787109375, 0.004199504852294922, 0.004893302917480469, 0.005587100982666016, 0.0062808990478515625, 0.006974697113037109, 0.007668495178222656, 0.008362293243408203, 0.00905609130859375, 0.009749889373779297, 0.010443687438964844, 0.01113748550415039, 0.011831283569335938, 0.012525081634521484, 0.013218879699707031, 0.013912677764892578, 0.014606475830078125, 0.015300273895263672, 0.01599407196044922, 0.016687870025634766, 0.017381668090820312, 0.01807546615600586, 0.018769264221191406, 0.019463062286376953, 0.0201568603515625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 0.0, 3.0, 4.0, 8.0, 5.0, 5.0, 8.0, 22.0, 18.0, 31.0, 30.0, 52.0, 60.0, 160.0, 256.0, 112.0, 52.0, 48.0, 33.0, 29.0, 17.0, 13.0, 9.0, 8.0, 2.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.41157341003418e-05, -9.054038673639297e-05, -8.696503937244415e-05, -8.338969200849533e-05, -7.981434464454651e-05, -7.623899728059769e-05, -7.266364991664886e-05, -6.908830255270004e-05, -6.551295518875122e-05, -6.19376078248024e-05, -5.836226046085358e-05, -5.4786913096904755e-05, -5.121156573295593e-05, -4.763621836900711e-05, -4.406087100505829e-05, -4.0485523641109467e-05, -3.6910176277160645e-05, -3.333482891321182e-05, -2.9759481549263e-05, -2.618413418531418e-05, -2.2608786821365356e-05, -1.9033439457416534e-05, -1.5458092093467712e-05, -1.188274472951889e-05, -8.307397365570068e-06, -4.732050001621246e-06, -1.1567026376724243e-06, 2.4186447262763977e-06, 5.99399209022522e-06, 9.569339454174042e-06, 1.3144686818122864e-05, 1.6720034182071686e-05, 2.0295381546020508e-05, 2.387072890996933e-05, 2.7446076273918152e-05, 3.1021423637866974e-05, 3.4596771001815796e-05, 3.817211836576462e-05, 4.174746572971344e-05, 4.532281309366226e-05, 4.8898160457611084e-05, 5.2473507821559906e-05, 5.604885518550873e-05, 5.962420254945755e-05, 6.319954991340637e-05, 6.67748972773552e-05, 7.035024464130402e-05, 7.392559200525284e-05, 7.750093936920166e-05, 8.107628673315048e-05, 8.46516340970993e-05, 8.822698146104813e-05, 9.180232882499695e-05, 9.537767618894577e-05, 9.895302355289459e-05, 0.00010252837091684341, 0.00010610371828079224, 0.00010967906564474106, 0.00011325441300868988, 0.0001168297603726387, 0.00012040510773658752, 0.00012398045510053635, 0.00012755580246448517, 0.000131131149828434, 0.0001347064971923828]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 8.0, 10.0, 24.0, 37.0, 61.0, 143.0, 309.0, 708.0, 2049.0, 12011.0, 1019944.0, 9935.0, 1957.0, 708.0, 310.0, 147.0, 58.0, 35.0, 25.0, 21.0, 6.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0235443115234375, -0.022861242294311523, -0.022178173065185547, -0.02149510383605957, -0.020812034606933594, -0.020128965377807617, -0.01944589614868164, -0.018762826919555664, -0.018079757690429688, -0.01739668846130371, -0.016713619232177734, -0.016030550003051758, -0.015347480773925781, -0.014664411544799805, -0.013981342315673828, -0.013298273086547852, -0.012615203857421875, -0.011932134628295898, -0.011249065399169922, -0.010565996170043945, -0.009882926940917969, -0.009199857711791992, -0.008516788482666016, -0.007833719253540039, -0.0071506500244140625, -0.006467580795288086, -0.005784511566162109, -0.005101442337036133, -0.004418373107910156, -0.0037353038787841797, -0.003052234649658203, -0.0023691654205322266, -0.00168609619140625, -0.0010030269622802734, -0.0003199577331542969, 0.0003631114959716797, 0.0010461807250976562, 0.0017292499542236328, 0.0024123191833496094, 0.003095388412475586, 0.0037784576416015625, 0.004461526870727539, 0.005144596099853516, 0.005827665328979492, 0.006510734558105469, 0.007193803787231445, 0.007876873016357422, 0.008559942245483398, 0.009243011474609375, 0.009926080703735352, 0.010609149932861328, 0.011292219161987305, 0.011975288391113281, 0.012658357620239258, 0.013341426849365234, 0.014024496078491211, 0.014707565307617188, 0.015390634536743164, 0.01607370376586914, 0.016756772994995117, 0.017439842224121094, 0.01812291145324707, 0.018805980682373047, 0.019489049911499023, 0.020172119140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 23.0, 22.0, 45.0, 154.0, 462.0, 166.0, 54.0, 27.0, 11.0, 4.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00649261474609375, -0.006272792816162109, -0.006052970886230469, -0.005833148956298828, -0.0056133270263671875, -0.005393505096435547, -0.005173683166503906, -0.004953861236572266, -0.004734039306640625, -0.004514217376708984, -0.004294395446777344, -0.004074573516845703, -0.0038547515869140625, -0.003634929656982422, -0.0034151077270507812, -0.0031952857971191406, -0.0029754638671875, -0.0027556419372558594, -0.0025358200073242188, -0.002315998077392578, -0.0020961761474609375, -0.0018763542175292969, -0.0016565322875976562, -0.0014367103576660156, -0.001216888427734375, -0.0009970664978027344, -0.0007772445678710938, -0.0005574226379394531, -0.0003376007080078125, -0.00011777877807617188, 0.00010204315185546875, 0.0003218650817871094, 0.00054168701171875, 0.0007615089416503906, 0.0009813308715820312, 0.0012011528015136719, 0.0014209747314453125, 0.0016407966613769531, 0.0018606185913085938, 0.0020804405212402344, 0.002300262451171875, 0.0025200843811035156, 0.0027399063110351562, 0.002959728240966797, 0.0031795501708984375, 0.003399372100830078, 0.0036191940307617188, 0.0038390159606933594, 0.004058837890625, 0.004278659820556641, 0.004498481750488281, 0.004718303680419922, 0.0049381256103515625, 0.005157947540283203, 0.005377769470214844, 0.005597591400146484, 0.005817413330078125, 0.006037235260009766, 0.006257057189941406, 0.006476879119873047, 0.0066967010498046875, 0.006916522979736328, 0.007136344909667969, 0.007356166839599609, 0.00757598876953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 32.0, 922.0, 57.0, 6.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.794506072998047, -26.329580307006836, -25.864656448364258, -25.399730682373047, -24.934804916381836, -24.469879150390625, -24.004955291748047, -23.540029525756836, -23.075103759765625, -22.610177993774414, -22.145254135131836, -21.680328369140625, -21.215402603149414, -20.750476837158203, -20.285552978515625, -19.820627212524414, -19.355703353881836, -18.890777587890625, -18.425853729248047, -17.960927963256836, -17.496002197265625, -17.031078338623047, -16.566152572631836, -16.101226806640625, -15.636301040649414, -15.17137622833252, -14.706450462341309, -14.241525650024414, -13.776599884033203, -13.311675071716309, -12.846750259399414, -12.381824493408203, -11.916900634765625, -11.45197582244873, -10.98705005645752, -10.522125244140625, -10.057199478149414, -9.59227466583252, -9.127349853515625, -8.662424087524414, -8.197498321533203, -7.73257303237915, -7.267647743225098, -6.802722930908203, -6.33779764175415, -5.872872352600098, -5.407947063446045, -4.943021774291992, -4.478096961975098, -4.013171672821045, -3.5482466220855713, -3.0833213329315186, -2.618396282196045, -2.153470993041992, -1.6885457038879395, -1.2236206531524658, -0.7586953639984131, -0.2937701642513275, 0.17115503549575806, 0.636080265045166, 1.1010054349899292, 1.5659306049346924, 2.030855894088745, 2.4957809448242188, 2.9607062339782715]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 3.0, 4.0, 8.0, 3.0, 7.0, 14.0, 18.0, 24.0, 28.0, 56.0, 59.0, 68.0, 80.0, 90.0, 102.0, 85.0, 68.0, 62.0, 51.0, 43.0, 25.0, 28.0, 11.0, 12.0, 9.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.3362526893615723, -2.2663745880126953, -2.1964962482452393, -2.1266181468963623, -2.0567398071289062, -1.9868617057800293, -1.9169836044311523, -1.8471053838729858, -1.7772271633148193, -1.7073489427566528, -1.6374707221984863, -1.5675926208496094, -1.4977144002914429, -1.4278361797332764, -1.3579580783843994, -1.288079857826233, -1.2182016372680664, -1.1483234167099, -1.0784451961517334, -1.0085670948028564, -0.9386888742446899, -0.8688106536865234, -0.7989324927330017, -0.72905433177948, -0.6591761112213135, -0.589297890663147, -0.5194197297096252, -0.44954153895378113, -0.379663348197937, -0.3097851574420929, -0.23990696668624878, -0.17002877593040466, -0.10015058517456055, -0.03027239441871643, 0.039605796337127686, 0.1094839870929718, 0.17936217784881592, 0.24924036860466003, 0.31911855936050415, 0.38899675011634827, 0.4588749408721924, 0.5287531614303589, 0.5986313223838806, 0.6685094833374023, 0.7383877038955688, 0.8082659244537354, 0.8781440854072571, 0.9480222463607788, 1.0179004669189453, 1.0877786874771118, 1.1576569080352783, 1.2275350093841553, 1.2974132299423218, 1.3672914505004883, 1.4371695518493652, 1.5070477724075317, 1.5769259929656982, 1.6468042135238647, 1.7166824340820312, 1.7865605354309082, 1.8564387559890747, 1.9263169765472412, 1.9961950778961182, 2.066073417663574, 2.135951519012451]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 5.0, 13.0, 49.0, 174.0, 735.0, 2850.0, 11600.0, 3987534.0, 166485.0, 17533.0, 5133.0, 1461.0, 436.0, 122.0, 49.0, 15.0, 10.0, 8.0, 7.0, 4.0, 4.0, 4.0, 4.0, 5.0, 2.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9814453125, -1.9079742431640625, -1.834503173828125, -1.7610321044921875, -1.68756103515625, -1.6140899658203125, -1.540618896484375, -1.4671478271484375, -1.3936767578125, -1.3202056884765625, -1.246734619140625, -1.1732635498046875, -1.09979248046875, -1.0263214111328125, -0.952850341796875, -0.8793792724609375, -0.805908203125, -0.7324371337890625, -0.658966064453125, -0.5854949951171875, -0.51202392578125, -0.4385528564453125, -0.365081787109375, -0.2916107177734375, -0.2181396484375, -0.1446685791015625, -0.071197509765625, 0.0022735595703125, 0.07574462890625, 0.1492156982421875, 0.222686767578125, 0.2961578369140625, 0.36962890625, 0.4430999755859375, 0.516571044921875, 0.5900421142578125, 0.66351318359375, 0.7369842529296875, 0.810455322265625, 0.8839263916015625, 0.9573974609375, 1.0308685302734375, 1.104339599609375, 1.1778106689453125, 1.25128173828125, 1.3247528076171875, 1.398223876953125, 1.4716949462890625, 1.545166015625, 1.6186370849609375, 1.692108154296875, 1.7655792236328125, 1.83905029296875, 1.9125213623046875, 1.985992431640625, 2.0594635009765625, 2.1329345703125, 2.2064056396484375, 2.279876708984375, 2.3533477783203125, 2.42681884765625, 2.5002899169921875, 2.573760986328125, 2.6472320556640625, 2.720703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 4.0, 7.0, 6.0, 13.0, 7.0, 41.0, 235.0, 369.0, 151.0, 33.0, 20.0, 7.0, 11.0, 6.0, 7.0, 3.0, 5.0, 7.0, 7.0, 4.0, 4.0, 4.0, 4.0, 5.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043914794921875, -0.04228544235229492, -0.040656089782714844, -0.039026737213134766, -0.03739738464355469, -0.03576803207397461, -0.03413867950439453, -0.03250932693481445, -0.030879974365234375, -0.029250621795654297, -0.02762126922607422, -0.02599191665649414, -0.024362564086914062, -0.022733211517333984, -0.021103858947753906, -0.019474506378173828, -0.01784515380859375, -0.016215801239013672, -0.014586448669433594, -0.012957096099853516, -0.011327743530273438, -0.00969839096069336, -0.008069038391113281, -0.006439685821533203, -0.004810333251953125, -0.003180980682373047, -0.0015516281127929688, 7.772445678710938e-05, 0.0017070770263671875, 0.0033364295959472656, 0.004965782165527344, 0.006595134735107422, 0.0082244873046875, 0.009853839874267578, 0.011483192443847656, 0.013112545013427734, 0.014741897583007812, 0.01637125015258789, 0.01800060272216797, 0.019629955291748047, 0.021259307861328125, 0.022888660430908203, 0.02451801300048828, 0.02614736557006836, 0.027776718139648438, 0.029406070709228516, 0.031035423278808594, 0.03266477584838867, 0.03429412841796875, 0.03592348098754883, 0.037552833557128906, 0.039182186126708984, 0.04081153869628906, 0.04244089126586914, 0.04407024383544922, 0.0456995964050293, 0.047328948974609375, 0.04895830154418945, 0.05058765411376953, 0.05221700668334961, 0.05384635925292969, 0.055475711822509766, 0.057105064392089844, 0.05873441696166992, 0.06036376953125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 16.0, 14.0, 24.0, 26.0, 42.0, 42.0, 77.0, 118.0, 228.0, 606.0, 3125.0, 65248.0, 4110409.0, 12099.0, 1362.0, 383.0, 156.0, 86.0, 59.0, 50.0, 26.0, 22.0, 20.0, 13.0, 14.0, 4.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.646484375, -2.5838775634765625, -2.521270751953125, -2.4586639404296875, -2.39605712890625, -2.3334503173828125, -2.270843505859375, -2.2082366943359375, -2.1456298828125, -2.0830230712890625, -2.020416259765625, -1.9578094482421875, -1.89520263671875, -1.8325958251953125, -1.769989013671875, -1.7073822021484375, -1.644775390625, -1.5821685791015625, -1.519561767578125, -1.4569549560546875, -1.39434814453125, -1.3317413330078125, -1.269134521484375, -1.2065277099609375, -1.1439208984375, -1.0813140869140625, -1.018707275390625, -0.9561004638671875, -0.89349365234375, -0.8308868408203125, -0.768280029296875, -0.7056732177734375, -0.64306640625, -0.5804595947265625, -0.517852783203125, -0.4552459716796875, -0.39263916015625, -0.3300323486328125, -0.267425537109375, -0.2048187255859375, -0.1422119140625, -0.0796051025390625, -0.016998291015625, 0.0456085205078125, 0.10821533203125, 0.1708221435546875, 0.233428955078125, 0.2960357666015625, 0.358642578125, 0.4212493896484375, 0.483856201171875, 0.5464630126953125, 0.60906982421875, 0.6716766357421875, 0.734283447265625, 0.7968902587890625, 0.8594970703125, 0.9221038818359375, 0.984710693359375, 1.0473175048828125, 1.10992431640625, 1.1725311279296875, 1.235137939453125, 1.2977447509765625, 1.3603515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 1.0, 2.0, 12.0, 13.0, 13.0, 15.0, 16.0, 23.0, 34.0, 39.0, 46.0, 57.0, 85.0, 100.0, 2976.0, 211.0, 98.0, 61.0, 57.0, 54.0, 39.0, 24.0, 27.0, 18.0, 17.0, 10.0, 17.0, 2.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11981201171875, -0.11431598663330078, -0.10881996154785156, -0.10332393646240234, -0.09782791137695312, -0.0923318862915039, -0.08683586120605469, -0.08133983612060547, -0.07584381103515625, -0.07034778594970703, -0.06485176086425781, -0.059355735778808594, -0.053859710693359375, -0.048363685607910156, -0.04286766052246094, -0.03737163543701172, -0.0318756103515625, -0.02637958526611328, -0.020883560180664062, -0.015387535095214844, -0.009891510009765625, -0.004395484924316406, 0.0011005401611328125, 0.006596565246582031, 0.01209259033203125, 0.01758861541748047, 0.023084640502929688, 0.028580665588378906, 0.034076690673828125, 0.039572715759277344, 0.04506874084472656, 0.05056476593017578, 0.056060791015625, 0.06155681610107422, 0.06705284118652344, 0.07254886627197266, 0.07804489135742188, 0.0835409164428711, 0.08903694152832031, 0.09453296661376953, 0.10002899169921875, 0.10552501678466797, 0.11102104187011719, 0.1165170669555664, 0.12201309204101562, 0.12750911712646484, 0.13300514221191406, 0.13850116729736328, 0.1439971923828125, 0.14949321746826172, 0.15498924255371094, 0.16048526763916016, 0.16598129272460938, 0.1714773178100586, 0.1769733428955078, 0.18246936798095703, 0.18796539306640625, 0.19346141815185547, 0.1989574432373047, 0.2044534683227539, 0.20994949340820312, 0.21544551849365234, 0.22094154357910156, 0.22643756866455078, 0.23193359375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 55.0, 742.0, 164.0, 26.0, 3.0, 8.0, 2.0, 3.0, 0.0, 3.0], "bins": [-2.836090564727783, -2.785233497619629, -2.7343766689300537, -2.6835196018218994, -2.632662534713745, -2.58180570602417, -2.5309486389160156, -2.4800915718078613, -2.429234743118286, -2.378377676010132, -2.3275208473205566, -2.2766637802124023, -2.225806713104248, -2.174949884414673, -2.1240928173065186, -2.0732357501983643, -2.02237868309021, -1.9715217351913452, -1.920664668083191, -1.8698077201843262, -1.8189507722854614, -1.7680937051773071, -1.7172367572784424, -1.666379690170288, -1.615522861480713, -1.5646659135818481, -1.5138088464736938, -1.462951898574829, -1.4120949506759644, -1.36123788356781, -1.3103809356689453, -1.259523868560791, -1.2086668014526367, -1.157809853553772, -1.1069527864456177, -1.056095838546753, -1.0052388906478882, -0.9543818235397339, -0.9035248756408691, -0.8526678681373596, -0.8018109798431396, -0.7509539723396301, -0.7000970244407654, -0.6492400169372559, -0.5983830094337463, -0.5475260019302368, -0.49666905403137207, -0.44581204652786255, -0.394955039024353, -0.3440980613231659, -0.29324105381965637, -0.24238407611846924, -0.1915270835161209, -0.14067009091377258, -0.08981311321258545, -0.03895610570907593, 0.011900871992111206, 0.06275786459445953, 0.11361484974622726, 0.164471834897995, 0.21532882750034332, 0.26618582010269165, 0.3170427978038788, 0.3678998053073883, 0.41875678300857544]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 8.0, 7.0, 8.0, 23.0, 21.0, 27.0, 34.0, 51.0, 51.0, 69.0, 77.0, 80.0, 82.0, 94.0, 83.0, 60.0, 45.0, 48.0, 24.0, 27.0, 17.0, 8.0, 8.0, 2.0, 2.0, 2.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7812978625297546, -0.7593730688095093, -0.7374482750892639, -0.7155234813690186, -0.6935986876487732, -0.6716738939285278, -0.6497490406036377, -0.6278243064880371, -0.605899453163147, -0.5839746594429016, -0.5620498657226562, -0.5401250720024109, -0.5182002782821655, -0.49627548456192017, -0.4743506610393524, -0.45242586731910706, -0.4305011034011841, -0.4085763096809387, -0.38665151596069336, -0.364726722240448, -0.34280192852020264, -0.3208771347999573, -0.2989523112773895, -0.27702751755714417, -0.2551027238368988, -0.23317793011665344, -0.21125313639640808, -0.18932832777500153, -0.16740353405475616, -0.1454787403345108, -0.12355393171310425, -0.10162913799285889, -0.07970428466796875, -0.05777948722243309, -0.03585468977689743, -0.013929888606071472, 0.00799490511417389, 0.02991969883441925, 0.051844507455825806, 0.07376930117607117, 0.09569409489631653, 0.11761888861656189, 0.13954368233680725, 0.1614684909582138, 0.18339328467845917, 0.20531807839870453, 0.22724288702011108, 0.24916768074035645, 0.2710924744606018, 0.29301726818084717, 0.31494206190109253, 0.3368668556213379, 0.35879164934158325, 0.3807164430618286, 0.40264126658439636, 0.4245660603046417, 0.4464908540248871, 0.46841564774513245, 0.4903404414653778, 0.5122652649879456, 0.5341900587081909, 0.5561148524284363, 0.5780396461486816, 0.599964439868927, 0.6218892335891724]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 5.0, 9.0, 8.0, 19.0, 25.0, 24.0, 36.0, 64.0, 69.0, 114.0, 148.0, 194.0, 257.0, 378.0, 507.0, 759.0, 1094.0, 1611.0, 2495.0, 4149.0, 7706.0, 17401.0, 66869.0, 776559.0, 121318.0, 23383.0, 9365.0, 4875.0, 2977.0, 1896.0, 1266.0, 844.0, 591.0, 415.0, 309.0, 232.0, 152.0, 127.0, 78.0, 69.0, 49.0, 30.0, 24.0, 21.0, 8.0, 13.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20556640625, -0.19885826110839844, -0.19215011596679688, -0.1854419708251953, -0.17873382568359375, -0.1720256805419922, -0.16531753540039062, -0.15860939025878906, -0.1519012451171875, -0.14519309997558594, -0.13848495483398438, -0.1317768096923828, -0.12506866455078125, -0.11836051940917969, -0.11165237426757812, -0.10494422912597656, -0.098236083984375, -0.09152793884277344, -0.08481979370117188, -0.07811164855957031, -0.07140350341796875, -0.06469535827636719, -0.057987213134765625, -0.05127906799316406, -0.0445709228515625, -0.03786277770996094, -0.031154632568359375, -0.024446487426757812, -0.01773834228515625, -0.011030197143554688, -0.004322052001953125, 0.0023860931396484375, 0.00909423828125, 0.015802383422851562, 0.022510528564453125, 0.029218673706054688, 0.03592681884765625, 0.04263496398925781, 0.049343109130859375, 0.05605125427246094, 0.0627593994140625, 0.06946754455566406, 0.07617568969726562, 0.08288383483886719, 0.08959197998046875, 0.09630012512207031, 0.10300827026367188, 0.10971641540527344, 0.116424560546875, 0.12313270568847656, 0.12984085083007812, 0.1365489959716797, 0.14325714111328125, 0.1499652862548828, 0.15667343139648438, 0.16338157653808594, 0.1700897216796875, 0.17679786682128906, 0.18350601196289062, 0.1902141571044922, 0.19692230224609375, 0.2036304473876953, 0.21033859252929688, 0.21704673767089844, 0.2237548828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 3.0, 8.0, 13.0, 40.0, 84.0, 131.0, 181.0, 176.0, 116.0, 67.0, 44.0, 15.0, 19.0, 9.0, 11.0, 7.0, 5.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 4.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034515380859375, -0.03338289260864258, -0.032250404357910156, -0.031117916107177734, -0.029985427856445312, -0.02885293960571289, -0.02772045135498047, -0.026587963104248047, -0.025455474853515625, -0.024322986602783203, -0.02319049835205078, -0.02205801010131836, -0.020925521850585938, -0.019793033599853516, -0.018660545349121094, -0.017528057098388672, -0.01639556884765625, -0.015263080596923828, -0.014130592346191406, -0.012998104095458984, -0.011865615844726562, -0.01073312759399414, -0.009600639343261719, -0.008468151092529297, -0.007335662841796875, -0.006203174591064453, -0.005070686340332031, -0.003938198089599609, -0.0028057098388671875, -0.0016732215881347656, -0.0005407333374023438, 0.0005917549133300781, 0.0017242431640625, 0.002856731414794922, 0.003989219665527344, 0.005121707916259766, 0.0062541961669921875, 0.007386684417724609, 0.008519172668457031, 0.009651660919189453, 0.010784149169921875, 0.011916637420654297, 0.013049125671386719, 0.01418161392211914, 0.015314102172851562, 0.016446590423583984, 0.017579078674316406, 0.018711566925048828, 0.01984405517578125, 0.020976543426513672, 0.022109031677246094, 0.023241519927978516, 0.024374008178710938, 0.02550649642944336, 0.02663898468017578, 0.027771472930908203, 0.028903961181640625, 0.030036449432373047, 0.03116893768310547, 0.03230142593383789, 0.03343391418457031, 0.034566402435302734, 0.035698890686035156, 0.03683137893676758, 0.0379638671875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 11.0, 11.0, 13.0, 21.0, 19.0, 35.0, 49.0, 54.0, 111.0, 165.0, 331.0, 648.0, 1643.0, 6661.0, 322897.0, 704593.0, 7935.0, 1793.0, 708.0, 319.0, 169.0, 118.0, 63.0, 61.0, 30.0, 21.0, 21.0, 18.0, 7.0, 6.0, 9.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.470947265625, -0.4557762145996094, -0.44060516357421875, -0.4254341125488281, -0.4102630615234375, -0.3950920104980469, -0.37992095947265625, -0.3647499084472656, -0.349578857421875, -0.3344078063964844, -0.31923675537109375, -0.3040657043457031, -0.2888946533203125, -0.2737236022949219, -0.25855255126953125, -0.24338150024414062, -0.22821044921875, -0.21303939819335938, -0.19786834716796875, -0.18269729614257812, -0.1675262451171875, -0.15235519409179688, -0.13718414306640625, -0.12201309204101562, -0.106842041015625, -0.09167098999023438, -0.07649993896484375, -0.061328887939453125, -0.0461578369140625, -0.030986785888671875, -0.01581573486328125, -0.000644683837890625, 0.0145263671875, 0.029697418212890625, 0.04486846923828125, 0.060039520263671875, 0.0752105712890625, 0.09038162231445312, 0.10555267333984375, 0.12072372436523438, 0.135894775390625, 0.15106582641601562, 0.16623687744140625, 0.18140792846679688, 0.1965789794921875, 0.21175003051757812, 0.22692108154296875, 0.24209213256835938, 0.25726318359375, 0.2724342346191406, 0.28760528564453125, 0.3027763366699219, 0.3179473876953125, 0.3331184387207031, 0.34828948974609375, 0.3634605407714844, 0.378631591796875, 0.3938026428222656, 0.40897369384765625, 0.4241447448730469, 0.4393157958984375, 0.4544868469238281, 0.46965789794921875, 0.4848289489746094, 0.5]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 9.0, 7.0, 11.0, 12.0, 19.0, 24.0, 24.0, 39.0, 37.0, 41.0, 49.0, 47.0, 37.0, 45.0, 53.0, 58.0, 59.0, 56.0, 51.0, 47.0, 56.0, 48.0, 32.0, 29.0, 23.0, 19.0, 18.0, 14.0, 12.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138916015625, -0.13463211059570312, -0.13034820556640625, -0.12606430053710938, -0.1217803955078125, -0.11749649047851562, -0.11321258544921875, -0.10892868041992188, -0.104644775390625, -0.10036087036132812, -0.09607696533203125, -0.09179306030273438, -0.0875091552734375, -0.08322525024414062, -0.07894134521484375, -0.07465744018554688, -0.07037353515625, -0.06608963012695312, -0.06180572509765625, -0.057521820068359375, -0.0532379150390625, -0.048954010009765625, -0.04467010498046875, -0.040386199951171875, -0.036102294921875, -0.031818389892578125, -0.02753448486328125, -0.023250579833984375, -0.0189666748046875, -0.014682769775390625, -0.01039886474609375, -0.006114959716796875, -0.0018310546875, 0.002452850341796875, 0.00673675537109375, 0.011020660400390625, 0.0153045654296875, 0.019588470458984375, 0.02387237548828125, 0.028156280517578125, 0.032440185546875, 0.036724090576171875, 0.04100799560546875, 0.045291900634765625, 0.0495758056640625, 0.053859710693359375, 0.05814361572265625, 0.062427520751953125, 0.06671142578125, 0.07099533081054688, 0.07527923583984375, 0.07956314086914062, 0.0838470458984375, 0.08813095092773438, 0.09241485595703125, 0.09669876098632812, 0.100982666015625, 0.10526657104492188, 0.10955047607421875, 0.11383438110351562, 0.1181182861328125, 0.12240219116210938, 0.12668609619140625, 0.13097000122070312, 0.13525390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 6.0, 3.0, 13.0, 25.0, 34.0, 20.0, 29.0, 51.0, 55.0, 81.0, 134.0, 190.0, 289.0, 537.0, 1272.0, 4262.0, 44398.0, 967360.0, 24149.0, 3117.0, 1106.0, 512.0, 281.0, 181.0, 111.0, 79.0, 47.0, 46.0, 38.0, 28.0, 17.0, 14.0, 9.0, 14.0, 5.0, 6.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00838470458984375, -0.008108973503112793, -0.007833242416381836, -0.007557511329650879, -0.007281780242919922, -0.007006049156188965, -0.006730318069458008, -0.006454586982727051, -0.006178855895996094, -0.005903124809265137, -0.00562739372253418, -0.005351662635803223, -0.005075931549072266, -0.004800200462341309, -0.0045244693756103516, -0.0042487382888793945, -0.0039730072021484375, -0.0036972761154174805, -0.0034215450286865234, -0.0031458139419555664, -0.0028700828552246094, -0.0025943517684936523, -0.0023186206817626953, -0.0020428895950317383, -0.0017671585083007812, -0.0014914274215698242, -0.0012156963348388672, -0.0009399652481079102, -0.0006642341613769531, -0.0003885030746459961, -0.00011277198791503906, 0.00016295909881591797, 0.000438690185546875, 0.000714421272277832, 0.000990152359008789, 0.001265883445739746, 0.0015416145324707031, 0.0018173456192016602, 0.002093076705932617, 0.0023688077926635742, 0.0026445388793945312, 0.0029202699661254883, 0.0031960010528564453, 0.0034717321395874023, 0.0037474632263183594, 0.004023194313049316, 0.0042989253997802734, 0.0045746564865112305, 0.0048503875732421875, 0.0051261186599731445, 0.0054018497467041016, 0.005677580833435059, 0.005953311920166016, 0.006229043006896973, 0.00650477409362793, 0.006780505180358887, 0.007056236267089844, 0.007331967353820801, 0.007607698440551758, 0.007883429527282715, 0.008159160614013672, 0.008434891700744629, 0.008710622787475586, 0.008986353874206543, 0.0092620849609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 3.0, 1.0, 4.0, 9.0, 9.0, 2.0, 6.0, 7.0, 11.0, 11.0, 24.0, 21.0, 17.0, 31.0, 38.0, 98.0, 159.0, 229.0, 90.0, 62.0, 43.0, 27.0, 20.0, 21.0, 13.0, 15.0, 7.0, 6.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.728006362915039e-05, -5.549192428588867e-05, -5.370378494262695e-05, -5.1915645599365234e-05, -5.0127506256103516e-05, -4.83393669128418e-05, -4.655122756958008e-05, -4.476308822631836e-05, -4.297494888305664e-05, -4.118680953979492e-05, -3.93986701965332e-05, -3.7610530853271484e-05, -3.5822391510009766e-05, -3.403425216674805e-05, -3.224611282348633e-05, -3.045797348022461e-05, -2.866983413696289e-05, -2.6881694793701172e-05, -2.5093555450439453e-05, -2.3305416107177734e-05, -2.1517276763916016e-05, -1.9729137420654297e-05, -1.7940998077392578e-05, -1.615285873413086e-05, -1.436471939086914e-05, -1.2576580047607422e-05, -1.0788440704345703e-05, -9.000301361083984e-06, -7.212162017822266e-06, -5.424022674560547e-06, -3.635883331298828e-06, -1.8477439880371094e-06, -5.960464477539063e-08, 1.7285346984863281e-06, 3.516674041748047e-06, 5.304813385009766e-06, 7.092952728271484e-06, 8.881092071533203e-06, 1.0669231414794922e-05, 1.245737075805664e-05, 1.424551010131836e-05, 1.6033649444580078e-05, 1.7821788787841797e-05, 1.9609928131103516e-05, 2.1398067474365234e-05, 2.3186206817626953e-05, 2.4974346160888672e-05, 2.676248550415039e-05, 2.855062484741211e-05, 3.0338764190673828e-05, 3.212690353393555e-05, 3.3915042877197266e-05, 3.5703182220458984e-05, 3.74913215637207e-05, 3.927946090698242e-05, 4.106760025024414e-05, 4.285573959350586e-05, 4.464387893676758e-05, 4.64320182800293e-05, 4.8220157623291016e-05, 5.0008296966552734e-05, 5.179643630981445e-05, 5.358457565307617e-05, 5.537271499633789e-05, 5.716085433959961e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 10.0, 9.0, 12.0, 18.0, 36.0, 51.0, 93.0, 226.0, 608.0, 2816.0, 788820.0, 252174.0, 2612.0, 585.0, 217.0, 108.0, 49.0, 35.0, 22.0, 14.0, 12.0, 6.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0249481201171875, -0.024254560470581055, -0.02356100082397461, -0.022867441177368164, -0.02217388153076172, -0.021480321884155273, -0.020786762237548828, -0.020093202590942383, -0.019399642944335938, -0.018706083297729492, -0.018012523651123047, -0.0173189640045166, -0.016625404357910156, -0.01593184471130371, -0.015238285064697266, -0.01454472541809082, -0.013851165771484375, -0.01315760612487793, -0.012464046478271484, -0.011770486831665039, -0.011076927185058594, -0.010383367538452148, -0.009689807891845703, -0.008996248245239258, -0.008302688598632812, -0.007609128952026367, -0.006915569305419922, -0.0062220096588134766, -0.005528450012207031, -0.004834890365600586, -0.004141330718994141, -0.0034477710723876953, -0.00275421142578125, -0.0020606517791748047, -0.0013670921325683594, -0.0006735324859619141, 2.002716064453125e-05, 0.0007135868072509766, 0.0014071464538574219, 0.002100706100463867, 0.0027942657470703125, 0.003487825393676758, 0.004181385040283203, 0.0048749446868896484, 0.005568504333496094, 0.006262063980102539, 0.006955623626708984, 0.00764918327331543, 0.008342742919921875, 0.00903630256652832, 0.009729862213134766, 0.010423421859741211, 0.011116981506347656, 0.011810541152954102, 0.012504100799560547, 0.013197660446166992, 0.013891220092773438, 0.014584779739379883, 0.015278339385986328, 0.015971899032592773, 0.01666545867919922, 0.017359018325805664, 0.01805257797241211, 0.018746137619018555, 0.019439697265625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 15.0, 14.0, 21.0, 34.0, 44.0, 72.0, 109.0, 169.0, 167.0, 127.0, 76.0, 39.0, 26.0, 20.0, 16.0, 10.0, 4.0, 2.0, 9.0, 5.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005382537841796875, -0.005190372467041016, -0.004998207092285156, -0.004806041717529297, -0.0046138763427734375, -0.004421710968017578, -0.004229545593261719, -0.004037380218505859, -0.00384521484375, -0.0036530494689941406, -0.0034608840942382812, -0.003268718719482422, -0.0030765533447265625, -0.002884387969970703, -0.0026922225952148438, -0.0025000572204589844, -0.002307891845703125, -0.0021157264709472656, -0.0019235610961914062, -0.0017313957214355469, -0.0015392303466796875, -0.0013470649719238281, -0.0011548995971679688, -0.0009627342224121094, -0.00077056884765625, -0.0005784034729003906, -0.00038623809814453125, -0.00019407272338867188, -1.9073486328125e-06, 0.00019025802612304688, 0.00038242340087890625, 0.0005745887756347656, 0.000766754150390625, 0.0009589195251464844, 0.0011510848999023438, 0.0013432502746582031, 0.0015354156494140625, 0.0017275810241699219, 0.0019197463989257812, 0.0021119117736816406, 0.0023040771484375, 0.0024962425231933594, 0.0026884078979492188, 0.002880573272705078, 0.0030727386474609375, 0.003264904022216797, 0.0034570693969726562, 0.0036492347717285156, 0.003841400146484375, 0.004033565521240234, 0.004225730895996094, 0.004417896270751953, 0.0046100616455078125, 0.004802227020263672, 0.004994392395019531, 0.005186557769775391, 0.00537872314453125, 0.005570888519287109, 0.005763053894042969, 0.005955219268798828, 0.0061473846435546875, 0.006339550018310547, 0.006531715393066406, 0.006723880767822266, 0.006916046142578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 14.0, 669.0, 328.0, 5.0, 0.0, 2.0, 1.0], "bins": [-9.949470520019531, -9.780729293823242, -9.611988067626953, -9.443246841430664, -9.274505615234375, -9.105764389038086, -8.937023162841797, -8.768281936645508, -8.599540710449219, -8.43079948425293, -8.26205825805664, -8.093317031860352, -7.9245758056640625, -7.755834579467773, -7.587093353271484, -7.418352127075195, -7.249610424041748, -7.080869197845459, -6.91212797164917, -6.743386745452881, -6.574645519256592, -6.405904293060303, -6.2371625900268555, -6.068421363830566, -5.899680137634277, -5.730938911437988, -5.562197685241699, -5.39345645904541, -5.224715232849121, -5.055974006652832, -4.887232780456543, -4.718491554260254, -4.549750804901123, -4.381009578704834, -4.212268352508545, -4.043527126312256, -3.874785900115967, -3.7060446739196777, -3.5373032093048096, -3.3685619831085205, -3.1998207569122314, -3.0310795307159424, -2.8623383045196533, -2.693596839904785, -2.524855613708496, -2.356114387512207, -2.187373161315918, -2.018631935119629, -1.8498907089233398, -1.6811494827270508, -1.5124082565307617, -1.343666911125183, -1.174925684928894, -1.006184458732605, -0.8374431133270264, -0.6687018871307373, -0.49996060132980347, -0.331219345331192, -0.16247808933258057, 0.0062631964683532715, 0.17500442266464233, 0.3437456488609314, 0.51248699426651, 0.6812282204627991, 0.8499694466590881]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 18.0, 19.0, 15.0, 13.0, 22.0, 35.0, 24.0, 46.0, 53.0, 59.0, 50.0, 54.0, 52.0, 58.0, 67.0, 58.0, 52.0, 45.0, 44.0, 41.0, 26.0, 32.0, 21.0, 21.0, 18.0, 13.0, 8.0, 3.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7800173163414001, -0.7510339617729187, -0.722050666809082, -0.6930673122406006, -0.6640839576721191, -0.6351006031036377, -0.606117308139801, -0.5771339535713196, -0.5481506586074829, -0.5191673040390015, -0.4901839792728424, -0.46120065450668335, -0.4322172999382019, -0.40323397517204285, -0.3742506504058838, -0.34526729583740234, -0.3162839412689209, -0.28730061650276184, -0.2583172619342804, -0.22933393716812134, -0.2003505975008011, -0.17136725783348083, -0.14238393306732178, -0.11340059340000153, -0.08441725373268127, -0.05543391779065132, -0.02645058184862137, 0.002532750368118286, 0.03151609003543854, 0.06049942970275879, 0.08948275446891785, 0.1184660941362381, 0.14744937419891357, 0.17643271386623383, 0.20541605353355408, 0.23439937829971313, 0.2633827328681946, 0.29236605763435364, 0.3213493824005127, 0.35033273696899414, 0.3793160617351532, 0.40829938650131226, 0.4372827410697937, 0.46626606583595276, 0.4952493906021118, 0.5242327451705933, 0.5532160997390747, 0.5821993947029114, 0.6111827492713928, 0.6401661038398743, 0.6691493988037109, 0.6981327533721924, 0.7271161079406738, 0.7560994625091553, 0.7850827574729919, 0.8140661120414734, 0.8430494070053101, 0.8720327615737915, 0.9010160565376282, 0.9299994111061096, 0.9589827656745911, 0.9879660606384277, 1.0169494152069092, 1.0459327697753906, 1.074916124343872]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 5.0, 12.0, 16.0, 28.0, 63.0, 184.0, 536.0, 2178.0, 51733.0, 4133052.0, 4799.0, 1071.0, 312.0, 119.0, 57.0, 31.0, 11.0, 12.0, 10.0, 5.0, 3.0, 5.0, 5.0, 2.0, 1.0, 7.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89111328125, -0.8633804321289062, -0.8356475830078125, -0.8079147338867188, -0.780181884765625, -0.7524490356445312, -0.7247161865234375, -0.6969833374023438, -0.66925048828125, -0.6415176391601562, -0.6137847900390625, -0.5860519409179688, -0.558319091796875, -0.5305862426757812, -0.5028533935546875, -0.47512054443359375, -0.4473876953125, -0.41965484619140625, -0.3919219970703125, -0.36418914794921875, -0.336456298828125, -0.30872344970703125, -0.2809906005859375, -0.25325775146484375, -0.22552490234375, -0.19779205322265625, -0.1700592041015625, -0.14232635498046875, -0.114593505859375, -0.08686065673828125, -0.0591278076171875, -0.03139495849609375, -0.003662109375, 0.02407073974609375, 0.0518035888671875, 0.07953643798828125, 0.107269287109375, 0.13500213623046875, 0.1627349853515625, 0.19046783447265625, 0.21820068359375, 0.24593353271484375, 0.2736663818359375, 0.30139923095703125, 0.329132080078125, 0.35686492919921875, 0.3845977783203125, 0.41233062744140625, 0.4400634765625, 0.46779632568359375, 0.4955291748046875, 0.5232620239257812, 0.550994873046875, 0.5787277221679688, 0.6064605712890625, 0.6341934204101562, 0.66192626953125, 0.6896591186523438, 0.7173919677734375, 0.7451248168945312, 0.772857666015625, 0.8005905151367188, 0.8283233642578125, 0.8560562133789062, 0.8837890625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 9.0, 14.0, 19.0, 60.0, 98.0, 159.0, 159.0, 149.0, 96.0, 62.0, 31.0, 27.0, 19.0, 15.0, 6.0, 8.0, 9.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 7.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03594970703125, -0.03483009338378906, -0.033710479736328125, -0.03259086608886719, -0.03147125244140625, -0.030351638793945312, -0.029232025146484375, -0.028112411499023438, -0.0269927978515625, -0.025873184204101562, -0.024753570556640625, -0.023633956909179688, -0.02251434326171875, -0.021394729614257812, -0.020275115966796875, -0.019155502319335938, -0.018035888671875, -0.016916275024414062, -0.015796661376953125, -0.014677047729492188, -0.01355743408203125, -0.012437820434570312, -0.011318206787109375, -0.010198593139648438, -0.0090789794921875, -0.007959365844726562, -0.006839752197265625, -0.0057201385498046875, -0.00460052490234375, -0.0034809112548828125, -0.002361297607421875, -0.0012416839599609375, -0.0001220703125, 0.0009975433349609375, 0.002117156982421875, 0.0032367706298828125, 0.00435638427734375, 0.0054759979248046875, 0.006595611572265625, 0.0077152252197265625, 0.0088348388671875, 0.009954452514648438, 0.011074066162109375, 0.012193679809570312, 0.01331329345703125, 0.014432907104492188, 0.015552520751953125, 0.016672134399414062, 0.017791748046875, 0.018911361694335938, 0.020030975341796875, 0.021150588989257812, 0.02227020263671875, 0.023389816284179688, 0.024509429931640625, 0.025629043579101562, 0.0267486572265625, 0.027868270874023438, 0.028987884521484375, 0.030107498168945312, 0.03122711181640625, 0.03234672546386719, 0.033466339111328125, 0.03458595275878906, 0.03570556640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 0.0, 14.0, 13.0, 20.0, 22.0, 44.0, 84.0, 151.0, 413.0, 1744.0, 14324.0, 4142069.0, 31938.0, 2423.0, 561.0, 197.0, 96.0, 44.0, 25.0, 20.0, 17.0, 11.0, 14.0, 7.0, 4.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57861328125, -0.5603485107421875, -0.542083740234375, -0.5238189697265625, -0.50555419921875, -0.4872894287109375, -0.469024658203125, -0.4507598876953125, -0.4324951171875, -0.4142303466796875, -0.395965576171875, -0.3777008056640625, -0.35943603515625, -0.3411712646484375, -0.322906494140625, -0.3046417236328125, -0.286376953125, -0.2681121826171875, -0.249847412109375, -0.2315826416015625, -0.21331787109375, -0.1950531005859375, -0.176788330078125, -0.1585235595703125, -0.1402587890625, -0.1219940185546875, -0.103729248046875, -0.0854644775390625, -0.06719970703125, -0.0489349365234375, -0.030670166015625, -0.0124053955078125, 0.005859375, 0.0241241455078125, 0.042388916015625, 0.0606536865234375, 0.07891845703125, 0.0971832275390625, 0.115447998046875, 0.1337127685546875, 0.1519775390625, 0.1702423095703125, 0.188507080078125, 0.2067718505859375, 0.22503662109375, 0.2433013916015625, 0.261566162109375, 0.2798309326171875, 0.298095703125, 0.3163604736328125, 0.334625244140625, 0.3528900146484375, 0.37115478515625, 0.3894195556640625, 0.407684326171875, 0.4259490966796875, 0.4442138671875, 0.4624786376953125, 0.480743408203125, 0.4990081787109375, 0.51727294921875, 0.5355377197265625, 0.553802490234375, 0.5720672607421875, 0.59033203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 4.0, 3.0, 11.0, 6.0, 13.0, 11.0, 10.0, 8.0, 14.0, 14.0, 24.0, 40.0, 45.0, 3472.0, 228.0, 42.0, 26.0, 19.0, 20.0, 16.0, 7.0, 7.0, 8.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08392333984375, -0.08136558532714844, -0.07880783081054688, -0.07625007629394531, -0.07369232177734375, -0.07113456726074219, -0.06857681274414062, -0.06601905822753906, -0.0634613037109375, -0.06090354919433594, -0.058345794677734375, -0.05578804016113281, -0.05323028564453125, -0.05067253112792969, -0.048114776611328125, -0.04555702209472656, -0.042999267578125, -0.04044151306152344, -0.037883758544921875, -0.03532600402832031, -0.03276824951171875, -0.030210494995117188, -0.027652740478515625, -0.025094985961914062, -0.0225372314453125, -0.019979476928710938, -0.017421722412109375, -0.014863967895507812, -0.01230621337890625, -0.009748458862304688, -0.007190704345703125, -0.0046329498291015625, -0.0020751953125, 0.0004825592041015625, 0.003040313720703125, 0.0055980682373046875, 0.00815582275390625, 0.010713577270507812, 0.013271331787109375, 0.015829086303710938, 0.0183868408203125, 0.020944595336914062, 0.023502349853515625, 0.026060104370117188, 0.02861785888671875, 0.031175613403320312, 0.033733367919921875, 0.03629112243652344, 0.038848876953125, 0.04140663146972656, 0.043964385986328125, 0.04652214050292969, 0.04907989501953125, 0.05163764953613281, 0.054195404052734375, 0.05675315856933594, 0.0593109130859375, 0.06186866760253906, 0.06442642211914062, 0.06698417663574219, 0.06954193115234375, 0.07209968566894531, 0.07465744018554688, 0.07721519470214844, 0.07977294921875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 239.0, 774.0, 5.0], "bins": [-3.634164810180664, -3.5756020545959473, -3.5170395374298096, -3.4584767818450928, -3.399914264678955, -3.3413515090942383, -3.2827889919281006, -3.224226236343384, -3.165663719177246, -3.1071009635925293, -3.0485384464263916, -2.989975690841675, -2.931413173675537, -2.8728504180908203, -2.8142879009246826, -2.755725145339966, -2.697162628173828, -2.6385998725891113, -2.5800373554229736, -2.521474599838257, -2.462912082672119, -2.4043493270874023, -2.3457868099212646, -2.287224054336548, -2.22866153717041, -2.1700987815856934, -2.1115362644195557, -2.052973508834839, -1.9944109916687012, -1.935848355293274, -1.8772857189178467, -1.8187230825424194, -1.7601604461669922, -1.701597809791565, -1.6430351734161377, -1.5844725370407104, -1.5259099006652832, -1.467347264289856, -1.4087846279144287, -1.3502219915390015, -1.2916593551635742, -1.233096718788147, -1.1745340824127197, -1.1159714460372925, -1.0574088096618652, -0.998846173286438, -0.9402835369110107, -0.8817209005355835, -0.8231581449508667, -0.7645955085754395, -0.7060328722000122, -0.647470235824585, -0.5889075994491577, -0.5303449630737305, -0.47178229689598083, -0.4132196605205536, -0.35465705394744873, -0.2960944175720215, -0.23753178119659424, -0.1789691299200058, -0.12040649354457855, -0.06184384226799011, -0.003281205892562866, 0.05528143048286438, 0.11384406685829163]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 8.0, 12.0, 9.0, 12.0, 21.0, 34.0, 28.0, 41.0, 42.0, 45.0, 52.0, 50.0, 57.0, 50.0, 64.0, 50.0, 62.0, 45.0, 54.0, 62.0, 42.0, 30.0, 28.0, 29.0, 13.0, 11.0, 12.0, 7.0, 9.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.23556888103485107, -0.2282554805278778, -0.22094208002090454, -0.21362867951393127, -0.2063152939081192, -0.19900189340114594, -0.19168849289417267, -0.1843750923871994, -0.17706170678138733, -0.16974830627441406, -0.1624349057674408, -0.15512150526046753, -0.14780811965465546, -0.1404947191476822, -0.13318131864070892, -0.12586791813373566, -0.11855451762676239, -0.11124111711978912, -0.10392772406339645, -0.09661432355642319, -0.08930093050003052, -0.08198752999305725, -0.07467412948608398, -0.06736072897911072, -0.06004733592271805, -0.05273393914103508, -0.04542054235935211, -0.038107141852378845, -0.030793745070695877, -0.02348034828901291, -0.016166947782039642, -0.008853551000356674, -0.001540154218673706, 0.005773243494331837, 0.01308664120733738, 0.020400039851665497, 0.027713436633348465, 0.03502683341503143, 0.0423402339220047, 0.04965363070368767, 0.056967027485370636, 0.0642804279923439, 0.07159382104873657, 0.07890722155570984, 0.0862206220626831, 0.09353401511907578, 0.10084741562604904, 0.10816080868244171, 0.11547420918941498, 0.12278760969638824, 0.1301010102033615, 0.13741439580917358, 0.14472779631614685, 0.15204119682312012, 0.15935459733009338, 0.16666799783706665, 0.17398139834403992, 0.18129479885101318, 0.18860819935798645, 0.19592159986495972, 0.2032349854707718, 0.21054838597774506, 0.21786178648471832, 0.2251751869916916, 0.23248857259750366]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 2.0, 5.0, 8.0, 11.0, 9.0, 22.0, 29.0, 38.0, 46.0, 67.0, 97.0, 155.0, 206.0, 306.0, 380.0, 624.0, 990.0, 1500.0, 2370.0, 4369.0, 8777.0, 23098.0, 105017.0, 761661.0, 97966.0, 21523.0, 8328.0, 4204.0, 2272.0, 1443.0, 993.0, 632.0, 437.0, 273.0, 182.0, 126.0, 106.0, 89.0, 56.0, 47.0, 20.0, 28.0, 15.0, 9.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.166015625, -0.16074180603027344, -0.15546798706054688, -0.1501941680908203, -0.14492034912109375, -0.1396465301513672, -0.13437271118164062, -0.12909889221191406, -0.1238250732421875, -0.11855125427246094, -0.11327743530273438, -0.10800361633300781, -0.10272979736328125, -0.09745597839355469, -0.09218215942382812, -0.08690834045410156, -0.081634521484375, -0.07636070251464844, -0.07108688354492188, -0.06581306457519531, -0.06053924560546875, -0.05526542663574219, -0.049991607666015625, -0.04471778869628906, -0.0394439697265625, -0.03417015075683594, -0.028896331787109375, -0.023622512817382812, -0.01834869384765625, -0.013074874877929688, -0.007801055908203125, -0.0025272369384765625, 0.00274658203125, 0.008020401000976562, 0.013294219970703125, 0.018568038940429688, 0.02384185791015625, 0.029115676879882812, 0.034389495849609375, 0.03966331481933594, 0.0449371337890625, 0.05021095275878906, 0.055484771728515625, 0.06075859069824219, 0.06603240966796875, 0.07130622863769531, 0.07658004760742188, 0.08185386657714844, 0.087127685546875, 0.09240150451660156, 0.09767532348632812, 0.10294914245605469, 0.10822296142578125, 0.11349678039550781, 0.11877059936523438, 0.12404441833496094, 0.1293182373046875, 0.13459205627441406, 0.13986587524414062, 0.1451396942138672, 0.15041351318359375, 0.1556873321533203, 0.16096115112304688, 0.16623497009277344, 0.1715087890625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 5.0, 9.0, 17.0, 41.0, 57.0, 110.0, 139.0, 143.0, 129.0, 107.0, 57.0, 45.0, 27.0, 23.0, 8.0, 8.0, 5.0, 8.0, 8.0, 5.0, 2.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0335693359375, -0.03258347511291504, -0.03159761428833008, -0.030611753463745117, -0.029625892639160156, -0.028640031814575195, -0.027654170989990234, -0.026668310165405273, -0.025682449340820312, -0.02469658851623535, -0.02371072769165039, -0.02272486686706543, -0.02173900604248047, -0.020753145217895508, -0.019767284393310547, -0.018781423568725586, -0.017795562744140625, -0.016809701919555664, -0.015823841094970703, -0.014837980270385742, -0.013852119445800781, -0.01286625862121582, -0.01188039779663086, -0.010894536972045898, -0.009908676147460938, -0.008922815322875977, -0.007936954498291016, -0.006951093673706055, -0.005965232849121094, -0.004979372024536133, -0.003993511199951172, -0.003007650375366211, -0.00202178955078125, -0.001035928726196289, -5.0067901611328125e-05, 0.0009357929229736328, 0.0019216537475585938, 0.0029075145721435547, 0.0038933753967285156, 0.0048792362213134766, 0.0058650970458984375, 0.0068509578704833984, 0.00783681869506836, 0.00882267951965332, 0.009808540344238281, 0.010794401168823242, 0.011780261993408203, 0.012766122817993164, 0.013751983642578125, 0.014737844467163086, 0.015723705291748047, 0.016709566116333008, 0.01769542694091797, 0.01868128776550293, 0.01966714859008789, 0.02065300941467285, 0.021638870239257812, 0.022624731063842773, 0.023610591888427734, 0.024596452713012695, 0.025582313537597656, 0.026568174362182617, 0.027554035186767578, 0.02853989601135254, 0.0295257568359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 8.0, 14.0, 23.0, 16.0, 22.0, 40.0, 38.0, 56.0, 73.0, 121.0, 154.0, 298.0, 728.0, 1957.0, 9024.0, 831282.0, 196166.0, 5606.0, 1507.0, 609.0, 256.0, 152.0, 106.0, 81.0, 58.0, 33.0, 29.0, 21.0, 16.0, 12.0, 8.0, 7.0, 8.0, 6.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4375, -0.4253082275390625, -0.413116455078125, -0.4009246826171875, -0.38873291015625, -0.3765411376953125, -0.364349365234375, -0.3521575927734375, -0.3399658203125, -0.3277740478515625, -0.315582275390625, -0.3033905029296875, -0.29119873046875, -0.2790069580078125, -0.266815185546875, -0.2546234130859375, -0.242431640625, -0.2302398681640625, -0.218048095703125, -0.2058563232421875, -0.19366455078125, -0.1814727783203125, -0.169281005859375, -0.1570892333984375, -0.1448974609375, -0.1327056884765625, -0.120513916015625, -0.1083221435546875, -0.09613037109375, -0.0839385986328125, -0.071746826171875, -0.0595550537109375, -0.04736328125, -0.0351715087890625, -0.022979736328125, -0.0107879638671875, 0.00140380859375, 0.0135955810546875, 0.025787353515625, 0.0379791259765625, 0.0501708984375, 0.0623626708984375, 0.074554443359375, 0.0867462158203125, 0.09893798828125, 0.1111297607421875, 0.123321533203125, 0.1355133056640625, 0.147705078125, 0.1598968505859375, 0.172088623046875, 0.1842803955078125, 0.19647216796875, 0.2086639404296875, 0.220855712890625, 0.2330474853515625, 0.2452392578125, 0.2574310302734375, 0.269622802734375, 0.2818145751953125, 0.29400634765625, 0.3061981201171875, 0.318389892578125, 0.3305816650390625, 0.3427734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 4.0, 4.0, 12.0, 16.0, 11.0, 19.0, 19.0, 23.0, 27.0, 46.0, 39.0, 45.0, 41.0, 39.0, 48.0, 43.0, 49.0, 58.0, 59.0, 60.0, 33.0, 33.0, 29.0, 38.0, 35.0, 28.0, 22.0, 25.0, 24.0, 15.0, 13.0, 11.0, 12.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10858154296875, -0.1049795150756836, -0.10137748718261719, -0.09777545928955078, -0.09417343139648438, -0.09057140350341797, -0.08696937561035156, -0.08336734771728516, -0.07976531982421875, -0.07616329193115234, -0.07256126403808594, -0.06895923614501953, -0.06535720825195312, -0.06175518035888672, -0.05815315246582031, -0.054551124572753906, -0.0509490966796875, -0.047347068786621094, -0.04374504089355469, -0.04014301300048828, -0.036540985107421875, -0.03293895721435547, -0.029336929321289062, -0.025734901428222656, -0.02213287353515625, -0.018530845642089844, -0.014928817749023438, -0.011326789855957031, -0.007724761962890625, -0.004122734069824219, -0.0005207061767578125, 0.0030813217163085938, 0.006683349609375, 0.010285377502441406, 0.013887405395507812, 0.01748943328857422, 0.021091461181640625, 0.02469348907470703, 0.028295516967773438, 0.031897544860839844, 0.03549957275390625, 0.039101600646972656, 0.04270362854003906, 0.04630565643310547, 0.049907684326171875, 0.05350971221923828, 0.05711174011230469, 0.060713768005371094, 0.0643157958984375, 0.0679178237915039, 0.07151985168457031, 0.07512187957763672, 0.07872390747070312, 0.08232593536376953, 0.08592796325683594, 0.08952999114990234, 0.09313201904296875, 0.09673404693603516, 0.10033607482910156, 0.10393810272216797, 0.10754013061523438, 0.11114215850830078, 0.11474418640136719, 0.1183462142944336, 0.1219482421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 1.0, 5.0, 1.0, 9.0, 12.0, 13.0, 13.0, 26.0, 47.0, 55.0, 115.0, 245.0, 708.0, 2798.0, 362112.0, 677929.0, 3195.0, 640.0, 278.0, 151.0, 66.0, 36.0, 23.0, 21.0, 8.0, 12.0, 3.0, 6.0, 7.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015228271484375, -0.014720916748046875, -0.01421356201171875, -0.013706207275390625, -0.0131988525390625, -0.012691497802734375, -0.01218414306640625, -0.011676788330078125, -0.01116943359375, -0.010662078857421875, -0.01015472412109375, -0.009647369384765625, -0.0091400146484375, -0.008632659912109375, -0.00812530517578125, -0.007617950439453125, -0.007110595703125, -0.006603240966796875, -0.00609588623046875, -0.005588531494140625, -0.0050811767578125, -0.004573822021484375, -0.00406646728515625, -0.003559112548828125, -0.0030517578125, -0.002544403076171875, -0.00203704833984375, -0.001529693603515625, -0.0010223388671875, -0.000514984130859375, -7.62939453125e-06, 0.000499725341796875, 0.001007080078125, 0.001514434814453125, 0.00202178955078125, 0.002529144287109375, 0.0030364990234375, 0.003543853759765625, 0.00405120849609375, 0.004558563232421875, 0.00506591796875, 0.005573272705078125, 0.00608062744140625, 0.006587982177734375, 0.0070953369140625, 0.007602691650390625, 0.00811004638671875, 0.008617401123046875, 0.009124755859375, 0.009632110595703125, 0.01013946533203125, 0.010646820068359375, 0.0111541748046875, 0.011661529541015625, 0.01216888427734375, 0.012676239013671875, 0.01318359375, 0.013690948486328125, 0.01419830322265625, 0.014705657958984375, 0.0152130126953125, 0.015720367431640625, 0.01622772216796875, 0.016735076904296875, 0.017242431640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 7.0, 0.0, 6.0, 6.0, 8.0, 11.0, 8.0, 8.0, 22.0, 18.0, 15.0, 30.0, 23.0, 45.0, 79.0, 85.0, 93.0, 92.0, 87.0, 72.0, 59.0, 53.0, 35.0, 34.0, 21.0, 24.0, 14.0, 16.0, 3.0, 9.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.279613494873047e-05, -4.143174737691879e-05, -4.006735980510712e-05, -3.870297223329544e-05, -3.7338584661483765e-05, -3.597419708967209e-05, -3.460980951786041e-05, -3.3245421946048737e-05, -3.188103437423706e-05, -3.0516646802425385e-05, -2.915225923061371e-05, -2.7787871658802032e-05, -2.6423484086990356e-05, -2.505909651517868e-05, -2.3694708943367004e-05, -2.233032137155533e-05, -2.0965933799743652e-05, -1.9601546227931976e-05, -1.82371586561203e-05, -1.6872771084308624e-05, -1.5508383512496948e-05, -1.4143995940685272e-05, -1.2779608368873596e-05, -1.141522079706192e-05, -1.0050833225250244e-05, -8.686445653438568e-06, -7.322058081626892e-06, -5.957670509815216e-06, -4.59328293800354e-06, -3.228895366191864e-06, -1.864507794380188e-06, -5.00120222568512e-07, 8.642673492431641e-07, 2.22865492105484e-06, 3.593042492866516e-06, 4.957430064678192e-06, 6.321817636489868e-06, 7.686205208301544e-06, 9.05059278011322e-06, 1.0414980351924896e-05, 1.1779367923736572e-05, 1.3143755495548248e-05, 1.4508143067359924e-05, 1.58725306391716e-05, 1.7236918210983276e-05, 1.8601305782794952e-05, 1.996569335460663e-05, 2.1330080926418304e-05, 2.269446849822998e-05, 2.4058856070041656e-05, 2.5423243641853333e-05, 2.678763121366501e-05, 2.8152018785476685e-05, 2.951640635728836e-05, 3.088079392910004e-05, 3.224518150091171e-05, 3.360956907272339e-05, 3.4973956644535065e-05, 3.633834421634674e-05, 3.770273178815842e-05, 3.906711935997009e-05, 4.043150693178177e-05, 4.1795894503593445e-05, 4.316028207540512e-05, 4.45246696472168e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 13.0, 16.0, 21.0, 35.0, 48.0, 74.0, 126.0, 289.0, 1016.0, 7942.0, 1025832.0, 11094.0, 1296.0, 352.0, 142.0, 79.0, 47.0, 34.0, 24.0, 15.0, 8.0, 13.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02947998046875, -0.028574228286743164, -0.027668476104736328, -0.026762723922729492, -0.025856971740722656, -0.02495121955871582, -0.024045467376708984, -0.02313971519470215, -0.022233963012695312, -0.021328210830688477, -0.02042245864868164, -0.019516706466674805, -0.01861095428466797, -0.017705202102661133, -0.016799449920654297, -0.01589369773864746, -0.014987945556640625, -0.014082193374633789, -0.013176441192626953, -0.012270689010620117, -0.011364936828613281, -0.010459184646606445, -0.00955343246459961, -0.008647680282592773, -0.0077419281005859375, -0.0068361759185791016, -0.005930423736572266, -0.00502467155456543, -0.004118919372558594, -0.003213167190551758, -0.002307415008544922, -0.001401662826538086, -0.00049591064453125, 0.00040984153747558594, 0.0013155937194824219, 0.002221345901489258, 0.0031270980834960938, 0.00403285026550293, 0.004938602447509766, 0.0058443546295166016, 0.0067501068115234375, 0.0076558589935302734, 0.00856161117553711, 0.009467363357543945, 0.010373115539550781, 0.011278867721557617, 0.012184619903564453, 0.013090372085571289, 0.013996124267578125, 0.014901876449584961, 0.015807628631591797, 0.016713380813598633, 0.01761913299560547, 0.018524885177612305, 0.01943063735961914, 0.020336389541625977, 0.021242141723632812, 0.02214789390563965, 0.023053646087646484, 0.02395939826965332, 0.024865150451660156, 0.025770902633666992, 0.026676654815673828, 0.027582406997680664, 0.0284881591796875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 6.0, 5.0, 6.0, 22.0, 16.0, 37.0, 103.0, 166.0, 292.0, 164.0, 83.0, 34.0, 28.0, 11.0, 6.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0108184814453125, -0.010473847389221191, -0.010129213333129883, -0.009784579277038574, -0.009439945220947266, -0.009095311164855957, -0.008750677108764648, -0.00840604305267334, -0.008061408996582031, -0.007716774940490723, -0.007372140884399414, -0.0070275068283081055, -0.006682872772216797, -0.006338238716125488, -0.00599360466003418, -0.005648970603942871, -0.0053043365478515625, -0.004959702491760254, -0.004615068435668945, -0.004270434379577637, -0.003925800323486328, -0.0035811662673950195, -0.003236532211303711, -0.0028918981552124023, -0.0025472640991210938, -0.002202630043029785, -0.0018579959869384766, -0.001513361930847168, -0.0011687278747558594, -0.0008240938186645508, -0.0004794597625732422, -0.0001348257064819336, 0.000209808349609375, 0.0005544424057006836, 0.0008990764617919922, 0.0012437105178833008, 0.0015883445739746094, 0.001932978630065918, 0.0022776126861572266, 0.002622246742248535, 0.0029668807983398438, 0.0033115148544311523, 0.003656148910522461, 0.0040007829666137695, 0.004345417022705078, 0.004690051078796387, 0.005034685134887695, 0.005379319190979004, 0.0057239532470703125, 0.006068587303161621, 0.00641322135925293, 0.006757855415344238, 0.007102489471435547, 0.0074471235275268555, 0.007791757583618164, 0.008136391639709473, 0.008481025695800781, 0.00882565975189209, 0.009170293807983398, 0.009514927864074707, 0.009859561920166016, 0.010204195976257324, 0.010548830032348633, 0.010893464088439941, 0.01123809814453125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 68.0, 924.0, 21.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.005024909973145, -7.865721225738525, -7.726417541503906, -7.587113857269287, -7.447810173034668, -7.308506488800049, -7.16920280456543, -7.029898643493652, -6.890595436096191, -6.751291751861572, -6.611988067626953, -6.472684383392334, -6.333380699157715, -6.194077014923096, -6.054773330688477, -5.915469169616699, -5.77616548538208, -5.636861801147461, -5.497558116912842, -5.358254432678223, -5.2189507484436035, -5.079647064208984, -4.940343379974365, -4.801039695739746, -4.661735534667969, -4.52243185043335, -4.3831281661987305, -4.243824481964111, -4.104520797729492, -3.965217113494873, -3.825913190841675, -3.6866095066070557, -3.547306537628174, -3.4080028533935547, -3.2686991691589355, -3.1293954849243164, -2.9900918006896973, -2.850788116455078, -2.71148419380188, -2.5721805095672607, -2.4328765869140625, -2.2935729026794434, -2.154269218444824, -2.014965534210205, -1.8756617307662964, -1.7363580465316772, -1.5970542430877686, -1.4577505588531494, -1.3184469938278198, -1.1791433095932007, -1.039839506149292, -0.9005358219146729, -0.7612321376800537, -0.6219284534454346, -0.48262470960617065, -0.34332096576690674, -0.2040172815322876, -0.06471356749534607, 0.07459014654159546, 0.213893860578537, 0.3531975746154785, 0.49250125885009766, 0.6318050026893616, 0.7711087465286255, 0.9104124307632446]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 7.0, 3.0, 8.0, 13.0, 16.0, 15.0, 11.0, 17.0, 25.0, 27.0, 30.0, 24.0, 34.0, 38.0, 34.0, 47.0, 33.0, 59.0, 54.0, 38.0, 44.0, 39.0, 44.0, 37.0, 24.0, 32.0, 33.0, 28.0, 29.0, 23.0, 23.0, 18.0, 14.0, 12.0, 9.0, 8.0, 10.0, 7.0, 6.0, 3.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.6520004868507385, -0.6329001784324646, -0.6137998700141907, -0.5946995615959167, -0.5755993127822876, -0.5564990043640137, -0.5373986959457397, -0.5182983875274658, -0.4991980791091919, -0.48009777069091797, -0.46099746227264404, -0.4418971836566925, -0.4227968752384186, -0.40369656682014465, -0.3845962882041931, -0.3654959797859192, -0.34639567136764526, -0.32729536294937134, -0.3081950545310974, -0.2890947759151459, -0.26999446749687195, -0.250894159078598, -0.2317938655614853, -0.21269357204437256, -0.19359326362609863, -0.1744929552078247, -0.15539266169071198, -0.13629236817359924, -0.11719205975532532, -0.09809175878763199, -0.07899145781993866, -0.05989116430282593, -0.040790855884552, -0.021690554916858673, -0.0025902539491653442, 0.016510047018527985, 0.035610347986221313, 0.05471064895391464, 0.07381094992160797, 0.0929112434387207, 0.11201155185699463, 0.13111186027526855, 0.1502121537923813, 0.16931244730949402, 0.18841275572776794, 0.20751306414604187, 0.2266133576631546, 0.24571365118026733, 0.26481395959854126, 0.2839142680168152, 0.3030145764350891, 0.32211485505104065, 0.3412151634693146, 0.3603154718875885, 0.37941575050354004, 0.39851605892181396, 0.4176163673400879, 0.4367166757583618, 0.45581698417663574, 0.4749172627925873, 0.4940175712108612, 0.5131178498268127, 0.5322181582450867, 0.5513184666633606, 0.5704187750816345]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 5.0, 10.0, 16.0, 23.0, 41.0, 61.0, 120.0, 257.0, 720.0, 5805.0, 4182173.0, 3808.0, 637.0, 247.0, 113.0, 81.0, 40.0, 26.0, 19.0, 13.0, 7.0, 9.0, 8.0, 7.0, 4.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.467529296875, -0.4531059265136719, -0.43868255615234375, -0.4242591857910156, -0.4098358154296875, -0.3954124450683594, -0.38098907470703125, -0.3665657043457031, -0.352142333984375, -0.3377189636230469, -0.32329559326171875, -0.3088722229003906, -0.2944488525390625, -0.2800254821777344, -0.26560211181640625, -0.2511787414550781, -0.23675537109375, -0.22233200073242188, -0.20790863037109375, -0.19348526000976562, -0.1790618896484375, -0.16463851928710938, -0.15021514892578125, -0.13579177856445312, -0.121368408203125, -0.10694503784179688, -0.09252166748046875, -0.07809829711914062, -0.0636749267578125, -0.049251556396484375, -0.03482818603515625, -0.020404815673828125, -0.0059814453125, 0.008441925048828125, 0.02286529541015625, 0.037288665771484375, 0.0517120361328125, 0.06613540649414062, 0.08055877685546875, 0.09498214721679688, 0.109405517578125, 0.12382888793945312, 0.13825225830078125, 0.15267562866210938, 0.1670989990234375, 0.18152236938476562, 0.19594573974609375, 0.21036911010742188, 0.22479248046875, 0.23921585083007812, 0.25363922119140625, 0.2680625915527344, 0.2824859619140625, 0.2969093322753906, 0.31133270263671875, 0.3257560729980469, 0.340179443359375, 0.3546028137207031, 0.36902618408203125, 0.3834495544433594, 0.3978729248046875, 0.4122962951660156, 0.42671966552734375, 0.4411430358886719, 0.45556640625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 3.0, 5.0, 14.0, 16.0, 26.0, 32.0, 62.0, 93.0, 114.0, 131.0, 116.0, 89.0, 70.0, 69.0, 31.0, 33.0, 14.0, 12.0, 9.0, 4.0, 6.0, 7.0, 7.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0292816162109375, -0.028374433517456055, -0.02746725082397461, -0.026560068130493164, -0.02565288543701172, -0.024745702743530273, -0.023838520050048828, -0.022931337356567383, -0.022024154663085938, -0.021116971969604492, -0.020209789276123047, -0.0193026065826416, -0.018395423889160156, -0.01748824119567871, -0.016581058502197266, -0.01567387580871582, -0.014766693115234375, -0.01385951042175293, -0.012952327728271484, -0.012045145034790039, -0.011137962341308594, -0.010230779647827148, -0.009323596954345703, -0.008416414260864258, -0.0075092315673828125, -0.006602048873901367, -0.005694866180419922, -0.0047876834869384766, -0.0038805007934570312, -0.002973318099975586, -0.0020661354064941406, -0.0011589527130126953, -0.00025177001953125, 0.0006554126739501953, 0.0015625953674316406, 0.002469778060913086, 0.0033769607543945312, 0.0042841434478759766, 0.005191326141357422, 0.006098508834838867, 0.0070056915283203125, 0.007912874221801758, 0.008820056915283203, 0.009727239608764648, 0.010634422302246094, 0.011541604995727539, 0.012448787689208984, 0.01335597038269043, 0.014263153076171875, 0.01517033576965332, 0.016077518463134766, 0.01698470115661621, 0.017891883850097656, 0.0187990665435791, 0.019706249237060547, 0.020613431930541992, 0.021520614624023438, 0.022427797317504883, 0.023334980010986328, 0.024242162704467773, 0.02514934539794922, 0.026056528091430664, 0.02696371078491211, 0.027870893478393555, 0.028778076171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 5.0, 8.0, 13.0, 16.0, 25.0, 61.0, 106.0, 332.0, 1121.0, 7589.0, 4140858.0, 39710.0, 3214.0, 793.0, 218.0, 84.0, 33.0, 23.0, 13.0, 11.0, 8.0, 11.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.304443359375, -0.29456329345703125, -0.2846832275390625, -0.27480316162109375, -0.264923095703125, -0.25504302978515625, -0.2451629638671875, -0.23528289794921875, -0.22540283203125, -0.21552276611328125, -0.2056427001953125, -0.19576263427734375, -0.185882568359375, -0.17600250244140625, -0.1661224365234375, -0.15624237060546875, -0.1463623046875, -0.13648223876953125, -0.1266021728515625, -0.11672210693359375, -0.106842041015625, -0.09696197509765625, -0.0870819091796875, -0.07720184326171875, -0.06732177734375, -0.05744171142578125, -0.0475616455078125, -0.03768157958984375, -0.027801513671875, -0.01792144775390625, -0.0080413818359375, 0.00183868408203125, 0.01171875, 0.02159881591796875, 0.0314788818359375, 0.04135894775390625, 0.051239013671875, 0.06111907958984375, 0.0709991455078125, 0.08087921142578125, 0.09075927734375, 0.10063934326171875, 0.1105194091796875, 0.12039947509765625, 0.130279541015625, 0.14015960693359375, 0.1500396728515625, 0.15991973876953125, 0.1697998046875, 0.17967987060546875, 0.1895599365234375, 0.19944000244140625, 0.209320068359375, 0.21920013427734375, 0.2290802001953125, 0.23896026611328125, 0.24884033203125, 0.25872039794921875, 0.2686004638671875, 0.27848052978515625, 0.288360595703125, 0.29824066162109375, 0.3081207275390625, 0.31800079345703125, 0.327880859375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 4.0, 7.0, 5.0, 7.0, 7.0, 11.0, 25.0, 31.0, 175.0, 3645.0, 67.0, 11.0, 12.0, 10.0, 10.0, 5.0, 2.0, 7.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.053619384765625, -0.0519556999206543, -0.050292015075683594, -0.04862833023071289, -0.04696464538574219, -0.045300960540771484, -0.04363727569580078, -0.04197359085083008, -0.040309906005859375, -0.03864622116088867, -0.03698253631591797, -0.035318851470947266, -0.03365516662597656, -0.03199148178100586, -0.030327796936035156, -0.028664112091064453, -0.02700042724609375, -0.025336742401123047, -0.023673057556152344, -0.02200937271118164, -0.020345687866210938, -0.018682003021240234, -0.01701831817626953, -0.015354633331298828, -0.013690948486328125, -0.012027263641357422, -0.010363578796386719, -0.008699893951416016, -0.0070362091064453125, -0.005372524261474609, -0.0037088394165039062, -0.002045154571533203, -0.0003814697265625, 0.0012822151184082031, 0.0029458999633789062, 0.004609584808349609, 0.0062732696533203125, 0.007936954498291016, 0.009600639343261719, 0.011264324188232422, 0.012928009033203125, 0.014591693878173828, 0.01625537872314453, 0.017919063568115234, 0.019582748413085938, 0.02124643325805664, 0.022910118103027344, 0.024573802947998047, 0.02623748779296875, 0.027901172637939453, 0.029564857482910156, 0.03122854232788086, 0.03289222717285156, 0.034555912017822266, 0.03621959686279297, 0.03788328170776367, 0.039546966552734375, 0.04121065139770508, 0.04287433624267578, 0.044538021087646484, 0.04620170593261719, 0.04786539077758789, 0.049529075622558594, 0.0511927604675293, 0.0528564453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 1006.0, 6.0], "bins": [-4.4444966316223145, -4.373301029205322, -4.30210542678833, -4.230909824371338, -4.159714221954346, -4.0885186195373535, -4.017323017120361, -3.9461276531219482, -3.874932050704956, -3.803736448287964, -3.7325408458709717, -3.6613452434539795, -3.5901498794555664, -3.518954277038574, -3.447758674621582, -3.37656307220459, -3.3053674697875977, -3.2341718673706055, -3.1629762649536133, -3.091780662536621, -3.020585060119629, -2.949389696121216, -2.8781940937042236, -2.8069984912872314, -2.7358028888702393, -2.664607286453247, -2.593411684036255, -2.5222160816192627, -2.4510207176208496, -2.3798251152038574, -2.3086295127868652, -2.237433910369873, -2.166238307952881, -2.0950427055358887, -2.0238471031188965, -1.9526516199111938, -1.8814560174942017, -1.8102604150772095, -1.7390649318695068, -1.6678693294525146, -1.596673846244812, -1.5254782438278198, -1.4542827606201172, -1.383087158203125, -1.3118915557861328, -1.2406959533691406, -1.1695003509521484, -1.0983048677444458, -1.0271092653274536, -0.9559136629104614, -0.884718120098114, -0.8135225772857666, -0.7423269748687744, -0.6711313724517822, -0.5999358296394348, -0.5287402868270874, -0.45754462480545044, -0.38634905219078064, -0.31515347957611084, -0.24395790696144104, -0.17276233434677124, -0.10156676173210144, -0.03037118911743164, 0.04082438349723816, 0.11201994866132736]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 13.0, 6.0, 8.0, 17.0, 21.0, 20.0, 15.0, 26.0, 38.0, 38.0, 38.0, 54.0, 54.0, 53.0, 54.0, 64.0, 53.0, 49.0, 73.0, 45.0, 45.0, 44.0, 36.0, 38.0, 17.0, 18.0, 15.0, 19.0, 10.0, 6.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1196402907371521, -0.11546975374221802, -0.11129921674728394, -0.10712868720293045, -0.10295815020799637, -0.09878761321306229, -0.0946170836687088, -0.09044654667377472, -0.08627600967884064, -0.08210547268390656, -0.07793493568897247, -0.07376440614461899, -0.0695938691496849, -0.06542333215475082, -0.06125279888510704, -0.05708226561546326, -0.052911728620529175, -0.04874119162559509, -0.04457065835595131, -0.040400125086307526, -0.036229588091373444, -0.03205905109643936, -0.027888517826795578, -0.023717982694506645, -0.019547447562217712, -0.01537691242992878, -0.011206377297639847, -0.007035842165350914, -0.002865307033061981, 0.0013052280992269516, 0.005475763231515884, 0.009646298363804817, 0.01381683349609375, 0.017987368628382683, 0.022157903760671616, 0.02632843889296055, 0.03049897402524948, 0.03466951102018356, 0.03884004428982735, 0.04301057755947113, 0.04718111455440521, 0.051351651549339294, 0.05552218481898308, 0.05969271808862686, 0.06386325508356094, 0.06803379207849503, 0.07220432162284851, 0.07637485861778259, 0.08054539561271667, 0.08471593260765076, 0.08888646960258484, 0.09305699914693832, 0.0972275361418724, 0.10139807313680649, 0.10556860268115997, 0.10973913967609406, 0.11390967667102814, 0.11808021366596222, 0.1222507506608963, 0.12642128765583038, 0.13059180974960327, 0.13476234674453735, 0.13893288373947144, 0.14310342073440552, 0.1472739577293396]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 2.0, 6.0, 9.0, 6.0, 14.0, 25.0, 42.0, 43.0, 66.0, 76.0, 110.0, 177.0, 246.0, 368.0, 525.0, 786.0, 1252.0, 1976.0, 3369.0, 6215.0, 13042.0, 35114.0, 153241.0, 673946.0, 105207.0, 27963.0, 11116.0, 5448.0, 3006.0, 1753.0, 1129.0, 709.0, 503.0, 303.0, 214.0, 152.0, 110.0, 86.0, 52.0, 39.0, 25.0, 25.0, 17.0, 11.0, 9.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0775146484375, -0.07512187957763672, -0.07272911071777344, -0.07033634185791016, -0.06794357299804688, -0.0655508041381836, -0.06315803527832031, -0.06076526641845703, -0.05837249755859375, -0.05597972869873047, -0.05358695983886719, -0.051194190979003906, -0.048801422119140625, -0.046408653259277344, -0.04401588439941406, -0.04162311553955078, -0.0392303466796875, -0.03683757781982422, -0.03444480895996094, -0.032052040100097656, -0.029659271240234375, -0.027266502380371094, -0.024873733520507812, -0.02248096466064453, -0.02008819580078125, -0.01769542694091797, -0.015302658081054688, -0.012909889221191406, -0.010517120361328125, -0.008124351501464844, -0.0057315826416015625, -0.0033388137817382812, -0.000946044921875, 0.0014467239379882812, 0.0038394927978515625, 0.006232261657714844, 0.008625030517578125, 0.011017799377441406, 0.013410568237304688, 0.01580333709716797, 0.01819610595703125, 0.02058887481689453, 0.022981643676757812, 0.025374412536621094, 0.027767181396484375, 0.030159950256347656, 0.03255271911621094, 0.03494548797607422, 0.0373382568359375, 0.03973102569580078, 0.04212379455566406, 0.044516563415527344, 0.046909332275390625, 0.049302101135253906, 0.05169486999511719, 0.05408763885498047, 0.05648040771484375, 0.05887317657470703, 0.06126594543457031, 0.0636587142944336, 0.06605148315429688, 0.06844425201416016, 0.07083702087402344, 0.07322978973388672, 0.07562255859375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 6.0, 6.0, 2.0, 7.0, 11.0, 24.0, 22.0, 35.0, 54.0, 88.0, 112.0, 127.0, 124.0, 80.0, 80.0, 54.0, 48.0, 23.0, 22.0, 13.0, 11.0, 8.0, 3.0, 8.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.02813720703125, -0.027268648147583008, -0.026400089263916016, -0.025531530380249023, -0.02466297149658203, -0.02379441261291504, -0.022925853729248047, -0.022057294845581055, -0.021188735961914062, -0.02032017707824707, -0.019451618194580078, -0.018583059310913086, -0.017714500427246094, -0.0168459415435791, -0.01597738265991211, -0.015108823776245117, -0.014240264892578125, -0.013371706008911133, -0.01250314712524414, -0.011634588241577148, -0.010766029357910156, -0.009897470474243164, -0.009028911590576172, -0.00816035270690918, -0.0072917938232421875, -0.006423234939575195, -0.005554676055908203, -0.004686117172241211, -0.0038175582885742188, -0.0029489994049072266, -0.0020804405212402344, -0.0012118816375732422, -0.00034332275390625, 0.0005252361297607422, 0.0013937950134277344, 0.0022623538970947266, 0.0031309127807617188, 0.003999471664428711, 0.004868030548095703, 0.005736589431762695, 0.0066051483154296875, 0.00747370719909668, 0.008342266082763672, 0.009210824966430664, 0.010079383850097656, 0.010947942733764648, 0.01181650161743164, 0.012685060501098633, 0.013553619384765625, 0.014422178268432617, 0.01529073715209961, 0.0161592960357666, 0.017027854919433594, 0.017896413803100586, 0.018764972686767578, 0.01963353157043457, 0.020502090454101562, 0.021370649337768555, 0.022239208221435547, 0.02310776710510254, 0.02397632598876953, 0.024844884872436523, 0.025713443756103516, 0.026582002639770508, 0.0274505615234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 4.0, 4.0, 8.0, 10.0, 17.0, 5.0, 28.0, 24.0, 30.0, 43.0, 46.0, 48.0, 56.0, 91.0, 143.0, 285.0, 571.0, 1279.0, 3418.0, 32756.0, 957643.0, 45363.0, 3816.0, 1347.0, 626.0, 295.0, 170.0, 92.0, 72.0, 59.0, 44.0, 29.0, 25.0, 16.0, 20.0, 13.0, 11.0, 15.0, 5.0, 13.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2109375, -0.20425033569335938, -0.19756317138671875, -0.19087600708007812, -0.1841888427734375, -0.17750167846679688, -0.17081451416015625, -0.16412734985351562, -0.157440185546875, -0.15075302124023438, -0.14406585693359375, -0.13737869262695312, -0.1306915283203125, -0.12400436401367188, -0.11731719970703125, -0.11063003540039062, -0.10394287109375, -0.09725570678710938, -0.09056854248046875, -0.08388137817382812, -0.0771942138671875, -0.07050704956054688, -0.06381988525390625, -0.057132720947265625, -0.050445556640625, -0.043758392333984375, -0.03707122802734375, -0.030384063720703125, -0.0236968994140625, -0.017009735107421875, -0.01032257080078125, -0.003635406494140625, 0.0030517578125, 0.009738922119140625, 0.01642608642578125, 0.023113250732421875, 0.0298004150390625, 0.036487579345703125, 0.04317474365234375, 0.049861907958984375, 0.056549072265625, 0.06323623657226562, 0.06992340087890625, 0.07661056518554688, 0.0832977294921875, 0.08998489379882812, 0.09667205810546875, 0.10335922241210938, 0.11004638671875, 0.11673355102539062, 0.12342071533203125, 0.13010787963867188, 0.1367950439453125, 0.14348220825195312, 0.15016937255859375, 0.15685653686523438, 0.163543701171875, 0.17023086547851562, 0.17691802978515625, 0.18360519409179688, 0.1902923583984375, 0.19697952270507812, 0.20366668701171875, 0.21035385131835938, 0.217041015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 10.0, 8.0, 13.0, 12.0, 12.0, 11.0, 16.0, 21.0, 19.0, 28.0, 22.0, 29.0, 25.0, 40.0, 37.0, 40.0, 33.0, 50.0, 34.0, 43.0, 54.0, 54.0, 44.0, 36.0, 35.0, 25.0, 33.0, 28.0, 24.0, 18.0, 28.0, 19.0, 26.0, 16.0, 11.0, 10.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083984375, -0.0813741683959961, -0.07876396179199219, -0.07615375518798828, -0.07354354858398438, -0.07093334197998047, -0.06832313537597656, -0.06571292877197266, -0.06310272216796875, -0.060492515563964844, -0.05788230895996094, -0.05527210235595703, -0.052661895751953125, -0.05005168914794922, -0.04744148254394531, -0.044831275939941406, -0.0422210693359375, -0.039610862731933594, -0.03700065612792969, -0.03439044952392578, -0.031780242919921875, -0.02917003631591797, -0.026559829711914062, -0.023949623107910156, -0.02133941650390625, -0.018729209899902344, -0.016119003295898438, -0.013508796691894531, -0.010898590087890625, -0.008288383483886719, -0.0056781768798828125, -0.0030679702758789062, -0.000457763671875, 0.0021524429321289062, 0.0047626495361328125, 0.007372856140136719, 0.009983062744140625, 0.012593269348144531, 0.015203475952148438, 0.017813682556152344, 0.02042388916015625, 0.023034095764160156, 0.025644302368164062, 0.02825450897216797, 0.030864715576171875, 0.03347492218017578, 0.03608512878417969, 0.038695335388183594, 0.0413055419921875, 0.043915748596191406, 0.04652595520019531, 0.04913616180419922, 0.051746368408203125, 0.05435657501220703, 0.05696678161621094, 0.059576988220214844, 0.06218719482421875, 0.06479740142822266, 0.06740760803222656, 0.07001781463623047, 0.07262802124023438, 0.07523822784423828, 0.07784843444824219, 0.0804586410522461, 0.08306884765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 7.0, 4.0, 2.0, 3.0, 9.0, 5.0, 7.0, 14.0, 30.0, 32.0, 42.0, 71.0, 160.0, 382.0, 1724.0, 40426.0, 999745.0, 4657.0, 695.0, 222.0, 103.0, 63.0, 31.0, 24.0, 23.0, 12.0, 17.0, 9.0, 11.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01221466064453125, -0.011835575103759766, -0.011456489562988281, -0.011077404022216797, -0.010698318481445312, -0.010319232940673828, -0.009940147399902344, -0.00956106185913086, -0.009181976318359375, -0.00880289077758789, -0.008423805236816406, -0.008044719696044922, -0.0076656341552734375, -0.007286548614501953, -0.006907463073730469, -0.006528377532958984, -0.0061492919921875, -0.005770206451416016, -0.005391120910644531, -0.005012035369873047, -0.0046329498291015625, -0.004253864288330078, -0.0038747787475585938, -0.0034956932067871094, -0.003116607666015625, -0.0027375221252441406, -0.0023584365844726562, -0.001979351043701172, -0.0016002655029296875, -0.0012211799621582031, -0.0008420944213867188, -0.0004630088806152344, -8.392333984375e-05, 0.0002951622009277344, 0.0006742477416992188, 0.0010533332824707031, 0.0014324188232421875, 0.0018115043640136719, 0.0021905899047851562, 0.0025696754455566406, 0.002948760986328125, 0.0033278465270996094, 0.0037069320678710938, 0.004086017608642578, 0.0044651031494140625, 0.004844188690185547, 0.005223274230957031, 0.005602359771728516, 0.0059814453125, 0.006360530853271484, 0.006739616394042969, 0.007118701934814453, 0.0074977874755859375, 0.007876873016357422, 0.008255958557128906, 0.00863504409790039, 0.009014129638671875, 0.00939321517944336, 0.009772300720214844, 0.010151386260986328, 0.010530471801757812, 0.010909557342529297, 0.011288642883300781, 0.011667728424072266, 0.01204681396484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 4.0, 4.0, 4.0, 10.0, 11.0, 13.0, 15.0, 13.0, 13.0, 27.0, 31.0, 29.0, 30.0, 67.0, 96.0, 143.0, 148.0, 72.0, 46.0, 37.0, 35.0, 30.0, 15.0, 17.0, 12.0, 8.0, 15.0, 12.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.166364669799805e-05, -4.0261074900627136e-05, -3.8858503103256226e-05, -3.7455931305885315e-05, -3.6053359508514404e-05, -3.4650787711143494e-05, -3.324821591377258e-05, -3.184564411640167e-05, -3.0443072319030762e-05, -2.904050052165985e-05, -2.763792872428894e-05, -2.623535692691803e-05, -2.483278512954712e-05, -2.343021333217621e-05, -2.2027641534805298e-05, -2.0625069737434387e-05, -1.9222497940063477e-05, -1.7819926142692566e-05, -1.6417354345321655e-05, -1.5014782547950745e-05, -1.3612210750579834e-05, -1.2209638953208923e-05, -1.0807067155838013e-05, -9.404495358467102e-06, -8.001923561096191e-06, -6.599351763725281e-06, -5.19677996635437e-06, -3.7942081689834595e-06, -2.391636371612549e-06, -9.890645742416382e-07, 4.1350722312927246e-07, 1.816079020500183e-06, 3.2186508178710938e-06, 4.621222615242004e-06, 6.023794412612915e-06, 7.426366209983826e-06, 8.828938007354736e-06, 1.0231509804725647e-05, 1.1634081602096558e-05, 1.3036653399467468e-05, 1.4439225196838379e-05, 1.584179699420929e-05, 1.72443687915802e-05, 1.864694058895111e-05, 2.004951238632202e-05, 2.1452084183692932e-05, 2.2854655981063843e-05, 2.4257227778434753e-05, 2.5659799575805664e-05, 2.7062371373176575e-05, 2.8464943170547485e-05, 2.9867514967918396e-05, 3.127008676528931e-05, 3.267265856266022e-05, 3.407523036003113e-05, 3.547780215740204e-05, 3.688037395477295e-05, 3.828294575214386e-05, 3.968551754951477e-05, 4.108808934688568e-05, 4.249066114425659e-05, 4.38932329416275e-05, 4.529580473899841e-05, 4.6698376536369324e-05, 4.8100948333740234e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 7.0, 11.0, 10.0, 13.0, 18.0, 44.0, 48.0, 134.0, 291.0, 1058.0, 15970.0, 1025587.0, 4264.0, 648.0, 210.0, 99.0, 47.0, 28.0, 18.0, 13.0, 5.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.035614013671875, -0.034708261489868164, -0.03380250930786133, -0.03289675712585449, -0.031991004943847656, -0.03108525276184082, -0.030179500579833984, -0.02927374839782715, -0.028367996215820312, -0.027462244033813477, -0.02655649185180664, -0.025650739669799805, -0.02474498748779297, -0.023839235305786133, -0.022933483123779297, -0.02202773094177246, -0.021121978759765625, -0.02021622657775879, -0.019310474395751953, -0.018404722213745117, -0.01749897003173828, -0.016593217849731445, -0.01568746566772461, -0.014781713485717773, -0.013875961303710938, -0.012970209121704102, -0.012064456939697266, -0.01115870475769043, -0.010252952575683594, -0.009347200393676758, -0.008441448211669922, -0.007535696029663086, -0.00662994384765625, -0.005724191665649414, -0.004818439483642578, -0.003912687301635742, -0.0030069351196289062, -0.0021011829376220703, -0.0011954307556152344, -0.00028967857360839844, 0.0006160736083984375, 0.0015218257904052734, 0.0024275779724121094, 0.0033333301544189453, 0.004239082336425781, 0.005144834518432617, 0.006050586700439453, 0.006956338882446289, 0.007862091064453125, 0.008767843246459961, 0.009673595428466797, 0.010579347610473633, 0.011485099792480469, 0.012390851974487305, 0.01329660415649414, 0.014202356338500977, 0.015108108520507812, 0.01601386070251465, 0.016919612884521484, 0.01782536506652832, 0.018731117248535156, 0.019636869430541992, 0.020542621612548828, 0.021448373794555664, 0.0223541259765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 7.0, 9.0, 4.0, 16.0, 27.0, 47.0, 97.0, 190.0, 245.0, 135.0, 81.0, 45.0, 21.0, 14.0, 11.0, 8.0, 4.0, 8.0, 4.0, 5.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008636474609375, -0.00829458236694336, -0.007952690124511719, -0.007610797882080078, -0.0072689056396484375, -0.006927013397216797, -0.006585121154785156, -0.006243228912353516, -0.005901336669921875, -0.005559444427490234, -0.005217552185058594, -0.004875659942626953, -0.0045337677001953125, -0.004191875457763672, -0.0038499832153320312, -0.0035080909729003906, -0.00316619873046875, -0.0028243064880371094, -0.0024824142456054688, -0.002140522003173828, -0.0017986297607421875, -0.0014567375183105469, -0.0011148452758789062, -0.0007729530334472656, -0.000431060791015625, -8.916854858398438e-05, 0.00025272369384765625, 0.0005946159362792969, 0.0009365081787109375, 0.0012784004211425781, 0.0016202926635742188, 0.0019621849060058594, 0.0023040771484375, 0.0026459693908691406, 0.0029878616333007812, 0.003329753875732422, 0.0036716461181640625, 0.004013538360595703, 0.004355430603027344, 0.004697322845458984, 0.005039215087890625, 0.005381107330322266, 0.005722999572753906, 0.006064891815185547, 0.0064067840576171875, 0.006748676300048828, 0.007090568542480469, 0.007432460784912109, 0.00777435302734375, 0.00811624526977539, 0.008458137512207031, 0.008800029754638672, 0.009141921997070312, 0.009483814239501953, 0.009825706481933594, 0.010167598724365234, 0.010509490966796875, 0.010851383209228516, 0.011193275451660156, 0.011535167694091797, 0.011877059936523438, 0.012218952178955078, 0.012560844421386719, 0.01290273666381836, 0.01324462890625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 21.0, 208.0, 734.0, 46.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.108874797821045, -3.05159592628479, -2.994317054748535, -2.9370384216308594, -2.8797595500946045, -2.8224806785583496, -2.765202045440674, -2.707923173904419, -2.650644302368164, -2.593365430831909, -2.5360865592956543, -2.4788079261779785, -2.4215290546417236, -2.3642501831054688, -2.306971549987793, -2.249692678451538, -2.192413806915283, -2.1351349353790283, -2.0778560638427734, -2.0205774307250977, -1.9632985591888428, -1.906019687652588, -1.8487409353256226, -1.7914621829986572, -1.7341833114624023, -1.6769044399261475, -1.6196256875991821, -1.5623469352722168, -1.505068063735962, -1.447789192199707, -1.3905104398727417, -1.3332316875457764, -1.275952696800232, -1.2186739444732666, -1.1613950729370117, -1.1041162014007568, -1.0468374490737915, -0.9895586371421814, -0.9322798252105713, -0.8750010132789612, -0.8177222013473511, -0.760443389415741, -0.7031645774841309, -0.6458857655525208, -0.5886069536209106, -0.5313281416893005, -0.47404932975769043, -0.4167705178260803, -0.3594917058944702, -0.3022128939628601, -0.24493408203125, -0.1876552700996399, -0.13037645816802979, -0.07309764623641968, -0.01581883430480957, 0.04145997762680054, 0.09873878955841064, 0.15601760149002075, 0.21329641342163086, 0.27057522535324097, 0.3278540372848511, 0.3851328492164612, 0.4424116611480713, 0.4996904730796814, 0.5569692850112915]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 8.0, 7.0, 12.0, 21.0, 13.0, 20.0, 11.0, 17.0, 27.0, 31.0, 28.0, 40.0, 45.0, 32.0, 45.0, 45.0, 54.0, 35.0, 41.0, 38.0, 53.0, 36.0, 34.0, 36.0, 29.0, 29.0, 33.0, 32.0, 25.0, 13.0, 17.0, 12.0, 11.0, 6.0, 10.0, 13.0, 4.0, 5.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4919113516807556, -0.4765775203704834, -0.46124371886253357, -0.44590988755226135, -0.43057605624198914, -0.4152422547340393, -0.3999084234237671, -0.3845745921134949, -0.36924076080322266, -0.35390692949295044, -0.3385731279850006, -0.3232392966747284, -0.3079054653644562, -0.29257166385650635, -0.27723783254623413, -0.2619040012359619, -0.2465701848268509, -0.23123636841773987, -0.21590253710746765, -0.20056872069835663, -0.1852348893880844, -0.1699010729789734, -0.15456724166870117, -0.13923342525959015, -0.12389960139989853, -0.10856577754020691, -0.09323195368051529, -0.07789812982082367, -0.06256431341171265, -0.04723048955202103, -0.03189666569232941, -0.016562841832637787, -0.001229017972946167, 0.014104804955422878, 0.029438627883791924, 0.044772449880838394, 0.060106273740530014, 0.07544009387493134, 0.09077391773462296, 0.10610774159431458, 0.1214415654540062, 0.13677538931369781, 0.15210920572280884, 0.16744303703308105, 0.18277685344219208, 0.1981106698513031, 0.21344450116157532, 0.22877833247184753, 0.24411214888095856, 0.2594459652900696, 0.2747797966003418, 0.290113627910614, 0.30544742941856384, 0.32078126072883606, 0.3361150920391083, 0.3514488935470581, 0.3667827248573303, 0.38211655616760254, 0.39745035767555237, 0.4127841889858246, 0.4281180202960968, 0.44345182180404663, 0.45878565311431885, 0.47411948442459106, 0.4894533157348633]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 6.0, 4.0, 5.0, 16.0, 21.0, 30.0, 42.0, 63.0, 112.0, 183.0, 806.0, 4191336.0, 1107.0, 227.0, 85.0, 71.0, 34.0, 23.0, 22.0, 16.0, 8.0, 10.0, 14.0, 6.0, 4.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.390625, -0.3782463073730469, -0.36586761474609375, -0.3534889221191406, -0.3411102294921875, -0.3287315368652344, -0.31635284423828125, -0.3039741516113281, -0.291595458984375, -0.2792167663574219, -0.26683807373046875, -0.2544593811035156, -0.2420806884765625, -0.22970199584960938, -0.21732330322265625, -0.20494461059570312, -0.19256591796875, -0.18018722534179688, -0.16780853271484375, -0.15542984008789062, -0.1430511474609375, -0.13067245483398438, -0.11829376220703125, -0.10591506958007812, -0.093536376953125, -0.08115768432617188, -0.06877899169921875, -0.056400299072265625, -0.0440216064453125, -0.031642913818359375, -0.01926422119140625, -0.006885528564453125, 0.0054931640625, 0.017871856689453125, 0.03025054931640625, 0.042629241943359375, 0.0550079345703125, 0.06738662719726562, 0.07976531982421875, 0.09214401245117188, 0.104522705078125, 0.11690139770507812, 0.12928009033203125, 0.14165878295898438, 0.1540374755859375, 0.16641616821289062, 0.17879486083984375, 0.19117355346679688, 0.20355224609375, 0.21593093872070312, 0.22830963134765625, 0.24068832397460938, 0.2530670166015625, 0.2654457092285156, 0.27782440185546875, 0.2902030944824219, 0.302581787109375, 0.3149604797363281, 0.32733917236328125, 0.3397178649902344, 0.3520965576171875, 0.3644752502441406, 0.37685394287109375, 0.3892326354980469, 0.401611328125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 4.0, 8.0, 26.0, 21.0, 38.0, 49.0, 81.0, 105.0, 99.0, 103.0, 90.0, 84.0, 69.0, 51.0, 28.0, 24.0, 16.0, 19.0, 8.0, 12.0, 14.0, 6.0, 6.0, 1.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.025146484375, -0.024355649948120117, -0.023564815521240234, -0.02277398109436035, -0.02198314666748047, -0.021192312240600586, -0.020401477813720703, -0.01961064338684082, -0.018819808959960938, -0.018028974533081055, -0.017238140106201172, -0.01644730567932129, -0.015656471252441406, -0.014865636825561523, -0.01407480239868164, -0.013283967971801758, -0.012493133544921875, -0.011702299118041992, -0.01091146469116211, -0.010120630264282227, -0.009329795837402344, -0.008538961410522461, -0.007748126983642578, -0.006957292556762695, -0.0061664581298828125, -0.00537562370300293, -0.004584789276123047, -0.003793954849243164, -0.0030031204223632812, -0.0022122859954833984, -0.0014214515686035156, -0.0006306171417236328, 0.00016021728515625, 0.0009510517120361328, 0.0017418861389160156, 0.0025327205657958984, 0.0033235549926757812, 0.004114389419555664, 0.004905223846435547, 0.00569605827331543, 0.0064868927001953125, 0.007277727127075195, 0.008068561553955078, 0.008859395980834961, 0.009650230407714844, 0.010441064834594727, 0.01123189926147461, 0.012022733688354492, 0.012813568115234375, 0.013604402542114258, 0.01439523696899414, 0.015186071395874023, 0.015976905822753906, 0.01676774024963379, 0.017558574676513672, 0.018349409103393555, 0.019140243530273438, 0.01993107795715332, 0.020721912384033203, 0.021512746810913086, 0.02230358123779297, 0.02309441566467285, 0.023885250091552734, 0.024676084518432617, 0.0254669189453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 5.0, 19.0, 38.0, 96.0, 238.0, 704.0, 2225.0, 13427.0, 4169797.0, 5771.0, 1334.0, 389.0, 113.0, 50.0, 28.0, 14.0, 11.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1220703125, -0.11850929260253906, -0.11494827270507812, -0.11138725280761719, -0.10782623291015625, -0.10426521301269531, -0.10070419311523438, -0.09714317321777344, -0.0935821533203125, -0.09002113342285156, -0.08646011352539062, -0.08289909362792969, -0.07933807373046875, -0.07577705383300781, -0.07221603393554688, -0.06865501403808594, -0.065093994140625, -0.06153297424316406, -0.057971954345703125, -0.05441093444824219, -0.05084991455078125, -0.04728889465332031, -0.043727874755859375, -0.04016685485839844, -0.0366058349609375, -0.03304481506347656, -0.029483795166015625, -0.025922775268554688, -0.02236175537109375, -0.018800735473632812, -0.015239715576171875, -0.011678695678710938, -0.00811767578125, -0.0045566558837890625, -0.000995635986328125, 0.0025653839111328125, 0.00612640380859375, 0.009687423706054688, 0.013248443603515625, 0.016809463500976562, 0.0203704833984375, 0.023931503295898438, 0.027492523193359375, 0.031053543090820312, 0.03461456298828125, 0.03817558288574219, 0.041736602783203125, 0.04529762268066406, 0.048858642578125, 0.05241966247558594, 0.055980682373046875, 0.05954170227050781, 0.06310272216796875, 0.06666374206542969, 0.07022476196289062, 0.07378578186035156, 0.0773468017578125, 0.08090782165527344, 0.08446884155273438, 0.08802986145019531, 0.09159088134765625, 0.09515190124511719, 0.09871292114257812, 0.10227394104003906, 0.1058349609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 10.0, 27.0, 139.0, 3774.0, 66.0, 23.0, 10.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0230255126953125, -0.022264480590820312, -0.021503448486328125, -0.020742416381835938, -0.01998138427734375, -0.019220352172851562, -0.018459320068359375, -0.017698287963867188, -0.016937255859375, -0.016176223754882812, -0.015415191650390625, -0.014654159545898438, -0.01389312744140625, -0.013132095336914062, -0.012371063232421875, -0.011610031127929688, -0.0108489990234375, -0.010087966918945312, -0.009326934814453125, -0.008565902709960938, -0.00780487060546875, -0.0070438385009765625, -0.006282806396484375, -0.0055217742919921875, -0.0047607421875, -0.0039997100830078125, -0.003238677978515625, -0.0024776458740234375, -0.00171661376953125, -0.0009555816650390625, -0.000194549560546875, 0.0005664825439453125, 0.0013275146484375, 0.0020885467529296875, 0.002849578857421875, 0.0036106109619140625, 0.00437164306640625, 0.0051326751708984375, 0.005893707275390625, 0.0066547393798828125, 0.007415771484375, 0.008176803588867188, 0.008937835693359375, 0.009698867797851562, 0.01045989990234375, 0.011220932006835938, 0.011981964111328125, 0.012742996215820312, 0.0135040283203125, 0.014265060424804688, 0.015026092529296875, 0.015787124633789062, 0.01654815673828125, 0.017309188842773438, 0.018070220947265625, 0.018831253051757812, 0.01959228515625, 0.020353317260742188, 0.021114349365234375, 0.021875381469726562, 0.02263641357421875, 0.023397445678710938, 0.024158477783203125, 0.024919509887695312, 0.0256805419921875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 26.0, 95.0, 664.0, 182.0, 23.0, 11.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02374577894806862, -0.021013734862208366, -0.018281690776348114, -0.015549646690487862, -0.01281760260462761, -0.010085558518767357, -0.0073535144329071045, -0.004621470347046852, -0.0018894262611865997, 0.0008426178246736526, 0.003574661910533905, 0.006306705996394157, 0.00903875008225441, 0.011770794168114662, 0.014502838253974915, 0.017234882339835167, 0.01996692642569542, 0.02269897051155567, 0.025431014597415924, 0.028163058683276176, 0.03089510276913643, 0.03362714499235153, 0.036359190940856934, 0.039091236889362335, 0.04182327911257744, 0.04455532133579254, 0.04728736728429794, 0.050019413232803345, 0.05275145545601845, 0.05548349767923355, 0.05821554362773895, 0.060947589576244354, 0.06367963552474976, 0.06641168147325516, 0.06914372742176056, 0.07187576591968536, 0.07460781186819077, 0.07733985781669617, 0.08007189631462097, 0.08280394226312637, 0.08553598821163177, 0.08826803416013718, 0.09100008010864258, 0.09373211860656738, 0.09646416455507278, 0.09919621050357819, 0.10192824900150299, 0.10466029495000839, 0.1073923408985138, 0.1101243868470192, 0.1128564327955246, 0.1155884712934494, 0.1183205172419548, 0.1210525631904602, 0.12378460168838501, 0.126516655087471, 0.1292486935853958, 0.13198073208332062, 0.13471278548240662, 0.13744482398033142, 0.14017686247825623, 0.14290891587734222, 0.14564095437526703, 0.14837300777435303, 0.15110504627227783]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 10.0, 12.0, 15.0, 19.0, 25.0, 24.0, 31.0, 31.0, 44.0, 38.0, 36.0, 76.0, 54.0, 55.0, 51.0, 53.0, 46.0, 56.0, 40.0, 35.0, 46.0, 32.0, 32.0, 38.0, 31.0, 12.0, 9.0, 12.0, 7.0, 2.0, 6.0, 0.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034337759017944336, -0.03314549848437309, -0.03195323795080185, -0.030760977417230606, -0.029568716883659363, -0.02837645635008812, -0.027184195816516876, -0.025991935282945633, -0.02479967474937439, -0.023607414215803146, -0.022415153682231903, -0.02122289314866066, -0.020030632615089417, -0.018838372081518173, -0.01764611154794693, -0.016453851014375687, -0.015261590480804443, -0.0140693299472332, -0.012877069413661957, -0.011684808880090714, -0.01049254834651947, -0.009300287812948227, -0.008108027279376984, -0.00691576674580574, -0.005723506212234497, -0.004531245678663254, -0.0033389851450920105, -0.002146724611520767, -0.0009544640779495239, 0.00023779645562171936, 0.0014300569891929626, 0.002622317522764206, 0.0038145780563354492, 0.0050068385899066925, 0.006199099123477936, 0.007391359657049179, 0.008583620190620422, 0.009775880724191666, 0.010968141257762909, 0.012160401791334152, 0.013352662324905396, 0.014544922858476639, 0.015737183392047882, 0.016929443925619125, 0.01812170445919037, 0.019313964992761612, 0.020506225526332855, 0.0216984860599041, 0.022890746593475342, 0.024083007127046585, 0.02527526766061783, 0.02646752819418907, 0.027659788727760315, 0.028852049261331558, 0.0300443097949028, 0.031236570328474045, 0.03242883086204529, 0.03362109139561653, 0.034813351929187775, 0.03600561246275902, 0.03719787299633026, 0.038390133529901505, 0.03958239406347275, 0.04077465459704399, 0.041966915130615234]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 10.0, 8.0, 15.0, 13.0, 19.0, 47.0, 47.0, 79.0, 118.0, 175.0, 273.0, 376.0, 635.0, 1032.0, 1763.0, 3183.0, 5731.0, 12789.0, 32893.0, 125702.0, 647680.0, 150027.0, 36870.0, 13889.0, 6707.0, 3441.0, 1830.0, 1136.0, 764.0, 473.0, 253.0, 188.0, 118.0, 86.0, 52.0, 42.0, 38.0, 17.0, 6.0, 10.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.052703857421875, -0.05108499526977539, -0.04946613311767578, -0.04784727096557617, -0.04622840881347656, -0.04460954666137695, -0.042990684509277344, -0.041371822357177734, -0.039752960205078125, -0.038134098052978516, -0.036515235900878906, -0.0348963737487793, -0.03327751159667969, -0.03165864944458008, -0.03003978729248047, -0.02842092514038086, -0.02680206298828125, -0.02518320083618164, -0.02356433868408203, -0.021945476531982422, -0.020326614379882812, -0.018707752227783203, -0.017088890075683594, -0.015470027923583984, -0.013851165771484375, -0.012232303619384766, -0.010613441467285156, -0.008994579315185547, -0.0073757171630859375, -0.005756855010986328, -0.004137992858886719, -0.0025191307067871094, -0.0009002685546875, 0.0007185935974121094, 0.0023374557495117188, 0.003956317901611328, 0.0055751800537109375, 0.007194042205810547, 0.008812904357910156, 0.010431766510009766, 0.012050628662109375, 0.013669490814208984, 0.015288352966308594, 0.016907215118408203, 0.018526077270507812, 0.020144939422607422, 0.02176380157470703, 0.02338266372680664, 0.02500152587890625, 0.02662038803100586, 0.02823925018310547, 0.029858112335205078, 0.03147697448730469, 0.0330958366394043, 0.034714698791503906, 0.036333560943603516, 0.037952423095703125, 0.039571285247802734, 0.041190147399902344, 0.04280900955200195, 0.04442787170410156, 0.04604673385620117, 0.04766559600830078, 0.04928445816040039, 0.0509033203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 5.0, 3.0, 8.0, 4.0, 5.0, 5.0, 15.0, 24.0, 30.0, 37.0, 60.0, 89.0, 104.0, 101.0, 96.0, 88.0, 82.0, 62.0, 48.0, 22.0, 20.0, 18.0, 15.0, 8.0, 14.0, 10.0, 8.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0245361328125, -0.02375626564025879, -0.022976398468017578, -0.022196531295776367, -0.021416664123535156, -0.020636796951293945, -0.019856929779052734, -0.019077062606811523, -0.018297195434570312, -0.0175173282623291, -0.01673746109008789, -0.01595759391784668, -0.015177726745605469, -0.014397859573364258, -0.013617992401123047, -0.012838125228881836, -0.012058258056640625, -0.011278390884399414, -0.010498523712158203, -0.009718656539916992, -0.008938789367675781, -0.00815892219543457, -0.007379055023193359, -0.0065991878509521484, -0.0058193206787109375, -0.0050394535064697266, -0.004259586334228516, -0.0034797191619873047, -0.0026998519897460938, -0.0019199848175048828, -0.0011401176452636719, -0.00036025047302246094, 0.00041961669921875, 0.001199483871459961, 0.001979351043701172, 0.002759218215942383, 0.0035390853881835938, 0.004318952560424805, 0.005098819732666016, 0.0058786869049072266, 0.0066585540771484375, 0.0074384212493896484, 0.00821828842163086, 0.00899815559387207, 0.009778022766113281, 0.010557889938354492, 0.011337757110595703, 0.012117624282836914, 0.012897491455078125, 0.013677358627319336, 0.014457225799560547, 0.015237092971801758, 0.01601696014404297, 0.01679682731628418, 0.01757669448852539, 0.0183565616607666, 0.019136428833007812, 0.019916296005249023, 0.020696163177490234, 0.021476030349731445, 0.022255897521972656, 0.023035764694213867, 0.023815631866455078, 0.02459549903869629, 0.0253753662109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 7.0, 12.0, 19.0, 11.0, 21.0, 19.0, 33.0, 41.0, 54.0, 55.0, 76.0, 119.0, 156.0, 253.0, 400.0, 556.0, 971.0, 1850.0, 4997.0, 28305.0, 606758.0, 371921.0, 23186.0, 4382.0, 1643.0, 916.0, 552.0, 352.0, 244.0, 156.0, 112.0, 86.0, 66.0, 36.0, 48.0, 27.0, 22.0, 19.0, 17.0, 12.0, 7.0, 6.0, 5.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09161376953125, -0.08844947814941406, -0.08528518676757812, -0.08212089538574219, -0.07895660400390625, -0.07579231262207031, -0.07262802124023438, -0.06946372985839844, -0.0662994384765625, -0.06313514709472656, -0.059970855712890625, -0.05680656433105469, -0.05364227294921875, -0.05047798156738281, -0.047313690185546875, -0.04414939880371094, -0.040985107421875, -0.03782081604003906, -0.034656524658203125, -0.03149223327636719, -0.02832794189453125, -0.025163650512695312, -0.021999359130859375, -0.018835067749023438, -0.0156707763671875, -0.012506484985351562, -0.009342193603515625, -0.0061779022216796875, -0.00301361083984375, 0.0001506805419921875, 0.003314971923828125, 0.0064792633056640625, 0.0096435546875, 0.012807846069335938, 0.015972137451171875, 0.019136428833007812, 0.02230072021484375, 0.025465011596679688, 0.028629302978515625, 0.03179359436035156, 0.0349578857421875, 0.03812217712402344, 0.041286468505859375, 0.04445075988769531, 0.04761505126953125, 0.05077934265136719, 0.053943634033203125, 0.05710792541503906, 0.060272216796875, 0.06343650817871094, 0.06660079956054688, 0.06976509094238281, 0.07292938232421875, 0.07609367370605469, 0.07925796508789062, 0.08242225646972656, 0.0855865478515625, 0.08875083923339844, 0.09191513061523438, 0.09507942199707031, 0.09824371337890625, 0.10140800476074219, 0.10457229614257812, 0.10773658752441406, 0.11090087890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 8.0, 10.0, 14.0, 14.0, 18.0, 18.0, 20.0, 26.0, 27.0, 33.0, 28.0, 30.0, 30.0, 35.0, 36.0, 52.0, 30.0, 42.0, 38.0, 39.0, 43.0, 36.0, 39.0, 26.0, 34.0, 27.0, 41.0, 26.0, 16.0, 25.0, 18.0, 19.0, 15.0, 13.0, 10.0, 10.0, 10.0, 8.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.07598876953125, -0.07383108139038086, -0.07167339324951172, -0.06951570510864258, -0.06735801696777344, -0.0652003288269043, -0.06304264068603516, -0.060884952545166016, -0.058727264404296875, -0.056569576263427734, -0.054411888122558594, -0.05225419998168945, -0.05009651184082031, -0.04793882369995117, -0.04578113555908203, -0.04362344741821289, -0.04146575927734375, -0.03930807113647461, -0.03715038299560547, -0.03499269485473633, -0.03283500671386719, -0.030677318572998047, -0.028519630432128906, -0.026361942291259766, -0.024204254150390625, -0.022046566009521484, -0.019888877868652344, -0.017731189727783203, -0.015573501586914062, -0.013415813446044922, -0.011258125305175781, -0.00910043716430664, -0.0069427490234375, -0.004785060882568359, -0.0026273727416992188, -0.0004696846008300781, 0.0016880035400390625, 0.003845691680908203, 0.006003379821777344, 0.008161067962646484, 0.010318756103515625, 0.012476444244384766, 0.014634132385253906, 0.016791820526123047, 0.018949508666992188, 0.021107196807861328, 0.02326488494873047, 0.02542257308959961, 0.02758026123046875, 0.02973794937133789, 0.03189563751220703, 0.03405332565307617, 0.03621101379394531, 0.03836870193481445, 0.040526390075683594, 0.042684078216552734, 0.044841766357421875, 0.046999454498291016, 0.049157142639160156, 0.0513148307800293, 0.05347251892089844, 0.05563020706176758, 0.05778789520263672, 0.05994558334350586, 0.062103271484375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 3.0, 2.0, 6.0, 4.0, 8.0, 9.0, 8.0, 25.0, 25.0, 21.0, 22.0, 27.0, 54.0, 70.0, 84.0, 123.0, 174.0, 314.0, 580.0, 1559.0, 5723.0, 52761.0, 949563.0, 30380.0, 4316.0, 1233.0, 558.0, 244.0, 176.0, 129.0, 85.0, 60.0, 51.0, 27.0, 27.0, 16.0, 21.0, 14.0, 10.0, 9.0, 7.0, 5.0, 7.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00449371337890625, -0.004359185695648193, -0.004224658012390137, -0.00409013032913208, -0.0039556026458740234, -0.003821074962615967, -0.00368654727935791, -0.0035520195960998535, -0.003417491912841797, -0.0032829642295837402, -0.0031484365463256836, -0.003013908863067627, -0.0028793811798095703, -0.0027448534965515137, -0.002610325813293457, -0.0024757981300354004, -0.0023412704467773438, -0.002206742763519287, -0.0020722150802612305, -0.0019376873970031738, -0.0018031597137451172, -0.0016686320304870605, -0.001534104347229004, -0.0013995766639709473, -0.0012650489807128906, -0.001130521297454834, -0.0009959936141967773, -0.0008614659309387207, -0.0007269382476806641, -0.0005924105644226074, -0.0004578828811645508, -0.00032335519790649414, -0.0001888275146484375, -5.429983139038086e-05, 8.022785186767578e-05, 0.00021475553512573242, 0.00034928321838378906, 0.0004838109016418457, 0.0006183385848999023, 0.000752866268157959, 0.0008873939514160156, 0.0010219216346740723, 0.001156449317932129, 0.0012909770011901855, 0.0014255046844482422, 0.0015600323677062988, 0.0016945600509643555, 0.0018290877342224121, 0.0019636154174804688, 0.0020981431007385254, 0.002232670783996582, 0.0023671984672546387, 0.0025017261505126953, 0.002636253833770752, 0.0027707815170288086, 0.0029053092002868652, 0.003039836883544922, 0.0031743645668029785, 0.003308892250061035, 0.003443419933319092, 0.0035779476165771484, 0.003712475299835205, 0.0038470029830932617, 0.003981530666351318, 0.004116058349609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 3.0, 3.0, 7.0, 7.0, 16.0, 22.0, 15.0, 27.0, 50.0, 66.0, 83.0, 162.0, 171.0, 106.0, 79.0, 38.0, 32.0, 30.0, 15.0, 14.0, 11.0, 7.0, 7.0, 3.0, 7.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.0558319091796875e-05, -5.8671459555625916e-05, -5.6784600019454956e-05, -5.4897740483283997e-05, -5.301088094711304e-05, -5.112402141094208e-05, -4.923716187477112e-05, -4.735030233860016e-05, -4.54634428024292e-05, -4.357658326625824e-05, -4.168972373008728e-05, -3.980286419391632e-05, -3.791600465774536e-05, -3.60291451215744e-05, -3.414228558540344e-05, -3.225542604923248e-05, -3.0368566513061523e-05, -2.8481706976890564e-05, -2.6594847440719604e-05, -2.4707987904548645e-05, -2.2821128368377686e-05, -2.0934268832206726e-05, -1.9047409296035767e-05, -1.7160549759864807e-05, -1.5273690223693848e-05, -1.3386830687522888e-05, -1.1499971151351929e-05, -9.61311161518097e-06, -7.72625207901001e-06, -5.83939254283905e-06, -3.952533006668091e-06, -2.0656734704971313e-06, -1.7881393432617188e-07, 1.7080456018447876e-06, 3.594905138015747e-06, 5.4817646741867065e-06, 7.368624210357666e-06, 9.255483746528625e-06, 1.1142343282699585e-05, 1.3029202818870544e-05, 1.4916062355041504e-05, 1.6802921891212463e-05, 1.8689781427383423e-05, 2.0576640963554382e-05, 2.2463500499725342e-05, 2.43503600358963e-05, 2.623721957206726e-05, 2.812407910823822e-05, 3.001093864440918e-05, 3.189779818058014e-05, 3.37846577167511e-05, 3.567151725292206e-05, 3.755837678909302e-05, 3.944523632526398e-05, 4.1332095861434937e-05, 4.3218955397605896e-05, 4.5105814933776855e-05, 4.6992674469947815e-05, 4.8879534006118774e-05, 5.0766393542289734e-05, 5.265325307846069e-05, 5.454011261463165e-05, 5.642697215080261e-05, 5.831383168697357e-05, 6.020069122314453e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 23.0, 14.0, 27.0, 31.0, 48.0, 62.0, 100.0, 177.0, 320.0, 719.0, 2729.0, 23573.0, 995007.0, 21240.0, 2796.0, 843.0, 319.0, 176.0, 93.0, 66.0, 43.0, 35.0, 30.0, 16.0, 10.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0117645263671875, -0.011423349380493164, -0.011082172393798828, -0.010740995407104492, -0.010399818420410156, -0.01005864143371582, -0.009717464447021484, -0.009376287460327148, -0.009035110473632812, -0.008693933486938477, -0.00835275650024414, -0.008011579513549805, -0.007670402526855469, -0.007329225540161133, -0.006988048553466797, -0.006646871566772461, -0.006305694580078125, -0.005964517593383789, -0.005623340606689453, -0.005282163619995117, -0.004940986633300781, -0.004599809646606445, -0.004258632659912109, -0.0039174556732177734, -0.0035762786865234375, -0.0032351016998291016, -0.0028939247131347656, -0.0025527477264404297, -0.0022115707397460938, -0.0018703937530517578, -0.0015292167663574219, -0.001188039779663086, -0.00084686279296875, -0.0005056858062744141, -0.00016450881958007812, 0.0001766681671142578, 0.0005178451538085938, 0.0008590221405029297, 0.0012001991271972656, 0.0015413761138916016, 0.0018825531005859375, 0.0022237300872802734, 0.0025649070739746094, 0.0029060840606689453, 0.0032472610473632812, 0.003588438034057617, 0.003929615020751953, 0.004270792007446289, 0.004611968994140625, 0.004953145980834961, 0.005294322967529297, 0.005635499954223633, 0.005976676940917969, 0.006317853927612305, 0.006659030914306641, 0.0070002079010009766, 0.0073413848876953125, 0.0076825618743896484, 0.008023738861083984, 0.00836491584777832, 0.008706092834472656, 0.009047269821166992, 0.009388446807861328, 0.009729623794555664, 0.01007080078125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 7.0, 6.0, 12.0, 21.0, 27.0, 28.0, 61.0, 91.0, 155.0, 202.0, 136.0, 65.0, 46.0, 23.0, 23.0, 17.0, 11.0, 4.0, 8.0, 6.0, 6.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0066375732421875, -0.0064125657081604, -0.006187558174133301, -0.005962550640106201, -0.0057375431060791016, -0.005512535572052002, -0.005287528038024902, -0.005062520503997803, -0.004837512969970703, -0.0046125054359436035, -0.004387497901916504, -0.004162490367889404, -0.003937482833862305, -0.003712475299835205, -0.0034874677658081055, -0.003262460231781006, -0.0030374526977539062, -0.0028124451637268066, -0.002587437629699707, -0.0023624300956726074, -0.002137422561645508, -0.0019124150276184082, -0.0016874074935913086, -0.001462399959564209, -0.0012373924255371094, -0.0010123848915100098, -0.0007873773574829102, -0.0005623698234558105, -0.00033736228942871094, -0.00011235475540161133, 0.00011265277862548828, 0.0003376603126525879, 0.0005626678466796875, 0.0007876753807067871, 0.0010126829147338867, 0.0012376904487609863, 0.001462697982788086, 0.0016877055168151855, 0.0019127130508422852, 0.0021377205848693848, 0.0023627281188964844, 0.002587735652923584, 0.0028127431869506836, 0.003037750720977783, 0.003262758255004883, 0.0034877657890319824, 0.003712773323059082, 0.003937780857086182, 0.004162788391113281, 0.004387795925140381, 0.0046128034591674805, 0.00483781099319458, 0.00506281852722168, 0.005287826061248779, 0.005512833595275879, 0.0057378411293029785, 0.005962848663330078, 0.006187856197357178, 0.006412863731384277, 0.006637871265411377, 0.0068628787994384766, 0.007087886333465576, 0.007312893867492676, 0.007537901401519775, 0.007762908935546875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 13.0, 17.0, 69.0, 297.0, 535.0, 54.0, 15.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5895233154296875, -1.5601515769958496, -1.5307799577713013, -1.501408338546753, -1.472036600112915, -1.4426648616790771, -1.4132932424545288, -1.3839216232299805, -1.3545498847961426, -1.3251781463623047, -1.2958065271377563, -1.266434907913208, -1.2370631694793701, -1.2076914310455322, -1.1783198118209839, -1.1489481925964355, -1.1195764541625977, -1.0902047157287598, -1.0608330965042114, -1.031461477279663, -1.0020897388458252, -0.9727180600166321, -0.943346381187439, -0.9139747023582458, -0.8846030235290527, -0.8552313446998596, -0.8258596658706665, -0.7964879870414734, -0.7671163082122803, -0.7377446293830872, -0.708372950553894, -0.6790012717247009, -0.6496295928955078, -0.6202579140663147, -0.5908862352371216, -0.5615145564079285, -0.5321428775787354, -0.5027711987495422, -0.4733995199203491, -0.444027841091156, -0.4146561622619629, -0.3852844834327698, -0.35591280460357666, -0.32654112577438354, -0.29716944694519043, -0.2677977681159973, -0.2384260892868042, -0.20905441045761108, -0.17968273162841797, -0.15031105279922485, -0.12093937397003174, -0.09156769514083862, -0.06219601631164551, -0.03282433748245239, -0.0034526586532592773, 0.025919020175933838, 0.05529069900512695, 0.08466237783432007, 0.11403405666351318, 0.1434057354927063, 0.17277741432189941, 0.20214909315109253, 0.23152077198028564, 0.26089245080947876, 0.2902641296386719]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 4.0, 7.0, 6.0, 10.0, 13.0, 15.0, 22.0, 19.0, 18.0, 35.0, 33.0, 36.0, 41.0, 46.0, 37.0, 49.0, 62.0, 54.0, 55.0, 64.0, 47.0, 44.0, 43.0, 27.0, 42.0, 36.0, 20.0, 21.0, 16.0, 14.0, 8.0, 12.0, 6.0, 7.0, 6.0, 5.0, 6.0, 6.0, 0.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.5914543867111206, -0.5761537551879883, -0.560853123664856, -0.5455524921417236, -0.5302518606185913, -0.5149512887001038, -0.49965065717697144, -0.4843500256538391, -0.4690493941307068, -0.45374876260757446, -0.43844813108444214, -0.4231475293636322, -0.4078468978404999, -0.39254626631736755, -0.3772456645965576, -0.3619450330734253, -0.34664440155029297, -0.33134377002716064, -0.3160431385040283, -0.3007425367832184, -0.28544190526008606, -0.27014127373695374, -0.2548406720161438, -0.23954004049301147, -0.22423940896987915, -0.20893877744674683, -0.1936381608247757, -0.17833754420280457, -0.16303691267967224, -0.14773628115653992, -0.1324356645345688, -0.11713504046201706, -0.10183441638946533, -0.0865337923169136, -0.07123316824436188, -0.05593254417181015, -0.04063192009925842, -0.025331296026706696, -0.010030671954154968, 0.005269952118396759, 0.020570576190948486, 0.035871200263500214, 0.05117182433605194, 0.06647244840860367, 0.0817730724811554, 0.09707369655370712, 0.11237432062625885, 0.12767493724822998, 0.1429755687713623, 0.15827620029449463, 0.17357681691646576, 0.1888774335384369, 0.2041780650615692, 0.21947869658470154, 0.23477931320667267, 0.2500799298286438, 0.2653805613517761, 0.28068119287490845, 0.29598182439804077, 0.3112824261188507, 0.32658305764198303, 0.34188368916511536, 0.3571842908859253, 0.3724849224090576, 0.38778555393218994]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 9.0, 3.0, 5.0, 11.0, 14.0, 16.0, 29.0, 33.0, 43.0, 58.0, 81.0, 93.0, 167.0, 280.0, 467.0, 822.0, 1455.0, 3965.0, 51894.0, 4117068.0, 12179.0, 2467.0, 1092.0, 661.0, 394.0, 274.0, 164.0, 145.0, 93.0, 71.0, 46.0, 48.0, 31.0, 29.0, 9.0, 19.0, 9.0, 8.0, 8.0, 5.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.050140380859375, -0.04848670959472656, -0.046833038330078125, -0.04517936706542969, -0.04352569580078125, -0.04187202453613281, -0.040218353271484375, -0.03856468200683594, -0.0369110107421875, -0.03525733947753906, -0.033603668212890625, -0.03194999694824219, -0.03029632568359375, -0.028642654418945312, -0.026988983154296875, -0.025335311889648438, -0.023681640625, -0.022027969360351562, -0.020374298095703125, -0.018720626831054688, -0.01706695556640625, -0.015413284301757812, -0.013759613037109375, -0.012105941772460938, -0.0104522705078125, -0.008798599243164062, -0.007144927978515625, -0.0054912567138671875, -0.00383758544921875, -0.0021839141845703125, -0.000530242919921875, 0.0011234283447265625, 0.002777099609375, 0.0044307708740234375, 0.006084442138671875, 0.0077381134033203125, 0.00939178466796875, 0.011045455932617188, 0.012699127197265625, 0.014352798461914062, 0.0160064697265625, 0.017660140991210938, 0.019313812255859375, 0.020967483520507812, 0.02262115478515625, 0.024274826049804688, 0.025928497314453125, 0.027582168579101562, 0.02923583984375, 0.030889511108398438, 0.032543182373046875, 0.03419685363769531, 0.03585052490234375, 0.03750419616699219, 0.039157867431640625, 0.04081153869628906, 0.0424652099609375, 0.04411888122558594, 0.045772552490234375, 0.04742622375488281, 0.04907989501953125, 0.05073356628417969, 0.052387237548828125, 0.05404090881347656, 0.055694580078125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 3.0, 3.0, 6.0, 11.0, 17.0, 21.0, 34.0, 52.0, 55.0, 90.0, 98.0, 108.0, 80.0, 96.0, 67.0, 63.0, 36.0, 35.0, 24.0, 14.0, 22.0, 8.0, 9.0, 5.0, 10.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0225677490234375, -0.021822690963745117, -0.021077632904052734, -0.02033257484436035, -0.01958751678466797, -0.018842458724975586, -0.018097400665283203, -0.01735234260559082, -0.016607284545898438, -0.015862226486206055, -0.015117168426513672, -0.014372110366821289, -0.013627052307128906, -0.012881994247436523, -0.01213693618774414, -0.011391878128051758, -0.010646820068359375, -0.009901762008666992, -0.00915670394897461, -0.008411645889282227, -0.007666587829589844, -0.006921529769897461, -0.006176471710205078, -0.005431413650512695, -0.0046863555908203125, -0.00394129753112793, -0.003196239471435547, -0.002451181411743164, -0.0017061233520507812, -0.0009610652923583984, -0.00021600723266601562, 0.0005290508270263672, 0.00127410888671875, 0.002019166946411133, 0.0027642250061035156, 0.0035092830657958984, 0.004254341125488281, 0.004999399185180664, 0.005744457244873047, 0.00648951530456543, 0.0072345733642578125, 0.007979631423950195, 0.008724689483642578, 0.009469747543334961, 0.010214805603027344, 0.010959863662719727, 0.01170492172241211, 0.012449979782104492, 0.013195037841796875, 0.013940095901489258, 0.01468515396118164, 0.015430212020874023, 0.016175270080566406, 0.01692032814025879, 0.017665386199951172, 0.018410444259643555, 0.019155502319335938, 0.01990056037902832, 0.020645618438720703, 0.021390676498413086, 0.02213573455810547, 0.02288079261779785, 0.023625850677490234, 0.024370908737182617, 0.025115966796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 20.0, 21.0, 47.0, 132.0, 511.0, 2511.0, 4009577.0, 179171.0, 1652.0, 392.0, 130.0, 62.0, 18.0, 18.0, 1.0, 7.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218994140625, -0.2121448516845703, -0.20529556274414062, -0.19844627380371094, -0.19159698486328125, -0.18474769592285156, -0.17789840698242188, -0.1710491180419922, -0.1641998291015625, -0.1573505401611328, -0.15050125122070312, -0.14365196228027344, -0.13680267333984375, -0.12995338439941406, -0.12310409545898438, -0.11625480651855469, -0.109405517578125, -0.10255622863769531, -0.09570693969726562, -0.08885765075683594, -0.08200836181640625, -0.07515907287597656, -0.06830978393554688, -0.06146049499511719, -0.0546112060546875, -0.04776191711425781, -0.040912628173828125, -0.03406333923339844, -0.02721405029296875, -0.020364761352539062, -0.013515472412109375, -0.0066661834716796875, 0.00018310546875, 0.0070323944091796875, 0.013881683349609375, 0.020730972290039062, 0.02758026123046875, 0.03442955017089844, 0.041278839111328125, 0.04812812805175781, 0.0549774169921875, 0.06182670593261719, 0.06867599487304688, 0.07552528381347656, 0.08237457275390625, 0.08922386169433594, 0.09607315063476562, 0.10292243957519531, 0.109771728515625, 0.11662101745605469, 0.12347030639648438, 0.13031959533691406, 0.13716888427734375, 0.14401817321777344, 0.15086746215820312, 0.1577167510986328, 0.1645660400390625, 0.1714153289794922, 0.17826461791992188, 0.18511390686035156, 0.19196319580078125, 0.19881248474121094, 0.20566177368164062, 0.2125110626220703, 0.2193603515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 4.0, 2.0, 8.0, 3.0, 17.0, 48.0, 2816.0, 1091.0, 51.0, 15.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05950927734375, -0.057587623596191406, -0.05566596984863281, -0.05374431610107422, -0.051822662353515625, -0.04990100860595703, -0.04797935485839844, -0.046057701110839844, -0.04413604736328125, -0.042214393615722656, -0.04029273986816406, -0.03837108612060547, -0.036449432373046875, -0.03452777862548828, -0.03260612487792969, -0.030684471130371094, -0.0287628173828125, -0.026841163635253906, -0.024919509887695312, -0.02299785614013672, -0.021076202392578125, -0.01915454864501953, -0.017232894897460938, -0.015311241149902344, -0.01338958740234375, -0.011467933654785156, -0.009546279907226562, -0.007624626159667969, -0.005702972412109375, -0.0037813186645507812, -0.0018596649169921875, 6.198883056640625e-05, 0.001983642578125, 0.0039052963256835938, 0.0058269500732421875, 0.007748603820800781, 0.009670257568359375, 0.011591911315917969, 0.013513565063476562, 0.015435218811035156, 0.01735687255859375, 0.019278526306152344, 0.021200180053710938, 0.02312183380126953, 0.025043487548828125, 0.02696514129638672, 0.028886795043945312, 0.030808448791503906, 0.0327301025390625, 0.034651756286621094, 0.03657341003417969, 0.03849506378173828, 0.040416717529296875, 0.04233837127685547, 0.04426002502441406, 0.046181678771972656, 0.04810333251953125, 0.050024986267089844, 0.05194664001464844, 0.05386829376220703, 0.055789947509765625, 0.05771160125732422, 0.05963325500488281, 0.061554908752441406, 0.0634765625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 15.0, 46.0, 381.0, 462.0, 70.0, 18.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138719379901886, -0.13294430077075958, -0.12716922163963318, -0.12139414250850677, -0.11561906337738037, -0.10984398424625397, -0.10406890511512756, -0.09829382598400116, -0.09251874685287476, -0.08674366772174835, -0.08096858859062195, -0.07519350945949554, -0.06941843032836914, -0.06364335119724274, -0.05786827206611633, -0.05209319293498993, -0.046318113803863525, -0.04054303467273712, -0.03476795554161072, -0.028992876410484314, -0.02321779727935791, -0.017442718148231506, -0.011667639017105103, -0.005892559885978699, -0.00011748075485229492, 0.005657598376274109, 0.011432677507400513, 0.017207756638526917, 0.02298283576965332, 0.028757914900779724, 0.03453299403190613, 0.04030807316303253, 0.046083152294158936, 0.05185823142528534, 0.05763331055641174, 0.06340838968753815, 0.06918346881866455, 0.07495854794979095, 0.08073362708091736, 0.08650870621204376, 0.09228378534317017, 0.09805886447429657, 0.10383394360542297, 0.10960902273654938, 0.11538410186767578, 0.12115918099880219, 0.1269342601299286, 0.132709339261055, 0.1384844183921814, 0.1442594975233078, 0.1500345766544342, 0.1558096557855606, 0.161584734916687, 0.16735981404781342, 0.17313489317893982, 0.17890997231006622, 0.18468505144119263, 0.19046013057231903, 0.19623520970344543, 0.20201028883457184, 0.20778536796569824, 0.21356044709682465, 0.21933552622795105, 0.22511060535907745, 0.23088568449020386]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 10.0, 12.0, 11.0, 13.0, 24.0, 32.0, 40.0, 52.0, 60.0, 58.0, 66.0, 73.0, 68.0, 71.0, 72.0, 71.0, 43.0, 50.0, 45.0, 29.0, 23.0, 18.0, 18.0, 9.0, 11.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0848386287689209, -0.08125575631856918, -0.07767288386821747, -0.07409001141786575, -0.07050713896751404, -0.06692426651716232, -0.06334139406681061, -0.05975852161645889, -0.05617564916610718, -0.05259277671575546, -0.04900990426540375, -0.04542703181505203, -0.04184415936470032, -0.0382612869143486, -0.03467841446399689, -0.031095542013645172, -0.027512669563293457, -0.023929797112941742, -0.020346924662590027, -0.016764052212238312, -0.013181179761886597, -0.009598307311534882, -0.0060154348611831665, -0.0024325624108314514, 0.0011503100395202637, 0.004733182489871979, 0.008316054940223694, 0.011898927390575409, 0.015481799840927124, 0.01906467229127884, 0.022647544741630554, 0.02623041719198227, 0.029813289642333984, 0.0333961620926857, 0.036979034543037415, 0.04056190699338913, 0.044144779443740845, 0.04772765189409256, 0.051310524344444275, 0.05489339679479599, 0.058476269245147705, 0.06205914169549942, 0.06564201414585114, 0.06922488659620285, 0.07280775904655457, 0.07639063149690628, 0.079973503947258, 0.08355637639760971, 0.08713924884796143, 0.09072212129831314, 0.09430499374866486, 0.09788786619901657, 0.10147073864936829, 0.10505361109972, 0.10863648355007172, 0.11221935600042343, 0.11580222845077515, 0.11938510090112686, 0.12296797335147858, 0.1265508532524109, 0.130133718252182, 0.13371658325195312, 0.13729946315288544, 0.14088234305381775, 0.14446520805358887]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 3.0, 5.0, 10.0, 13.0, 14.0, 18.0, 20.0, 31.0, 56.0, 71.0, 133.0, 164.0, 262.0, 419.0, 704.0, 1209.0, 2345.0, 4778.0, 10989.0, 34388.0, 201238.0, 687438.0, 70991.0, 18548.0, 7119.0, 3310.0, 1726.0, 956.0, 529.0, 347.0, 242.0, 150.0, 96.0, 63.0, 43.0, 41.0, 30.0, 18.0, 11.0, 7.0, 3.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0721435546875, -0.06975841522216797, -0.06737327575683594, -0.0649881362915039, -0.06260299682617188, -0.060217857360839844, -0.05783271789550781, -0.05544757843017578, -0.05306243896484375, -0.05067729949951172, -0.04829216003417969, -0.045907020568847656, -0.043521881103515625, -0.041136741638183594, -0.03875160217285156, -0.03636646270751953, -0.0339813232421875, -0.03159618377685547, -0.029211044311523438, -0.026825904846191406, -0.024440765380859375, -0.022055625915527344, -0.019670486450195312, -0.01728534698486328, -0.01490020751953125, -0.012515068054199219, -0.010129928588867188, -0.007744789123535156, -0.005359649658203125, -0.0029745101928710938, -0.0005893707275390625, 0.0017957687377929688, 0.004180908203125, 0.006566047668457031, 0.008951187133789062, 0.011336326599121094, 0.013721466064453125, 0.016106605529785156, 0.018491744995117188, 0.02087688446044922, 0.02326202392578125, 0.02564716339111328, 0.028032302856445312, 0.030417442321777344, 0.032802581787109375, 0.035187721252441406, 0.03757286071777344, 0.03995800018310547, 0.0423431396484375, 0.04472827911376953, 0.04711341857910156, 0.049498558044433594, 0.051883697509765625, 0.054268836975097656, 0.05665397644042969, 0.05903911590576172, 0.06142425537109375, 0.06380939483642578, 0.06619453430175781, 0.06857967376708984, 0.07096481323242188, 0.0733499526977539, 0.07573509216308594, 0.07812023162841797, 0.08050537109375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 2.0, 5.0, 4.0, 5.0, 5.0, 17.0, 9.0, 33.0, 38.0, 54.0, 72.0, 81.0, 95.0, 104.0, 96.0, 82.0, 65.0, 63.0, 37.0, 23.0, 24.0, 13.0, 15.0, 13.0, 6.0, 6.0, 7.0, 3.0, 8.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0223236083984375, -0.02157878875732422, -0.020833969116210938, -0.020089149475097656, -0.019344329833984375, -0.018599510192871094, -0.017854690551757812, -0.01710987091064453, -0.01636505126953125, -0.015620231628417969, -0.014875411987304688, -0.014130592346191406, -0.013385772705078125, -0.012640953063964844, -0.011896133422851562, -0.011151313781738281, -0.010406494140625, -0.009661674499511719, -0.008916854858398438, -0.008172035217285156, -0.007427215576171875, -0.006682395935058594, -0.0059375762939453125, -0.005192756652832031, -0.00444793701171875, -0.0037031173706054688, -0.0029582977294921875, -0.0022134780883789062, -0.001468658447265625, -0.0007238388061523438, 2.09808349609375e-05, 0.0007658004760742188, 0.0015106201171875, 0.0022554397583007812, 0.0030002593994140625, 0.0037450790405273438, 0.004489898681640625, 0.005234718322753906, 0.0059795379638671875, 0.006724357604980469, 0.00746917724609375, 0.008213996887207031, 0.008958816528320312, 0.009703636169433594, 0.010448455810546875, 0.011193275451660156, 0.011938095092773438, 0.012682914733886719, 0.013427734375, 0.014172554016113281, 0.014917373657226562, 0.015662193298339844, 0.016407012939453125, 0.017151832580566406, 0.017896652221679688, 0.01864147186279297, 0.01938629150390625, 0.02013111114501953, 0.020875930786132812, 0.021620750427246094, 0.022365570068359375, 0.023110389709472656, 0.023855209350585938, 0.02460002899169922, 0.0253448486328125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 11.0, 12.0, 14.0, 10.0, 20.0, 24.0, 30.0, 42.0, 40.0, 76.0, 81.0, 99.0, 187.0, 288.0, 468.0, 1088.0, 3462.0, 28012.0, 823952.0, 176568.0, 10000.0, 2026.0, 818.0, 396.0, 214.0, 149.0, 111.0, 65.0, 59.0, 44.0, 32.0, 28.0, 27.0, 23.0, 12.0, 16.0, 10.0, 3.0, 9.0, 5.0, 6.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11138916015625, -0.10752010345458984, -0.10365104675292969, -0.09978199005126953, -0.09591293334960938, -0.09204387664794922, -0.08817481994628906, -0.0843057632446289, -0.08043670654296875, -0.0765676498413086, -0.07269859313964844, -0.06882953643798828, -0.06496047973632812, -0.06109142303466797, -0.05722236633300781, -0.053353309631347656, -0.0494842529296875, -0.045615196228027344, -0.04174613952636719, -0.03787708282470703, -0.034008026123046875, -0.03013896942138672, -0.026269912719726562, -0.022400856018066406, -0.01853179931640625, -0.014662742614746094, -0.010793685913085938, -0.006924629211425781, -0.003055572509765625, 0.0008134841918945312, 0.0046825408935546875, 0.008551597595214844, 0.012420654296875, 0.016289710998535156, 0.020158767700195312, 0.02402782440185547, 0.027896881103515625, 0.03176593780517578, 0.03563499450683594, 0.039504051208496094, 0.04337310791015625, 0.047242164611816406, 0.05111122131347656, 0.05498027801513672, 0.058849334716796875, 0.06271839141845703, 0.06658744812011719, 0.07045650482177734, 0.0743255615234375, 0.07819461822509766, 0.08206367492675781, 0.08593273162841797, 0.08980178833007812, 0.09367084503173828, 0.09753990173339844, 0.1014089584350586, 0.10527801513671875, 0.1091470718383789, 0.11301612854003906, 0.11688518524169922, 0.12075424194335938, 0.12462329864501953, 0.1284923553466797, 0.13236141204833984, 0.13623046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 6.0, 7.0, 6.0, 8.0, 11.0, 13.0, 13.0, 15.0, 23.0, 21.0, 22.0, 38.0, 29.0, 24.0, 37.0, 38.0, 33.0, 32.0, 32.0, 49.0, 36.0, 46.0, 37.0, 47.0, 35.0, 39.0, 31.0, 41.0, 30.0, 28.0, 32.0, 19.0, 28.0, 15.0, 15.0, 18.0, 9.0, 12.0, 5.0, 7.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0], "bins": [-0.07342529296875, -0.07135438919067383, -0.06928348541259766, -0.06721258163452148, -0.06514167785644531, -0.06307077407836914, -0.06099987030029297, -0.0589289665222168, -0.056858062744140625, -0.05478715896606445, -0.05271625518798828, -0.05064535140991211, -0.04857444763183594, -0.046503543853759766, -0.044432640075683594, -0.04236173629760742, -0.04029083251953125, -0.03821992874145508, -0.036149024963378906, -0.034078121185302734, -0.03200721740722656, -0.02993631362915039, -0.02786540985107422, -0.025794506072998047, -0.023723602294921875, -0.021652698516845703, -0.01958179473876953, -0.01751089096069336, -0.015439987182617188, -0.013369083404541016, -0.011298179626464844, -0.009227275848388672, -0.0071563720703125, -0.005085468292236328, -0.0030145645141601562, -0.0009436607360839844, 0.0011272430419921875, 0.0031981468200683594, 0.005269050598144531, 0.007339954376220703, 0.009410858154296875, 0.011481761932373047, 0.013552665710449219, 0.01562356948852539, 0.017694473266601562, 0.019765377044677734, 0.021836280822753906, 0.023907184600830078, 0.02597808837890625, 0.028048992156982422, 0.030119895935058594, 0.032190799713134766, 0.03426170349121094, 0.03633260726928711, 0.03840351104736328, 0.04047441482543945, 0.042545318603515625, 0.0446162223815918, 0.04668712615966797, 0.04875802993774414, 0.05082893371582031, 0.052899837493896484, 0.054970741271972656, 0.05704164505004883, 0.059112548828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 6.0, 6.0, 13.0, 22.0, 29.0, 47.0, 66.0, 119.0, 289.0, 756.0, 2338.0, 14479.0, 1013316.0, 13411.0, 2308.0, 716.0, 270.0, 135.0, 57.0, 42.0, 38.0, 16.0, 14.0, 16.0, 5.0, 5.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011444091796875, -0.01106870174407959, -0.01069331169128418, -0.01031792163848877, -0.00994253158569336, -0.00956714153289795, -0.009191751480102539, -0.008816361427307129, -0.008440971374511719, -0.008065581321716309, -0.0076901912689208984, -0.007314801216125488, -0.006939411163330078, -0.006564021110534668, -0.006188631057739258, -0.005813241004943848, -0.0054378509521484375, -0.005062460899353027, -0.004687070846557617, -0.004311680793762207, -0.003936290740966797, -0.0035609006881713867, -0.0031855106353759766, -0.0028101205825805664, -0.0024347305297851562, -0.002059340476989746, -0.001683950424194336, -0.0013085603713989258, -0.0009331703186035156, -0.0005577802658081055, -0.0001823902130126953, 0.00019299983978271484, 0.000568389892578125, 0.0009437799453735352, 0.0013191699981689453, 0.0016945600509643555, 0.0020699501037597656, 0.0024453401565551758, 0.002820730209350586, 0.003196120262145996, 0.0035715103149414062, 0.003946900367736816, 0.0043222904205322266, 0.004697680473327637, 0.005073070526123047, 0.005448460578918457, 0.005823850631713867, 0.006199240684509277, 0.0065746307373046875, 0.006950020790100098, 0.007325410842895508, 0.007700800895690918, 0.008076190948486328, 0.008451581001281738, 0.008826971054077148, 0.009202361106872559, 0.009577751159667969, 0.009953141212463379, 0.010328531265258789, 0.0107039213180542, 0.01107931137084961, 0.01145470142364502, 0.01183009147644043, 0.01220548152923584, 0.01258087158203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 7.0, 5.0, 6.0, 23.0, 125.0, 525.0, 183.0, 44.0, 9.0, 9.0, 11.0, 3.0, 4.0, 2.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002741813659667969, -0.00026551634073257446, -0.00025685131549835205, -0.00024818629026412964, -0.00023952126502990723, -0.00023085623979568481, -0.0002221912145614624, -0.00021352618932724, -0.00020486116409301758, -0.00019619613885879517, -0.00018753111362457275, -0.00017886608839035034, -0.00017020106315612793, -0.00016153603792190552, -0.0001528710126876831, -0.0001442059874534607, -0.00013554096221923828, -0.00012687593698501587, -0.00011821091175079346, -0.00010954588651657104, -0.00010088086128234863, -9.221583604812622e-05, -8.355081081390381e-05, -7.48857855796814e-05, -6.622076034545898e-05, -5.755573511123657e-05, -4.889070987701416e-05, -4.022568464279175e-05, -3.1560659408569336e-05, -2.2895634174346924e-05, -1.4230608940124512e-05, -5.5655837059021e-06, 3.0994415283203125e-06, 1.1764466762542725e-05, 2.0429491996765137e-05, 2.909451723098755e-05, 3.775954246520996e-05, 4.642456769943237e-05, 5.5089592933654785e-05, 6.37546181678772e-05, 7.241964340209961e-05, 8.108466863632202e-05, 8.974969387054443e-05, 9.841471910476685e-05, 0.00010707974433898926, 0.00011574476957321167, 0.00012440979480743408, 0.0001330748200416565, 0.0001417398452758789, 0.00015040487051010132, 0.00015906989574432373, 0.00016773492097854614, 0.00017639994621276855, 0.00018506497144699097, 0.00019372999668121338, 0.0002023950219154358, 0.0002110600471496582, 0.00021972507238388062, 0.00022839009761810303, 0.00023705512285232544, 0.00024572014808654785, 0.00025438517332077026, 0.0002630501985549927, 0.0002717152237892151, 0.0002803802490234375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 9.0, 11.0, 17.0, 34.0, 73.0, 167.0, 622.0, 6612.0, 1032828.0, 7174.0, 679.0, 153.0, 69.0, 31.0, 20.0, 17.0, 13.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.033050537109375, -0.03203392028808594, -0.031017303466796875, -0.030000686645507812, -0.02898406982421875, -0.027967453002929688, -0.026950836181640625, -0.025934219360351562, -0.0249176025390625, -0.023900985717773438, -0.022884368896484375, -0.021867752075195312, -0.02085113525390625, -0.019834518432617188, -0.018817901611328125, -0.017801284790039062, -0.01678466796875, -0.015768051147460938, -0.014751434326171875, -0.013734817504882812, -0.01271820068359375, -0.011701583862304688, -0.010684967041015625, -0.009668350219726562, -0.0086517333984375, -0.0076351165771484375, -0.006618499755859375, -0.0056018829345703125, -0.00458526611328125, -0.0035686492919921875, -0.002552032470703125, -0.0015354156494140625, -0.000518798828125, 0.0004978179931640625, 0.001514434814453125, 0.0025310516357421875, 0.00354766845703125, 0.0045642852783203125, 0.005580902099609375, 0.0065975189208984375, 0.0076141357421875, 0.008630752563476562, 0.009647369384765625, 0.010663986206054688, 0.01168060302734375, 0.012697219848632812, 0.013713836669921875, 0.014730453491210938, 0.0157470703125, 0.016763687133789062, 0.017780303955078125, 0.018796920776367188, 0.01981353759765625, 0.020830154418945312, 0.021846771240234375, 0.022863388061523438, 0.0238800048828125, 0.024896621704101562, 0.025913238525390625, 0.026929855346679688, 0.02794647216796875, 0.028963088989257812, 0.029979705810546875, 0.030996322631835938, 0.032012939453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 11.0, 11.0, 16.0, 28.0, 55.0, 176.0, 408.0, 152.0, 49.0, 33.0, 15.0, 6.0, 9.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0156097412109375, -0.01511383056640625, -0.014617919921875, -0.01412200927734375, -0.0136260986328125, -0.01313018798828125, -0.01263427734375, -0.01213836669921875, -0.0116424560546875, -0.01114654541015625, -0.010650634765625, -0.01015472412109375, -0.0096588134765625, -0.00916290283203125, -0.0086669921875, -0.00817108154296875, -0.0076751708984375, -0.00717926025390625, -0.006683349609375, -0.00618743896484375, -0.0056915283203125, -0.00519561767578125, -0.00469970703125, -0.00420379638671875, -0.0037078857421875, -0.00321197509765625, -0.002716064453125, -0.00222015380859375, -0.0017242431640625, -0.00122833251953125, -0.000732421875, -0.00023651123046875, 0.0002593994140625, 0.00075531005859375, 0.001251220703125, 0.00174713134765625, 0.0022430419921875, 0.00273895263671875, 0.00323486328125, 0.00373077392578125, 0.0042266845703125, 0.00472259521484375, 0.005218505859375, 0.00571441650390625, 0.0062103271484375, 0.00670623779296875, 0.0072021484375, 0.00769805908203125, 0.0081939697265625, 0.00868988037109375, 0.009185791015625, 0.00968170166015625, 0.0101776123046875, 0.01067352294921875, 0.01116943359375, 0.01166534423828125, 0.0121612548828125, 0.01265716552734375, 0.013153076171875, 0.01364898681640625, 0.0141448974609375, 0.01464080810546875, 0.01513671875, 0.01563262939453125, 0.0161285400390625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 12.0, 23.0, 42.0, 165.0, 491.0, 187.0, 56.0, 15.0, 10.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18612724542617798, -0.1666599065065384, -0.1471925675868988, -0.12772522866725922, -0.10825788974761963, -0.08879055082798004, -0.06932321190834045, -0.04985587298870087, -0.03038853406906128, -0.010921195149421692, 0.008546143770217896, 0.028013482689857483, 0.04748082160949707, 0.06694816052913666, 0.08641549944877625, 0.10588283836841583, 0.12535017728805542, 0.144817516207695, 0.1642848551273346, 0.18375219404697418, 0.20321953296661377, 0.22268687188625336, 0.24215421080589294, 0.26162153482437134, 0.2810888886451721, 0.3005562424659729, 0.3200235664844513, 0.3394908905029297, 0.35895824432373047, 0.37842559814453125, 0.39789292216300964, 0.41736024618148804, 0.43682754039764404, 0.4562948942184448, 0.4757622182369232, 0.4952295422554016, 0.5146968960762024, 0.5341642498970032, 0.5536315441131592, 0.57309889793396, 0.5925662517547607, 0.6120336055755615, 0.6315009593963623, 0.6509682536125183, 0.6704356074333191, 0.6899029612541199, 0.7093702554702759, 0.7288376092910767, 0.7483049631118774, 0.7677723169326782, 0.787239670753479, 0.806706964969635, 0.8261743187904358, 0.8456416726112366, 0.8651089668273926, 0.8845763206481934, 0.9040436744689941, 0.9235110282897949, 0.9429783821105957, 0.9624456763267517, 0.9819130301475525, 1.0013803243637085, 1.0208476781845093, 1.04031503200531, 1.0597823858261108]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 8.0, 5.0, 10.0, 9.0, 13.0, 19.0, 12.0, 18.0, 23.0, 28.0, 29.0, 29.0, 38.0, 29.0, 49.0, 52.0, 44.0, 46.0, 42.0, 42.0, 42.0, 37.0, 29.0, 43.0, 44.0, 34.0, 20.0, 30.0, 30.0, 21.0, 22.0, 20.0, 18.0, 9.0, 6.0, 8.0, 8.0, 9.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36525487899780273, -0.3532108962535858, -0.3411669433116913, -0.32912296056747437, -0.31707900762557983, -0.3050350248813629, -0.292991042137146, -0.28094708919525146, -0.26890313625335693, -0.25685915350914, -0.24481520056724548, -0.23277121782302856, -0.22072726488113403, -0.20868328213691711, -0.1966393142938614, -0.18459534645080566, -0.17255136370658875, -0.16050739586353302, -0.1484634280204773, -0.13641944527626038, -0.12437548488378525, -0.11233151704072952, -0.1002875417470932, -0.08824357390403748, -0.07619960606098175, -0.06415563821792603, -0.05211166664958, -0.04006769508123398, -0.028023727238178253, -0.015979759395122528, -0.003935784101486206, 0.008108183741569519, 0.020152151584625244, 0.03219611942768097, 0.04424009099602699, 0.056284062564373016, 0.06832803040742874, 0.08037199825048447, 0.09241597354412079, 0.10445994138717651, 0.11650390923023224, 0.12854787707328796, 0.1405918449163437, 0.15263581275939941, 0.16467979550361633, 0.17672374844551086, 0.18876773118972778, 0.2008116990327835, 0.21285566687583923, 0.22489963471889496, 0.23694360256195068, 0.2489875853061676, 0.26103153824806213, 0.27307552099227905, 0.2851194739341736, 0.2971634566783905, 0.3092074394226074, 0.32125142216682434, 0.33329537510871887, 0.3453393578529358, 0.3573833107948303, 0.36942729353904724, 0.38147127628326416, 0.3935152292251587, 0.4055591821670532]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 6.0, 5.0, 6.0, 5.0, 12.0, 18.0, 35.0, 41.0, 54.0, 76.0, 112.0, 252.0, 3029.0, 4189715.0, 483.0, 126.0, 80.0, 63.0, 39.0, 24.0, 18.0, 16.0, 15.0, 7.0, 7.0, 8.0, 6.0, 4.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.26416015625, -0.2551116943359375, -0.246063232421875, -0.2370147705078125, -0.22796630859375, -0.2189178466796875, -0.209869384765625, -0.2008209228515625, -0.1917724609375, -0.1827239990234375, -0.173675537109375, -0.1646270751953125, -0.15557861328125, -0.1465301513671875, -0.137481689453125, -0.1284332275390625, -0.119384765625, -0.1103363037109375, -0.101287841796875, -0.0922393798828125, -0.08319091796875, -0.0741424560546875, -0.065093994140625, -0.0560455322265625, -0.0469970703125, -0.0379486083984375, -0.028900146484375, -0.0198516845703125, -0.01080322265625, -0.0017547607421875, 0.007293701171875, 0.0163421630859375, 0.025390625, 0.0344390869140625, 0.043487548828125, 0.0525360107421875, 0.06158447265625, 0.0706329345703125, 0.079681396484375, 0.0887298583984375, 0.0977783203125, 0.1068267822265625, 0.115875244140625, 0.1249237060546875, 0.13397216796875, 0.1430206298828125, 0.152069091796875, 0.1611175537109375, 0.170166015625, 0.1792144775390625, 0.188262939453125, 0.1973114013671875, 0.20635986328125, 0.2154083251953125, 0.224456787109375, 0.2335052490234375, 0.2425537109375, 0.2516021728515625, 0.260650634765625, 0.2696990966796875, 0.27874755859375, 0.2877960205078125, 0.296844482421875, 0.3058929443359375, 0.31494140625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 6.0, 5.0, 12.0, 14.0, 33.0, 33.0, 55.0, 65.0, 76.0, 88.0, 91.0, 81.0, 98.0, 52.0, 65.0, 59.0, 30.0, 33.0, 16.0, 12.0, 15.0, 9.0, 6.0, 6.0, 8.0, 4.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02093505859375, -0.020221710205078125, -0.01950836181640625, -0.018795013427734375, -0.0180816650390625, -0.017368316650390625, -0.01665496826171875, -0.015941619873046875, -0.015228271484375, -0.014514923095703125, -0.01380157470703125, -0.013088226318359375, -0.0123748779296875, -0.011661529541015625, -0.01094818115234375, -0.010234832763671875, -0.009521484375, -0.008808135986328125, -0.00809478759765625, -0.007381439208984375, -0.0066680908203125, -0.005954742431640625, -0.00524139404296875, -0.004528045654296875, -0.003814697265625, -0.003101348876953125, -0.00238800048828125, -0.001674652099609375, -0.0009613037109375, -0.000247955322265625, 0.00046539306640625, 0.001178741455078125, 0.00189208984375, 0.002605438232421875, 0.00331878662109375, 0.004032135009765625, 0.0047454833984375, 0.005458831787109375, 0.00617218017578125, 0.006885528564453125, 0.007598876953125, 0.008312225341796875, 0.00902557373046875, 0.009738922119140625, 0.0104522705078125, 0.011165618896484375, 0.01187896728515625, 0.012592315673828125, 0.0133056640625, 0.014019012451171875, 0.01473236083984375, 0.015445709228515625, 0.0161590576171875, 0.016872406005859375, 0.01758575439453125, 0.018299102783203125, 0.019012451171875, 0.019725799560546875, 0.02043914794921875, 0.021152496337890625, 0.0218658447265625, 0.022579193115234375, 0.02329254150390625, 0.024005889892578125, 0.02471923828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 25.0, 50.0, 190.0, 713.0, 3134.0, 4149615.0, 37978.0, 1774.0, 500.0, 190.0, 52.0, 19.0, 13.0, 9.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.08020210266113281, -0.07776260375976562, -0.07532310485839844, -0.07288360595703125, -0.07044410705566406, -0.06800460815429688, -0.06556510925292969, -0.0631256103515625, -0.06068611145019531, -0.058246612548828125, -0.05580711364746094, -0.05336761474609375, -0.05092811584472656, -0.048488616943359375, -0.04604911804199219, -0.043609619140625, -0.04117012023925781, -0.038730621337890625, -0.03629112243652344, -0.03385162353515625, -0.03141212463378906, -0.028972625732421875, -0.026533126831054688, -0.0240936279296875, -0.021654129028320312, -0.019214630126953125, -0.016775131225585938, -0.01433563232421875, -0.011896133422851562, -0.009456634521484375, -0.0070171356201171875, -0.00457763671875, -0.0021381378173828125, 0.000301361083984375, 0.0027408599853515625, 0.00518035888671875, 0.0076198577880859375, 0.010059356689453125, 0.012498855590820312, 0.0149383544921875, 0.017377853393554688, 0.019817352294921875, 0.022256851196289062, 0.02469635009765625, 0.027135848999023438, 0.029575347900390625, 0.03201484680175781, 0.034454345703125, 0.03689384460449219, 0.039333343505859375, 0.04177284240722656, 0.04421234130859375, 0.04665184020996094, 0.049091339111328125, 0.05153083801269531, 0.0539703369140625, 0.05640983581542969, 0.058849334716796875, 0.06128883361816406, 0.06372833251953125, 0.06616783142089844, 0.06860733032226562, 0.07104682922363281, 0.073486328125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 7.0, 15.0, 26.0, 88.0, 3779.0, 93.0, 20.0, 13.0, 13.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01548004150390625, -0.014955401420593262, -0.014430761337280273, -0.013906121253967285, -0.013381481170654297, -0.012856841087341309, -0.01233220100402832, -0.011807560920715332, -0.011282920837402344, -0.010758280754089355, -0.010233640670776367, -0.009709000587463379, -0.00918436050415039, -0.008659720420837402, -0.008135080337524414, -0.007610440254211426, -0.0070858001708984375, -0.006561160087585449, -0.006036520004272461, -0.005511879920959473, -0.004987239837646484, -0.004462599754333496, -0.003937959671020508, -0.0034133195877075195, -0.0028886795043945312, -0.002364039421081543, -0.0018393993377685547, -0.0013147592544555664, -0.0007901191711425781, -0.00026547908782958984, 0.00025916099548339844, 0.0007838010787963867, 0.001308441162109375, 0.0018330812454223633, 0.0023577213287353516, 0.00288236141204834, 0.003407001495361328, 0.003931641578674316, 0.004456281661987305, 0.004980921745300293, 0.005505561828613281, 0.0060302019119262695, 0.006554841995239258, 0.007079482078552246, 0.007604122161865234, 0.008128762245178223, 0.008653402328491211, 0.0091780424118042, 0.009702682495117188, 0.010227322578430176, 0.010751962661743164, 0.011276602745056152, 0.01180124282836914, 0.012325882911682129, 0.012850522994995117, 0.013375163078308105, 0.013899803161621094, 0.014424443244934082, 0.01494908332824707, 0.015473723411560059, 0.015998363494873047, 0.016523003578186035, 0.017047643661499023, 0.01757228374481201, 0.018096923828125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 22.0, 78.0, 650.0, 221.0, 31.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12705132365226746, -0.12464351952075958, -0.12223571538925171, -0.11982790380716324, -0.11742009967565536, -0.11501229554414749, -0.11260449141263962, -0.11019668728113174, -0.10778887569904327, -0.1053810715675354, -0.10297326743602753, -0.10056545585393906, -0.09815765172243118, -0.09574984759092331, -0.09334204345941544, -0.09093423932790756, -0.08852643519639969, -0.08611863106489182, -0.08371082693338394, -0.08130301535129547, -0.0788952112197876, -0.07648740708827972, -0.07407960295677185, -0.07167179882526398, -0.0692639946937561, -0.06685619056224823, -0.06444838643074036, -0.062040578573942184, -0.05963277071714401, -0.05722496658563614, -0.054817162454128265, -0.05240935832262039, -0.05000155046582222, -0.047593746334314346, -0.045185938477516174, -0.0427781343460083, -0.04037033021450043, -0.037962522357702255, -0.03555471822619438, -0.03314691036939621, -0.030739106237888336, -0.028331300243735313, -0.02592349424958229, -0.023515690118074417, -0.021107884123921394, -0.01870007812976837, -0.016292273998260498, -0.013884468004107475, -0.011476662009954453, -0.00906885601580143, -0.006661050952970982, -0.004253245424479246, -0.0018454398959875107, 0.0005623660981655121, 0.0029701711609959602, 0.005377976223826408, 0.007785782217979431, 0.010193588212132454, 0.012601393274962902, 0.01500919833779335, 0.017417004331946373, 0.019824810326099396, 0.02223261445760727, 0.024640420451760292, 0.027048226445913315]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 8.0, 3.0, 11.0, 6.0, 13.0, 18.0, 31.0, 32.0, 41.0, 47.0, 45.0, 61.0, 57.0, 77.0, 85.0, 72.0, 52.0, 56.0, 61.0, 50.0, 39.0, 48.0, 27.0, 22.0, 17.0, 5.0, 7.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026152849197387695, -0.02509773150086403, -0.024042613804340363, -0.022987496107816696, -0.02193237841129303, -0.020877260714769363, -0.019822143018245697, -0.01876702532172203, -0.017711907625198364, -0.016656789928674698, -0.015601672232151031, -0.014546554535627365, -0.013491436839103699, -0.012436319142580032, -0.011381201446056366, -0.0103260837495327, -0.009270966053009033, -0.008215848356485367, -0.0071607306599617004, -0.006105612963438034, -0.005050495266914368, -0.003995377570390701, -0.002940259873867035, -0.0018851421773433685, -0.0008300244808197021, 0.00022509321570396423, 0.0012802109122276306, 0.002335328608751297, 0.0033904463052749634, 0.00444556400179863, 0.005500681698322296, 0.0065557993948459625, 0.007610917091369629, 0.008666034787893295, 0.009721152484416962, 0.010776270180940628, 0.011831387877464294, 0.01288650557398796, 0.013941623270511627, 0.014996740967035294, 0.01605185866355896, 0.017106976360082626, 0.018162094056606293, 0.01921721175312996, 0.020272329449653625, 0.021327447146177292, 0.022382564842700958, 0.023437682539224625, 0.02449280023574829, 0.025547917932271957, 0.026603035628795624, 0.02765815332531929, 0.028713271021842957, 0.029768388718366623, 0.03082350641489029, 0.031878624111413956, 0.03293374180793762, 0.03398885950446129, 0.035043977200984955, 0.03609909489750862, 0.03715421259403229, 0.038209330290555954, 0.03926444798707962, 0.04031956568360329, 0.04137468338012695]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 12.0, 14.0, 10.0, 19.0, 44.0, 37.0, 90.0, 111.0, 169.0, 255.0, 411.0, 754.0, 1409.0, 2865.0, 6383.0, 16929.0, 63722.0, 614746.0, 274258.0, 43086.0, 12726.0, 5188.0, 2437.0, 1143.0, 672.0, 354.0, 215.0, 160.0, 94.0, 67.0, 46.0, 38.0, 26.0, 12.0, 12.0, 5.0, 3.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06756591796875, -0.06530380249023438, -0.06304168701171875, -0.060779571533203125, -0.0585174560546875, -0.056255340576171875, -0.05399322509765625, -0.051731109619140625, -0.049468994140625, -0.047206878662109375, -0.04494476318359375, -0.042682647705078125, -0.0404205322265625, -0.038158416748046875, -0.03589630126953125, -0.033634185791015625, -0.0313720703125, -0.029109954833984375, -0.02684783935546875, -0.024585723876953125, -0.0223236083984375, -0.020061492919921875, -0.01779937744140625, -0.015537261962890625, -0.013275146484375, -0.011013031005859375, -0.00875091552734375, -0.006488800048828125, -0.0042266845703125, -0.001964569091796875, 0.00029754638671875, 0.002559661865234375, 0.00482177734375, 0.007083892822265625, 0.00934600830078125, 0.011608123779296875, 0.0138702392578125, 0.016132354736328125, 0.01839447021484375, 0.020656585693359375, 0.022918701171875, 0.025180816650390625, 0.02744293212890625, 0.029705047607421875, 0.0319671630859375, 0.034229278564453125, 0.03649139404296875, 0.038753509521484375, 0.041015625, 0.043277740478515625, 0.04553985595703125, 0.047801971435546875, 0.0500640869140625, 0.052326202392578125, 0.05458831787109375, 0.056850433349609375, 0.059112548828125, 0.061374664306640625, 0.06363677978515625, 0.06589889526367188, 0.0681610107421875, 0.07042312622070312, 0.07268524169921875, 0.07494735717773438, 0.07720947265625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 7.0, 3.0, 6.0, 4.0, 14.0, 15.0, 32.0, 37.0, 53.0, 62.0, 80.0, 85.0, 96.0, 85.0, 90.0, 52.0, 65.0, 56.0, 41.0, 20.0, 16.0, 14.0, 14.0, 10.0, 9.0, 3.0, 8.0, 5.0, 7.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020904541015625, -0.020190715789794922, -0.019476890563964844, -0.018763065338134766, -0.018049240112304688, -0.01733541488647461, -0.01662158966064453, -0.015907764434814453, -0.015193939208984375, -0.014480113983154297, -0.013766288757324219, -0.01305246353149414, -0.012338638305664062, -0.011624813079833984, -0.010910987854003906, -0.010197162628173828, -0.00948333740234375, -0.008769512176513672, -0.008055686950683594, -0.007341861724853516, -0.0066280364990234375, -0.005914211273193359, -0.005200386047363281, -0.004486560821533203, -0.003772735595703125, -0.003058910369873047, -0.0023450851440429688, -0.0016312599182128906, -0.0009174346923828125, -0.00020360946655273438, 0.0005102157592773438, 0.0012240409851074219, 0.0019378662109375, 0.002651691436767578, 0.0033655166625976562, 0.004079341888427734, 0.0047931671142578125, 0.005506992340087891, 0.006220817565917969, 0.006934642791748047, 0.007648468017578125, 0.008362293243408203, 0.009076118469238281, 0.00978994369506836, 0.010503768920898438, 0.011217594146728516, 0.011931419372558594, 0.012645244598388672, 0.01335906982421875, 0.014072895050048828, 0.014786720275878906, 0.015500545501708984, 0.016214370727539062, 0.01692819595336914, 0.01764202117919922, 0.018355846405029297, 0.019069671630859375, 0.019783496856689453, 0.02049732208251953, 0.02121114730834961, 0.021924972534179688, 0.022638797760009766, 0.023352622985839844, 0.024066448211669922, 0.0247802734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 6.0, 1.0, 8.0, 6.0, 8.0, 4.0, 5.0, 11.0, 18.0, 17.0, 19.0, 28.0, 29.0, 46.0, 60.0, 74.0, 81.0, 127.0, 247.0, 349.0, 777.0, 1951.0, 11103.0, 443339.0, 573835.0, 12432.0, 2005.0, 819.0, 379.0, 216.0, 143.0, 101.0, 71.0, 51.0, 41.0, 32.0, 23.0, 25.0, 25.0, 12.0, 12.0, 8.0, 2.0, 5.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1370849609375, -0.1329326629638672, -0.12878036499023438, -0.12462806701660156, -0.12047576904296875, -0.11632347106933594, -0.11217117309570312, -0.10801887512207031, -0.1038665771484375, -0.09971427917480469, -0.09556198120117188, -0.09140968322753906, -0.08725738525390625, -0.08310508728027344, -0.07895278930664062, -0.07480049133300781, -0.070648193359375, -0.06649589538574219, -0.062343597412109375, -0.05819129943847656, -0.05403900146484375, -0.04988670349121094, -0.045734405517578125, -0.04158210754394531, -0.0374298095703125, -0.03327751159667969, -0.029125213623046875, -0.024972915649414062, -0.02082061767578125, -0.016668319702148438, -0.012516021728515625, -0.008363723754882812, -0.00421142578125, -5.91278076171875e-05, 0.004093170166015625, 0.008245468139648438, 0.01239776611328125, 0.016550064086914062, 0.020702362060546875, 0.024854660034179688, 0.0290069580078125, 0.03315925598144531, 0.037311553955078125, 0.04146385192871094, 0.04561614990234375, 0.04976844787597656, 0.053920745849609375, 0.05807304382324219, 0.062225341796875, 0.06637763977050781, 0.07052993774414062, 0.07468223571777344, 0.07883453369140625, 0.08298683166503906, 0.08713912963867188, 0.09129142761230469, 0.0954437255859375, 0.09959602355957031, 0.10374832153320312, 0.10790061950683594, 0.11205291748046875, 0.11620521545410156, 0.12035751342773438, 0.12450981140136719, 0.128662109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 9.0, 9.0, 16.0, 9.0, 16.0, 14.0, 19.0, 22.0, 32.0, 38.0, 24.0, 33.0, 32.0, 39.0, 44.0, 43.0, 39.0, 41.0, 50.0, 45.0, 44.0, 32.0, 34.0, 39.0, 43.0, 34.0, 30.0, 23.0, 18.0, 25.0, 16.0, 17.0, 13.0, 11.0, 11.0, 8.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0631103515625, -0.06107807159423828, -0.05904579162597656, -0.057013511657714844, -0.054981231689453125, -0.052948951721191406, -0.05091667175292969, -0.04888439178466797, -0.04685211181640625, -0.04481983184814453, -0.04278755187988281, -0.040755271911621094, -0.038722991943359375, -0.036690711975097656, -0.03465843200683594, -0.03262615203857422, -0.0305938720703125, -0.02856159210205078, -0.026529312133789062, -0.024497032165527344, -0.022464752197265625, -0.020432472229003906, -0.018400192260742188, -0.01636791229248047, -0.01433563232421875, -0.012303352355957031, -0.010271072387695312, -0.008238792419433594, -0.006206512451171875, -0.004174232482910156, -0.0021419525146484375, -0.00010967254638671875, 0.001922607421875, 0.003954887390136719, 0.0059871673583984375, 0.008019447326660156, 0.010051727294921875, 0.012084007263183594, 0.014116287231445312, 0.01614856719970703, 0.01818084716796875, 0.02021312713623047, 0.022245407104492188, 0.024277687072753906, 0.026309967041015625, 0.028342247009277344, 0.030374526977539062, 0.03240680694580078, 0.0344390869140625, 0.03647136688232422, 0.03850364685058594, 0.040535926818847656, 0.042568206787109375, 0.044600486755371094, 0.04663276672363281, 0.04866504669189453, 0.05069732666015625, 0.05272960662841797, 0.05476188659667969, 0.056794166564941406, 0.058826446533203125, 0.060858726501464844, 0.06289100646972656, 0.06492328643798828, 0.06695556640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 5.0, 8.0, 12.0, 24.0, 31.0, 44.0, 62.0, 114.0, 220.0, 403.0, 785.0, 1890.0, 4632.0, 19574.0, 999092.0, 14420.0, 4017.0, 1601.0, 731.0, 355.0, 204.0, 104.0, 59.0, 37.0, 26.0, 19.0, 20.0, 14.0, 13.0, 3.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01654052734375, -0.016045808792114258, -0.015551090240478516, -0.015056371688842773, -0.014561653137207031, -0.014066934585571289, -0.013572216033935547, -0.013077497482299805, -0.012582778930664062, -0.01208806037902832, -0.011593341827392578, -0.011098623275756836, -0.010603904724121094, -0.010109186172485352, -0.00961446762084961, -0.009119749069213867, -0.008625030517578125, -0.008130311965942383, -0.007635593414306641, -0.0071408748626708984, -0.006646156311035156, -0.006151437759399414, -0.005656719207763672, -0.00516200065612793, -0.0046672821044921875, -0.004172563552856445, -0.003677845001220703, -0.003183126449584961, -0.0026884078979492188, -0.0021936893463134766, -0.0016989707946777344, -0.0012042522430419922, -0.00070953369140625, -0.0002148151397705078, 0.0002799034118652344, 0.0007746219635009766, 0.0012693405151367188, 0.001764059066772461, 0.002258777618408203, 0.0027534961700439453, 0.0032482147216796875, 0.0037429332733154297, 0.004237651824951172, 0.004732370376586914, 0.005227088928222656, 0.0057218074798583984, 0.006216526031494141, 0.006711244583129883, 0.007205963134765625, 0.007700681686401367, 0.00819540023803711, 0.008690118789672852, 0.009184837341308594, 0.009679555892944336, 0.010174274444580078, 0.01066899299621582, 0.011163711547851562, 0.011658430099487305, 0.012153148651123047, 0.012647867202758789, 0.013142585754394531, 0.013637304306030273, 0.014132022857666016, 0.014626741409301758, 0.0151214599609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 4.0, 17.0, 50.0, 178.0, 526.0, 145.0, 33.0, 12.0, 4.0, 5.0, 0.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003387928009033203, -0.00032726675271987915, -0.000315740704536438, -0.0003042146563529968, -0.00029268860816955566, -0.0002811625599861145, -0.00026963651180267334, -0.0002581104636192322, -0.000246584415435791, -0.00023505836725234985, -0.0002235323190689087, -0.00021200627088546753, -0.00020048022270202637, -0.0001889541745185852, -0.00017742812633514404, -0.00016590207815170288, -0.00015437602996826172, -0.00014284998178482056, -0.0001313239336013794, -0.00011979788541793823, -0.00010827183723449707, -9.674578905105591e-05, -8.521974086761475e-05, -7.369369268417358e-05, -6.216764450073242e-05, -5.064159631729126e-05, -3.91155481338501e-05, -2.7589499950408936e-05, -1.6063451766967773e-05, -4.537403583526611e-06, 6.988644599914551e-06, 1.8514692783355713e-05, 3.0040740966796875e-05, 4.156678915023804e-05, 5.30928373336792e-05, 6.461888551712036e-05, 7.614493370056152e-05, 8.767098188400269e-05, 9.919703006744385e-05, 0.00011072307825088501, 0.00012224912643432617, 0.00013377517461776733, 0.0001453012228012085, 0.00015682727098464966, 0.00016835331916809082, 0.00017987936735153198, 0.00019140541553497314, 0.0002029314637184143, 0.00021445751190185547, 0.00022598356008529663, 0.0002375096082687378, 0.00024903565645217896, 0.0002605617046356201, 0.0002720877528190613, 0.00028361380100250244, 0.0002951398491859436, 0.00030666589736938477, 0.00031819194555282593, 0.0003297179937362671, 0.00034124404191970825, 0.0003527700901031494, 0.0003642961382865906, 0.00037582218647003174, 0.0003873482346534729, 0.00039887428283691406]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 10.0, 13.0, 14.0, 45.0, 52.0, 136.0, 452.0, 4718.0, 1032084.0, 10018.0, 640.0, 185.0, 67.0, 41.0, 16.0, 16.0, 7.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.047271728515625, -0.04586505889892578, -0.04445838928222656, -0.043051719665527344, -0.041645050048828125, -0.040238380432128906, -0.03883171081542969, -0.03742504119873047, -0.03601837158203125, -0.03461170196533203, -0.03320503234863281, -0.031798362731933594, -0.030391693115234375, -0.028985023498535156, -0.027578353881835938, -0.02617168426513672, -0.0247650146484375, -0.02335834503173828, -0.021951675415039062, -0.020545005798339844, -0.019138336181640625, -0.017731666564941406, -0.016324996948242188, -0.014918327331542969, -0.01351165771484375, -0.012104988098144531, -0.010698318481445312, -0.009291648864746094, -0.007884979248046875, -0.006478309631347656, -0.0050716400146484375, -0.0036649703979492188, -0.00225830078125, -0.0008516311645507812, 0.0005550384521484375, 0.0019617080688476562, 0.003368377685546875, 0.004775047302246094, 0.0061817169189453125, 0.007588386535644531, 0.00899505615234375, 0.010401725769042969, 0.011808395385742188, 0.013215065002441406, 0.014621734619140625, 0.016028404235839844, 0.017435073852539062, 0.01884174346923828, 0.0202484130859375, 0.02165508270263672, 0.023061752319335938, 0.024468421936035156, 0.025875091552734375, 0.027281761169433594, 0.028688430786132812, 0.03009510040283203, 0.03150177001953125, 0.03290843963623047, 0.03431510925292969, 0.035721778869628906, 0.037128448486328125, 0.038535118103027344, 0.03994178771972656, 0.04134845733642578, 0.042755126953125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 9.0, 10.0, 11.0, 16.0, 29.0, 65.0, 192.0, 352.0, 145.0, 58.0, 21.0, 16.0, 17.0, 8.0, 9.0, 6.0, 5.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016326904296875, -0.015790224075317383, -0.015253543853759766, -0.014716863632202148, -0.014180183410644531, -0.013643503189086914, -0.013106822967529297, -0.01257014274597168, -0.012033462524414062, -0.011496782302856445, -0.010960102081298828, -0.010423421859741211, -0.009886741638183594, -0.009350061416625977, -0.00881338119506836, -0.008276700973510742, -0.007740020751953125, -0.007203340530395508, -0.006666660308837891, -0.0061299800872802734, -0.005593299865722656, -0.005056619644165039, -0.004519939422607422, -0.003983259201049805, -0.0034465789794921875, -0.0029098987579345703, -0.002373218536376953, -0.001836538314819336, -0.0012998580932617188, -0.0007631778717041016, -0.00022649765014648438, 0.0003101825714111328, 0.00084686279296875, 0.0013835430145263672, 0.0019202232360839844, 0.0024569034576416016, 0.0029935836791992188, 0.003530263900756836, 0.004066944122314453, 0.00460362434387207, 0.0051403045654296875, 0.005676984786987305, 0.006213665008544922, 0.006750345230102539, 0.007287025451660156, 0.007823705673217773, 0.00836038589477539, 0.008897066116333008, 0.009433746337890625, 0.009970426559448242, 0.01050710678100586, 0.011043787002563477, 0.011580467224121094, 0.012117147445678711, 0.012653827667236328, 0.013190507888793945, 0.013727188110351562, 0.01426386833190918, 0.014800548553466797, 0.015337228775024414, 0.01587390899658203, 0.01641058921813965, 0.016947269439697266, 0.017483949661254883, 0.0180206298828125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 6.0, 77.0, 795.0, 121.0, 13.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18552322685718536, -0.13408255577087402, -0.08264187723398209, -0.03120119869709015, 0.02023947238922119, 0.07168014347553253, 0.12312082946300507, 0.1745614856481552, 0.22600217163562775, 0.2774428427219391, 0.3288835287094116, 0.38032418489456177, 0.4317648708820343, 0.48320555686950684, 0.534646213054657, 0.5860868692398071, 0.637527585029602, 0.6889682412147522, 0.7404089570045471, 0.7918496131896973, 0.8432902693748474, 0.8947309255599976, 0.9461716413497925, 0.9976122975349426, 1.0490529537200928, 1.1004936695098877, 1.151934266090393, 1.203374981880188, 1.254815697669983, 1.3062562942504883, 1.3576970100402832, 1.4091377258300781, 1.4605783224105835, 1.5120190382003784, 1.5634596347808838, 1.6149003505706787, 1.6663410663604736, 1.717781662940979, 1.769222378730774, 1.8206629753112793, 1.8721036911010742, 1.9235444068908691, 1.9749850034713745, 2.026425838470459, 2.077866315841675, 2.1293070316314697, 2.1807477474212646, 2.2321884632110596, 2.2836291790008545, 2.3350698947906494, 2.3865106105804443, 2.43795108795166, 2.489391803741455, 2.54083251953125, 2.592273235321045, 2.64371395111084, 2.6951544284820557, 2.7465951442718506, 2.7980358600616455, 2.8494763374328613, 2.9009170532226562, 2.952357769012451, 3.003798484802246, 3.055239200592041, 3.106679916381836]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 6.0, 7.0, 8.0, 11.0, 11.0, 14.0, 15.0, 26.0, 20.0, 28.0, 35.0, 46.0, 50.0, 44.0, 53.0, 62.0, 61.0, 54.0, 55.0, 51.0, 58.0, 45.0, 43.0, 40.0, 32.0, 21.0, 25.0, 16.0, 13.0, 19.0, 13.0, 7.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4125663638114929, -0.3979475796222687, -0.38332876563072205, -0.3687099814414978, -0.35409119725227356, -0.3394724130630493, -0.3248535990715027, -0.31023481488227844, -0.2956160306930542, -0.28099724650382996, -0.2663784325122833, -0.2517596483230591, -0.23714086413383484, -0.2225220650434494, -0.20790326595306396, -0.19328448176383972, -0.17866568267345428, -0.16404688358306885, -0.1494280993938446, -0.13480930030345917, -0.12019051611423492, -0.10557171702384949, -0.09095292538404465, -0.07633413374423981, -0.06171534210443497, -0.04709655046463013, -0.03247775882482529, -0.01785896345973015, -0.0032401718199253082, 0.01137862354516983, 0.02599741518497467, 0.04061620682477951, 0.05523499846458435, 0.06985379010438919, 0.08447258174419403, 0.09909138083457947, 0.11371016502380371, 0.12832896411418915, 0.14294776320457458, 0.15756654739379883, 0.17218533158302307, 0.1868041306734085, 0.20142291486263275, 0.2160417139530182, 0.23066049814224243, 0.24527929723262787, 0.2598980963230133, 0.27451688051223755, 0.2891356945037842, 0.3037544786930084, 0.31837329268455505, 0.3329920768737793, 0.34761086106300354, 0.3622296452522278, 0.3768484592437744, 0.39146724343299866, 0.4060860276222229, 0.42070481181144714, 0.4353236258029938, 0.449942409992218, 0.46456119418144226, 0.4791799783706665, 0.49379879236221313, 0.5084176063537598, 0.5230363607406616]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 1.0, 6.0, 4.0, 6.0, 11.0, 19.0, 18.0, 32.0, 43.0, 60.0, 84.0, 130.0, 181.0, 333.0, 669.0, 19541.0, 4171276.0, 843.0, 348.0, 225.0, 122.0, 93.0, 65.0, 45.0, 27.0, 28.0, 14.0, 8.0, 19.0, 7.0, 6.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.15952110290527344, -0.15363693237304688, -0.1477527618408203, -0.14186859130859375, -0.1359844207763672, -0.13010025024414062, -0.12421607971191406, -0.1183319091796875, -0.11244773864746094, -0.10656356811523438, -0.10067939758300781, -0.09479522705078125, -0.08891105651855469, -0.08302688598632812, -0.07714271545410156, -0.071258544921875, -0.06537437438964844, -0.059490203857421875, -0.05360603332519531, -0.04772186279296875, -0.04183769226074219, -0.035953521728515625, -0.030069351196289062, -0.0241851806640625, -0.018301010131835938, -0.012416839599609375, -0.0065326690673828125, -0.00064849853515625, 0.0052356719970703125, 0.011119842529296875, 0.017004013061523438, 0.02288818359375, 0.028772354125976562, 0.034656524658203125, 0.04054069519042969, 0.04642486572265625, 0.05230903625488281, 0.058193206787109375, 0.06407737731933594, 0.0699615478515625, 0.07584571838378906, 0.08172988891601562, 0.08761405944824219, 0.09349822998046875, 0.09938240051269531, 0.10526657104492188, 0.11115074157714844, 0.117034912109375, 0.12291908264160156, 0.12880325317382812, 0.1346874237060547, 0.14057159423828125, 0.1464557647705078, 0.15233993530273438, 0.15822410583496094, 0.1641082763671875, 0.16999244689941406, 0.17587661743164062, 0.1817607879638672, 0.18764495849609375, 0.1935291290283203, 0.19941329956054688, 0.20529747009277344, 0.211181640625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 11.0, 16.0, 20.0, 34.0, 35.0, 56.0, 63.0, 79.0, 76.0, 87.0, 93.0, 54.0, 69.0, 64.0, 52.0, 36.0, 27.0, 26.0, 12.0, 14.0, 14.0, 6.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019805908203125, -0.01912665367126465, -0.018447399139404297, -0.017768144607543945, -0.017088890075683594, -0.016409635543823242, -0.01573038101196289, -0.015051126480102539, -0.014371871948242188, -0.013692617416381836, -0.013013362884521484, -0.012334108352661133, -0.011654853820800781, -0.01097559928894043, -0.010296344757080078, -0.009617090225219727, -0.008937835693359375, -0.008258581161499023, -0.007579326629638672, -0.00690007209777832, -0.006220817565917969, -0.005541563034057617, -0.004862308502197266, -0.004183053970336914, -0.0035037994384765625, -0.002824544906616211, -0.0021452903747558594, -0.0014660358428955078, -0.0007867813110351562, -0.00010752677917480469, 0.0005717277526855469, 0.0012509822845458984, 0.00193023681640625, 0.0026094913482666016, 0.003288745880126953, 0.003968000411987305, 0.004647254943847656, 0.005326509475708008, 0.006005764007568359, 0.006685018539428711, 0.0073642730712890625, 0.008043527603149414, 0.008722782135009766, 0.009402036666870117, 0.010081291198730469, 0.01076054573059082, 0.011439800262451172, 0.012119054794311523, 0.012798309326171875, 0.013477563858032227, 0.014156818389892578, 0.01483607292175293, 0.015515327453613281, 0.016194581985473633, 0.016873836517333984, 0.017553091049194336, 0.018232345581054688, 0.01891160011291504, 0.01959085464477539, 0.020270109176635742, 0.020949363708496094, 0.021628618240356445, 0.022307872772216797, 0.02298712730407715, 0.0236663818359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 14.0, 30.0, 103.0, 214.0, 488.0, 1732.0, 4174460.0, 15837.0, 1005.0, 262.0, 83.0, 29.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08349609375, -0.07983207702636719, -0.07616806030273438, -0.07250404357910156, -0.06884002685546875, -0.06517601013183594, -0.061511993408203125, -0.05784797668457031, -0.0541839599609375, -0.05051994323730469, -0.046855926513671875, -0.04319190979003906, -0.03952789306640625, -0.03586387634277344, -0.032199859619140625, -0.028535842895507812, -0.024871826171875, -0.021207809448242188, -0.017543792724609375, -0.013879776000976562, -0.01021575927734375, -0.0065517425537109375, -0.002887725830078125, 0.0007762908935546875, 0.0044403076171875, 0.008104324340820312, 0.011768341064453125, 0.015432357788085938, 0.01909637451171875, 0.022760391235351562, 0.026424407958984375, 0.030088424682617188, 0.03375244140625, 0.03741645812988281, 0.041080474853515625, 0.04474449157714844, 0.04840850830078125, 0.05207252502441406, 0.055736541748046875, 0.05940055847167969, 0.0630645751953125, 0.06672859191894531, 0.07039260864257812, 0.07405662536621094, 0.07772064208984375, 0.08138465881347656, 0.08504867553710938, 0.08871269226074219, 0.092376708984375, 0.09604072570800781, 0.09970474243164062, 0.10336875915527344, 0.10703277587890625, 0.11069679260253906, 0.11436080932617188, 0.11802482604980469, 0.1216888427734375, 0.1253528594970703, 0.12901687622070312, 0.13268089294433594, 0.13634490966796875, 0.14000892639160156, 0.14367294311523438, 0.1473369598388672, 0.1510009765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 16.0, 41.0, 167.0, 3720.0, 83.0, 22.0, 11.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03985595703125, -0.038936614990234375, -0.03801727294921875, -0.037097930908203125, -0.0361785888671875, -0.035259246826171875, -0.03433990478515625, -0.033420562744140625, -0.032501220703125, -0.031581878662109375, -0.03066253662109375, -0.029743194580078125, -0.0288238525390625, -0.027904510498046875, -0.02698516845703125, -0.026065826416015625, -0.025146484375, -0.024227142333984375, -0.02330780029296875, -0.022388458251953125, -0.0214691162109375, -0.020549774169921875, -0.01963043212890625, -0.018711090087890625, -0.017791748046875, -0.016872406005859375, -0.01595306396484375, -0.015033721923828125, -0.0141143798828125, -0.013195037841796875, -0.01227569580078125, -0.011356353759765625, -0.01043701171875, -0.009517669677734375, -0.00859832763671875, -0.007678985595703125, -0.0067596435546875, -0.005840301513671875, -0.00492095947265625, -0.004001617431640625, -0.003082275390625, -0.002162933349609375, -0.00124359130859375, -0.000324249267578125, 0.0005950927734375, 0.001514434814453125, 0.00243377685546875, 0.003353118896484375, 0.0042724609375, 0.005191802978515625, 0.00611114501953125, 0.007030487060546875, 0.0079498291015625, 0.008869171142578125, 0.00978851318359375, 0.010707855224609375, 0.011627197265625, 0.012546539306640625, 0.01346588134765625, 0.014385223388671875, 0.0153045654296875, 0.016223907470703125, 0.01714324951171875, 0.018062591552734375, 0.01898193359375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 783.0, 236.0, 3.0], "bins": [-1.6484768390655518, -1.6218676567077637, -1.5952584743499756, -1.5686492919921875, -1.5420401096343994, -1.5154309272766113, -1.4888217449188232, -1.4622125625610352, -1.4356034994125366, -1.4089943170547485, -1.3823851346969604, -1.3557759523391724, -1.3291667699813843, -1.3025575876235962, -1.2759485244750977, -1.2493393421173096, -1.222730040550232, -1.1961208581924438, -1.1695116758346558, -1.1429024934768677, -1.1162933111190796, -1.0896841287612915, -1.063075065612793, -1.0364658832550049, -1.0098567008972168, -0.9832475185394287, -0.9566383361816406, -0.9300291538238525, -0.9034200310707092, -0.8768108487129211, -0.8502016663551331, -0.823592483997345, -0.7969832420349121, -0.770374059677124, -0.7437648773193359, -0.7171556949615479, -0.6905465722084045, -0.6639373898506165, -0.6373282074928284, -0.6107190251350403, -0.5841098427772522, -0.5575006604194641, -0.530891478061676, -0.5042823553085327, -0.47767314314842224, -0.45106399059295654, -0.42445480823516846, -0.39784562587738037, -0.3712364733219147, -0.3446272909641266, -0.3180181384086609, -0.2914089560508728, -0.2647997736930847, -0.23819060623645782, -0.21158143877983093, -0.18497225642204285, -0.15836310386657715, -0.13175393640995026, -0.10514475405216217, -0.07853558659553528, -0.05192641168832779, -0.0253172367811203, 0.0012919306755065918, 0.027901113033294678, 0.05451028794050217]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 8.0, 13.0, 16.0, 23.0, 46.0, 56.0, 58.0, 72.0, 73.0, 75.0, 78.0, 65.0, 83.0, 88.0, 56.0, 44.0, 38.0, 36.0, 18.0, 15.0, 15.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048928022384643555, -0.0472177192568779, -0.045507416129112244, -0.04379710927605629, -0.042086806148290634, -0.04037650302052498, -0.038666196167469025, -0.03695589303970337, -0.035245589911937714, -0.03353528678417206, -0.0318249836564064, -0.03011467680335045, -0.028404373675584793, -0.026694070547819138, -0.024983765557408333, -0.023273460566997528, -0.021563157439231873, -0.019852854311466217, -0.018142549321055412, -0.016432244330644608, -0.014721941202878952, -0.013011637143790722, -0.011301333084702492, -0.009591029025614262, -0.007880724966526031, -0.006170420907437801, -0.004460116848349571, -0.002749812789261341, -0.001039508730173111, 0.0006707953289151192, 0.0023810993880033493, 0.0040914034470915794, 0.00580170750617981, 0.00751201156526804, 0.00922231562435627, 0.0109326196834445, 0.01264292374253273, 0.01435322780162096, 0.01606353186070919, 0.017773836851119995, 0.01948413997888565, 0.021194443106651306, 0.02290474809706211, 0.024615053087472916, 0.02632535621523857, 0.028035659343004227, 0.02974596433341503, 0.031456269323825836, 0.03316657245159149, 0.03487687557935715, 0.0365871787071228, 0.03829748556017876, 0.04000778868794441, 0.04171809181571007, 0.04342839866876602, 0.04513870179653168, 0.04684900492429733, 0.04855930805206299, 0.050269611179828644, 0.0519799180328846, 0.05369022116065025, 0.05540052428841591, 0.05711083114147186, 0.05882113426923752, 0.060531437397003174]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 9.0, 13.0, 17.0, 21.0, 31.0, 60.0, 74.0, 121.0, 201.0, 307.0, 538.0, 1046.0, 2063.0, 4525.0, 12246.0, 44698.0, 471023.0, 446801.0, 43751.0, 11993.0, 4448.0, 2103.0, 1012.0, 564.0, 338.0, 188.0, 124.0, 70.0, 54.0, 26.0, 29.0, 15.0, 11.0, 8.0, 8.0, 2.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06402587890625, -0.06219625473022461, -0.06036663055419922, -0.05853700637817383, -0.05670738220214844, -0.05487775802612305, -0.053048133850097656, -0.051218509674072266, -0.049388885498046875, -0.047559261322021484, -0.045729637145996094, -0.0439000129699707, -0.04207038879394531, -0.04024076461791992, -0.03841114044189453, -0.03658151626586914, -0.03475189208984375, -0.03292226791381836, -0.03109264373779297, -0.029263019561767578, -0.027433395385742188, -0.025603771209716797, -0.023774147033691406, -0.021944522857666016, -0.020114898681640625, -0.018285274505615234, -0.016455650329589844, -0.014626026153564453, -0.012796401977539062, -0.010966777801513672, -0.009137153625488281, -0.007307529449462891, -0.0054779052734375, -0.0036482810974121094, -0.0018186569213867188, 1.0967254638671875e-05, 0.0018405914306640625, 0.003670215606689453, 0.005499839782714844, 0.007329463958740234, 0.009159088134765625, 0.010988712310791016, 0.012818336486816406, 0.014647960662841797, 0.016477584838867188, 0.018307209014892578, 0.02013683319091797, 0.02196645736694336, 0.02379608154296875, 0.02562570571899414, 0.02745532989501953, 0.029284954071044922, 0.031114578247070312, 0.0329442024230957, 0.034773826599121094, 0.036603450775146484, 0.038433074951171875, 0.040262699127197266, 0.042092323303222656, 0.04392194747924805, 0.04575157165527344, 0.04758119583129883, 0.04941082000732422, 0.05124044418334961, 0.053070068359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 5.0, 4.0, 8.0, 10.0, 18.0, 21.0, 30.0, 39.0, 51.0, 62.0, 87.0, 64.0, 92.0, 93.0, 59.0, 64.0, 65.0, 53.0, 37.0, 23.0, 27.0, 12.0, 11.0, 16.0, 7.0, 7.0, 8.0, 3.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0196990966796875, -0.019023895263671875, -0.01834869384765625, -0.017673492431640625, -0.016998291015625, -0.016323089599609375, -0.01564788818359375, -0.014972686767578125, -0.0142974853515625, -0.013622283935546875, -0.01294708251953125, -0.012271881103515625, -0.0115966796875, -0.010921478271484375, -0.01024627685546875, -0.009571075439453125, -0.0088958740234375, -0.008220672607421875, -0.00754547119140625, -0.006870269775390625, -0.006195068359375, -0.005519866943359375, -0.00484466552734375, -0.004169464111328125, -0.0034942626953125, -0.002819061279296875, -0.00214385986328125, -0.001468658447265625, -0.00079345703125, -0.000118255615234375, 0.00055694580078125, 0.001232147216796875, 0.0019073486328125, 0.002582550048828125, 0.00325775146484375, 0.003932952880859375, 0.004608154296875, 0.005283355712890625, 0.00595855712890625, 0.006633758544921875, 0.0073089599609375, 0.007984161376953125, 0.00865936279296875, 0.009334564208984375, 0.010009765625, 0.010684967041015625, 0.01136016845703125, 0.012035369873046875, 0.0127105712890625, 0.013385772705078125, 0.01406097412109375, 0.014736175537109375, 0.015411376953125, 0.016086578369140625, 0.01676177978515625, 0.017436981201171875, 0.0181121826171875, 0.018787384033203125, 0.01946258544921875, 0.020137786865234375, 0.02081298828125, 0.021488189697265625, 0.02216339111328125, 0.022838592529296875, 0.0235137939453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 5.0, 9.0, 16.0, 16.0, 16.0, 29.0, 39.0, 48.0, 67.0, 69.0, 110.0, 138.0, 217.0, 344.0, 716.0, 2289.0, 23290.0, 946470.0, 68751.0, 3734.0, 870.0, 382.0, 280.0, 163.0, 129.0, 86.0, 56.0, 43.0, 34.0, 37.0, 20.0, 18.0, 10.0, 14.0, 9.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12234115600585938, -0.11870574951171875, -0.11507034301757812, -0.1114349365234375, -0.10779953002929688, -0.10416412353515625, -0.10052871704101562, -0.096893310546875, -0.09325790405273438, -0.08962249755859375, -0.08598709106445312, -0.0823516845703125, -0.07871627807617188, -0.07508087158203125, -0.07144546508789062, -0.06781005859375, -0.06417465209960938, -0.06053924560546875, -0.056903839111328125, -0.0532684326171875, -0.049633026123046875, -0.04599761962890625, -0.042362213134765625, -0.038726806640625, -0.035091400146484375, -0.03145599365234375, -0.027820587158203125, -0.0241851806640625, -0.020549774169921875, -0.01691436767578125, -0.013278961181640625, -0.0096435546875, -0.006008148193359375, -0.00237274169921875, 0.001262664794921875, 0.0048980712890625, 0.008533477783203125, 0.01216888427734375, 0.015804290771484375, 0.019439697265625, 0.023075103759765625, 0.02671051025390625, 0.030345916748046875, 0.0339813232421875, 0.037616729736328125, 0.04125213623046875, 0.044887542724609375, 0.04852294921875, 0.052158355712890625, 0.05579376220703125, 0.059429168701171875, 0.0630645751953125, 0.06669998168945312, 0.07033538818359375, 0.07397079467773438, 0.077606201171875, 0.08124160766601562, 0.08487701416015625, 0.08851242065429688, 0.0921478271484375, 0.09578323364257812, 0.09941864013671875, 0.10305404663085938, 0.106689453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 8.0, 13.0, 16.0, 14.0, 16.0, 13.0, 24.0, 23.0, 29.0, 35.0, 34.0, 31.0, 37.0, 45.0, 44.0, 55.0, 45.0, 46.0, 47.0, 42.0, 46.0, 32.0, 32.0, 43.0, 32.0, 36.0, 24.0, 17.0, 24.0, 12.0, 16.0, 8.0, 8.0, 12.0, 9.0, 6.0, 1.0, 4.0, 0.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07293701171875, -0.07087850570678711, -0.06881999969482422, -0.06676149368286133, -0.06470298767089844, -0.06264448165893555, -0.060585975646972656, -0.058527469635009766, -0.056468963623046875, -0.054410457611083984, -0.052351951599121094, -0.0502934455871582, -0.04823493957519531, -0.04617643356323242, -0.04411792755126953, -0.04205942153930664, -0.04000091552734375, -0.03794240951538086, -0.03588390350341797, -0.03382539749145508, -0.03176689147949219, -0.029708385467529297, -0.027649879455566406, -0.025591373443603516, -0.023532867431640625, -0.021474361419677734, -0.019415855407714844, -0.017357349395751953, -0.015298843383789062, -0.013240337371826172, -0.011181831359863281, -0.00912332534790039, -0.0070648193359375, -0.005006313323974609, -0.0029478073120117188, -0.0008893013000488281, 0.0011692047119140625, 0.003227710723876953, 0.005286216735839844, 0.007344722747802734, 0.009403228759765625, 0.011461734771728516, 0.013520240783691406, 0.015578746795654297, 0.017637252807617188, 0.019695758819580078, 0.02175426483154297, 0.02381277084350586, 0.02587127685546875, 0.02792978286743164, 0.02998828887939453, 0.03204679489135742, 0.03410530090332031, 0.0361638069152832, 0.038222312927246094, 0.040280818939208984, 0.042339324951171875, 0.044397830963134766, 0.046456336975097656, 0.04851484298706055, 0.05057334899902344, 0.05263185501098633, 0.05469036102294922, 0.05674886703491211, 0.058807373046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 10.0, 25.0, 28.0, 37.0, 57.0, 108.0, 282.0, 667.0, 2249.0, 9801.0, 902036.0, 123234.0, 7194.0, 1670.0, 580.0, 227.0, 101.0, 58.0, 50.0, 25.0, 22.0, 17.0, 12.0, 8.0, 1.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.015655517578125, -0.015149116516113281, -0.014642715454101562, -0.014136314392089844, -0.013629913330078125, -0.013123512268066406, -0.012617111206054688, -0.012110710144042969, -0.01160430908203125, -0.011097908020019531, -0.010591506958007812, -0.010085105895996094, -0.009578704833984375, -0.009072303771972656, -0.008565902709960938, -0.008059501647949219, -0.0075531005859375, -0.007046699523925781, -0.0065402984619140625, -0.006033897399902344, -0.005527496337890625, -0.005021095275878906, -0.0045146942138671875, -0.004008293151855469, -0.00350189208984375, -0.0029954910278320312, -0.0024890899658203125, -0.0019826889038085938, -0.001476287841796875, -0.0009698867797851562, -0.0004634857177734375, 4.291534423828125e-05, 0.00054931640625, 0.0010557174682617188, 0.0015621185302734375, 0.0020685195922851562, 0.002574920654296875, 0.0030813217163085938, 0.0035877227783203125, 0.004094123840332031, 0.00460052490234375, 0.005106925964355469, 0.0056133270263671875, 0.006119728088378906, 0.006626129150390625, 0.007132530212402344, 0.0076389312744140625, 0.008145332336425781, 0.0086517333984375, 0.009158134460449219, 0.009664535522460938, 0.010170936584472656, 0.010677337646484375, 0.011183738708496094, 0.011690139770507812, 0.012196540832519531, 0.01270294189453125, 0.013209342956542969, 0.013715744018554688, 0.014222145080566406, 0.014728546142578125, 0.015234947204589844, 0.015741348266601562, 0.01624774932861328, 0.016754150390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 9.0, 28.0, 56.0, 82.0, 227.0, 361.0, 113.0, 59.0, 19.0, 13.0, 7.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008444786071777344, -0.0008133724331855774, -0.0007822662591934204, -0.0007511600852012634, -0.0007200539112091064, -0.0006889477372169495, -0.0006578415632247925, -0.0006267353892326355, -0.0005956292152404785, -0.0005645230412483215, -0.0005334168672561646, -0.0005023106932640076, -0.0004712045192718506, -0.0004400983452796936, -0.0004089921712875366, -0.00037788599729537964, -0.00034677982330322266, -0.0003156736493110657, -0.0002845674753189087, -0.0002534613013267517, -0.00022235512733459473, -0.00019124895334243774, -0.00016014277935028076, -0.00012903660535812378, -9.79304313659668e-05, -6.682425737380981e-05, -3.571808338165283e-05, -4.61190938949585e-06, 2.6494264602661133e-05, 5.7600438594818115e-05, 8.87066125869751e-05, 0.00011981278657913208, 0.00015091896057128906, 0.00018202513456344604, 0.00021313130855560303, 0.00024423748254776, 0.000275343656539917, 0.000306449830532074, 0.00033755600452423096, 0.00036866217851638794, 0.0003997683525085449, 0.0004308745265007019, 0.0004619807004928589, 0.0004930868744850159, 0.0005241930484771729, 0.0005552992224693298, 0.0005864053964614868, 0.0006175115704536438, 0.0006486177444458008, 0.0006797239184379578, 0.0007108300924301147, 0.0007419362664222717, 0.0007730424404144287, 0.0008041486144065857, 0.0008352547883987427, 0.0008663609623908997, 0.0008974671363830566, 0.0009285733103752136, 0.0009596794843673706, 0.0009907856583595276, 0.0010218918323516846, 0.0010529980063438416, 0.0010841041803359985, 0.0011152103543281555, 0.0011463165283203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 13.0, 28.0, 80.0, 337.0, 4478.0, 1034398.0, 8474.0, 497.0, 121.0, 35.0, 17.0, 7.0, 9.0, 10.0, 4.0, 7.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.051727294921875, -0.050452470779418945, -0.04917764663696289, -0.047902822494506836, -0.04662799835205078, -0.04535317420959473, -0.04407835006713867, -0.04280352592468262, -0.04152870178222656, -0.04025387763977051, -0.03897905349731445, -0.0377042293548584, -0.036429405212402344, -0.03515458106994629, -0.033879756927490234, -0.03260493278503418, -0.031330108642578125, -0.03005528450012207, -0.028780460357666016, -0.02750563621520996, -0.026230812072753906, -0.02495598793029785, -0.023681163787841797, -0.022406339645385742, -0.021131515502929688, -0.019856691360473633, -0.018581867218017578, -0.017307043075561523, -0.01603221893310547, -0.014757394790649414, -0.01348257064819336, -0.012207746505737305, -0.01093292236328125, -0.009658098220825195, -0.00838327407836914, -0.007108449935913086, -0.005833625793457031, -0.0045588016510009766, -0.003283977508544922, -0.002009153366088867, -0.0007343292236328125, 0.0005404949188232422, 0.0018153190612792969, 0.0030901432037353516, 0.004364967346191406, 0.005639791488647461, 0.006914615631103516, 0.00818943977355957, 0.009464263916015625, 0.01073908805847168, 0.012013912200927734, 0.013288736343383789, 0.014563560485839844, 0.0158383846282959, 0.017113208770751953, 0.018388032913208008, 0.019662857055664062, 0.020937681198120117, 0.022212505340576172, 0.023487329483032227, 0.02476215362548828, 0.026036977767944336, 0.02731180191040039, 0.028586626052856445, 0.0298614501953125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 8.0, 3.0, 5.0, 8.0, 9.0, 3.0, 16.0, 20.0, 29.0, 36.0, 115.0, 419.0, 173.0, 58.0, 28.0, 18.0, 14.0, 5.0, 6.0, 7.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011627197265625, -0.01113438606262207, -0.01064157485961914, -0.010148763656616211, -0.009655952453613281, -0.009163141250610352, -0.008670330047607422, -0.008177518844604492, -0.0076847076416015625, -0.007191896438598633, -0.006699085235595703, -0.0062062740325927734, -0.005713462829589844, -0.005220651626586914, -0.004727840423583984, -0.004235029220581055, -0.003742218017578125, -0.0032494068145751953, -0.0027565956115722656, -0.002263784408569336, -0.0017709732055664062, -0.0012781620025634766, -0.0007853507995605469, -0.0002925395965576172, 0.0002002716064453125, 0.0006930828094482422, 0.0011858940124511719, 0.0016787052154541016, 0.0021715164184570312, 0.002664327621459961, 0.0031571388244628906, 0.0036499500274658203, 0.00414276123046875, 0.00463557243347168, 0.005128383636474609, 0.005621194839477539, 0.006114006042480469, 0.0066068172454833984, 0.007099628448486328, 0.007592439651489258, 0.008085250854492188, 0.008578062057495117, 0.009070873260498047, 0.009563684463500977, 0.010056495666503906, 0.010549306869506836, 0.011042118072509766, 0.011534929275512695, 0.012027740478515625, 0.012520551681518555, 0.013013362884521484, 0.013506174087524414, 0.013998985290527344, 0.014491796493530273, 0.014984607696533203, 0.015477418899536133, 0.015970230102539062, 0.016463041305541992, 0.016955852508544922, 0.01744866371154785, 0.01794147491455078, 0.01843428611755371, 0.01892709732055664, 0.01941990852355957, 0.0199127197265625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 18.0, 141.0, 721.0, 109.0, 12.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2854030132293701, -0.2550022006034851, -0.2246014028787613, -0.19420060515403748, -0.16379979252815247, -0.13339897990226746, -0.10299818217754364, -0.07259738445281982, -0.042196571826934814, -0.011795766651630402, 0.01860503852367401, 0.049005843698978424, 0.07940664887428284, 0.10980746150016785, 0.14020825922489166, 0.17060905694961548, 0.2010098695755005, 0.2314106822013855, 0.2618114948272705, 0.29221227765083313, 0.32261309027671814, 0.35301390290260315, 0.38341468572616577, 0.4138154983520508, 0.4442163109779358, 0.4746171236038208, 0.5050179362297058, 0.5354187488555908, 0.565819501876831, 0.5962203741073608, 0.6266211271286011, 0.6570219397544861, 0.6874227523803711, 0.7178235650062561, 0.7482243776321411, 0.7786251902580261, 0.8090260028839111, 0.8394267559051514, 0.8698275685310364, 0.9002283811569214, 0.9306291937828064, 0.9610300064086914, 0.9914308190345764, 1.0218316316604614, 1.0522323846817017, 1.0826332569122314, 1.1130340099334717, 1.143434762954712, 1.1738356351852417, 1.204236388206482, 1.2346372604370117, 1.265038013458252, 1.2954388856887817, 1.325839638710022, 1.3562405109405518, 1.386641263961792, 1.4170420169830322, 1.4474427700042725, 1.4778436422348022, 1.5082443952560425, 1.5386452674865723, 1.5690460205078125, 1.5994468927383423, 1.6298476457595825, 1.6602485179901123]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 5.0, 8.0, 7.0, 12.0, 14.0, 19.0, 13.0, 21.0, 28.0, 28.0, 20.0, 20.0, 32.0, 29.0, 30.0, 36.0, 37.0, 45.0, 45.0, 55.0, 43.0, 48.0, 40.0, 46.0, 28.0, 38.0, 31.0, 27.0, 31.0, 27.0, 18.0, 19.0, 15.0, 19.0, 9.0, 14.0, 11.0, 6.0, 11.0, 3.0, 0.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2896274924278259, -0.28044748306274414, -0.27126750349998474, -0.26208749413490295, -0.25290748476982117, -0.24372749030590057, -0.23454749584197998, -0.2253674864768982, -0.2161874771118164, -0.2070074826478958, -0.19782747328281403, -0.18864747881889343, -0.17946746945381165, -0.17028747498989105, -0.16110748052597046, -0.15192747116088867, -0.14274747669696808, -0.13356748223304749, -0.1243874728679657, -0.1152074784040451, -0.10602746903896332, -0.09684747457504272, -0.08766747266054153, -0.07848747074604034, -0.06930746883153915, -0.060127466917037964, -0.050947465002536774, -0.04176746681332588, -0.03258746489882469, -0.0234074629843235, -0.01422746479511261, -0.00504746288061142, 0.0041325390338897705, 0.013312540017068386, 0.022492541000247, 0.03167254105210304, 0.04085254296660423, 0.05003254488110542, 0.059212543070316315, 0.0683925449848175, 0.0775725468993187, 0.08675254881381989, 0.09593255072832108, 0.10511255264282227, 0.11429254710674286, 0.12347255647182465, 0.13265255093574524, 0.14183256030082703, 0.15101255476474762, 0.1601925492286682, 0.16937255859375, 0.1785525530576706, 0.18773256242275238, 0.19691255688667297, 0.20609256625175476, 0.21527256071567535, 0.22445255517959595, 0.23363254964351654, 0.24281255900859833, 0.2519925534725189, 0.2611725628376007, 0.2703525722026825, 0.2795325517654419, 0.2887125611305237, 0.29789257049560547]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 8.0, 4.0, 8.0, 9.0, 18.0, 12.0, 28.0, 44.0, 45.0, 69.0, 69.0, 300.0, 6157.0, 4184446.0, 2529.0, 208.0, 82.0, 58.0, 49.0, 29.0, 20.0, 17.0, 9.0, 14.0, 14.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0521240234375, -0.05040931701660156, -0.048694610595703125, -0.04697990417480469, -0.04526519775390625, -0.04355049133300781, -0.041835784912109375, -0.04012107849121094, -0.0384063720703125, -0.03669166564941406, -0.034976959228515625, -0.03326225280761719, -0.03154754638671875, -0.029832839965820312, -0.028118133544921875, -0.026403427124023438, -0.024688720703125, -0.022974014282226562, -0.021259307861328125, -0.019544601440429688, -0.01782989501953125, -0.016115188598632812, -0.014400482177734375, -0.012685775756835938, -0.0109710693359375, -0.009256362915039062, -0.007541656494140625, -0.0058269500732421875, -0.00411224365234375, -0.0023975372314453125, -0.000682830810546875, 0.0010318756103515625, 0.00274658203125, 0.0044612884521484375, 0.006175994873046875, 0.007890701293945312, 0.00960540771484375, 0.011320114135742188, 0.013034820556640625, 0.014749526977539062, 0.0164642333984375, 0.018178939819335938, 0.019893646240234375, 0.021608352661132812, 0.02332305908203125, 0.025037765502929688, 0.026752471923828125, 0.028467178344726562, 0.030181884765625, 0.03189659118652344, 0.033611297607421875, 0.03532600402832031, 0.03704071044921875, 0.03875541687011719, 0.040470123291015625, 0.04218482971191406, 0.0438995361328125, 0.04561424255371094, 0.047328948974609375, 0.04904365539550781, 0.05075836181640625, 0.05247306823730469, 0.054187774658203125, 0.05590248107910156, 0.0576171875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 7.0, 4.0, 7.0, 13.0, 15.0, 13.0, 30.0, 40.0, 49.0, 64.0, 59.0, 72.0, 103.0, 96.0, 67.0, 58.0, 59.0, 57.0, 44.0, 26.0, 23.0, 21.0, 10.0, 10.0, 13.0, 11.0, 6.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020294189453125, -0.019627094268798828, -0.018959999084472656, -0.018292903900146484, -0.017625808715820312, -0.01695871353149414, -0.01629161834716797, -0.015624523162841797, -0.014957427978515625, -0.014290332794189453, -0.013623237609863281, -0.01295614242553711, -0.012289047241210938, -0.011621952056884766, -0.010954856872558594, -0.010287761688232422, -0.00962066650390625, -0.008953571319580078, -0.008286476135253906, -0.007619380950927734, -0.0069522857666015625, -0.006285190582275391, -0.005618095397949219, -0.004951000213623047, -0.004283905029296875, -0.003616809844970703, -0.0029497146606445312, -0.0022826194763183594, -0.0016155242919921875, -0.0009484291076660156, -0.00028133392333984375, 0.0003857612609863281, 0.0010528564453125, 0.0017199516296386719, 0.0023870468139648438, 0.0030541419982910156, 0.0037212371826171875, 0.004388332366943359, 0.005055427551269531, 0.005722522735595703, 0.006389617919921875, 0.007056713104248047, 0.007723808288574219, 0.00839090347290039, 0.009057998657226562, 0.009725093841552734, 0.010392189025878906, 0.011059284210205078, 0.01172637939453125, 0.012393474578857422, 0.013060569763183594, 0.013727664947509766, 0.014394760131835938, 0.01506185531616211, 0.01572895050048828, 0.016396045684814453, 0.017063140869140625, 0.017730236053466797, 0.01839733123779297, 0.01906442642211914, 0.019731521606445312, 0.020398616790771484, 0.021065711975097656, 0.021732807159423828, 0.02239990234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 4.0, 12.0, 28.0, 103.0, 336.0, 1141.0, 6974.0, 4176963.0, 7167.0, 1089.0, 298.0, 96.0, 32.0, 16.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0654296875, -0.0634164810180664, -0.06140327453613281, -0.05939006805419922, -0.057376861572265625, -0.05536365509033203, -0.05335044860839844, -0.051337242126464844, -0.04932403564453125, -0.047310829162597656, -0.04529762268066406, -0.04328441619873047, -0.041271209716796875, -0.03925800323486328, -0.03724479675292969, -0.035231590270996094, -0.0332183837890625, -0.031205177307128906, -0.029191970825195312, -0.02717876434326172, -0.025165557861328125, -0.02315235137939453, -0.021139144897460938, -0.019125938415527344, -0.01711273193359375, -0.015099525451660156, -0.013086318969726562, -0.011073112487792969, -0.009059906005859375, -0.007046699523925781, -0.0050334930419921875, -0.0030202865600585938, -0.001007080078125, 0.0010061264038085938, 0.0030193328857421875, 0.005032539367675781, 0.007045745849609375, 0.009058952331542969, 0.011072158813476562, 0.013085365295410156, 0.01509857177734375, 0.017111778259277344, 0.019124984741210938, 0.02113819122314453, 0.023151397705078125, 0.02516460418701172, 0.027177810668945312, 0.029191017150878906, 0.0312042236328125, 0.033217430114746094, 0.03523063659667969, 0.03724384307861328, 0.039257049560546875, 0.04127025604248047, 0.04328346252441406, 0.045296669006347656, 0.04730987548828125, 0.049323081970214844, 0.05133628845214844, 0.05334949493408203, 0.055362701416015625, 0.05737590789794922, 0.05938911437988281, 0.061402320861816406, 0.06341552734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 10.0, 24.0, 328.0, 3633.0, 36.0, 16.0, 7.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0162353515625, -0.015729427337646484, -0.015223503112792969, -0.014717578887939453, -0.014211654663085938, -0.013705730438232422, -0.013199806213378906, -0.01269388198852539, -0.012187957763671875, -0.01168203353881836, -0.011176109313964844, -0.010670185089111328, -0.010164260864257812, -0.009658336639404297, -0.009152412414550781, -0.008646488189697266, -0.00814056396484375, -0.007634639739990234, -0.007128715515136719, -0.006622791290283203, -0.0061168670654296875, -0.005610942840576172, -0.005105018615722656, -0.004599094390869141, -0.004093170166015625, -0.0035872459411621094, -0.0030813217163085938, -0.002575397491455078, -0.0020694732666015625, -0.0015635490417480469, -0.0010576248168945312, -0.0005517005920410156, -4.57763671875e-05, 0.0004601478576660156, 0.0009660720825195312, 0.0014719963073730469, 0.0019779205322265625, 0.002483844757080078, 0.0029897689819335938, 0.0034956932067871094, 0.004001617431640625, 0.004507541656494141, 0.005013465881347656, 0.005519390106201172, 0.0060253143310546875, 0.006531238555908203, 0.007037162780761719, 0.007543087005615234, 0.00804901123046875, 0.008554935455322266, 0.009060859680175781, 0.009566783905029297, 0.010072708129882812, 0.010578632354736328, 0.011084556579589844, 0.01159048080444336, 0.012096405029296875, 0.01260232925415039, 0.013108253479003906, 0.013614177703857422, 0.014120101928710938, 0.014626026153564453, 0.015131950378417969, 0.015637874603271484, 0.016143798828125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 8.0, 19.0, 62.0, 369.0, 447.0, 88.0, 12.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09399300068616867, -0.09218736737966537, -0.09038172662258148, -0.08857609331607819, -0.08677046000957489, -0.084964819252491, -0.0831591859459877, -0.0813535526394844, -0.07954791188240051, -0.07774227857589722, -0.07593663781881332, -0.07413100451231003, -0.07232537120580673, -0.07051973044872284, -0.06871409714221954, -0.06690846383571625, -0.06510283052921295, -0.06329719722270966, -0.06149156019091606, -0.05968592315912247, -0.05788028612732887, -0.05607464909553528, -0.05426901578903198, -0.05246337875723839, -0.050657741725444794, -0.0488521046936512, -0.0470464713871479, -0.04524083435535431, -0.043435197323560715, -0.04162956029176712, -0.039823926985263824, -0.03801828995347023, -0.036212652921676636, -0.03440701588988304, -0.032601382583379745, -0.03079574555158615, -0.028990108519792557, -0.02718447335064411, -0.025378838181495667, -0.023573201149702072, -0.021767565980553627, -0.019961930811405182, -0.018156293779611588, -0.016350658610463142, -0.014545022509992123, -0.012739386409521103, -0.010933751240372658, -0.009128115139901638, -0.007322479039430618, -0.0055168429389595985, -0.003711207304149866, -0.0019055716693401337, -9.993556886911392e-05, 0.0017057005316019058, 0.003511335700750351, 0.005316971801221371, 0.0071226079016923904, 0.00892824400216341, 0.01073388010263443, 0.012539515271782875, 0.014345151372253895, 0.016150787472724915, 0.01795642264187336, 0.019762057811021805, 0.0215676948428154]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 1.0, 4.0, 9.0, 11.0, 14.0, 18.0, 7.0, 15.0, 31.0, 28.0, 33.0, 39.0, 43.0, 38.0, 44.0, 53.0, 66.0, 47.0, 50.0, 56.0, 49.0, 58.0, 50.0, 36.0, 41.0, 22.0, 28.0, 31.0, 23.0, 17.0, 11.0, 5.0, 6.0, 5.0, 7.0, 0.0, 5.0, 5.0, 1.0, 1.0, 3.0], "bins": [-0.02752143144607544, -0.026845330372452736, -0.026169229298830032, -0.02549312822520733, -0.024817027151584625, -0.02414092607796192, -0.023464825004339218, -0.022788723930716515, -0.02211262285709381, -0.021436521783471107, -0.020760420709848404, -0.0200843196362257, -0.019408218562602997, -0.018732117488980293, -0.01805601641535759, -0.017379915341734886, -0.016703814268112183, -0.01602771319448948, -0.015351612120866776, -0.014675511047244072, -0.013999409973621368, -0.013323308899998665, -0.012647207826375961, -0.011971106752753258, -0.011295005679130554, -0.01061890460550785, -0.009942803531885147, -0.009266702458262444, -0.00859060138463974, -0.007914500311017036, -0.007238399237394333, -0.006562298163771629, -0.005886197090148926, -0.005210096016526222, -0.004533994942903519, -0.003857893869280815, -0.0031817927956581116, -0.002505691722035408, -0.0018295906484127045, -0.001153489574790001, -0.00047738850116729736, 0.0001987125724554062, 0.0008748136460781097, 0.0015509147197008133, 0.002227015793323517, 0.0029031168669462204, 0.003579217940568924, 0.0042553190141916275, 0.004931420087814331, 0.005607521161437035, 0.006283622235059738, 0.006959723308682442, 0.007635824382305145, 0.008311925455927849, 0.008988026529550552, 0.009664127603173256, 0.01034022867679596, 0.011016329750418663, 0.011692430824041367, 0.01236853189766407, 0.013044632971286774, 0.013720734044909477, 0.01439683511853218, 0.015072936192154884, 0.015749037265777588]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 8.0, 15.0, 11.0, 16.0, 23.0, 37.0, 49.0, 78.0, 106.0, 145.0, 198.0, 324.0, 418.0, 692.0, 1049.0, 1664.0, 2749.0, 4711.0, 9253.0, 19131.0, 46417.0, 154268.0, 582688.0, 141296.0, 43934.0, 18321.0, 8767.0, 4762.0, 2638.0, 1663.0, 1051.0, 639.0, 415.0, 304.0, 217.0, 141.0, 90.0, 77.0, 49.0, 36.0, 33.0, 18.0, 9.0, 9.0, 11.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0241851806640625, -0.0233914852142334, -0.022597789764404297, -0.021804094314575195, -0.021010398864746094, -0.020216703414916992, -0.01942300796508789, -0.01862931251525879, -0.017835617065429688, -0.017041921615600586, -0.016248226165771484, -0.015454530715942383, -0.014660835266113281, -0.01386713981628418, -0.013073444366455078, -0.012279748916625977, -0.011486053466796875, -0.010692358016967773, -0.009898662567138672, -0.00910496711730957, -0.008311271667480469, -0.007517576217651367, -0.006723880767822266, -0.005930185317993164, -0.0051364898681640625, -0.004342794418334961, -0.0035490989685058594, -0.002755403518676758, -0.0019617080688476562, -0.0011680126190185547, -0.0003743171691894531, 0.00041937828063964844, 0.00121307373046875, 0.0020067691802978516, 0.002800464630126953, 0.0035941600799560547, 0.004387855529785156, 0.005181550979614258, 0.005975246429443359, 0.006768941879272461, 0.0075626373291015625, 0.008356332778930664, 0.009150028228759766, 0.009943723678588867, 0.010737419128417969, 0.01153111457824707, 0.012324810028076172, 0.013118505477905273, 0.013912200927734375, 0.014705896377563477, 0.015499591827392578, 0.01629328727722168, 0.01708698272705078, 0.017880678176879883, 0.018674373626708984, 0.019468069076538086, 0.020261764526367188, 0.02105545997619629, 0.02184915542602539, 0.022642850875854492, 0.023436546325683594, 0.024230241775512695, 0.025023937225341797, 0.0258176326751709, 0.026611328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 7.0, 8.0, 20.0, 13.0, 23.0, 46.0, 48.0, 62.0, 65.0, 70.0, 101.0, 98.0, 66.0, 62.0, 56.0, 54.0, 49.0, 25.0, 23.0, 20.0, 10.0, 13.0, 11.0, 9.0, 8.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020294189453125, -0.01962733268737793, -0.01896047592163086, -0.01829361915588379, -0.01762676239013672, -0.01695990562438965, -0.016293048858642578, -0.015626192092895508, -0.014959335327148438, -0.014292478561401367, -0.013625621795654297, -0.012958765029907227, -0.012291908264160156, -0.011625051498413086, -0.010958194732666016, -0.010291337966918945, -0.009624481201171875, -0.008957624435424805, -0.008290767669677734, -0.007623910903930664, -0.006957054138183594, -0.0062901973724365234, -0.005623340606689453, -0.004956483840942383, -0.0042896270751953125, -0.003622770309448242, -0.002955913543701172, -0.0022890567779541016, -0.0016222000122070312, -0.0009553432464599609, -0.0002884864807128906, 0.0003783702850341797, 0.00104522705078125, 0.0017120838165283203, 0.0023789405822753906, 0.003045797348022461, 0.0037126541137695312, 0.0043795108795166016, 0.005046367645263672, 0.005713224411010742, 0.0063800811767578125, 0.007046937942504883, 0.007713794708251953, 0.008380651473999023, 0.009047508239746094, 0.009714365005493164, 0.010381221771240234, 0.011048078536987305, 0.011714935302734375, 0.012381792068481445, 0.013048648834228516, 0.013715505599975586, 0.014382362365722656, 0.015049219131469727, 0.015716075897216797, 0.016382932662963867, 0.017049789428710938, 0.017716646194458008, 0.018383502960205078, 0.01905035972595215, 0.01971721649169922, 0.02038407325744629, 0.02105093002319336, 0.02171778678894043, 0.0223846435546875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 9.0, 1.0, 5.0, 3.0, 10.0, 13.0, 14.0, 12.0, 11.0, 18.0, 32.0, 37.0, 47.0, 51.0, 50.0, 80.0, 105.0, 157.0, 291.0, 646.0, 3578.0, 74931.0, 936540.0, 28504.0, 2132.0, 453.0, 225.0, 141.0, 82.0, 93.0, 64.0, 54.0, 27.0, 27.0, 24.0, 22.0, 10.0, 13.0, 7.0, 6.0, 5.0, 6.0, 5.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.10369873046875, -0.10076618194580078, -0.09783363342285156, -0.09490108489990234, -0.09196853637695312, -0.0890359878540039, -0.08610343933105469, -0.08317089080810547, -0.08023834228515625, -0.07730579376220703, -0.07437324523925781, -0.0714406967163086, -0.06850814819335938, -0.06557559967041016, -0.06264305114746094, -0.05971050262451172, -0.0567779541015625, -0.05384540557861328, -0.05091285705566406, -0.047980308532714844, -0.045047760009765625, -0.042115211486816406, -0.03918266296386719, -0.03625011444091797, -0.03331756591796875, -0.03038501739501953, -0.027452468872070312, -0.024519920349121094, -0.021587371826171875, -0.018654823303222656, -0.015722274780273438, -0.012789726257324219, -0.009857177734375, -0.006924629211425781, -0.0039920806884765625, -0.0010595321655273438, 0.001873016357421875, 0.004805564880371094, 0.0077381134033203125, 0.010670661926269531, 0.01360321044921875, 0.01653575897216797, 0.019468307495117188, 0.022400856018066406, 0.025333404541015625, 0.028265953063964844, 0.031198501586914062, 0.03413105010986328, 0.0370635986328125, 0.03999614715576172, 0.04292869567871094, 0.045861244201660156, 0.048793792724609375, 0.051726341247558594, 0.05465888977050781, 0.05759143829345703, 0.06052398681640625, 0.06345653533935547, 0.06638908386230469, 0.0693216323852539, 0.07225418090820312, 0.07518672943115234, 0.07811927795410156, 0.08105182647705078, 0.083984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 4.0, 5.0, 4.0, 4.0, 6.0, 8.0, 8.0, 8.0, 7.0, 15.0, 26.0, 16.0, 24.0, 26.0, 19.0, 26.0, 24.0, 33.0, 30.0, 28.0, 49.0, 49.0, 40.0, 46.0, 55.0, 49.0, 42.0, 25.0, 28.0, 28.0, 31.0, 33.0, 22.0, 28.0, 22.0, 15.0, 16.0, 17.0, 15.0, 15.0, 16.0, 4.0, 4.0, 4.0, 5.0, 6.0, 4.0, 10.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05029296875, -0.048638343811035156, -0.04698371887207031, -0.04532909393310547, -0.043674468994140625, -0.04201984405517578, -0.04036521911621094, -0.038710594177246094, -0.03705596923828125, -0.035401344299316406, -0.03374671936035156, -0.03209209442138672, -0.030437469482421875, -0.02878284454345703, -0.027128219604492188, -0.025473594665527344, -0.0238189697265625, -0.022164344787597656, -0.020509719848632812, -0.01885509490966797, -0.017200469970703125, -0.015545845031738281, -0.013891220092773438, -0.012236595153808594, -0.01058197021484375, -0.008927345275878906, -0.0072727203369140625, -0.005618095397949219, -0.003963470458984375, -0.0023088455200195312, -0.0006542205810546875, 0.0010004043579101562, 0.002655029296875, 0.004309654235839844, 0.0059642791748046875, 0.007618904113769531, 0.009273529052734375, 0.010928153991699219, 0.012582778930664062, 0.014237403869628906, 0.01589202880859375, 0.017546653747558594, 0.019201278686523438, 0.02085590362548828, 0.022510528564453125, 0.02416515350341797, 0.025819778442382812, 0.027474403381347656, 0.0291290283203125, 0.030783653259277344, 0.03243827819824219, 0.03409290313720703, 0.035747528076171875, 0.03740215301513672, 0.03905677795410156, 0.040711402893066406, 0.04236602783203125, 0.044020652770996094, 0.04567527770996094, 0.04732990264892578, 0.048984527587890625, 0.05063915252685547, 0.05229377746582031, 0.053948402404785156, 0.05560302734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 14.0, 10.0, 16.0, 25.0, 55.0, 77.0, 217.0, 990.0, 893407.0, 152589.0, 732.0, 183.0, 90.0, 50.0, 24.0, 17.0, 13.0, 6.0, 12.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01480865478515625, -0.01431429386138916, -0.01381993293762207, -0.01332557201385498, -0.01283121109008789, -0.0123368501663208, -0.011842489242553711, -0.011348128318786621, -0.010853767395019531, -0.010359406471252441, -0.009865045547485352, -0.009370684623718262, -0.008876323699951172, -0.008381962776184082, -0.007887601852416992, -0.007393240928649902, -0.0068988800048828125, -0.006404519081115723, -0.005910158157348633, -0.005415797233581543, -0.004921436309814453, -0.004427075386047363, -0.0039327144622802734, -0.0034383535385131836, -0.0029439926147460938, -0.002449631690979004, -0.001955270767211914, -0.0014609098434448242, -0.0009665489196777344, -0.00047218799591064453, 2.2172927856445312e-05, 0.0005165338516235352, 0.001010894775390625, 0.0015052556991577148, 0.0019996166229248047, 0.0024939775466918945, 0.0029883384704589844, 0.0034826993942260742, 0.003977060317993164, 0.004471421241760254, 0.004965782165527344, 0.005460143089294434, 0.0059545040130615234, 0.006448864936828613, 0.006943225860595703, 0.007437586784362793, 0.007931947708129883, 0.008426308631896973, 0.008920669555664062, 0.009415030479431152, 0.009909391403198242, 0.010403752326965332, 0.010898113250732422, 0.011392474174499512, 0.011886835098266602, 0.012381196022033691, 0.012875556945800781, 0.013369917869567871, 0.013864278793334961, 0.01435863971710205, 0.01485300064086914, 0.01534736156463623, 0.01584172248840332, 0.01633608341217041, 0.0168304443359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 5.0, 4.0, 2.0, 3.0, 11.0, 9.0, 9.0, 19.0, 30.0, 62.0, 115.0, 314.0, 219.0, 77.0, 40.0, 23.0, 15.0, 3.0, 8.0, 8.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017976760864257812, -0.00017371401190757751, -0.0001676604151725769, -0.0001616068184375763, -0.00015555322170257568, -0.00014949962496757507, -0.00014344602823257446, -0.00013739243149757385, -0.00013133883476257324, -0.00012528523802757263, -0.00011923164129257202, -0.00011317804455757141, -0.0001071244478225708, -0.00010107085108757019, -9.501725435256958e-05, -8.896365761756897e-05, -8.291006088256836e-05, -7.685646414756775e-05, -7.080286741256714e-05, -6.474927067756653e-05, -5.869567394256592e-05, -5.264207720756531e-05, -4.65884804725647e-05, -4.053488373756409e-05, -3.4481287002563477e-05, -2.8427690267562866e-05, -2.2374093532562256e-05, -1.6320496797561646e-05, -1.0266900062561035e-05, -4.213303327560425e-06, 1.8402934074401855e-06, 7.893890142440796e-06, 1.3947486877441406e-05, 2.0001083612442017e-05, 2.6054680347442627e-05, 3.210827708244324e-05, 3.816187381744385e-05, 4.421547055244446e-05, 5.026906728744507e-05, 5.632266402244568e-05, 6.237626075744629e-05, 6.84298574924469e-05, 7.448345422744751e-05, 8.053705096244812e-05, 8.659064769744873e-05, 9.264424443244934e-05, 9.869784116744995e-05, 0.00010475143790245056, 0.00011080503463745117, 0.00011685863137245178, 0.0001229122281074524, 0.000128965824842453, 0.0001350194215774536, 0.00014107301831245422, 0.00014712661504745483, 0.00015318021178245544, 0.00015923380851745605, 0.00016528740525245667, 0.00017134100198745728, 0.00017739459872245789, 0.0001834481954574585, 0.0001895017921924591, 0.00019555538892745972, 0.00020160898566246033, 0.00020766258239746094]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 6.0, 17.0, 17.0, 35.0, 92.0, 524.0, 9922.0, 1033834.0, 3600.0, 347.0, 70.0, 24.0, 16.0, 14.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.020538330078125, -0.019922733306884766, -0.01930713653564453, -0.018691539764404297, -0.018075942993164062, -0.017460346221923828, -0.016844749450683594, -0.01622915267944336, -0.015613555908203125, -0.01499795913696289, -0.014382362365722656, -0.013766765594482422, -0.013151168823242188, -0.012535572052001953, -0.011919975280761719, -0.011304378509521484, -0.01068878173828125, -0.010073184967041016, -0.009457588195800781, -0.008841991424560547, -0.008226394653320312, -0.007610797882080078, -0.006995201110839844, -0.006379604339599609, -0.005764007568359375, -0.005148410797119141, -0.004532814025878906, -0.003917217254638672, -0.0033016204833984375, -0.002686023712158203, -0.0020704269409179688, -0.0014548301696777344, -0.0008392333984375, -0.00022363662719726562, 0.00039196014404296875, 0.0010075569152832031, 0.0016231536865234375, 0.002238750457763672, 0.0028543472290039062, 0.0034699440002441406, 0.004085540771484375, 0.004701137542724609, 0.005316734313964844, 0.005932331085205078, 0.0065479278564453125, 0.007163524627685547, 0.007779121398925781, 0.008394718170166016, 0.00901031494140625, 0.009625911712646484, 0.010241508483886719, 0.010857105255126953, 0.011472702026367188, 0.012088298797607422, 0.012703895568847656, 0.01331949234008789, 0.013935089111328125, 0.01455068588256836, 0.015166282653808594, 0.015781879425048828, 0.016397476196289062, 0.017013072967529297, 0.01762866973876953, 0.018244266510009766, 0.01885986328125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 15.0, 18.0, 35.0, 62.0, 132.0, 285.0, 199.0, 99.0, 48.0, 28.0, 17.0, 14.0, 10.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00852203369140625, -0.00824582576751709, -0.00796961784362793, -0.0076934099197387695, -0.007417201995849609, -0.007140994071960449, -0.006864786148071289, -0.006588578224182129, -0.006312370300292969, -0.006036162376403809, -0.0057599544525146484, -0.005483746528625488, -0.005207538604736328, -0.004931330680847168, -0.004655122756958008, -0.004378914833068848, -0.0041027069091796875, -0.0038264989852905273, -0.003550291061401367, -0.003274083137512207, -0.002997875213623047, -0.0027216672897338867, -0.0024454593658447266, -0.0021692514419555664, -0.0018930435180664062, -0.001616835594177246, -0.001340627670288086, -0.0010644197463989258, -0.0007882118225097656, -0.0005120038986206055, -0.0002357959747314453, 4.0411949157714844e-05, 0.000316619873046875, 0.0005928277969360352, 0.0008690357208251953, 0.0011452436447143555, 0.0014214515686035156, 0.0016976594924926758, 0.001973867416381836, 0.002250075340270996, 0.0025262832641601562, 0.0028024911880493164, 0.0030786991119384766, 0.0033549070358276367, 0.003631114959716797, 0.003907322883605957, 0.004183530807495117, 0.004459738731384277, 0.0047359466552734375, 0.005012154579162598, 0.005288362503051758, 0.005564570426940918, 0.005840778350830078, 0.006116986274719238, 0.0063931941986083984, 0.006669402122497559, 0.006945610046386719, 0.007221817970275879, 0.007498025894165039, 0.007774233818054199, 0.00805044174194336, 0.00832664966583252, 0.00860285758972168, 0.00887906551361084, 0.0091552734375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 11.0, 449.0, 531.0, 21.0, 5.0, 0.0, 2.0], "bins": [-2.8113479614257812, -2.7637081146240234, -2.7160680294036865, -2.6684279441833496, -2.620788097381592, -2.573148250579834, -2.525508165359497, -2.47786808013916, -2.4302282333374023, -2.3825883865356445, -2.3349483013153076, -2.2873082160949707, -2.239668369293213, -2.192028522491455, -2.144388437271118, -2.0967483520507812, -2.0491085052490234, -2.0014686584472656, -1.9538285732269287, -1.9061886072158813, -1.858548641204834, -1.8109086751937866, -1.7632687091827393, -1.715628743171692, -1.6679887771606445, -1.6203488111495972, -1.5727088451385498, -1.5250688791275024, -1.477428913116455, -1.4297889471054077, -1.3821489810943604, -1.334509015083313, -1.286868929862976, -1.2392289638519287, -1.1915889978408813, -1.143949031829834, -1.0963090658187866, -1.0486690998077393, -1.001029133796692, -0.9533891677856445, -0.9057492017745972, -0.8581092357635498, -0.8104692697525024, -0.7628293037414551, -0.7151893377304077, -0.6675493717193604, -0.619909405708313, -0.5722694396972656, -0.5246294736862183, -0.4769895076751709, -0.42934954166412354, -0.38170957565307617, -0.3340696096420288, -0.28642964363098145, -0.23878967761993408, -0.19114971160888672, -0.14350977540016174, -0.09586980938911438, -0.04822984337806702, -0.0005898773670196533, 0.04705008864402771, 0.09469005465507507, 0.14233002066612244, 0.1899699866771698, 0.23760995268821716]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 8.0, 6.0, 7.0, 5.0, 11.0, 22.0, 13.0, 22.0, 18.0, 25.0, 31.0, 33.0, 38.0, 34.0, 31.0, 41.0, 52.0, 53.0, 35.0, 44.0, 35.0, 41.0, 39.0, 28.0, 43.0, 30.0, 32.0, 36.0, 24.0, 37.0, 21.0, 21.0, 15.0, 11.0, 12.0, 10.0, 8.0, 7.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2521507740020752, -0.24320858716964722, -0.23426640033721924, -0.22532421350479126, -0.21638204157352448, -0.2074398547410965, -0.19849766790866852, -0.18955549597740173, -0.18061330914497375, -0.17167112231254578, -0.1627289354801178, -0.15378674864768982, -0.14484457671642303, -0.13590238988399506, -0.12696020305156708, -0.1180180236697197, -0.10907582938671112, -0.10013364255428314, -0.09119146317243576, -0.08224927634000778, -0.0733070969581604, -0.06436491012573242, -0.05542272329330444, -0.04648054391145706, -0.03753835707902908, -0.028596173971891403, -0.019653989002108574, -0.010711804032325745, -0.0017696209251880646, 0.0071725621819496155, 0.016114749014377594, 0.025056928396224976, 0.033999115228652954, 0.042941298335790634, 0.051883481442928314, 0.06082566827535629, 0.06976784765720367, 0.07871003448963165, 0.08765222132205963, 0.09659440070390701, 0.10553658753633499, 0.11447877436876297, 0.12342095375061035, 0.13236314058303833, 0.1413053274154663, 0.1502475142478943, 0.15918970108032227, 0.16813187301158905, 0.17707405984401703, 0.186016246676445, 0.19495843350887299, 0.20390060544013977, 0.21284279227256775, 0.22178497910499573, 0.2307271659374237, 0.23966935276985168, 0.24861153960227966, 0.25755372643470764, 0.2664959132671356, 0.2754381000995636, 0.2843802869319916, 0.29332244396209717, 0.30226463079452515, 0.3112068176269531, 0.3201490044593811]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 5.0, 7.0, 11.0, 9.0, 17.0, 23.0, 36.0, 66.0, 88.0, 112.0, 228.0, 476.0, 2141.0, 4187700.0, 2230.0, 468.0, 222.0, 130.0, 92.0, 69.0, 32.0, 23.0, 16.0, 22.0, 13.0, 9.0, 7.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11077880859375, -0.10737228393554688, -0.10396575927734375, -0.10055923461914062, -0.0971527099609375, -0.09374618530273438, -0.09033966064453125, -0.08693313598632812, -0.083526611328125, -0.08012008666992188, -0.07671356201171875, -0.07330703735351562, -0.0699005126953125, -0.06649398803710938, -0.06308746337890625, -0.059680938720703125, -0.0562744140625, -0.052867889404296875, -0.04946136474609375, -0.046054840087890625, -0.0426483154296875, -0.039241790771484375, -0.03583526611328125, -0.032428741455078125, -0.029022216796875, -0.025615692138671875, -0.02220916748046875, -0.018802642822265625, -0.0153961181640625, -0.011989593505859375, -0.00858306884765625, -0.005176544189453125, -0.00177001953125, 0.001636505126953125, 0.00504302978515625, 0.008449554443359375, 0.0118560791015625, 0.015262603759765625, 0.01866912841796875, 0.022075653076171875, 0.025482177734375, 0.028888702392578125, 0.03229522705078125, 0.035701751708984375, 0.0391082763671875, 0.042514801025390625, 0.04592132568359375, 0.049327850341796875, 0.052734375, 0.056140899658203125, 0.05954742431640625, 0.06295394897460938, 0.0663604736328125, 0.06976699829101562, 0.07317352294921875, 0.07658004760742188, 0.079986572265625, 0.08339309692382812, 0.08679962158203125, 0.09020614624023438, 0.0936126708984375, 0.09701919555664062, 0.10042572021484375, 0.10383224487304688, 0.10723876953125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 5.0, 6.0, 11.0, 9.0, 11.0, 19.0, 26.0, 42.0, 49.0, 52.0, 83.0, 75.0, 95.0, 83.0, 78.0, 52.0, 70.0, 49.0, 40.0, 38.0, 18.0, 17.0, 11.0, 15.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0207977294921875, -0.02015519142150879, -0.019512653350830078, -0.018870115280151367, -0.018227577209472656, -0.017585039138793945, -0.016942501068115234, -0.016299962997436523, -0.015657424926757812, -0.015014886856079102, -0.01437234878540039, -0.01372981071472168, -0.013087272644042969, -0.012444734573364258, -0.011802196502685547, -0.011159658432006836, -0.010517120361328125, -0.009874582290649414, -0.009232044219970703, -0.008589506149291992, -0.007946968078613281, -0.00730443000793457, -0.006661891937255859, -0.0060193538665771484, -0.0053768157958984375, -0.0047342777252197266, -0.004091739654541016, -0.0034492015838623047, -0.0028066635131835938, -0.002164125442504883, -0.0015215873718261719, -0.0008790493011474609, -0.00023651123046875, 0.00040602684020996094, 0.0010485649108886719, 0.0016911029815673828, 0.0023336410522460938, 0.0029761791229248047, 0.0036187171936035156, 0.0042612552642822266, 0.0049037933349609375, 0.0055463314056396484, 0.006188869476318359, 0.00683140754699707, 0.007473945617675781, 0.008116483688354492, 0.008759021759033203, 0.009401559829711914, 0.010044097900390625, 0.010686635971069336, 0.011329174041748047, 0.011971712112426758, 0.012614250183105469, 0.01325678825378418, 0.01389932632446289, 0.014541864395141602, 0.015184402465820312, 0.015826940536499023, 0.016469478607177734, 0.017112016677856445, 0.017754554748535156, 0.018397092819213867, 0.019039630889892578, 0.01968216896057129, 0.02032470703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 9.0, 15.0, 38.0, 111.0, 416.0, 1997.0, 14459.0, 4169203.0, 6231.0, 1375.0, 316.0, 63.0, 20.0, 4.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.052276611328125, -0.0505523681640625, -0.048828125, -0.0471038818359375, -0.045379638671875, -0.0436553955078125, -0.04193115234375, -0.0402069091796875, -0.038482666015625, -0.0367584228515625, -0.0350341796875, -0.0333099365234375, -0.031585693359375, -0.0298614501953125, -0.02813720703125, -0.0264129638671875, -0.024688720703125, -0.0229644775390625, -0.021240234375, -0.0195159912109375, -0.017791748046875, -0.0160675048828125, -0.01434326171875, -0.0126190185546875, -0.010894775390625, -0.0091705322265625, -0.0074462890625, -0.0057220458984375, -0.003997802734375, -0.0022735595703125, -0.00054931640625, 0.0011749267578125, 0.002899169921875, 0.0046234130859375, 0.00634765625, 0.0080718994140625, 0.009796142578125, 0.0115203857421875, 0.01324462890625, 0.0149688720703125, 0.016693115234375, 0.0184173583984375, 0.0201416015625, 0.0218658447265625, 0.023590087890625, 0.0253143310546875, 0.02703857421875, 0.0287628173828125, 0.030487060546875, 0.0322113037109375, 0.033935546875, 0.0356597900390625, 0.037384033203125, 0.0391082763671875, 0.04083251953125, 0.0425567626953125, 0.044281005859375, 0.0460052490234375, 0.0477294921875, 0.0494537353515625, 0.051177978515625, 0.0529022216796875, 0.05462646484375, 0.0563507080078125, 0.058074951171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 18.0, 36.0, 146.0, 3799.0, 20.0, 14.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01149749755859375, -0.011160492897033691, -0.010823488235473633, -0.010486483573913574, -0.010149478912353516, -0.009812474250793457, -0.009475469589233398, -0.00913846492767334, -0.008801460266113281, -0.008464455604553223, -0.008127450942993164, -0.0077904462814331055, -0.007453441619873047, -0.007116436958312988, -0.00677943229675293, -0.006442427635192871, -0.0061054229736328125, -0.005768418312072754, -0.005431413650512695, -0.005094408988952637, -0.004757404327392578, -0.0044203996658325195, -0.004083395004272461, -0.0037463903427124023, -0.0034093856811523438, -0.003072381019592285, -0.0027353763580322266, -0.002398371696472168, -0.0020613670349121094, -0.0017243623733520508, -0.0013873577117919922, -0.0010503530502319336, -0.000713348388671875, -0.0003763437271118164, -3.933906555175781e-05, 0.0002976655960083008, 0.0006346702575683594, 0.000971674919128418, 0.0013086795806884766, 0.0016456842422485352, 0.0019826889038085938, 0.0023196935653686523, 0.002656698226928711, 0.0029937028884887695, 0.003330707550048828, 0.0036677122116088867, 0.004004716873168945, 0.004341721534729004, 0.0046787261962890625, 0.005015730857849121, 0.00535273551940918, 0.005689740180969238, 0.006026744842529297, 0.0063637495040893555, 0.006700754165649414, 0.007037758827209473, 0.007374763488769531, 0.00771176815032959, 0.008048772811889648, 0.008385777473449707, 0.008722782135009766, 0.009059786796569824, 0.009396791458129883, 0.009733796119689941, 0.01007080078125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 18.0, 826.0, 164.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16483236849308014, -0.16170695424079895, -0.15858155488967896, -0.15545614063739777, -0.15233074128627777, -0.14920532703399658, -0.1460799276828766, -0.1429545134305954, -0.1398291140794754, -0.1367036998271942, -0.13357830047607422, -0.13045288622379303, -0.12732748687267303, -0.12420208007097244, -0.12107667326927185, -0.11795126646757126, -0.11482585966587067, -0.11170045286417007, -0.10857504606246948, -0.10544963926076889, -0.1023242324590683, -0.0991988256573677, -0.09607341885566711, -0.09294801205396652, -0.08982259780168533, -0.08669719099998474, -0.08357178419828415, -0.08044637739658356, -0.07732097059488297, -0.07419556379318237, -0.07107015699148178, -0.06794475018978119, -0.0648193359375, -0.06169392913579941, -0.058568522334098816, -0.055443115532398224, -0.05231770873069763, -0.04919230192899704, -0.04606689512729645, -0.042941488325595856, -0.039816081523895264, -0.03669067472219467, -0.03356526792049408, -0.030439861118793488, -0.027314454317092896, -0.024189045652747154, -0.021063638851046562, -0.01793823204934597, -0.014812827110290527, -0.011687420308589935, -0.008562013506889343, -0.005436605773866177, -0.0023111989721655846, 0.0008142087608575821, 0.003939615562558174, 0.007065022364258766, 0.010190429165959358, 0.01331583596765995, 0.016441242769360542, 0.019566651433706284, 0.022692058235406876, 0.025817465037107468, 0.02894287183880806, 0.03206827864050865, 0.035193685442209244]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 7.0, 4.0, 4.0, 6.0, 10.0, 10.0, 10.0, 11.0, 15.0, 18.0, 21.0, 23.0, 27.0, 26.0, 30.0, 26.0, 41.0, 45.0, 41.0, 36.0, 46.0, 44.0, 39.0, 38.0, 35.0, 47.0, 40.0, 28.0, 36.0, 22.0, 29.0, 23.0, 23.0, 21.0, 18.0, 17.0, 12.0, 14.0, 10.0, 7.0, 10.0, 6.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.011601507663726807, -0.011241189204156399, -0.010880870744585991, -0.010520552285015583, -0.010160233825445175, -0.009799915365874767, -0.00943959690630436, -0.009079278446733952, -0.008718959987163544, -0.008358641527593136, -0.007998323068022728, -0.00763800460845232, -0.007277686148881912, -0.006917367689311504, -0.0065570492297410965, -0.006196730770170689, -0.005836412310600281, -0.005476093851029873, -0.005115775391459465, -0.004755456931889057, -0.004395138472318649, -0.004034820012748241, -0.0036745015531778336, -0.0033141830936074257, -0.002953864634037018, -0.00259354617446661, -0.002233227714896202, -0.0018729092553257942, -0.0015125907957553864, -0.0011522723361849785, -0.0007919538766145706, -0.00043163541704416275, -7.131695747375488e-05, 0.000289001502096653, 0.0006493199616670609, 0.0010096384212374687, 0.0013699568808078766, 0.0017302753403782845, 0.0020905937999486923, 0.0024509122595191, 0.002811230719089508, 0.003171549178659916, 0.003531867638230324, 0.0038921860978007317, 0.0042525045573711395, 0.004612823016941547, 0.004973141476511955, 0.005333459936082363, 0.005693778395652771, 0.006054096855223179, 0.006414415314793587, 0.006774733774363995, 0.0071350522339344025, 0.00749537069350481, 0.007855689153075218, 0.008216007612645626, 0.008576326072216034, 0.008936644531786442, 0.00929696299135685, 0.009657281450927258, 0.010017599910497665, 0.010377918370068073, 0.010738236829638481, 0.011098555289208889, 0.011458873748779297]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 13.0, 13.0, 12.0, 16.0, 31.0, 51.0, 72.0, 118.0, 166.0, 271.0, 475.0, 762.0, 1375.0, 2772.0, 5725.0, 13108.0, 37134.0, 146360.0, 644157.0, 136419.0, 35297.0, 12616.0, 5527.0, 2654.0, 1414.0, 773.0, 415.0, 303.0, 175.0, 103.0, 72.0, 43.0, 31.0, 32.0, 15.0, 9.0, 4.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035919189453125, -0.03477811813354492, -0.033637046813964844, -0.032495975494384766, -0.03135490417480469, -0.03021383285522461, -0.02907276153564453, -0.027931690216064453, -0.026790618896484375, -0.025649547576904297, -0.02450847625732422, -0.02336740493774414, -0.022226333618164062, -0.021085262298583984, -0.019944190979003906, -0.018803119659423828, -0.01766204833984375, -0.016520977020263672, -0.015379905700683594, -0.014238834381103516, -0.013097763061523438, -0.01195669174194336, -0.010815620422363281, -0.009674549102783203, -0.008533477783203125, -0.007392406463623047, -0.006251335144042969, -0.005110263824462891, -0.0039691925048828125, -0.0028281211853027344, -0.0016870498657226562, -0.0005459785461425781, 0.0005950927734375, 0.0017361640930175781, 0.0028772354125976562, 0.004018306732177734, 0.0051593780517578125, 0.006300449371337891, 0.007441520690917969, 0.008582592010498047, 0.009723663330078125, 0.010864734649658203, 0.012005805969238281, 0.01314687728881836, 0.014287948608398438, 0.015429019927978516, 0.016570091247558594, 0.017711162567138672, 0.01885223388671875, 0.019993305206298828, 0.021134376525878906, 0.022275447845458984, 0.023416519165039062, 0.02455759048461914, 0.02569866180419922, 0.026839733123779297, 0.027980804443359375, 0.029121875762939453, 0.03026294708251953, 0.03140401840209961, 0.03254508972167969, 0.033686161041259766, 0.034827232360839844, 0.03596830368041992, 0.037109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 11.0, 5.0, 15.0, 14.0, 30.0, 41.0, 47.0, 50.0, 87.0, 72.0, 100.0, 81.0, 81.0, 53.0, 68.0, 45.0, 45.0, 31.0, 22.0, 17.0, 12.0, 14.0, 11.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02069091796875, -0.02005171775817871, -0.019412517547607422, -0.018773317337036133, -0.018134117126464844, -0.017494916915893555, -0.016855716705322266, -0.016216516494750977, -0.015577316284179688, -0.014938116073608398, -0.01429891586303711, -0.01365971565246582, -0.013020515441894531, -0.012381315231323242, -0.011742115020751953, -0.011102914810180664, -0.010463714599609375, -0.009824514389038086, -0.009185314178466797, -0.008546113967895508, -0.007906913757324219, -0.00726771354675293, -0.006628513336181641, -0.0059893131256103516, -0.0053501129150390625, -0.0047109127044677734, -0.004071712493896484, -0.0034325122833251953, -0.0027933120727539062, -0.002154111862182617, -0.0015149116516113281, -0.0008757114410400391, -0.00023651123046875, 0.00040268898010253906, 0.0010418891906738281, 0.0016810894012451172, 0.0023202896118164062, 0.0029594898223876953, 0.0035986900329589844, 0.0042378902435302734, 0.0048770904541015625, 0.0055162906646728516, 0.006155490875244141, 0.00679469108581543, 0.007433891296386719, 0.008073091506958008, 0.008712291717529297, 0.009351491928100586, 0.009990692138671875, 0.010629892349243164, 0.011269092559814453, 0.011908292770385742, 0.012547492980957031, 0.01318669319152832, 0.01382589340209961, 0.014465093612670898, 0.015104293823242188, 0.015743494033813477, 0.016382694244384766, 0.017021894454956055, 0.017661094665527344, 0.018300294876098633, 0.018939495086669922, 0.01957869529724121, 0.0202178955078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 2.0, 5.0, 4.0, 6.0, 8.0, 10.0, 15.0, 15.0, 12.0, 22.0, 29.0, 34.0, 32.0, 44.0, 64.0, 82.0, 106.0, 133.0, 220.0, 429.0, 935.0, 4763.0, 113487.0, 907729.0, 16847.0, 1906.0, 607.0, 271.0, 179.0, 134.0, 107.0, 56.0, 56.0, 35.0, 26.0, 27.0, 20.0, 20.0, 25.0, 6.0, 9.0, 10.0, 4.0, 4.0, 4.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.098388671875, -0.09513568878173828, -0.09188270568847656, -0.08862972259521484, -0.08537673950195312, -0.0821237564086914, -0.07887077331542969, -0.07561779022216797, -0.07236480712890625, -0.06911182403564453, -0.06585884094238281, -0.0626058578491211, -0.059352874755859375, -0.056099891662597656, -0.05284690856933594, -0.04959392547607422, -0.0463409423828125, -0.04308795928955078, -0.03983497619628906, -0.036581993103027344, -0.033329010009765625, -0.030076026916503906, -0.026823043823242188, -0.02357006072998047, -0.02031707763671875, -0.01706409454345703, -0.013811111450195312, -0.010558128356933594, -0.007305145263671875, -0.004052162170410156, -0.0007991790771484375, 0.0024538040161132812, 0.005706787109375, 0.008959770202636719, 0.012212753295898438, 0.015465736389160156, 0.018718719482421875, 0.021971702575683594, 0.025224685668945312, 0.02847766876220703, 0.03173065185546875, 0.03498363494873047, 0.03823661804199219, 0.041489601135253906, 0.044742584228515625, 0.047995567321777344, 0.05124855041503906, 0.05450153350830078, 0.0577545166015625, 0.06100749969482422, 0.06426048278808594, 0.06751346588134766, 0.07076644897460938, 0.0740194320678711, 0.07727241516113281, 0.08052539825439453, 0.08377838134765625, 0.08703136444091797, 0.09028434753417969, 0.0935373306274414, 0.09679031372070312, 0.10004329681396484, 0.10329627990722656, 0.10654926300048828, 0.10980224609375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 9.0, 5.0, 11.0, 15.0, 13.0, 15.0, 24.0, 23.0, 20.0, 27.0, 26.0, 28.0, 36.0, 39.0, 36.0, 40.0, 52.0, 43.0, 27.0, 42.0, 44.0, 49.0, 37.0, 32.0, 34.0, 37.0, 34.0, 34.0, 20.0, 21.0, 20.0, 18.0, 12.0, 6.0, 14.0, 8.0, 8.0, 6.0, 4.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.052642822265625, -0.051000118255615234, -0.04935741424560547, -0.0477147102355957, -0.04607200622558594, -0.04442930221557617, -0.042786598205566406, -0.04114389419555664, -0.039501190185546875, -0.03785848617553711, -0.036215782165527344, -0.03457307815551758, -0.03293037414550781, -0.03128767013549805, -0.02964496612548828, -0.028002262115478516, -0.02635955810546875, -0.024716854095458984, -0.02307415008544922, -0.021431446075439453, -0.019788742065429688, -0.018146038055419922, -0.016503334045410156, -0.01486063003540039, -0.013217926025390625, -0.01157522201538086, -0.009932518005371094, -0.008289813995361328, -0.0066471099853515625, -0.005004405975341797, -0.0033617019653320312, -0.0017189979553222656, -7.62939453125e-05, 0.0015664100646972656, 0.0032091140747070312, 0.004851818084716797, 0.0064945220947265625, 0.008137226104736328, 0.009779930114746094, 0.01142263412475586, 0.013065338134765625, 0.01470804214477539, 0.016350746154785156, 0.017993450164794922, 0.019636154174804688, 0.021278858184814453, 0.02292156219482422, 0.024564266204833984, 0.02620697021484375, 0.027849674224853516, 0.02949237823486328, 0.031135082244873047, 0.03277778625488281, 0.03442049026489258, 0.036063194274902344, 0.03770589828491211, 0.039348602294921875, 0.04099130630493164, 0.042634010314941406, 0.04427671432495117, 0.04591941833496094, 0.0475621223449707, 0.04920482635498047, 0.050847530364990234, 0.052490234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 4.0, 11.0, 11.0, 18.0, 24.0, 26.0, 45.0, 49.0, 68.0, 105.0, 153.0, 351.0, 1463.0, 8400.0, 909885.0, 121765.0, 4451.0, 940.0, 300.0, 142.0, 82.0, 52.0, 43.0, 32.0, 24.0, 20.0, 11.0, 13.0, 7.0, 9.0, 5.0, 4.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00897979736328125, -0.008714556694030762, -0.008449316024780273, -0.008184075355529785, -0.007918834686279297, -0.007653594017028809, -0.00738835334777832, -0.007123112678527832, -0.006857872009277344, -0.0065926313400268555, -0.006327390670776367, -0.006062150001525879, -0.005796909332275391, -0.005531668663024902, -0.005266427993774414, -0.005001187324523926, -0.0047359466552734375, -0.004470705986022949, -0.004205465316772461, -0.003940224647521973, -0.0036749839782714844, -0.003409743309020996, -0.003144502639770508, -0.0028792619705200195, -0.0026140213012695312, -0.002348780632019043, -0.0020835399627685547, -0.0018182992935180664, -0.0015530586242675781, -0.0012878179550170898, -0.0010225772857666016, -0.0007573366165161133, -0.000492095947265625, -0.00022685527801513672, 3.838539123535156e-05, 0.00030362606048583984, 0.0005688667297363281, 0.0008341073989868164, 0.0010993480682373047, 0.001364588737487793, 0.0016298294067382812, 0.0018950700759887695, 0.002160310745239258, 0.002425551414489746, 0.0026907920837402344, 0.0029560327529907227, 0.003221273422241211, 0.0034865140914916992, 0.0037517547607421875, 0.004016995429992676, 0.004282236099243164, 0.004547476768493652, 0.004812717437744141, 0.005077958106994629, 0.005343198776245117, 0.0056084394454956055, 0.005873680114746094, 0.006138920783996582, 0.00640416145324707, 0.006669402122497559, 0.006934642791748047, 0.007199883460998535, 0.0074651241302490234, 0.007730364799499512, 0.00799560546875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 2.0, 6.0, 11.0, 8.0, 16.0, 42.0, 70.0, 346.0, 290.0, 74.0, 25.0, 16.0, 8.0, 5.0, 6.0, 2.0, 7.0, 4.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0003542900085449219, -0.0003444477915763855, -0.0003346055746078491, -0.00032476335763931274, -0.00031492114067077637, -0.00030507892370224, -0.0002952367067337036, -0.00028539448976516724, -0.00027555227279663086, -0.0002657100558280945, -0.0002558678388595581, -0.00024602562189102173, -0.00023618340492248535, -0.00022634118795394897, -0.0002164989709854126, -0.00020665675401687622, -0.00019681453704833984, -0.00018697232007980347, -0.0001771301031112671, -0.0001672878861427307, -0.00015744566917419434, -0.00014760345220565796, -0.00013776123523712158, -0.0001279190182685852, -0.00011807680130004883, -0.00010823458433151245, -9.839236736297607e-05, -8.85501503944397e-05, -7.870793342590332e-05, -6.886571645736694e-05, -5.9023499488830566e-05, -4.918128252029419e-05, -3.933906555175781e-05, -2.9496848583221436e-05, -1.965463161468506e-05, -9.812414646148682e-06, 2.9802322387695312e-08, 9.872019290924072e-06, 1.971423625946045e-05, 2.9556453227996826e-05, 3.93986701965332e-05, 4.924088716506958e-05, 5.908310413360596e-05, 6.892532110214233e-05, 7.876753807067871e-05, 8.860975503921509e-05, 9.845197200775146e-05, 0.00010829418897628784, 0.00011813640594482422, 0.0001279786229133606, 0.00013782083988189697, 0.00014766305685043335, 0.00015750527381896973, 0.0001673474907875061, 0.00017718970775604248, 0.00018703192472457886, 0.00019687414169311523, 0.0002067163586616516, 0.000216558575630188, 0.00022640079259872437, 0.00023624300956726074, 0.0002460852265357971, 0.0002559274435043335, 0.0002657696604728699, 0.00027561187744140625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 7.0, 8.0, 12.0, 13.0, 22.0, 37.0, 76.0, 151.0, 443.0, 3135.0, 983800.0, 58693.0, 1514.0, 354.0, 103.0, 70.0, 35.0, 22.0, 15.0, 18.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02386474609375, -0.023216962814331055, -0.02256917953491211, -0.021921396255493164, -0.02127361297607422, -0.020625829696655273, -0.019978046417236328, -0.019330263137817383, -0.018682479858398438, -0.018034696578979492, -0.017386913299560547, -0.0167391300201416, -0.016091346740722656, -0.015443563461303711, -0.014795780181884766, -0.01414799690246582, -0.013500213623046875, -0.01285243034362793, -0.012204647064208984, -0.011556863784790039, -0.010909080505371094, -0.010261297225952148, -0.009613513946533203, -0.008965730667114258, -0.008317947387695312, -0.007670164108276367, -0.007022380828857422, -0.0063745975494384766, -0.005726814270019531, -0.005079030990600586, -0.004431247711181641, -0.0037834644317626953, -0.00313568115234375, -0.0024878978729248047, -0.0018401145935058594, -0.001192331314086914, -0.0005445480346679688, 0.00010323524475097656, 0.0007510185241699219, 0.0013988018035888672, 0.0020465850830078125, 0.002694368362426758, 0.003342151641845703, 0.0039899349212646484, 0.004637718200683594, 0.005285501480102539, 0.005933284759521484, 0.00658106803894043, 0.007228851318359375, 0.00787663459777832, 0.008524417877197266, 0.009172201156616211, 0.009819984436035156, 0.010467767715454102, 0.011115550994873047, 0.011763334274291992, 0.012411117553710938, 0.013058900833129883, 0.013706684112548828, 0.014354467391967773, 0.015002250671386719, 0.015650033950805664, 0.01629781723022461, 0.016945600509643555, 0.0175933837890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 14.0, 10.0, 10.0, 15.0, 25.0, 42.0, 55.0, 130.0, 245.0, 196.0, 93.0, 54.0, 40.0, 20.0, 16.0, 8.0, 7.0, 3.0, 6.0, 3.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008514404296875, -0.008172154426574707, -0.007829904556274414, -0.007487654685974121, -0.007145404815673828, -0.006803154945373535, -0.006460905075073242, -0.006118655204772949, -0.005776405334472656, -0.005434155464172363, -0.00509190559387207, -0.004749655723571777, -0.004407405853271484, -0.004065155982971191, -0.0037229061126708984, -0.0033806562423706055, -0.0030384063720703125, -0.0026961565017700195, -0.0023539066314697266, -0.0020116567611694336, -0.0016694068908691406, -0.0013271570205688477, -0.0009849071502685547, -0.0006426572799682617, -0.00030040740966796875, 4.184246063232422e-05, 0.0003840923309326172, 0.0007263422012329102, 0.0010685920715332031, 0.001410841941833496, 0.001753091812133789, 0.002095341682434082, 0.002437591552734375, 0.002779841423034668, 0.003122091293334961, 0.003464341163635254, 0.003806591033935547, 0.00414884090423584, 0.004491090774536133, 0.004833340644836426, 0.005175590515136719, 0.005517840385437012, 0.005860090255737305, 0.006202340126037598, 0.006544589996337891, 0.006886839866638184, 0.0072290897369384766, 0.0075713396072387695, 0.007913589477539062, 0.008255839347839355, 0.008598089218139648, 0.008940339088439941, 0.009282588958740234, 0.009624838829040527, 0.00996708869934082, 0.010309338569641113, 0.010651588439941406, 0.0109938383102417, 0.011336088180541992, 0.011678338050842285, 0.012020587921142578, 0.012362837791442871, 0.012705087661743164, 0.013047337532043457, 0.01338958740234375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 116.0, 803.0, 82.0, 8.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9232122898101807, -1.8808120489120483, -1.8384116888046265, -1.7960114479064941, -1.7536112070083618, -1.7112109661102295, -1.6688106060028076, -1.6264103651046753, -1.584010124206543, -1.5416098833084106, -1.4992095232009888, -1.4568092823028564, -1.4144090414047241, -1.3720088005065918, -1.32960844039917, -1.2872081995010376, -1.2448078393936157, -1.2024075984954834, -1.1600072383880615, -1.1176069974899292, -1.0752067565917969, -1.032806396484375, -0.9904061555862427, -0.9480059146881104, -0.9056056141853333, -0.8632053136825562, -0.8208050727844238, -0.7784047722816467, -0.7360044717788696, -0.6936042308807373, -0.6512039303779602, -0.6088036298751831, -0.5664033889770508, -0.5240030884742737, -0.48160284757614136, -0.43920254707336426, -0.39680227637290955, -0.35440200567245483, -0.31200170516967773, -0.269601434469223, -0.2272011637687683, -0.1848008930683136, -0.1424006074666977, -0.10000032186508179, -0.057600051164627075, -0.015199780464172363, 0.027200520038604736, 0.06960079073905945, 0.11200106143951416, 0.15440133213996887, 0.19680161774158478, 0.23920190334320068, 0.2816021740436554, 0.3240024447441101, 0.3664027452468872, 0.4088030159473419, 0.45120328664779663, 0.49360355734825134, 0.536003828048706, 0.5784041285514832, 0.6208044290542603, 0.6632046699523926, 0.7056049704551697, 0.7480052709579468, 0.7904055118560791]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 6.0, 9.0, 10.0, 6.0, 11.0, 13.0, 13.0, 15.0, 13.0, 19.0, 35.0, 33.0, 27.0, 37.0, 33.0, 47.0, 37.0, 43.0, 36.0, 57.0, 52.0, 45.0, 33.0, 48.0, 31.0, 39.0, 31.0, 32.0, 27.0, 40.0, 28.0, 13.0, 20.0, 16.0, 10.0, 13.0, 8.0, 3.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2909756302833557, -0.2822502851486206, -0.2735249400138855, -0.2647995948791504, -0.2560742497444153, -0.24734888970851898, -0.23862352967262268, -0.22989818453788757, -0.22117283940315247, -0.21244749426841736, -0.20372214913368225, -0.19499678909778595, -0.18627144396305084, -0.17754609882831573, -0.16882073879241943, -0.16009539365768433, -0.15137004852294922, -0.1426447033882141, -0.133919358253479, -0.1251939982175827, -0.1164686530828476, -0.10774330794811249, -0.09901795536279678, -0.09029260277748108, -0.08156725764274597, -0.07284191250801086, -0.06411655992269516, -0.055391211062669754, -0.04666586220264435, -0.03794051334261894, -0.029215164482593536, -0.02048981562256813, -0.011764466762542725, -0.0030391179025173187, 0.005686230957508087, 0.014411579817533493, 0.0231369286775589, 0.031862277537584305, 0.04058762639760971, 0.04931297525763512, 0.05803832411766052, 0.06676366925239563, 0.07548902183771133, 0.08421437442302704, 0.09293971955776215, 0.10166506469249725, 0.11039041727781296, 0.11911576986312866, 0.12784111499786377, 0.13656646013259888, 0.14529180526733398, 0.15401716530323029, 0.1627425104379654, 0.1714678555727005, 0.1801932156085968, 0.1889185607433319, 0.19764390587806702, 0.20636925101280212, 0.21509459614753723, 0.22381995618343353, 0.23254530131816864, 0.24127064645290375, 0.24999600648880005, 0.25872135162353516, 0.26744669675827026]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 15.0, 12.0, 25.0, 42.0, 53.0, 102.0, 132.0, 277.0, 626.0, 6930.0, 4184543.0, 732.0, 279.0, 166.0, 115.0, 64.0, 36.0, 31.0, 16.0, 13.0, 14.0, 7.0, 9.0, 3.0, 9.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2578125, -0.24978256225585938, -0.24175262451171875, -0.23372268676757812, -0.2256927490234375, -0.21766281127929688, -0.20963287353515625, -0.20160293579101562, -0.193572998046875, -0.18554306030273438, -0.17751312255859375, -0.16948318481445312, -0.1614532470703125, -0.15342330932617188, -0.14539337158203125, -0.13736343383789062, -0.12933349609375, -0.12130355834960938, -0.11327362060546875, -0.10524368286132812, -0.0972137451171875, -0.08918380737304688, -0.08115386962890625, -0.07312393188476562, -0.065093994140625, -0.057064056396484375, -0.04903411865234375, -0.041004180908203125, -0.0329742431640625, -0.024944305419921875, -0.01691436767578125, -0.008884429931640625, -0.0008544921875, 0.007175445556640625, 0.01520538330078125, 0.023235321044921875, 0.0312652587890625, 0.039295196533203125, 0.04732513427734375, 0.055355072021484375, 0.063385009765625, 0.07141494750976562, 0.07944488525390625, 0.08747482299804688, 0.0955047607421875, 0.10353469848632812, 0.11156463623046875, 0.11959457397460938, 0.12762451171875, 0.13565444946289062, 0.14368438720703125, 0.15171432495117188, 0.1597442626953125, 0.16777420043945312, 0.17580413818359375, 0.18383407592773438, 0.191864013671875, 0.19989395141601562, 0.20792388916015625, 0.21595382690429688, 0.2239837646484375, 0.23201370239257812, 0.24004364013671875, 0.24807357788085938, 0.256103515625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 11.0, 10.0, 11.0, 18.0, 25.0, 35.0, 55.0, 51.0, 79.0, 90.0, 92.0, 105.0, 67.0, 59.0, 61.0, 59.0, 46.0, 23.0, 21.0, 19.0, 11.0, 10.0, 6.0, 6.0, 7.0, 7.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020751953125, -0.020109176635742188, -0.019466400146484375, -0.018823623657226562, -0.01818084716796875, -0.017538070678710938, -0.016895294189453125, -0.016252517700195312, -0.0156097412109375, -0.014966964721679688, -0.014324188232421875, -0.013681411743164062, -0.01303863525390625, -0.012395858764648438, -0.011753082275390625, -0.011110305786132812, -0.010467529296875, -0.009824752807617188, -0.009181976318359375, -0.008539199829101562, -0.00789642333984375, -0.0072536468505859375, -0.006610870361328125, -0.0059680938720703125, -0.0053253173828125, -0.0046825408935546875, -0.004039764404296875, -0.0033969879150390625, -0.00275421142578125, -0.0021114349365234375, -0.001468658447265625, -0.0008258819580078125, -0.00018310546875, 0.0004596710205078125, 0.001102447509765625, 0.0017452239990234375, 0.00238800048828125, 0.0030307769775390625, 0.003673553466796875, 0.0043163299560546875, 0.0049591064453125, 0.0056018829345703125, 0.006244659423828125, 0.0068874359130859375, 0.00753021240234375, 0.008172988891601562, 0.008815765380859375, 0.009458541870117188, 0.010101318359375, 0.010744094848632812, 0.011386871337890625, 0.012029647827148438, 0.01267242431640625, 0.013315200805664062, 0.013957977294921875, 0.014600753784179688, 0.0152435302734375, 0.015886306762695312, 0.016529083251953125, 0.017171859741210938, 0.01781463623046875, 0.018457412719726562, 0.019100189208984375, 0.019742965698242188, 0.0203857421875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 39.0, 128.0, 484.0, 7355.0, 4184123.0, 1783.0, 281.0, 51.0, 25.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08624267578125, -0.0832986831665039, -0.08035469055175781, -0.07741069793701172, -0.07446670532226562, -0.07152271270751953, -0.06857872009277344, -0.06563472747802734, -0.06269073486328125, -0.059746742248535156, -0.05680274963378906, -0.05385875701904297, -0.050914764404296875, -0.04797077178955078, -0.04502677917480469, -0.042082786560058594, -0.0391387939453125, -0.036194801330566406, -0.03325080871582031, -0.03030681610107422, -0.027362823486328125, -0.02441883087158203, -0.021474838256835938, -0.018530845642089844, -0.01558685302734375, -0.012642860412597656, -0.009698867797851562, -0.006754875183105469, -0.003810882568359375, -0.0008668899536132812, 0.0020771026611328125, 0.005021095275878906, 0.007965087890625, 0.010909080505371094, 0.013853073120117188, 0.01679706573486328, 0.019741058349609375, 0.02268505096435547, 0.025629043579101562, 0.028573036193847656, 0.03151702880859375, 0.034461021423339844, 0.03740501403808594, 0.04034900665283203, 0.043292999267578125, 0.04623699188232422, 0.04918098449707031, 0.052124977111816406, 0.0550689697265625, 0.058012962341308594, 0.06095695495605469, 0.06390094757080078, 0.06684494018554688, 0.06978893280029297, 0.07273292541503906, 0.07567691802978516, 0.07862091064453125, 0.08156490325927734, 0.08450889587402344, 0.08745288848876953, 0.09039688110351562, 0.09334087371826172, 0.09628486633300781, 0.0992288589477539, 0.1021728515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 9.0, 12.0, 46.0, 3682.0, 246.0, 40.0, 18.0, 9.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018341064453125, -0.017800092697143555, -0.01725912094116211, -0.016718149185180664, -0.01617717742919922, -0.015636205673217773, -0.015095233917236328, -0.014554262161254883, -0.014013290405273438, -0.013472318649291992, -0.012931346893310547, -0.012390375137329102, -0.011849403381347656, -0.011308431625366211, -0.010767459869384766, -0.01022648811340332, -0.009685516357421875, -0.00914454460144043, -0.008603572845458984, -0.008062601089477539, -0.007521629333496094, -0.0069806575775146484, -0.006439685821533203, -0.005898714065551758, -0.0053577423095703125, -0.004816770553588867, -0.004275798797607422, -0.0037348270416259766, -0.0031938552856445312, -0.002652883529663086, -0.0021119117736816406, -0.0015709400177001953, -0.00102996826171875, -0.0004889965057373047, 5.1975250244140625e-05, 0.0005929470062255859, 0.0011339187622070312, 0.0016748905181884766, 0.002215862274169922, 0.002756834030151367, 0.0032978057861328125, 0.003838777542114258, 0.004379749298095703, 0.0049207210540771484, 0.005461692810058594, 0.006002664566040039, 0.006543636322021484, 0.00708460807800293, 0.007625579833984375, 0.00816655158996582, 0.008707523345947266, 0.009248495101928711, 0.009789466857910156, 0.010330438613891602, 0.010871410369873047, 0.011412382125854492, 0.011953353881835938, 0.012494325637817383, 0.013035297393798828, 0.013576269149780273, 0.014117240905761719, 0.014658212661743164, 0.01519918441772461, 0.015740156173706055, 0.0162811279296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 24.0, 254.0, 689.0, 39.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1266936957836151, -0.12328440696001053, -0.11987511813640594, -0.11646582931280136, -0.11305654048919678, -0.1096472516655922, -0.10623796284198761, -0.10282867401838303, -0.09941938519477844, -0.09601009637117386, -0.09260080754756927, -0.08919151872396469, -0.08578222990036011, -0.08237294107675552, -0.07896365225315094, -0.07555436342954636, -0.07214507460594177, -0.06873578578233719, -0.0653264969587326, -0.06191720813512802, -0.05850791931152344, -0.055098630487918854, -0.05168934166431427, -0.048280052840709686, -0.0448707640171051, -0.04146147519350052, -0.038052186369895935, -0.03464289754629135, -0.031233608722686768, -0.027824319899082184, -0.0244150310754776, -0.021005742251873016, -0.017596445977687836, -0.014187157154083252, -0.010777868330478668, -0.0073685795068740845, -0.003959290683269501, -0.000550001859664917, 0.0028592869639396667, 0.0062685757875442505, 0.009677864611148834, 0.013087153434753418, 0.016496442258358, 0.019905731081962585, 0.02331501990556717, 0.026724308729171753, 0.030133597552776337, 0.03354288637638092, 0.036952175199985504, 0.04036146402359009, 0.04377075284719467, 0.047180041670799255, 0.05058933049440384, 0.05399861931800842, 0.05740790814161301, 0.06081719696521759, 0.06422648578882217, 0.06763577461242676, 0.07104506343603134, 0.07445435225963593, 0.07786364108324051, 0.08127292990684509, 0.08468221873044968, 0.08809150755405426, 0.09150079637765884]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 10.0, 11.0, 12.0, 22.0, 26.0, 24.0, 27.0, 31.0, 41.0, 42.0, 52.0, 44.0, 56.0, 56.0, 70.0, 64.0, 45.0, 54.0, 45.0, 50.0, 42.0, 29.0, 39.0, 19.0, 20.0, 14.0, 17.0, 12.0, 5.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.018992483615875244, -0.0183461494743824, -0.017699817195534706, -0.01705348491668701, -0.016407150775194168, -0.015760816633701324, -0.01511448435485363, -0.014468151144683361, -0.013821817934513092, -0.013175484724342823, -0.012529151514172554, -0.011882818304002285, -0.011236485093832016, -0.010590151883661747, -0.009943818673491478, -0.009297485463321209, -0.00865115225315094, -0.008004819042980671, -0.007358485832810402, -0.006712152622640133, -0.006065819412469864, -0.005419486202299595, -0.004773152992129326, -0.004126819781959057, -0.003480486571788788, -0.002834153361618519, -0.00218782015144825, -0.0015414869412779808, -0.0008951537311077118, -0.0002488205209374428, 0.00039751268923282623, 0.0010438458994030952, 0.0016901791095733643, 0.0023365123197436333, 0.0029828455299139023, 0.0036291787400841713, 0.00427551195025444, 0.004921845160424709, 0.005568178370594978, 0.006214511580765247, 0.006860844790935516, 0.007507178001105785, 0.008153511211276054, 0.008799844421446323, 0.009446177631616592, 0.010092510841786861, 0.01073884405195713, 0.0113851772621274, 0.012031510472297668, 0.012677843682467937, 0.013324176892638206, 0.013970510102808475, 0.014616843312978745, 0.015263176523149014, 0.015909509733319283, 0.016555842012166977, 0.01720217615365982, 0.017848510295152664, 0.01849484257400036, 0.019141174852848053, 0.019787508994340897, 0.02043384313583374, 0.021080175414681435, 0.02172650769352913, 0.022372841835021973]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 10.0, 4.0, 7.0, 11.0, 23.0, 20.0, 30.0, 43.0, 54.0, 102.0, 142.0, 257.0, 325.0, 554.0, 922.0, 1611.0, 3241.0, 6919.0, 17021.0, 55413.0, 347947.0, 511509.0, 67026.0, 19542.0, 7767.0, 3530.0, 1787.0, 1036.0, 582.0, 397.0, 241.0, 148.0, 87.0, 68.0, 50.0, 39.0, 23.0, 15.0, 11.0, 15.0, 7.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.032135009765625, -0.03116321563720703, -0.030191421508789062, -0.029219627380371094, -0.028247833251953125, -0.027276039123535156, -0.026304244995117188, -0.02533245086669922, -0.02436065673828125, -0.02338886260986328, -0.022417068481445312, -0.021445274353027344, -0.020473480224609375, -0.019501686096191406, -0.018529891967773438, -0.01755809783935547, -0.0165863037109375, -0.015614509582519531, -0.014642715454101562, -0.013670921325683594, -0.012699127197265625, -0.011727333068847656, -0.010755538940429688, -0.009783744812011719, -0.00881195068359375, -0.007840156555175781, -0.0068683624267578125, -0.005896568298339844, -0.004924774169921875, -0.003952980041503906, -0.0029811859130859375, -0.0020093917846679688, -0.00103759765625, -6.580352783203125e-05, 0.0009059906005859375, 0.0018777847290039062, 0.002849578857421875, 0.0038213729858398438, 0.0047931671142578125, 0.005764961242675781, 0.00673675537109375, 0.007708549499511719, 0.008680343627929688, 0.009652137756347656, 0.010623931884765625, 0.011595726013183594, 0.012567520141601562, 0.013539314270019531, 0.0145111083984375, 0.015482902526855469, 0.016454696655273438, 0.017426490783691406, 0.018398284912109375, 0.019370079040527344, 0.020341873168945312, 0.02131366729736328, 0.02228546142578125, 0.02325725555419922, 0.024229049682617188, 0.025200843811035156, 0.026172637939453125, 0.027144432067871094, 0.028116226196289062, 0.02908802032470703, 0.030059814453125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 8.0, 9.0, 8.0, 13.0, 14.0, 33.0, 35.0, 45.0, 53.0, 87.0, 87.0, 95.0, 104.0, 72.0, 52.0, 67.0, 56.0, 41.0, 27.0, 19.0, 21.0, 10.0, 10.0, 5.0, 6.0, 8.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0208740234375, -0.020227670669555664, -0.019581317901611328, -0.018934965133666992, -0.018288612365722656, -0.01764225959777832, -0.016995906829833984, -0.01634955406188965, -0.015703201293945312, -0.015056848526000977, -0.01441049575805664, -0.013764142990112305, -0.013117790222167969, -0.012471437454223633, -0.011825084686279297, -0.011178731918334961, -0.010532379150390625, -0.009886026382446289, -0.009239673614501953, -0.008593320846557617, -0.007946968078613281, -0.007300615310668945, -0.006654262542724609, -0.0060079097747802734, -0.0053615570068359375, -0.0047152042388916016, -0.004068851470947266, -0.0034224987030029297, -0.0027761459350585938, -0.002129793167114258, -0.0014834403991699219, -0.0008370876312255859, -0.00019073486328125, 0.00045561790466308594, 0.0011019706726074219, 0.0017483234405517578, 0.0023946762084960938, 0.0030410289764404297, 0.0036873817443847656, 0.0043337345123291016, 0.0049800872802734375, 0.0056264400482177734, 0.006272792816162109, 0.006919145584106445, 0.007565498352050781, 0.008211851119995117, 0.008858203887939453, 0.009504556655883789, 0.010150909423828125, 0.010797262191772461, 0.011443614959716797, 0.012089967727661133, 0.012736320495605469, 0.013382673263549805, 0.01402902603149414, 0.014675378799438477, 0.015321731567382812, 0.01596808433532715, 0.016614437103271484, 0.01726078987121582, 0.017907142639160156, 0.018553495407104492, 0.019199848175048828, 0.019846200942993164, 0.0204925537109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 10.0, 6.0, 8.0, 18.0, 21.0, 20.0, 28.0, 39.0, 69.0, 79.0, 102.0, 163.0, 376.0, 875.0, 9438.0, 1013298.0, 21695.0, 1223.0, 406.0, 230.0, 126.0, 69.0, 62.0, 52.0, 41.0, 15.0, 14.0, 7.0, 9.0, 14.0, 8.0, 6.0, 2.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.12841796875, -0.12459468841552734, -0.12077140808105469, -0.11694812774658203, -0.11312484741210938, -0.10930156707763672, -0.10547828674316406, -0.1016550064086914, -0.09783172607421875, -0.0940084457397461, -0.09018516540527344, -0.08636188507080078, -0.08253860473632812, -0.07871532440185547, -0.07489204406738281, -0.07106876373291016, -0.0672454833984375, -0.06342220306396484, -0.05959892272949219, -0.05577564239501953, -0.051952362060546875, -0.04812908172607422, -0.04430580139160156, -0.040482521057128906, -0.03665924072265625, -0.032835960388183594, -0.029012680053710938, -0.02518939971923828, -0.021366119384765625, -0.01754283905029297, -0.013719558715820312, -0.009896278381347656, -0.006072998046875, -0.0022497177124023438, 0.0015735626220703125, 0.005396842956542969, 0.009220123291015625, 0.013043403625488281, 0.016866683959960938, 0.020689964294433594, 0.02451324462890625, 0.028336524963378906, 0.03215980529785156, 0.03598308563232422, 0.039806365966796875, 0.04362964630126953, 0.04745292663574219, 0.051276206970214844, 0.0550994873046875, 0.058922767639160156, 0.06274604797363281, 0.06656932830810547, 0.07039260864257812, 0.07421588897705078, 0.07803916931152344, 0.0818624496459961, 0.08568572998046875, 0.0895090103149414, 0.09333229064941406, 0.09715557098388672, 0.10097885131835938, 0.10480213165283203, 0.10862541198730469, 0.11244869232177734, 0.11627197265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 9.0, 4.0, 13.0, 17.0, 16.0, 25.0, 19.0, 20.0, 35.0, 30.0, 40.0, 34.0, 53.0, 46.0, 50.0, 44.0, 67.0, 56.0, 46.0, 39.0, 43.0, 46.0, 34.0, 32.0, 42.0, 24.0, 25.0, 13.0, 13.0, 14.0, 14.0, 4.0, 2.0, 12.0, 5.0, 7.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0511474609375, -0.04936027526855469, -0.047573089599609375, -0.04578590393066406, -0.04399871826171875, -0.04221153259277344, -0.040424346923828125, -0.03863716125488281, -0.0368499755859375, -0.03506278991699219, -0.033275604248046875, -0.03148841857910156, -0.02970123291015625, -0.027914047241210938, -0.026126861572265625, -0.024339675903320312, -0.022552490234375, -0.020765304565429688, -0.018978118896484375, -0.017190933227539062, -0.01540374755859375, -0.013616561889648438, -0.011829376220703125, -0.010042190551757812, -0.0082550048828125, -0.0064678192138671875, -0.004680633544921875, -0.0028934478759765625, -0.00110626220703125, 0.0006809234619140625, 0.002468109130859375, 0.0042552947998046875, 0.00604248046875, 0.007829666137695312, 0.009616851806640625, 0.011404037475585938, 0.01319122314453125, 0.014978408813476562, 0.016765594482421875, 0.018552780151367188, 0.0203399658203125, 0.022127151489257812, 0.023914337158203125, 0.025701522827148438, 0.02748870849609375, 0.029275894165039062, 0.031063079833984375, 0.03285026550292969, 0.034637451171875, 0.03642463684082031, 0.038211822509765625, 0.03999900817871094, 0.04178619384765625, 0.04357337951660156, 0.045360565185546875, 0.04714775085449219, 0.0489349365234375, 0.05072212219238281, 0.052509307861328125, 0.05429649353027344, 0.05608367919921875, 0.05787086486816406, 0.059658050537109375, 0.06144523620605469, 0.063232421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 19.0, 16.0, 23.0, 60.0, 153.0, 999.0, 1024091.0, 22551.0, 392.0, 100.0, 53.0, 24.0, 21.0, 7.0, 10.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01363372802734375, -0.01312553882598877, -0.012617349624633789, -0.012109160423278809, -0.011600971221923828, -0.011092782020568848, -0.010584592819213867, -0.010076403617858887, -0.009568214416503906, -0.009060025215148926, -0.008551836013793945, -0.008043646812438965, -0.007535457611083984, -0.007027268409729004, -0.0065190792083740234, -0.006010890007019043, -0.0055027008056640625, -0.004994511604309082, -0.0044863224029541016, -0.003978133201599121, -0.0034699440002441406, -0.00296175479888916, -0.0024535655975341797, -0.0019453763961791992, -0.0014371871948242188, -0.0009289979934692383, -0.0004208087921142578, 8.738040924072266e-05, 0.0005955696105957031, 0.0011037588119506836, 0.001611948013305664, 0.0021201372146606445, 0.002628326416015625, 0.0031365156173706055, 0.003644704818725586, 0.004152894020080566, 0.004661083221435547, 0.005169272422790527, 0.005677461624145508, 0.006185650825500488, 0.006693840026855469, 0.007202029228210449, 0.00771021842956543, 0.00821840763092041, 0.00872659683227539, 0.009234786033630371, 0.009742975234985352, 0.010251164436340332, 0.010759353637695312, 0.011267542839050293, 0.011775732040405273, 0.012283921241760254, 0.012792110443115234, 0.013300299644470215, 0.013808488845825195, 0.014316678047180176, 0.014824867248535156, 0.015333056449890137, 0.015841245651245117, 0.016349434852600098, 0.016857624053955078, 0.01736581325531006, 0.01787400245666504, 0.01838219165802002, 0.018890380859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 4.0, 9.0, 12.0, 16.0, 14.0, 20.0, 34.0, 47.0, 106.0, 454.0, 81.0, 41.0, 22.0, 21.0, 21.0, 13.0, 11.0, 8.0, 9.0, 4.0, 5.0, 4.0, 5.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003314018249511719, -0.0003217644989490509, -0.00031212717294692993, -0.00030248984694480896, -0.000292852520942688, -0.000283215194940567, -0.00027357786893844604, -0.0002639405429363251, -0.0002543032169342041, -0.00024466589093208313, -0.00023502856492996216, -0.0002253912389278412, -0.00021575391292572021, -0.00020611658692359924, -0.00019647926092147827, -0.0001868419349193573, -0.00017720460891723633, -0.00016756728291511536, -0.00015792995691299438, -0.0001482926309108734, -0.00013865530490875244, -0.00012901797890663147, -0.0001193806529045105, -0.00010974332690238953, -0.00010010600090026855, -9.046867489814758e-05, -8.083134889602661e-05, -7.119402289390564e-05, -6.155669689178467e-05, -5.1919370889663696e-05, -4.2282044887542725e-05, -3.264471888542175e-05, -2.300739288330078e-05, -1.337006688117981e-05, -3.732740879058838e-06, 5.904585123062134e-06, 1.5541911125183105e-05, 2.5179237127304077e-05, 3.481656312942505e-05, 4.445388913154602e-05, 5.409121513366699e-05, 6.372854113578796e-05, 7.336586713790894e-05, 8.300319314002991e-05, 9.264051914215088e-05, 0.00010227784514427185, 0.00011191517114639282, 0.0001215524971485138, 0.00013118982315063477, 0.00014082714915275574, 0.0001504644751548767, 0.00016010180115699768, 0.00016973912715911865, 0.00017937645316123962, 0.0001890137791633606, 0.00019865110516548157, 0.00020828843116760254, 0.0002179257571697235, 0.00022756308317184448, 0.00023720040917396545, 0.0002468377351760864, 0.0002564750611782074, 0.00026611238718032837, 0.00027574971318244934, 0.0002853870391845703]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 8.0, 7.0, 16.0, 33.0, 31.0, 84.0, 294.0, 8870.0, 1036859.0, 2005.0, 176.0, 63.0, 31.0, 28.0, 11.0, 14.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.026153564453125, -0.02541375160217285, -0.024673938751220703, -0.023934125900268555, -0.023194313049316406, -0.022454500198364258, -0.02171468734741211, -0.02097487449645996, -0.020235061645507812, -0.019495248794555664, -0.018755435943603516, -0.018015623092651367, -0.01727581024169922, -0.01653599739074707, -0.015796184539794922, -0.015056371688842773, -0.014316558837890625, -0.013576745986938477, -0.012836933135986328, -0.01209712028503418, -0.011357307434082031, -0.010617494583129883, -0.009877681732177734, -0.009137868881225586, -0.008398056030273438, -0.007658243179321289, -0.006918430328369141, -0.006178617477416992, -0.005438804626464844, -0.004698991775512695, -0.003959178924560547, -0.0032193660736083984, -0.00247955322265625, -0.0017397403717041016, -0.0009999275207519531, -0.0002601146697998047, 0.00047969818115234375, 0.0012195110321044922, 0.0019593238830566406, 0.002699136734008789, 0.0034389495849609375, 0.004178762435913086, 0.004918575286865234, 0.005658388137817383, 0.006398200988769531, 0.00713801383972168, 0.007877826690673828, 0.008617639541625977, 0.009357452392578125, 0.010097265243530273, 0.010837078094482422, 0.01157689094543457, 0.012316703796386719, 0.013056516647338867, 0.013796329498291016, 0.014536142349243164, 0.015275955200195312, 0.01601576805114746, 0.01675558090209961, 0.017495393753051758, 0.018235206604003906, 0.018975019454956055, 0.019714832305908203, 0.02045464515686035, 0.0211944580078125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 1.0, 5.0, 15.0, 13.0, 23.0, 22.0, 14.0, 52.0, 64.0, 147.0, 314.0, 119.0, 63.0, 43.0, 28.0, 23.0, 10.0, 9.0, 11.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007007598876953125, -0.006761133670806885, -0.0065146684646606445, -0.006268203258514404, -0.006021738052368164, -0.005775272846221924, -0.005528807640075684, -0.005282342433929443, -0.005035877227783203, -0.004789412021636963, -0.004542946815490723, -0.004296481609344482, -0.004050016403198242, -0.003803551197052002, -0.0035570859909057617, -0.0033106207847595215, -0.0030641555786132812, -0.002817690372467041, -0.0025712251663208008, -0.0023247599601745605, -0.0020782947540283203, -0.00183182954788208, -0.0015853643417358398, -0.0013388991355895996, -0.0010924339294433594, -0.0008459687232971191, -0.0005995035171508789, -0.00035303831100463867, -0.00010657310485839844, 0.0001398921012878418, 0.00038635730743408203, 0.0006328225135803223, 0.0008792877197265625, 0.0011257529258728027, 0.001372218132019043, 0.0016186833381652832, 0.0018651485443115234, 0.0021116137504577637, 0.002358078956604004, 0.002604544162750244, 0.0028510093688964844, 0.0030974745750427246, 0.003343939781188965, 0.003590404987335205, 0.0038368701934814453, 0.0040833353996276855, 0.004329800605773926, 0.004576265811920166, 0.004822731018066406, 0.0050691962242126465, 0.005315661430358887, 0.005562126636505127, 0.005808591842651367, 0.006055057048797607, 0.006301522254943848, 0.006547987461090088, 0.006794452667236328, 0.007040917873382568, 0.007287383079528809, 0.007533848285675049, 0.007780313491821289, 0.00802677869796753, 0.00827324390411377, 0.00851970911026001, 0.00876617431640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 49.0, 774.0, 176.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8410512208938599, -1.8073618412017822, -1.7736724615097046, -1.739983081817627, -1.7062937021255493, -1.6726043224334717, -1.638914942741394, -1.6052255630493164, -1.5715363025665283, -1.5378469228744507, -1.504157543182373, -1.4704681634902954, -1.4367787837982178, -1.4030894041061401, -1.3694000244140625, -1.3357107639312744, -1.3020212650299072, -1.2683318853378296, -1.234642505645752, -1.2009531259536743, -1.1672637462615967, -1.133574366569519, -1.0998849868774414, -1.0661957263946533, -1.0325062274932861, -0.9988168478012085, -0.9651274681091309, -0.9314380884170532, -0.8977487087249756, -0.864059329032898, -0.8303700089454651, -0.7966806292533875, -0.7629913091659546, -0.729301929473877, -0.6956125497817993, -0.6619231700897217, -0.628233790397644, -0.5945444107055664, -0.5608550906181335, -0.5271657109260559, -0.49347633123397827, -0.45978695154190063, -0.426097571849823, -0.39240822196006775, -0.3587188422679901, -0.3250294625759125, -0.2913401126861572, -0.2576507329940796, -0.22396135330200195, -0.19027197360992432, -0.15658260881900787, -0.12289323657751083, -0.0892038643360138, -0.05551448464393616, -0.021825119853019714, 0.011864244937896729, 0.045553624629974365, 0.0792429968714714, 0.11293236911296844, 0.1466217339038849, 0.18031111359596252, 0.21400049328804016, 0.2476898580789566, 0.28137922286987305, 0.3150686025619507]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 6.0, 10.0, 11.0, 5.0, 7.0, 18.0, 15.0, 12.0, 19.0, 12.0, 15.0, 19.0, 31.0, 24.0, 39.0, 34.0, 37.0, 43.0, 42.0, 30.0, 33.0, 31.0, 54.0, 40.0, 38.0, 32.0, 28.0, 29.0, 30.0, 39.0, 25.0, 28.0, 24.0, 23.0, 17.0, 18.0, 18.0, 11.0, 13.0, 8.0, 7.0, 7.0, 2.0, 5.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.20592063665390015, -0.1988634467124939, -0.19180627167224884, -0.18474909663200378, -0.17769190669059753, -0.17063471674919128, -0.16357754170894623, -0.15652036666870117, -0.14946317672729492, -0.14240598678588867, -0.13534881174564362, -0.12829163670539856, -0.12123444676399231, -0.11417726427316666, -0.107120081782341, -0.10006289929151535, -0.0930057168006897, -0.08594853430986404, -0.07889135181903839, -0.07183416932821274, -0.06477698683738708, -0.05771980434656143, -0.05066262185573578, -0.043605439364910126, -0.03654825687408447, -0.02949107438325882, -0.022433891892433167, -0.015376709401607513, -0.00831952691078186, -0.0012623444199562073, 0.005794838070869446, 0.012852020561695099, 0.019909203052520752, 0.026966385543346405, 0.03402356803417206, 0.04108075052499771, 0.048137933015823364, 0.05519511550664902, 0.06225229799747467, 0.06930948048830032, 0.07636666297912598, 0.08342384546995163, 0.09048102796077728, 0.09753821045160294, 0.10459539294242859, 0.11165257543325424, 0.1187097579240799, 0.12576693296432495, 0.1328241229057312, 0.13988131284713745, 0.1469384878873825, 0.15399566292762756, 0.1610528528690338, 0.16811004281044006, 0.17516721785068512, 0.18222439289093018, 0.18928158283233643, 0.19633877277374268, 0.20339594781398773, 0.2104531228542328, 0.21751031279563904, 0.2245675027370453, 0.23162467777729034, 0.2386818528175354, 0.24573904275894165]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 6.0, 8.0, 8.0, 14.0, 10.0, 18.0, 27.0, 48.0, 55.0, 76.0, 78.0, 97.0, 4193370.0, 87.0, 65.0, 66.0, 57.0, 43.0, 39.0, 26.0, 25.0, 13.0, 11.0, 10.0, 7.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.177734375, -0.17232513427734375, -0.1669158935546875, -0.16150665283203125, -0.156097412109375, -0.15068817138671875, -0.1452789306640625, -0.13986968994140625, -0.13446044921875, -0.12905120849609375, -0.1236419677734375, -0.11823272705078125, -0.112823486328125, -0.10741424560546875, -0.1020050048828125, -0.09659576416015625, -0.0911865234375, -0.08577728271484375, -0.0803680419921875, -0.07495880126953125, -0.069549560546875, -0.06414031982421875, -0.0587310791015625, -0.05332183837890625, -0.04791259765625, -0.04250335693359375, -0.0370941162109375, -0.03168487548828125, -0.026275634765625, -0.02086639404296875, -0.0154571533203125, -0.01004791259765625, -0.004638671875, 0.00077056884765625, 0.0061798095703125, 0.01158905029296875, 0.016998291015625, 0.02240753173828125, 0.0278167724609375, 0.03322601318359375, 0.03863525390625, 0.04404449462890625, 0.0494537353515625, 0.05486297607421875, 0.060272216796875, 0.06568145751953125, 0.0710906982421875, 0.07649993896484375, 0.0819091796875, 0.08731842041015625, 0.0927276611328125, 0.09813690185546875, 0.103546142578125, 0.10895538330078125, 0.1143646240234375, 0.11977386474609375, 0.12518310546875, 0.13059234619140625, 0.1360015869140625, 0.14141082763671875, 0.146820068359375, 0.15222930908203125, 0.1576385498046875, 0.16304779052734375, 0.16845703125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 5.0, 4.0, 10.0, 7.0, 16.0, 11.0, 26.0, 41.0, 52.0, 61.0, 81.0, 91.0, 100.0, 83.0, 72.0, 61.0, 69.0, 49.0, 43.0, 26.0, 26.0, 17.0, 8.0, 14.0, 6.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0203094482421875, -0.01967906951904297, -0.019048690795898438, -0.018418312072753906, -0.017787933349609375, -0.017157554626464844, -0.016527175903320312, -0.01589679718017578, -0.01526641845703125, -0.014636039733886719, -0.014005661010742188, -0.013375282287597656, -0.012744903564453125, -0.012114524841308594, -0.011484146118164062, -0.010853767395019531, -0.010223388671875, -0.009593009948730469, -0.008962631225585938, -0.008332252502441406, -0.007701873779296875, -0.007071495056152344, -0.0064411163330078125, -0.005810737609863281, -0.00518035888671875, -0.004549980163574219, -0.0039196014404296875, -0.0032892227172851562, -0.002658843994140625, -0.0020284652709960938, -0.0013980865478515625, -0.0007677078247070312, -0.0001373291015625, 0.0004930496215820312, 0.0011234283447265625, 0.0017538070678710938, 0.002384185791015625, 0.0030145645141601562, 0.0036449432373046875, 0.004275321960449219, 0.00490570068359375, 0.005536079406738281, 0.0061664581298828125, 0.006796836853027344, 0.007427215576171875, 0.008057594299316406, 0.008687973022460938, 0.009318351745605469, 0.00994873046875, 0.010579109191894531, 0.011209487915039062, 0.011839866638183594, 0.012470245361328125, 0.013100624084472656, 0.013731002807617188, 0.014361381530761719, 0.01499176025390625, 0.015622138977050781, 0.016252517700195312, 0.016882896423339844, 0.017513275146484375, 0.018143653869628906, 0.018774032592773438, 0.01940441131591797, 0.0200347900390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 3.0, 8.0, 6.0, 7.0, 9.0, 17.0, 25.0, 21.0, 21.0, 25.0, 35.0, 38.0, 46.0, 59.0, 88.0, 200.0, 1835.0, 4190965.0, 263.0, 129.0, 87.0, 66.0, 45.0, 36.0, 42.0, 33.0, 27.0, 29.0, 26.0, 13.0, 18.0, 14.0, 11.0, 11.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.004913330078125, -0.004784703254699707, -0.004656076431274414, -0.004527449607849121, -0.004398822784423828, -0.004270195960998535, -0.004141569137573242, -0.004012942314147949, -0.0038843154907226562, -0.0037556886672973633, -0.0036270618438720703, -0.0034984350204467773, -0.0033698081970214844, -0.0032411813735961914, -0.0031125545501708984, -0.0029839277267456055, -0.0028553009033203125, -0.0027266740798950195, -0.0025980472564697266, -0.0024694204330444336, -0.0023407936096191406, -0.0022121667861938477, -0.0020835399627685547, -0.0019549131393432617, -0.0018262863159179688, -0.0016976594924926758, -0.0015690326690673828, -0.0014404058456420898, -0.0013117790222167969, -0.001183152198791504, -0.001054525375366211, -0.000925898551940918, -0.000797271728515625, -0.000668644905090332, -0.0005400180816650391, -0.0004113912582397461, -0.0002827644348144531, -0.00015413761138916016, -2.5510787963867188e-05, 0.00010311603546142578, 0.00023174285888671875, 0.0003603696823120117, 0.0004889965057373047, 0.0006176233291625977, 0.0007462501525878906, 0.0008748769760131836, 0.0010035037994384766, 0.0011321306228637695, 0.0012607574462890625, 0.0013893842697143555, 0.0015180110931396484, 0.0016466379165649414, 0.0017752647399902344, 0.0019038915634155273, 0.0020325183868408203, 0.0021611452102661133, 0.0022897720336914062, 0.0024183988571166992, 0.002547025680541992, 0.002675652503967285, 0.002804279327392578, 0.002932906150817871, 0.003061532974243164, 0.003190159797668457, 0.00331878662109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [5.0, 4083.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0590763092041016e-05, -1.4564953744411469e-05, 1.1460855603218079e-05, 3.7486664950847626e-05, 6.351247429847717e-05, 8.953828364610672e-05, 0.00011556409299373627, 0.00014158990234136581, 0.00016761571168899536, 0.0001936415210366249, 0.00021966733038425446, 0.000245693139731884, 0.00027171894907951355, 0.0002977447584271431, 0.00032377056777477264, 0.0003497963771224022, 0.00037582218647003174, 0.0004018479958176613, 0.00042787380516529083, 0.0004538996145129204, 0.0004799254238605499, 0.0005059512332081795, 0.000531977042555809, 0.0005580028519034386, 0.0005840286612510681, 0.0006100544705986977, 0.0006360802799463272, 0.0006621060892939568, 0.0006881318986415863, 0.0007141577079892159, 0.0007401835173368454, 0.0007662093266844749, 0.0007922351360321045, 0.000818260945379734, 0.0008442867547273636, 0.0008703125640749931, 0.0008963383734226227, 0.0009223641827702522, 0.0009483899921178818, 0.0009744158014655113, 0.0010004416108131409, 0.0010264674201607704, 0.0010524932295084, 0.0010785190388560295, 0.001104544848203659, 0.0011305706575512886, 0.0011565964668989182, 0.0011826222762465477, 0.0012086480855941772, 0.0012346738949418068, 0.0012606997042894363, 0.0012867255136370659, 0.0013127513229846954, 0.001338777132332325, 0.0013648029416799545, 0.001390828751027584, 0.0014168545603752136, 0.0014428803697228432, 0.0014689061790704727, 0.0014949319884181023, 0.0015209577977657318, 0.0015469836071133614, 0.001573009416460991, 0.0015990352258086205, 0.00162506103515625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 16.0, 811.0, 176.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.016410663723945618, -0.01611698605120182, -0.015823308378458023, -0.0155296316370368, -0.015235954895615578, -0.01494227722287178, -0.014648599550127983, -0.01435492280870676, -0.014061245135962963, -0.013767567463219166, -0.013473890721797943, -0.013180213049054146, -0.012886536307632923, -0.012592858634889126, -0.012299181893467903, -0.012005504220724106, -0.011711826547980309, -0.011418148875236511, -0.011124472133815289, -0.010830794461071491, -0.010537117719650269, -0.010243440046906471, -0.009949762374162674, -0.009656085632741451, -0.009362408891320229, -0.009068731218576431, -0.008775054477155209, -0.008481376804411411, -0.008187700062990189, -0.007894022390246391, -0.007600345183163881, -0.007306667976081371, -0.007012990303337574, -0.006719313096255064, -0.006425635889172554, -0.006131958216428757, -0.005838281009346247, -0.005544603802263737, -0.005250926595181227, -0.004957249388098717, -0.004663572181016207, -0.004369894973933697, -0.004076217766851187, -0.003782540326938033, -0.0034888628870248795, -0.0031951856799423695, -0.0029015084728598595, -0.002607831032946706, -0.002314153825864196, -0.002020476618781686, -0.0017267991788685322, -0.0014331219717860222, -0.0011394446482881904, -0.0008457673247903585, -0.0005520901177078485, -0.0002584126777946949, 3.5264529287815094e-05, 0.00032894182368181646, 0.0006226191180758178, 0.0009162963833659887, 0.0012099737068638206, 0.0015036510303616524, 0.0017973282374441624, 0.002091005677357316, 0.002384682884439826]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 12.0, 18.0, 37.0, 63.0, 122.0, 172.0, 164.0, 142.0, 107.0, 79.0, 31.0, 28.0, 9.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014180541038513184, -0.001345757395029068, -0.0012734606862068176, -0.0012011639773845673, -0.001128867268562317, -0.0010565705597400665, -0.0009842738509178162, -0.0009119771420955658, -0.0008396804332733154, -0.0007673837244510651, -0.0006950870156288147, -0.0006227903068065643, -0.000550493597984314, -0.0004781968891620636, -0.00040590018033981323, -0.00033360347151756287, -0.0002613067626953125, -0.00018901005387306213, -0.00011671334505081177, -4.44166362285614e-05, 2.7880072593688965e-05, 0.00010017678141593933, 0.0001724734902381897, 0.00024477019906044006, 0.00031706690788269043, 0.0003893636167049408, 0.00046166032552719116, 0.0005339570343494415, 0.0006062537431716919, 0.0006785504519939423, 0.0007508471608161926, 0.000823143869638443, 0.0008954405784606934, 0.0009677372872829437, 0.001040033996105194, 0.0011123307049274445, 0.0011846274137496948, 0.0012569241225719452, 0.0013292208313941956, 0.001401517540216446, 0.0014738142490386963, 0.0015461109578609467, 0.001618407666683197, 0.0016907043755054474, 0.0017630010843276978, 0.0018352977931499481, 0.0019075945019721985, 0.001979891210794449, 0.0020521879196166992, 0.0021244846284389496, 0.0021967813372612, 0.0022690780460834503, 0.0023413747549057007, 0.002413671463727951, 0.0024859681725502014, 0.0025582648813724518, 0.002630561590194702, 0.0027028582990169525, 0.002775155007839203, 0.0028474517166614532, 0.0029197484254837036, 0.002992045134305954, 0.0030643418431282043, 0.0031366385519504547, 0.003208935260772705]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 6.0, 5.0, 4.0, 9.0, 10.0, 21.0, 25.0, 28.0, 49.0, 58.0, 91.0, 152.0, 230.0, 345.0, 574.0, 1024.0, 1986.0, 4118.0, 10061.0, 31578.0, 162042.0, 697282.0, 100448.0, 23091.0, 7939.0, 3451.0, 1617.0, 871.0, 553.0, 284.0, 185.0, 125.0, 81.0, 57.0, 50.0, 29.0, 19.0, 13.0, 15.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.03460693359375, -0.03350400924682617, -0.032401084899902344, -0.031298160552978516, -0.030195236206054688, -0.02909231185913086, -0.02798938751220703, -0.026886463165283203, -0.025783538818359375, -0.024680614471435547, -0.02357769012451172, -0.02247476577758789, -0.021371841430664062, -0.020268917083740234, -0.019165992736816406, -0.018063068389892578, -0.01696014404296875, -0.015857219696044922, -0.014754295349121094, -0.013651371002197266, -0.012548446655273438, -0.01144552230834961, -0.010342597961425781, -0.009239673614501953, -0.008136749267578125, -0.007033824920654297, -0.005930900573730469, -0.004827976226806641, -0.0037250518798828125, -0.0026221275329589844, -0.0015192031860351562, -0.0004162788391113281, 0.0006866455078125, 0.0017895698547363281, 0.0028924942016601562, 0.003995418548583984, 0.0050983428955078125, 0.006201267242431641, 0.007304191589355469, 0.008407115936279297, 0.009510040283203125, 0.010612964630126953, 0.011715888977050781, 0.01281881332397461, 0.013921737670898438, 0.015024662017822266, 0.016127586364746094, 0.017230510711669922, 0.01833343505859375, 0.019436359405517578, 0.020539283752441406, 0.021642208099365234, 0.022745132446289062, 0.02384805679321289, 0.02495098114013672, 0.026053905487060547, 0.027156829833984375, 0.028259754180908203, 0.02936267852783203, 0.03046560287475586, 0.03156852722167969, 0.032671451568603516, 0.033774375915527344, 0.03487730026245117, 0.035980224609375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 5.0, 4.0, 10.0, 9.0, 14.0, 11.0, 28.0, 39.0, 53.0, 60.0, 80.0, 92.0, 100.0, 85.0, 71.0, 60.0, 72.0, 46.0, 44.0, 26.0, 25.0, 17.0, 8.0, 14.0, 6.0, 3.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0203094482421875, -0.019678831100463867, -0.019048213958740234, -0.0184175968170166, -0.01778697967529297, -0.017156362533569336, -0.016525745391845703, -0.01589512825012207, -0.015264511108398438, -0.014633893966674805, -0.014003276824951172, -0.013372659683227539, -0.012742042541503906, -0.012111425399780273, -0.01148080825805664, -0.010850191116333008, -0.010219573974609375, -0.009588956832885742, -0.00895833969116211, -0.008327722549438477, -0.007697105407714844, -0.007066488265991211, -0.006435871124267578, -0.005805253982543945, -0.0051746368408203125, -0.00454401969909668, -0.003913402557373047, -0.003282785415649414, -0.0026521682739257812, -0.0020215511322021484, -0.0013909339904785156, -0.0007603168487548828, -0.00012969970703125, 0.0005009174346923828, 0.0011315345764160156, 0.0017621517181396484, 0.0023927688598632812, 0.003023386001586914, 0.003654003143310547, 0.00428462028503418, 0.0049152374267578125, 0.005545854568481445, 0.006176471710205078, 0.006807088851928711, 0.007437705993652344, 0.008068323135375977, 0.00869894027709961, 0.009329557418823242, 0.009960174560546875, 0.010590791702270508, 0.01122140884399414, 0.011852025985717773, 0.012482643127441406, 0.013113260269165039, 0.013743877410888672, 0.014374494552612305, 0.015005111694335938, 0.01563572883605957, 0.016266345977783203, 0.016896963119506836, 0.01752758026123047, 0.0181581974029541, 0.018788814544677734, 0.019419431686401367, 0.020050048828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 1.0, 5.0, 5.0, 7.0, 4.0, 9.0, 12.0, 12.0, 13.0, 21.0, 29.0, 36.0, 42.0, 59.0, 83.0, 148.0, 305.0, 865.0, 11790.0, 1010737.0, 22455.0, 1003.0, 385.0, 180.0, 87.0, 67.0, 44.0, 43.0, 19.0, 21.0, 21.0, 14.0, 8.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.105224609375, -0.10166549682617188, -0.09810638427734375, -0.09454727172851562, -0.0909881591796875, -0.08742904663085938, -0.08386993408203125, -0.08031082153320312, -0.076751708984375, -0.07319259643554688, -0.06963348388671875, -0.06607437133789062, -0.0625152587890625, -0.058956146240234375, -0.05539703369140625, -0.051837921142578125, -0.04827880859375, -0.044719696044921875, -0.04116058349609375, -0.037601470947265625, -0.0340423583984375, -0.030483245849609375, -0.02692413330078125, -0.023365020751953125, -0.019805908203125, -0.016246795654296875, -0.01268768310546875, -0.009128570556640625, -0.0055694580078125, -0.002010345458984375, 0.00154876708984375, 0.005107879638671875, 0.0086669921875, 0.012226104736328125, 0.01578521728515625, 0.019344329833984375, 0.0229034423828125, 0.026462554931640625, 0.03002166748046875, 0.033580780029296875, 0.037139892578125, 0.040699005126953125, 0.04425811767578125, 0.047817230224609375, 0.0513763427734375, 0.054935455322265625, 0.05849456787109375, 0.062053680419921875, 0.06561279296875, 0.06917190551757812, 0.07273101806640625, 0.07629013061523438, 0.0798492431640625, 0.08340835571289062, 0.08696746826171875, 0.09052658081054688, 0.094085693359375, 0.09764480590820312, 0.10120391845703125, 0.10476303100585938, 0.1083221435546875, 0.11188125610351562, 0.11544036865234375, 0.11899948120117188, 0.12255859375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 5.0, 11.0, 11.0, 12.0, 13.0, 12.0, 13.0, 21.0, 24.0, 34.0, 32.0, 37.0, 32.0, 24.0, 42.0, 49.0, 43.0, 42.0, 44.0, 40.0, 42.0, 43.0, 43.0, 40.0, 38.0, 38.0, 35.0, 26.0, 25.0, 21.0, 19.0, 19.0, 14.0, 11.0, 8.0, 15.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048187255859375, -0.046746253967285156, -0.04530525207519531, -0.04386425018310547, -0.042423248291015625, -0.04098224639892578, -0.03954124450683594, -0.038100242614746094, -0.03665924072265625, -0.035218238830566406, -0.03377723693847656, -0.03233623504638672, -0.030895233154296875, -0.02945423126220703, -0.028013229370117188, -0.026572227478027344, -0.0251312255859375, -0.023690223693847656, -0.022249221801757812, -0.02080821990966797, -0.019367218017578125, -0.01792621612548828, -0.016485214233398438, -0.015044212341308594, -0.01360321044921875, -0.012162208557128906, -0.010721206665039062, -0.009280204772949219, -0.007839202880859375, -0.006398200988769531, -0.0049571990966796875, -0.0035161972045898438, -0.0020751953125, -0.0006341934204101562, 0.0008068084716796875, 0.0022478103637695312, 0.003688812255859375, 0.005129814147949219, 0.0065708160400390625, 0.008011817932128906, 0.00945281982421875, 0.010893821716308594, 0.012334823608398438, 0.013775825500488281, 0.015216827392578125, 0.01665782928466797, 0.018098831176757812, 0.019539833068847656, 0.0209808349609375, 0.022421836853027344, 0.023862838745117188, 0.02530384063720703, 0.026744842529296875, 0.02818584442138672, 0.029626846313476562, 0.031067848205566406, 0.03250885009765625, 0.033949851989746094, 0.03539085388183594, 0.03683185577392578, 0.038272857666015625, 0.03971385955810547, 0.04115486145019531, 0.042595863342285156, 0.044036865234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 7.0, 6.0, 4.0, 8.0, 25.0, 33.0, 59.0, 203.0, 686.0, 8524.0, 1029593.0, 8397.0, 655.0, 172.0, 73.0, 27.0, 26.0, 16.0, 12.0, 4.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013671875, -0.013251185417175293, -0.012830495834350586, -0.012409806251525879, -0.011989116668701172, -0.011568427085876465, -0.011147737503051758, -0.01072704792022705, -0.010306358337402344, -0.009885668754577637, -0.00946497917175293, -0.009044289588928223, -0.008623600006103516, -0.008202910423278809, -0.0077822208404541016, -0.0073615312576293945, -0.0069408416748046875, -0.0065201520919799805, -0.0060994625091552734, -0.005678772926330566, -0.005258083343505859, -0.004837393760681152, -0.004416704177856445, -0.003996014595031738, -0.0035753250122070312, -0.0031546354293823242, -0.002733945846557617, -0.00231325626373291, -0.0018925666809082031, -0.001471877098083496, -0.001051187515258789, -0.000630497932434082, -0.000209808349609375, 0.00021088123321533203, 0.0006315708160400391, 0.001052260398864746, 0.0014729499816894531, 0.0018936395645141602, 0.002314329147338867, 0.0027350187301635742, 0.0031557083129882812, 0.0035763978958129883, 0.003997087478637695, 0.004417777061462402, 0.004838466644287109, 0.005259156227111816, 0.0056798458099365234, 0.0061005353927612305, 0.0065212249755859375, 0.0069419145584106445, 0.0073626041412353516, 0.007783293724060059, 0.008203983306884766, 0.008624672889709473, 0.00904536247253418, 0.009466052055358887, 0.009886741638183594, 0.0103074312210083, 0.010728120803833008, 0.011148810386657715, 0.011569499969482422, 0.011990189552307129, 0.012410879135131836, 0.012831568717956543, 0.01325225830078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 1.0, 5.0, 7.0, 10.0, 12.0, 17.0, 23.0, 29.0, 47.0, 79.0, 228.0, 283.0, 90.0, 48.0, 34.0, 17.0, 11.0, 14.0, 8.0, 8.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003342628479003906, -0.00032474473118782043, -0.00031522661447525024, -0.00030570849776268005, -0.00029619038105010986, -0.00028667226433753967, -0.0002771541476249695, -0.0002676360309123993, -0.0002581179141998291, -0.0002485997974872589, -0.00023908168077468872, -0.00022956356406211853, -0.00022004544734954834, -0.00021052733063697815, -0.00020100921392440796, -0.00019149109721183777, -0.00018197298049926758, -0.0001724548637866974, -0.0001629367470741272, -0.000153418630361557, -0.00014390051364898682, -0.00013438239693641663, -0.00012486428022384644, -0.00011534616351127625, -0.00010582804679870605, -9.630993008613586e-05, -8.679181337356567e-05, -7.727369666099548e-05, -6.775557994842529e-05, -5.82374632358551e-05, -4.871934652328491e-05, -3.920122981071472e-05, -2.968311309814453e-05, -2.016499638557434e-05, -1.064687967300415e-05, -1.12876296043396e-06, 8.38935375213623e-06, 1.790747046470642e-05, 2.742558717727661e-05, 3.69437038898468e-05, 4.646182060241699e-05, 5.597993731498718e-05, 6.549805402755737e-05, 7.501617074012756e-05, 8.453428745269775e-05, 9.405240416526794e-05, 0.00010357052087783813, 0.00011308863759040833, 0.00012260675430297852, 0.0001321248710155487, 0.0001416429877281189, 0.0001511611044406891, 0.00016067922115325928, 0.00017019733786582947, 0.00017971545457839966, 0.00018923357129096985, 0.00019875168800354004, 0.00020826980471611023, 0.00021778792142868042, 0.0002273060381412506, 0.0002368241548538208, 0.000246342271566391, 0.0002558603882789612, 0.00026537850499153137, 0.00027489662170410156]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 13.0, 8.0, 15.0, 34.0, 49.0, 77.0, 243.0, 2401.0, 1024924.0, 19918.0, 588.0, 128.0, 58.0, 25.0, 18.0, 10.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.015716552734375, -0.015221118927001953, -0.014725685119628906, -0.01423025131225586, -0.013734817504882812, -0.013239383697509766, -0.012743949890136719, -0.012248516082763672, -0.011753082275390625, -0.011257648468017578, -0.010762214660644531, -0.010266780853271484, -0.009771347045898438, -0.00927591323852539, -0.008780479431152344, -0.008285045623779297, -0.00778961181640625, -0.007294178009033203, -0.006798744201660156, -0.006303310394287109, -0.0058078765869140625, -0.005312442779541016, -0.004817008972167969, -0.004321575164794922, -0.003826141357421875, -0.003330707550048828, -0.0028352737426757812, -0.0023398399353027344, -0.0018444061279296875, -0.0013489723205566406, -0.0008535385131835938, -0.0003581047058105469, 0.0001373291015625, 0.0006327629089355469, 0.0011281967163085938, 0.0016236305236816406, 0.0021190643310546875, 0.0026144981384277344, 0.0031099319458007812, 0.003605365753173828, 0.004100799560546875, 0.004596233367919922, 0.005091667175292969, 0.005587100982666016, 0.0060825347900390625, 0.006577968597412109, 0.007073402404785156, 0.007568836212158203, 0.00806427001953125, 0.008559703826904297, 0.009055137634277344, 0.00955057144165039, 0.010046005249023438, 0.010541439056396484, 0.011036872863769531, 0.011532306671142578, 0.012027740478515625, 0.012523174285888672, 0.013018608093261719, 0.013514041900634766, 0.014009475708007812, 0.01450490951538086, 0.015000343322753906, 0.015495777130126953, 0.0159912109375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 2.0, 8.0, 10.0, 18.0, 15.0, 28.0, 20.0, 40.0, 66.0, 82.0, 118.0, 105.0, 122.0, 101.0, 64.0, 40.0, 32.0, 25.0, 19.0, 17.0, 13.0, 14.0, 4.0, 7.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.005321502685546875, -0.005158364772796631, -0.004995226860046387, -0.004832088947296143, -0.0046689510345458984, -0.004505813121795654, -0.00434267520904541, -0.004179537296295166, -0.004016399383544922, -0.0038532614707946777, -0.0036901235580444336, -0.0035269856452941895, -0.0033638477325439453, -0.003200709819793701, -0.003037571907043457, -0.002874433994293213, -0.0027112960815429688, -0.0025481581687927246, -0.0023850202560424805, -0.0022218823432922363, -0.002058744430541992, -0.001895606517791748, -0.001732468605041504, -0.0015693306922912598, -0.0014061927795410156, -0.0012430548667907715, -0.0010799169540405273, -0.0009167790412902832, -0.0007536411285400391, -0.0005905032157897949, -0.0004273653030395508, -0.00026422739028930664, -0.0001010894775390625, 6.204843521118164e-05, 0.00022518634796142578, 0.0003883242607116699, 0.0005514621734619141, 0.0007146000862121582, 0.0008777379989624023, 0.0010408759117126465, 0.0012040138244628906, 0.0013671517372131348, 0.001530289649963379, 0.001693427562713623, 0.0018565654754638672, 0.0020197033882141113, 0.0021828413009643555, 0.0023459792137145996, 0.0025091171264648438, 0.002672255039215088, 0.002835392951965332, 0.002998530864715576, 0.0031616687774658203, 0.0033248066902160645, 0.0034879446029663086, 0.0036510825157165527, 0.003814220428466797, 0.003977358341217041, 0.004140496253967285, 0.004303634166717529, 0.0044667720794677734, 0.004629909992218018, 0.004793047904968262, 0.004956185817718506, 0.00511932373046875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 11.0, 8.0, 15.0, 18.0, 34.0, 54.0, 85.0, 152.0, 214.0, 143.0, 80.0, 50.0, 32.0, 21.0, 18.0, 19.0, 13.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15116441249847412, -0.1470138430595398, -0.14286325871944427, -0.13871268928050995, -0.13456210494041443, -0.1304115355014801, -0.12626096606254578, -0.12211038917303085, -0.11795981228351593, -0.11380923539400101, -0.10965865850448608, -0.10550808906555176, -0.10135751217603683, -0.09720693528652191, -0.09305636584758759, -0.08890578895807266, -0.08475521206855774, -0.08060463517904282, -0.0764540582895279, -0.07230348885059357, -0.06815291196107864, -0.06400233507156372, -0.059851761907339096, -0.05570118874311447, -0.05155061185359955, -0.047400034964084625, -0.04324946179986, -0.039098888635635376, -0.03494831174612045, -0.03079773671925068, -0.026647161692380905, -0.02249658666551113, -0.01834602653980255, -0.014195451512932777, -0.010044876486063004, -0.00589430145919323, -0.0017437264323234558, 0.002406848594546318, 0.006557423621416092, 0.010707998648285866, 0.01485857367515564, 0.019009148702025414, 0.023159723728895187, 0.02731029875576496, 0.031460873782634735, 0.03561145067214966, 0.03976202383637428, 0.04391259700059891, 0.04806317389011383, 0.052213750779628754, 0.05636432394385338, 0.060514897108078, 0.06466547399759293, 0.06881605088710785, 0.07296662032604218, 0.0771171972155571, 0.08126777410507202, 0.08541835099458694, 0.08956892788410187, 0.0937194973230362, 0.09787007421255112, 0.10202065110206604, 0.10617122054100037, 0.11032179743051529, 0.11447237432003021]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 8.0, 5.0, 9.0, 6.0, 8.0, 13.0, 17.0, 20.0, 22.0, 17.0, 30.0, 22.0, 44.0, 35.0, 33.0, 45.0, 54.0, 36.0, 46.0, 49.0, 54.0, 51.0, 36.0, 45.0, 35.0, 34.0, 22.0, 31.0, 24.0, 18.0, 20.0, 13.0, 12.0, 10.0, 6.0, 11.0, 19.0, 8.0, 12.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0], "bins": [-0.24026131629943848, -0.23348981142044067, -0.22671830654144287, -0.21994680166244507, -0.21317531168460846, -0.20640380680561066, -0.19963230192661285, -0.19286079704761505, -0.18608930706977844, -0.17931780219078064, -0.17254629731178284, -0.16577479243278503, -0.15900330245494843, -0.15223179757595062, -0.14546029269695282, -0.13868878781795502, -0.13191728293895721, -0.1251457780599594, -0.1183742806315422, -0.1116027757525444, -0.1048312783241272, -0.0980597734451294, -0.09128826856613159, -0.08451676368713379, -0.07774526625871658, -0.07097376137971878, -0.06420226395130157, -0.05743075907230377, -0.05065925791859627, -0.04388775676488876, -0.03711625188589096, -0.030344750732183456, -0.023573249578475952, -0.016801748424768448, -0.010030245408415794, -0.003258742392063141, 0.0035127587616443634, 0.010284259915351868, 0.01705576479434967, 0.023827265948057175, 0.03059876710176468, 0.03737026825547218, 0.04414176940917969, 0.05091327428817749, 0.057684775441884995, 0.0644562765955925, 0.0712277814745903, 0.07799927890300751, 0.08477078378200531, 0.09154228866100311, 0.09831378608942032, 0.10508529096841812, 0.11185678839683533, 0.11862829327583313, 0.12539979815483093, 0.13217130303382874, 0.13894280791282654, 0.14571431279182434, 0.15248581767082214, 0.15925732254981995, 0.16602881252765656, 0.17280031740665436, 0.17957182228565216, 0.18634332716464996, 0.19311481714248657]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 7.0, 6.0, 6.0, 10.0, 11.0, 20.0, 37.0, 36.0, 63.0, 60.0, 77.0, 127.0, 225.0, 479.0, 2137.0, 4187797.0, 2077.0, 456.0, 217.0, 126.0, 87.0, 60.0, 35.0, 30.0, 18.0, 21.0, 25.0, 10.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00174713134765625, -0.0016857683658599854, -0.0016244053840637207, -0.001563042402267456, -0.0015016794204711914, -0.0014403164386749268, -0.0013789534568786621, -0.0013175904750823975, -0.0012562274932861328, -0.0011948645114898682, -0.0011335015296936035, -0.0010721385478973389, -0.0010107755661010742, -0.0009494125843048096, -0.0008880496025085449, -0.0008266866207122803, -0.0007653236389160156, -0.000703960657119751, -0.0006425976753234863, -0.0005812346935272217, -0.000519871711730957, -0.0004585087299346924, -0.00039714574813842773, -0.0003357827663421631, -0.00027441978454589844, -0.0002130568027496338, -0.00015169382095336914, -9.033083915710449e-05, -2.8967857360839844e-05, 3.2395124435424805e-05, 9.375810623168945e-05, 0.0001551210880279541, 0.00021648406982421875, 0.0002778470516204834, 0.00033921003341674805, 0.0004005730152130127, 0.00046193599700927734, 0.000523298978805542, 0.0005846619606018066, 0.0006460249423980713, 0.0007073879241943359, 0.0007687509059906006, 0.0008301138877868652, 0.0008914768695831299, 0.0009528398513793945, 0.0010142028331756592, 0.0010755658149719238, 0.0011369287967681885, 0.0011982917785644531, 0.0012596547603607178, 0.0013210177421569824, 0.001382380723953247, 0.0014437437057495117, 0.0015051066875457764, 0.001566469669342041, 0.0016278326511383057, 0.0016891956329345703, 0.001750558614730835, 0.0018119215965270996, 0.0018732845783233643, 0.001934647560119629, 0.0019960105419158936, 0.002057373523712158, 0.002118736505508423, 0.0021800994873046875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 7.0, 7.0, 13.0, 16.0, 32.0, 29.0, 53.0, 65.0, 76.0, 80.0, 95.0, 95.0, 91.0, 65.0, 65.0, 51.0, 39.0, 31.0, 20.0, 18.0, 12.0, 9.0, 7.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0202178955078125, -0.01959395408630371, -0.018970012664794922, -0.018346071243286133, -0.017722129821777344, -0.017098188400268555, -0.016474246978759766, -0.015850305557250977, -0.015226364135742188, -0.014602422714233398, -0.01397848129272461, -0.01335453987121582, -0.012730598449707031, -0.012106657028198242, -0.011482715606689453, -0.010858774185180664, -0.010234832763671875, -0.009610891342163086, -0.008986949920654297, -0.008363008499145508, -0.007739067077636719, -0.00711512565612793, -0.006491184234619141, -0.0058672428131103516, -0.0052433013916015625, -0.0046193599700927734, -0.003995418548583984, -0.0033714771270751953, -0.0027475357055664062, -0.002123594284057617, -0.0014996528625488281, -0.0008757114410400391, -0.00025177001953125, 0.00037217140197753906, 0.0009961128234863281, 0.0016200542449951172, 0.0022439956665039062, 0.0028679370880126953, 0.0034918785095214844, 0.0041158199310302734, 0.0047397613525390625, 0.0053637027740478516, 0.005987644195556641, 0.00661158561706543, 0.007235527038574219, 0.007859468460083008, 0.008483409881591797, 0.009107351303100586, 0.009731292724609375, 0.010355234146118164, 0.010979175567626953, 0.011603116989135742, 0.012227058410644531, 0.01285099983215332, 0.01347494125366211, 0.014098882675170898, 0.014722824096679688, 0.015346765518188477, 0.015970706939697266, 0.016594648361206055, 0.017218589782714844, 0.017842531204223633, 0.018466472625732422, 0.01909041404724121, 0.01971435546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 4.0, 6.0, 15.0, 16.0, 24.0, 25.0, 47.0, 73.0, 99.0, 159.0, 264.0, 444.0, 812.0, 7540.0, 4181688.0, 1503.0, 545.0, 365.0, 213.0, 151.0, 104.0, 61.0, 38.0, 27.0, 12.0, 14.0, 6.0, 5.0, 3.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013666152954101562, -0.001322820782661438, -0.0012790262699127197, -0.0012352317571640015, -0.0011914372444152832, -0.001147642731666565, -0.0011038482189178467, -0.0010600537061691284, -0.0010162591934204102, -0.0009724646806716919, -0.0009286701679229736, -0.0008848756551742554, -0.0008410811424255371, -0.0007972866296768188, -0.0007534921169281006, -0.0007096976041793823, -0.0006659030914306641, -0.0006221085786819458, -0.0005783140659332275, -0.0005345195531845093, -0.000490725040435791, -0.00044693052768707275, -0.0004031360149383545, -0.00035934150218963623, -0.00031554698944091797, -0.0002717524766921997, -0.00022795796394348145, -0.00018416345119476318, -0.00014036893844604492, -9.657442569732666e-05, -5.27799129486084e-05, -8.985400199890137e-06, 3.4809112548828125e-05, 7.860362529754639e-05, 0.00012239813804626465, 0.0001661926507949829, 0.00020998716354370117, 0.00025378167629241943, 0.0002975761890411377, 0.00034137070178985596, 0.0003851652145385742, 0.0004289597272872925, 0.00047275424003601074, 0.000516548752784729, 0.0005603432655334473, 0.0006041377782821655, 0.0006479322910308838, 0.000691726803779602, 0.0007355213165283203, 0.0007793158292770386, 0.0008231103420257568, 0.0008669048547744751, 0.0009106993675231934, 0.0009544938802719116, 0.0009982883930206299, 0.0010420829057693481, 0.0010858774185180664, 0.0011296719312667847, 0.001173466444015503, 0.0012172609567642212, 0.0012610554695129395, 0.0013048499822616577, 0.001348644495010376, 0.0013924390077590942, 0.0014362335205078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 4064.0, 9.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00035762786865234375, -0.00034628063440322876, -0.00033493340015411377, -0.0003235861659049988, -0.0003122389316558838, -0.0003008916974067688, -0.0002895444631576538, -0.0002781972289085388, -0.00026684999465942383, -0.00025550276041030884, -0.00024415552616119385, -0.00023280829191207886, -0.00022146105766296387, -0.00021011382341384888, -0.0001987665891647339, -0.0001874193549156189, -0.0001760721206665039, -0.00016472488641738892, -0.00015337765216827393, -0.00014203041791915894, -0.00013068318367004395, -0.00011933594942092896, -0.00010798871517181396, -9.664148092269897e-05, -8.529424667358398e-05, -7.3947012424469e-05, -6.2599778175354e-05, -5.1252543926239014e-05, -3.9905309677124023e-05, -2.8558075428009033e-05, -1.7210841178894043e-05, -5.863606929779053e-06, 5.4836273193359375e-06, 1.6830861568450928e-05, 2.8178095817565918e-05, 3.952533006668091e-05, 5.08725643157959e-05, 6.221979856491089e-05, 7.356703281402588e-05, 8.491426706314087e-05, 9.626150131225586e-05, 0.00010760873556137085, 0.00011895596981048584, 0.00013030320405960083, 0.00014165043830871582, 0.0001529976725578308, 0.0001643449068069458, 0.0001756921410560608, 0.00018703937530517578, 0.00019838660955429077, 0.00020973384380340576, 0.00022108107805252075, 0.00023242831230163574, 0.00024377554655075073, 0.0002551227807998657, 0.0002664700150489807, 0.0002778172492980957, 0.0002891644835472107, 0.0003005117177963257, 0.0003118589520454407, 0.00032320618629455566, 0.00033455342054367065, 0.00034590065479278564, 0.00035724788904190063, 0.0003685951232910156]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 39.0, 921.0, 47.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00319444527849555, -0.0030787005089223385, -0.002962955739349127, -0.002847210969775915, -0.00273146596737206, -0.002615721197798848, -0.0024999764282256365, -0.002384231658652425, -0.002268486889079213, -0.0021527421195060015, -0.00203699734993279, -0.0019212524639442563, -0.0018055076943710446, -0.0016897628083825111, -0.0015740180388092995, -0.0014582732692360878, -0.0013425283832475543, -0.0012267836136743426, -0.0011110387276858091, -0.0009952939581125975, -0.0008795491885393858, -0.0007638043607585132, -0.0006480595329776406, -0.000532314763404429, -0.0004165699356235564, -0.00030082513694651425, -0.0001850803237175569, -6.933551048859954e-05, 4.640928818844259e-05, 0.00016215408686548471, 0.0002778989146463573, 0.00039364368421956897, 0.0005093885120004416, 0.0006251333397813141, 0.0007408781093545258, 0.0008566229371353984, 0.0009723677067086101, 0.0010881125926971436, 0.0012038573622703552, 0.001319602131843567, 0.0014353469014167786, 0.0015510916709899902, 0.0016668365569785237, 0.0017825813265517354, 0.001898326096124947, 0.0020140709821134806, 0.0021298157516866922, 0.002245560521259904, 0.0023613055236637592, 0.002477050293236971, 0.0025927950628101826, 0.0027085398323833942, 0.0028242848347872496, 0.0029400296043604612, 0.003055774373933673, 0.0031715191435068846, 0.0032872639130800962, 0.003403008682653308, 0.0035187534522265196, 0.003634498454630375, 0.0037502432242035866, 0.0038659879937767982, 0.00398173276335001, 0.004097477532923222, 0.004213222302496433]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 22.0, 44.0, 31.0, 58.0, 79.0, 91.0, 94.0, 111.0, 92.0, 86.0, 85.0, 58.0, 40.0, 28.0, 27.0, 12.0, 11.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032806396484375, -0.00031471624970436096, -0.0003013685345649719, -0.0002880208194255829, -0.00027467310428619385, -0.0002613253891468048, -0.00024797767400741577, -0.00023462995886802673, -0.0002212822437286377, -0.00020793452858924866, -0.00019458681344985962, -0.00018123909831047058, -0.00016789138317108154, -0.0001545436680316925, -0.00014119595289230347, -0.00012784823775291443, -0.00011450052261352539, -0.00010115280747413635, -8.780509233474731e-05, -7.445737719535828e-05, -6.110966205596924e-05, -4.77619469165802e-05, -3.441423177719116e-05, -2.1066516637802124e-05, -7.718801498413086e-06, 5.628913640975952e-06, 1.897662878036499e-05, 3.232434391975403e-05, 4.5672059059143066e-05, 5.9019774198532104e-05, 7.236748933792114e-05, 8.571520447731018e-05, 9.906291961669922e-05, 0.00011241063475608826, 0.0001257583498954773, 0.00013910606503486633, 0.00015245378017425537, 0.0001658014953136444, 0.00017914921045303345, 0.00019249692559242249, 0.00020584464073181152, 0.00021919235587120056, 0.0002325400710105896, 0.00024588778614997864, 0.0002592355012893677, 0.0002725832164287567, 0.00028593093156814575, 0.0002992786467075348, 0.00031262636184692383, 0.00032597407698631287, 0.0003393217921257019, 0.00035266950726509094, 0.00036601722240448, 0.000379364937543869, 0.00039271265268325806, 0.0004060603678226471, 0.00041940808296203613, 0.00043275579810142517, 0.0004461035132408142, 0.00045945122838020325, 0.0004727989435195923, 0.0004861466586589813, 0.0004994943737983704, 0.0005128420889377594, 0.0005261898040771484]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 8.0, 13.0, 20.0, 27.0, 42.0, 47.0, 63.0, 81.0, 142.0, 215.0, 307.0, 442.0, 794.0, 1362.0, 2374.0, 4618.0, 10207.0, 25876.0, 83979.0, 520448.0, 299400.0, 60011.0, 20329.0, 8389.0, 4014.0, 2134.0, 1137.0, 709.0, 444.0, 272.0, 183.0, 130.0, 91.0, 65.0, 43.0, 36.0, 21.0, 18.0, 10.0, 13.0, 6.0, 3.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.024627685546875, -0.02387857437133789, -0.02312946319580078, -0.022380352020263672, -0.021631240844726562, -0.020882129669189453, -0.020133018493652344, -0.019383907318115234, -0.018634796142578125, -0.017885684967041016, -0.017136573791503906, -0.016387462615966797, -0.015638351440429688, -0.014889240264892578, -0.014140129089355469, -0.01339101791381836, -0.01264190673828125, -0.01189279556274414, -0.011143684387207031, -0.010394573211669922, -0.009645462036132812, -0.008896350860595703, -0.008147239685058594, -0.007398128509521484, -0.006649017333984375, -0.005899906158447266, -0.005150794982910156, -0.004401683807373047, -0.0036525726318359375, -0.002903461456298828, -0.0021543502807617188, -0.0014052391052246094, -0.0006561279296875, 9.298324584960938e-05, 0.0008420944213867188, 0.0015912055969238281, 0.0023403167724609375, 0.003089427947998047, 0.0038385391235351562, 0.004587650299072266, 0.005336761474609375, 0.006085872650146484, 0.006834983825683594, 0.007584095001220703, 0.008333206176757812, 0.009082317352294922, 0.009831428527832031, 0.01058053970336914, 0.01132965087890625, 0.01207876205444336, 0.012827873229980469, 0.013576984405517578, 0.014326095581054688, 0.015075206756591797, 0.015824317932128906, 0.016573429107666016, 0.017322540283203125, 0.018071651458740234, 0.018820762634277344, 0.019569873809814453, 0.020318984985351562, 0.021068096160888672, 0.02181720733642578, 0.02256631851196289, 0.0233154296875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 7.0, 7.0, 12.0, 17.0, 32.0, 28.0, 54.0, 63.0, 76.0, 80.0, 96.0, 92.0, 94.0, 66.0, 64.0, 52.0, 39.0, 31.0, 19.0, 19.0, 12.0, 9.0, 6.0, 9.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0202178955078125, -0.019594192504882812, -0.018970489501953125, -0.018346786499023438, -0.01772308349609375, -0.017099380493164062, -0.016475677490234375, -0.015851974487304688, -0.015228271484375, -0.014604568481445312, -0.013980865478515625, -0.013357162475585938, -0.01273345947265625, -0.012109756469726562, -0.011486053466796875, -0.010862350463867188, -0.0102386474609375, -0.009614944458007812, -0.008991241455078125, -0.008367538452148438, -0.00774383544921875, -0.0071201324462890625, -0.006496429443359375, -0.0058727264404296875, -0.0052490234375, -0.0046253204345703125, -0.004001617431640625, -0.0033779144287109375, -0.00275421142578125, -0.0021305084228515625, -0.001506805419921875, -0.0008831024169921875, -0.0002593994140625, 0.0003643035888671875, 0.000988006591796875, 0.0016117095947265625, 0.00223541259765625, 0.0028591156005859375, 0.003482818603515625, 0.0041065216064453125, 0.004730224609375, 0.0053539276123046875, 0.005977630615234375, 0.0066013336181640625, 0.00722503662109375, 0.007848739624023438, 0.008472442626953125, 0.009096145629882812, 0.0097198486328125, 0.010343551635742188, 0.010967254638671875, 0.011590957641601562, 0.01221466064453125, 0.012838363647460938, 0.013462066650390625, 0.014085769653320312, 0.01470947265625, 0.015333175659179688, 0.015956878662109375, 0.016580581665039062, 0.01720428466796875, 0.017827987670898438, 0.018451690673828125, 0.019075393676757812, 0.0196990966796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 6.0, 11.0, 14.0, 10.0, 13.0, 22.0, 21.0, 26.0, 33.0, 47.0, 42.0, 90.0, 120.0, 197.0, 386.0, 1004.0, 9510.0, 895738.0, 136390.0, 3325.0, 689.0, 283.0, 149.0, 107.0, 66.0, 40.0, 48.0, 30.0, 24.0, 17.0, 15.0, 13.0, 11.0, 6.0, 7.0, 7.0, 6.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0736083984375, -0.07121944427490234, -0.06883049011230469, -0.06644153594970703, -0.06405258178710938, -0.06166362762451172, -0.05927467346191406, -0.056885719299316406, -0.05449676513671875, -0.052107810974121094, -0.04971885681152344, -0.04732990264892578, -0.044940948486328125, -0.04255199432373047, -0.04016304016113281, -0.037774085998535156, -0.0353851318359375, -0.032996177673339844, -0.030607223510742188, -0.02821826934814453, -0.025829315185546875, -0.02344036102294922, -0.021051406860351562, -0.018662452697753906, -0.01627349853515625, -0.013884544372558594, -0.011495590209960938, -0.009106636047363281, -0.006717681884765625, -0.004328727722167969, -0.0019397735595703125, 0.00044918060302734375, 0.002838134765625, 0.005227088928222656, 0.0076160430908203125, 0.010004997253417969, 0.012393951416015625, 0.014782905578613281, 0.017171859741210938, 0.019560813903808594, 0.02194976806640625, 0.024338722229003906, 0.026727676391601562, 0.02911663055419922, 0.031505584716796875, 0.03389453887939453, 0.03628349304199219, 0.038672447204589844, 0.0410614013671875, 0.043450355529785156, 0.04583930969238281, 0.04822826385498047, 0.050617218017578125, 0.05300617218017578, 0.05539512634277344, 0.057784080505371094, 0.06017303466796875, 0.0625619888305664, 0.06495094299316406, 0.06733989715576172, 0.06972885131835938, 0.07211780548095703, 0.07450675964355469, 0.07689571380615234, 0.07928466796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 7.0, 5.0, 6.0, 7.0, 10.0, 15.0, 15.0, 11.0, 15.0, 21.0, 32.0, 22.0, 31.0, 31.0, 22.0, 45.0, 42.0, 37.0, 41.0, 25.0, 47.0, 52.0, 37.0, 21.0, 31.0, 52.0, 40.0, 18.0, 22.0, 22.0, 31.0, 33.0, 21.0, 17.0, 18.0, 14.0, 10.0, 10.0, 13.0, 10.0, 9.0, 5.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032684326171875, -0.031556129455566406, -0.030427932739257812, -0.02929973602294922, -0.028171539306640625, -0.02704334259033203, -0.025915145874023438, -0.024786949157714844, -0.02365875244140625, -0.022530555725097656, -0.021402359008789062, -0.02027416229248047, -0.019145965576171875, -0.01801776885986328, -0.016889572143554688, -0.015761375427246094, -0.0146331787109375, -0.013504981994628906, -0.012376785278320312, -0.011248588562011719, -0.010120391845703125, -0.008992195129394531, -0.007863998413085938, -0.006735801696777344, -0.00560760498046875, -0.004479408264160156, -0.0033512115478515625, -0.0022230148315429688, -0.001094818115234375, 3.337860107421875e-05, 0.0011615753173828125, 0.0022897720336914062, 0.00341796875, 0.004546165466308594, 0.0056743621826171875, 0.006802558898925781, 0.007930755615234375, 0.009058952331542969, 0.010187149047851562, 0.011315345764160156, 0.01244354248046875, 0.013571739196777344, 0.014699935913085938, 0.01582813262939453, 0.016956329345703125, 0.01808452606201172, 0.019212722778320312, 0.020340919494628906, 0.0214691162109375, 0.022597312927246094, 0.023725509643554688, 0.02485370635986328, 0.025981903076171875, 0.02711009979248047, 0.028238296508789062, 0.029366493225097656, 0.03049468994140625, 0.031622886657714844, 0.03275108337402344, 0.03387928009033203, 0.035007476806640625, 0.03613567352294922, 0.03726387023925781, 0.038392066955566406, 0.039520263671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 9.0, 36.0, 100.0, 1110.0, 1046273.0, 848.0, 97.0, 22.0, 17.0, 9.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.052703857421875, -0.05151820182800293, -0.05033254623413086, -0.04914689064025879, -0.04796123504638672, -0.04677557945251465, -0.04558992385864258, -0.04440426826477051, -0.04321861267089844, -0.04203295707702637, -0.0408473014831543, -0.03966164588928223, -0.038475990295410156, -0.037290334701538086, -0.036104679107666016, -0.034919023513793945, -0.033733367919921875, -0.032547712326049805, -0.031362056732177734, -0.030176401138305664, -0.028990745544433594, -0.027805089950561523, -0.026619434356689453, -0.025433778762817383, -0.024248123168945312, -0.023062467575073242, -0.021876811981201172, -0.0206911563873291, -0.01950550079345703, -0.01831984519958496, -0.01713418960571289, -0.01594853401184082, -0.01476287841796875, -0.01357722282409668, -0.01239156723022461, -0.011205911636352539, -0.010020256042480469, -0.008834600448608398, -0.007648944854736328, -0.006463289260864258, -0.0052776336669921875, -0.004091978073120117, -0.002906322479248047, -0.0017206668853759766, -0.0005350112915039062, 0.0006506443023681641, 0.0018362998962402344, 0.0030219554901123047, 0.004207611083984375, 0.005393266677856445, 0.006578922271728516, 0.007764577865600586, 0.008950233459472656, 0.010135889053344727, 0.011321544647216797, 0.012507200241088867, 0.013692855834960938, 0.014878511428833008, 0.016064167022705078, 0.01724982261657715, 0.01843547821044922, 0.01962113380432129, 0.02080678939819336, 0.02199244499206543, 0.0231781005859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 20.0, 621.0, 317.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005645751953125, -0.0005450323224067688, -0.0005254894495010376, -0.0005059465765953064, -0.0004864037036895752, -0.000466860830783844, -0.0004473179578781128, -0.0004277750849723816, -0.0004082322120666504, -0.0003886893391609192, -0.000369146466255188, -0.0003496035933494568, -0.0003300607204437256, -0.0003105178475379944, -0.0002909749746322632, -0.000271432101726532, -0.0002518892288208008, -0.00023234635591506958, -0.00021280348300933838, -0.00019326061010360718, -0.00017371773719787598, -0.00015417486429214478, -0.00013463199138641357, -0.00011508911848068237, -9.554624557495117e-05, -7.600337266921997e-05, -5.646049976348877e-05, -3.691762685775757e-05, -1.7374753952026367e-05, 2.168118953704834e-06, 2.1710991859436035e-05, 4.1253864765167236e-05, 6.079673767089844e-05, 8.033961057662964e-05, 9.988248348236084e-05, 0.00011942535638809204, 0.00013896822929382324, 0.00015851110219955444, 0.00017805397510528564, 0.00019759684801101685, 0.00021713972091674805, 0.00023668259382247925, 0.00025622546672821045, 0.00027576833963394165, 0.00029531121253967285, 0.00031485408544540405, 0.00033439695835113525, 0.00035393983125686646, 0.00037348270416259766, 0.00039302557706832886, 0.00041256844997406006, 0.00043211132287979126, 0.00045165419578552246, 0.00047119706869125366, 0.0004907399415969849, 0.0005102828145027161, 0.0005298256874084473, 0.0005493685603141785, 0.0005689114332199097, 0.0005884543061256409, 0.0006079971790313721, 0.0006275400519371033, 0.0006470829248428345, 0.0006666257977485657, 0.0006861686706542969]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 18.0, 33.0, 140.0, 561.0, 1042538.0, 4937.0, 228.0, 59.0, 13.0, 8.0, 10.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0172882080078125, -0.015819311141967773, -0.014350414276123047, -0.01288151741027832, -0.011412620544433594, -0.009943723678588867, -0.00847482681274414, -0.007005929946899414, -0.0055370330810546875, -0.004068136215209961, -0.0025992393493652344, -0.0011303424835205078, 0.00033855438232421875, 0.0018074512481689453, 0.003276348114013672, 0.0047452449798583984, 0.006214141845703125, 0.0076830387115478516, 0.009151935577392578, 0.010620832443237305, 0.012089729309082031, 0.013558626174926758, 0.015027523040771484, 0.01649641990661621, 0.017965316772460938, 0.019434213638305664, 0.02090311050415039, 0.022372007369995117, 0.023840904235839844, 0.02530980110168457, 0.026778697967529297, 0.028247594833374023, 0.02971649169921875, 0.031185388565063477, 0.0326542854309082, 0.03412318229675293, 0.035592079162597656, 0.03706097602844238, 0.03852987289428711, 0.039998769760131836, 0.04146766662597656, 0.04293656349182129, 0.044405460357666016, 0.04587435722351074, 0.04734325408935547, 0.048812150955200195, 0.05028104782104492, 0.05174994468688965, 0.053218841552734375, 0.0546877384185791, 0.05615663528442383, 0.057625532150268555, 0.05909442901611328, 0.06056332588195801, 0.062032222747802734, 0.06350111961364746, 0.06497001647949219, 0.06643891334533691, 0.06790781021118164, 0.06937670707702637, 0.0708456039428711, 0.07231450080871582, 0.07378339767456055, 0.07525229454040527, 0.07672119140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 10.0, 12.0, 26.0, 80.0, 342.0, 369.0, 88.0, 47.0, 19.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03271484375, -0.03204786777496338, -0.03138089179992676, -0.030713915824890137, -0.030046939849853516, -0.029379963874816895, -0.028712987899780273, -0.028046011924743652, -0.02737903594970703, -0.02671205997467041, -0.02604508399963379, -0.025378108024597168, -0.024711132049560547, -0.024044156074523926, -0.023377180099487305, -0.022710204124450684, -0.022043228149414062, -0.02137625217437744, -0.02070927619934082, -0.0200423002243042, -0.019375324249267578, -0.018708348274230957, -0.018041372299194336, -0.017374396324157715, -0.016707420349121094, -0.016040444374084473, -0.015373468399047852, -0.01470649242401123, -0.01403951644897461, -0.013372540473937988, -0.012705564498901367, -0.012038588523864746, -0.011371612548828125, -0.010704636573791504, -0.010037660598754883, -0.009370684623718262, -0.00870370864868164, -0.00803673267364502, -0.0073697566986083984, -0.006702780723571777, -0.006035804748535156, -0.005368828773498535, -0.004701852798461914, -0.004034876823425293, -0.003367900848388672, -0.0027009248733520508, -0.0020339488983154297, -0.0013669729232788086, -0.0006999969482421875, -3.3020973205566406e-05, 0.0006339550018310547, 0.0013009309768676758, 0.001967906951904297, 0.002634882926940918, 0.003301858901977539, 0.00396883487701416, 0.004635810852050781, 0.005302786827087402, 0.0059697628021240234, 0.0066367387771606445, 0.007303714752197266, 0.007970690727233887, 0.008637666702270508, 0.009304642677307129, 0.00997161865234375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 15.0, 291.0, 668.0, 38.0, 6.0, 2.0, 1.0, 1.0], "bins": [-1.9654268026351929, -1.9315918684005737, -1.8977569341659546, -1.8639219999313354, -1.8300870656967163, -1.7962521314620972, -1.762417197227478, -1.7285822629928589, -1.6947473287582397, -1.6609123945236206, -1.6270774602890015, -1.5932425260543823, -1.5594075918197632, -1.525572657585144, -1.491737723350525, -1.4579027891159058, -1.4240678548812866, -1.3902329206466675, -1.3563979864120483, -1.3225630521774292, -1.28872811794281, -1.254893183708191, -1.2210582494735718, -1.1872233152389526, -1.1533883810043335, -1.1195534467697144, -1.0857185125350952, -1.051883578300476, -1.018048644065857, -0.9842137098312378, -0.9503787755966187, -0.9165438413619995, -0.8827088475227356, -0.8488739132881165, -0.8150389790534973, -0.7812040448188782, -0.747369110584259, -0.7135341763496399, -0.6796992421150208, -0.6458643078804016, -0.6120293736457825, -0.5781944394111633, -0.5443595051765442, -0.510524570941925, -0.4766896367073059, -0.44285470247268677, -0.4090197682380676, -0.3751848340034485, -0.34134989976882935, -0.3075149655342102, -0.27368003129959106, -0.23984509706497192, -0.20601016283035278, -0.17217522859573364, -0.1383402943611145, -0.10450536012649536, -0.07067042589187622, -0.03683549165725708, -0.0030005574226379395, 0.0308343768119812, 0.06466931104660034, 0.09850424528121948, 0.13233917951583862, 0.16617411375045776, 0.2000090479850769]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 3.0, 5.0, 9.0, 11.0, 9.0, 7.0, 10.0, 21.0, 11.0, 19.0, 22.0, 24.0, 31.0, 28.0, 31.0, 39.0, 31.0, 38.0, 43.0, 43.0, 44.0, 46.0, 27.0, 48.0, 27.0, 31.0, 41.0, 28.0, 30.0, 32.0, 30.0, 28.0, 25.0, 23.0, 20.0, 11.0, 15.0, 10.0, 7.0, 11.0, 6.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.18563055992126465, -0.18013067543506622, -0.1746307909488678, -0.16913089156150818, -0.16363100707530975, -0.15813112258911133, -0.1526312232017517, -0.14713133871555328, -0.14163145422935486, -0.13613156974315643, -0.130631685256958, -0.1251317858695984, -0.11963190138339996, -0.11413201689720154, -0.10863212496042252, -0.1031322330236435, -0.09763234853744507, -0.09213246405124664, -0.08663257211446762, -0.0811326801776886, -0.07563279569149017, -0.07013291120529175, -0.06463301926851273, -0.059133131057024, -0.05363324284553528, -0.048133354634046555, -0.04263346642255783, -0.03713357821106911, -0.03163368999958038, -0.02613380178809166, -0.020633913576602936, -0.015134025365114212, -0.009634137153625488, -0.0041342489421367645, 0.0013656392693519592, 0.006865527480840683, 0.012365415692329407, 0.01786530390381813, 0.023365192115306854, 0.028865080326795578, 0.0343649685382843, 0.039864856749773026, 0.04536474496126175, 0.05086463317275047, 0.0563645213842392, 0.06186440959572792, 0.06736429780721664, 0.07286418974399567, 0.07836407423019409, 0.08386395871639252, 0.08936385065317154, 0.09486374258995056, 0.10036362707614899, 0.10586351156234741, 0.11136340349912643, 0.11686329543590546, 0.12236317992210388, 0.1278630644083023, 0.13336294889450073, 0.13886284828186035, 0.14436273276805878, 0.1498626172542572, 0.15536251664161682, 0.16086240112781525, 0.16636228561401367]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 4.0, 8.0, 3.0, 7.0, 15.0, 33.0, 30.0, 39.0, 50.0, 77.0, 105.0, 159.0, 238.0, 414.0, 837.0, 2128.0, 7651.0, 4172090.0, 6660.0, 1820.0, 752.0, 379.0, 220.0, 129.0, 102.0, 96.0, 55.0, 39.0, 27.0, 22.0, 21.0, 11.0, 11.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0004711151123046875, -0.0004565976560115814, -0.00044208019971847534, -0.00042756274342536926, -0.0004130452871322632, -0.0003985278308391571, -0.000384010374546051, -0.00036949291825294495, -0.00035497546195983887, -0.0003404580056667328, -0.0003259405493736267, -0.00031142309308052063, -0.00029690563678741455, -0.00028238818049430847, -0.0002678707242012024, -0.0002533532679080963, -0.00023883581161499023, -0.00022431835532188416, -0.00020980089902877808, -0.000195283442735672, -0.00018076598644256592, -0.00016624853014945984, -0.00015173107385635376, -0.00013721361756324768, -0.0001226961612701416, -0.00010817870497703552, -9.366124868392944e-05, -7.914379239082336e-05, -6.462633609771729e-05, -5.0108879804611206e-05, -3.559142351150513e-05, -2.1073967218399048e-05, -6.556510925292969e-06, 7.96094536781311e-06, 2.247840166091919e-05, 3.699585795402527e-05, 5.151331424713135e-05, 6.603077054023743e-05, 8.05482268333435e-05, 9.506568312644958e-05, 0.00010958313941955566, 0.00012410059571266174, 0.00013861805200576782, 0.0001531355082988739, 0.00016765296459197998, 0.00018217042088508606, 0.00019668787717819214, 0.00021120533347129822, 0.0002257227897644043, 0.00024024024605751038, 0.00025475770235061646, 0.00026927515864372253, 0.0002837926149368286, 0.0002983100712299347, 0.00031282752752304077, 0.00032734498381614685, 0.00034186244010925293, 0.000356379896402359, 0.0003708973526954651, 0.00038541480898857117, 0.00039993226528167725, 0.0004144497215747833, 0.0004289671778678894, 0.0004434846341609955, 0.00045800209045410156]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 9.0, 5.0, 16.0, 19.0, 29.0, 31.0, 56.0, 64.0, 82.0, 78.0, 87.0, 109.0, 83.0, 74.0, 49.0, 57.0, 38.0, 27.0, 22.0, 13.0, 12.0, 9.0, 9.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0202484130859375, -0.019620656967163086, -0.018992900848388672, -0.018365144729614258, -0.017737388610839844, -0.01710963249206543, -0.016481876373291016, -0.0158541202545166, -0.015226364135742188, -0.014598608016967773, -0.01397085189819336, -0.013343095779418945, -0.012715339660644531, -0.012087583541870117, -0.011459827423095703, -0.010832071304321289, -0.010204315185546875, -0.009576559066772461, -0.008948802947998047, -0.008321046829223633, -0.007693290710449219, -0.007065534591674805, -0.006437778472900391, -0.0058100223541259766, -0.0051822662353515625, -0.0045545101165771484, -0.003926753997802734, -0.0032989978790283203, -0.0026712417602539062, -0.002043485641479492, -0.0014157295227050781, -0.0007879734039306641, -0.00016021728515625, 0.00046753883361816406, 0.0010952949523925781, 0.0017230510711669922, 0.0023508071899414062, 0.0029785633087158203, 0.0036063194274902344, 0.0042340755462646484, 0.0048618316650390625, 0.0054895877838134766, 0.006117343902587891, 0.006745100021362305, 0.007372856140136719, 0.008000612258911133, 0.008628368377685547, 0.009256124496459961, 0.009883880615234375, 0.010511636734008789, 0.011139392852783203, 0.011767148971557617, 0.012394905090332031, 0.013022661209106445, 0.01365041732788086, 0.014278173446655273, 0.014905929565429688, 0.015533685684204102, 0.016161441802978516, 0.01678919792175293, 0.017416954040527344, 0.018044710159301758, 0.018672466278076172, 0.019300222396850586, 0.019927978515625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 11.0, 10.0, 17.0, 34.0, 27.0, 33.0, 35.0, 75.0, 91.0, 118.0, 143.0, 292.0, 711.0, 2345.0, 14793.0, 4169319.0, 3907.0, 1144.0, 423.0, 191.0, 121.0, 101.0, 75.0, 56.0, 55.0, 31.0, 24.0, 27.0, 14.0, 17.0, 15.0, 5.0, 4.0, 1.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010328292846679688, -0.0010017156600952148, -0.0009706020355224609, -0.000939488410949707, -0.0009083747863769531, -0.0008772611618041992, -0.0008461475372314453, -0.0008150339126586914, -0.0007839202880859375, -0.0007528066635131836, -0.0007216930389404297, -0.0006905794143676758, -0.0006594657897949219, -0.000628352165222168, -0.0005972385406494141, -0.0005661249160766602, -0.0005350112915039062, -0.0005038976669311523, -0.00047278404235839844, -0.00044167041778564453, -0.0004105567932128906, -0.0003794431686401367, -0.0003483295440673828, -0.0003172159194946289, -0.000286102294921875, -0.0002549886703491211, -0.0002238750457763672, -0.00019276142120361328, -0.00016164779663085938, -0.00013053417205810547, -9.942054748535156e-05, -6.830692291259766e-05, -3.719329833984375e-05, -6.079673767089844e-06, 2.5033950805664062e-05, 5.614757537841797e-05, 8.726119995117188e-05, 0.00011837482452392578, 0.0001494884490966797, 0.0001806020736694336, 0.0002117156982421875, 0.0002428293228149414, 0.0002739429473876953, 0.0003050565719604492, 0.0003361701965332031, 0.00036728382110595703, 0.00039839744567871094, 0.00042951107025146484, 0.00046062469482421875, 0.0004917383193969727, 0.0005228519439697266, 0.0005539655685424805, 0.0005850791931152344, 0.0006161928176879883, 0.0006473064422607422, 0.0006784200668334961, 0.00070953369140625, 0.0007406473159790039, 0.0007717609405517578, 0.0008028745651245117, 0.0008339881896972656, 0.0008651018142700195, 0.0008962154388427734, 0.0009273290634155273, 0.0009584426879882812]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 22.0, 4028.0, 7.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012350082397460938, -0.00011544302105903625, -0.00010738521814346313, -9.932741522789001e-05, -9.12696123123169e-05, -8.321180939674377e-05, -7.515400648117065e-05, -6.709620356559753e-05, -5.9038400650024414e-05, -5.0980597734451294e-05, -4.2922794818878174e-05, -3.4864991903305054e-05, -2.6807188987731934e-05, -1.8749386072158813e-05, -1.0691583156585693e-05, -2.6337802410125732e-06, 5.424022674560547e-06, 1.3481825590133667e-05, 2.1539628505706787e-05, 2.9597431421279907e-05, 3.765523433685303e-05, 4.571303725242615e-05, 5.377084016799927e-05, 6.182864308357239e-05, 6.988644599914551e-05, 7.794424891471863e-05, 8.600205183029175e-05, 9.405985474586487e-05, 0.00010211765766143799, 0.00011017546057701111, 0.00011823326349258423, 0.00012629106640815735, 0.00013434886932373047, 0.0001424066722393036, 0.0001504644751548767, 0.00015852227807044983, 0.00016658008098602295, 0.00017463788390159607, 0.0001826956868171692, 0.0001907534897327423, 0.00019881129264831543, 0.00020686909556388855, 0.00021492689847946167, 0.0002229847013950348, 0.0002310425043106079, 0.00023910030722618103, 0.00024715811014175415, 0.00025521591305732727, 0.0002632737159729004, 0.0002713315188884735, 0.00027938932180404663, 0.00028744712471961975, 0.00029550492763519287, 0.000303562730550766, 0.0003116205334663391, 0.00031967833638191223, 0.00032773613929748535, 0.00033579394221305847, 0.0003438517451286316, 0.0003519095480442047, 0.00035996735095977783, 0.00036802515387535095, 0.00037608295679092407, 0.0003841407597064972, 0.0003921985626220703]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 26.0, 95.0, 577.0, 229.0, 60.0, 13.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003884966135956347, -0.0003482723259367049, -0.00030804803827777505, -0.0002678237797226757, -0.00022759949206374586, -0.00018737520440481603, -0.00014715093129780143, -0.00010692665819078684, -6.670237053185701e-05, -2.6478090148884803e-05, 1.3746190234087408e-05, 5.397047061705962e-05, 9.419475100003183e-05, 0.00013441903865896165, 0.00017464331176597625, 0.00021486758487299085, 0.00025509187253192067, 0.0002953161601908505, 0.0003355404478497803, 0.0003757647064048797, 0.0004159889940638095, 0.00045621328172273934, 0.0004964375402778387, 0.0005366618279367685, 0.0005768861155956984, 0.0006171104032546282, 0.000657334690913558, 0.0006975589785724878, 0.0007377832662314177, 0.0007780075538903475, 0.0008182317833416164, 0.0008584560710005462, 0.000898680416867137, 0.0009389047045260668, 0.0009791289921849966, 0.0010193532798439264, 0.0010595775675028563, 0.001099801855161786, 0.001140026142820716, 0.0011802504304796457, 0.0012204747181385756, 0.0012606990057975054, 0.0013009232934564352, 0.001341147581115365, 0.0013813718687742949, 0.0014215961564332247, 0.0014618204440921545, 0.0015020447317510843, 0.0015422689029946923, 0.0015824931906536222, 0.001622717478312552, 0.0016629417659714818, 0.0017031660536304116, 0.0017433903412893414, 0.0017836146289482713, 0.0018238388001918793, 0.001864063087850809, 0.001904287375509739, 0.0019445116631686687, 0.0019847359508275986, 0.0020249602384865284, 0.0020651845261454582, 0.002105408813804388, 0.002145633101463318, 0.0021858573891222477]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 10.0, 3.0, 10.0, 7.0, 7.0, 17.0, 14.0, 22.0, 17.0, 21.0, 29.0, 40.0, 41.0, 51.0, 44.0, 55.0, 48.0, 58.0, 46.0, 50.0, 43.0, 48.0, 49.0, 43.0, 42.0, 38.0, 30.0, 14.0, 16.0, 18.0, 20.0, 14.0, 7.0, 10.0, 5.0, 9.0, 0.0, 5.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.0003345012664794922, -0.0003262395039200783, -0.00031797774136066437, -0.00030971597880125046, -0.00030145421624183655, -0.00029319245368242264, -0.00028493069112300873, -0.0002766689285635948, -0.0002684071660041809, -0.000260145403444767, -0.0002518836408853531, -0.00024362187832593918, -0.00023536011576652527, -0.00022709835320711136, -0.00021883659064769745, -0.00021057482808828354, -0.00020231306552886963, -0.00019405130296945572, -0.0001857895404100418, -0.0001775277778506279, -0.000169266015291214, -0.00016100425273180008, -0.00015274249017238617, -0.00014448072761297226, -0.00013621896505355835, -0.00012795720249414444, -0.00011969543993473053, -0.00011143367737531662, -0.00010317191481590271, -9.49101522564888e-05, -8.664838969707489e-05, -7.838662713766098e-05, -7.012486457824707e-05, -6.186310201883316e-05, -5.360133945941925e-05, -4.533957690000534e-05, -3.707781434059143e-05, -2.881605178117752e-05, -2.055428922176361e-05, -1.2292526662349701e-05, -4.030764102935791e-06, 4.230998456478119e-06, 1.2492761015892029e-05, 2.075452357530594e-05, 2.901628613471985e-05, 3.727804869413376e-05, 4.553981125354767e-05, 5.380157381296158e-05, 6.206333637237549e-05, 7.03250989317894e-05, 7.858686149120331e-05, 8.684862405061722e-05, 9.511038661003113e-05, 0.00010337214916944504, 0.00011163391172885895, 0.00011989567428827286, 0.00012815743684768677, 0.00013641919940710068, 0.0001446809619665146, 0.0001529427245259285, 0.0001612044870853424, 0.00016946624964475632, 0.00017772801220417023, 0.00018598977476358414, 0.00019425153732299805]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 2.0, 9.0, 9.0, 5.0, 4.0, 14.0, 20.0, 30.0, 25.0, 48.0, 55.0, 88.0, 118.0, 147.0, 218.0, 357.0, 543.0, 823.0, 1406.0, 2450.0, 4724.0, 9321.0, 20529.0, 53369.0, 197486.0, 568318.0, 119003.0, 37587.0, 15288.0, 7251.0, 3593.0, 2154.0, 1236.0, 749.0, 486.0, 317.0, 229.0, 145.0, 108.0, 83.0, 46.0, 31.0, 33.0, 31.0, 21.0, 10.0, 6.0, 8.0, 9.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0], "bins": [-0.0214385986328125, -0.020775556564331055, -0.02011251449584961, -0.019449472427368164, -0.01878643035888672, -0.018123388290405273, -0.017460346221923828, -0.016797304153442383, -0.016134262084960938, -0.015471220016479492, -0.014808177947998047, -0.014145135879516602, -0.013482093811035156, -0.012819051742553711, -0.012156009674072266, -0.01149296760559082, -0.010829925537109375, -0.01016688346862793, -0.009503841400146484, -0.008840799331665039, -0.008177757263183594, -0.0075147151947021484, -0.006851673126220703, -0.006188631057739258, -0.0055255889892578125, -0.004862546920776367, -0.004199504852294922, -0.0035364627838134766, -0.0028734207153320312, -0.002210378646850586, -0.0015473365783691406, -0.0008842945098876953, -0.00022125244140625, 0.0004417896270751953, 0.0011048316955566406, 0.001767873764038086, 0.0024309158325195312, 0.0030939579010009766, 0.003756999969482422, 0.004420042037963867, 0.0050830841064453125, 0.005746126174926758, 0.006409168243408203, 0.0070722103118896484, 0.007735252380371094, 0.008398294448852539, 0.009061336517333984, 0.00972437858581543, 0.010387420654296875, 0.01105046272277832, 0.011713504791259766, 0.012376546859741211, 0.013039588928222656, 0.013702630996704102, 0.014365673065185547, 0.015028715133666992, 0.015691757202148438, 0.016354799270629883, 0.017017841339111328, 0.017680883407592773, 0.01834392547607422, 0.019006967544555664, 0.01967000961303711, 0.020333051681518555, 0.02099609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 5.0, 10.0, 4.0, 16.0, 19.0, 30.0, 30.0, 57.0, 63.0, 83.0, 79.0, 85.0, 109.0, 84.0, 74.0, 51.0, 56.0, 36.0, 27.0, 22.0, 13.0, 12.0, 9.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.020233154296875, -0.019605636596679688, -0.018978118896484375, -0.018350601196289062, -0.01772308349609375, -0.017095565795898438, -0.016468048095703125, -0.015840530395507812, -0.0152130126953125, -0.014585494995117188, -0.013957977294921875, -0.013330459594726562, -0.01270294189453125, -0.012075424194335938, -0.011447906494140625, -0.010820388793945312, -0.01019287109375, -0.009565353393554688, -0.008937835693359375, -0.008310317993164062, -0.00768280029296875, -0.0070552825927734375, -0.006427764892578125, -0.0058002471923828125, -0.0051727294921875, -0.0045452117919921875, -0.003917694091796875, -0.0032901763916015625, -0.00266265869140625, -0.0020351409912109375, -0.001407623291015625, -0.0007801055908203125, -0.000152587890625, 0.0004749298095703125, 0.001102447509765625, 0.0017299652099609375, 0.00235748291015625, 0.0029850006103515625, 0.003612518310546875, 0.0042400360107421875, 0.0048675537109375, 0.0054950714111328125, 0.006122589111328125, 0.0067501068115234375, 0.00737762451171875, 0.008005142211914062, 0.008632659912109375, 0.009260177612304688, 0.0098876953125, 0.010515213012695312, 0.011142730712890625, 0.011770248413085938, 0.01239776611328125, 0.013025283813476562, 0.013652801513671875, 0.014280319213867188, 0.0149078369140625, 0.015535354614257812, 0.016162872314453125, 0.016790390014648438, 0.01741790771484375, 0.018045425415039062, 0.018672943115234375, 0.019300460815429688, 0.019927978515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 11.0, 6.0, 13.0, 12.0, 14.0, 18.0, 17.0, 31.0, 38.0, 44.0, 70.0, 104.0, 148.0, 301.0, 734.0, 3476.0, 91051.0, 935994.0, 13895.0, 1472.0, 443.0, 211.0, 118.0, 72.0, 54.0, 42.0, 38.0, 30.0, 17.0, 12.0, 14.0, 16.0, 9.0, 4.0, 3.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07122802734375, -0.06894969940185547, -0.06667137145996094, -0.0643930435180664, -0.062114715576171875, -0.059836387634277344, -0.05755805969238281, -0.05527973175048828, -0.05300140380859375, -0.05072307586669922, -0.04844474792480469, -0.046166419982910156, -0.043888092041015625, -0.041609764099121094, -0.03933143615722656, -0.03705310821533203, -0.0347747802734375, -0.03249645233154297, -0.030218124389648438, -0.027939796447753906, -0.025661468505859375, -0.023383140563964844, -0.021104812622070312, -0.01882648468017578, -0.01654815673828125, -0.014269828796386719, -0.011991500854492188, -0.009713172912597656, -0.007434844970703125, -0.005156517028808594, -0.0028781890869140625, -0.0005998611450195312, 0.001678466796875, 0.003956794738769531, 0.0062351226806640625, 0.008513450622558594, 0.010791778564453125, 0.013070106506347656, 0.015348434448242188, 0.01762676239013672, 0.01990509033203125, 0.02218341827392578, 0.024461746215820312, 0.026740074157714844, 0.029018402099609375, 0.031296730041503906, 0.03357505798339844, 0.03585338592529297, 0.0381317138671875, 0.04041004180908203, 0.04268836975097656, 0.044966697692871094, 0.047245025634765625, 0.049523353576660156, 0.05180168151855469, 0.05408000946044922, 0.05635833740234375, 0.05863666534423828, 0.06091499328613281, 0.06319332122802734, 0.06547164916992188, 0.0677499771118164, 0.07002830505371094, 0.07230663299560547, 0.0745849609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 9.0, 9.0, 11.0, 16.0, 12.0, 20.0, 23.0, 21.0, 29.0, 27.0, 36.0, 27.0, 36.0, 38.0, 45.0, 37.0, 38.0, 35.0, 24.0, 45.0, 41.0, 33.0, 45.0, 37.0, 42.0, 20.0, 27.0, 27.0, 28.0, 21.0, 14.0, 18.0, 16.0, 19.0, 14.0, 7.0, 11.0, 4.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.038848876953125, -0.03767251968383789, -0.03649616241455078, -0.03531980514526367, -0.03414344787597656, -0.03296709060668945, -0.031790733337402344, -0.030614376068115234, -0.029438018798828125, -0.028261661529541016, -0.027085304260253906, -0.025908946990966797, -0.024732589721679688, -0.023556232452392578, -0.02237987518310547, -0.02120351791381836, -0.02002716064453125, -0.01885080337524414, -0.01767444610595703, -0.016498088836669922, -0.015321731567382812, -0.014145374298095703, -0.012969017028808594, -0.011792659759521484, -0.010616302490234375, -0.009439945220947266, -0.008263587951660156, -0.007087230682373047, -0.0059108734130859375, -0.004734516143798828, -0.0035581588745117188, -0.0023818016052246094, -0.0012054443359375, -2.9087066650390625e-05, 0.0011472702026367188, 0.002323627471923828, 0.0034999847412109375, 0.004676342010498047, 0.005852699279785156, 0.007029056549072266, 0.008205413818359375, 0.009381771087646484, 0.010558128356933594, 0.011734485626220703, 0.012910842895507812, 0.014087200164794922, 0.015263557434082031, 0.01643991470336914, 0.01761627197265625, 0.01879262924194336, 0.01996898651123047, 0.021145343780517578, 0.022321701049804688, 0.023498058319091797, 0.024674415588378906, 0.025850772857666016, 0.027027130126953125, 0.028203487396240234, 0.029379844665527344, 0.030556201934814453, 0.03173255920410156, 0.03290891647338867, 0.03408527374267578, 0.03526163101196289, 0.03643798828125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 6.0, 8.0, 18.0, 14.0, 17.0, 14.0, 34.0, 53.0, 107.0, 257.0, 2400.0, 1032287.0, 12558.0, 437.0, 117.0, 69.0, 30.0, 28.0, 15.0, 18.0, 12.0, 7.0, 7.0, 5.0, 6.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01131439208984375, -0.010919928550720215, -0.01052546501159668, -0.010131001472473145, -0.00973653793334961, -0.009342074394226074, -0.008947610855102539, -0.008553147315979004, -0.008158683776855469, -0.007764220237731934, -0.0073697566986083984, -0.006975293159484863, -0.006580829620361328, -0.006186366081237793, -0.005791902542114258, -0.005397439002990723, -0.0050029754638671875, -0.004608511924743652, -0.004214048385620117, -0.003819584846496582, -0.003425121307373047, -0.0030306577682495117, -0.0026361942291259766, -0.0022417306900024414, -0.0018472671508789062, -0.001452803611755371, -0.001058340072631836, -0.0006638765335083008, -0.0002694129943847656, 0.00012505054473876953, 0.0005195140838623047, 0.0009139776229858398, 0.001308441162109375, 0.0017029047012329102, 0.0020973682403564453, 0.0024918317794799805, 0.0028862953186035156, 0.0032807588577270508, 0.003675222396850586, 0.004069685935974121, 0.004464149475097656, 0.004858613014221191, 0.0052530765533447266, 0.005647540092468262, 0.006042003631591797, 0.006436467170715332, 0.006830930709838867, 0.007225394248962402, 0.0076198577880859375, 0.008014321327209473, 0.008408784866333008, 0.008803248405456543, 0.009197711944580078, 0.009592175483703613, 0.009986639022827148, 0.010381102561950684, 0.010775566101074219, 0.011170029640197754, 0.011564493179321289, 0.011958956718444824, 0.01235342025756836, 0.012747883796691895, 0.01314234733581543, 0.013536810874938965, 0.0139312744140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 4.0, 12.0, 3.0, 4.0, 19.0, 45.0, 490.0, 322.0, 37.0, 9.0, 15.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00037860870361328125, -0.00036710500717163086, -0.00035560131072998047, -0.0003440976142883301, -0.0003325939178466797, -0.0003210902214050293, -0.0003095865249633789, -0.0002980828285217285, -0.0002865791320800781, -0.00027507543563842773, -0.00026357173919677734, -0.00025206804275512695, -0.00024056434631347656, -0.00022906064987182617, -0.00021755695343017578, -0.0002060532569885254, -0.000194549560546875, -0.0001830458641052246, -0.00017154216766357422, -0.00016003847122192383, -0.00014853477478027344, -0.00013703107833862305, -0.00012552738189697266, -0.00011402368545532227, -0.00010251998901367188, -9.101629257202148e-05, -7.95125961303711e-05, -6.80088996887207e-05, -5.650520324707031e-05, -4.500150680541992e-05, -3.349781036376953e-05, -2.199411392211914e-05, -1.049041748046875e-05, 1.0132789611816406e-06, 1.2516975402832031e-05, 2.4020671844482422e-05, 3.552436828613281e-05, 4.70280647277832e-05, 5.8531761169433594e-05, 7.003545761108398e-05, 8.153915405273438e-05, 9.304285049438477e-05, 0.00010454654693603516, 0.00011605024337768555, 0.00012755393981933594, 0.00013905763626098633, 0.00015056133270263672, 0.0001620650291442871, 0.0001735687255859375, 0.0001850724220275879, 0.00019657611846923828, 0.00020807981491088867, 0.00021958351135253906, 0.00023108720779418945, 0.00024259090423583984, 0.00025409460067749023, 0.0002655982971191406, 0.000277101993560791, 0.0002886056900024414, 0.0003001093864440918, 0.0003116130828857422, 0.0003231167793273926, 0.00033462047576904297, 0.00034612417221069336, 0.00035762786865234375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 8.0, 9.0, 10.0, 9.0, 14.0, 25.0, 31.0, 64.0, 87.0, 217.0, 878.0, 12391.0, 1024568.0, 9044.0, 724.0, 216.0, 97.0, 52.0, 25.0, 16.0, 12.0, 12.0, 11.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.01509857177734375, -0.014684438705444336, -0.014270305633544922, -0.013856172561645508, -0.013442039489746094, -0.01302790641784668, -0.012613773345947266, -0.012199640274047852, -0.011785507202148438, -0.011371374130249023, -0.01095724105834961, -0.010543107986450195, -0.010128974914550781, -0.009714841842651367, -0.009300708770751953, -0.008886575698852539, -0.008472442626953125, -0.008058309555053711, -0.007644176483154297, -0.007230043411254883, -0.006815910339355469, -0.006401777267456055, -0.005987644195556641, -0.0055735111236572266, -0.0051593780517578125, -0.0047452449798583984, -0.004331111907958984, -0.00391697883605957, -0.0035028457641601562, -0.003088712692260742, -0.002674579620361328, -0.002260446548461914, -0.0018463134765625, -0.001432180404663086, -0.0010180473327636719, -0.0006039142608642578, -0.00018978118896484375, 0.0002243518829345703, 0.0006384849548339844, 0.0010526180267333984, 0.0014667510986328125, 0.0018808841705322266, 0.0022950172424316406, 0.0027091503143310547, 0.0031232833862304688, 0.003537416458129883, 0.003951549530029297, 0.004365682601928711, 0.004779815673828125, 0.005193948745727539, 0.005608081817626953, 0.006022214889526367, 0.006436347961425781, 0.006850481033325195, 0.007264614105224609, 0.0076787471771240234, 0.008092880249023438, 0.008507013320922852, 0.008921146392822266, 0.00933527946472168, 0.009749412536621094, 0.010163545608520508, 0.010577678680419922, 0.010991811752319336, 0.01140594482421875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 11.0, 3.0, 5.0, 11.0, 7.0, 16.0, 31.0, 41.0, 68.0, 201.0, 271.0, 135.0, 78.0, 32.0, 21.0, 14.0, 14.0, 7.0, 5.0, 2.0, 10.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00937652587890625, -0.009095072746276855, -0.008813619613647461, -0.008532166481018066, -0.008250713348388672, -0.007969260215759277, -0.007687807083129883, -0.007406353950500488, -0.007124900817871094, -0.006843447685241699, -0.006561994552612305, -0.00628054141998291, -0.005999088287353516, -0.005717635154724121, -0.0054361820220947266, -0.005154728889465332, -0.0048732757568359375, -0.004591822624206543, -0.0043103694915771484, -0.004028916358947754, -0.0037474632263183594, -0.003466010093688965, -0.0031845569610595703, -0.0029031038284301758, -0.0026216506958007812, -0.0023401975631713867, -0.002058744430541992, -0.0017772912979125977, -0.0014958381652832031, -0.0012143850326538086, -0.0009329319000244141, -0.0006514787673950195, -0.000370025634765625, -8.857250213623047e-05, 0.00019288063049316406, 0.0004743337631225586, 0.0007557868957519531, 0.0010372400283813477, 0.0013186931610107422, 0.0016001462936401367, 0.0018815994262695312, 0.0021630525588989258, 0.0024445056915283203, 0.002725958824157715, 0.0030074119567871094, 0.003288865089416504, 0.0035703182220458984, 0.003851771354675293, 0.0041332244873046875, 0.004414677619934082, 0.0046961307525634766, 0.004977583885192871, 0.005259037017822266, 0.00554049015045166, 0.005821943283081055, 0.006103396415710449, 0.006384849548339844, 0.006666302680969238, 0.006947755813598633, 0.007229208946228027, 0.007510662078857422, 0.007792115211486816, 0.008073568344116211, 0.008355021476745605, 0.008636474609375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 22.0, 176.0, 757.0, 49.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5261597037315369, -0.49573713541030884, -0.4653145372867584, -0.4348919689655304, -0.40446937084198, -0.37404680252075195, -0.3436242341995239, -0.3132016658782959, -0.2827790677547455, -0.25235649943351746, -0.22193390130996704, -0.191511332988739, -0.1610887497663498, -0.13066616654396057, -0.10024359822273254, -0.06982101500034332, -0.0393984317779541, -0.008975852280855179, 0.021446727216243744, 0.05186930298805237, 0.08229188621044159, 0.11271446943283081, 0.14313703775405884, 0.17355962097644806, 0.20398220419883728, 0.2344047874212265, 0.2648273706436157, 0.29524993896484375, 0.3256725072860718, 0.3560951054096222, 0.3865176737308502, 0.41694027185440063, 0.4473627805709839, 0.4777853488922119, 0.5082079172134399, 0.538630485534668, 0.5690531134605408, 0.5994756817817688, 0.6298982501029968, 0.6603208184242249, 0.6907434463500977, 0.7211660146713257, 0.7515885829925537, 0.7820111513137817, 0.8124337792396545, 0.8428563475608826, 0.8732789158821106, 0.9037014842033386, 0.9341240525245667, 0.9645466208457947, 0.9949691891670227, 1.0253918170928955, 1.0558143854141235, 1.0862369537353516, 1.1166595220565796, 1.1470820903778076, 1.1775046586990356, 1.2079272270202637, 1.2383497953414917, 1.2687723636627197, 1.2991949319839478, 1.3296175003051758, 1.3600401878356934, 1.3904627561569214, 1.4208853244781494]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 7.0, 3.0, 9.0, 4.0, 9.0, 18.0, 11.0, 10.0, 21.0, 21.0, 16.0, 25.0, 36.0, 38.0, 33.0, 40.0, 45.0, 48.0, 44.0, 54.0, 58.0, 44.0, 58.0, 37.0, 21.0, 35.0, 42.0, 25.0, 31.0, 27.0, 24.0, 22.0, 12.0, 14.0, 19.0, 10.0, 5.0, 4.0, 5.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1732161045074463, -0.16705545783042908, -0.16089482605457306, -0.15473417937755585, -0.14857354760169983, -0.14241290092468262, -0.1362522542476654, -0.1300916075706482, -0.12393097579479218, -0.11777033656835556, -0.11160969734191895, -0.10544905066490173, -0.09928841143846512, -0.0931277722120285, -0.08696712553501129, -0.08080648630857468, -0.07464584708213806, -0.06848520785570145, -0.06232456490397453, -0.05616392195224762, -0.050003282725811005, -0.04384264349937439, -0.037682000547647476, -0.03152135759592056, -0.025360718369483948, -0.019200077280402184, -0.01303943619132042, -0.006878795102238655, -0.0007181540131568909, 0.005442487075924873, 0.011603128165006638, 0.01776377111673355, 0.023924410343170166, 0.03008505143225193, 0.036245692521333694, 0.04240633547306061, 0.04856697469949722, 0.05472761392593384, 0.06088825687766075, 0.06704889982938766, 0.07320953905582428, 0.0793701782822609, 0.08553081750869751, 0.09169146418571472, 0.09785210341215134, 0.10401274263858795, 0.11017338931560516, 0.11633402854204178, 0.1224946677684784, 0.1286553144454956, 0.13481594622135162, 0.14097659289836884, 0.14713722467422485, 0.15329787135124207, 0.15945851802825928, 0.1656191647052765, 0.1717797964811325, 0.17794044315814972, 0.18410107493400574, 0.19026172161102295, 0.19642236828804016, 0.20258300006389618, 0.2087436467409134, 0.2149042785167694, 0.22106492519378662]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 4.0, 8.0, 11.0, 23.0, 36.0, 55.0, 51.0, 90.0, 167.0, 506.0, 1952.0, 4169092.0, 20328.0, 1239.0, 319.0, 140.0, 76.0, 41.0, 37.0, 26.0, 19.0, 12.0, 5.0, 9.0, 8.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005279541015625, -0.005102813243865967, -0.004926085472106934, -0.0047493577003479, -0.004572629928588867, -0.004395902156829834, -0.004219174385070801, -0.004042446613311768, -0.0038657188415527344, -0.003688991069793701, -0.003512263298034668, -0.0033355355262756348, -0.0031588077545166016, -0.0029820799827575684, -0.002805352210998535, -0.002628624439239502, -0.0024518966674804688, -0.0022751688957214355, -0.0020984411239624023, -0.0019217133522033691, -0.001744985580444336, -0.0015682578086853027, -0.0013915300369262695, -0.0012148022651672363, -0.0010380744934082031, -0.0008613467216491699, -0.0006846189498901367, -0.0005078911781311035, -0.0003311634063720703, -0.0001544356346130371, 2.2292137145996094e-05, 0.0001990199089050293, 0.0003757476806640625, 0.0005524754524230957, 0.0007292032241821289, 0.0009059309959411621, 0.0010826587677001953, 0.0012593865394592285, 0.0014361143112182617, 0.001612842082977295, 0.0017895698547363281, 0.0019662976264953613, 0.0021430253982543945, 0.0023197531700134277, 0.002496480941772461, 0.002673208713531494, 0.0028499364852905273, 0.0030266642570495605, 0.0032033920288085938, 0.003380119800567627, 0.00355684757232666, 0.0037335753440856934, 0.0039103031158447266, 0.00408703088760376, 0.004263758659362793, 0.004440486431121826, 0.004617214202880859, 0.004793941974639893, 0.004970669746398926, 0.005147397518157959, 0.005324125289916992, 0.005500853061676025, 0.005677580833435059, 0.005854308605194092, 0.006031036376953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 19.0, 14.0, 37.0, 27.0, 37.0, 51.0, 80.0, 75.0, 75.0, 99.0, 97.0, 82.0, 59.0, 71.0, 40.0, 32.0, 17.0, 24.0, 11.0, 11.0, 6.0, 11.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0186920166015625, -0.018103837966918945, -0.01751565933227539, -0.016927480697631836, -0.01633930206298828, -0.015751123428344727, -0.015162944793701172, -0.014574766159057617, -0.013986587524414062, -0.013398408889770508, -0.012810230255126953, -0.012222051620483398, -0.011633872985839844, -0.011045694351196289, -0.010457515716552734, -0.00986933708190918, -0.009281158447265625, -0.00869297981262207, -0.008104801177978516, -0.007516622543334961, -0.006928443908691406, -0.0063402652740478516, -0.005752086639404297, -0.005163908004760742, -0.0045757293701171875, -0.003987550735473633, -0.003399372100830078, -0.0028111934661865234, -0.0022230148315429688, -0.001634836196899414, -0.0010466575622558594, -0.0004584789276123047, 0.00012969970703125, 0.0007178783416748047, 0.0013060569763183594, 0.001894235610961914, 0.0024824142456054688, 0.0030705928802490234, 0.003658771514892578, 0.004246950149536133, 0.0048351287841796875, 0.005423307418823242, 0.006011486053466797, 0.0065996646881103516, 0.007187843322753906, 0.007776021957397461, 0.008364200592041016, 0.00895237922668457, 0.009540557861328125, 0.01012873649597168, 0.010716915130615234, 0.011305093765258789, 0.011893272399902344, 0.012481451034545898, 0.013069629669189453, 0.013657808303833008, 0.014245986938476562, 0.014834165573120117, 0.015422344207763672, 0.016010522842407227, 0.01659870147705078, 0.017186880111694336, 0.01777505874633789, 0.018363237380981445, 0.018951416015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 4.0, 5.0, 16.0, 17.0, 22.0, 19.0, 20.0, 19.0, 29.0, 25.0, 25.0, 36.0, 43.0, 49.0, 80.0, 179.0, 560.0, 3100.0, 4176375.0, 11904.0, 1013.0, 297.0, 112.0, 50.0, 33.0, 36.0, 22.0, 38.0, 24.0, 15.0, 14.0, 22.0, 18.0, 10.0, 15.0, 6.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.005706787109375, -0.005547046661376953, -0.005387306213378906, -0.005227565765380859, -0.0050678253173828125, -0.004908084869384766, -0.004748344421386719, -0.004588603973388672, -0.004428863525390625, -0.004269123077392578, -0.004109382629394531, -0.003949642181396484, -0.0037899017333984375, -0.0036301612854003906, -0.0034704208374023438, -0.003310680389404297, -0.00315093994140625, -0.002991199493408203, -0.0028314590454101562, -0.0026717185974121094, -0.0025119781494140625, -0.0023522377014160156, -0.0021924972534179688, -0.002032756805419922, -0.001873016357421875, -0.0017132759094238281, -0.0015535354614257812, -0.0013937950134277344, -0.0012340545654296875, -0.0010743141174316406, -0.0009145736694335938, -0.0007548332214355469, -0.0005950927734375, -0.0004353523254394531, -0.00027561187744140625, -0.00011587142944335938, 4.38690185546875e-05, 0.00020360946655273438, 0.00036334991455078125, 0.0005230903625488281, 0.000682830810546875, 0.0008425712585449219, 0.0010023117065429688, 0.0011620521545410156, 0.0013217926025390625, 0.0014815330505371094, 0.0016412734985351562, 0.0018010139465332031, 0.00196075439453125, 0.002120494842529297, 0.0022802352905273438, 0.0024399757385253906, 0.0025997161865234375, 0.0027594566345214844, 0.0029191970825195312, 0.003078937530517578, 0.003238677978515625, 0.003398418426513672, 0.0035581588745117188, 0.0037178993225097656, 0.0038776397705078125, 0.004037380218505859, 0.004197120666503906, 0.004356861114501953, 0.0045166015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 8.0, 20.0, 4015.0, 32.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005016326904296875, -0.004924491047859192, -0.004832655191421509, -0.004740819334983826, -0.004648983478546143, -0.0045571476221084595, -0.004465311765670776, -0.004373475909233093, -0.00428164005279541, -0.004189804196357727, -0.004097968339920044, -0.004006132483482361, -0.003914296627044678, -0.0038224607706069946, -0.0037306249141693115, -0.0036387890577316284, -0.0035469532012939453, -0.003455117344856262, -0.003363281488418579, -0.003271445631980896, -0.003179609775543213, -0.00308777391910553, -0.0029959380626678467, -0.0029041022062301636, -0.0028122663497924805, -0.0027204304933547974, -0.0026285946369171143, -0.002536758780479431, -0.002444922924041748, -0.002353087067604065, -0.002261251211166382, -0.0021694153547286987, -0.0020775794982910156, -0.0019857436418533325, -0.0018939077854156494, -0.0018020719289779663, -0.0017102360725402832, -0.0016184002161026, -0.001526564359664917, -0.0014347285032272339, -0.0013428926467895508, -0.0012510567903518677, -0.0011592209339141846, -0.0010673850774765015, -0.0009755492210388184, -0.0008837133646011353, -0.0007918775081634521, -0.000700041651725769, -0.0006082057952880859, -0.0005163699388504028, -0.0004245340824127197, -0.0003326982259750366, -0.00024086236953735352, -0.0001490265130996704, -5.7190656661987305e-05, 3.46451997756958e-05, 0.0001264810562133789, 0.000218316912651062, 0.0003101527690887451, 0.0004019886255264282, 0.0004938244819641113, 0.0005856603384017944, 0.0006774961948394775, 0.0007693320512771606, 0.0008611679077148438]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 10.0, 25.0, 52.0, 174.0, 507.0, 158.0, 51.0, 17.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006068538874387741, -0.005855209659785032, -0.0056418804451823235, -0.005428551230579615, -0.005215222015976906, -0.005001893267035484, -0.0047885640524327755, -0.004575234837830067, -0.004361905623227358, -0.004148576408624649, -0.00393524719402194, -0.003721918212249875, -0.0035085889976471663, -0.0032952597830444574, -0.0030819308012723923, -0.0028686015866696835, -0.0026552723720669746, -0.002441943157464266, -0.002228613942861557, -0.002015284961089492, -0.001801955746486783, -0.0015886265318840742, -0.0013752974336966872, -0.0011619683355093002, -0.0009486391209065914, -0.0007353099645115435, -0.0005219808081164956, -0.0003086516517214477, -9.53224953263998e-05, 0.00011800671927630901, 0.000331335817463696, 0.000544664915651083, 0.0007579936645925045, 0.0009713228209875524, 0.0011846519773826003, 0.0013979810755699873, 0.0016113102901726961, 0.001824639504775405, 0.00203796848654747, 0.002251297701150179, 0.0024646269157528877, 0.0026779561303555965, 0.0028912853449583054, 0.0031046143267303705, 0.0033179435413330793, 0.003531272755935788, 0.0037446017377078533, 0.003957930952310562, 0.004171260166913271, 0.00438458938151598, 0.004597918596118689, 0.004811247810721397, 0.005024576559662819, 0.005237906239926815, 0.0054512349888682365, 0.005664564203470945, 0.005877893418073654, 0.006091222632676363, 0.006304551847279072, 0.006517881061881781, 0.0067312102764844894, 0.006944539025425911, 0.00715786824002862, 0.007371197454631329, 0.007584526669234037]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 8.0, 4.0, 7.0, 10.0, 14.0, 29.0, 46.0, 62.0, 87.0, 85.0, 115.0, 129.0, 127.0, 89.0, 63.0, 36.0, 30.0, 22.0, 12.0, 9.0, 6.0, 6.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.009160101413726807, -0.008966248482465744, -0.008772395551204681, -0.008578542619943619, -0.008384689688682556, -0.008190836757421494, -0.007996983826160431, -0.007803130894899368, -0.007609277963638306, -0.007415425032377243, -0.00722157210111618, -0.007027719169855118, -0.006833866238594055, -0.0066400133073329926, -0.00644616037607193, -0.006252307444810867, -0.006058454513549805, -0.005864601582288742, -0.0056707486510276794, -0.005476895719766617, -0.005283042788505554, -0.005089189857244492, -0.004895336925983429, -0.004701483994722366, -0.004507631063461304, -0.004313778132200241, -0.0041199252009391785, -0.003926072269678116, -0.0037322193384170532, -0.0035383664071559906, -0.003344513475894928, -0.0031506605446338654, -0.0029568076133728027, -0.00276295468211174, -0.0025691017508506775, -0.002375248819589615, -0.0021813958883285522, -0.0019875429570674896, -0.001793690025806427, -0.0015998370945453644, -0.0014059841632843018, -0.0012121312320232391, -0.0010182783007621765, -0.0008244253695011139, -0.0006305724382400513, -0.00043671950697898865, -0.00024286657571792603, -4.90136444568634e-05, 0.00014483928680419922, 0.00033869221806526184, 0.0005325451493263245, 0.0007263980805873871, 0.0009202510118484497, 0.0011141039431095123, 0.001307956874370575, 0.0015018098056316376, 0.0016956627368927002, 0.0018895156681537628, 0.0020833685994148254, 0.002277221530675888, 0.0024710744619369507, 0.0026649273931980133, 0.002858780324459076, 0.0030526332557201385, 0.003246486186981201]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 8.0, 9.0, 8.0, 16.0, 18.0, 46.0, 55.0, 87.0, 150.0, 227.0, 474.0, 827.0, 1846.0, 4931.0, 16907.0, 100527.0, 781190.0, 114025.0, 18087.0, 5036.0, 2029.0, 907.0, 482.0, 248.0, 135.0, 74.0, 60.0, 40.0, 35.0, 16.0, 11.0, 4.0, 12.0, 10.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03863525390625, -0.03740978240966797, -0.03618431091308594, -0.034958839416503906, -0.033733367919921875, -0.032507896423339844, -0.03128242492675781, -0.03005695343017578, -0.02883148193359375, -0.02760601043701172, -0.026380538940429688, -0.025155067443847656, -0.023929595947265625, -0.022704124450683594, -0.021478652954101562, -0.02025318145751953, -0.0190277099609375, -0.01780223846435547, -0.016576766967773438, -0.015351295471191406, -0.014125823974609375, -0.012900352478027344, -0.011674880981445312, -0.010449409484863281, -0.00922393798828125, -0.007998466491699219, -0.0067729949951171875, -0.005547523498535156, -0.004322052001953125, -0.0030965805053710938, -0.0018711090087890625, -0.0006456375122070312, 0.000579833984375, 0.0018053054809570312, 0.0030307769775390625, 0.004256248474121094, 0.005481719970703125, 0.006707191467285156, 0.007932662963867188, 0.009158134460449219, 0.01038360595703125, 0.011609077453613281, 0.012834548950195312, 0.014060020446777344, 0.015285491943359375, 0.016510963439941406, 0.017736434936523438, 0.01896190643310547, 0.0201873779296875, 0.02141284942626953, 0.022638320922851562, 0.023863792419433594, 0.025089263916015625, 0.026314735412597656, 0.027540206909179688, 0.02876567840576172, 0.02999114990234375, 0.03121662139892578, 0.03244209289550781, 0.033667564392089844, 0.034893035888671875, 0.036118507385253906, 0.03734397888183594, 0.03856945037841797, 0.039794921875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 18.0, 17.0, 34.0, 32.0, 31.0, 56.0, 81.0, 69.0, 79.0, 96.0, 103.0, 78.0, 64.0, 64.0, 43.0, 31.0, 17.0, 25.0, 10.0, 11.0, 6.0, 10.0, 5.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0186920166015625, -0.018103837966918945, -0.01751565933227539, -0.016927480697631836, -0.01633930206298828, -0.015751123428344727, -0.015162944793701172, -0.014574766159057617, -0.013986587524414062, -0.013398408889770508, -0.012810230255126953, -0.012222051620483398, -0.011633872985839844, -0.011045694351196289, -0.010457515716552734, -0.00986933708190918, -0.009281158447265625, -0.00869297981262207, -0.008104801177978516, -0.007516622543334961, -0.006928443908691406, -0.0063402652740478516, -0.005752086639404297, -0.005163908004760742, -0.0045757293701171875, -0.003987550735473633, -0.003399372100830078, -0.0028111934661865234, -0.0022230148315429688, -0.001634836196899414, -0.0010466575622558594, -0.0004584789276123047, 0.00012969970703125, 0.0007178783416748047, 0.0013060569763183594, 0.001894235610961914, 0.0024824142456054688, 0.0030705928802490234, 0.003658771514892578, 0.004246950149536133, 0.0048351287841796875, 0.005423307418823242, 0.006011486053466797, 0.0065996646881103516, 0.007187843322753906, 0.007776021957397461, 0.008364200592041016, 0.00895237922668457, 0.009540557861328125, 0.01012873649597168, 0.010716915130615234, 0.011305093765258789, 0.011893272399902344, 0.012481451034545898, 0.013069629669189453, 0.013657808303833008, 0.014245986938476562, 0.014834165573120117, 0.015422344207763672, 0.016010522842407227, 0.01659870147705078, 0.017186880111694336, 0.01777505874633789, 0.018363237380981445, 0.018951416015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 10.0, 7.0, 13.0, 10.0, 10.0, 10.0, 20.0, 21.0, 26.0, 47.0, 73.0, 95.0, 163.0, 295.0, 550.0, 1361.0, 5705.0, 69024.0, 901414.0, 62072.0, 5017.0, 1241.0, 563.0, 285.0, 165.0, 72.0, 84.0, 43.0, 34.0, 22.0, 19.0, 11.0, 17.0, 9.0, 20.0, 12.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.051788330078125, -0.050328731536865234, -0.04886913299560547, -0.0474095344543457, -0.04594993591308594, -0.04449033737182617, -0.043030738830566406, -0.04157114028930664, -0.040111541748046875, -0.03865194320678711, -0.037192344665527344, -0.03573274612426758, -0.03427314758300781, -0.03281354904174805, -0.03135395050048828, -0.029894351959228516, -0.02843475341796875, -0.026975154876708984, -0.02551555633544922, -0.024055957794189453, -0.022596359252929688, -0.021136760711669922, -0.019677162170410156, -0.01821756362915039, -0.016757965087890625, -0.01529836654663086, -0.013838768005371094, -0.012379169464111328, -0.010919570922851562, -0.009459972381591797, -0.008000373840332031, -0.006540775299072266, -0.0050811767578125, -0.0036215782165527344, -0.0021619796752929688, -0.0007023811340332031, 0.0007572174072265625, 0.002216815948486328, 0.0036764144897460938, 0.005136013031005859, 0.006595611572265625, 0.00805521011352539, 0.009514808654785156, 0.010974407196044922, 0.012434005737304688, 0.013893604278564453, 0.015353202819824219, 0.016812801361083984, 0.01827239990234375, 0.019731998443603516, 0.02119159698486328, 0.022651195526123047, 0.024110794067382812, 0.025570392608642578, 0.027029991149902344, 0.02848958969116211, 0.029949188232421875, 0.03140878677368164, 0.032868385314941406, 0.03432798385620117, 0.03578758239746094, 0.0372471809387207, 0.03870677947998047, 0.040166378021240234, 0.0416259765625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 6.0, 11.0, 9.0, 12.0, 11.0, 22.0, 14.0, 14.0, 20.0, 21.0, 43.0, 31.0, 36.0, 35.0, 39.0, 53.0, 42.0, 56.0, 42.0, 52.0, 42.0, 48.0, 50.0, 43.0, 40.0, 40.0, 30.0, 14.0, 26.0, 20.0, 19.0, 16.0, 9.0, 8.0, 9.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04437255859375, -0.043074607849121094, -0.04177665710449219, -0.04047870635986328, -0.039180755615234375, -0.03788280487060547, -0.03658485412597656, -0.035286903381347656, -0.03398895263671875, -0.032691001892089844, -0.03139305114746094, -0.03009510040283203, -0.028797149658203125, -0.02749919891357422, -0.026201248168945312, -0.024903297424316406, -0.0236053466796875, -0.022307395935058594, -0.021009445190429688, -0.01971149444580078, -0.018413543701171875, -0.01711559295654297, -0.015817642211914062, -0.014519691467285156, -0.01322174072265625, -0.011923789978027344, -0.010625839233398438, -0.009327888488769531, -0.008029937744140625, -0.006731986999511719, -0.0054340362548828125, -0.004136085510253906, -0.002838134765625, -0.0015401840209960938, -0.0002422332763671875, 0.0010557174682617188, 0.002353668212890625, 0.0036516189575195312, 0.0049495697021484375, 0.006247520446777344, 0.00754547119140625, 0.008843421936035156, 0.010141372680664062, 0.011439323425292969, 0.012737274169921875, 0.014035224914550781, 0.015333175659179688, 0.016631126403808594, 0.0179290771484375, 0.019227027893066406, 0.020524978637695312, 0.02182292938232422, 0.023120880126953125, 0.02441883087158203, 0.025716781616210938, 0.027014732360839844, 0.02831268310546875, 0.029610633850097656, 0.030908584594726562, 0.03220653533935547, 0.033504486083984375, 0.03480243682861328, 0.03610038757324219, 0.037398338317871094, 0.0386962890625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 15.0, 13.0, 37.0, 56.0, 164.0, 1448.0, 1042664.0, 3697.0, 290.0, 88.0, 45.0, 12.0, 9.0, 1.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.024932861328125, -0.024397850036621094, -0.023862838745117188, -0.02332782745361328, -0.022792816162109375, -0.02225780487060547, -0.021722793579101562, -0.021187782287597656, -0.02065277099609375, -0.020117759704589844, -0.019582748413085938, -0.01904773712158203, -0.018512725830078125, -0.01797771453857422, -0.017442703247070312, -0.016907691955566406, -0.0163726806640625, -0.015837669372558594, -0.015302658081054688, -0.014767646789550781, -0.014232635498046875, -0.013697624206542969, -0.013162612915039062, -0.012627601623535156, -0.01209259033203125, -0.011557579040527344, -0.011022567749023438, -0.010487556457519531, -0.009952545166015625, -0.009417533874511719, -0.008882522583007812, -0.008347511291503906, -0.0078125, -0.007277488708496094, -0.0067424774169921875, -0.006207466125488281, -0.005672454833984375, -0.005137443542480469, -0.0046024322509765625, -0.004067420959472656, -0.00353240966796875, -0.0029973983764648438, -0.0024623870849609375, -0.0019273757934570312, -0.001392364501953125, -0.0008573532104492188, -0.0003223419189453125, 0.00021266937255859375, 0.0007476806640625, 0.0012826919555664062, 0.0018177032470703125, 0.0023527145385742188, 0.002887725830078125, 0.0034227371215820312, 0.0039577484130859375, 0.004492759704589844, 0.00502777099609375, 0.005562782287597656, 0.0060977935791015625, 0.006632804870605469, 0.007167816162109375, 0.007702827453613281, 0.008237838745117188, 0.008772850036621094, 0.009307861328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 11.0, 5.0, 12.0, 43.0, 61.0, 137.0, 408.0, 166.0, 67.0, 33.0, 27.0, 11.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003120899200439453, -0.00030553434044122696, -0.0002989787608385086, -0.00029242318123579025, -0.0002858676016330719, -0.00027931202203035355, -0.0002727564424276352, -0.00026620086282491684, -0.0002596452832221985, -0.00025308970361948013, -0.0002465341240167618, -0.00023997854441404343, -0.00023342296481132507, -0.00022686738520860672, -0.00022031180560588837, -0.00021375622600317, -0.00020720064640045166, -0.0002006450667977333, -0.00019408948719501495, -0.0001875339075922966, -0.00018097832798957825, -0.0001744227483868599, -0.00016786716878414154, -0.0001613115891814232, -0.00015475600957870483, -0.00014820042997598648, -0.00014164485037326813, -0.00013508927077054977, -0.00012853369116783142, -0.00012197811156511307, -0.00011542253196239471, -0.00010886695235967636, -0.00010231137275695801, -9.575579315423965e-05, -8.92002135515213e-05, -8.264463394880295e-05, -7.60890543460846e-05, -6.953347474336624e-05, -6.297789514064789e-05, -5.6422315537929535e-05, -4.986673593521118e-05, -4.331115633249283e-05, -3.6755576729774475e-05, -3.0199997127056122e-05, -2.364441752433777e-05, -1.7088837921619415e-05, -1.0533258318901062e-05, -3.977678716182709e-06, 2.5779008865356445e-06, 9.133480489253998e-06, 1.568906009197235e-05, 2.2244639694690704e-05, 2.8800219297409058e-05, 3.535579890012741e-05, 4.1911378502845764e-05, 4.846695810556412e-05, 5.502253770828247e-05, 6.157811731100082e-05, 6.813369691371918e-05, 7.468927651643753e-05, 8.124485611915588e-05, 8.780043572187424e-05, 9.435601532459259e-05, 0.00010091159492731094, 0.0001074671745300293]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 4.0, 10.0, 12.0, 41.0, 93.0, 228.0, 900.0, 18872.0, 1025167.0, 2572.0, 411.0, 141.0, 38.0, 27.0, 10.0, 10.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0163116455078125, -0.015712976455688477, -0.015114307403564453, -0.01451563835144043, -0.013916969299316406, -0.013318300247192383, -0.01271963119506836, -0.012120962142944336, -0.011522293090820312, -0.010923624038696289, -0.010324954986572266, -0.009726285934448242, -0.009127616882324219, -0.008528947830200195, -0.007930278778076172, -0.0073316097259521484, -0.006732940673828125, -0.0061342716217041016, -0.005535602569580078, -0.004936933517456055, -0.004338264465332031, -0.003739595413208008, -0.0031409263610839844, -0.002542257308959961, -0.0019435882568359375, -0.001344919204711914, -0.0007462501525878906, -0.0001475811004638672, 0.00045108795166015625, 0.0010497570037841797, 0.0016484260559082031, 0.0022470951080322266, 0.00284576416015625, 0.0034444332122802734, 0.004043102264404297, 0.00464177131652832, 0.005240440368652344, 0.005839109420776367, 0.006437778472900391, 0.007036447525024414, 0.0076351165771484375, 0.008233785629272461, 0.008832454681396484, 0.009431123733520508, 0.010029792785644531, 0.010628461837768555, 0.011227130889892578, 0.011825799942016602, 0.012424468994140625, 0.013023138046264648, 0.013621807098388672, 0.014220476150512695, 0.014819145202636719, 0.015417814254760742, 0.016016483306884766, 0.01661515235900879, 0.017213821411132812, 0.017812490463256836, 0.01841115951538086, 0.019009828567504883, 0.019608497619628906, 0.02020716667175293, 0.020805835723876953, 0.021404504776000977, 0.022003173828125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 3.0, 16.0, 30.0, 71.0, 297.0, 399.0, 110.0, 34.0, 21.0, 9.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01983642578125, -0.019272327423095703, -0.018708229064941406, -0.01814413070678711, -0.017580032348632812, -0.017015933990478516, -0.01645183563232422, -0.015887737274169922, -0.015323638916015625, -0.014759540557861328, -0.014195442199707031, -0.013631343841552734, -0.013067245483398438, -0.01250314712524414, -0.011939048767089844, -0.011374950408935547, -0.01081085205078125, -0.010246753692626953, -0.009682655334472656, -0.00911855697631836, -0.008554458618164062, -0.007990360260009766, -0.007426261901855469, -0.006862163543701172, -0.006298065185546875, -0.005733966827392578, -0.005169868469238281, -0.004605770111083984, -0.0040416717529296875, -0.0034775733947753906, -0.0029134750366210938, -0.002349376678466797, -0.0017852783203125, -0.0012211799621582031, -0.0006570816040039062, -9.298324584960938e-05, 0.0004711151123046875, 0.0010352134704589844, 0.0015993118286132812, 0.002163410186767578, 0.002727508544921875, 0.003291606903076172, 0.0038557052612304688, 0.004419803619384766, 0.0049839019775390625, 0.005548000335693359, 0.006112098693847656, 0.006676197052001953, 0.00724029541015625, 0.007804393768310547, 0.008368492126464844, 0.00893259048461914, 0.009496688842773438, 0.010060787200927734, 0.010624885559082031, 0.011188983917236328, 0.011753082275390625, 0.012317180633544922, 0.012881278991699219, 0.013445377349853516, 0.014009475708007812, 0.01457357406616211, 0.015137672424316406, 0.015701770782470703, 0.016265869140625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 24.0, 234.0, 689.0, 55.0, 11.0, 2.0], "bins": [-1.5053203105926514, -1.4803191423416138, -1.4553178548812866, -1.430316686630249, -1.4053155183792114, -1.3803143501281738, -1.3553130626678467, -1.330311894416809, -1.3053107261657715, -1.2803095579147339, -1.2553082704544067, -1.2303071022033691, -1.2053059339523315, -1.180304765701294, -1.1553034782409668, -1.1303023099899292, -1.1053011417388916, -1.080299973487854, -1.0552986860275269, -1.0302975177764893, -1.0052963495254517, -0.9802951216697693, -0.9552939534187317, -0.9302927255630493, -0.9052914977073669, -0.8802902698516846, -0.855289101600647, -0.8302878737449646, -0.805286705493927, -0.7802854776382446, -0.755284309387207, -0.7302830815315247, -0.7052818536758423, -0.6802806258201599, -0.6552794575691223, -0.6302782297134399, -0.6052770614624023, -0.58027583360672, -0.5552746653556824, -0.5302734375, -0.5052722692489624, -0.4802710711956024, -0.45526987314224243, -0.43026867508888245, -0.40526747703552246, -0.3802662491798401, -0.3552650809288025, -0.3302638530731201, -0.3052626848220825, -0.28026148676872253, -0.25526028871536255, -0.23025909066200256, -0.20525789260864258, -0.1802566796541214, -0.1552554816007614, -0.13025428354740143, -0.10525307804346085, -0.08025187999010086, -0.05525067821145058, -0.030249476432800293, -0.005248278379440308, 0.019752927124500275, 0.04475412517786026, 0.06975532323122025, 0.09475652128458023]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 8.0, 5.0, 2.0, 3.0, 5.0, 12.0, 8.0, 7.0, 14.0, 9.0, 15.0, 19.0, 19.0, 23.0, 18.0, 27.0, 30.0, 24.0, 34.0, 46.0, 49.0, 33.0, 40.0, 44.0, 46.0, 60.0, 54.0, 33.0, 30.0, 34.0, 30.0, 35.0, 23.0, 28.0, 20.0, 23.0, 16.0, 12.0, 9.0, 14.0, 12.0, 11.0, 9.0, 5.0, 1.0, 3.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.14891719818115234, -0.14399610459804535, -0.13907501101493835, -0.13415393233299255, -0.12923283874988556, -0.12431174516677856, -0.11939065903425217, -0.11446957290172577, -0.10954847931861877, -0.10462738573551178, -0.09970629960298538, -0.09478521347045898, -0.08986411988735199, -0.084943026304245, -0.0800219401717186, -0.0751008540391922, -0.0701797604560852, -0.06525866687297821, -0.06033758074045181, -0.05541649088263512, -0.05049540102481842, -0.045574311167001724, -0.04065322130918503, -0.03573213145136833, -0.030811041593551636, -0.02588995173573494, -0.020968861877918243, -0.016047772020101547, -0.011126682162284851, -0.006205592304468155, -0.0012845024466514587, 0.0036365874111652374, 0.008557677268981934, 0.01347876712679863, 0.018399856984615326, 0.023320946842432022, 0.028242036700248718, 0.033163126558065414, 0.03808421641588211, 0.04300530627369881, 0.0479263961315155, 0.0528474859893322, 0.057768575847148895, 0.06268966197967529, 0.06761075556278229, 0.07253184914588928, 0.07745293527841568, 0.08237402141094208, 0.08729511499404907, 0.09221620857715607, 0.09713729470968246, 0.10205838084220886, 0.10697947442531586, 0.11190056800842285, 0.11682165414094925, 0.12174274027347565, 0.12666383385658264, 0.13158492743968964, 0.13650602102279663, 0.14142709970474243, 0.14634819328784943, 0.15126928687095642, 0.15619036555290222, 0.16111145913600922, 0.1660325527191162]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 11.0, 9.0, 16.0, 17.0, 22.0, 41.0, 50.0, 91.0, 126.0, 197.0, 327.0, 566.0, 1468.0, 3290.0, 13133.0, 150524.0, 3908791.0, 101624.0, 8815.0, 2633.0, 963.0, 526.0, 359.0, 192.0, 147.0, 102.0, 60.0, 38.0, 35.0, 25.0, 19.0, 14.0, 8.0, 10.0, 7.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.016357421875, -0.01578235626220703, -0.015207290649414062, -0.014632225036621094, -0.014057159423828125, -0.013482093811035156, -0.012907028198242188, -0.012331962585449219, -0.01175689697265625, -0.011181831359863281, -0.010606765747070312, -0.010031700134277344, -0.009456634521484375, -0.008881568908691406, -0.008306503295898438, -0.007731437683105469, -0.0071563720703125, -0.006581306457519531, -0.0060062408447265625, -0.005431175231933594, -0.004856109619140625, -0.004281044006347656, -0.0037059783935546875, -0.0031309127807617188, -0.00255584716796875, -0.0019807815551757812, -0.0014057159423828125, -0.0008306503295898438, -0.000255584716796875, 0.00031948089599609375, 0.0008945465087890625, 0.0014696121215820312, 0.002044677734375, 0.0026197433471679688, 0.0031948089599609375, 0.0037698745727539062, 0.004344940185546875, 0.004920005798339844, 0.0054950714111328125, 0.006070137023925781, 0.00664520263671875, 0.007220268249511719, 0.0077953338623046875, 0.008370399475097656, 0.008945465087890625, 0.009520530700683594, 0.010095596313476562, 0.010670661926269531, 0.0112457275390625, 0.011820793151855469, 0.012395858764648438, 0.012970924377441406, 0.013545989990234375, 0.014121055603027344, 0.014696121215820312, 0.015271186828613281, 0.01584625244140625, 0.01642131805419922, 0.016996383666992188, 0.017571449279785156, 0.018146514892578125, 0.018721580505371094, 0.019296646118164062, 0.01987171173095703, 0.02044677734375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 11.0, 18.0, 21.0, 26.0, 36.0, 50.0, 63.0, 79.0, 76.0, 88.0, 88.0, 93.0, 98.0, 72.0, 47.0, 26.0, 30.0, 10.0, 14.0, 17.0, 5.0, 4.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0179290771484375, -0.017354726791381836, -0.016780376434326172, -0.016206026077270508, -0.015631675720214844, -0.01505732536315918, -0.014482975006103516, -0.013908624649047852, -0.013334274291992188, -0.012759923934936523, -0.01218557357788086, -0.011611223220825195, -0.011036872863769531, -0.010462522506713867, -0.009888172149658203, -0.009313821792602539, -0.008739471435546875, -0.008165121078491211, -0.007590770721435547, -0.007016420364379883, -0.006442070007324219, -0.005867719650268555, -0.005293369293212891, -0.0047190189361572266, -0.0041446685791015625, -0.0035703182220458984, -0.0029959678649902344, -0.0024216175079345703, -0.0018472671508789062, -0.0012729167938232422, -0.0006985664367675781, -0.00012421607971191406, 0.00045013427734375, 0.001024484634399414, 0.0015988349914550781, 0.002173185348510742, 0.0027475357055664062, 0.0033218860626220703, 0.0038962364196777344, 0.0044705867767333984, 0.0050449371337890625, 0.0056192874908447266, 0.006193637847900391, 0.006767988204956055, 0.007342338562011719, 0.007916688919067383, 0.008491039276123047, 0.009065389633178711, 0.009639739990234375, 0.010214090347290039, 0.010788440704345703, 0.011362791061401367, 0.011937141418457031, 0.012511491775512695, 0.01308584213256836, 0.013660192489624023, 0.014234542846679688, 0.014808893203735352, 0.015383243560791016, 0.01595759391784668, 0.016531944274902344, 0.017106294631958008, 0.017680644989013672, 0.018254995346069336, 0.018829345703125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 4.0, 7.0, 3.0, 11.0, 3.0, 20.0, 47.0, 84.0, 264.0, 721.0, 2338.0, 9412.0, 3733183.0, 437195.0, 7689.0, 2080.0, 738.0, 261.0, 110.0, 45.0, 23.0, 10.0, 9.0, 7.0, 2.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.034698486328125, -0.0336761474609375, -0.03265380859375, -0.0316314697265625, -0.030609130859375, -0.0295867919921875, -0.028564453125, -0.0275421142578125, -0.026519775390625, -0.0254974365234375, -0.02447509765625, -0.0234527587890625, -0.022430419921875, -0.0214080810546875, -0.0203857421875, -0.0193634033203125, -0.018341064453125, -0.0173187255859375, -0.01629638671875, -0.0152740478515625, -0.014251708984375, -0.0132293701171875, -0.01220703125, -0.0111846923828125, -0.010162353515625, -0.0091400146484375, -0.00811767578125, -0.0070953369140625, -0.006072998046875, -0.0050506591796875, -0.0040283203125, -0.0030059814453125, -0.001983642578125, -0.0009613037109375, 6.103515625e-05, 0.0010833740234375, 0.002105712890625, 0.0031280517578125, 0.004150390625, 0.0051727294921875, 0.006195068359375, 0.0072174072265625, 0.00823974609375, 0.0092620849609375, 0.010284423828125, 0.0113067626953125, 0.0123291015625, 0.0133514404296875, 0.014373779296875, 0.0153961181640625, 0.01641845703125, 0.0174407958984375, 0.018463134765625, 0.0194854736328125, 0.0205078125, 0.0215301513671875, 0.022552490234375, 0.0235748291015625, 0.02459716796875, 0.0256195068359375, 0.026641845703125, 0.0276641845703125, 0.0286865234375, 0.0297088623046875, 0.030731201171875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 8.0, 1.0, 2.0, 7.0, 12.0, 14.0, 15.0, 49.0, 131.0, 504.0, 2313.0, 727.0, 175.0, 55.0, 20.0, 8.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.023162841796875, -0.022454261779785156, -0.021745681762695312, -0.02103710174560547, -0.020328521728515625, -0.01961994171142578, -0.018911361694335938, -0.018202781677246094, -0.01749420166015625, -0.016785621643066406, -0.016077041625976562, -0.015368461608886719, -0.014659881591796875, -0.013951301574707031, -0.013242721557617188, -0.012534141540527344, -0.0118255615234375, -0.011116981506347656, -0.010408401489257812, -0.009699821472167969, -0.008991241455078125, -0.008282661437988281, -0.0075740814208984375, -0.006865501403808594, -0.00615692138671875, -0.005448341369628906, -0.0047397613525390625, -0.004031181335449219, -0.003322601318359375, -0.0026140213012695312, -0.0019054412841796875, -0.0011968612670898438, -0.00048828125, 0.00022029876708984375, 0.0009288787841796875, 0.0016374588012695312, 0.002346038818359375, 0.0030546188354492188, 0.0037631988525390625, 0.004471778869628906, 0.00518035888671875, 0.005888938903808594, 0.0065975189208984375, 0.007306098937988281, 0.008014678955078125, 0.008723258972167969, 0.009431838989257812, 0.010140419006347656, 0.0108489990234375, 0.011557579040527344, 0.012266159057617188, 0.012974739074707031, 0.013683319091796875, 0.014391899108886719, 0.015100479125976562, 0.015809059143066406, 0.01651763916015625, 0.017226219177246094, 0.017934799194335938, 0.01864337921142578, 0.019351959228515625, 0.02006053924560547, 0.020769119262695312, 0.021477699279785156, 0.022186279296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 12.0, 15.0, 36.0, 81.0, 267.0, 386.0, 125.0, 35.0, 29.0, 12.0, 3.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.19926783442497253, -0.19537487626075745, -0.19148191809654236, -0.18758895993232727, -0.18369600176811218, -0.1798030436038971, -0.175910085439682, -0.17201711237430573, -0.16812415421009064, -0.16423119604587555, -0.16033823788166046, -0.15644527971744537, -0.15255232155323029, -0.148659348487854, -0.14476639032363892, -0.14087343215942383, -0.13698047399520874, -0.13308751583099365, -0.12919455766677856, -0.12530159950256348, -0.12140863388776779, -0.1175156757235527, -0.11362271755933762, -0.10972975939512253, -0.10583680868148804, -0.10194385051727295, -0.09805089235305786, -0.09415793418884277, -0.09026496857404709, -0.086372010409832, -0.08247905224561691, -0.07858609408140182, -0.07469313591718674, -0.07080017775297165, -0.06690721958875656, -0.06301425397396088, -0.05912129580974579, -0.0552283376455307, -0.05133537948131561, -0.047442421317100525, -0.04354945942759514, -0.03965650126338005, -0.035763539373874664, -0.031870581209659576, -0.02797762118279934, -0.024084661155939102, -0.020191702991724014, -0.016298742964863777, -0.01240578293800354, -0.008512822911143303, -0.00461986381560564, -0.0007269047200679779, 0.003166055306792259, 0.007059015333652496, 0.010951973497867584, 0.014844933524727821, 0.01873789355158806, 0.022630853578448296, 0.026523813605308533, 0.03041677176952362, 0.03430972993373871, 0.038202691823244095, 0.04209564998745918, 0.04598861187696457, 0.04988157004117966]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 3.0, 3.0, 8.0, 7.0, 7.0, 6.0, 20.0, 9.0, 20.0, 23.0, 30.0, 22.0, 33.0, 30.0, 46.0, 44.0, 35.0, 50.0, 45.0, 50.0, 47.0, 55.0, 48.0, 44.0, 39.0, 33.0, 33.0, 40.0, 31.0, 24.0, 18.0, 15.0, 16.0, 19.0, 9.0, 11.0, 8.0, 5.0, 7.0, 8.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05647921562194824, -0.054582379758358, -0.05268554389476776, -0.05078870430588722, -0.04889186844229698, -0.04699503257870674, -0.0450981929898262, -0.04320135712623596, -0.04130452126264572, -0.03940768539905548, -0.03751084953546524, -0.0356140099465847, -0.03371717408299446, -0.03182033821940422, -0.02992350049316883, -0.02802666276693344, -0.0261298269033432, -0.02423299103975296, -0.02233615331351757, -0.02043931558728218, -0.01854247972369194, -0.0166456438601017, -0.01474880613386631, -0.012851969338953495, -0.01095513254404068, -0.009058295749127865, -0.00716145895421505, -0.005264622159302235, -0.0033677853643894196, -0.0014709485694766045, 0.00042588822543621063, 0.0023227250203490257, 0.004219561815261841, 0.006116398610174656, 0.008013235405087471, 0.009910072200000286, 0.011806908994913101, 0.013703745789825916, 0.015600582584738731, 0.01749742031097412, 0.01939425617456436, 0.021291092038154602, 0.023187929764389992, 0.02508476749062538, 0.026981603354215622, 0.028878439217805862, 0.030775276944041252, 0.03267211467027664, 0.03456895053386688, 0.03646578639745712, 0.03836262226104736, 0.0402594618499279, 0.04215629771351814, 0.04405313357710838, 0.04594997316598892, 0.04784680902957916, 0.0497436448931694, 0.051640480756759644, 0.053537316620349884, 0.05543415620923042, 0.05733099207282066, 0.059227827936410904, 0.06112466752529144, 0.06302150338888168, 0.06491833925247192]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 12.0, 21.0, 12.0, 21.0, 38.0, 42.0, 71.0, 80.0, 116.0, 186.0, 273.0, 463.0, 650.0, 1095.0, 2041.0, 3776.0, 8095.0, 19869.0, 63256.0, 409999.0, 434710.0, 66680.0, 19895.0, 8092.0, 3808.0, 2104.0, 1080.0, 714.0, 434.0, 278.0, 195.0, 129.0, 81.0, 52.0, 59.0, 29.0, 25.0, 15.0, 13.0, 9.0, 10.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.0321044921875, -0.031131982803344727, -0.030159473419189453, -0.02918696403503418, -0.028214454650878906, -0.027241945266723633, -0.02626943588256836, -0.025296926498413086, -0.024324417114257812, -0.02335190773010254, -0.022379398345947266, -0.021406888961791992, -0.02043437957763672, -0.019461870193481445, -0.018489360809326172, -0.0175168514251709, -0.016544342041015625, -0.015571832656860352, -0.014599323272705078, -0.013626813888549805, -0.012654304504394531, -0.011681795120239258, -0.010709285736083984, -0.009736776351928711, -0.008764266967773438, -0.007791757583618164, -0.006819248199462891, -0.005846738815307617, -0.004874229431152344, -0.0039017200469970703, -0.002929210662841797, -0.0019567012786865234, -0.00098419189453125, -1.1682510375976562e-05, 0.0009608268737792969, 0.0019333362579345703, 0.0029058456420898438, 0.003878355026245117, 0.004850864410400391, 0.005823373794555664, 0.0067958831787109375, 0.007768392562866211, 0.008740901947021484, 0.009713411331176758, 0.010685920715332031, 0.011658430099487305, 0.012630939483642578, 0.013603448867797852, 0.014575958251953125, 0.015548467636108398, 0.016520977020263672, 0.017493486404418945, 0.01846599578857422, 0.019438505172729492, 0.020411014556884766, 0.02138352394104004, 0.022356033325195312, 0.023328542709350586, 0.02430105209350586, 0.025273561477661133, 0.026246070861816406, 0.02721858024597168, 0.028191089630126953, 0.029163599014282227, 0.0301361083984375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 17.0, 22.0, 21.0, 41.0, 41.0, 58.0, 82.0, 72.0, 77.0, 93.0, 97.0, 92.0, 77.0, 65.0, 32.0, 30.0, 7.0, 15.0, 10.0, 11.0, 6.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0170745849609375, -0.016513586044311523, -0.015952587127685547, -0.01539158821105957, -0.014830589294433594, -0.014269590377807617, -0.01370859146118164, -0.013147592544555664, -0.012586593627929688, -0.012025594711303711, -0.011464595794677734, -0.010903596878051758, -0.010342597961425781, -0.009781599044799805, -0.009220600128173828, -0.008659601211547852, -0.008098602294921875, -0.0075376033782958984, -0.006976604461669922, -0.006415605545043945, -0.005854606628417969, -0.005293607711791992, -0.004732608795166016, -0.004171609878540039, -0.0036106109619140625, -0.003049612045288086, -0.0024886131286621094, -0.0019276142120361328, -0.0013666152954101562, -0.0008056163787841797, -0.0002446174621582031, 0.00031638145446777344, 0.00087738037109375, 0.0014383792877197266, 0.001999378204345703, 0.0025603771209716797, 0.0031213760375976562, 0.003682374954223633, 0.004243373870849609, 0.004804372787475586, 0.0053653717041015625, 0.005926370620727539, 0.006487369537353516, 0.007048368453979492, 0.007609367370605469, 0.008170366287231445, 0.008731365203857422, 0.009292364120483398, 0.009853363037109375, 0.010414361953735352, 0.010975360870361328, 0.011536359786987305, 0.012097358703613281, 0.012658357620239258, 0.013219356536865234, 0.013780355453491211, 0.014341354370117188, 0.014902353286743164, 0.01546335220336914, 0.016024351119995117, 0.016585350036621094, 0.01714634895324707, 0.017707347869873047, 0.018268346786499023, 0.018829345703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 10.0, 10.0, 13.0, 19.0, 20.0, 40.0, 43.0, 63.0, 80.0, 165.0, 298.0, 550.0, 1070.0, 2891.0, 12548.0, 142717.0, 827099.0, 50545.0, 6579.0, 1918.0, 811.0, 401.0, 237.0, 144.0, 95.0, 63.0, 39.0, 18.0, 12.0, 8.0, 7.0, 9.0, 6.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.051544189453125, -0.05016279220581055, -0.048781394958496094, -0.04739999771118164, -0.04601860046386719, -0.044637203216552734, -0.04325580596923828, -0.04187440872192383, -0.040493011474609375, -0.03911161422729492, -0.03773021697998047, -0.036348819732666016, -0.03496742248535156, -0.03358602523803711, -0.032204627990722656, -0.030823230743408203, -0.02944183349609375, -0.028060436248779297, -0.026679039001464844, -0.02529764175415039, -0.023916244506835938, -0.022534847259521484, -0.02115345001220703, -0.019772052764892578, -0.018390655517578125, -0.017009258270263672, -0.01562786102294922, -0.014246463775634766, -0.012865066528320312, -0.01148366928100586, -0.010102272033691406, -0.008720874786376953, -0.0073394775390625, -0.005958080291748047, -0.004576683044433594, -0.0031952857971191406, -0.0018138885498046875, -0.0004324913024902344, 0.0009489059448242188, 0.002330303192138672, 0.003711700439453125, 0.005093097686767578, 0.006474494934082031, 0.007855892181396484, 0.009237289428710938, 0.01061868667602539, 0.012000083923339844, 0.013381481170654297, 0.01476287841796875, 0.016144275665283203, 0.017525672912597656, 0.01890707015991211, 0.020288467407226562, 0.021669864654541016, 0.02305126190185547, 0.024432659149169922, 0.025814056396484375, 0.027195453643798828, 0.02857685089111328, 0.029958248138427734, 0.03133964538574219, 0.03272104263305664, 0.034102439880371094, 0.03548383712768555, 0.036865234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 4.0, 13.0, 14.0, 15.0, 20.0, 22.0, 26.0, 27.0, 27.0, 31.0, 31.0, 33.0, 23.0, 47.0, 49.0, 35.0, 49.0, 45.0, 48.0, 36.0, 51.0, 37.0, 36.0, 33.0, 37.0, 30.0, 29.0, 32.0, 12.0, 13.0, 15.0, 10.0, 15.0, 8.0, 6.0, 7.0, 4.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036865234375, -0.035726070404052734, -0.03458690643310547, -0.0334477424621582, -0.03230857849121094, -0.031169414520263672, -0.030030250549316406, -0.02889108657836914, -0.027751922607421875, -0.02661275863647461, -0.025473594665527344, -0.024334430694580078, -0.023195266723632812, -0.022056102752685547, -0.02091693878173828, -0.019777774810791016, -0.01863861083984375, -0.017499446868896484, -0.01636028289794922, -0.015221118927001953, -0.014081954956054688, -0.012942790985107422, -0.011803627014160156, -0.01066446304321289, -0.009525299072265625, -0.00838613510131836, -0.007246971130371094, -0.006107807159423828, -0.0049686431884765625, -0.003829479217529297, -0.0026903152465820312, -0.0015511512756347656, -0.0004119873046875, 0.0007271766662597656, 0.0018663406372070312, 0.003005504608154297, 0.0041446685791015625, 0.005283832550048828, 0.006422996520996094, 0.007562160491943359, 0.008701324462890625, 0.00984048843383789, 0.010979652404785156, 0.012118816375732422, 0.013257980346679688, 0.014397144317626953, 0.015536308288574219, 0.016675472259521484, 0.01781463623046875, 0.018953800201416016, 0.02009296417236328, 0.021232128143310547, 0.022371292114257812, 0.023510456085205078, 0.024649620056152344, 0.02578878402709961, 0.026927947998046875, 0.02806711196899414, 0.029206275939941406, 0.030345439910888672, 0.03148460388183594, 0.0326237678527832, 0.03376293182373047, 0.034902095794677734, 0.036041259765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 9.0, 22.0, 19.0, 57.0, 77.0, 190.0, 451.0, 1878.0, 61387.0, 976390.0, 6605.0, 894.0, 305.0, 125.0, 56.0, 43.0, 23.0, 9.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01141357421875, -0.011115193367004395, -0.010816812515258789, -0.010518431663513184, -0.010220050811767578, -0.009921669960021973, -0.009623289108276367, -0.009324908256530762, -0.009026527404785156, -0.00872814655303955, -0.008429765701293945, -0.00813138484954834, -0.007833003997802734, -0.007534623146057129, -0.0072362422943115234, -0.006937861442565918, -0.0066394805908203125, -0.006341099739074707, -0.0060427188873291016, -0.005744338035583496, -0.005445957183837891, -0.005147576332092285, -0.00484919548034668, -0.004550814628601074, -0.004252433776855469, -0.003954052925109863, -0.003655672073364258, -0.0033572912216186523, -0.003058910369873047, -0.0027605295181274414, -0.002462148666381836, -0.0021637678146362305, -0.001865386962890625, -0.0015670061111450195, -0.001268625259399414, -0.0009702444076538086, -0.0006718635559082031, -0.00037348270416259766, -7.510185241699219e-05, 0.00022327899932861328, 0.0005216598510742188, 0.0008200407028198242, 0.0011184215545654297, 0.0014168024063110352, 0.0017151832580566406, 0.002013564109802246, 0.0023119449615478516, 0.002610325813293457, 0.0029087066650390625, 0.003207087516784668, 0.0035054683685302734, 0.003803849220275879, 0.004102230072021484, 0.00440061092376709, 0.004698991775512695, 0.004997372627258301, 0.005295753479003906, 0.005594134330749512, 0.005892515182495117, 0.006190896034240723, 0.006489276885986328, 0.006787657737731934, 0.007086038589477539, 0.0073844194412231445, 0.00768280029296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 7.0, 5.0, 12.0, 21.0, 16.0, 38.0, 64.0, 61.0, 93.0, 141.0, 157.0, 116.0, 82.0, 51.0, 31.0, 32.0, 13.0, 11.0, 12.0, 13.0, 2.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011163949966430664, -0.0001084720715880394, -0.00010530464351177216, -0.00010213721543550491, -9.896978735923767e-05, -9.580235928297043e-05, -9.263493120670319e-05, -8.946750313043594e-05, -8.63000750541687e-05, -8.313264697790146e-05, -7.996521890163422e-05, -7.679779082536697e-05, -7.363036274909973e-05, -7.046293467283249e-05, -6.729550659656525e-05, -6.4128078520298e-05, -6.096065044403076e-05, -5.779322236776352e-05, -5.462579429149628e-05, -5.1458366215229034e-05, -4.829093813896179e-05, -4.512351006269455e-05, -4.195608198642731e-05, -3.8788653910160065e-05, -3.562122583389282e-05, -3.245379775762558e-05, -2.9286369681358337e-05, -2.6118941605091095e-05, -2.2951513528823853e-05, -1.978408545255661e-05, -1.6616657376289368e-05, -1.3449229300022125e-05, -1.0281801223754883e-05, -7.11437314748764e-06, -3.946945071220398e-06, -7.795169949531555e-07, 2.387911081314087e-06, 5.555339157581329e-06, 8.722767233848572e-06, 1.1890195310115814e-05, 1.5057623386383057e-05, 1.82250514626503e-05, 2.139247953891754e-05, 2.4559907615184784e-05, 2.7727335691452026e-05, 3.089476376771927e-05, 3.406219184398651e-05, 3.7229619920253754e-05, 4.0397047996520996e-05, 4.356447607278824e-05, 4.673190414905548e-05, 4.9899332225322723e-05, 5.3066760301589966e-05, 5.623418837785721e-05, 5.940161645412445e-05, 6.256904453039169e-05, 6.573647260665894e-05, 6.890390068292618e-05, 7.207132875919342e-05, 7.523875683546066e-05, 7.84061849117279e-05, 8.157361298799515e-05, 8.474104106426239e-05, 8.790846914052963e-05, 9.107589721679688e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 3.0, 10.0, 14.0, 18.0, 23.0, 34.0, 39.0, 73.0, 150.0, 361.0, 917.0, 4207.0, 105135.0, 920752.0, 14117.0, 1671.0, 555.0, 196.0, 115.0, 55.0, 37.0, 23.0, 18.0, 11.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007022857666015625, -0.006755173206329346, -0.006487488746643066, -0.006219804286956787, -0.005952119827270508, -0.0056844353675842285, -0.005416750907897949, -0.00514906644821167, -0.004881381988525391, -0.004613697528839111, -0.004346013069152832, -0.004078328609466553, -0.0038106441497802734, -0.003542959690093994, -0.003275275230407715, -0.0030075907707214355, -0.0027399063110351562, -0.002472221851348877, -0.0022045373916625977, -0.0019368529319763184, -0.001669168472290039, -0.0014014840126037598, -0.0011337995529174805, -0.0008661150932312012, -0.0005984306335449219, -0.0003307461738586426, -6.306171417236328e-05, 0.00020462274551391602, 0.0004723072052001953, 0.0007399916648864746, 0.001007676124572754, 0.0012753605842590332, 0.0015430450439453125, 0.0018107295036315918, 0.002078413963317871, 0.0023460984230041504, 0.0026137828826904297, 0.002881467342376709, 0.0031491518020629883, 0.0034168362617492676, 0.003684520721435547, 0.003952205181121826, 0.0042198896408081055, 0.004487574100494385, 0.004755258560180664, 0.005022943019866943, 0.005290627479553223, 0.005558311939239502, 0.005825996398925781, 0.0060936808586120605, 0.00636136531829834, 0.006629049777984619, 0.0068967342376708984, 0.007164418697357178, 0.007432103157043457, 0.007699787616729736, 0.007967472076416016, 0.008235156536102295, 0.008502840995788574, 0.008770525455474854, 0.009038209915161133, 0.009305894374847412, 0.009573578834533691, 0.00984126329421997, 0.01010894775390625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 4.0, 3.0, 6.0, 9.0, 15.0, 16.0, 21.0, 16.0, 24.0, 35.0, 37.0, 31.0, 58.0, 74.0, 82.0, 66.0, 93.0, 73.0, 58.0, 54.0, 39.0, 38.0, 25.0, 20.0, 12.0, 19.0, 14.0, 13.0, 16.0, 6.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042572021484375, -0.004114091396331787, -0.003970980644226074, -0.0038278698921203613, -0.0036847591400146484, -0.0035416483879089355, -0.0033985376358032227, -0.0032554268836975098, -0.003112316131591797, -0.002969205379486084, -0.002826094627380371, -0.002682983875274658, -0.0025398731231689453, -0.0023967623710632324, -0.0022536516189575195, -0.0021105408668518066, -0.0019674301147460938, -0.0018243193626403809, -0.001681208610534668, -0.001538097858428955, -0.0013949871063232422, -0.0012518763542175293, -0.0011087656021118164, -0.0009656548500061035, -0.0008225440979003906, -0.0006794333457946777, -0.0005363225936889648, -0.00039321184158325195, -0.00025010108947753906, -0.00010699033737182617, 3.612041473388672e-05, 0.0001792311668395996, 0.0003223419189453125, 0.0004654526710510254, 0.0006085634231567383, 0.0007516741752624512, 0.0008947849273681641, 0.001037895679473877, 0.0011810064315795898, 0.0013241171836853027, 0.0014672279357910156, 0.0016103386878967285, 0.0017534494400024414, 0.0018965601921081543, 0.002039670944213867, 0.00218278169631958, 0.002325892448425293, 0.002469003200531006, 0.0026121139526367188, 0.0027552247047424316, 0.0028983354568481445, 0.0030414462089538574, 0.0031845569610595703, 0.003327667713165283, 0.003470778465270996, 0.003613889217376709, 0.003756999969482422, 0.0039001107215881348, 0.004043221473693848, 0.0041863322257995605, 0.0043294429779052734, 0.004472553730010986, 0.004615664482116699, 0.004758775234222412, 0.004901885986328125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 8.0, 79.0, 800.0, 114.0, 13.0, 2.0, 1.0, 1.0], "bins": [-1.8321216106414795, -1.8008090257644653, -1.7694965600967407, -1.7381839752197266, -1.706871509552002, -1.6755589246749878, -1.6442463397979736, -1.612933874130249, -1.5816212892532349, -1.5503087043762207, -1.518996238708496, -1.487683653831482, -1.4563710689544678, -1.4250586032867432, -1.393746018409729, -1.3624335527420044, -1.3311209678649902, -1.299808382987976, -1.2684959173202515, -1.2371833324432373, -1.2058708667755127, -1.1745582818984985, -1.1432456970214844, -1.1119332313537598, -1.0806206464767456, -1.0493080615997314, -1.0179955959320068, -0.9866830110549927, -0.9553704857826233, -0.9240579605102539, -0.8927453756332397, -0.8614328503608704, -0.8301204442977905, -0.7988079190254211, -0.7674953937530518, -0.7361828088760376, -0.7048702836036682, -0.6735577583312988, -0.6422451734542847, -0.6109326481819153, -0.5796201229095459, -0.5483075976371765, -0.5169950723648071, -0.48568248748779297, -0.4543699622154236, -0.4230574369430542, -0.3917448818683624, -0.36043232679367065, -0.32911980152130127, -0.2978072762489319, -0.2664947211742401, -0.23518218100070953, -0.20386964082717896, -0.17255710065364838, -0.1412445604801178, -0.10993202030658722, -0.07861948013305664, -0.04730693995952606, -0.015994399785995483, 0.015318140387535095, 0.046630680561065674, 0.07794322073459625, 0.10925576090812683, 0.1405683010816574, 0.171880841255188]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 4.0, 8.0, 4.0, 6.0, 11.0, 13.0, 26.0, 16.0, 19.0, 19.0, 22.0, 25.0, 31.0, 25.0, 44.0, 51.0, 52.0, 57.0, 58.0, 58.0, 66.0, 41.0, 56.0, 38.0, 39.0, 28.0, 30.0, 31.0, 20.0, 18.0, 20.0, 9.0, 9.0, 9.0, 4.0, 5.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.16554975509643555, -0.16077828407287598, -0.1560068130493164, -0.15123534202575684, -0.14646387100219727, -0.1416924148797989, -0.13692094385623932, -0.13214947283267975, -0.12737800180912018, -0.12260653078556061, -0.11783505976200104, -0.11306359618902206, -0.1082921251654625, -0.10352065414190292, -0.09874919056892395, -0.09397771954536438, -0.08920624852180481, -0.08443477749824524, -0.07966330647468567, -0.0748918429017067, -0.07012037187814713, -0.06534890085458755, -0.06057743355631828, -0.05580596625804901, -0.05103449523448944, -0.04626302421092987, -0.0414915569126606, -0.03672008961439133, -0.03194861859083176, -0.027177149429917336, -0.022405680269002914, -0.017634212970733643, -0.012862741947174072, -0.008091272786259651, -0.00331980362534523, 0.001451665535569191, 0.006223134696483612, 0.010994603857398033, 0.015766073018312454, 0.020537540316581726, 0.025309011340141296, 0.030080480501055717, 0.03485194966197014, 0.03962341696023941, 0.04439488798379898, 0.04916635900735855, 0.05393782630562782, 0.058709293603897095, 0.06348076462745667, 0.06825223565101624, 0.0730237066745758, 0.07779517024755478, 0.08256664127111435, 0.08733811229467392, 0.0921095758676529, 0.09688104689121246, 0.10165251791477203, 0.1064239889383316, 0.11119545996189117, 0.11596692353487015, 0.12073839455842972, 0.1255098581314087, 0.13028132915496826, 0.13505280017852783, 0.1398242712020874]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 0.0, 5.0, 8.0, 20.0, 12.0, 24.0, 47.0, 65.0, 92.0, 141.0, 192.0, 337.0, 1062.0, 4190995.0, 511.0, 255.0, 160.0, 109.0, 67.0, 64.0, 32.0, 20.0, 18.0, 12.0, 5.0, 12.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.385986328125, -0.3694496154785156, -0.35291290283203125, -0.3363761901855469, -0.3198394775390625, -0.3033027648925781, -0.28676605224609375, -0.2702293395996094, -0.253692626953125, -0.23715591430664062, -0.22061920166015625, -0.20408248901367188, -0.1875457763671875, -0.17100906372070312, -0.15447235107421875, -0.13793563842773438, -0.12139892578125, -0.10486221313476562, -0.08832550048828125, -0.07178878784179688, -0.0552520751953125, -0.038715362548828125, -0.02217864990234375, -0.005641937255859375, 0.010894775390625, 0.027431488037109375, 0.04396820068359375, 0.060504913330078125, 0.0770416259765625, 0.09357833862304688, 0.11011505126953125, 0.12665176391601562, 0.1431884765625, 0.15972518920898438, 0.17626190185546875, 0.19279861450195312, 0.2093353271484375, 0.22587203979492188, 0.24240875244140625, 0.2589454650878906, 0.275482177734375, 0.2920188903808594, 0.30855560302734375, 0.3250923156738281, 0.3416290283203125, 0.3581657409667969, 0.37470245361328125, 0.3912391662597656, 0.40777587890625, 0.4243125915527344, 0.44084930419921875, 0.4573860168457031, 0.4739227294921875, 0.4904594421386719, 0.5069961547851562, 0.5235328674316406, 0.540069580078125, 0.5566062927246094, 0.5731430053710938, 0.5896797180175781, 0.6062164306640625, 0.6227531433105469, 0.6392898559570312, 0.6558265686035156, 0.67236328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 15.0, 14.0, 21.0, 27.0, 48.0, 48.0, 58.0, 71.0, 77.0, 86.0, 85.0, 104.0, 75.0, 65.0, 51.0, 43.0, 32.0, 13.0, 12.0, 13.0, 7.0, 4.0, 8.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0157318115234375, -0.01519465446472168, -0.01465749740600586, -0.014120340347290039, -0.013583183288574219, -0.013046026229858398, -0.012508869171142578, -0.011971712112426758, -0.011434555053710938, -0.010897397994995117, -0.010360240936279297, -0.009823083877563477, -0.009285926818847656, -0.008748769760131836, -0.008211612701416016, -0.007674455642700195, -0.007137298583984375, -0.006600141525268555, -0.006062984466552734, -0.005525827407836914, -0.004988670349121094, -0.0044515132904052734, -0.003914356231689453, -0.003377199172973633, -0.0028400421142578125, -0.002302885055541992, -0.0017657279968261719, -0.0012285709381103516, -0.0006914138793945312, -0.00015425682067871094, 0.0003829002380371094, 0.0009200572967529297, 0.00145721435546875, 0.0019943714141845703, 0.0025315284729003906, 0.003068685531616211, 0.0036058425903320312, 0.0041429996490478516, 0.004680156707763672, 0.005217313766479492, 0.0057544708251953125, 0.006291627883911133, 0.006828784942626953, 0.0073659420013427734, 0.007903099060058594, 0.008440256118774414, 0.008977413177490234, 0.009514570236206055, 0.010051727294921875, 0.010588884353637695, 0.011126041412353516, 0.011663198471069336, 0.012200355529785156, 0.012737512588500977, 0.013274669647216797, 0.013811826705932617, 0.014348983764648438, 0.014886140823364258, 0.015423297882080078, 0.0159604549407959, 0.01649761199951172, 0.01703476905822754, 0.01757192611694336, 0.01810908317565918, 0.018646240234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 6.0, 19.0, 10.0, 23.0, 36.0, 63.0, 136.0, 265.0, 394.0, 780.0, 1541.0, 2960.0, 6398.0, 17658.0, 187983.0, 3922658.0, 34808.0, 9878.0, 4337.0, 2066.0, 1053.0, 545.0, 299.0, 152.0, 68.0, 53.0, 25.0, 25.0, 11.0, 9.0, 8.0, 7.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014923095703125, -0.014354228973388672, -0.013785362243652344, -0.013216495513916016, -0.012647628784179688, -0.01207876205444336, -0.011509895324707031, -0.010941028594970703, -0.010372161865234375, -0.009803295135498047, -0.009234428405761719, -0.00866556167602539, -0.008096694946289062, -0.007527828216552734, -0.006958961486816406, -0.006390094757080078, -0.00582122802734375, -0.005252361297607422, -0.004683494567871094, -0.004114627838134766, -0.0035457611083984375, -0.0029768943786621094, -0.0024080276489257812, -0.0018391609191894531, -0.001270294189453125, -0.0007014274597167969, -0.00013256072998046875, 0.0004363059997558594, 0.0010051727294921875, 0.0015740394592285156, 0.0021429061889648438, 0.002711772918701172, 0.0032806396484375, 0.003849506378173828, 0.004418373107910156, 0.004987239837646484, 0.0055561065673828125, 0.006124973297119141, 0.006693840026855469, 0.007262706756591797, 0.007831573486328125, 0.008400440216064453, 0.008969306945800781, 0.00953817367553711, 0.010107040405273438, 0.010675907135009766, 0.011244773864746094, 0.011813640594482422, 0.01238250732421875, 0.012951374053955078, 0.013520240783691406, 0.014089107513427734, 0.014657974243164062, 0.01522684097290039, 0.01579570770263672, 0.016364574432373047, 0.016933441162109375, 0.017502307891845703, 0.01807117462158203, 0.01864004135131836, 0.019208908081054688, 0.019777774810791016, 0.020346641540527344, 0.020915508270263672, 0.021484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 5.0, 11.0, 12.0, 15.0, 25.0, 107.0, 416.0, 2505.0, 723.0, 106.0, 36.0, 27.0, 14.0, 7.0, 4.0, 7.0, 7.0, 2.0, 4.0, 2.0, 5.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0193634033203125, -0.01880502700805664, -0.01824665069580078, -0.017688274383544922, -0.017129898071289062, -0.016571521759033203, -0.016013145446777344, -0.015454769134521484, -0.014896392822265625, -0.014338016510009766, -0.013779640197753906, -0.013221263885498047, -0.012662887573242188, -0.012104511260986328, -0.011546134948730469, -0.01098775863647461, -0.01042938232421875, -0.00987100601196289, -0.009312629699707031, -0.008754253387451172, -0.008195877075195312, -0.007637500762939453, -0.007079124450683594, -0.006520748138427734, -0.005962371826171875, -0.005403995513916016, -0.004845619201660156, -0.004287242889404297, -0.0037288665771484375, -0.003170490264892578, -0.0026121139526367188, -0.0020537376403808594, -0.001495361328125, -0.0009369850158691406, -0.00037860870361328125, 0.00017976760864257812, 0.0007381439208984375, 0.0012965202331542969, 0.0018548965454101562, 0.0024132728576660156, 0.002971649169921875, 0.0035300254821777344, 0.004088401794433594, 0.004646778106689453, 0.0052051544189453125, 0.005763530731201172, 0.006321907043457031, 0.006880283355712891, 0.00743865966796875, 0.00799703598022461, 0.008555412292480469, 0.009113788604736328, 0.009672164916992188, 0.010230541229248047, 0.010788917541503906, 0.011347293853759766, 0.011905670166015625, 0.012464046478271484, 0.013022422790527344, 0.013580799102783203, 0.014139175415039062, 0.014697551727294922, 0.015255928039550781, 0.01581430435180664, 0.0163726806640625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 6.0, 12.0, 21.0, 41.0, 63.0, 144.0, 277.0, 206.0, 112.0, 41.0, 32.0, 17.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11407141387462616, -0.11077532172203064, -0.10747922211885452, -0.104183129966259, -0.10088703036308289, -0.09759093821048737, -0.09429483860731125, -0.09099874645471573, -0.08770264685153961, -0.08440655469894409, -0.08111045509576797, -0.07781436294317245, -0.07451826333999634, -0.07122217118740082, -0.0679260715842247, -0.06462997943162918, -0.06133388355374336, -0.058037787675857544, -0.054741691797971725, -0.05144559592008591, -0.04814950004220009, -0.04485340416431427, -0.04155731201171875, -0.03826121240854263, -0.03496512025594711, -0.031669024378061295, -0.028372928500175476, -0.025076832622289658, -0.02178073674440384, -0.01848464272916317, -0.015188546851277351, -0.011892450973391533, -0.008596353232860565, -0.005300257354974747, -0.0020041619427502155, 0.0012919334694743156, 0.004588029347360134, 0.007884124293923378, 0.011180220171809196, 0.014476316049695015, 0.017772411927580833, 0.021068507805466652, 0.02436460368335247, 0.02766069769859314, 0.030956793576478958, 0.03425288945436478, 0.037548985332250595, 0.040845081210136414, 0.04414117708802223, 0.04743727296590805, 0.05073336884379387, 0.05402946472167969, 0.057325560599565506, 0.060621656477451324, 0.06391774863004684, 0.06721384823322296, 0.07050994038581848, 0.073806032538414, 0.07710213214159012, 0.08039822429418564, 0.08369432389736176, 0.08699041604995728, 0.09028651565313339, 0.09358260780572891, 0.09687870740890503]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 1.0, 14.0, 7.0, 7.0, 15.0, 13.0, 16.0, 15.0, 26.0, 16.0, 28.0, 22.0, 23.0, 33.0, 38.0, 43.0, 52.0, 47.0, 59.0, 46.0, 44.0, 54.0, 52.0, 34.0, 35.0, 37.0, 32.0, 28.0, 21.0, 29.0, 18.0, 18.0, 10.0, 13.0, 8.0, 8.0, 7.0, 3.0, 6.0, 0.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.05529212951660156, -0.053685516119003296, -0.05207889899611473, -0.050472281873226166, -0.0488656684756279, -0.04725905507802963, -0.04565243795514107, -0.0440458208322525, -0.042439207434654236, -0.04083259403705597, -0.039225976914167404, -0.03761935979127884, -0.03601274639368057, -0.034406132996082306, -0.03279951587319374, -0.031192900612950325, -0.02958628535270691, -0.027979670092463493, -0.026373054832220078, -0.02476643957197666, -0.023159824311733246, -0.02155320905148983, -0.019946593791246414, -0.018339978531003, -0.016733363270759583, -0.015126748010516167, -0.01352013275027275, -0.011913517490029335, -0.01030690222978592, -0.008700286969542503, -0.0070936717092990875, -0.005487056449055672, -0.003880441188812256, -0.00227382592856884, -0.0006672106683254242, 0.0009394045919179916, 0.0025460198521614075, 0.004152635112404823, 0.005759250372648239, 0.007365865632891655, 0.00897248089313507, 0.010579096153378487, 0.012185711413621902, 0.013792326673865318, 0.015398941934108734, 0.01700555719435215, 0.018612172454595566, 0.02021878771483898, 0.021825402975082397, 0.023432018235325813, 0.02503863349556923, 0.026645248755812645, 0.02825186401605606, 0.029858479276299477, 0.03146509453654289, 0.03307171165943146, 0.034678325057029724, 0.03628493845462799, 0.037891555577516556, 0.03949817270040512, 0.04110478609800339, 0.042711399495601654, 0.04431801661849022, 0.045924633741378784, 0.04753124713897705]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 10.0, 20.0, 47.0, 70.0, 109.0, 214.0, 410.0, 953.0, 2534.0, 9247.0, 56105.0, 780967.0, 173063.0, 17777.0, 4329.0, 1433.0, 637.0, 273.0, 141.0, 81.0, 44.0, 23.0, 21.0, 17.0, 7.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043212890625, -0.04165363311767578, -0.04009437561035156, -0.038535118103027344, -0.036975860595703125, -0.035416603088378906, -0.03385734558105469, -0.03229808807373047, -0.03073883056640625, -0.02917957305908203, -0.027620315551757812, -0.026061058044433594, -0.024501800537109375, -0.022942543029785156, -0.021383285522460938, -0.01982402801513672, -0.0182647705078125, -0.01670551300048828, -0.015146255493164062, -0.013586997985839844, -0.012027740478515625, -0.010468482971191406, -0.008909225463867188, -0.007349967956542969, -0.00579071044921875, -0.004231452941894531, -0.0026721954345703125, -0.0011129379272460938, 0.000446319580078125, 0.0020055770874023438, 0.0035648345947265625, 0.005124092102050781, 0.006683349609375, 0.008242607116699219, 0.009801864624023438, 0.011361122131347656, 0.012920379638671875, 0.014479637145996094, 0.016038894653320312, 0.01759815216064453, 0.01915740966796875, 0.02071666717529297, 0.022275924682617188, 0.023835182189941406, 0.025394439697265625, 0.026953697204589844, 0.028512954711914062, 0.03007221221923828, 0.0316314697265625, 0.03319072723388672, 0.03474998474121094, 0.036309242248535156, 0.037868499755859375, 0.039427757263183594, 0.04098701477050781, 0.04254627227783203, 0.04410552978515625, 0.04566478729248047, 0.04722404479980469, 0.048783302307128906, 0.050342559814453125, 0.051901817321777344, 0.05346107482910156, 0.05502033233642578, 0.05657958984375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 0.0, 3.0, 11.0, 13.0, 20.0, 24.0, 33.0, 53.0, 62.0, 72.0, 67.0, 85.0, 91.0, 99.0, 89.0, 65.0, 67.0, 38.0, 26.0, 17.0, 20.0, 15.0, 2.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0152587890625, -0.014724016189575195, -0.01418924331665039, -0.013654470443725586, -0.013119697570800781, -0.012584924697875977, -0.012050151824951172, -0.011515378952026367, -0.010980606079101562, -0.010445833206176758, -0.009911060333251953, -0.009376287460327148, -0.008841514587402344, -0.008306741714477539, -0.007771968841552734, -0.00723719596862793, -0.006702423095703125, -0.00616765022277832, -0.005632877349853516, -0.005098104476928711, -0.004563331604003906, -0.0040285587310791016, -0.003493785858154297, -0.002959012985229492, -0.0024242401123046875, -0.0018894672393798828, -0.0013546943664550781, -0.0008199214935302734, -0.00028514862060546875, 0.00024962425231933594, 0.0007843971252441406, 0.0013191699981689453, 0.00185394287109375, 0.0023887157440185547, 0.0029234886169433594, 0.003458261489868164, 0.003993034362792969, 0.0045278072357177734, 0.005062580108642578, 0.005597352981567383, 0.0061321258544921875, 0.006666898727416992, 0.007201671600341797, 0.0077364444732666016, 0.008271217346191406, 0.008805990219116211, 0.009340763092041016, 0.00987553596496582, 0.010410308837890625, 0.01094508171081543, 0.011479854583740234, 0.012014627456665039, 0.012549400329589844, 0.013084173202514648, 0.013618946075439453, 0.014153718948364258, 0.014688491821289062, 0.015223264694213867, 0.015758037567138672, 0.016292810440063477, 0.01682758331298828, 0.017362356185913086, 0.01789712905883789, 0.018431901931762695, 0.0189666748046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 13.0, 21.0, 20.0, 40.0, 37.0, 87.0, 105.0, 141.0, 248.0, 431.0, 855.0, 1834.0, 4517.0, 12538.0, 38032.0, 152969.0, 632465.0, 146951.0, 36880.0, 12032.0, 4504.0, 1810.0, 855.0, 409.0, 251.0, 166.0, 90.0, 66.0, 42.0, 30.0, 23.0, 18.0, 16.0, 8.0, 10.0, 6.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0213623046875, -0.02070474624633789, -0.02004718780517578, -0.019389629364013672, -0.018732070922851562, -0.018074512481689453, -0.017416954040527344, -0.016759395599365234, -0.016101837158203125, -0.015444278717041016, -0.014786720275878906, -0.014129161834716797, -0.013471603393554688, -0.012814044952392578, -0.012156486511230469, -0.01149892807006836, -0.01084136962890625, -0.01018381118774414, -0.009526252746582031, -0.008868694305419922, -0.008211135864257812, -0.007553577423095703, -0.006896018981933594, -0.006238460540771484, -0.005580902099609375, -0.004923343658447266, -0.004265785217285156, -0.003608226776123047, -0.0029506683349609375, -0.002293109893798828, -0.0016355514526367188, -0.0009779930114746094, -0.0003204345703125, 0.0003371238708496094, 0.0009946823120117188, 0.0016522407531738281, 0.0023097991943359375, 0.002967357635498047, 0.0036249160766601562, 0.004282474517822266, 0.004940032958984375, 0.005597591400146484, 0.006255149841308594, 0.006912708282470703, 0.0075702667236328125, 0.008227825164794922, 0.008885383605957031, 0.00954294204711914, 0.01020050048828125, 0.01085805892944336, 0.011515617370605469, 0.012173175811767578, 0.012830734252929688, 0.013488292694091797, 0.014145851135253906, 0.014803409576416016, 0.015460968017578125, 0.016118526458740234, 0.016776084899902344, 0.017433643341064453, 0.018091201782226562, 0.018748760223388672, 0.01940631866455078, 0.02006387710571289, 0.020721435546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 4.0, 6.0, 7.0, 8.0, 7.0, 17.0, 7.0, 16.0, 20.0, 15.0, 16.0, 22.0, 25.0, 24.0, 38.0, 31.0, 42.0, 43.0, 39.0, 39.0, 38.0, 52.0, 35.0, 49.0, 36.0, 35.0, 34.0, 38.0, 37.0, 23.0, 34.0, 20.0, 29.0, 18.0, 14.0, 23.0, 7.0, 7.0, 10.0, 9.0, 6.0, 8.0, 1.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0278778076171875, -0.026966571807861328, -0.026055335998535156, -0.025144100189208984, -0.024232864379882812, -0.02332162857055664, -0.02241039276123047, -0.021499156951904297, -0.020587921142578125, -0.019676685333251953, -0.01876544952392578, -0.01785421371459961, -0.016942977905273438, -0.016031742095947266, -0.015120506286621094, -0.014209270477294922, -0.01329803466796875, -0.012386798858642578, -0.011475563049316406, -0.010564327239990234, -0.009653091430664062, -0.00874185562133789, -0.007830619812011719, -0.006919384002685547, -0.006008148193359375, -0.005096912384033203, -0.004185676574707031, -0.0032744407653808594, -0.0023632049560546875, -0.0014519691467285156, -0.0005407333374023438, 0.0003705024719238281, 0.00128173828125, 0.002192974090576172, 0.0031042098999023438, 0.004015445709228516, 0.0049266815185546875, 0.005837917327880859, 0.006749153137207031, 0.007660388946533203, 0.008571624755859375, 0.009482860565185547, 0.010394096374511719, 0.01130533218383789, 0.012216567993164062, 0.013127803802490234, 0.014039039611816406, 0.014950275421142578, 0.01586151123046875, 0.016772747039794922, 0.017683982849121094, 0.018595218658447266, 0.019506454467773438, 0.02041769027709961, 0.02132892608642578, 0.022240161895751953, 0.023151397705078125, 0.024062633514404297, 0.02497386932373047, 0.02588510513305664, 0.026796340942382812, 0.027707576751708984, 0.028618812561035156, 0.029530048370361328, 0.0304412841796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 8.0, 20.0, 25.0, 49.0, 91.0, 210.0, 546.0, 2527.0, 987552.0, 54659.0, 2014.0, 479.0, 177.0, 80.0, 44.0, 25.0, 11.0, 13.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140869140625, -0.13659286499023438, -0.13231658935546875, -0.12804031372070312, -0.1237640380859375, -0.11948776245117188, -0.11521148681640625, -0.11093521118164062, -0.106658935546875, -0.10238265991210938, -0.09810638427734375, -0.09383010864257812, -0.0895538330078125, -0.08527755737304688, -0.08100128173828125, -0.07672500610351562, -0.07244873046875, -0.06817245483398438, -0.06389617919921875, -0.059619903564453125, -0.0553436279296875, -0.051067352294921875, -0.04679107666015625, -0.042514801025390625, -0.038238525390625, -0.033962249755859375, -0.02968597412109375, -0.025409698486328125, -0.0211334228515625, -0.016857147216796875, -0.01258087158203125, -0.008304595947265625, -0.0040283203125, 0.000247955322265625, 0.00452423095703125, 0.008800506591796875, 0.0130767822265625, 0.017353057861328125, 0.02162933349609375, 0.025905609130859375, 0.030181884765625, 0.034458160400390625, 0.03873443603515625, 0.043010711669921875, 0.0472869873046875, 0.051563262939453125, 0.05583953857421875, 0.060115814208984375, 0.06439208984375, 0.06866836547851562, 0.07294464111328125, 0.07722091674804688, 0.0814971923828125, 0.08577346801757812, 0.09004974365234375, 0.09432601928710938, 0.098602294921875, 0.10287857055664062, 0.10715484619140625, 0.11143112182617188, 0.1157073974609375, 0.11998367309570312, 0.12425994873046875, 0.12853622436523438, 0.1328125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 11.0, 6.0, 9.0, 13.0, 10.0, 12.0, 13.0, 19.0, 21.0, 37.0, 33.0, 72.0, 85.0, 107.0, 77.0, 99.0, 70.0, 58.0, 61.0, 26.0, 25.0, 26.0, 21.0, 11.0, 16.0, 2.0, 9.0, 9.0, 4.0, 4.0, 2.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.933906555175781e-05, -3.795977681875229e-05, -3.6580488085746765e-05, -3.520119935274124e-05, -3.382191061973572e-05, -3.2442621886730194e-05, -3.106333315372467e-05, -2.9684044420719147e-05, -2.8304755687713623e-05, -2.69254669547081e-05, -2.5546178221702576e-05, -2.4166889488697052e-05, -2.278760075569153e-05, -2.1408312022686005e-05, -2.002902328968048e-05, -1.8649734556674957e-05, -1.7270445823669434e-05, -1.589115709066391e-05, -1.4511868357658386e-05, -1.3132579624652863e-05, -1.1753290891647339e-05, -1.0374002158641815e-05, -8.994713425636292e-06, -7.615424692630768e-06, -6.236135959625244e-06, -4.8568472266197205e-06, -3.4775584936141968e-06, -2.098269760608673e-06, -7.189810276031494e-07, 6.603077054023743e-07, 2.039596438407898e-06, 3.4188851714134216e-06, 4.798173904418945e-06, 6.177462637424469e-06, 7.556751370429993e-06, 8.936040103435516e-06, 1.031532883644104e-05, 1.1694617569446564e-05, 1.3073906302452087e-05, 1.4453195035457611e-05, 1.5832483768463135e-05, 1.721177250146866e-05, 1.8591061234474182e-05, 1.9970349967479706e-05, 2.134963870048523e-05, 2.2728927433490753e-05, 2.4108216166496277e-05, 2.54875048995018e-05, 2.6866793632507324e-05, 2.8246082365512848e-05, 2.962537109851837e-05, 3.1004659831523895e-05, 3.238394856452942e-05, 3.376323729753494e-05, 3.5142526030540466e-05, 3.652181476354599e-05, 3.7901103496551514e-05, 3.928039222955704e-05, 4.065968096256256e-05, 4.2038969695568085e-05, 4.341825842857361e-05, 4.479754716157913e-05, 4.6176835894584656e-05, 4.755612462759018e-05, 4.89354133605957e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 13.0, 14.0, 18.0, 31.0, 64.0, 171.0, 596.0, 3587.0, 1026843.0, 15478.0, 1267.0, 266.0, 88.0, 54.0, 27.0, 11.0, 12.0, 7.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12078857421875, -0.11750125885009766, -0.11421394348144531, -0.11092662811279297, -0.10763931274414062, -0.10435199737548828, -0.10106468200683594, -0.0977773666381836, -0.09449005126953125, -0.0912027359008789, -0.08791542053222656, -0.08462810516357422, -0.08134078979492188, -0.07805347442626953, -0.07476615905761719, -0.07147884368896484, -0.0681915283203125, -0.06490421295166016, -0.06161689758300781, -0.05832958221435547, -0.055042266845703125, -0.05175495147705078, -0.04846763610839844, -0.045180320739746094, -0.04189300537109375, -0.038605690002441406, -0.03531837463378906, -0.03203105926513672, -0.028743743896484375, -0.02545642852783203, -0.022169113159179688, -0.018881797790527344, -0.015594482421875, -0.012307167053222656, -0.009019851684570312, -0.005732536315917969, -0.002445220947265625, 0.0008420944213867188, 0.0041294097900390625, 0.007416725158691406, 0.01070404052734375, 0.013991355895996094, 0.017278671264648438, 0.02056598663330078, 0.023853302001953125, 0.02714061737060547, 0.030427932739257812, 0.033715248107910156, 0.0370025634765625, 0.040289878845214844, 0.04357719421386719, 0.04686450958251953, 0.050151824951171875, 0.05343914031982422, 0.05672645568847656, 0.060013771057128906, 0.06330108642578125, 0.0665884017944336, 0.06987571716308594, 0.07316303253173828, 0.07645034790039062, 0.07973766326904297, 0.08302497863769531, 0.08631229400634766, 0.089599609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 7.0, 30.0, 120.0, 579.0, 190.0, 25.0, 10.0, 7.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033477783203125, -0.03192472457885742, -0.030371665954589844, -0.028818607330322266, -0.027265548706054688, -0.02571249008178711, -0.02415943145751953, -0.022606372833251953, -0.021053314208984375, -0.019500255584716797, -0.01794719696044922, -0.01639413833618164, -0.014841079711914062, -0.013288021087646484, -0.011734962463378906, -0.010181903839111328, -0.00862884521484375, -0.007075786590576172, -0.005522727966308594, -0.003969669342041016, -0.0024166107177734375, -0.0008635520935058594, 0.0006895065307617188, 0.002242565155029297, 0.003795623779296875, 0.005348682403564453, 0.006901741027832031, 0.00845479965209961, 0.010007858276367188, 0.011560916900634766, 0.013113975524902344, 0.014667034149169922, 0.0162200927734375, 0.017773151397705078, 0.019326210021972656, 0.020879268646240234, 0.022432327270507812, 0.02398538589477539, 0.02553844451904297, 0.027091503143310547, 0.028644561767578125, 0.030197620391845703, 0.03175067901611328, 0.03330373764038086, 0.03485679626464844, 0.036409854888916016, 0.037962913513183594, 0.03951597213745117, 0.04106903076171875, 0.04262208938598633, 0.044175148010253906, 0.045728206634521484, 0.04728126525878906, 0.04883432388305664, 0.05038738250732422, 0.0519404411315918, 0.053493499755859375, 0.05504655838012695, 0.05659961700439453, 0.05815267562866211, 0.05970573425292969, 0.061258792877197266, 0.06281185150146484, 0.06436491012573242, 0.06591796875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 11.0, 48.0, 161.0, 557.0, 174.0, 38.0, 11.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1114814281463623, -1.0865565538406372, -1.0616317987442017, -1.0367069244384766, -1.0117820501327515, -0.9868572354316711, -0.9619324207305908, -0.9370075464248657, -0.9120827317237854, -0.8871579170227051, -0.86223304271698, -0.8373082280158997, -0.8123834133148193, -0.7874585390090942, -0.7625337243080139, -0.7376089096069336, -0.7126840353012085, -0.6877592206001282, -0.6628343462944031, -0.6379095315933228, -0.6129847168922424, -0.5880598425865173, -0.563135027885437, -0.5382101535797119, -0.5132853984832764, -0.48836055397987366, -0.46343573927879333, -0.4385108947753906, -0.4135860502719879, -0.3886612057685852, -0.3637363910675049, -0.3388115465641022, -0.31388670206069946, -0.28896185755729675, -0.26403704285621643, -0.23911219835281372, -0.214187353849411, -0.1892625242471695, -0.16433769464492798, -0.13941285014152527, -0.11448802053928375, -0.08956318348646164, -0.06463834643363953, -0.03971351683139801, -0.014788679778575897, 0.010136157274246216, 0.03506098687648773, 0.05998583137989044, 0.08491066098213196, 0.10983549803495407, 0.13476033508777618, 0.1596851646900177, 0.1846100091934204, 0.20953483879566193, 0.23445966839790344, 0.25938451290130615, 0.2843093276023865, 0.3092341721057892, 0.3341589868068695, 0.3590838313102722, 0.3840086758136749, 0.40893352031707764, 0.43385833501815796, 0.45878317952156067, 0.4837080240249634]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 8.0, 6.0, 8.0, 5.0, 8.0, 12.0, 19.0, 19.0, 23.0, 36.0, 34.0, 29.0, 38.0, 50.0, 38.0, 52.0, 56.0, 43.0, 65.0, 63.0, 62.0, 40.0, 35.0, 31.0, 35.0, 28.0, 25.0, 22.0, 13.0, 16.0, 14.0, 13.0, 13.0, 10.0, 7.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1524093747138977, -0.14752794802188873, -0.14264653623104095, -0.13776510953903198, -0.1328836977481842, -0.12800227105617523, -0.12312085181474686, -0.11823943257331848, -0.1133580133318901, -0.10847659409046173, -0.10359517484903336, -0.09871375560760498, -0.09383232891559601, -0.08895091712474823, -0.08406949043273926, -0.07918807119131088, -0.07430665194988251, -0.06942523270845413, -0.06454381346702576, -0.05966239050030708, -0.05478097125887871, -0.04989955201745033, -0.04501812905073166, -0.040136709809303284, -0.03525529056787491, -0.030373871326446533, -0.02549245022237301, -0.020611029118299484, -0.01572960987687111, -0.010848190635442734, -0.005966769531369209, -0.0010853484272956848, 0.0037960708141326904, 0.00867749098688364, 0.01355891115963459, 0.018440332263708115, 0.02332175150513649, 0.028203170746564865, 0.03308459371328354, 0.037966012954711914, 0.04284743219614029, 0.047728851437568665, 0.05261027067899704, 0.057491693645715714, 0.06237311288714409, 0.06725452840328217, 0.07213595509529114, 0.07701737433671951, 0.08189879357814789, 0.08678021281957626, 0.09166163206100464, 0.09654305130243301, 0.10142447054386139, 0.10630589723587036, 0.11118731647729874, 0.11606873571872711, 0.12095015496015549, 0.12583157420158386, 0.13071300089359283, 0.1355944126844406, 0.14047583937644958, 0.14535725116729736, 0.15023867785930634, 0.1551201045513153, 0.16000151634216309]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 9.0, 7.0, 9.0, 18.0, 21.0, 21.0, 29.0, 29.0, 55.0, 107.0, 170.0, 367.0, 1018.0, 8573.0, 4155253.0, 25872.0, 1664.0, 497.0, 210.0, 108.0, 67.0, 47.0, 27.0, 25.0, 18.0, 16.0, 9.0, 12.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052581787109375, -0.05044698715209961, -0.04831218719482422, -0.04617738723754883, -0.04404258728027344, -0.04190778732299805, -0.039772987365722656, -0.037638187408447266, -0.035503387451171875, -0.033368587493896484, -0.031233787536621094, -0.029098987579345703, -0.026964187622070312, -0.024829387664794922, -0.02269458770751953, -0.02055978775024414, -0.01842498779296875, -0.01629018783569336, -0.014155387878417969, -0.012020587921142578, -0.009885787963867188, -0.007750988006591797, -0.005616188049316406, -0.0034813880920410156, -0.001346588134765625, 0.0007882118225097656, 0.0029230117797851562, 0.005057811737060547, 0.0071926116943359375, 0.009327411651611328, 0.011462211608886719, 0.01359701156616211, 0.0157318115234375, 0.01786661148071289, 0.02000141143798828, 0.022136211395263672, 0.024271011352539062, 0.026405811309814453, 0.028540611267089844, 0.030675411224365234, 0.032810211181640625, 0.034945011138916016, 0.037079811096191406, 0.0392146110534668, 0.04134941101074219, 0.04348421096801758, 0.04561901092529297, 0.04775381088256836, 0.04988861083984375, 0.05202341079711914, 0.05415821075439453, 0.05629301071166992, 0.05842781066894531, 0.0605626106262207, 0.0626974105834961, 0.06483221054077148, 0.06696701049804688, 0.06910181045532227, 0.07123661041259766, 0.07337141036987305, 0.07550621032714844, 0.07764101028442383, 0.07977581024169922, 0.08191061019897461, 0.08404541015625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 13.0, 8.0, 9.0, 22.0, 25.0, 30.0, 58.0, 55.0, 81.0, 70.0, 80.0, 109.0, 83.0, 79.0, 71.0, 64.0, 34.0, 24.0, 27.0, 22.0, 8.0, 5.0, 7.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01534271240234375, -0.01482236385345459, -0.01430201530456543, -0.01378166675567627, -0.01326131820678711, -0.01274096965789795, -0.012220621109008789, -0.011700272560119629, -0.011179924011230469, -0.010659575462341309, -0.010139226913452148, -0.009618878364562988, -0.009098529815673828, -0.008578181266784668, -0.008057832717895508, -0.007537484169006348, -0.0070171356201171875, -0.006496787071228027, -0.005976438522338867, -0.005456089973449707, -0.004935741424560547, -0.004415392875671387, -0.0038950443267822266, -0.0033746957778930664, -0.0028543472290039062, -0.002333998680114746, -0.001813650131225586, -0.0012933015823364258, -0.0007729530334472656, -0.00025260448455810547, 0.0002677440643310547, 0.0007880926132202148, 0.001308441162109375, 0.0018287897109985352, 0.0023491382598876953, 0.0028694868087768555, 0.0033898353576660156, 0.003910183906555176, 0.004430532455444336, 0.004950881004333496, 0.005471229553222656, 0.005991578102111816, 0.0065119266510009766, 0.007032275199890137, 0.007552623748779297, 0.008072972297668457, 0.008593320846557617, 0.009113669395446777, 0.009634017944335938, 0.010154366493225098, 0.010674715042114258, 0.011195063591003418, 0.011715412139892578, 0.012235760688781738, 0.012756109237670898, 0.013276457786560059, 0.013796806335449219, 0.014317154884338379, 0.014837503433227539, 0.0153578519821167, 0.01587820053100586, 0.01639854907989502, 0.01691889762878418, 0.01743924617767334, 0.0179595947265625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 16.0, 12.0, 19.0, 40.0, 74.0, 138.0, 390.0, 3710.0, 4137344.0, 50724.0, 1046.0, 285.0, 160.0, 109.0, 64.0, 56.0, 32.0, 21.0, 16.0, 10.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12017822265625, -0.117156982421875, -0.1141357421875, -0.111114501953125, -0.10809326171875, -0.105072021484375, -0.10205078125, -0.099029541015625, -0.09600830078125, -0.092987060546875, -0.0899658203125, -0.086944580078125, -0.08392333984375, -0.080902099609375, -0.077880859375, -0.074859619140625, -0.07183837890625, -0.068817138671875, -0.0657958984375, -0.062774658203125, -0.05975341796875, -0.056732177734375, -0.0537109375, -0.050689697265625, -0.04766845703125, -0.044647216796875, -0.0416259765625, -0.038604736328125, -0.03558349609375, -0.032562255859375, -0.029541015625, -0.026519775390625, -0.02349853515625, -0.020477294921875, -0.0174560546875, -0.014434814453125, -0.01141357421875, -0.008392333984375, -0.00537109375, -0.002349853515625, 0.00067138671875, 0.003692626953125, 0.0067138671875, 0.009735107421875, 0.01275634765625, 0.015777587890625, 0.018798828125, 0.021820068359375, 0.02484130859375, 0.027862548828125, 0.0308837890625, 0.033905029296875, 0.03692626953125, 0.039947509765625, 0.04296875, 0.045989990234375, 0.04901123046875, 0.052032470703125, 0.0550537109375, 0.058074951171875, 0.06109619140625, 0.064117431640625, 0.067138671875, 0.070159912109375, 0.07318115234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 8.0, 15.0, 22.0, 52.0, 181.0, 2529.0, 1073.0, 125.0, 44.0, 16.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290679931640625, -0.02711176872253418, -0.02515554428100586, -0.02319931983947754, -0.02124309539794922, -0.0192868709564209, -0.017330646514892578, -0.015374422073364258, -0.013418197631835938, -0.011461973190307617, -0.009505748748779297, -0.0075495243072509766, -0.005593299865722656, -0.003637075424194336, -0.0016808509826660156, 0.0002753734588623047, 0.002231597900390625, 0.004187822341918945, 0.006144046783447266, 0.008100271224975586, 0.010056495666503906, 0.012012720108032227, 0.013968944549560547, 0.015925168991088867, 0.017881393432617188, 0.019837617874145508, 0.021793842315673828, 0.02375006675720215, 0.02570629119873047, 0.02766251564025879, 0.02961874008178711, 0.03157496452331543, 0.03353118896484375, 0.03548741340637207, 0.03744363784790039, 0.03939986228942871, 0.04135608673095703, 0.04331231117248535, 0.04526853561401367, 0.04722476005554199, 0.04918098449707031, 0.05113720893859863, 0.05309343338012695, 0.05504965782165527, 0.057005882263183594, 0.058962106704711914, 0.060918331146240234, 0.06287455558776855, 0.06483078002929688, 0.0667870044708252, 0.06874322891235352, 0.07069945335388184, 0.07265567779541016, 0.07461190223693848, 0.0765681266784668, 0.07852435111999512, 0.08048057556152344, 0.08243680000305176, 0.08439302444458008, 0.0863492488861084, 0.08830547332763672, 0.09026169776916504, 0.09221792221069336, 0.09417414665222168, 0.09613037109375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 11.0, 14.0, 16.0, 21.0, 38.0, 79.0, 155.0, 199.0, 168.0, 79.0, 57.0, 42.0, 31.0, 20.0, 11.0, 19.0, 10.0, 8.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28262707591056824, -0.2751024663448334, -0.2675778269767761, -0.26005321741104126, -0.2525286078453064, -0.24500398337841034, -0.23747935891151428, -0.22995474934577942, -0.22243012487888336, -0.2149055004119873, -0.20738089084625244, -0.19985626637935638, -0.19233165681362152, -0.18480703234672546, -0.1772824227809906, -0.16975779831409454, -0.1622331738471985, -0.15470854938030243, -0.14718393981456757, -0.1396593153476715, -0.13213470578193665, -0.12461008131504059, -0.11708546429872513, -0.10956084728240967, -0.1020362377166748, -0.09451162070035934, -0.08698700368404388, -0.07946237921714783, -0.07193776220083237, -0.0644131451845169, -0.05688852816820145, -0.04936390742659569, -0.04183928668498993, -0.03431466966867447, -0.02679004892706871, -0.01926543191075325, -0.01174081303179264, -0.004216194152832031, 0.003308422863483429, 0.010833043605089188, 0.018357660621404648, 0.025882279500365257, 0.03340689837932587, 0.04093151539564133, 0.04845613241195679, 0.055980753153562546, 0.06350536644458771, 0.07102999091148376, 0.07855460792779922, 0.08607922494411469, 0.09360384196043015, 0.1011284589767456, 0.10865308344364166, 0.11617770045995712, 0.12370231747627258, 0.13122694194316864, 0.1387515515089035, 0.14627617597579956, 0.15380078554153442, 0.16132541000843048, 0.16885001957416534, 0.1763746440410614, 0.18389925360679626, 0.19142387807369232, 0.19894850254058838]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 12.0, 8.0, 5.0, 8.0, 7.0, 7.0, 16.0, 19.0, 11.0, 33.0, 25.0, 25.0, 30.0, 30.0, 27.0, 28.0, 36.0, 46.0, 50.0, 48.0, 49.0, 45.0, 38.0, 56.0, 56.0, 42.0, 32.0, 29.0, 30.0, 19.0, 28.0, 11.0, 17.0, 11.0, 12.0, 9.0, 10.0, 9.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.14713478088378906, -0.14239844679832458, -0.1376621127128601, -0.13292576372623444, -0.12818942964076996, -0.12345309555530548, -0.1187167540192604, -0.11398041248321533, -0.10924407839775085, -0.10450774431228638, -0.0997714027762413, -0.09503506124019623, -0.09029872715473175, -0.08556239306926727, -0.0808260515332222, -0.07608970999717712, -0.07135337591171265, -0.06661704182624817, -0.061880700290203094, -0.05714436247944832, -0.05240802466869354, -0.047671686857938766, -0.04293534904718399, -0.038199011236429214, -0.03346267342567444, -0.028726335614919662, -0.023989997804164886, -0.01925365999341011, -0.014517322182655334, -0.009780984371900558, -0.0050446465611457825, -0.00030830875039100647, 0.0044280290603637695, 0.009164366871118546, 0.013900704681873322, 0.018637042492628098, 0.023373380303382874, 0.02810971811413765, 0.032846055924892426, 0.0375823937356472, 0.04231873154640198, 0.047055069357156754, 0.05179140716791153, 0.056527744978666306, 0.06126408278942108, 0.06600041687488556, 0.07073675841093063, 0.07547309994697571, 0.08020943403244019, 0.08494576811790466, 0.08968210965394974, 0.09441845118999481, 0.09915478527545929, 0.10389111936092377, 0.10862746089696884, 0.11336380243301392, 0.1181001365184784, 0.12283647060394287, 0.12757280468940735, 0.13230915367603302, 0.1370454877614975, 0.14178182184696198, 0.14651817083358765, 0.15125450491905212, 0.1559908390045166]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 11.0, 5.0, 15.0, 33.0, 43.0, 82.0, 115.0, 144.0, 242.0, 364.0, 732.0, 1230.0, 2434.0, 4948.0, 10648.0, 26336.0, 71049.0, 236234.0, 462555.0, 147715.0, 49019.0, 18586.0, 7923.0, 3710.0, 1843.0, 1052.0, 565.0, 308.0, 223.0, 122.0, 93.0, 50.0, 37.0, 27.0, 11.0, 18.0, 12.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01611328125, -0.015523433685302734, -0.014933586120605469, -0.014343738555908203, -0.013753890991210938, -0.013164043426513672, -0.012574195861816406, -0.01198434829711914, -0.011394500732421875, -0.01080465316772461, -0.010214805603027344, -0.009624958038330078, -0.009035110473632812, -0.008445262908935547, -0.007855415344238281, -0.007265567779541016, -0.00667572021484375, -0.006085872650146484, -0.005496025085449219, -0.004906177520751953, -0.0043163299560546875, -0.003726482391357422, -0.0031366348266601562, -0.0025467872619628906, -0.001956939697265625, -0.0013670921325683594, -0.0007772445678710938, -0.00018739700317382812, 0.0004024505615234375, 0.0009922981262207031, 0.0015821456909179688, 0.0021719932556152344, 0.0027618408203125, 0.0033516883850097656, 0.003941535949707031, 0.004531383514404297, 0.0051212310791015625, 0.005711078643798828, 0.006300926208496094, 0.006890773773193359, 0.007480621337890625, 0.00807046890258789, 0.008660316467285156, 0.009250164031982422, 0.009840011596679688, 0.010429859161376953, 0.011019706726074219, 0.011609554290771484, 0.01219940185546875, 0.012789249420166016, 0.013379096984863281, 0.013968944549560547, 0.014558792114257812, 0.015148639678955078, 0.015738487243652344, 0.01632833480834961, 0.016918182373046875, 0.01750802993774414, 0.018097877502441406, 0.018687725067138672, 0.019277572631835938, 0.019867420196533203, 0.02045726776123047, 0.021047115325927734, 0.021636962890625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 13.0, 10.0, 20.0, 28.0, 42.0, 45.0, 70.0, 65.0, 73.0, 85.0, 61.0, 93.0, 75.0, 64.0, 59.0, 48.0, 37.0, 29.0, 25.0, 6.0, 12.0, 10.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01473236083984375, -0.014180302619934082, -0.013628244400024414, -0.013076186180114746, -0.012524127960205078, -0.01197206974029541, -0.011420011520385742, -0.010867953300476074, -0.010315895080566406, -0.009763836860656738, -0.00921177864074707, -0.008659720420837402, -0.008107662200927734, -0.007555603981018066, -0.0070035457611083984, -0.0064514875411987305, -0.0058994293212890625, -0.0053473711013793945, -0.0047953128814697266, -0.004243254661560059, -0.0036911964416503906, -0.0031391382217407227, -0.0025870800018310547, -0.0020350217819213867, -0.0014829635620117188, -0.0009309053421020508, -0.0003788471221923828, 0.00017321109771728516, 0.0007252693176269531, 0.001277327537536621, 0.001829385757446289, 0.002381443977355957, 0.002933502197265625, 0.003485560417175293, 0.004037618637084961, 0.004589676856994629, 0.005141735076904297, 0.005693793296813965, 0.006245851516723633, 0.006797909736633301, 0.007349967956542969, 0.007902026176452637, 0.008454084396362305, 0.009006142616271973, 0.00955820083618164, 0.010110259056091309, 0.010662317276000977, 0.011214375495910645, 0.011766433715820312, 0.01231849193572998, 0.012870550155639648, 0.013422608375549316, 0.013974666595458984, 0.014526724815368652, 0.01507878303527832, 0.01563084125518799, 0.016182899475097656, 0.016734957695007324, 0.017287015914916992, 0.01783907413482666, 0.018391132354736328, 0.018943190574645996, 0.019495248794555664, 0.020047307014465332, 0.020599365234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 16.0, 6.0, 26.0, 28.0, 54.0, 78.0, 169.0, 336.0, 816.0, 2798.0, 14832.0, 375730.0, 631742.0, 17153.0, 3074.0, 897.0, 396.0, 168.0, 93.0, 49.0, 32.0, 19.0, 11.0, 7.0, 4.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07696533203125, -0.07463550567626953, -0.07230567932128906, -0.0699758529663086, -0.06764602661132812, -0.06531620025634766, -0.06298637390136719, -0.06065654754638672, -0.05832672119140625, -0.05599689483642578, -0.05366706848144531, -0.051337242126464844, -0.049007415771484375, -0.046677589416503906, -0.04434776306152344, -0.04201793670654297, -0.0396881103515625, -0.03735828399658203, -0.03502845764160156, -0.032698631286621094, -0.030368804931640625, -0.028038978576660156, -0.025709152221679688, -0.02337932586669922, -0.02104949951171875, -0.01871967315673828, -0.016389846801757812, -0.014060020446777344, -0.011730194091796875, -0.009400367736816406, -0.0070705413818359375, -0.004740715026855469, -0.002410888671875, -8.106231689453125e-05, 0.0022487640380859375, 0.004578590393066406, 0.006908416748046875, 0.009238243103027344, 0.011568069458007812, 0.013897895812988281, 0.01622772216796875, 0.01855754852294922, 0.020887374877929688, 0.023217201232910156, 0.025547027587890625, 0.027876853942871094, 0.030206680297851562, 0.03253650665283203, 0.0348663330078125, 0.03719615936279297, 0.03952598571777344, 0.041855812072753906, 0.044185638427734375, 0.046515464782714844, 0.04884529113769531, 0.05117511749267578, 0.05350494384765625, 0.05583477020263672, 0.05816459655761719, 0.060494422912597656, 0.06282424926757812, 0.0651540756225586, 0.06748390197753906, 0.06981372833251953, 0.0721435546875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 9.0, 4.0, 11.0, 7.0, 11.0, 16.0, 32.0, 31.0, 43.0, 47.0, 55.0, 69.0, 65.0, 72.0, 93.0, 64.0, 63.0, 42.0, 62.0, 50.0, 38.0, 24.0, 18.0, 14.0, 9.0, 15.0, 9.0, 8.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.071533203125, -0.069305419921875, -0.06707763671875, -0.064849853515625, -0.0626220703125, -0.060394287109375, -0.05816650390625, -0.055938720703125, -0.0537109375, -0.051483154296875, -0.04925537109375, -0.047027587890625, -0.0447998046875, -0.042572021484375, -0.04034423828125, -0.038116455078125, -0.035888671875, -0.033660888671875, -0.03143310546875, -0.029205322265625, -0.0269775390625, -0.024749755859375, -0.02252197265625, -0.020294189453125, -0.01806640625, -0.015838623046875, -0.01361083984375, -0.011383056640625, -0.0091552734375, -0.006927490234375, -0.00469970703125, -0.002471923828125, -0.000244140625, 0.001983642578125, 0.00421142578125, 0.006439208984375, 0.0086669921875, 0.010894775390625, 0.01312255859375, 0.015350341796875, 0.017578125, 0.019805908203125, 0.02203369140625, 0.024261474609375, 0.0264892578125, 0.028717041015625, 0.03094482421875, 0.033172607421875, 0.035400390625, 0.037628173828125, 0.03985595703125, 0.042083740234375, 0.0443115234375, 0.046539306640625, 0.04876708984375, 0.050994873046875, 0.05322265625, 0.055450439453125, 0.05767822265625, 0.059906005859375, 0.0621337890625, 0.064361572265625, 0.06658935546875, 0.068817138671875, 0.071044921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 8.0, 11.0, 8.0, 19.0, 29.0, 49.0, 40.0, 74.0, 111.0, 177.0, 280.0, 470.0, 801.0, 1539.0, 3057.0, 7669.0, 25775.0, 929813.0, 57059.0, 12454.0, 4502.0, 2000.0, 1007.0, 594.0, 358.0, 207.0, 146.0, 80.0, 50.0, 42.0, 35.0, 17.0, 15.0, 11.0, 9.0, 6.0, 5.0, 5.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038177490234375, -0.03689289093017578, -0.03560829162597656, -0.034323692321777344, -0.033039093017578125, -0.031754493713378906, -0.030469894409179688, -0.02918529510498047, -0.02790069580078125, -0.02661609649658203, -0.025331497192382812, -0.024046897888183594, -0.022762298583984375, -0.021477699279785156, -0.020193099975585938, -0.01890850067138672, -0.0176239013671875, -0.01633930206298828, -0.015054702758789062, -0.013770103454589844, -0.012485504150390625, -0.011200904846191406, -0.009916305541992188, -0.008631706237792969, -0.00734710693359375, -0.006062507629394531, -0.0047779083251953125, -0.0034933090209960938, -0.002208709716796875, -0.0009241104125976562, 0.0003604888916015625, 0.0016450881958007812, 0.0029296875, 0.004214286804199219, 0.0054988861083984375, 0.006783485412597656, 0.008068084716796875, 0.009352684020996094, 0.010637283325195312, 0.011921882629394531, 0.01320648193359375, 0.014491081237792969, 0.015775680541992188, 0.017060279846191406, 0.018344879150390625, 0.019629478454589844, 0.020914077758789062, 0.02219867706298828, 0.0234832763671875, 0.02476787567138672, 0.026052474975585938, 0.027337074279785156, 0.028621673583984375, 0.029906272888183594, 0.031190872192382812, 0.03247547149658203, 0.03376007080078125, 0.03504467010498047, 0.03632926940917969, 0.037613868713378906, 0.038898468017578125, 0.040183067321777344, 0.04146766662597656, 0.04275226593017578, 0.044036865234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 5.0, 4.0, 8.0, 7.0, 7.0, 6.0, 8.0, 18.0, 20.0, 30.0, 36.0, 47.0, 92.0, 86.0, 96.0, 121.0, 102.0, 73.0, 57.0, 39.0, 28.0, 21.0, 19.0, 14.0, 7.0, 7.0, 6.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8710575103759766e-05, -5.676690489053726e-05, -5.482323467731476e-05, -5.2879564464092255e-05, -5.093589425086975e-05, -4.899222403764725e-05, -4.7048553824424744e-05, -4.510488361120224e-05, -4.3161213397979736e-05, -4.121754318475723e-05, -3.927387297153473e-05, -3.7330202758312225e-05, -3.538653254508972e-05, -3.344286233186722e-05, -3.1499192118644714e-05, -2.955552190542221e-05, -2.7611851692199707e-05, -2.5668181478977203e-05, -2.37245112657547e-05, -2.1780841052532196e-05, -1.9837170839309692e-05, -1.789350062608719e-05, -1.5949830412864685e-05, -1.4006160199642181e-05, -1.2062489986419678e-05, -1.0118819773197174e-05, -8.17514955997467e-06, -6.231479346752167e-06, -4.287809133529663e-06, -2.3441389203071594e-06, -4.0046870708465576e-07, 1.543201506137848e-06, 3.4868717193603516e-06, 5.430541932582855e-06, 7.374212145805359e-06, 9.317882359027863e-06, 1.1261552572250366e-05, 1.320522278547287e-05, 1.5148892998695374e-05, 1.7092563211917877e-05, 1.903623342514038e-05, 2.0979903638362885e-05, 2.2923573851585388e-05, 2.4867244064807892e-05, 2.6810914278030396e-05, 2.87545844912529e-05, 3.06982547044754e-05, 3.2641924917697906e-05, 3.458559513092041e-05, 3.6529265344142914e-05, 3.847293555736542e-05, 4.041660577058792e-05, 4.2360275983810425e-05, 4.430394619703293e-05, 4.624761641025543e-05, 4.8191286623477936e-05, 5.013495683670044e-05, 5.207862704992294e-05, 5.402229726314545e-05, 5.596596747636795e-05, 5.7909637689590454e-05, 5.985330790281296e-05, 6.179697811603546e-05, 6.374064832925797e-05, 6.568431854248047e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 6.0, 4.0, 5.0, 11.0, 4.0, 12.0, 21.0, 34.0, 57.0, 129.0, 240.0, 736.0, 2265.0, 9146.0, 82464.0, 934213.0, 14435.0, 3141.0, 952.0, 358.0, 148.0, 60.0, 42.0, 22.0, 14.0, 9.0, 5.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07110595703125, -0.06908226013183594, -0.06705856323242188, -0.06503486633300781, -0.06301116943359375, -0.06098747253417969, -0.058963775634765625, -0.05694007873535156, -0.0549163818359375, -0.05289268493652344, -0.050868988037109375, -0.04884529113769531, -0.04682159423828125, -0.04479789733886719, -0.042774200439453125, -0.04075050354003906, -0.038726806640625, -0.03670310974121094, -0.034679412841796875, -0.03265571594238281, -0.03063201904296875, -0.028608322143554688, -0.026584625244140625, -0.024560928344726562, -0.0225372314453125, -0.020513534545898438, -0.018489837646484375, -0.016466140747070312, -0.01444244384765625, -0.012418746948242188, -0.010395050048828125, -0.008371353149414062, -0.00634765625, -0.0043239593505859375, -0.002300262451171875, -0.0002765655517578125, 0.00174713134765625, 0.0037708282470703125, 0.005794525146484375, 0.007818222045898438, 0.0098419189453125, 0.011865615844726562, 0.013889312744140625, 0.015913009643554688, 0.01793670654296875, 0.019960403442382812, 0.021984100341796875, 0.024007797241210938, 0.026031494140625, 0.028055191040039062, 0.030078887939453125, 0.03210258483886719, 0.03412628173828125, 0.03614997863769531, 0.038173675537109375, 0.04019737243652344, 0.0422210693359375, 0.04424476623535156, 0.046268463134765625, 0.04829216003417969, 0.05031585693359375, 0.05233955383300781, 0.054363250732421875, 0.05638694763183594, 0.05841064453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 7.0, 6.0, 9.0, 13.0, 11.0, 13.0, 29.0, 136.0, 453.0, 167.0, 43.0, 15.0, 14.0, 6.0, 6.0, 4.0, 7.0, 7.0, 7.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03997802734375, -0.03862476348876953, -0.03727149963378906, -0.035918235778808594, -0.034564971923828125, -0.033211708068847656, -0.03185844421386719, -0.03050518035888672, -0.02915191650390625, -0.02779865264892578, -0.026445388793945312, -0.025092124938964844, -0.023738861083984375, -0.022385597229003906, -0.021032333374023438, -0.01967906951904297, -0.0183258056640625, -0.01697254180908203, -0.015619277954101562, -0.014266014099121094, -0.012912750244140625, -0.011559486389160156, -0.010206222534179688, -0.008852958679199219, -0.00749969482421875, -0.006146430969238281, -0.0047931671142578125, -0.0034399032592773438, -0.002086639404296875, -0.0007333755493164062, 0.0006198883056640625, 0.0019731521606445312, 0.003326416015625, 0.004679679870605469, 0.0060329437255859375, 0.007386207580566406, 0.008739471435546875, 0.010092735290527344, 0.011445999145507812, 0.012799263000488281, 0.01415252685546875, 0.015505790710449219, 0.016859054565429688, 0.018212318420410156, 0.019565582275390625, 0.020918846130371094, 0.022272109985351562, 0.02362537384033203, 0.0249786376953125, 0.02633190155029297, 0.027685165405273438, 0.029038429260253906, 0.030391693115234375, 0.031744956970214844, 0.03309822082519531, 0.03445148468017578, 0.03580474853515625, 0.03715801239013672, 0.03851127624511719, 0.039864540100097656, 0.041217803955078125, 0.042571067810058594, 0.04392433166503906, 0.04527759552001953, 0.046630859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 9.0, 20.0, 29.0, 42.0, 66.0, 132.0, 246.0, 213.0, 116.0, 59.0, 21.0, 14.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4694001078605652, -0.45262354612350464, -0.4358469545841217, -0.41907039284706116, -0.4022938311100006, -0.3855172395706177, -0.36874067783355713, -0.3519641160964966, -0.33518755435943604, -0.3184109926223755, -0.30163440108299255, -0.284857839345932, -0.26808127760887146, -0.2513046860694885, -0.23452812433242798, -0.21775156259536743, -0.2009749710559845, -0.18419839441776276, -0.1674218326807022, -0.15064525604248047, -0.13386869430541992, -0.11709211766719818, -0.10031554102897644, -0.0835389718413353, -0.06676240265369415, -0.04998583346605301, -0.03320926055312157, -0.016432687640190125, 0.0003438815474510193, 0.017120450735092163, 0.033897027373313904, 0.05067359656095505, 0.06745016574859619, 0.08422673493623734, 0.10100330412387848, 0.11777988076210022, 0.13455644249916077, 0.1513330191373825, 0.16810959577560425, 0.1848861575126648, 0.20166273415088654, 0.21843931078910828, 0.23521587252616882, 0.25199246406555176, 0.2687690258026123, 0.28554558753967285, 0.3023221492767334, 0.31909874081611633, 0.3358753025531769, 0.3526518642902374, 0.36942845582962036, 0.3862050175666809, 0.40298157930374146, 0.419758141040802, 0.43653473258018494, 0.4533112943172455, 0.4700878858566284, 0.48686444759368896, 0.5036410093307495, 0.5204175710678101, 0.5371941924095154, 0.5539707541465759, 0.5707473158836365, 0.587523877620697, 0.6043004393577576]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 1.0, 8.0, 11.0, 16.0, 15.0, 13.0, 21.0, 19.0, 19.0, 23.0, 23.0, 25.0, 37.0, 32.0, 44.0, 41.0, 56.0, 63.0, 70.0, 56.0, 44.0, 34.0, 41.0, 36.0, 32.0, 26.0, 21.0, 22.0, 20.0, 18.0, 15.0, 13.0, 11.0, 14.0, 11.0, 2.0, 11.0, 10.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2635602355003357, -0.25540804862976074, -0.2472558319568634, -0.23910364508628845, -0.2309514433145523, -0.22279924154281616, -0.2146470546722412, -0.20649485290050507, -0.19834265112876892, -0.19019044935703278, -0.18203824758529663, -0.17388606071472168, -0.16573385894298553, -0.1575816571712494, -0.14942947030067444, -0.1412772685289383, -0.13312506675720215, -0.124972864985466, -0.11682067066431046, -0.10866847634315491, -0.10051627457141876, -0.09236407279968262, -0.08421187847852707, -0.07605968415737152, -0.06790748238563538, -0.05975528433918953, -0.05160308629274368, -0.043450888246297836, -0.03529869019985199, -0.027146492153406143, -0.018994294106960297, -0.01084209606051445, -0.0026898980140686035, 0.005462300032377243, 0.01361449807882309, 0.021766696125268936, 0.029918894171714783, 0.03807109221816063, 0.046223290264606476, 0.05437548831105232, 0.06252768635749817, 0.07067988812923431, 0.07883208245038986, 0.08698427677154541, 0.09513647854328156, 0.1032886803150177, 0.11144087463617325, 0.1195930689573288, 0.12774527072906494, 0.1358974725008011, 0.14404967427253723, 0.15220186114311218, 0.16035406291484833, 0.16850626468658447, 0.17665845155715942, 0.18481065332889557, 0.1929628551006317, 0.20111505687236786, 0.209267258644104, 0.21741944551467896, 0.2255716472864151, 0.23372384905815125, 0.2418760359287262, 0.25002825260162354, 0.2581804394721985]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 11.0, 15.0, 13.0, 16.0, 22.0, 42.0, 50.0, 52.0, 87.0, 147.0, 242.0, 457.0, 1042.0, 2611.0, 8130.0, 50952.0, 3364708.0, 733292.0, 22956.0, 5410.0, 2008.0, 914.0, 413.0, 240.0, 141.0, 88.0, 50.0, 50.0, 42.0, 19.0, 15.0, 13.0, 8.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.034149169921875, -0.033246755599975586, -0.03234434127807617, -0.03144192695617676, -0.030539512634277344, -0.02963709831237793, -0.028734683990478516, -0.0278322696685791, -0.026929855346679688, -0.026027441024780273, -0.02512502670288086, -0.024222612380981445, -0.02332019805908203, -0.022417783737182617, -0.021515369415283203, -0.02061295509338379, -0.019710540771484375, -0.01880812644958496, -0.017905712127685547, -0.017003297805786133, -0.01610088348388672, -0.015198469161987305, -0.01429605484008789, -0.013393640518188477, -0.012491226196289062, -0.011588811874389648, -0.010686397552490234, -0.00978398323059082, -0.008881568908691406, -0.007979154586791992, -0.007076740264892578, -0.006174325942993164, -0.00527191162109375, -0.004369497299194336, -0.003467082977294922, -0.002564668655395508, -0.0016622543334960938, -0.0007598400115966797, 0.00014257431030273438, 0.0010449886322021484, 0.0019474029541015625, 0.0028498172760009766, 0.0037522315979003906, 0.004654645919799805, 0.005557060241699219, 0.006459474563598633, 0.007361888885498047, 0.008264303207397461, 0.009166717529296875, 0.010069131851196289, 0.010971546173095703, 0.011873960494995117, 0.012776374816894531, 0.013678789138793945, 0.01458120346069336, 0.015483617782592773, 0.016386032104492188, 0.0172884464263916, 0.018190860748291016, 0.01909327507019043, 0.019995689392089844, 0.020898103713989258, 0.021800518035888672, 0.022702932357788086, 0.0236053466796875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 10.0, 11.0, 13.0, 17.0, 29.0, 31.0, 38.0, 41.0, 50.0, 74.0, 50.0, 79.0, 61.0, 85.0, 63.0, 60.0, 53.0, 43.0, 50.0, 32.0, 20.0, 25.0, 12.0, 6.0, 10.0, 9.0, 10.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01512908935546875, -0.014623284339904785, -0.01411747932434082, -0.013611674308776855, -0.01310586929321289, -0.012600064277648926, -0.012094259262084961, -0.011588454246520996, -0.011082649230957031, -0.010576844215393066, -0.010071039199829102, -0.009565234184265137, -0.009059429168701172, -0.008553624153137207, -0.008047819137573242, -0.007542014122009277, -0.0070362091064453125, -0.006530404090881348, -0.006024599075317383, -0.005518794059753418, -0.005012989044189453, -0.004507184028625488, -0.0040013790130615234, -0.0034955739974975586, -0.0029897689819335938, -0.002483963966369629, -0.001978158950805664, -0.0014723539352416992, -0.0009665489196777344, -0.00046074390411376953, 4.506111145019531e-05, 0.0005508661270141602, 0.001056671142578125, 0.0015624761581420898, 0.0020682811737060547, 0.0025740861892700195, 0.0030798912048339844, 0.0035856962203979492, 0.004091501235961914, 0.004597306251525879, 0.005103111267089844, 0.005608916282653809, 0.0061147212982177734, 0.006620526313781738, 0.007126331329345703, 0.007632136344909668, 0.008137941360473633, 0.008643746376037598, 0.009149551391601562, 0.009655356407165527, 0.010161161422729492, 0.010666966438293457, 0.011172771453857422, 0.011678576469421387, 0.012184381484985352, 0.012690186500549316, 0.013195991516113281, 0.013701796531677246, 0.014207601547241211, 0.014713406562805176, 0.01521921157836914, 0.015725016593933105, 0.01623082160949707, 0.016736626625061035, 0.017242431640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 9.0, 8.0, 13.0, 29.0, 25.0, 50.0, 61.0, 87.0, 131.0, 203.0, 438.0, 928.0, 3336.0, 24751.0, 3947400.0, 200883.0, 11019.0, 2590.0, 958.0, 487.0, 264.0, 201.0, 123.0, 74.0, 76.0, 33.0, 32.0, 25.0, 8.0, 15.0, 7.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052947998046875, -0.05116987228393555, -0.049391746520996094, -0.04761362075805664, -0.04583549499511719, -0.044057369232177734, -0.04227924346923828, -0.04050111770629883, -0.038722991943359375, -0.03694486618041992, -0.03516674041748047, -0.033388614654541016, -0.03161048889160156, -0.02983236312866211, -0.028054237365722656, -0.026276111602783203, -0.02449798583984375, -0.022719860076904297, -0.020941734313964844, -0.01916360855102539, -0.017385482788085938, -0.015607357025146484, -0.013829231262207031, -0.012051105499267578, -0.010272979736328125, -0.008494853973388672, -0.006716728210449219, -0.004938602447509766, -0.0031604766845703125, -0.0013823509216308594, 0.00039577484130859375, 0.002173900604248047, 0.0039520263671875, 0.005730152130126953, 0.007508277893066406, 0.00928640365600586, 0.011064529418945312, 0.012842655181884766, 0.014620780944824219, 0.016398906707763672, 0.018177032470703125, 0.019955158233642578, 0.02173328399658203, 0.023511409759521484, 0.025289535522460938, 0.02706766128540039, 0.028845787048339844, 0.030623912811279297, 0.03240203857421875, 0.0341801643371582, 0.035958290100097656, 0.03773641586303711, 0.03951454162597656, 0.041292667388916016, 0.04307079315185547, 0.04484891891479492, 0.046627044677734375, 0.04840517044067383, 0.05018329620361328, 0.051961421966552734, 0.05373954772949219, 0.05551767349243164, 0.057295799255371094, 0.05907392501831055, 0.06085205078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 5.0, 15.0, 22.0, 50.0, 94.0, 235.0, 1187.0, 1767.0, 400.0, 118.0, 54.0, 28.0, 23.0, 14.0, 12.0, 7.0, 8.0, 5.0, 4.0, 7.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.025299072265625, -0.02415752410888672, -0.023015975952148438, -0.021874427795410156, -0.020732879638671875, -0.019591331481933594, -0.018449783325195312, -0.01730823516845703, -0.01616668701171875, -0.015025138854980469, -0.013883590698242188, -0.012742042541503906, -0.011600494384765625, -0.010458946228027344, -0.009317398071289062, -0.008175849914550781, -0.0070343017578125, -0.005892753601074219, -0.0047512054443359375, -0.0036096572875976562, -0.002468109130859375, -0.0013265609741210938, -0.0001850128173828125, 0.0009565353393554688, 0.00209808349609375, 0.0032396316528320312, 0.0043811798095703125, 0.005522727966308594, 0.006664276123046875, 0.007805824279785156, 0.008947372436523438, 0.010088920593261719, 0.01123046875, 0.012372016906738281, 0.013513565063476562, 0.014655113220214844, 0.015796661376953125, 0.016938209533691406, 0.018079757690429688, 0.01922130584716797, 0.02036285400390625, 0.02150440216064453, 0.022645950317382812, 0.023787498474121094, 0.024929046630859375, 0.026070594787597656, 0.027212142944335938, 0.02835369110107422, 0.0294952392578125, 0.03063678741455078, 0.03177833557128906, 0.032919883728027344, 0.034061431884765625, 0.035202980041503906, 0.03634452819824219, 0.03748607635498047, 0.03862762451171875, 0.03976917266845703, 0.04091072082519531, 0.042052268981933594, 0.043193817138671875, 0.044335365295410156, 0.04547691345214844, 0.04661846160888672, 0.047760009765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 16.0, 39.0, 61.0, 135.0, 233.0, 219.0, 126.0, 69.0, 34.0, 21.0, 14.0, 11.0, 7.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3248322010040283, -0.31391409039497375, -0.3029959797859192, -0.2920778691768646, -0.28115975856781006, -0.2702416181564331, -0.2593235373497009, -0.24840539693832397, -0.2374872863292694, -0.22656917572021484, -0.21565106511116028, -0.2047329545021057, -0.19381482899188995, -0.1828967183828354, -0.17197860777378082, -0.16106048226356506, -0.1501423865556717, -0.13922427594661713, -0.12830616533756256, -0.1173880472779274, -0.10646992921829224, -0.09555181860923767, -0.0846337080001831, -0.07371558994054794, -0.06279747933149338, -0.051879364997148514, -0.04096125066280365, -0.030043140053749084, -0.01912502571940422, -0.008206911385059357, 0.0027111992239952087, 0.013629317283630371, 0.024547427892684937, 0.0354655422270298, 0.046383656561374664, 0.05730176717042923, 0.06821988523006439, 0.07913799583911896, 0.09005610644817352, 0.10097422450780869, 0.11189233511686325, 0.12281044572591782, 0.13372856378555298, 0.14464667439460754, 0.1555647850036621, 0.16648289561271667, 0.17740100622177124, 0.188319131731987, 0.19923724234104156, 0.21015535295009613, 0.2210734635591507, 0.23199158906936646, 0.24290969967842102, 0.2538278102874756, 0.26474592089653015, 0.2756640315055847, 0.2865821421146393, 0.29750025272369385, 0.3084183633327484, 0.319336473941803, 0.33025458455085754, 0.3411726951599121, 0.35209083557128906, 0.36300894618034363, 0.3739270567893982]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 6.0, 12.0, 8.0, 11.0, 10.0, 11.0, 21.0, 25.0, 22.0, 26.0, 45.0, 36.0, 54.0, 55.0, 43.0, 53.0, 55.0, 60.0, 47.0, 55.0, 45.0, 52.0, 36.0, 36.0, 27.0, 23.0, 22.0, 21.0, 16.0, 17.0, 14.0, 12.0, 2.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12280076742172241, -0.1182720810174942, -0.1137433871626854, -0.10921470075845718, -0.10468600690364838, -0.10015732049942017, -0.09562863409519196, -0.09109994769096375, -0.08657125383615494, -0.08204256743192673, -0.07751387357711792, -0.07298518717288971, -0.0684565007686615, -0.06392780691385269, -0.05939912050962448, -0.05487043038010597, -0.05034174025058746, -0.045813050121068954, -0.041284359991550446, -0.036755673587322235, -0.032226983457803726, -0.027698293328285217, -0.023169605061411858, -0.018640916794538498, -0.014112226665019989, -0.009583537466824055, -0.00505484826862812, -0.0005261590704321861, 0.004002530127763748, 0.008531220257282257, 0.013059908524155617, 0.017588596791028976, 0.022117286920547485, 0.026645977050065994, 0.031174665316939354, 0.035703353583812714, 0.04023204371333122, 0.04476073384284973, 0.04928942024707794, 0.05381811037659645, 0.05834680050611496, 0.06287548691034317, 0.06740418076515198, 0.07193286716938019, 0.0764615535736084, 0.0809902474284172, 0.08551893383264542, 0.09004762768745422, 0.09457631409168243, 0.09910500049591064, 0.10363369435071945, 0.10816238075494766, 0.11269107460975647, 0.11721976101398468, 0.12174844741821289, 0.1262771338224411, 0.1308058202266693, 0.13533450663089752, 0.13986319303512573, 0.14439189434051514, 0.14892058074474335, 0.15344926714897156, 0.15797795355319977, 0.16250663995742798, 0.16703534126281738]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 3.0, 5.0, 4.0, 8.0, 19.0, 15.0, 30.0, 64.0, 104.0, 133.0, 202.0, 381.0, 682.0, 1332.0, 2336.0, 4567.0, 9702.0, 21728.0, 53459.0, 152650.0, 416720.0, 245100.0, 81522.0, 31709.0, 13427.0, 6106.0, 2984.0, 1556.0, 845.0, 479.0, 257.0, 172.0, 87.0, 58.0, 28.0, 31.0, 16.0, 13.0, 11.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0213470458984375, -0.02062845230102539, -0.01990985870361328, -0.019191265106201172, -0.018472671508789062, -0.017754077911376953, -0.017035484313964844, -0.016316890716552734, -0.015598297119140625, -0.014879703521728516, -0.014161109924316406, -0.013442516326904297, -0.012723922729492188, -0.012005329132080078, -0.011286735534667969, -0.01056814193725586, -0.00984954833984375, -0.00913095474243164, -0.008412361145019531, -0.007693767547607422, -0.0069751739501953125, -0.006256580352783203, -0.005537986755371094, -0.004819393157958984, -0.004100799560546875, -0.0033822059631347656, -0.0026636123657226562, -0.0019450187683105469, -0.0012264251708984375, -0.0005078315734863281, 0.00021076202392578125, 0.0009293556213378906, 0.00164794921875, 0.0023665428161621094, 0.0030851364135742188, 0.003803730010986328, 0.0045223236083984375, 0.005240917205810547, 0.005959510803222656, 0.006678104400634766, 0.007396697998046875, 0.008115291595458984, 0.008833885192871094, 0.009552478790283203, 0.010271072387695312, 0.010989665985107422, 0.011708259582519531, 0.01242685317993164, 0.01314544677734375, 0.01386404037475586, 0.014582633972167969, 0.015301227569580078, 0.016019821166992188, 0.016738414764404297, 0.017457008361816406, 0.018175601959228516, 0.018894195556640625, 0.019612789154052734, 0.020331382751464844, 0.021049976348876953, 0.021768569946289062, 0.022487163543701172, 0.02320575714111328, 0.02392435073852539, 0.0246429443359375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 9.0, 13.0, 8.0, 25.0, 30.0, 37.0, 45.0, 48.0, 54.0, 63.0, 53.0, 69.0, 81.0, 74.0, 76.0, 58.0, 43.0, 36.0, 40.0, 36.0, 33.0, 14.0, 11.0, 12.0, 5.0, 7.0, 5.0, 8.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01506805419921875, -0.01455986499786377, -0.014051675796508789, -0.013543486595153809, -0.013035297393798828, -0.012527108192443848, -0.012018918991088867, -0.011510729789733887, -0.011002540588378906, -0.010494351387023926, -0.009986162185668945, -0.009477972984313965, -0.008969783782958984, -0.008461594581604004, -0.007953405380249023, -0.007445216178894043, -0.0069370269775390625, -0.006428837776184082, -0.0059206485748291016, -0.005412459373474121, -0.004904270172119141, -0.00439608097076416, -0.0038878917694091797, -0.0033797025680541992, -0.0028715133666992188, -0.0023633241653442383, -0.0018551349639892578, -0.0013469457626342773, -0.0008387565612792969, -0.0003305673599243164, 0.00017762184143066406, 0.0006858110427856445, 0.001194000244140625, 0.0017021894454956055, 0.002210378646850586, 0.0027185678482055664, 0.003226757049560547, 0.0037349462509155273, 0.004243135452270508, 0.004751324653625488, 0.005259513854980469, 0.005767703056335449, 0.00627589225769043, 0.00678408145904541, 0.007292270660400391, 0.007800459861755371, 0.008308649063110352, 0.008816838264465332, 0.009325027465820312, 0.009833216667175293, 0.010341405868530273, 0.010849595069885254, 0.011357784271240234, 0.011865973472595215, 0.012374162673950195, 0.012882351875305176, 0.013390541076660156, 0.013898730278015137, 0.014406919479370117, 0.014915108680725098, 0.015423297882080078, 0.01593148708343506, 0.01643967628479004, 0.01694786548614502, 0.0174560546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 10.0, 22.0, 18.0, 36.0, 53.0, 115.0, 204.0, 399.0, 789.0, 2034.0, 6380.0, 27249.0, 175548.0, 723357.0, 88889.0, 16484.0, 4289.0, 1400.0, 586.0, 288.0, 148.0, 87.0, 55.0, 37.0, 24.0, 11.0, 10.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04412841796875, -0.042571067810058594, -0.04101371765136719, -0.03945636749267578, -0.037899017333984375, -0.03634166717529297, -0.03478431701660156, -0.033226966857910156, -0.03166961669921875, -0.030112266540527344, -0.028554916381835938, -0.02699756622314453, -0.025440216064453125, -0.02388286590576172, -0.022325515747070312, -0.020768165588378906, -0.0192108154296875, -0.017653465270996094, -0.016096115112304688, -0.014538764953613281, -0.012981414794921875, -0.011424064636230469, -0.009866714477539062, -0.008309364318847656, -0.00675201416015625, -0.005194664001464844, -0.0036373138427734375, -0.0020799636840820312, -0.000522613525390625, 0.0010347366333007812, 0.0025920867919921875, 0.004149436950683594, 0.005706787109375, 0.007264137268066406, 0.008821487426757812, 0.010378837585449219, 0.011936187744140625, 0.013493537902832031, 0.015050888061523438, 0.016608238220214844, 0.01816558837890625, 0.019722938537597656, 0.021280288696289062, 0.02283763885498047, 0.024394989013671875, 0.02595233917236328, 0.027509689331054688, 0.029067039489746094, 0.0306243896484375, 0.032181739807128906, 0.03373908996582031, 0.03529644012451172, 0.036853790283203125, 0.03841114044189453, 0.03996849060058594, 0.041525840759277344, 0.04308319091796875, 0.044640541076660156, 0.04619789123535156, 0.04775524139404297, 0.049312591552734375, 0.05086994171142578, 0.05242729187011719, 0.053984642028808594, 0.0555419921875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 6.0, 7.0, 12.0, 16.0, 12.0, 13.0, 15.0, 20.0, 29.0, 31.0, 35.0, 47.0, 43.0, 42.0, 43.0, 54.0, 45.0, 60.0, 56.0, 51.0, 51.0, 51.0, 36.0, 43.0, 27.0, 22.0, 26.0, 19.0, 13.0, 17.0, 13.0, 11.0, 6.0, 11.0, 5.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.044189453125, -0.04262685775756836, -0.04106426239013672, -0.03950166702270508, -0.03793907165527344, -0.0363764762878418, -0.034813880920410156, -0.033251285552978516, -0.031688690185546875, -0.030126094818115234, -0.028563499450683594, -0.027000904083251953, -0.025438308715820312, -0.023875713348388672, -0.02231311798095703, -0.02075052261352539, -0.01918792724609375, -0.01762533187866211, -0.01606273651123047, -0.014500141143798828, -0.012937545776367188, -0.011374950408935547, -0.009812355041503906, -0.008249759674072266, -0.006687164306640625, -0.005124568939208984, -0.0035619735717773438, -0.001999378204345703, -0.0004367828369140625, 0.0011258125305175781, 0.0026884078979492188, 0.004251003265380859, 0.0058135986328125, 0.007376194000244141, 0.008938789367675781, 0.010501384735107422, 0.012063980102539062, 0.013626575469970703, 0.015189170837402344, 0.016751766204833984, 0.018314361572265625, 0.019876956939697266, 0.021439552307128906, 0.023002147674560547, 0.024564743041992188, 0.026127338409423828, 0.02768993377685547, 0.02925252914428711, 0.03081512451171875, 0.03237771987915039, 0.03394031524658203, 0.03550291061401367, 0.03706550598144531, 0.03862810134887695, 0.040190696716308594, 0.041753292083740234, 0.043315887451171875, 0.044878482818603516, 0.046441078186035156, 0.0480036735534668, 0.04956626892089844, 0.05112886428833008, 0.05269145965576172, 0.05425405502319336, 0.055816650390625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 6.0, 16.0, 15.0, 20.0, 47.0, 42.0, 56.0, 97.0, 123.0, 215.0, 333.0, 488.0, 775.0, 1374.0, 2317.0, 4386.0, 8798.0, 23552.0, 168660.0, 766351.0, 44576.0, 12897.0, 5857.0, 3083.0, 1681.0, 1019.0, 640.0, 388.0, 230.0, 149.0, 120.0, 80.0, 36.0, 31.0, 27.0, 13.0, 11.0, 12.0, 6.0, 5.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.031036376953125, -0.030179500579833984, -0.02932262420654297, -0.028465747833251953, -0.027608871459960938, -0.026751995086669922, -0.025895118713378906, -0.02503824234008789, -0.024181365966796875, -0.02332448959350586, -0.022467613220214844, -0.021610736846923828, -0.020753860473632812, -0.019896984100341797, -0.01904010772705078, -0.018183231353759766, -0.01732635498046875, -0.016469478607177734, -0.015612602233886719, -0.014755725860595703, -0.013898849487304688, -0.013041973114013672, -0.012185096740722656, -0.01132822036743164, -0.010471343994140625, -0.00961446762084961, -0.008757591247558594, -0.007900714874267578, -0.0070438385009765625, -0.006186962127685547, -0.005330085754394531, -0.004473209381103516, -0.0036163330078125, -0.0027594566345214844, -0.0019025802612304688, -0.0010457038879394531, -0.0001888275146484375, 0.0006680488586425781, 0.0015249252319335938, 0.0023818016052246094, 0.003238677978515625, 0.004095554351806641, 0.004952430725097656, 0.005809307098388672, 0.0066661834716796875, 0.007523059844970703, 0.008379936218261719, 0.009236812591552734, 0.01009368896484375, 0.010950565338134766, 0.011807441711425781, 0.012664318084716797, 0.013521194458007812, 0.014378070831298828, 0.015234947204589844, 0.01609182357788086, 0.016948699951171875, 0.01780557632446289, 0.018662452697753906, 0.019519329071044922, 0.020376205444335938, 0.021233081817626953, 0.02208995819091797, 0.022946834564208984, 0.0238037109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 6.0, 3.0, 6.0, 11.0, 17.0, 20.0, 46.0, 56.0, 55.0, 89.0, 108.0, 84.0, 126.0, 91.0, 79.0, 47.0, 43.0, 29.0, 23.0, 15.0, 9.0, 7.0, 10.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.557868957519531e-05, -7.35679641366005e-05, -7.155723869800568e-05, -6.954651325941086e-05, -6.753578782081604e-05, -6.552506238222122e-05, -6.35143369436264e-05, -6.150361150503159e-05, -5.949288606643677e-05, -5.748216062784195e-05, -5.547143518924713e-05, -5.346070975065231e-05, -5.1449984312057495e-05, -4.943925887346268e-05, -4.742853343486786e-05, -4.541780799627304e-05, -4.340708255767822e-05, -4.1396357119083405e-05, -3.9385631680488586e-05, -3.737490624189377e-05, -3.536418080329895e-05, -3.335345536470413e-05, -3.1342729926109314e-05, -2.9332004487514496e-05, -2.7321279048919678e-05, -2.531055361032486e-05, -2.329982817173004e-05, -2.1289102733135223e-05, -1.9278377294540405e-05, -1.7267651855945587e-05, -1.5256926417350769e-05, -1.3246200978755951e-05, -1.1235475540161133e-05, -9.224750101566315e-06, -7.214024662971497e-06, -5.2032992243766785e-06, -3.1925737857818604e-06, -1.1818483471870422e-06, 8.288770914077759e-07, 2.839602530002594e-06, 4.850327968597412e-06, 6.86105340719223e-06, 8.871778845787048e-06, 1.0882504284381866e-05, 1.2893229722976685e-05, 1.4903955161571503e-05, 1.691468060016632e-05, 1.892540603876114e-05, 2.0936131477355957e-05, 2.2946856915950775e-05, 2.4957582354545593e-05, 2.696830779314041e-05, 2.897903323173523e-05, 3.098975867033005e-05, 3.3000484108924866e-05, 3.5011209547519684e-05, 3.70219349861145e-05, 3.903266042470932e-05, 4.104338586330414e-05, 4.3054111301898956e-05, 4.5064836740493774e-05, 4.707556217908859e-05, 4.908628761768341e-05, 5.109701305627823e-05, 5.310773849487305e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 10.0, 12.0, 10.0, 30.0, 45.0, 65.0, 95.0, 193.0, 366.0, 827.0, 2082.0, 6565.0, 29529.0, 881879.0, 108380.0, 12440.0, 3531.0, 1283.0, 594.0, 274.0, 127.0, 92.0, 42.0, 33.0, 15.0, 11.0, 8.0, 2.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045806884765625, -0.044316768646240234, -0.04282665252685547, -0.0413365364074707, -0.03984642028808594, -0.03835630416870117, -0.036866188049316406, -0.03537607192993164, -0.033885955810546875, -0.03239583969116211, -0.030905723571777344, -0.029415607452392578, -0.027925491333007812, -0.026435375213623047, -0.02494525909423828, -0.023455142974853516, -0.02196502685546875, -0.020474910736083984, -0.01898479461669922, -0.017494678497314453, -0.016004562377929688, -0.014514446258544922, -0.013024330139160156, -0.01153421401977539, -0.010044097900390625, -0.00855398178100586, -0.007063865661621094, -0.005573749542236328, -0.0040836334228515625, -0.002593517303466797, -0.0011034011840820312, 0.0003867149353027344, 0.0018768310546875, 0.0033669471740722656, 0.004857063293457031, 0.006347179412841797, 0.007837295532226562, 0.009327411651611328, 0.010817527770996094, 0.01230764389038086, 0.013797760009765625, 0.01528787612915039, 0.016777992248535156, 0.018268108367919922, 0.019758224487304688, 0.021248340606689453, 0.02273845672607422, 0.024228572845458984, 0.02571868896484375, 0.027208805084228516, 0.02869892120361328, 0.030189037322998047, 0.03167915344238281, 0.03316926956176758, 0.034659385681152344, 0.03614950180053711, 0.037639617919921875, 0.03912973403930664, 0.040619850158691406, 0.04210996627807617, 0.04360008239746094, 0.0450901985168457, 0.04658031463623047, 0.048070430755615234, 0.049560546875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 6.0, 4.0, 11.0, 10.0, 29.0, 72.0, 127.0, 224.0, 191.0, 139.0, 61.0, 23.0, 26.0, 9.0, 8.0, 8.0, 4.0, 5.0, 5.0, 4.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0262451171875, -0.025341033935546875, -0.02443695068359375, -0.023532867431640625, -0.0226287841796875, -0.021724700927734375, -0.02082061767578125, -0.019916534423828125, -0.019012451171875, -0.018108367919921875, -0.01720428466796875, -0.016300201416015625, -0.0153961181640625, -0.014492034912109375, -0.01358795166015625, -0.012683868408203125, -0.01177978515625, -0.010875701904296875, -0.00997161865234375, -0.009067535400390625, -0.0081634521484375, -0.007259368896484375, -0.00635528564453125, -0.005451202392578125, -0.004547119140625, -0.003643035888671875, -0.00273895263671875, -0.001834869384765625, -0.0009307861328125, -2.6702880859375e-05, 0.00087738037109375, 0.001781463623046875, 0.002685546875, 0.003589630126953125, 0.00449371337890625, 0.005397796630859375, 0.0063018798828125, 0.007205963134765625, 0.00811004638671875, 0.009014129638671875, 0.009918212890625, 0.010822296142578125, 0.01172637939453125, 0.012630462646484375, 0.0135345458984375, 0.014438629150390625, 0.01534271240234375, 0.016246795654296875, 0.01715087890625, 0.018054962158203125, 0.01895904541015625, 0.019863128662109375, 0.0207672119140625, 0.021671295166015625, 0.02257537841796875, 0.023479461669921875, 0.024383544921875, 0.025287628173828125, 0.02619171142578125, 0.027095794677734375, 0.0279998779296875, 0.028903961181640625, 0.02980804443359375, 0.030712127685546875, 0.0316162109375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 5.0, 17.0, 23.0, 40.0, 59.0, 98.0, 136.0, 255.0, 151.0, 69.0, 62.0, 30.0, 15.0, 4.0, 9.0, 3.0, 1.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39762502908706665, -0.38466352224349976, -0.37170201539993286, -0.35874050855636597, -0.3457790017127991, -0.3328174948692322, -0.31985601782798767, -0.3068945109844208, -0.2939330041408539, -0.280971497297287, -0.2680099904537201, -0.2550484836101532, -0.2420869916677475, -0.2291254848241806, -0.2161639928817749, -0.203202486038208, -0.1902409791946411, -0.17727947235107422, -0.16431796550750732, -0.15135647356510162, -0.13839496672153473, -0.12543345987796783, -0.11247196048498154, -0.09951046109199524, -0.08654895424842834, -0.07358744740486145, -0.06062594801187515, -0.047664444893598557, -0.03470294177532196, -0.021741434931755066, -0.008779935538768768, 0.004181563854217529, 0.017143070697784424, 0.03010457381606102, 0.043066076934337616, 0.05602758005261421, 0.06898908317089081, 0.0819505900144577, 0.094912089407444, 0.1078735888004303, 0.12083509564399719, 0.1337966024875641, 0.14675810933113098, 0.15971960127353668, 0.17268110811710358, 0.18564261496067047, 0.19860410690307617, 0.21156561374664307, 0.22452712059020996, 0.23748862743377686, 0.25045013427734375, 0.26341164112091064, 0.27637314796447754, 0.28933465480804443, 0.30229613184928894, 0.31525763869285583, 0.32821914553642273, 0.3411806523799896, 0.3541421592235565, 0.3671036660671234, 0.3800651431083679, 0.3930266499519348, 0.4059881567955017, 0.4189496636390686, 0.4319111704826355]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 9.0, 1.0, 10.0, 14.0, 15.0, 22.0, 17.0, 25.0, 19.0, 32.0, 11.0, 24.0, 32.0, 37.0, 38.0, 39.0, 68.0, 76.0, 62.0, 61.0, 50.0, 45.0, 31.0, 35.0, 27.0, 21.0, 15.0, 27.0, 12.0, 19.0, 28.0, 12.0, 10.0, 10.0, 8.0, 9.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19505393505096436, -0.18864333629608154, -0.18223273754119873, -0.1758221536874771, -0.1694115549325943, -0.1630009561777115, -0.15659037232398987, -0.15017977356910706, -0.14376917481422424, -0.13735857605934143, -0.13094797730445862, -0.124537393450737, -0.11812679469585419, -0.11171619594097137, -0.10530560463666916, -0.09889501333236694, -0.09248441457748413, -0.08607381582260132, -0.0796632245182991, -0.07325263321399689, -0.06684203445911407, -0.06043143942952156, -0.05402084439992905, -0.04761024937033653, -0.04119965434074402, -0.034789059311151505, -0.02837846428155899, -0.021967869251966476, -0.015557274222373962, -0.009146679192781448, -0.0027360841631889343, 0.0036745108664035797, 0.010085105895996094, 0.016495700925588608, 0.022906295955181122, 0.029316890984773636, 0.03572748601436615, 0.042138081043958664, 0.04854867607355118, 0.05495927110314369, 0.061369866132736206, 0.06778046488761902, 0.07419105619192123, 0.08060164749622345, 0.08701224625110626, 0.09342284500598907, 0.09983343631029129, 0.1062440276145935, 0.11265462636947632, 0.11906522512435913, 0.12547582387924194, 0.13188640773296356, 0.13829700648784637, 0.1447076052427292, 0.1511181890964508, 0.15752878785133362, 0.16393938660621643, 0.17034998536109924, 0.17676058411598206, 0.18317116796970367, 0.1895817667245865, 0.1959923654794693, 0.20240294933319092, 0.20881354808807373, 0.21522414684295654]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 9.0, 8.0, 13.0, 16.0, 27.0, 36.0, 50.0, 77.0, 119.0, 169.0, 297.0, 477.0, 946.0, 2077.0, 4773.0, 13224.0, 55148.0, 806576.0, 3113775.0, 158819.0, 23790.0, 7572.0, 3038.0, 1420.0, 729.0, 401.0, 234.0, 149.0, 94.0, 79.0, 45.0, 25.0, 18.0, 17.0, 12.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.03082275390625, -0.029995203018188477, -0.029167652130126953, -0.02834010124206543, -0.027512550354003906, -0.026684999465942383, -0.02585744857788086, -0.025029897689819336, -0.024202346801757812, -0.02337479591369629, -0.022547245025634766, -0.021719694137573242, -0.02089214324951172, -0.020064592361450195, -0.019237041473388672, -0.01840949058532715, -0.017581939697265625, -0.0167543888092041, -0.015926837921142578, -0.015099287033081055, -0.014271736145019531, -0.013444185256958008, -0.012616634368896484, -0.011789083480834961, -0.010961532592773438, -0.010133981704711914, -0.00930643081665039, -0.008478879928588867, -0.007651329040527344, -0.00682377815246582, -0.005996227264404297, -0.0051686763763427734, -0.00434112548828125, -0.0035135746002197266, -0.002686023712158203, -0.0018584728240966797, -0.0010309219360351562, -0.0002033710479736328, 0.0006241798400878906, 0.001451730728149414, 0.0022792816162109375, 0.003106832504272461, 0.003934383392333984, 0.004761934280395508, 0.005589485168457031, 0.006417036056518555, 0.007244586944580078, 0.008072137832641602, 0.008899688720703125, 0.009727239608764648, 0.010554790496826172, 0.011382341384887695, 0.012209892272949219, 0.013037443161010742, 0.013864994049072266, 0.014692544937133789, 0.015520095825195312, 0.016347646713256836, 0.01717519760131836, 0.018002748489379883, 0.018830299377441406, 0.01965785026550293, 0.020485401153564453, 0.021312952041625977, 0.0221405029296875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 9.0, 13.0, 13.0, 20.0, 24.0, 25.0, 42.0, 39.0, 43.0, 54.0, 53.0, 63.0, 70.0, 51.0, 57.0, 69.0, 75.0, 58.0, 52.0, 39.0, 27.0, 24.0, 15.0, 13.0, 13.0, 9.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0147552490234375, -0.014284849166870117, -0.013814449310302734, -0.013344049453735352, -0.012873649597167969, -0.012403249740600586, -0.011932849884033203, -0.01146245002746582, -0.010992050170898438, -0.010521650314331055, -0.010051250457763672, -0.009580850601196289, -0.009110450744628906, -0.008640050888061523, -0.00816965103149414, -0.007699251174926758, -0.007228851318359375, -0.006758451461791992, -0.006288051605224609, -0.0058176517486572266, -0.005347251892089844, -0.004876852035522461, -0.004406452178955078, -0.003936052322387695, -0.0034656524658203125, -0.0029952526092529297, -0.002524852752685547, -0.002054452896118164, -0.0015840530395507812, -0.0011136531829833984, -0.0006432533264160156, -0.0001728534698486328, 0.00029754638671875, 0.0007679462432861328, 0.0012383460998535156, 0.0017087459564208984, 0.0021791458129882812, 0.002649545669555664, 0.003119945526123047, 0.0035903453826904297, 0.0040607452392578125, 0.004531145095825195, 0.005001544952392578, 0.005471944808959961, 0.005942344665527344, 0.0064127445220947266, 0.006883144378662109, 0.007353544235229492, 0.007823944091796875, 0.008294343948364258, 0.00876474380493164, 0.009235143661499023, 0.009705543518066406, 0.010175943374633789, 0.010646343231201172, 0.011116743087768555, 0.011587142944335938, 0.01205754280090332, 0.012527942657470703, 0.012998342514038086, 0.013468742370605469, 0.013939142227172852, 0.014409542083740234, 0.014879941940307617, 0.015350341796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 7.0, 10.0, 13.0, 22.0, 12.0, 21.0, 36.0, 45.0, 57.0, 92.0, 146.0, 282.0, 714.0, 4648.0, 417992.0, 3759640.0, 8650.0, 978.0, 395.0, 188.0, 102.0, 63.0, 38.0, 33.0, 16.0, 22.0, 15.0, 8.0, 11.0, 5.0, 6.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.095458984375, -0.09193801879882812, -0.08841705322265625, -0.08489608764648438, -0.0813751220703125, -0.07785415649414062, -0.07433319091796875, -0.07081222534179688, -0.067291259765625, -0.06377029418945312, -0.06024932861328125, -0.056728363037109375, -0.0532073974609375, -0.049686431884765625, -0.04616546630859375, -0.042644500732421875, -0.03912353515625, -0.035602569580078125, -0.03208160400390625, -0.028560638427734375, -0.0250396728515625, -0.021518707275390625, -0.01799774169921875, -0.014476776123046875, -0.010955810546875, -0.007434844970703125, -0.00391387939453125, -0.000392913818359375, 0.0031280517578125, 0.006649017333984375, 0.01016998291015625, 0.013690948486328125, 0.0172119140625, 0.020732879638671875, 0.02425384521484375, 0.027774810791015625, 0.0312957763671875, 0.034816741943359375, 0.03833770751953125, 0.041858673095703125, 0.045379638671875, 0.048900604248046875, 0.05242156982421875, 0.055942535400390625, 0.0594635009765625, 0.06298446655273438, 0.06650543212890625, 0.07002639770507812, 0.07354736328125, 0.07706832885742188, 0.08058929443359375, 0.08411026000976562, 0.0876312255859375, 0.09115219116210938, 0.09467315673828125, 0.09819412231445312, 0.101715087890625, 0.10523605346679688, 0.10875701904296875, 0.11227798461914062, 0.1157989501953125, 0.11931991577148438, 0.12284088134765625, 0.12636184692382812, 0.1298828125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 12.0, 16.0, 27.0, 32.0, 51.0, 74.0, 138.0, 342.0, 953.0, 1362.0, 598.0, 192.0, 93.0, 65.0, 45.0, 21.0, 13.0, 10.0, 3.0, 9.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036834716796875, -0.03548479080200195, -0.034134864807128906, -0.03278493881225586, -0.03143501281738281, -0.030085086822509766, -0.02873516082763672, -0.027385234832763672, -0.026035308837890625, -0.024685382843017578, -0.02333545684814453, -0.021985530853271484, -0.020635604858398438, -0.01928567886352539, -0.017935752868652344, -0.016585826873779297, -0.01523590087890625, -0.013885974884033203, -0.012536048889160156, -0.01118612289428711, -0.009836196899414062, -0.008486270904541016, -0.007136344909667969, -0.005786418914794922, -0.004436492919921875, -0.003086566925048828, -0.0017366409301757812, -0.0003867149353027344, 0.0009632110595703125, 0.0023131370544433594, 0.0036630630493164062, 0.005012989044189453, 0.0063629150390625, 0.007712841033935547, 0.009062767028808594, 0.01041269302368164, 0.011762619018554688, 0.013112545013427734, 0.014462471008300781, 0.015812397003173828, 0.017162322998046875, 0.018512248992919922, 0.01986217498779297, 0.021212100982666016, 0.022562026977539062, 0.02391195297241211, 0.025261878967285156, 0.026611804962158203, 0.02796173095703125, 0.029311656951904297, 0.030661582946777344, 0.03201150894165039, 0.03336143493652344, 0.034711360931396484, 0.03606128692626953, 0.03741121292114258, 0.038761138916015625, 0.04011106491088867, 0.04146099090576172, 0.042810916900634766, 0.04416084289550781, 0.04551076889038086, 0.046860694885253906, 0.04821062088012695, 0.049560546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 5.0, 8.0, 19.0, 36.0, 76.0, 195.0, 326.0, 212.0, 71.0, 29.0, 12.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5154139995574951, -0.49460044503211975, -0.4737868905067444, -0.452973335981369, -0.43215978145599365, -0.4113462567329407, -0.3905327022075653, -0.36971914768218994, -0.3489055931568146, -0.3280920386314392, -0.30727848410606384, -0.2864649295806885, -0.2656514048576355, -0.24483783543109894, -0.22402429580688477, -0.2032107412815094, -0.18239718675613403, -0.16158363223075867, -0.1407700777053833, -0.11995653808116913, -0.09914298355579376, -0.0783294290304184, -0.05751588195562363, -0.03670233488082886, -0.01588878035545349, 0.0049247704446315765, 0.025738321244716644, 0.04655187204480171, 0.06736542284488678, 0.08817897737026215, 0.10899252444505692, 0.12980607151985168, 0.15061962604522705, 0.17143318057060242, 0.19224673509597778, 0.21306027472019196, 0.23387382924556732, 0.2546873688697815, 0.27550092339515686, 0.2963144779205322, 0.3171280324459076, 0.33794158697128296, 0.3587551414966583, 0.3795686960220337, 0.40038222074508667, 0.4211958050727844, 0.4420093297958374, 0.46282288432121277, 0.48363643884658813, 0.5044499635696411, 0.5252635478973389, 0.5460770726203918, 0.5668906569480896, 0.5877041816711426, 0.6085177659988403, 0.6293312907218933, 0.6501448154449463, 0.6709583401679993, 0.691771924495697, 0.71258544921875, 0.7333990335464478, 0.7542125582695007, 0.7750261425971985, 0.7958396673202515, 0.8166532516479492]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 11.0, 6.0, 12.0, 16.0, 15.0, 28.0, 27.0, 41.0, 29.0, 58.0, 49.0, 68.0, 53.0, 74.0, 72.0, 66.0, 73.0, 63.0, 33.0, 39.0, 45.0, 34.0, 18.0, 16.0, 18.0, 15.0, 8.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18904048204421997, -0.1836414635181427, -0.17824243009090424, -0.17284341156482697, -0.1674443781375885, -0.16204535961151123, -0.15664634108543396, -0.1512473225593567, -0.14584828913211823, -0.14044927060604095, -0.1350502371788025, -0.12965121865272522, -0.12425219267606735, -0.11885316669940948, -0.11345414817333221, -0.10805512219667435, -0.10265609622001648, -0.09725707024335861, -0.09185804426670074, -0.08645902574062347, -0.0810599997639656, -0.07566097378730774, -0.07026195526123047, -0.0648629292845726, -0.059463903307914734, -0.054064877331256866, -0.0486658550798893, -0.04326683282852173, -0.03786780685186386, -0.032468780875205994, -0.027069758623838425, -0.021670736372470856, -0.01627171039581299, -0.01087268628180027, -0.005473662167787552, -7.463805377483368e-05, 0.0053243860602378845, 0.010723410174250603, 0.01612243428826332, 0.02152145653963089, 0.026920482516288757, 0.032319508492946625, 0.037718530744314194, 0.04311755299568176, 0.04851657897233963, 0.0539156049489975, 0.059314627200365067, 0.06471364945173264, 0.0701126754283905, 0.07551170140504837, 0.08091072738170624, 0.08630974590778351, 0.09170877188444138, 0.09710779786109924, 0.10250681638717651, 0.10790584236383438, 0.11330486834049225, 0.11870389431715012, 0.12410292029380798, 0.12950193881988525, 0.13490095734596252, 0.140299990773201, 0.14569900929927826, 0.15109804272651672, 0.156497061252594]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 15.0, 12.0, 16.0, 23.0, 36.0, 47.0, 84.0, 95.0, 182.0, 228.0, 354.0, 603.0, 878.0, 1329.0, 2336.0, 3816.0, 6800.0, 12473.0, 24208.0, 50953.0, 112633.0, 253025.0, 301524.0, 146214.0, 64654.0, 30488.0, 15563.0, 8266.0, 4578.0, 2644.0, 1645.0, 973.0, 613.0, 386.0, 294.0, 182.0, 115.0, 68.0, 63.0, 42.0, 27.0, 17.0, 14.0, 15.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0218353271484375, -0.02121424674987793, -0.02059316635131836, -0.01997208595275879, -0.01935100555419922, -0.01872992515563965, -0.018108844757080078, -0.017487764358520508, -0.016866683959960938, -0.016245603561401367, -0.015624523162841797, -0.015003442764282227, -0.014382362365722656, -0.013761281967163086, -0.013140201568603516, -0.012519121170043945, -0.011898040771484375, -0.011276960372924805, -0.010655879974365234, -0.010034799575805664, -0.009413719177246094, -0.008792638778686523, -0.008171558380126953, -0.007550477981567383, -0.0069293975830078125, -0.006308317184448242, -0.005687236785888672, -0.0050661563873291016, -0.004445075988769531, -0.003823995590209961, -0.0032029151916503906, -0.0025818347930908203, -0.00196075439453125, -0.0013396739959716797, -0.0007185935974121094, -9.751319885253906e-05, 0.0005235671997070312, 0.0011446475982666016, 0.0017657279968261719, 0.002386808395385742, 0.0030078887939453125, 0.003628969192504883, 0.004250049591064453, 0.0048711299896240234, 0.005492210388183594, 0.006113290786743164, 0.006734371185302734, 0.007355451583862305, 0.007976531982421875, 0.008597612380981445, 0.009218692779541016, 0.009839773178100586, 0.010460853576660156, 0.011081933975219727, 0.011703014373779297, 0.012324094772338867, 0.012945175170898438, 0.013566255569458008, 0.014187335968017578, 0.014808416366577148, 0.015429496765136719, 0.01605057716369629, 0.01667165756225586, 0.01729273796081543, 0.017913818359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 11.0, 17.0, 20.0, 26.0, 24.0, 38.0, 43.0, 38.0, 48.0, 67.0, 59.0, 60.0, 75.0, 73.0, 55.0, 58.0, 45.0, 40.0, 50.0, 30.0, 22.0, 23.0, 19.0, 11.0, 14.0, 5.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0147705078125, -0.014300346374511719, -0.013830184936523438, -0.013360023498535156, -0.012889862060546875, -0.012419700622558594, -0.011949539184570312, -0.011479377746582031, -0.01100921630859375, -0.010539054870605469, -0.010068893432617188, -0.009598731994628906, -0.009128570556640625, -0.008658409118652344, -0.008188247680664062, -0.007718086242675781, -0.0072479248046875, -0.006777763366699219, -0.0063076019287109375, -0.005837440490722656, -0.005367279052734375, -0.004897117614746094, -0.0044269561767578125, -0.003956794738769531, -0.00348663330078125, -0.0030164718627929688, -0.0025463104248046875, -0.0020761489868164062, -0.001605987548828125, -0.0011358261108398438, -0.0006656646728515625, -0.00019550323486328125, 0.000274658203125, 0.0007448196411132812, 0.0012149810791015625, 0.0016851425170898438, 0.002155303955078125, 0.0026254653930664062, 0.0030956268310546875, 0.0035657882690429688, 0.00403594970703125, 0.004506111145019531, 0.0049762725830078125, 0.005446434020996094, 0.005916595458984375, 0.006386756896972656, 0.0068569183349609375, 0.007327079772949219, 0.0077972412109375, 0.008267402648925781, 0.008737564086914062, 0.009207725524902344, 0.009677886962890625, 0.010148048400878906, 0.010618209838867188, 0.011088371276855469, 0.01155853271484375, 0.012028694152832031, 0.012498855590820312, 0.012969017028808594, 0.013439178466796875, 0.013909339904785156, 0.014379501342773438, 0.014849662780761719, 0.01531982421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 7.0, 18.0, 22.0, 25.0, 37.0, 66.0, 100.0, 159.0, 266.0, 560.0, 1159.0, 2679.0, 6483.0, 17832.0, 58122.0, 233257.0, 570757.0, 108865.0, 30417.0, 10286.0, 3963.0, 1769.0, 754.0, 374.0, 192.0, 124.0, 85.0, 50.0, 40.0, 20.0, 16.0, 12.0, 11.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0325927734375, -0.031477928161621094, -0.030363082885742188, -0.02924823760986328, -0.028133392333984375, -0.02701854705810547, -0.025903701782226562, -0.024788856506347656, -0.02367401123046875, -0.022559165954589844, -0.021444320678710938, -0.02032947540283203, -0.019214630126953125, -0.01809978485107422, -0.016984939575195312, -0.015870094299316406, -0.0147552490234375, -0.013640403747558594, -0.012525558471679688, -0.011410713195800781, -0.010295867919921875, -0.009181022644042969, -0.008066177368164062, -0.006951332092285156, -0.00583648681640625, -0.004721641540527344, -0.0036067962646484375, -0.0024919509887695312, -0.001377105712890625, -0.00026226043701171875, 0.0008525848388671875, 0.0019674301147460938, 0.003082275390625, 0.004197120666503906, 0.0053119659423828125, 0.006426811218261719, 0.007541656494140625, 0.008656501770019531, 0.009771347045898438, 0.010886192321777344, 0.01200103759765625, 0.013115882873535156, 0.014230728149414062, 0.015345573425292969, 0.016460418701171875, 0.01757526397705078, 0.018690109252929688, 0.019804954528808594, 0.0209197998046875, 0.022034645080566406, 0.023149490356445312, 0.02426433563232422, 0.025379180908203125, 0.02649402618408203, 0.027608871459960938, 0.028723716735839844, 0.02983856201171875, 0.030953407287597656, 0.03206825256347656, 0.03318309783935547, 0.034297943115234375, 0.03541278839111328, 0.03652763366699219, 0.037642478942871094, 0.03875732421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 6.0, 10.0, 10.0, 14.0, 14.0, 7.0, 21.0, 32.0, 34.0, 39.0, 26.0, 26.0, 43.0, 44.0, 50.0, 36.0, 42.0, 50.0, 45.0, 48.0, 34.0, 40.0, 28.0, 50.0, 33.0, 27.0, 16.0, 22.0, 17.0, 18.0, 20.0, 9.0, 5.0, 11.0, 8.0, 6.0, 6.0, 5.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.031768798828125, -0.03062152862548828, -0.029474258422851562, -0.028326988220214844, -0.027179718017578125, -0.026032447814941406, -0.024885177612304688, -0.02373790740966797, -0.02259063720703125, -0.02144336700439453, -0.020296096801757812, -0.019148826599121094, -0.018001556396484375, -0.016854286193847656, -0.015707015991210938, -0.014559745788574219, -0.0134124755859375, -0.012265205383300781, -0.011117935180664062, -0.009970664978027344, -0.008823394775390625, -0.007676124572753906, -0.0065288543701171875, -0.005381584167480469, -0.00423431396484375, -0.0030870437622070312, -0.0019397735595703125, -0.0007925033569335938, 0.000354766845703125, 0.0015020370483398438, 0.0026493072509765625, 0.0037965774536132812, 0.00494384765625, 0.006091117858886719, 0.0072383880615234375, 0.008385658264160156, 0.009532928466796875, 0.010680198669433594, 0.011827468872070312, 0.012974739074707031, 0.01412200927734375, 0.015269279479980469, 0.016416549682617188, 0.017563819885253906, 0.018711090087890625, 0.019858360290527344, 0.021005630493164062, 0.02215290069580078, 0.0233001708984375, 0.02444744110107422, 0.025594711303710938, 0.026741981506347656, 0.027889251708984375, 0.029036521911621094, 0.030183792114257812, 0.03133106231689453, 0.03247833251953125, 0.03362560272216797, 0.03477287292480469, 0.035920143127441406, 0.037067413330078125, 0.038214683532714844, 0.03936195373535156, 0.04050922393798828, 0.041656494140625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 9.0, 16.0, 16.0, 23.0, 42.0, 40.0, 62.0, 125.0, 167.0, 284.0, 409.0, 686.0, 1179.0, 1929.0, 3573.0, 7090.0, 15757.0, 47097.0, 297274.0, 580932.0, 56876.0, 18059.0, 7721.0, 3868.0, 2045.0, 1252.0, 701.0, 461.0, 279.0, 175.0, 107.0, 78.0, 59.0, 44.0, 41.0, 21.0, 16.0, 11.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.023956298828125, -0.023209333419799805, -0.02246236801147461, -0.021715402603149414, -0.02096843719482422, -0.020221471786499023, -0.019474506378173828, -0.018727540969848633, -0.017980575561523438, -0.017233610153198242, -0.016486644744873047, -0.01573967933654785, -0.014992713928222656, -0.014245748519897461, -0.013498783111572266, -0.01275181770324707, -0.012004852294921875, -0.01125788688659668, -0.010510921478271484, -0.009763956069946289, -0.009016990661621094, -0.008270025253295898, -0.007523059844970703, -0.006776094436645508, -0.0060291290283203125, -0.005282163619995117, -0.004535198211669922, -0.0037882328033447266, -0.0030412673950195312, -0.002294301986694336, -0.0015473365783691406, -0.0008003711700439453, -5.340576171875e-05, 0.0006935596466064453, 0.0014405250549316406, 0.002187490463256836, 0.0029344558715820312, 0.0036814212799072266, 0.004428386688232422, 0.005175352096557617, 0.0059223175048828125, 0.006669282913208008, 0.007416248321533203, 0.008163213729858398, 0.008910179138183594, 0.009657144546508789, 0.010404109954833984, 0.01115107536315918, 0.011898040771484375, 0.01264500617980957, 0.013391971588134766, 0.014138936996459961, 0.014885902404785156, 0.01563286781311035, 0.016379833221435547, 0.017126798629760742, 0.017873764038085938, 0.018620729446411133, 0.019367694854736328, 0.020114660263061523, 0.02086162567138672, 0.021608591079711914, 0.02235555648803711, 0.023102521896362305, 0.0238494873046875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 4.0, 7.0, 6.0, 17.0, 19.0, 23.0, 25.0, 31.0, 56.0, 63.0, 102.0, 103.0, 95.0, 123.0, 88.0, 56.0, 46.0, 38.0, 23.0, 27.0, 12.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.02467155456543e-05, -4.828162491321564e-05, -4.631653428077698e-05, -4.435144364833832e-05, -4.238635301589966e-05, -4.0421262383461e-05, -3.845617175102234e-05, -3.649108111858368e-05, -3.452599048614502e-05, -3.256089985370636e-05, -3.05958092212677e-05, -2.863071858882904e-05, -2.666562795639038e-05, -2.470053732395172e-05, -2.273544669151306e-05, -2.0770356059074402e-05, -1.8805265426635742e-05, -1.6840174794197083e-05, -1.4875084161758423e-05, -1.2909993529319763e-05, -1.0944902896881104e-05, -8.979812264442444e-06, -7.014721632003784e-06, -5.0496309995651245e-06, -3.084540367126465e-06, -1.1194497346878052e-06, 8.456408977508545e-07, 2.810731530189514e-06, 4.775822162628174e-06, 6.7409127950668335e-06, 8.706003427505493e-06, 1.0671094059944153e-05, 1.2636184692382812e-05, 1.4601275324821472e-05, 1.6566365957260132e-05, 1.853145658969879e-05, 2.049654722213745e-05, 2.246163785457611e-05, 2.442672848701477e-05, 2.639181911945343e-05, 2.835690975189209e-05, 3.032200038433075e-05, 3.228709101676941e-05, 3.425218164920807e-05, 3.621727228164673e-05, 3.818236291408539e-05, 4.014745354652405e-05, 4.211254417896271e-05, 4.407763481140137e-05, 4.604272544384003e-05, 4.8007816076278687e-05, 4.9972906708717346e-05, 5.1937997341156006e-05, 5.3903087973594666e-05, 5.5868178606033325e-05, 5.7833269238471985e-05, 5.9798359870910645e-05, 6.17634505033493e-05, 6.372854113578796e-05, 6.569363176822662e-05, 6.765872240066528e-05, 6.962381303310394e-05, 7.15889036655426e-05, 7.355399429798126e-05, 7.551908493041992e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 13.0, 12.0, 34.0, 45.0, 68.0, 120.0, 245.0, 436.0, 879.0, 2005.0, 4875.0, 14064.0, 59714.0, 741106.0, 183963.0, 27111.0, 8135.0, 3023.0, 1332.0, 637.0, 307.0, 199.0, 91.0, 53.0, 28.0, 19.0, 16.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0254974365234375, -0.02450728416442871, -0.023517131805419922, -0.022526979446411133, -0.021536827087402344, -0.020546674728393555, -0.019556522369384766, -0.018566370010375977, -0.017576217651367188, -0.0165860652923584, -0.01559591293334961, -0.01460576057434082, -0.013615608215332031, -0.012625455856323242, -0.011635303497314453, -0.010645151138305664, -0.009654998779296875, -0.008664846420288086, -0.007674694061279297, -0.006684541702270508, -0.005694389343261719, -0.00470423698425293, -0.0037140846252441406, -0.0027239322662353516, -0.0017337799072265625, -0.0007436275482177734, 0.0002465248107910156, 0.0012366771697998047, 0.0022268295288085938, 0.003216981887817383, 0.004207134246826172, 0.005197286605834961, 0.00618743896484375, 0.007177591323852539, 0.008167743682861328, 0.009157896041870117, 0.010148048400878906, 0.011138200759887695, 0.012128353118896484, 0.013118505477905273, 0.014108657836914062, 0.015098810195922852, 0.01608896255493164, 0.01707911491394043, 0.01806926727294922, 0.019059419631958008, 0.020049571990966797, 0.021039724349975586, 0.022029876708984375, 0.023020029067993164, 0.024010181427001953, 0.025000333786010742, 0.02599048614501953, 0.02698063850402832, 0.02797079086303711, 0.0289609432220459, 0.029951095581054688, 0.030941247940063477, 0.031931400299072266, 0.032921552658081055, 0.033911705017089844, 0.03490185737609863, 0.03589200973510742, 0.03688216209411621, 0.037872314453125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 5.0, 7.0, 15.0, 22.0, 35.0, 50.0, 101.0, 154.0, 195.0, 156.0, 95.0, 47.0, 31.0, 24.0, 14.0, 6.0, 9.0, 7.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033599853515625, -0.03270125389099121, -0.03180265426635742, -0.030904054641723633, -0.030005455017089844, -0.029106855392456055, -0.028208255767822266, -0.027309656143188477, -0.026411056518554688, -0.0255124568939209, -0.02461385726928711, -0.02371525764465332, -0.02281665802001953, -0.021918058395385742, -0.021019458770751953, -0.020120859146118164, -0.019222259521484375, -0.018323659896850586, -0.017425060272216797, -0.016526460647583008, -0.01562786102294922, -0.01472926139831543, -0.01383066177368164, -0.012932062149047852, -0.012033462524414062, -0.011134862899780273, -0.010236263275146484, -0.009337663650512695, -0.008439064025878906, -0.007540464401245117, -0.006641864776611328, -0.005743265151977539, -0.00484466552734375, -0.003946065902709961, -0.003047466278076172, -0.002148866653442383, -0.0012502670288085938, -0.0003516674041748047, 0.0005469322204589844, 0.0014455318450927734, 0.0023441314697265625, 0.0032427310943603516, 0.004141330718994141, 0.00503993034362793, 0.005938529968261719, 0.006837129592895508, 0.007735729217529297, 0.008634328842163086, 0.009532928466796875, 0.010431528091430664, 0.011330127716064453, 0.012228727340698242, 0.013127326965332031, 0.01402592658996582, 0.01492452621459961, 0.0158231258392334, 0.016721725463867188, 0.017620325088500977, 0.018518924713134766, 0.019417524337768555, 0.020316123962402344, 0.021214723587036133, 0.022113323211669922, 0.02301192283630371, 0.0239105224609375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 6.0, 13.0, 26.0, 73.0, 153.0, 409.0, 204.0, 68.0, 24.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8900133371353149, -0.8636792898178101, -0.8373452425003052, -0.8110111951828003, -0.7846771478652954, -0.7583431005477905, -0.7320090532302856, -0.7056750059127808, -0.6793409585952759, -0.653006911277771, -0.6266728639602661, -0.6003388166427612, -0.5740047693252563, -0.5476707220077515, -0.5213366746902466, -0.4950026273727417, -0.4686685800552368, -0.44233453273773193, -0.41600048542022705, -0.38966643810272217, -0.3633323907852173, -0.3369983434677124, -0.3106642961502075, -0.28433024883270264, -0.25799620151519775, -0.23166215419769287, -0.205328106880188, -0.1789940595626831, -0.15266001224517822, -0.12632596492767334, -0.09999191761016846, -0.07365787029266357, -0.04732388257980347, -0.020989835262298584, 0.005344212055206299, 0.03167825937271118, 0.058012306690216064, 0.08434635400772095, 0.11068040132522583, 0.1370144486427307, 0.1633484959602356, 0.18968254327774048, 0.21601659059524536, 0.24235063791275024, 0.2686846852302551, 0.29501873254776, 0.3213527798652649, 0.3476868271827698, 0.37402087450027466, 0.40035492181777954, 0.4266889691352844, 0.4530230164527893, 0.4793570637702942, 0.5056911110877991, 0.532025158405304, 0.5583592057228088, 0.5846932530403137, 0.6110273003578186, 0.6373613476753235, 0.6636953949928284, 0.6900294423103333, 0.7163634896278381, 0.742697536945343, 0.7690315842628479, 0.7953656315803528]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 9.0, 6.0, 8.0, 10.0, 10.0, 18.0, 13.0, 18.0, 29.0, 22.0, 33.0, 30.0, 31.0, 29.0, 52.0, 47.0, 64.0, 102.0, 71.0, 36.0, 39.0, 42.0, 34.0, 28.0, 25.0, 30.0, 23.0, 18.0, 22.0, 18.0, 20.0, 10.0, 6.0, 11.0, 4.0, 7.0, 4.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.19877541065216064, -0.19333045184612274, -0.18788549304008484, -0.18244054913520813, -0.17699559032917023, -0.17155063152313232, -0.16610568761825562, -0.1606607288122177, -0.1552157700061798, -0.1497708112001419, -0.144325852394104, -0.1388809084892273, -0.1334359496831894, -0.1279909908771515, -0.12254603952169418, -0.11710108816623688, -0.11165612936019897, -0.10621117055416107, -0.10076621919870377, -0.09532126784324646, -0.08987630903720856, -0.08443135023117065, -0.07898639887571335, -0.07354144752025604, -0.06809648871421814, -0.06265152990818024, -0.05720657855272293, -0.05176162347197533, -0.04631666839122772, -0.04087171331048012, -0.03542675822973251, -0.02998180314898491, -0.024536848068237305, -0.0190918929874897, -0.013646937906742096, -0.008201982825994492, -0.002757027745246887, 0.002687927335500717, 0.008132882416248322, 0.013577837496995926, 0.01902279257774353, 0.024467747658491135, 0.02991270273923874, 0.03535765781998634, 0.04080261290073395, 0.04624756798148155, 0.051692523062229156, 0.05713747814297676, 0.06258243322372437, 0.06802739202976227, 0.07347234338521957, 0.07891729474067688, 0.08436225354671478, 0.08980721235275269, 0.09525216370820999, 0.1006971150636673, 0.1061420738697052, 0.1115870326757431, 0.11703198403120041, 0.12247693538665771, 0.12792189419269562, 0.13336685299873352, 0.13881179690361023, 0.14425675570964813, 0.14970171451568604]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 12.0, 12.0, 19.0, 31.0, 44.0, 61.0, 107.0, 167.0, 248.0, 478.0, 764.0, 1379.0, 2557.0, 5726.0, 15952.0, 95472.0, 2379714.0, 1594299.0, 72640.0, 13828.0, 5181.0, 2437.0, 1237.0, 715.0, 420.0, 261.0, 185.0, 115.0, 58.0, 49.0, 30.0, 18.0, 25.0, 11.0, 3.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0241241455078125, -0.0233919620513916, -0.022659778594970703, -0.021927595138549805, -0.021195411682128906, -0.020463228225708008, -0.01973104476928711, -0.01899886131286621, -0.018266677856445312, -0.017534494400024414, -0.016802310943603516, -0.016070127487182617, -0.015337944030761719, -0.01460576057434082, -0.013873577117919922, -0.013141393661499023, -0.012409210205078125, -0.011677026748657227, -0.010944843292236328, -0.01021265983581543, -0.009480476379394531, -0.008748292922973633, -0.008016109466552734, -0.007283926010131836, -0.0065517425537109375, -0.005819559097290039, -0.005087375640869141, -0.004355192184448242, -0.0036230087280273438, -0.0028908252716064453, -0.002158641815185547, -0.0014264583587646484, -0.00069427490234375, 3.790855407714844e-05, 0.0007700920104980469, 0.0015022754669189453, 0.0022344589233398438, 0.002966642379760742, 0.0036988258361816406, 0.004431009292602539, 0.0051631927490234375, 0.005895376205444336, 0.006627559661865234, 0.007359743118286133, 0.008091926574707031, 0.00882411003112793, 0.009556293487548828, 0.010288476943969727, 0.011020660400390625, 0.011752843856811523, 0.012485027313232422, 0.01321721076965332, 0.013949394226074219, 0.014681577682495117, 0.015413761138916016, 0.016145944595336914, 0.016878128051757812, 0.01761031150817871, 0.01834249496459961, 0.019074678421020508, 0.019806861877441406, 0.020539045333862305, 0.021271228790283203, 0.0220034122467041, 0.022735595703125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 10.0, 8.0, 9.0, 10.0, 21.0, 29.0, 38.0, 43.0, 53.0, 53.0, 57.0, 66.0, 59.0, 71.0, 78.0, 54.0, 49.0, 56.0, 42.0, 38.0, 26.0, 22.0, 19.0, 16.0, 11.0, 11.0, 12.0, 12.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.015716552734375, -0.015274763107299805, -0.01483297348022461, -0.014391183853149414, -0.013949394226074219, -0.013507604598999023, -0.013065814971923828, -0.012624025344848633, -0.012182235717773438, -0.011740446090698242, -0.011298656463623047, -0.010856866836547852, -0.010415077209472656, -0.009973287582397461, -0.009531497955322266, -0.00908970832824707, -0.008647918701171875, -0.00820612907409668, -0.007764339447021484, -0.007322549819946289, -0.006880760192871094, -0.0064389705657958984, -0.005997180938720703, -0.005555391311645508, -0.0051136016845703125, -0.004671812057495117, -0.004230022430419922, -0.0037882328033447266, -0.0033464431762695312, -0.002904653549194336, -0.0024628639221191406, -0.0020210742950439453, -0.00157928466796875, -0.0011374950408935547, -0.0006957054138183594, -0.00025391578674316406, 0.00018787384033203125, 0.0006296634674072266, 0.0010714530944824219, 0.0015132427215576172, 0.0019550323486328125, 0.002396821975708008, 0.002838611602783203, 0.0032804012298583984, 0.0037221908569335938, 0.004163980484008789, 0.004605770111083984, 0.00504755973815918, 0.005489349365234375, 0.00593113899230957, 0.006372928619384766, 0.006814718246459961, 0.007256507873535156, 0.0076982975006103516, 0.008140087127685547, 0.008581876754760742, 0.009023666381835938, 0.009465456008911133, 0.009907245635986328, 0.010349035263061523, 0.010790824890136719, 0.011232614517211914, 0.01167440414428711, 0.012116193771362305, 0.0125579833984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 7.0, 10.0, 10.0, 22.0, 25.0, 40.0, 62.0, 75.0, 127.0, 448.0, 4356.0, 3484205.0, 700659.0, 3371.0, 375.0, 147.0, 93.0, 76.0, 49.0, 30.0, 30.0, 20.0, 9.0, 10.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.184326171875, -0.1795940399169922, -0.17486190795898438, -0.17012977600097656, -0.16539764404296875, -0.16066551208496094, -0.15593338012695312, -0.1512012481689453, -0.1464691162109375, -0.1417369842529297, -0.13700485229492188, -0.13227272033691406, -0.12754058837890625, -0.12280845642089844, -0.11807632446289062, -0.11334419250488281, -0.108612060546875, -0.10387992858886719, -0.09914779663085938, -0.09441566467285156, -0.08968353271484375, -0.08495140075683594, -0.08021926879882812, -0.07548713684082031, -0.0707550048828125, -0.06602287292480469, -0.061290740966796875, -0.05655860900878906, -0.05182647705078125, -0.04709434509277344, -0.042362213134765625, -0.03763008117675781, -0.03289794921875, -0.028165817260742188, -0.023433685302734375, -0.018701553344726562, -0.01396942138671875, -0.009237289428710938, -0.004505157470703125, 0.0002269744873046875, 0.0049591064453125, 0.009691238403320312, 0.014423370361328125, 0.019155502319335938, 0.02388763427734375, 0.028619766235351562, 0.033351898193359375, 0.03808403015136719, 0.042816162109375, 0.04754829406738281, 0.052280426025390625, 0.05701255798339844, 0.06174468994140625, 0.06647682189941406, 0.07120895385742188, 0.07594108581542969, 0.0806732177734375, 0.08540534973144531, 0.09013748168945312, 0.09486961364746094, 0.09960174560546875, 0.10433387756347656, 0.10906600952148438, 0.11379814147949219, 0.1185302734375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 18.0, 23.0, 46.0, 152.0, 1236.0, 2195.0, 258.0, 79.0, 47.0, 11.0, 7.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040008544921875, -0.03718423843383789, -0.03435993194580078, -0.03153562545776367, -0.028711318969726562, -0.025887012481689453, -0.023062705993652344, -0.020238399505615234, -0.017414093017578125, -0.014589786529541016, -0.011765480041503906, -0.008941173553466797, -0.0061168670654296875, -0.003292560577392578, -0.00046825408935546875, 0.0023560523986816406, 0.00518035888671875, 0.00800466537475586, 0.010828971862792969, 0.013653278350830078, 0.016477584838867188, 0.019301891326904297, 0.022126197814941406, 0.024950504302978516, 0.027774810791015625, 0.030599117279052734, 0.033423423767089844, 0.03624773025512695, 0.03907203674316406, 0.04189634323120117, 0.04472064971923828, 0.04754495620727539, 0.0503692626953125, 0.05319356918334961, 0.05601787567138672, 0.05884218215942383, 0.06166648864746094, 0.06449079513549805, 0.06731510162353516, 0.07013940811157227, 0.07296371459960938, 0.07578802108764648, 0.0786123275756836, 0.0814366340637207, 0.08426094055175781, 0.08708524703979492, 0.08990955352783203, 0.09273386001586914, 0.09555816650390625, 0.09838247299194336, 0.10120677947998047, 0.10403108596801758, 0.10685539245605469, 0.1096796989440918, 0.1125040054321289, 0.11532831192016602, 0.11815261840820312, 0.12097692489624023, 0.12380123138427734, 0.12662553787231445, 0.12944984436035156, 0.13227415084838867, 0.13509845733642578, 0.1379227638244629, 0.1407470703125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 7.0, 12.0, 21.0, 30.0, 41.0, 80.0, 105.0, 150.0, 149.0, 131.0, 84.0, 67.0, 45.0, 26.0, 20.0, 9.0, 7.0, 3.0, 5.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20781758427619934, -0.19840659201145172, -0.1889955997467041, -0.17958460748195648, -0.17017361521720886, -0.16076262295246124, -0.15135163068771362, -0.141940638422966, -0.13252964615821838, -0.12311865389347076, -0.11370766162872314, -0.10429666936397552, -0.0948856770992279, -0.08547468483448029, -0.07606369256973267, -0.06665270030498505, -0.05724170804023743, -0.04783071577548981, -0.03841972351074219, -0.029008731245994568, -0.019597738981246948, -0.010186746716499329, -0.000775754451751709, 0.00863523781299591, 0.01804623007774353, 0.02745722234249115, 0.03686821460723877, 0.04627920687198639, 0.05569019913673401, 0.06510119140148163, 0.07451218366622925, 0.08392317593097687, 0.09333419799804688, 0.1027451902627945, 0.11215618252754211, 0.12156717479228973, 0.13097816705703735, 0.14038915932178497, 0.1498001515865326, 0.1592111438512802, 0.16862213611602783, 0.17803312838077545, 0.18744412064552307, 0.1968551129102707, 0.2062661051750183, 0.21567709743976593, 0.22508808970451355, 0.23449908196926117, 0.2439100742340088, 0.2533210515975952, 0.26273205876350403, 0.27214306592941284, 0.28155404329299927, 0.2909650206565857, 0.3003760278224945, 0.3097870349884033, 0.31919801235198975, 0.32860898971557617, 0.338019996881485, 0.3474310040473938, 0.3568419814109802, 0.36625295877456665, 0.37566396594047546, 0.3850749731063843, 0.3944859504699707]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 7.0, 4.0, 8.0, 9.0, 11.0, 14.0, 14.0, 19.0, 24.0, 30.0, 26.0, 43.0, 41.0, 41.0, 63.0, 34.0, 52.0, 52.0, 54.0, 55.0, 42.0, 45.0, 46.0, 31.0, 44.0, 38.0, 28.0, 33.0, 19.0, 17.0, 16.0, 8.0, 6.0, 2.0, 10.0, 6.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.18049389123916626, -0.17510296404361725, -0.16971203684806824, -0.16432110965251923, -0.15893018245697021, -0.15353924036026, -0.148148313164711, -0.142757385969162, -0.13736645877361298, -0.13197553157806396, -0.12658460438251495, -0.12119366973638535, -0.11580274254083633, -0.11041181534528732, -0.10502088069915771, -0.0996299535036087, -0.09423902630805969, -0.08884809911251068, -0.08345717191696167, -0.07806623727083206, -0.07267531007528305, -0.06728438287973404, -0.06189345195889473, -0.05650252103805542, -0.05111159384250641, -0.0457206666469574, -0.04032973572611809, -0.03493880480527878, -0.029547877609729767, -0.024156948551535606, -0.018766019493341446, -0.013375088572502136, -0.007984161376953125, -0.0025932323187589645, 0.002797696739435196, 0.008188625797629356, 0.013579554855823517, 0.018970483914017677, 0.024361412972211838, 0.029752343893051147, 0.03514327108860016, 0.04053419828414917, 0.04592512920498848, 0.05131606012582779, 0.0567069873213768, 0.06209791451692581, 0.06748884916305542, 0.07287977635860443, 0.07827070355415344, 0.08366163074970245, 0.08905255794525146, 0.09444349259138107, 0.09983441978693008, 0.1052253469824791, 0.1106162816286087, 0.11600720882415771, 0.12139813601970673, 0.12678906321525574, 0.13217999041080475, 0.13757091760635376, 0.14296185970306396, 0.14835278689861298, 0.153743714094162, 0.159134641289711, 0.16452556848526]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 12.0, 15.0, 13.0, 33.0, 50.0, 91.0, 128.0, 201.0, 307.0, 501.0, 766.0, 1326.0, 2253.0, 4161.0, 7972.0, 16474.0, 38009.0, 108706.0, 378643.0, 329766.0, 93974.0, 33950.0, 14989.0, 7233.0, 3773.0, 2068.0, 1183.0, 697.0, 432.0, 278.0, 171.0, 124.0, 73.0, 69.0, 29.0, 18.0, 17.0, 15.0, 7.0, 10.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0299530029296875, -0.029015064239501953, -0.028077125549316406, -0.02713918685913086, -0.026201248168945312, -0.025263309478759766, -0.02432537078857422, -0.023387432098388672, -0.022449493408203125, -0.021511554718017578, -0.02057361602783203, -0.019635677337646484, -0.018697738647460938, -0.01775979995727539, -0.016821861267089844, -0.015883922576904297, -0.01494598388671875, -0.014008045196533203, -0.013070106506347656, -0.01213216781616211, -0.011194229125976562, -0.010256290435791016, -0.009318351745605469, -0.008380413055419922, -0.007442474365234375, -0.006504535675048828, -0.005566596984863281, -0.004628658294677734, -0.0036907196044921875, -0.0027527809143066406, -0.0018148422241210938, -0.0008769035339355469, 6.103515625e-05, 0.0009989738464355469, 0.0019369125366210938, 0.0028748512268066406, 0.0038127899169921875, 0.004750728607177734, 0.005688667297363281, 0.006626605987548828, 0.007564544677734375, 0.008502483367919922, 0.009440422058105469, 0.010378360748291016, 0.011316299438476562, 0.01225423812866211, 0.013192176818847656, 0.014130115509033203, 0.01506805419921875, 0.016005992889404297, 0.016943931579589844, 0.01788187026977539, 0.018819808959960938, 0.019757747650146484, 0.02069568634033203, 0.021633625030517578, 0.022571563720703125, 0.023509502410888672, 0.02444744110107422, 0.025385379791259766, 0.026323318481445312, 0.02726125717163086, 0.028199195861816406, 0.029137134552001953, 0.0300750732421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 7.0, 5.0, 1.0, 8.0, 13.0, 7.0, 13.0, 17.0, 13.0, 27.0, 22.0, 37.0, 48.0, 41.0, 59.0, 53.0, 52.0, 58.0, 60.0, 64.0, 59.0, 51.0, 41.0, 41.0, 33.0, 23.0, 24.0, 18.0, 24.0, 18.0, 14.0, 14.0, 12.0, 6.0, 6.0, 9.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0151824951171875, -0.01474153995513916, -0.01430058479309082, -0.01385962963104248, -0.01341867446899414, -0.0129777193069458, -0.012536764144897461, -0.012095808982849121, -0.011654853820800781, -0.011213898658752441, -0.010772943496704102, -0.010331988334655762, -0.009891033172607422, -0.009450078010559082, -0.009009122848510742, -0.008568167686462402, -0.008127212524414062, -0.007686257362365723, -0.007245302200317383, -0.006804347038269043, -0.006363391876220703, -0.005922436714172363, -0.0054814815521240234, -0.005040526390075684, -0.004599571228027344, -0.004158616065979004, -0.003717660903930664, -0.0032767057418823242, -0.0028357505798339844, -0.0023947954177856445, -0.0019538402557373047, -0.0015128850936889648, -0.001071929931640625, -0.0006309747695922852, -0.0001900196075439453, 0.00025093555450439453, 0.0006918907165527344, 0.0011328458786010742, 0.001573801040649414, 0.002014756202697754, 0.0024557113647460938, 0.0028966665267944336, 0.0033376216888427734, 0.0037785768508911133, 0.004219532012939453, 0.004660487174987793, 0.005101442337036133, 0.005542397499084473, 0.0059833526611328125, 0.006424307823181152, 0.006865262985229492, 0.007306218147277832, 0.007747173309326172, 0.008188128471374512, 0.008629083633422852, 0.009070038795471191, 0.009510993957519531, 0.009951949119567871, 0.010392904281616211, 0.01083385944366455, 0.01127481460571289, 0.01171576976776123, 0.01215672492980957, 0.01259768009185791, 0.01303863525390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 11.0, 9.0, 15.0, 20.0, 23.0, 36.0, 68.0, 85.0, 115.0, 172.0, 248.0, 424.0, 662.0, 1215.0, 2300.0, 4546.0, 10390.0, 28975.0, 102582.0, 625719.0, 194943.0, 46918.0, 15789.0, 6399.0, 3004.0, 1560.0, 872.0, 508.0, 311.0, 200.0, 120.0, 97.0, 62.0, 46.0, 24.0, 20.0, 21.0, 15.0, 9.0, 3.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.033782958984375, -0.03264570236206055, -0.031508445739746094, -0.03037118911743164, -0.029233932495117188, -0.028096675872802734, -0.02695941925048828, -0.025822162628173828, -0.024684906005859375, -0.023547649383544922, -0.02241039276123047, -0.021273136138916016, -0.020135879516601562, -0.01899862289428711, -0.017861366271972656, -0.016724109649658203, -0.01558685302734375, -0.014449596405029297, -0.013312339782714844, -0.01217508316040039, -0.011037826538085938, -0.009900569915771484, -0.008763313293457031, -0.007626056671142578, -0.006488800048828125, -0.005351543426513672, -0.004214286804199219, -0.0030770301818847656, -0.0019397735595703125, -0.0008025169372558594, 0.00033473968505859375, 0.0014719963073730469, 0.0026092529296875, 0.003746509552001953, 0.004883766174316406, 0.006021022796630859, 0.0071582794189453125, 0.008295536041259766, 0.009432792663574219, 0.010570049285888672, 0.011707305908203125, 0.012844562530517578, 0.013981819152832031, 0.015119075775146484, 0.016256332397460938, 0.01739358901977539, 0.018530845642089844, 0.019668102264404297, 0.02080535888671875, 0.021942615509033203, 0.023079872131347656, 0.02421712875366211, 0.025354385375976562, 0.026491641998291016, 0.02762889862060547, 0.028766155242919922, 0.029903411865234375, 0.031040668487548828, 0.03217792510986328, 0.033315181732177734, 0.03445243835449219, 0.03558969497680664, 0.036726951599121094, 0.03786420822143555, 0.03900146484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 4.0, 9.0, 8.0, 4.0, 11.0, 7.0, 14.0, 14.0, 30.0, 25.0, 32.0, 36.0, 39.0, 36.0, 58.0, 34.0, 62.0, 56.0, 51.0, 44.0, 54.0, 51.0, 52.0, 34.0, 40.0, 40.0, 23.0, 29.0, 20.0, 21.0, 16.0, 10.0, 11.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0552978515625, -0.05356597900390625, -0.0518341064453125, -0.05010223388671875, -0.048370361328125, -0.04663848876953125, -0.0449066162109375, -0.04317474365234375, -0.04144287109375, -0.03971099853515625, -0.0379791259765625, -0.03624725341796875, -0.034515380859375, -0.03278350830078125, -0.0310516357421875, -0.02931976318359375, -0.027587890625, -0.02585601806640625, -0.0241241455078125, -0.02239227294921875, -0.020660400390625, -0.01892852783203125, -0.0171966552734375, -0.01546478271484375, -0.01373291015625, -0.01200103759765625, -0.0102691650390625, -0.00853729248046875, -0.006805419921875, -0.00507354736328125, -0.0033416748046875, -0.00160980224609375, 0.0001220703125, 0.00185394287109375, 0.0035858154296875, 0.00531768798828125, 0.007049560546875, 0.00878143310546875, 0.0105133056640625, 0.01224517822265625, 0.01397705078125, 0.01570892333984375, 0.0174407958984375, 0.01917266845703125, 0.020904541015625, 0.02263641357421875, 0.0243682861328125, 0.02610015869140625, 0.02783203125, 0.02956390380859375, 0.0312957763671875, 0.03302764892578125, 0.034759521484375, 0.03649139404296875, 0.0382232666015625, 0.03995513916015625, 0.04168701171875, 0.04341888427734375, 0.0451507568359375, 0.04688262939453125, 0.048614501953125, 0.05034637451171875, 0.0520782470703125, 0.05381011962890625, 0.0555419921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 10.0, 2.0, 12.0, 11.0, 22.0, 21.0, 35.0, 34.0, 70.0, 85.0, 162.0, 296.0, 568.0, 1313.0, 3792.0, 15394.0, 136521.0, 838731.0, 39619.0, 7649.0, 2307.0, 876.0, 424.0, 214.0, 120.0, 75.0, 64.0, 35.0, 18.0, 16.0, 10.0, 17.0, 6.0, 8.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.040740966796875, -0.03958559036254883, -0.038430213928222656, -0.037274837493896484, -0.03611946105957031, -0.03496408462524414, -0.03380870819091797, -0.0326533317565918, -0.031497955322265625, -0.030342578887939453, -0.02918720245361328, -0.02803182601928711, -0.026876449584960938, -0.025721073150634766, -0.024565696716308594, -0.023410320281982422, -0.02225494384765625, -0.021099567413330078, -0.019944190979003906, -0.018788814544677734, -0.017633438110351562, -0.01647806167602539, -0.015322685241699219, -0.014167308807373047, -0.013011932373046875, -0.011856555938720703, -0.010701179504394531, -0.00954580307006836, -0.008390426635742188, -0.007235050201416016, -0.006079673767089844, -0.004924297332763672, -0.0037689208984375, -0.002613544464111328, -0.0014581680297851562, -0.0003027915954589844, 0.0008525848388671875, 0.0020079612731933594, 0.0031633377075195312, 0.004318714141845703, 0.005474090576171875, 0.006629467010498047, 0.007784843444824219, 0.00894021987915039, 0.010095596313476562, 0.011250972747802734, 0.012406349182128906, 0.013561725616455078, 0.01471710205078125, 0.015872478485107422, 0.017027854919433594, 0.018183231353759766, 0.019338607788085938, 0.02049398422241211, 0.02164936065673828, 0.022804737091064453, 0.023960113525390625, 0.025115489959716797, 0.02627086639404297, 0.02742624282836914, 0.028581619262695312, 0.029736995697021484, 0.030892372131347656, 0.03204774856567383, 0.033203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 8.0, 11.0, 23.0, 46.0, 101.0, 150.0, 232.0, 206.0, 95.0, 58.0, 29.0, 16.0, 11.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013327598571777344, -0.00012918561697006226, -0.00012509524822235107, -0.00012100487947463989, -0.00011691451072692871, -0.00011282414197921753, -0.00010873377323150635, -0.00010464340448379517, -0.00010055303573608398, -9.64626669883728e-05, -9.237229824066162e-05, -8.828192949295044e-05, -8.419156074523926e-05, -8.010119199752808e-05, -7.60108232498169e-05, -7.192045450210571e-05, -6.783008575439453e-05, -6.373971700668335e-05, -5.964934825897217e-05, -5.5558979511260986e-05, -5.1468610763549805e-05, -4.737824201583862e-05, -4.328787326812744e-05, -3.919750452041626e-05, -3.510713577270508e-05, -3.1016767024993896e-05, -2.6926398277282715e-05, -2.2836029529571533e-05, -1.874566078186035e-05, -1.465529203414917e-05, -1.0564923286437988e-05, -6.474554538726807e-06, -2.384185791015625e-06, 1.7061829566955566e-06, 5.796551704406738e-06, 9.88692045211792e-06, 1.3977289199829102e-05, 1.8067657947540283e-05, 2.2158026695251465e-05, 2.6248395442962646e-05, 3.0338764190673828e-05, 3.442913293838501e-05, 3.851950168609619e-05, 4.260987043380737e-05, 4.6700239181518555e-05, 5.0790607929229736e-05, 5.488097667694092e-05, 5.89713454246521e-05, 6.306171417236328e-05, 6.715208292007446e-05, 7.124245166778564e-05, 7.533282041549683e-05, 7.942318916320801e-05, 8.351355791091919e-05, 8.760392665863037e-05, 9.169429540634155e-05, 9.578466415405273e-05, 9.987503290176392e-05, 0.0001039654016494751, 0.00010805577039718628, 0.00011214613914489746, 0.00011623650789260864, 0.00012032687664031982, 0.000124417245388031, 0.0001285076141357422]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 8.0, 8.0, 8.0, 15.0, 16.0, 25.0, 29.0, 39.0, 71.0, 87.0, 147.0, 224.0, 394.0, 775.0, 1585.0, 3983.0, 14239.0, 99316.0, 851896.0, 58889.0, 10376.0, 3302.0, 1444.0, 690.0, 363.0, 188.0, 136.0, 92.0, 69.0, 42.0, 27.0, 20.0, 8.0, 7.0, 7.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028594970703125, -0.027587890625, -0.026580810546875, -0.02557373046875, -0.024566650390625, -0.0235595703125, -0.022552490234375, -0.02154541015625, -0.020538330078125, -0.01953125, -0.018524169921875, -0.01751708984375, -0.016510009765625, -0.0155029296875, -0.014495849609375, -0.01348876953125, -0.012481689453125, -0.011474609375, -0.010467529296875, -0.00946044921875, -0.008453369140625, -0.0074462890625, -0.006439208984375, -0.00543212890625, -0.004425048828125, -0.00341796875, -0.002410888671875, -0.00140380859375, -0.000396728515625, 0.0006103515625, 0.001617431640625, 0.00262451171875, 0.003631591796875, 0.004638671875, 0.005645751953125, 0.00665283203125, 0.007659912109375, 0.0086669921875, 0.009674072265625, 0.01068115234375, 0.011688232421875, 0.0126953125, 0.013702392578125, 0.01470947265625, 0.015716552734375, 0.0167236328125, 0.017730712890625, 0.01873779296875, 0.019744873046875, 0.020751953125, 0.021759033203125, 0.02276611328125, 0.023773193359375, 0.0247802734375, 0.025787353515625, 0.02679443359375, 0.027801513671875, 0.02880859375, 0.029815673828125, 0.03082275390625, 0.031829833984375, 0.0328369140625, 0.033843994140625, 0.03485107421875, 0.035858154296875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 2.0, 4.0, 6.0, 10.0, 19.0, 29.0, 39.0, 56.0, 82.0, 126.0, 189.0, 149.0, 95.0, 57.0, 40.0, 33.0, 22.0, 5.0, 9.0, 9.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.035888671875, -0.035117506980895996, -0.03434634208679199, -0.03357517719268799, -0.032804012298583984, -0.03203284740447998, -0.03126168251037598, -0.030490517616271973, -0.02971935272216797, -0.028948187828063965, -0.02817702293395996, -0.027405858039855957, -0.026634693145751953, -0.02586352825164795, -0.025092363357543945, -0.02432119846343994, -0.023550033569335938, -0.022778868675231934, -0.02200770378112793, -0.021236538887023926, -0.020465373992919922, -0.019694209098815918, -0.018923044204711914, -0.01815187931060791, -0.017380714416503906, -0.016609549522399902, -0.0158383846282959, -0.015067219734191895, -0.01429605484008789, -0.013524889945983887, -0.012753725051879883, -0.011982560157775879, -0.011211395263671875, -0.010440230369567871, -0.009669065475463867, -0.008897900581359863, -0.00812673568725586, -0.0073555707931518555, -0.0065844058990478516, -0.005813241004943848, -0.005042076110839844, -0.00427091121673584, -0.003499746322631836, -0.002728581428527832, -0.001957416534423828, -0.0011862516403198242, -0.0004150867462158203, 0.0003560781478881836, 0.0011272430419921875, 0.0018984079360961914, 0.0026695728302001953, 0.0034407377243041992, 0.004211902618408203, 0.004983067512512207, 0.005754232406616211, 0.006525397300720215, 0.007296562194824219, 0.008067727088928223, 0.008838891983032227, 0.00961005687713623, 0.010381221771240234, 0.011152386665344238, 0.011923551559448242, 0.012694716453552246, 0.01346588134765625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 14.0, 21.0, 32.0, 49.0, 78.0, 170.0, 365.0, 150.0, 72.0, 26.0, 16.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5270462036132812, -0.5084968209266663, -0.48994749784469604, -0.47139811515808105, -0.45284876227378845, -0.43429940938949585, -0.41575002670288086, -0.39720067381858826, -0.37865132093429565, -0.36010196805000305, -0.34155261516571045, -0.32300323247909546, -0.30445387959480286, -0.28590452671051025, -0.26735514402389526, -0.24880579113960266, -0.23025643825531006, -0.21170708537101746, -0.19315771758556366, -0.17460834980010986, -0.15605899691581726, -0.13750964403152466, -0.11896027624607086, -0.10041090846061707, -0.08186155557632446, -0.06331219524145126, -0.044762834906578064, -0.026213474571704865, -0.007664114236831665, 0.010885246098041534, 0.029434606432914734, 0.04798397421836853, 0.06653332710266113, 0.08508268743753433, 0.10363204777240753, 0.12218140810728073, 0.14073076844215393, 0.15928012132644653, 0.17782948911190033, 0.19637885689735413, 0.21492820978164673, 0.23347756266593933, 0.25202691555023193, 0.2705762982368469, 0.2891256511211395, 0.30767500400543213, 0.3262243866920471, 0.3447737395763397, 0.3633230924606323, 0.3818724453449249, 0.40042179822921753, 0.4189711809158325, 0.4375205338001251, 0.4560698866844177, 0.4746192693710327, 0.4931686222553253, 0.5117179751396179, 0.5302673578262329, 0.5488166809082031, 0.5673660635948181, 0.5859154462814331, 0.6044647693634033, 0.6230141520500183, 0.6415635347366333, 0.6601128578186035]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 4.0, 10.0, 8.0, 8.0, 12.0, 16.0, 8.0, 13.0, 15.0, 24.0, 22.0, 22.0, 32.0, 33.0, 30.0, 51.0, 64.0, 114.0, 98.0, 60.0, 50.0, 53.0, 31.0, 33.0, 27.0, 27.0, 13.0, 15.0, 15.0, 14.0, 5.0, 15.0, 16.0, 12.0, 8.0, 7.0, 6.0, 1.0, 4.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2553887367248535, -0.24745464324951172, -0.23952054977416992, -0.23158645629882812, -0.22365237772464752, -0.21571828424930573, -0.20778419077396393, -0.19985009729862213, -0.19191601872444153, -0.18398192524909973, -0.17604783177375793, -0.16811373829841614, -0.16017965972423553, -0.15224556624889374, -0.14431147277355194, -0.13637737929821014, -0.12844328582286835, -0.12050919234752655, -0.11257510632276535, -0.10464101284742355, -0.09670692682266235, -0.08877283334732056, -0.08083873987197876, -0.07290464639663696, -0.06497056037187576, -0.057036470621824265, -0.049102380871772766, -0.04116828739643097, -0.03323419764637947, -0.025300107896327972, -0.017366014420986176, -0.009431924670934677, -0.0014978349208831787, 0.006436255760490894, 0.014370346441864967, 0.022304438054561615, 0.030238527804613113, 0.03817261755466461, 0.04610671103000641, 0.05404080078005791, 0.061974890530109406, 0.0699089840054512, 0.0778430700302124, 0.0857771635055542, 0.093711256980896, 0.1016453430056572, 0.10957943648099899, 0.11751352250576019, 0.125447615981102, 0.1333817094564438, 0.14131580293178558, 0.1492498815059662, 0.15718397498130798, 0.16511806845664978, 0.17305216193199158, 0.18098625540733337, 0.18892034888267517, 0.19685444235801697, 0.20478853583335876, 0.21272262930870056, 0.22065670788288116, 0.22859080135822296, 0.23652489483356476, 0.24445898830890656, 0.25239306688308716]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 10.0, 7.0, 7.0, 19.0, 22.0, 21.0, 32.0, 51.0, 66.0, 105.0, 128.0, 176.0, 224.0, 300.0, 443.0, 824.0, 1628.0, 4864.0, 23428.0, 745697.0, 3354164.0, 49361.0, 7617.0, 2326.0, 933.0, 525.0, 348.0, 249.0, 187.0, 126.0, 95.0, 63.0, 55.0, 42.0, 33.0, 20.0, 21.0, 12.0, 13.0, 9.0, 8.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.067138671875, -0.06498432159423828, -0.06282997131347656, -0.060675621032714844, -0.058521270751953125, -0.056366920471191406, -0.05421257019042969, -0.05205821990966797, -0.04990386962890625, -0.04774951934814453, -0.04559516906738281, -0.043440818786621094, -0.041286468505859375, -0.039132118225097656, -0.03697776794433594, -0.03482341766357422, -0.0326690673828125, -0.03051471710205078, -0.028360366821289062, -0.026206016540527344, -0.024051666259765625, -0.021897315979003906, -0.019742965698242188, -0.01758861541748047, -0.01543426513671875, -0.013279914855957031, -0.011125564575195312, -0.008971214294433594, -0.006816864013671875, -0.004662513732910156, -0.0025081634521484375, -0.00035381317138671875, 0.001800537109375, 0.003954887390136719, 0.0061092376708984375, 0.008263587951660156, 0.010417938232421875, 0.012572288513183594, 0.014726638793945312, 0.01688098907470703, 0.01903533935546875, 0.02118968963623047, 0.023344039916992188, 0.025498390197753906, 0.027652740478515625, 0.029807090759277344, 0.03196144104003906, 0.03411579132080078, 0.0362701416015625, 0.03842449188232422, 0.04057884216308594, 0.042733192443847656, 0.044887542724609375, 0.047041893005371094, 0.04919624328613281, 0.05135059356689453, 0.05350494384765625, 0.05565929412841797, 0.05781364440917969, 0.059967994689941406, 0.062122344970703125, 0.06427669525146484, 0.06643104553222656, 0.06858539581298828, 0.07073974609375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 3.0, 6.0, 11.0, 6.0, 10.0, 13.0, 19.0, 18.0, 31.0, 40.0, 39.0, 47.0, 65.0, 52.0, 62.0, 69.0, 58.0, 64.0, 59.0, 49.0, 55.0, 35.0, 34.0, 23.0, 21.0, 17.0, 16.0, 10.0, 14.0, 15.0, 2.0, 6.0, 5.0, 1.0, 5.0, 1.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01580810546875, -0.015344977378845215, -0.01488184928894043, -0.014418721199035645, -0.01395559310913086, -0.013492465019226074, -0.013029336929321289, -0.012566208839416504, -0.012103080749511719, -0.011639952659606934, -0.011176824569702148, -0.010713696479797363, -0.010250568389892578, -0.009787440299987793, -0.009324312210083008, -0.008861184120178223, -0.008398056030273438, -0.007934927940368652, -0.007471799850463867, -0.007008671760559082, -0.006545543670654297, -0.006082415580749512, -0.0056192874908447266, -0.005156159400939941, -0.004693031311035156, -0.004229903221130371, -0.003766775131225586, -0.0033036470413208008, -0.0028405189514160156, -0.0023773908615112305, -0.0019142627716064453, -0.0014511346817016602, -0.000988006591796875, -0.0005248785018920898, -6.175041198730469e-05, 0.00040137767791748047, 0.0008645057678222656, 0.0013276338577270508, 0.001790761947631836, 0.002253890037536621, 0.0027170181274414062, 0.0031801462173461914, 0.0036432743072509766, 0.004106402397155762, 0.004569530487060547, 0.005032658576965332, 0.005495786666870117, 0.005958914756774902, 0.0064220428466796875, 0.006885170936584473, 0.007348299026489258, 0.007811427116394043, 0.008274555206298828, 0.008737683296203613, 0.009200811386108398, 0.009663939476013184, 0.010127067565917969, 0.010590195655822754, 0.011053323745727539, 0.011516451835632324, 0.01197957992553711, 0.012442708015441895, 0.01290583610534668, 0.013368964195251465, 0.01383209228515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 6.0, 14.0, 24.0, 41.0, 65.0, 148.0, 188.0, 383.0, 834.0, 2551.0, 48906.0, 4111047.0, 26448.0, 1996.0, 759.0, 394.0, 210.0, 121.0, 68.0, 34.0, 24.0, 7.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.108154296875, -0.10258674621582031, -0.09701919555664062, -0.09145164489746094, -0.08588409423828125, -0.08031654357910156, -0.07474899291992188, -0.06918144226074219, -0.0636138916015625, -0.05804634094238281, -0.052478790283203125, -0.04691123962402344, -0.04134368896484375, -0.03577613830566406, -0.030208587646484375, -0.024641036987304688, -0.019073486328125, -0.013505935668945312, -0.007938385009765625, -0.0023708343505859375, 0.00319671630859375, 0.008764266967773438, 0.014331817626953125, 0.019899368286132812, 0.0254669189453125, 0.031034469604492188, 0.036602020263671875, 0.04216957092285156, 0.04773712158203125, 0.05330467224121094, 0.058872222900390625, 0.06443977355957031, 0.07000732421875, 0.07557487487792969, 0.08114242553710938, 0.08670997619628906, 0.09227752685546875, 0.09784507751464844, 0.10341262817382812, 0.10898017883300781, 0.1145477294921875, 0.12011528015136719, 0.12568283081054688, 0.13125038146972656, 0.13681793212890625, 0.14238548278808594, 0.14795303344726562, 0.1535205841064453, 0.159088134765625, 0.1646556854248047, 0.17022323608398438, 0.17579078674316406, 0.18135833740234375, 0.18692588806152344, 0.19249343872070312, 0.1980609893798828, 0.2036285400390625, 0.2091960906982422, 0.21476364135742188, 0.22033119201660156, 0.22589874267578125, 0.23146629333496094, 0.23703384399414062, 0.2426013946533203, 0.2481689453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 12.0, 33.0, 48.0, 131.0, 425.0, 1677.0, 1249.0, 272.0, 116.0, 41.0, 28.0, 13.0, 8.0, 9.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1024169921875, -0.09898185729980469, -0.09554672241210938, -0.09211158752441406, -0.08867645263671875, -0.08524131774902344, -0.08180618286132812, -0.07837104797363281, -0.0749359130859375, -0.07150077819824219, -0.06806564331054688, -0.06463050842285156, -0.06119537353515625, -0.05776023864746094, -0.054325103759765625, -0.05088996887207031, -0.047454833984375, -0.04401969909667969, -0.040584564208984375, -0.03714942932128906, -0.03371429443359375, -0.030279159545898438, -0.026844024658203125, -0.023408889770507812, -0.0199737548828125, -0.016538619995117188, -0.013103485107421875, -0.009668350219726562, -0.00623321533203125, -0.0027980804443359375, 0.000637054443359375, 0.0040721893310546875, 0.00750732421875, 0.010942459106445312, 0.014377593994140625, 0.017812728881835938, 0.02124786376953125, 0.024682998657226562, 0.028118133544921875, 0.03155326843261719, 0.0349884033203125, 0.03842353820800781, 0.041858673095703125, 0.04529380798339844, 0.04872894287109375, 0.05216407775878906, 0.055599212646484375, 0.05903434753417969, 0.062469482421875, 0.06590461730957031, 0.06933975219726562, 0.07277488708496094, 0.07621002197265625, 0.07964515686035156, 0.08308029174804688, 0.08651542663574219, 0.0899505615234375, 0.09338569641113281, 0.09682083129882812, 0.10025596618652344, 0.10369110107421875, 0.10712623596191406, 0.11056137084960938, 0.11399650573730469, 0.117431640625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 14.0, 26.0, 50.0, 107.0, 244.0, 256.0, 150.0, 70.0, 34.0, 16.0, 15.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4478585422039032, -0.4181429445743561, -0.3884273171424866, -0.35871171951293945, -0.32899612188339233, -0.2992805242538452, -0.2695649266242981, -0.2398492991924286, -0.21013370156288147, -0.18041810393333435, -0.15070249140262604, -0.12098688632249832, -0.0912712812423706, -0.061555683612823486, -0.03184007108211517, -0.0021244585514068604, 0.02759113907814026, 0.057306744158267975, 0.08702234923839569, 0.11673795431852341, 0.14645355939865112, 0.17616915702819824, 0.20588476955890656, 0.23560038208961487, 0.265315979719162, 0.2950315773487091, 0.3247472047805786, 0.35446280241012573, 0.38417840003967285, 0.41389399766921997, 0.4436095952987671, 0.4733252227306366, 0.5030407905578613, 0.5327563881874084, 0.5624719858169556, 0.5921875834465027, 0.6219031810760498, 0.6516188383102417, 0.6813344359397888, 0.7110500335693359, 0.7407656311988831, 0.7704812288284302, 0.8001968264579773, 0.8299124240875244, 0.8596280813217163, 0.8893436193466187, 0.9190592765808105, 0.9487748742103577, 0.9784904718399048, 1.0082061290740967, 1.037921667098999, 1.067637324333191, 1.0973528623580933, 1.1270685195922852, 1.1567840576171875, 1.1864997148513794, 1.2162153720855713, 1.2459310293197632, 1.2756465673446655, 1.3053622245788574, 1.3350777626037598, 1.3647934198379517, 1.394508957862854, 1.424224615097046, 1.4539401531219482]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 12.0, 8.0, 8.0, 12.0, 12.0, 14.0, 27.0, 33.0, 27.0, 52.0, 45.0, 45.0, 59.0, 43.0, 48.0, 44.0, 50.0, 45.0, 38.0, 32.0, 57.0, 47.0, 33.0, 38.0, 47.0, 20.0, 25.0, 18.0, 16.0, 14.0, 13.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.3338594436645508, -0.32600292563438416, -0.31814640760421753, -0.3102899193763733, -0.30243340134620667, -0.29457688331604004, -0.2867203652858734, -0.2788638472557068, -0.27100732922554016, -0.26315081119537354, -0.2552942931652069, -0.24743779003620148, -0.23958127200603485, -0.23172476887702942, -0.2238682508468628, -0.21601173281669617, -0.20815522968769073, -0.2002987116575241, -0.19244220852851868, -0.18458569049835205, -0.17672917246818542, -0.1688726544380188, -0.16101615130901337, -0.15315963327884674, -0.1453031301498413, -0.13744661211967468, -0.12959010899066925, -0.12173359096050262, -0.113877072930336, -0.10602056235074997, -0.09816405177116394, -0.09030753374099731, -0.08245101571083069, -0.07459450513124466, -0.06673798710107803, -0.058881476521492004, -0.05102496221661568, -0.04316844791173935, -0.03531193733215332, -0.027455423027276993, -0.019598908722400665, -0.011742395348846912, -0.0038858819752931595, 0.003970630466938019, 0.011827144771814346, 0.019683659076690674, 0.027540169656276703, 0.03539668396115303, 0.04325319826602936, 0.051109712570905685, 0.05896622687578201, 0.06682273745536804, 0.07467925548553467, 0.0825357660651207, 0.09039227664470673, 0.09824879467487335, 0.10610530525445938, 0.11396181583404541, 0.12181833386421204, 0.12967485189437866, 0.1375313550233841, 0.14538787305355072, 0.15324437618255615, 0.16110089421272278, 0.1689574122428894]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 4.0, 9.0, 4.0, 8.0, 9.0, 12.0, 18.0, 19.0, 31.0, 44.0, 66.0, 90.0, 143.0, 178.0, 275.0, 408.0, 596.0, 935.0, 1522.0, 2705.0, 4572.0, 8516.0, 15962.0, 31530.0, 66145.0, 150707.0, 328890.0, 239764.0, 100170.0, 45453.0, 22480.0, 11778.0, 6401.0, 3460.0, 2054.0, 1257.0, 741.0, 490.0, 328.0, 237.0, 139.0, 100.0, 88.0, 70.0, 38.0, 34.0, 19.0, 18.0, 15.0, 13.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0240325927734375, -0.02325129508972168, -0.02246999740600586, -0.02168869972229004, -0.02090740203857422, -0.0201261043548584, -0.019344806671142578, -0.018563508987426758, -0.017782211303710938, -0.017000913619995117, -0.016219615936279297, -0.015438318252563477, -0.014657020568847656, -0.013875722885131836, -0.013094425201416016, -0.012313127517700195, -0.011531829833984375, -0.010750532150268555, -0.009969234466552734, -0.009187936782836914, -0.008406639099121094, -0.0076253414154052734, -0.006844043731689453, -0.006062746047973633, -0.0052814483642578125, -0.004500150680541992, -0.003718852996826172, -0.0029375553131103516, -0.0021562576293945312, -0.001374959945678711, -0.0005936622619628906, 0.0001876354217529297, 0.00096893310546875, 0.0017502307891845703, 0.0025315284729003906, 0.003312826156616211, 0.004094123840332031, 0.0048754215240478516, 0.005656719207763672, 0.006438016891479492, 0.0072193145751953125, 0.008000612258911133, 0.008781909942626953, 0.009563207626342773, 0.010344505310058594, 0.011125802993774414, 0.011907100677490234, 0.012688398361206055, 0.013469696044921875, 0.014250993728637695, 0.015032291412353516, 0.015813589096069336, 0.016594886779785156, 0.017376184463500977, 0.018157482147216797, 0.018938779830932617, 0.019720077514648438, 0.020501375198364258, 0.021282672882080078, 0.0220639705657959, 0.02284526824951172, 0.02362656593322754, 0.02440786361694336, 0.02518916130065918, 0.025970458984375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 2.0, 4.0, 5.0, 4.0, 11.0, 8.0, 12.0, 13.0, 22.0, 16.0, 25.0, 27.0, 46.0, 52.0, 37.0, 49.0, 50.0, 51.0, 61.0, 49.0, 71.0, 51.0, 43.0, 44.0, 36.0, 34.0, 36.0, 26.0, 29.0, 15.0, 19.0, 11.0, 14.0, 9.0, 6.0, 4.0, 6.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0178070068359375, -0.01725172996520996, -0.016696453094482422, -0.016141176223754883, -0.015585899353027344, -0.015030622482299805, -0.014475345611572266, -0.013920068740844727, -0.013364791870117188, -0.012809514999389648, -0.01225423812866211, -0.01169896125793457, -0.011143684387207031, -0.010588407516479492, -0.010033130645751953, -0.009477853775024414, -0.008922576904296875, -0.008367300033569336, -0.007812023162841797, -0.007256746292114258, -0.006701469421386719, -0.00614619255065918, -0.005590915679931641, -0.0050356388092041016, -0.0044803619384765625, -0.0039250850677490234, -0.0033698081970214844, -0.0028145313262939453, -0.0022592544555664062, -0.0017039775848388672, -0.0011487007141113281, -0.0005934238433837891, -3.814697265625e-05, 0.0005171298980712891, 0.0010724067687988281, 0.0016276836395263672, 0.0021829605102539062, 0.0027382373809814453, 0.0032935142517089844, 0.0038487911224365234, 0.0044040679931640625, 0.0049593448638916016, 0.005514621734619141, 0.00606989860534668, 0.006625175476074219, 0.007180452346801758, 0.007735729217529297, 0.008291006088256836, 0.008846282958984375, 0.009401559829711914, 0.009956836700439453, 0.010512113571166992, 0.011067390441894531, 0.01162266731262207, 0.01217794418334961, 0.012733221054077148, 0.013288497924804688, 0.013843774795532227, 0.014399051666259766, 0.014954328536987305, 0.015509605407714844, 0.016064882278442383, 0.016620159149169922, 0.01717543601989746, 0.017730712890625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 8.0, 16.0, 17.0, 31.0, 35.0, 52.0, 72.0, 116.0, 160.0, 297.0, 478.0, 824.0, 1950.0, 6979.0, 55641.0, 841653.0, 123581.0, 11648.0, 2562.0, 977.0, 537.0, 296.0, 195.0, 124.0, 97.0, 67.0, 34.0, 24.0, 19.0, 12.0, 13.0, 6.0, 4.0, 8.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0714111328125, -0.06891822814941406, -0.06642532348632812, -0.06393241882324219, -0.06143951416015625, -0.05894660949707031, -0.056453704833984375, -0.05396080017089844, -0.0514678955078125, -0.04897499084472656, -0.046482086181640625, -0.04398918151855469, -0.04149627685546875, -0.03900337219238281, -0.036510467529296875, -0.03401756286621094, -0.031524658203125, -0.029031753540039062, -0.026538848876953125, -0.024045944213867188, -0.02155303955078125, -0.019060134887695312, -0.016567230224609375, -0.014074325561523438, -0.0115814208984375, -0.009088516235351562, -0.006595611572265625, -0.0041027069091796875, -0.00160980224609375, 0.0008831024169921875, 0.003376007080078125, 0.0058689117431640625, 0.00836181640625, 0.010854721069335938, 0.013347625732421875, 0.015840530395507812, 0.01833343505859375, 0.020826339721679688, 0.023319244384765625, 0.025812149047851562, 0.0283050537109375, 0.030797958374023438, 0.033290863037109375, 0.03578376770019531, 0.03827667236328125, 0.04076957702636719, 0.043262481689453125, 0.04575538635253906, 0.048248291015625, 0.05074119567871094, 0.053234100341796875, 0.05572700500488281, 0.05821990966796875, 0.06071281433105469, 0.06320571899414062, 0.06569862365722656, 0.0681915283203125, 0.07068443298339844, 0.07317733764648438, 0.07567024230957031, 0.07816314697265625, 0.08065605163574219, 0.08314895629882812, 0.08564186096191406, 0.088134765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 4.0, 5.0, 10.0, 13.0, 16.0, 27.0, 19.0, 31.0, 35.0, 53.0, 60.0, 66.0, 84.0, 74.0, 82.0, 83.0, 61.0, 62.0, 50.0, 43.0, 30.0, 21.0, 26.0, 13.0, 14.0, 7.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1038818359375, -0.10082626342773438, -0.09777069091796875, -0.09471511840820312, -0.0916595458984375, -0.08860397338867188, -0.08554840087890625, -0.08249282836914062, -0.079437255859375, -0.07638168334960938, -0.07332611083984375, -0.07027053833007812, -0.0672149658203125, -0.06415939331054688, -0.06110382080078125, -0.058048248291015625, -0.05499267578125, -0.051937103271484375, -0.04888153076171875, -0.045825958251953125, -0.0427703857421875, -0.039714813232421875, -0.03665924072265625, -0.033603668212890625, -0.030548095703125, -0.027492523193359375, -0.02443695068359375, -0.021381378173828125, -0.0183258056640625, -0.015270233154296875, -0.01221466064453125, -0.009159088134765625, -0.006103515625, -0.003047943115234375, 7.62939453125e-06, 0.003063201904296875, 0.0061187744140625, 0.009174346923828125, 0.01222991943359375, 0.015285491943359375, 0.018341064453125, 0.021396636962890625, 0.02445220947265625, 0.027507781982421875, 0.0305633544921875, 0.033618927001953125, 0.03667449951171875, 0.039730072021484375, 0.04278564453125, 0.045841217041015625, 0.04889678955078125, 0.051952362060546875, 0.0550079345703125, 0.058063507080078125, 0.06111907958984375, 0.06417465209960938, 0.067230224609375, 0.07028579711914062, 0.07334136962890625, 0.07639694213867188, 0.0794525146484375, 0.08250808715820312, 0.08556365966796875, 0.08861923217773438, 0.0916748046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 8.0, 6.0, 6.0, 16.0, 13.0, 33.0, 32.0, 54.0, 86.0, 142.0, 276.0, 521.0, 1229.0, 3500.0, 13493.0, 76482.0, 784362.0, 139154.0, 20884.0, 5125.0, 1615.0, 700.0, 309.0, 176.0, 105.0, 74.0, 48.0, 24.0, 20.0, 18.0, 16.0, 6.0, 8.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.016448974609375, -0.0158538818359375, -0.0152587890625, -0.0146636962890625, -0.014068603515625, -0.0134735107421875, -0.01287841796875, -0.0122833251953125, -0.011688232421875, -0.0110931396484375, -0.010498046875, -0.0099029541015625, -0.009307861328125, -0.0087127685546875, -0.00811767578125, -0.0075225830078125, -0.006927490234375, -0.0063323974609375, -0.0057373046875, -0.0051422119140625, -0.004547119140625, -0.0039520263671875, -0.00335693359375, -0.0027618408203125, -0.002166748046875, -0.0015716552734375, -0.0009765625, -0.0003814697265625, 0.000213623046875, 0.0008087158203125, 0.00140380859375, 0.0019989013671875, 0.002593994140625, 0.0031890869140625, 0.0037841796875, 0.0043792724609375, 0.004974365234375, 0.0055694580078125, 0.00616455078125, 0.0067596435546875, 0.007354736328125, 0.0079498291015625, 0.008544921875, 0.0091400146484375, 0.009735107421875, 0.0103302001953125, 0.01092529296875, 0.0115203857421875, 0.012115478515625, 0.0127105712890625, 0.0133056640625, 0.0139007568359375, 0.014495849609375, 0.0150909423828125, 0.01568603515625, 0.0162811279296875, 0.016876220703125, 0.0174713134765625, 0.01806640625, 0.0186614990234375, 0.019256591796875, 0.0198516845703125, 0.02044677734375, 0.0210418701171875, 0.021636962890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 3.0, 9.0, 6.0, 8.0, 12.0, 7.0, 12.0, 21.0, 17.0, 23.0, 32.0, 39.0, 51.0, 55.0, 59.0, 82.0, 85.0, 82.0, 81.0, 54.0, 47.0, 52.0, 18.0, 28.0, 20.0, 14.0, 15.0, 7.0, 12.0, 8.0, 5.0, 6.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2557716369628906e-05, -4.120729863643646e-05, -3.985688090324402e-05, -3.8506463170051575e-05, -3.715604543685913e-05, -3.580562770366669e-05, -3.445520997047424e-05, -3.31047922372818e-05, -3.1754374504089355e-05, -3.040395677089691e-05, -2.9053539037704468e-05, -2.7703121304512024e-05, -2.635270357131958e-05, -2.5002285838127136e-05, -2.3651868104934692e-05, -2.230145037174225e-05, -2.0951032638549805e-05, -1.960061490535736e-05, -1.8250197172164917e-05, -1.6899779438972473e-05, -1.554936170578003e-05, -1.4198943972587585e-05, -1.2848526239395142e-05, -1.1498108506202698e-05, -1.0147690773010254e-05, -8.79727303981781e-06, -7.446855306625366e-06, -6.096437573432922e-06, -4.7460198402404785e-06, -3.3956021070480347e-06, -2.045184373855591e-06, -6.94766640663147e-07, 6.556510925292969e-07, 2.0060688257217407e-06, 3.3564865589141846e-06, 4.706904292106628e-06, 6.057322025299072e-06, 7.407739758491516e-06, 8.75815749168396e-06, 1.0108575224876404e-05, 1.1458992958068848e-05, 1.2809410691261292e-05, 1.4159828424453735e-05, 1.551024615764618e-05, 1.6860663890838623e-05, 1.8211081624031067e-05, 1.956149935722351e-05, 2.0911917090415955e-05, 2.22623348236084e-05, 2.3612752556800842e-05, 2.4963170289993286e-05, 2.631358802318573e-05, 2.7664005756378174e-05, 2.9014423489570618e-05, 3.036484122276306e-05, 3.1715258955955505e-05, 3.306567668914795e-05, 3.441609442234039e-05, 3.576651215553284e-05, 3.711692988872528e-05, 3.8467347621917725e-05, 3.981776535511017e-05, 4.116818308830261e-05, 4.2518600821495056e-05, 4.38690185546875e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 11.0, 9.0, 12.0, 19.0, 33.0, 48.0, 96.0, 136.0, 230.0, 414.0, 855.0, 1921.0, 5484.0, 23791.0, 188287.0, 753053.0, 58237.0, 10407.0, 3074.0, 1194.0, 553.0, 282.0, 158.0, 82.0, 48.0, 35.0, 25.0, 9.0, 21.0, 12.0, 5.0, 7.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.02362060546875, -0.022968769073486328, -0.022316932678222656, -0.021665096282958984, -0.021013259887695312, -0.02036142349243164, -0.01970958709716797, -0.019057750701904297, -0.018405914306640625, -0.017754077911376953, -0.01710224151611328, -0.01645040512084961, -0.015798568725585938, -0.015146732330322266, -0.014494895935058594, -0.013843059539794922, -0.01319122314453125, -0.012539386749267578, -0.011887550354003906, -0.011235713958740234, -0.010583877563476562, -0.00993204116821289, -0.009280204772949219, -0.008628368377685547, -0.007976531982421875, -0.007324695587158203, -0.006672859191894531, -0.006021022796630859, -0.0053691864013671875, -0.004717350006103516, -0.004065513610839844, -0.003413677215576172, -0.0027618408203125, -0.002110004425048828, -0.0014581680297851562, -0.0008063316345214844, -0.0001544952392578125, 0.0004973411560058594, 0.0011491775512695312, 0.0018010139465332031, 0.002452850341796875, 0.003104686737060547, 0.0037565231323242188, 0.004408359527587891, 0.0050601959228515625, 0.005712032318115234, 0.006363868713378906, 0.007015705108642578, 0.00766754150390625, 0.008319377899169922, 0.008971214294433594, 0.009623050689697266, 0.010274887084960938, 0.01092672348022461, 0.011578559875488281, 0.012230396270751953, 0.012882232666015625, 0.013534069061279297, 0.014185905456542969, 0.01483774185180664, 0.015489578247070312, 0.016141414642333984, 0.016793251037597656, 0.017445087432861328, 0.018096923828125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 9.0, 6.0, 12.0, 13.0, 20.0, 24.0, 33.0, 33.0, 42.0, 44.0, 67.0, 76.0, 70.0, 82.0, 93.0, 62.0, 49.0, 43.0, 44.0, 33.0, 35.0, 17.0, 15.0, 18.0, 8.0, 14.0, 9.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01261138916015625, -0.01219475269317627, -0.011778116226196289, -0.011361479759216309, -0.010944843292236328, -0.010528206825256348, -0.010111570358276367, -0.009694933891296387, -0.009278297424316406, -0.008861660957336426, -0.008445024490356445, -0.008028388023376465, -0.007611751556396484, -0.007195115089416504, -0.0067784786224365234, -0.006361842155456543, -0.0059452056884765625, -0.005528569221496582, -0.0051119327545166016, -0.004695296287536621, -0.004278659820556641, -0.00386202335357666, -0.0034453868865966797, -0.0030287504196166992, -0.0026121139526367188, -0.0021954774856567383, -0.0017788410186767578, -0.0013622045516967773, -0.0009455680847167969, -0.0005289316177368164, -0.00011229515075683594, 0.00030434131622314453, 0.000720977783203125, 0.0011376142501831055, 0.001554250717163086, 0.0019708871841430664, 0.002387523651123047, 0.0028041601181030273, 0.003220796585083008, 0.0036374330520629883, 0.004054069519042969, 0.004470705986022949, 0.00488734245300293, 0.00530397891998291, 0.005720615386962891, 0.006137251853942871, 0.0065538883209228516, 0.006970524787902832, 0.0073871612548828125, 0.007803797721862793, 0.008220434188842773, 0.008637070655822754, 0.009053707122802734, 0.009470343589782715, 0.009886980056762695, 0.010303616523742676, 0.010720252990722656, 0.011136889457702637, 0.011553525924682617, 0.011970162391662598, 0.012386798858642578, 0.012803435325622559, 0.013220071792602539, 0.01363670825958252, 0.0140533447265625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 9.0, 43.0, 176.0, 505.0, 189.0, 55.0, 14.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7443504929542542, -0.7126302123069763, -0.6809099316596985, -0.6491896510124207, -0.6174694299697876, -0.5857491493225098, -0.5540288686752319, -0.5223085880279541, -0.49058830738067627, -0.45886802673339844, -0.4271477460861206, -0.39542749524116516, -0.36370721459388733, -0.3319869339466095, -0.30026668310165405, -0.2685464024543762, -0.2368261218070984, -0.20510584115982056, -0.17338557541370392, -0.14166530966758728, -0.10994502902030945, -0.07822474837303162, -0.04650448262691498, -0.01478421688079834, 0.016936063766479492, 0.04865633696317673, 0.08037661015987396, 0.1120968833565712, 0.14381715655326843, 0.17553743720054626, 0.2072577029466629, 0.23897796869277954, 0.27069830894470215, 0.30241858959198, 0.3341388702392578, 0.36585912108421326, 0.3975794017314911, 0.4292996823787689, 0.46101993322372437, 0.4927402138710022, 0.52446049451828, 0.5561807751655579, 0.5879010558128357, 0.6196213364601135, 0.6513415575027466, 0.6830618381500244, 0.7147821187973022, 0.7465023994445801, 0.7782226800918579, 0.8099429607391357, 0.8416632413864136, 0.8733835220336914, 0.9051038026809692, 0.9368240833282471, 0.9685443043708801, 1.0002646446228027, 1.031984806060791, 1.0637050867080688, 1.0954253673553467, 1.1271456480026245, 1.1588659286499023, 1.1905862092971802, 1.222306489944458, 1.2540266513824463, 1.2857470512390137]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 6.0, 4.0, 6.0, 9.0, 9.0, 19.0, 11.0, 19.0, 18.0, 14.0, 21.0, 28.0, 27.0, 28.0, 33.0, 37.0, 66.0, 98.0, 104.0, 80.0, 38.0, 40.0, 39.0, 27.0, 21.0, 27.0, 16.0, 21.0, 9.0, 20.0, 14.0, 17.0, 15.0, 5.0, 10.0, 3.0, 5.0, 5.0, 1.0, 6.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2552034258842468, -0.24712397158145905, -0.23904451727867126, -0.23096506297588348, -0.2228856086730957, -0.21480615437030792, -0.20672670006752014, -0.19864724576473236, -0.19056779146194458, -0.1824883371591568, -0.17440888285636902, -0.16632942855358124, -0.15824997425079346, -0.15017051994800568, -0.1420910656452179, -0.13401161134243011, -0.12593215703964233, -0.11785270273685455, -0.10977324843406677, -0.10169379413127899, -0.09361433982849121, -0.08553488552570343, -0.07745543122291565, -0.06937597692012787, -0.06129652261734009, -0.05321706831455231, -0.045137614011764526, -0.037058159708976746, -0.028978705406188965, -0.020899251103401184, -0.012819796800613403, -0.0047403424978256226, 0.003339111804962158, 0.011418566107749939, 0.01949802041053772, 0.0275774747133255, 0.03565692901611328, 0.04373638331890106, 0.05181583762168884, 0.059895291924476624, 0.0679747462272644, 0.07605420053005219, 0.08413365483283997, 0.09221310913562775, 0.10029256343841553, 0.10837201774120331, 0.11645147204399109, 0.12453092634677887, 0.13261038064956665, 0.14068983495235443, 0.1487692892551422, 0.15684874355793, 0.16492819786071777, 0.17300765216350555, 0.18108710646629333, 0.18916656076908112, 0.1972460150718689, 0.20532546937465668, 0.21340492367744446, 0.22148437798023224, 0.22956383228302002, 0.2376432865858078, 0.24572274088859558, 0.25380218029022217, 0.26188164949417114]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 6.0, 10.0, 23.0, 23.0, 37.0, 51.0, 66.0, 80.0, 119.0, 151.0, 221.0, 307.0, 501.0, 704.0, 1130.0, 1765.0, 3085.0, 5376.0, 10459.0, 22498.0, 58488.0, 196725.0, 823680.0, 1942106.0, 821778.0, 198645.0, 58807.0, 22830.0, 10628.0, 5520.0, 3162.0, 1794.0, 1156.0, 729.0, 457.0, 332.0, 220.0, 171.0, 108.0, 90.0, 68.0, 54.0, 22.0, 18.0, 17.0, 14.0, 7.0, 11.0, 4.0, 7.0, 3.0, 6.0, 4.0], "bins": [-0.0250396728515625, -0.024313926696777344, -0.023588180541992188, -0.02286243438720703, -0.022136688232421875, -0.02141094207763672, -0.020685195922851562, -0.019959449768066406, -0.01923370361328125, -0.018507957458496094, -0.017782211303710938, -0.01705646514892578, -0.016330718994140625, -0.015604972839355469, -0.014879226684570312, -0.014153480529785156, -0.013427734375, -0.012701988220214844, -0.011976242065429688, -0.011250495910644531, -0.010524749755859375, -0.009799003601074219, -0.009073257446289062, -0.008347511291503906, -0.00762176513671875, -0.006896018981933594, -0.0061702728271484375, -0.005444526672363281, -0.004718780517578125, -0.003993034362792969, -0.0032672882080078125, -0.0025415420532226562, -0.0018157958984375, -0.0010900497436523438, -0.0003643035888671875, 0.00036144256591796875, 0.001087188720703125, 0.0018129348754882812, 0.0025386810302734375, 0.0032644271850585938, 0.00399017333984375, 0.004715919494628906, 0.0054416656494140625, 0.006167411804199219, 0.006893157958984375, 0.007618904113769531, 0.008344650268554688, 0.009070396423339844, 0.009796142578125, 0.010521888732910156, 0.011247634887695312, 0.011973381042480469, 0.012699127197265625, 0.013424873352050781, 0.014150619506835938, 0.014876365661621094, 0.01560211181640625, 0.016327857971191406, 0.017053604125976562, 0.01777935028076172, 0.018505096435546875, 0.01923084259033203, 0.019956588745117188, 0.020682334899902344, 0.0214080810546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 4.0, 11.0, 11.0, 14.0, 12.0, 9.0, 24.0, 26.0, 37.0, 38.0, 49.0, 58.0, 58.0, 56.0, 68.0, 58.0, 60.0, 55.0, 48.0, 65.0, 44.0, 37.0, 28.0, 28.0, 23.0, 13.0, 19.0, 10.0, 7.0, 12.0, 5.0, 7.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0183258056640625, -0.017743587493896484, -0.01716136932373047, -0.016579151153564453, -0.015996932983398438, -0.015414714813232422, -0.014832496643066406, -0.01425027847290039, -0.013668060302734375, -0.01308584213256836, -0.012503623962402344, -0.011921405792236328, -0.011339187622070312, -0.010756969451904297, -0.010174751281738281, -0.009592533111572266, -0.00901031494140625, -0.008428096771240234, -0.007845878601074219, -0.007263660430908203, -0.0066814422607421875, -0.006099224090576172, -0.005517005920410156, -0.004934787750244141, -0.004352569580078125, -0.0037703514099121094, -0.0031881332397460938, -0.002605915069580078, -0.0020236968994140625, -0.0014414787292480469, -0.0008592605590820312, -0.0002770423889160156, 0.00030517578125, 0.0008873939514160156, 0.0014696121215820312, 0.002051830291748047, 0.0026340484619140625, 0.003216266632080078, 0.0037984848022460938, 0.004380702972412109, 0.004962921142578125, 0.005545139312744141, 0.006127357482910156, 0.006709575653076172, 0.0072917938232421875, 0.007874011993408203, 0.008456230163574219, 0.009038448333740234, 0.00962066650390625, 0.010202884674072266, 0.010785102844238281, 0.011367321014404297, 0.011949539184570312, 0.012531757354736328, 0.013113975524902344, 0.01369619369506836, 0.014278411865234375, 0.01486063003540039, 0.015442848205566406, 0.016025066375732422, 0.016607284545898438, 0.017189502716064453, 0.01777172088623047, 0.018353939056396484, 0.0189361572265625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 11.0, 15.0, 32.0, 65.0, 134.0, 264.0, 604.0, 1757.0, 12176.0, 3765459.0, 405779.0, 5903.0, 1229.0, 451.0, 202.0, 86.0, 50.0, 19.0, 17.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1339111328125, -0.1282978057861328, -0.12268447875976562, -0.11707115173339844, -0.11145782470703125, -0.10584449768066406, -0.10023117065429688, -0.09461784362792969, -0.0890045166015625, -0.08339118957519531, -0.07777786254882812, -0.07216453552246094, -0.06655120849609375, -0.06093788146972656, -0.055324554443359375, -0.04971122741699219, -0.044097900390625, -0.03848457336425781, -0.032871246337890625, -0.027257919311523438, -0.02164459228515625, -0.016031265258789062, -0.010417938232421875, -0.0048046112060546875, 0.0008087158203125, 0.0064220428466796875, 0.012035369873046875, 0.017648696899414062, 0.02326202392578125, 0.028875350952148438, 0.034488677978515625, 0.04010200500488281, 0.04571533203125, 0.05132865905761719, 0.056941986083984375, 0.06255531311035156, 0.06816864013671875, 0.07378196716308594, 0.07939529418945312, 0.08500862121582031, 0.0906219482421875, 0.09623527526855469, 0.10184860229492188, 0.10746192932128906, 0.11307525634765625, 0.11868858337402344, 0.12430191040039062, 0.1299152374267578, 0.135528564453125, 0.1411418914794922, 0.14675521850585938, 0.15236854553222656, 0.15798187255859375, 0.16359519958496094, 0.16920852661132812, 0.1748218536376953, 0.1804351806640625, 0.1860485076904297, 0.19166183471679688, 0.19727516174316406, 0.20288848876953125, 0.20850181579589844, 0.21411514282226562, 0.2197284698486328, 0.225341796875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 9.0, 9.0, 13.0, 27.0, 18.0, 45.0, 64.0, 68.0, 103.0, 166.0, 266.0, 369.0, 659.0, 753.0, 513.0, 301.0, 230.0, 126.0, 97.0, 55.0, 48.0, 33.0, 32.0, 16.0, 11.0, 8.0, 5.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.08489990234375, -0.08267498016357422, -0.08045005798339844, -0.07822513580322266, -0.07600021362304688, -0.0737752914428711, -0.07155036926269531, -0.06932544708251953, -0.06710052490234375, -0.06487560272216797, -0.06265068054199219, -0.060425758361816406, -0.058200836181640625, -0.055975914001464844, -0.05375099182128906, -0.05152606964111328, -0.0493011474609375, -0.04707622528076172, -0.04485130310058594, -0.042626380920410156, -0.040401458740234375, -0.038176536560058594, -0.03595161437988281, -0.03372669219970703, -0.03150177001953125, -0.02927684783935547, -0.027051925659179688, -0.024827003479003906, -0.022602081298828125, -0.020377159118652344, -0.018152236938476562, -0.01592731475830078, -0.013702392578125, -0.011477470397949219, -0.009252548217773438, -0.007027626037597656, -0.004802703857421875, -0.0025777816772460938, -0.0003528594970703125, 0.0018720626831054688, 0.00409698486328125, 0.006321907043457031, 0.008546829223632812, 0.010771751403808594, 0.012996673583984375, 0.015221595764160156, 0.017446517944335938, 0.01967144012451172, 0.0218963623046875, 0.02412128448486328, 0.026346206665039062, 0.028571128845214844, 0.030796051025390625, 0.033020973205566406, 0.03524589538574219, 0.03747081756591797, 0.03969573974609375, 0.04192066192626953, 0.04414558410644531, 0.046370506286621094, 0.048595428466796875, 0.050820350646972656, 0.05304527282714844, 0.05527019500732422, 0.0574951171875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 10.0, 16.0, 18.0, 39.0, 65.0, 133.0, 202.0, 229.0, 124.0, 72.0, 35.0, 19.0, 12.0, 14.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9246997237205505, -0.8966338038444519, -0.8685678243637085, -0.8405019044876099, -0.8124359846115112, -0.7843700051307678, -0.7563040852546692, -0.7282381057739258, -0.7001721858978271, -0.6721062660217285, -0.6440402865409851, -0.6159743666648865, -0.5879083871841431, -0.5598424673080444, -0.5317765474319458, -0.5037106275558472, -0.47564464807510376, -0.44757869839668274, -0.4195127487182617, -0.3914468288421631, -0.36338087916374207, -0.33531492948532104, -0.3072490096092224, -0.2791830599308014, -0.25111711025238037, -0.22305116057395935, -0.19498522579669952, -0.1669192910194397, -0.13885334134101868, -0.11078739166259766, -0.08272145688533783, -0.054655522108078, -0.026589512825012207, 0.0014764294028282166, 0.02954237163066864, 0.057608313858509064, 0.08567425608634949, 0.11374020576477051, 0.14180614054203033, 0.16987207531929016, 0.19793802499771118, 0.2260039746761322, 0.2540699243545532, 0.28213584423065186, 0.3102017939090729, 0.3382677435874939, 0.36633366346359253, 0.39439961314201355, 0.42246556282043457, 0.4505315124988556, 0.4785974621772766, 0.5066633820533752, 0.5347293615341187, 0.5627952814102173, 0.5908612012863159, 0.6189271211624146, 0.646993100643158, 0.6750590205192566, 0.703125, 0.7311909198760986, 0.7592568397521973, 0.7873228192329407, 0.8153887391090393, 0.8434547185897827, 0.8715206384658813]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 9.0, 14.0, 8.0, 11.0, 23.0, 23.0, 24.0, 18.0, 25.0, 32.0, 32.0, 43.0, 33.0, 42.0, 46.0, 60.0, 63.0, 63.0, 54.0, 58.0, 39.0, 47.0, 38.0, 36.0, 31.0, 20.0, 18.0, 19.0, 14.0, 5.0, 9.0, 8.0, 4.0, 4.0, 6.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4024389386177063, -0.39043498039245605, -0.3784310221672058, -0.36642709374427795, -0.3544231355190277, -0.34241917729377747, -0.3304152488708496, -0.31841129064559937, -0.3064073324203491, -0.2944033741950989, -0.28239941596984863, -0.2703954875469208, -0.25839152932167053, -0.2463875710964203, -0.23438362777233124, -0.2223796844482422, -0.21037572622299194, -0.1983717679977417, -0.18636782467365265, -0.1743638813495636, -0.16235992312431335, -0.1503559648990631, -0.13835202157497406, -0.126348078250885, -0.11434412002563477, -0.10234016925096512, -0.09033621847629547, -0.07833226770162582, -0.06632831692695618, -0.05432436615228653, -0.04232041537761688, -0.030316464602947235, -0.018312513828277588, -0.006308563053607941, 0.0056953877210617065, 0.017699338495731354, 0.029703289270401, 0.04170724004507065, 0.053711190819740295, 0.06571514159440994, 0.07771909236907959, 0.08972304314374924, 0.10172699391841888, 0.11373094469308853, 0.12573489546775818, 0.13773885369300842, 0.14974279701709747, 0.16174674034118652, 0.17375069856643677, 0.185754656791687, 0.19775860011577606, 0.2097625434398651, 0.22176650166511536, 0.2337704598903656, 0.24577440321445465, 0.2577783465385437, 0.26978230476379395, 0.2817862629890442, 0.29379022121429443, 0.3057941496372223, 0.31779810786247253, 0.3298020660877228, 0.34180599451065063, 0.3538099527359009, 0.3658139109611511]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 4.0, 14.0, 11.0, 31.0, 33.0, 39.0, 64.0, 109.0, 172.0, 266.0, 570.0, 1014.0, 2202.0, 4674.0, 12078.0, 39509.0, 201085.0, 649884.0, 97895.0, 23922.0, 8127.0, 3476.0, 1565.0, 745.0, 441.0, 223.0, 150.0, 91.0, 59.0, 26.0, 28.0, 17.0, 7.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.042083740234375, -0.04089164733886719, -0.039699554443359375, -0.03850746154785156, -0.03731536865234375, -0.03612327575683594, -0.034931182861328125, -0.03373908996582031, -0.0325469970703125, -0.03135490417480469, -0.030162811279296875, -0.028970718383789062, -0.02777862548828125, -0.026586532592773438, -0.025394439697265625, -0.024202346801757812, -0.02301025390625, -0.021818161010742188, -0.020626068115234375, -0.019433975219726562, -0.01824188232421875, -0.017049789428710938, -0.015857696533203125, -0.014665603637695312, -0.0134735107421875, -0.012281417846679688, -0.011089324951171875, -0.009897232055664062, -0.00870513916015625, -0.0075130462646484375, -0.006320953369140625, -0.0051288604736328125, -0.003936767578125, -0.0027446746826171875, -0.001552581787109375, -0.0003604888916015625, 0.00083160400390625, 0.0020236968994140625, 0.003215789794921875, 0.0044078826904296875, 0.0055999755859375, 0.0067920684814453125, 0.007984161376953125, 0.009176254272460938, 0.01036834716796875, 0.011560440063476562, 0.012752532958984375, 0.013944625854492188, 0.01513671875, 0.016328811645507812, 0.017520904541015625, 0.018712997436523438, 0.01990509033203125, 0.021097183227539062, 0.022289276123046875, 0.023481369018554688, 0.0246734619140625, 0.025865554809570312, 0.027057647705078125, 0.028249740600585938, 0.02944183349609375, 0.030633926391601562, 0.031826019287109375, 0.03301811218261719, 0.034210205078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 10.0, 9.0, 7.0, 14.0, 17.0, 22.0, 22.0, 47.0, 51.0, 52.0, 70.0, 68.0, 61.0, 85.0, 81.0, 61.0, 65.0, 51.0, 51.0, 46.0, 24.0, 20.0, 15.0, 14.0, 10.0, 13.0, 5.0, 9.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03302001953125, -0.032064199447631836, -0.031108379364013672, -0.030152559280395508, -0.029196739196777344, -0.02824091911315918, -0.027285099029541016, -0.02632927894592285, -0.025373458862304688, -0.024417638778686523, -0.02346181869506836, -0.022505998611450195, -0.02155017852783203, -0.020594358444213867, -0.019638538360595703, -0.01868271827697754, -0.017726898193359375, -0.01677107810974121, -0.015815258026123047, -0.014859437942504883, -0.013903617858886719, -0.012947797775268555, -0.01199197769165039, -0.011036157608032227, -0.010080337524414062, -0.009124517440795898, -0.008168697357177734, -0.00721287727355957, -0.006257057189941406, -0.005301237106323242, -0.004345417022705078, -0.003389596939086914, -0.00243377685546875, -0.001477956771850586, -0.0005221366882324219, 0.0004336833953857422, 0.0013895034790039062, 0.0023453235626220703, 0.0033011436462402344, 0.0042569637298583984, 0.0052127838134765625, 0.0061686038970947266, 0.007124423980712891, 0.008080244064331055, 0.009036064147949219, 0.009991884231567383, 0.010947704315185547, 0.011903524398803711, 0.012859344482421875, 0.013815164566040039, 0.014770984649658203, 0.015726804733276367, 0.01668262481689453, 0.017638444900512695, 0.01859426498413086, 0.019550085067749023, 0.020505905151367188, 0.02146172523498535, 0.022417545318603516, 0.02337336540222168, 0.024329185485839844, 0.025285005569458008, 0.026240825653076172, 0.027196645736694336, 0.0281524658203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 5.0, 4.0, 8.0, 9.0, 15.0, 14.0, 36.0, 45.0, 76.0, 114.0, 155.0, 272.0, 588.0, 1455.0, 5383.0, 41575.0, 935879.0, 53666.0, 6136.0, 1654.0, 649.0, 299.0, 174.0, 100.0, 56.0, 59.0, 26.0, 26.0, 14.0, 15.0, 8.0, 9.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0654296875, -0.06341934204101562, -0.06140899658203125, -0.059398651123046875, -0.0573883056640625, -0.055377960205078125, -0.05336761474609375, -0.051357269287109375, -0.049346923828125, -0.047336578369140625, -0.04532623291015625, -0.043315887451171875, -0.0413055419921875, -0.039295196533203125, -0.03728485107421875, -0.035274505615234375, -0.03326416015625, -0.031253814697265625, -0.02924346923828125, -0.027233123779296875, -0.0252227783203125, -0.023212432861328125, -0.02120208740234375, -0.019191741943359375, -0.017181396484375, -0.015171051025390625, -0.01316070556640625, -0.011150360107421875, -0.0091400146484375, -0.007129669189453125, -0.00511932373046875, -0.003108978271484375, -0.0010986328125, 0.000911712646484375, 0.00292205810546875, 0.004932403564453125, 0.0069427490234375, 0.008953094482421875, 0.01096343994140625, 0.012973785400390625, 0.014984130859375, 0.016994476318359375, 0.01900482177734375, 0.021015167236328125, 0.0230255126953125, 0.025035858154296875, 0.02704620361328125, 0.029056549072265625, 0.03106689453125, 0.033077239990234375, 0.03508758544921875, 0.037097930908203125, 0.0391082763671875, 0.041118621826171875, 0.04312896728515625, 0.045139312744140625, 0.047149658203125, 0.049160003662109375, 0.05117034912109375, 0.053180694580078125, 0.0551910400390625, 0.057201385498046875, 0.05921173095703125, 0.061222076416015625, 0.063232421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 5.0, 7.0, 9.0, 8.0, 15.0, 14.0, 17.0, 19.0, 17.0, 30.0, 46.0, 34.0, 40.0, 53.0, 71.0, 79.0, 75.0, 61.0, 56.0, 53.0, 41.0, 43.0, 36.0, 32.0, 21.0, 14.0, 21.0, 19.0, 13.0, 14.0, 3.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.07904052734375, -0.07653427124023438, -0.07402801513671875, -0.07152175903320312, -0.0690155029296875, -0.06650924682617188, -0.06400299072265625, -0.061496734619140625, -0.058990478515625, -0.056484222412109375, -0.05397796630859375, -0.051471710205078125, -0.0489654541015625, -0.046459197998046875, -0.04395294189453125, -0.041446685791015625, -0.0389404296875, -0.036434173583984375, -0.03392791748046875, -0.031421661376953125, -0.0289154052734375, -0.026409149169921875, -0.02390289306640625, -0.021396636962890625, -0.018890380859375, -0.016384124755859375, -0.01387786865234375, -0.011371612548828125, -0.0088653564453125, -0.006359100341796875, -0.00385284423828125, -0.001346588134765625, 0.00115966796875, 0.003665924072265625, 0.00617218017578125, 0.008678436279296875, 0.0111846923828125, 0.013690948486328125, 0.01619720458984375, 0.018703460693359375, 0.021209716796875, 0.023715972900390625, 0.02622222900390625, 0.028728485107421875, 0.0312347412109375, 0.033740997314453125, 0.03624725341796875, 0.038753509521484375, 0.041259765625, 0.043766021728515625, 0.04627227783203125, 0.048778533935546875, 0.0512847900390625, 0.053791046142578125, 0.05629730224609375, 0.058803558349609375, 0.061309814453125, 0.06381607055664062, 0.06632232666015625, 0.06882858276367188, 0.0713348388671875, 0.07384109497070312, 0.07634735107421875, 0.07885360717773438, 0.08135986328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 4.0, 6.0, 10.0, 6.0, 8.0, 9.0, 22.0, 27.0, 20.0, 41.0, 52.0, 106.0, 150.0, 311.0, 516.0, 1345.0, 4490.0, 22859.0, 926044.0, 78894.0, 9502.0, 2375.0, 798.0, 372.0, 218.0, 105.0, 71.0, 53.0, 32.0, 32.0, 20.0, 7.0, 12.0, 9.0, 7.0, 4.0, 8.0, 5.0, 2.0, 2.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0173492431640625, -0.016849994659423828, -0.016350746154785156, -0.015851497650146484, -0.015352249145507812, -0.01485300064086914, -0.014353752136230469, -0.013854503631591797, -0.013355255126953125, -0.012856006622314453, -0.012356758117675781, -0.01185750961303711, -0.011358261108398438, -0.010859012603759766, -0.010359764099121094, -0.009860515594482422, -0.00936126708984375, -0.008862018585205078, -0.008362770080566406, -0.007863521575927734, -0.0073642730712890625, -0.006865024566650391, -0.006365776062011719, -0.005866527557373047, -0.005367279052734375, -0.004868030548095703, -0.004368782043457031, -0.0038695335388183594, -0.0033702850341796875, -0.0028710365295410156, -0.0023717880249023438, -0.0018725395202636719, -0.001373291015625, -0.0008740425109863281, -0.00037479400634765625, 0.00012445449829101562, 0.0006237030029296875, 0.0011229515075683594, 0.0016222000122070312, 0.002121448516845703, 0.002620697021484375, 0.003119945526123047, 0.0036191940307617188, 0.004118442535400391, 0.0046176910400390625, 0.005116939544677734, 0.005616188049316406, 0.006115436553955078, 0.00661468505859375, 0.007113933563232422, 0.007613182067871094, 0.008112430572509766, 0.008611679077148438, 0.00911092758178711, 0.009610176086425781, 0.010109424591064453, 0.010608673095703125, 0.011107921600341797, 0.011607170104980469, 0.01210641860961914, 0.012605667114257812, 0.013104915618896484, 0.013604164123535156, 0.014103412628173828, 0.0146026611328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 8.0, 10.0, 7.0, 20.0, 21.0, 30.0, 28.0, 30.0, 51.0, 90.0, 99.0, 119.0, 106.0, 75.0, 51.0, 43.0, 36.0, 30.0, 27.0, 21.0, 13.0, 6.0, 11.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0], "bins": [-5.1975250244140625e-05, -5.0324946641922e-05, -4.867464303970337e-05, -4.702433943748474e-05, -4.537403583526611e-05, -4.3723732233047485e-05, -4.207342863082886e-05, -4.042312502861023e-05, -3.87728214263916e-05, -3.7122517824172974e-05, -3.5472214221954346e-05, -3.382191061973572e-05, -3.217160701751709e-05, -3.052130341529846e-05, -2.8870999813079834e-05, -2.7220696210861206e-05, -2.5570392608642578e-05, -2.392008900642395e-05, -2.2269785404205322e-05, -2.0619481801986694e-05, -1.8969178199768066e-05, -1.731887459754944e-05, -1.566857099533081e-05, -1.4018267393112183e-05, -1.2367963790893555e-05, -1.0717660188674927e-05, -9.067356586456299e-06, -7.417052984237671e-06, -5.766749382019043e-06, -4.116445779800415e-06, -2.466142177581787e-06, -8.158385753631592e-07, 8.344650268554688e-07, 2.4847686290740967e-06, 4.135072231292725e-06, 5.7853758335113525e-06, 7.4356794357299805e-06, 9.085983037948608e-06, 1.0736286640167236e-05, 1.2386590242385864e-05, 1.4036893844604492e-05, 1.568719744682312e-05, 1.7337501049041748e-05, 1.8987804651260376e-05, 2.0638108253479004e-05, 2.2288411855697632e-05, 2.393871545791626e-05, 2.5589019060134888e-05, 2.7239322662353516e-05, 2.8889626264572144e-05, 3.053992986679077e-05, 3.21902334690094e-05, 3.384053707122803e-05, 3.5490840673446655e-05, 3.714114427566528e-05, 3.879144787788391e-05, 4.044175148010254e-05, 4.209205508232117e-05, 4.3742358684539795e-05, 4.539266228675842e-05, 4.704296588897705e-05, 4.869326949119568e-05, 5.034357309341431e-05, 5.1993876695632935e-05, 5.364418029785156e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 4.0, 12.0, 12.0, 19.0, 29.0, 31.0, 45.0, 90.0, 137.0, 212.0, 331.0, 611.0, 1277.0, 2981.0, 8725.0, 42636.0, 916522.0, 57774.0, 10609.0, 3390.0, 1341.0, 712.0, 381.0, 230.0, 140.0, 86.0, 54.0, 49.0, 31.0, 15.0, 20.0, 10.0, 9.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.013275146484375, -0.012840867042541504, -0.012406587600708008, -0.011972308158874512, -0.011538028717041016, -0.01110374927520752, -0.010669469833374023, -0.010235190391540527, -0.009800910949707031, -0.009366631507873535, -0.008932352066040039, -0.008498072624206543, -0.008063793182373047, -0.007629513740539551, -0.007195234298706055, -0.006760954856872559, -0.0063266754150390625, -0.005892395973205566, -0.00545811653137207, -0.005023837089538574, -0.004589557647705078, -0.004155278205871582, -0.003720998764038086, -0.00328671932220459, -0.0028524398803710938, -0.0024181604385375977, -0.0019838809967041016, -0.0015496015548706055, -0.0011153221130371094, -0.0006810426712036133, -0.0002467632293701172, 0.0001875162124633789, 0.000621795654296875, 0.001056075096130371, 0.0014903545379638672, 0.0019246339797973633, 0.0023589134216308594, 0.0027931928634643555, 0.0032274723052978516, 0.0036617517471313477, 0.004096031188964844, 0.00453031063079834, 0.004964590072631836, 0.005398869514465332, 0.005833148956298828, 0.006267428398132324, 0.00670170783996582, 0.007135987281799316, 0.0075702667236328125, 0.008004546165466309, 0.008438825607299805, 0.0088731050491333, 0.009307384490966797, 0.009741663932800293, 0.010175943374633789, 0.010610222816467285, 0.011044502258300781, 0.011478781700134277, 0.011913061141967773, 0.01234734058380127, 0.012781620025634766, 0.013215899467468262, 0.013650178909301758, 0.014084458351135254, 0.01451873779296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 12.0, 3.0, 9.0, 10.0, 9.0, 14.0, 27.0, 48.0, 114.0, 256.0, 226.0, 107.0, 44.0, 28.0, 17.0, 15.0, 9.0, 9.0, 5.0, 9.0, 6.0, 5.0, 4.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01430511474609375, -0.013773798942565918, -0.013242483139038086, -0.012711167335510254, -0.012179851531982422, -0.01164853572845459, -0.011117219924926758, -0.010585904121398926, -0.010054588317871094, -0.009523272514343262, -0.00899195671081543, -0.008460640907287598, -0.007929325103759766, -0.007398009300231934, -0.0068666934967041016, -0.0063353776931762695, -0.0058040618896484375, -0.0052727460861206055, -0.0047414302825927734, -0.004210114479064941, -0.0036787986755371094, -0.0031474828720092773, -0.0026161670684814453, -0.0020848512649536133, -0.0015535354614257812, -0.0010222196578979492, -0.0004909038543701172, 4.0411949157714844e-05, 0.0005717277526855469, 0.001103043556213379, 0.001634359359741211, 0.002165675163269043, 0.002696990966796875, 0.003228306770324707, 0.003759622573852539, 0.004290938377380371, 0.004822254180908203, 0.005353569984436035, 0.005884885787963867, 0.006416201591491699, 0.006947517395019531, 0.007478833198547363, 0.008010149002075195, 0.008541464805603027, 0.00907278060913086, 0.009604096412658691, 0.010135412216186523, 0.010666728019714355, 0.011198043823242188, 0.01172935962677002, 0.012260675430297852, 0.012791991233825684, 0.013323307037353516, 0.013854622840881348, 0.01438593864440918, 0.014917254447937012, 0.015448570251464844, 0.015979886054992676, 0.016511201858520508, 0.01704251766204834, 0.017573833465576172, 0.018105149269104004, 0.018636465072631836, 0.019167780876159668, 0.0196990966796875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 10.0, 10.0, 40.0, 90.0, 528.0, 160.0, 76.0, 46.0, 17.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23220795392990112, -0.21643856167793274, -0.20066916942596436, -0.18489976227283478, -0.1691303700208664, -0.153360977768898, -0.13759157061576843, -0.12182217836380005, -0.10605278611183167, -0.09028339385986328, -0.0745139941573143, -0.05874459818005562, -0.042975202202796936, -0.027205809950828552, -0.011436410248279572, 0.004332989454269409, 0.020102381706237793, 0.035871777683496475, 0.05164117366075516, 0.06741057336330414, 0.08317996561527252, 0.0989493578672409, 0.11471875756978989, 0.13048815727233887, 0.14625754952430725, 0.16202694177627563, 0.17779633402824402, 0.1935657411813736, 0.20933513343334198, 0.22510452568531036, 0.24087393283843994, 0.2566433250904083, 0.27241265773773193, 0.2881820499897003, 0.3039514422416687, 0.3197208344936371, 0.33549022674560547, 0.35125964879989624, 0.3670290410518646, 0.382798433303833, 0.3985678255558014, 0.4143372178077698, 0.43010661005973816, 0.44587600231170654, 0.4616454243659973, 0.4774147868156433, 0.4931842088699341, 0.5089535713195801, 0.5247229933738708, 0.5404924154281616, 0.5562617778778076, 0.5720311999320984, 0.5878005623817444, 0.6035699844360352, 0.6193393468856812, 0.6351087689399719, 0.6508781909942627, 0.6666476130485535, 0.6824169754981995, 0.6981863975524902, 0.7139557600021362, 0.729725182056427, 0.745494544506073, 0.7612639665603638, 0.7770333290100098]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 6.0, 11.0, 11.0, 18.0, 15.0, 20.0, 23.0, 24.0, 22.0, 43.0, 39.0, 131.0, 313.0, 89.0, 34.0, 22.0, 33.0, 24.0, 21.0, 27.0, 19.0, 8.0, 16.0, 8.0, 2.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1979086995124817, -0.18863563239574432, -0.17936256527900696, -0.1700894981622696, -0.16081643104553223, -0.15154334902763367, -0.1422702819108963, -0.13299721479415894, -0.12372414767742157, -0.1144510805606842, -0.10517801344394684, -0.09590493887662888, -0.08663187175989151, -0.07735880464315414, -0.06808573007583618, -0.058812662959098816, -0.04953959584236145, -0.040266528725624084, -0.03099345788359642, -0.021720388904213905, -0.01244731992483139, -0.0031742528080940247, 0.0060988180339336395, 0.015371888875961304, 0.02464495599269867, 0.033918023109436035, 0.0431910939514637, 0.052464164793491364, 0.06173723191022873, 0.0710102990269661, 0.08028337359428406, 0.08955644071102142, 0.09882950782775879, 0.10810257494449615, 0.11737564206123352, 0.1266487091779709, 0.13592177629470825, 0.1451948583126068, 0.15446792542934418, 0.16374099254608154, 0.1730140596628189, 0.18228712677955627, 0.19156019389629364, 0.200833261013031, 0.21010634303092957, 0.21937939524650574, 0.2286524772644043, 0.23792554438114166, 0.24719861149787903, 0.2564716935157776, 0.26574474573135376, 0.2750178277492523, 0.2842908799648285, 0.29356396198272705, 0.3028370141983032, 0.3121100962162018, 0.32138317823410034, 0.3306562602519989, 0.3399293124675751, 0.34920239448547363, 0.3584754467010498, 0.36774852871894836, 0.37702158093452454, 0.3862946629524231, 0.39556771516799927]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 2.0, 8.0, 3.0, 6.0, 11.0, 13.0, 11.0, 15.0, 11.0, 23.0, 16.0, 15.0, 27.0, 22.0, 22.0, 36.0, 34.0, 95.0, 227.0, 92.0, 40.0, 35.0, 26.0, 30.0, 16.0, 20.0, 15.0, 21.0, 14.0, 11.0, 10.0, 11.0, 10.0, 3.0, 6.0, 7.0, 3.0, 5.0, 5.0, 4.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.0166778564453125, -0.01616644859313965, -0.015655040740966797, -0.015143632888793945, -0.014632225036621094, -0.014120817184448242, -0.01360940933227539, -0.013098001480102539, -0.012586593627929688, -0.012075185775756836, -0.011563777923583984, -0.011052370071411133, -0.010540962219238281, -0.01002955436706543, -0.009518146514892578, -0.009006738662719727, -0.008495330810546875, -0.007983922958374023, -0.007472515106201172, -0.00696110725402832, -0.006449699401855469, -0.005938291549682617, -0.005426883697509766, -0.004915475845336914, -0.0044040679931640625, -0.003892660140991211, -0.0033812522888183594, -0.002869844436645508, -0.0023584365844726562, -0.0018470287322998047, -0.0013356208801269531, -0.0008242130279541016, -0.00031280517578125, 0.00019860267639160156, 0.0007100105285644531, 0.0012214183807373047, 0.0017328262329101562, 0.002244234085083008, 0.0027556419372558594, 0.003267049789428711, 0.0037784576416015625, 0.004289865493774414, 0.004801273345947266, 0.005312681198120117, 0.005824089050292969, 0.00633549690246582, 0.006846904754638672, 0.0073583126068115234, 0.007869720458984375, 0.008381128311157227, 0.008892536163330078, 0.00940394401550293, 0.009915351867675781, 0.010426759719848633, 0.010938167572021484, 0.011449575424194336, 0.011960983276367188, 0.012472391128540039, 0.01298379898071289, 0.013495206832885742, 0.014006614685058594, 0.014518022537231445, 0.015029430389404297, 0.015540838241577148, 0.01605224609375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 1.0, 9.0, 16.0, 7.0, 16.0, 19.0, 46.0, 56.0, 166.0, 320.0, 818.0, 3056.0, 22070.0, 8347625.0, 11213.0, 2011.0, 648.0, 231.0, 99.0, 44.0, 35.0, 26.0, 24.0, 9.0, 4.0, 7.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2597764730453491, -0.25243186950683594, -0.24508728086948395, -0.23774269223213196, -0.23039808869361877, -0.22305350005626678, -0.2157088965177536, -0.2083643078804016, -0.20101970434188843, -0.19367511570453644, -0.18633051216602325, -0.17898592352867126, -0.17164131999015808, -0.1642967313528061, -0.1569521278142929, -0.14960753917694092, -0.14226293563842773, -0.13491834700107574, -0.12757374346256256, -0.12022914737462997, -0.11288455128669739, -0.1055399626493454, -0.09819535911083221, -0.09085077047348022, -0.08350618183612823, -0.07616158574819565, -0.06881698966026306, -0.061472393572330475, -0.05412779748439789, -0.0467832051217556, -0.03943860903382301, -0.03209401294589043, -0.02474941313266754, -0.017404817044734955, -0.010060221888124943, -0.0027156267315149307, 0.004628969356417656, 0.011973563581705093, 0.01931815966963768, 0.026662755757570267, 0.03400735184550285, 0.04135194793343544, 0.04869654402136803, 0.056041136384010315, 0.0633857324719429, 0.07073032855987549, 0.07807492464780807, 0.08541952073574066, 0.09276411682367325, 0.10010871291160583, 0.10745330899953842, 0.11479790508747101, 0.1221425011754036, 0.12948709726333618, 0.13683168590068817, 0.14417628943920135, 0.15152087807655334, 0.15886546671390533, 0.16621007025241852, 0.1735546588897705, 0.1808992624282837, 0.18824385106563568, 0.19558845460414886, 0.20293304324150085, 0.21027764678001404]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 7.0, 6.0, 1.0, 3.0, 3.0, 1.0, 6.0, 4.0, 6.0, 2.0, 6.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21082796156406403, -0.20547974109649658, -0.20013152062892914, -0.1947833001613617, -0.18943509459495544, -0.184086874127388, -0.17873865365982056, -0.1733904331922531, -0.16804221272468567, -0.16269399225711823, -0.15734577178955078, -0.15199756622314453, -0.1466493457555771, -0.14130112528800964, -0.1359529048204422, -0.13060468435287476, -0.1252564787864685, -0.11990825831890106, -0.11456004530191422, -0.10921182483434677, -0.10386361181735992, -0.09851539134979248, -0.09316717088222504, -0.08781895041465759, -0.08247073739767075, -0.0771225169301033, -0.07177430391311646, -0.06642608344554901, -0.061077866703271866, -0.05572964996099472, -0.05038142949342728, -0.04503321275115013, -0.03968498110771179, -0.03433676436543465, -0.028988545760512352, -0.023640327155590057, -0.018292110413312912, -0.012943893671035767, -0.007595673203468323, -0.0022474564611911774, 0.003100760281085968, 0.008448977954685688, 0.013797195628285408, 0.019145414233207703, 0.024493630975484848, 0.029841847717761993, 0.03519006818532944, 0.04053828492760658, 0.04588650166988373, 0.05123471841216087, 0.05658293515443802, 0.06193115562200546, 0.06727936863899231, 0.07262758910655975, 0.0779758095741272, 0.08332403004169464, 0.08867224305868149, 0.09402046352624893, 0.09936867654323578, 0.10471689701080322, 0.11006511747837067, 0.11541333049535751, 0.12076155096292496, 0.1261097639799118, 0.13145798444747925]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 6.0, 8.0, 18.0, 20.0, 23.0, 24.0, 54.0, 73.0, 115.0, 220.0, 335.0, 605.0, 1142.0, 2440.0, 5584.0, 14657.0, 42091.0, 137764.0, 206584.0, 73232.0, 23726.0, 8532.0, 3447.0, 1650.0, 800.0, 418.0, 242.0, 147.0, 95.0, 70.0, 39.0, 30.0, 22.0, 17.0, 13.0, 6.0, 3.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1739501953125, -0.1681957244873047, -0.16244125366210938, -0.15668678283691406, -0.15093231201171875, -0.14517784118652344, -0.13942337036132812, -0.1336688995361328, -0.1279144287109375, -0.12215995788574219, -0.11640548706054688, -0.11065101623535156, -0.10489654541015625, -0.09914207458496094, -0.09338760375976562, -0.08763313293457031, -0.081878662109375, -0.07612419128417969, -0.07036972045898438, -0.06461524963378906, -0.05886077880859375, -0.05310630798339844, -0.047351837158203125, -0.04159736633300781, -0.0358428955078125, -0.030088424682617188, -0.024333953857421875, -0.018579483032226562, -0.01282501220703125, -0.0070705413818359375, -0.001316070556640625, 0.0044384002685546875, 0.01019287109375, 0.015947341918945312, 0.021701812744140625, 0.027456283569335938, 0.03321075439453125, 0.03896522521972656, 0.044719696044921875, 0.05047416687011719, 0.0562286376953125, 0.06198310852050781, 0.06773757934570312, 0.07349205017089844, 0.07924652099609375, 0.08500099182128906, 0.09075546264648438, 0.09650993347167969, 0.102264404296875, 0.10801887512207031, 0.11377334594726562, 0.11952781677246094, 0.12528228759765625, 0.13103675842285156, 0.13679122924804688, 0.1425457000732422, 0.1483001708984375, 0.1540546417236328, 0.15980911254882812, 0.16556358337402344, 0.17131805419921875, 0.17707252502441406, 0.18282699584960938, 0.1885814666748047, 0.1943359375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 16.0, 15.0, 21.0, 28.0, 42.0, 56.0, 68.0, 79.0, 102.0, 106.0, 116.0, 93.0, 60.0, 50.0, 44.0, 24.0, 23.0, 12.0, 5.0, 17.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039459228515625, -0.03837132453918457, -0.03728342056274414, -0.03619551658630371, -0.03510761260986328, -0.03401970863342285, -0.03293180465698242, -0.03184390068054199, -0.030755996704101562, -0.029668092727661133, -0.028580188751220703, -0.027492284774780273, -0.026404380798339844, -0.025316476821899414, -0.024228572845458984, -0.023140668869018555, -0.022052764892578125, -0.020964860916137695, -0.019876956939697266, -0.018789052963256836, -0.017701148986816406, -0.016613245010375977, -0.015525341033935547, -0.014437437057495117, -0.013349533081054688, -0.012261629104614258, -0.011173725128173828, -0.010085821151733398, -0.008997917175292969, -0.007910013198852539, -0.006822109222412109, -0.00573420524597168, -0.00464630126953125, -0.0035583972930908203, -0.0024704933166503906, -0.001382589340209961, -0.00029468536376953125, 0.0007932186126708984, 0.0018811225891113281, 0.002969026565551758, 0.0040569305419921875, 0.005144834518432617, 0.006232738494873047, 0.0073206424713134766, 0.008408546447753906, 0.009496450424194336, 0.010584354400634766, 0.011672258377075195, 0.012760162353515625, 0.013848066329956055, 0.014935970306396484, 0.016023874282836914, 0.017111778259277344, 0.018199682235717773, 0.019287586212158203, 0.020375490188598633, 0.021463394165039062, 0.022551298141479492, 0.023639202117919922, 0.02472710609436035, 0.02581501007080078, 0.02690291404724121, 0.02799081802368164, 0.02907872200012207, 0.0301666259765625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 9.0, 7.0, 9.0, 11.0, 21.0, 36.0, 77.0, 125.0, 86.0, 44.0, 22.0, 14.0, 5.0, 4.0, 3.0, 5.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24039745330810547, -0.23246397078037262, -0.22453050315380096, -0.21659702062606812, -0.20866355299949646, -0.2007300704717636, -0.19279658794403076, -0.1848631203174591, -0.17692965269088745, -0.1689961701631546, -0.16106270253658295, -0.1531292200088501, -0.14519575238227844, -0.1372622698545456, -0.12932878732681274, -0.12139531970024109, -0.11346183717250824, -0.10552836209535599, -0.09759488701820374, -0.08966140449047089, -0.08172793686389923, -0.07379445433616638, -0.06586097925901413, -0.05792750418186188, -0.049994029104709625, -0.04206055402755737, -0.03412707895040512, -0.02619360014796257, -0.018260125070810318, -0.010326649993658066, -0.002393171191215515, 0.005540303885936737, 0.01347377896308899, 0.02140725404024124, 0.029340730980038643, 0.037274207919836044, 0.045207682996988297, 0.05314115807414055, 0.0610746368765831, 0.06900811195373535, 0.0769415870308876, 0.08487506210803986, 0.09280853718519211, 0.10074201226234436, 0.10867549479007721, 0.11660896241664886, 0.12454244494438171, 0.13247591257095337, 0.14040939509868622, 0.14834287762641907, 0.15627634525299072, 0.16420982778072357, 0.17214329540729523, 0.18007677793502808, 0.18801024556159973, 0.19594372808933258, 0.20387721061706543, 0.21181069314479828, 0.21974416077136993, 0.22767764329910278, 0.23561111092567444, 0.2435445934534073, 0.25147807598114014, 0.2594115436077118, 0.26734501123428345]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 6.0, 4.0, 12.0, 16.0, 19.0, 57.0, 82.0, 93.0, 67.0, 35.0, 17.0, 7.0, 5.0, 4.0, 4.0, 6.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13171684741973877, -0.12739770114421844, -0.12307855486869812, -0.1187594085931778, -0.11444026231765747, -0.11012111604213715, -0.10580196976661682, -0.1014828234910965, -0.09716367721557617, -0.09284453094005585, -0.08852538466453552, -0.0842062383890152, -0.07988709211349487, -0.07556794583797455, -0.07124879956245422, -0.0669296532869339, -0.06261050701141357, -0.05829136073589325, -0.053972214460372925, -0.0496530681848526, -0.045333921909332275, -0.04101477563381195, -0.036695629358291626, -0.0323764830827713, -0.028057336807250977, -0.023738190531730652, -0.019419044256210327, -0.015099897980690002, -0.010780751705169678, -0.006461605429649353, -0.0021424591541290283, 0.0021766871213912964, 0.006495833396911621, 0.010814979672431946, 0.01513412594795227, 0.019453272223472595, 0.02377241849899292, 0.028091564774513245, 0.03241071105003357, 0.036729857325553894, 0.04104900360107422, 0.04536814987659454, 0.04968729615211487, 0.05400644242763519, 0.05832558870315552, 0.06264473497867584, 0.06696388125419617, 0.07128302752971649, 0.07560217380523682, 0.07992132008075714, 0.08424046635627747, 0.08855961263179779, 0.09287875890731812, 0.09719790518283844, 0.10151705145835876, 0.10583619773387909, 0.11015534400939941, 0.11447449028491974, 0.11879363656044006, 0.12311278283596039, 0.1274319291114807, 0.13175107538700104, 0.13607022166252136, 0.1403893679380417, 0.144708514213562]}, "train/train_runtime": 5167.9675, "train/train_samples_per_second": 5.522, "train/train_steps_per_second": 0.086, "train/total_flos": 0.0, "train/train_loss": 4.734800568610563, "eval/loss": 5.330791473388672, "eval/wer": 2.4313764379214597, "eval/runtime": 1116.9995, "eval/samples_per_second": 2.365, "eval/steps_per_second": 0.296, "_wandb": {"runtime": 6670}} \ No newline at end of file