diff --git "a/wandb/run-20220302_021624-vszekdxg/files/wandb-summary.json" "b/wandb/run-20220302_021624-vszekdxg/files/wandb-summary.json" --- "a/wandb/run-20220302_021624-vszekdxg/files/wandb-summary.json" +++ "b/wandb/run-20220302_021624-vszekdxg/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.2767, "train/learning_rate": 2.1276595744680853e-06, "train/epoch": 1.0, "train/global_step": 594, "_runtime": 6892, "_timestamp": 1646194276, "_step": 596, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 9.0, 923.0, 85.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.87272644042969, -32.01921463012695, -20.16570472717285, -8.31219482421875, 3.5413169860839844, 15.394828796386719, 27.248336791992188, 39.10185241699219, 50.955360412597656, 62.80887222290039, 74.66238403320312, 86.5158920288086, 98.36940002441406, 110.22291564941406, 122.07642364501953, 133.929931640625, 145.783447265625, 157.636962890625, 169.49046325683594, 181.34397888183594, 193.19749450683594, 205.05099487304688, 216.90451049804688, 228.75802612304688, 240.61154174804688, 252.46505737304688, 264.3185729980469, 276.17205810546875, 288.02557373046875, 299.87908935546875, 311.73260498046875, 323.58612060546875, 335.4396057128906, 347.2931213378906, 359.1466369628906, 371.0001220703125, 382.8536376953125, 394.7071533203125, 406.5606689453125, 418.4141845703125, 430.2677001953125, 442.1212158203125, 453.9747314453125, 465.8282470703125, 477.6817321777344, 489.5352478027344, 501.3887634277344, 513.2423095703125, 525.0957641601562, 536.9492797851562, 548.8027954101562, 560.6563110351562, 572.5098266601562, 584.3633422851562, 596.216796875, 608.0703125, 619.9238891601562, 631.7774047851562, 643.6309204101562, 655.4844360351562, 667.3379516601562, 679.1914672851562, 691.044921875, 702.8984375, 714.751953125]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 6.0, 4.0, 8.0, 11.0, 17.0, 16.0, 17.0, 21.0, 28.0, 22.0, 38.0, 39.0, 49.0, 43.0, 54.0, 38.0, 54.0, 53.0, 52.0, 53.0, 51.0, 42.0, 36.0, 42.0, 33.0, 34.0, 42.0, 24.0, 20.0, 8.0, 9.0, 12.0, 5.0, 6.0, 1.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.28767395019531, -48.571067810058594, -46.854461669921875, -45.137855529785156, -43.42124938964844, -41.70464324951172, -39.988037109375, -38.27143096923828, -36.55482482910156, -34.838218688964844, -33.121612548828125, -31.405006408691406, -29.688400268554688, -27.97179412841797, -26.25518798828125, -24.53858184814453, -22.821977615356445, -21.105371475219727, -19.388765335083008, -17.67215919494629, -15.95555305480957, -14.238947868347168, -12.52234172821045, -10.80573558807373, -9.089129447937012, -7.372523307800293, -5.655917167663574, -3.9393115043640137, -2.222705364227295, -0.5060997009277344, 1.2105064392089844, 2.927112579345703, 4.643718719482422, 6.360324859619141, 8.07693099975586, 9.793537139892578, 11.510143280029297, 13.2267484664917, 14.943354606628418, 16.659961700439453, 18.376567840576172, 20.09317398071289, 21.80978012084961, 23.526386260986328, 25.242992401123047, 26.959598541259766, 28.676204681396484, 30.392810821533203, 32.109413146972656, 33.826019287109375, 35.542625427246094, 37.25923156738281, 38.97583770751953, 40.69244384765625, 42.40904998779297, 44.12565612792969, 45.842262268066406, 47.558868408203125, 49.275474548339844, 50.99208068847656, 52.70868682861328, 54.42529296875, 56.14189910888672, 57.85850524902344, 59.575111389160156]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 9.0, 10.0, 4.0, 12.0, 16.0, 9.0, 12.0, 19.0, 23.0, 19.0, 24.0, 36.0, 27.0, 38.0, 25.0, 35.0, 33.0, 40.0, 37.0, 39.0, 41.0, 29.0, 38.0, 46.0, 28.0, 43.0, 35.0, 32.0, 28.0, 31.0, 29.0, 25.0, 31.0, 17.0, 21.0, 10.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.64453125, -1.59210205078125, -1.5396728515625, -1.48724365234375, -1.434814453125, -1.38238525390625, -1.3299560546875, -1.27752685546875, -1.22509765625, -1.17266845703125, -1.1202392578125, -1.06781005859375, -1.015380859375, -0.96295166015625, -0.9105224609375, -0.85809326171875, -0.8056640625, -0.75323486328125, -0.7008056640625, -0.64837646484375, -0.595947265625, -0.54351806640625, -0.4910888671875, -0.43865966796875, -0.38623046875, -0.33380126953125, -0.2813720703125, -0.22894287109375, -0.176513671875, -0.12408447265625, -0.0716552734375, -0.01922607421875, 0.033203125, 0.08563232421875, 0.1380615234375, 0.19049072265625, 0.242919921875, 0.29534912109375, 0.3477783203125, 0.40020751953125, 0.45263671875, 0.50506591796875, 0.5574951171875, 0.60992431640625, 0.662353515625, 0.71478271484375, 0.7672119140625, 0.81964111328125, 0.8720703125, 0.92449951171875, 0.9769287109375, 1.02935791015625, 1.081787109375, 1.13421630859375, 1.1866455078125, 1.23907470703125, 1.29150390625, 1.34393310546875, 1.3963623046875, 1.44879150390625, 1.501220703125, 1.55364990234375, 1.6060791015625, 1.65850830078125, 1.7109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 9.0, 10.0, 16.0, 17.0, 22.0, 27.0, 30.0, 48.0, 65.0, 93.0, 82.0, 140.0, 221.0, 317.0, 511.0, 797.0, 1340.0, 2651.0, 7074.0, 28746.0, 255415.0, 3042783.0, 777788.0, 57020.0, 10956.0, 3779.0, 1617.0, 921.0, 563.0, 375.0, 237.0, 190.0, 113.0, 89.0, 54.0, 42.0, 26.0, 22.0, 12.0, 12.0, 7.0, 5.0, 6.0, 10.0, 10.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.796875, -8.5277099609375, -8.258544921875, -7.9893798828125, -7.72021484375, -7.4510498046875, -7.181884765625, -6.9127197265625, -6.6435546875, -6.3743896484375, -6.105224609375, -5.8360595703125, -5.56689453125, -5.2977294921875, -5.028564453125, -4.7593994140625, -4.490234375, -4.2210693359375, -3.951904296875, -3.6827392578125, -3.41357421875, -3.1444091796875, -2.875244140625, -2.6060791015625, -2.3369140625, -2.0677490234375, -1.798583984375, -1.5294189453125, -1.26025390625, -0.9910888671875, -0.721923828125, -0.4527587890625, -0.18359375, 0.0855712890625, 0.354736328125, 0.6239013671875, 0.89306640625, 1.1622314453125, 1.431396484375, 1.7005615234375, 1.9697265625, 2.2388916015625, 2.508056640625, 2.7772216796875, 3.04638671875, 3.3155517578125, 3.584716796875, 3.8538818359375, 4.123046875, 4.3922119140625, 4.661376953125, 4.9305419921875, 5.19970703125, 5.4688720703125, 5.738037109375, 6.0072021484375, 6.2763671875, 6.5455322265625, 6.814697265625, 7.0838623046875, 7.35302734375, 7.6221923828125, 7.891357421875, 8.1605224609375, 8.4296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 15.0, 18.0, 40.0, 65.0, 100.0, 182.0, 312.0, 521.0, 780.0, 720.0, 504.0, 298.0, 161.0, 115.0, 90.0, 47.0, 32.0, 21.0, 17.0, 7.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.3828125, -12.04638671875, -11.7099609375, -11.37353515625, -11.037109375, -10.70068359375, -10.3642578125, -10.02783203125, -9.69140625, -9.35498046875, -9.0185546875, -8.68212890625, -8.345703125, -8.00927734375, -7.6728515625, -7.33642578125, -7.0, -6.66357421875, -6.3271484375, -5.99072265625, -5.654296875, -5.31787109375, -4.9814453125, -4.64501953125, -4.30859375, -3.97216796875, -3.6357421875, -3.29931640625, -2.962890625, -2.62646484375, -2.2900390625, -1.95361328125, -1.6171875, -1.28076171875, -0.9443359375, -0.60791015625, -0.271484375, 0.06494140625, 0.4013671875, 0.73779296875, 1.07421875, 1.41064453125, 1.7470703125, 2.08349609375, 2.419921875, 2.75634765625, 3.0927734375, 3.42919921875, 3.765625, 4.10205078125, 4.4384765625, 4.77490234375, 5.111328125, 5.44775390625, 5.7841796875, 6.12060546875, 6.45703125, 6.79345703125, 7.1298828125, 7.46630859375, 7.802734375, 8.13916015625, 8.4755859375, 8.81201171875, 9.1484375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 8.0, 9.0, 10.0, 13.0, 31.0, 52.0, 94.0, 156.0, 366.0, 691.0, 1758.0, 8100.0, 1546976.0, 2622237.0, 9988.0, 2071.0, 774.0, 431.0, 208.0, 105.0, 80.0, 41.0, 18.0, 11.0, 5.0, 15.0, 11.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.25, -36.15576171875, -35.0615234375, -33.96728515625, -32.873046875, -31.77880859375, -30.6845703125, -29.59033203125, -28.49609375, -27.40185546875, -26.3076171875, -25.21337890625, -24.119140625, -23.02490234375, -21.9306640625, -20.83642578125, -19.7421875, -18.64794921875, -17.5537109375, -16.45947265625, -15.365234375, -14.27099609375, -13.1767578125, -12.08251953125, -10.98828125, -9.89404296875, -8.7998046875, -7.70556640625, -6.611328125, -5.51708984375, -4.4228515625, -3.32861328125, -2.234375, -1.14013671875, -0.0458984375, 1.04833984375, 2.142578125, 3.23681640625, 4.3310546875, 5.42529296875, 6.51953125, 7.61376953125, 8.7080078125, 9.80224609375, 10.896484375, 11.99072265625, 13.0849609375, 14.17919921875, 15.2734375, 16.36767578125, 17.4619140625, 18.55615234375, 19.650390625, 20.74462890625, 21.8388671875, 22.93310546875, 24.02734375, 25.12158203125, 26.2158203125, 27.31005859375, 28.404296875, 29.49853515625, 30.5927734375, 31.68701171875, 32.78125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 384.0, 620.0, 11.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-496.1153564453125, -487.0934143066406, -478.07147216796875, -469.04949951171875, -460.0275573730469, -451.005615234375, -441.9836730957031, -432.96173095703125, -423.93975830078125, -414.9178161621094, -405.8958740234375, -396.8739013671875, -387.8519592285156, -378.83001708984375, -369.8080749511719, -360.7861328125, -351.7641906738281, -342.74224853515625, -333.7203063964844, -324.6983337402344, -315.6763916015625, -306.6544494628906, -297.63250732421875, -288.6105651855469, -279.588623046875, -270.5666809082031, -261.54473876953125, -252.5227813720703, -243.50082397460938, -234.4788818359375, -225.45693969726562, -216.43499755859375, -207.41305541992188, -198.39111328125, -189.36915588378906, -180.3472137451172, -171.32525634765625, -162.30331420898438, -153.2813720703125, -144.25942993164062, -135.2374725341797, -126.21552276611328, -117.19357299804688, -108.171630859375, -99.1496810913086, -90.12773132324219, -81.10578918457031, -72.0838394165039, -63.0618896484375, -54.039939880371094, -45.01799392700195, -35.99604797363281, -26.974098205566406, -17.9521484375, -8.93020248413086, 0.09174346923828125, 9.113693237304688, 18.13564109802246, 27.157588958740234, 36.179534912109375, 45.20148468017578, 54.22343444824219, 63.24538040161133, 72.26732635498047, 81.28927612304688]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 5.0, 10.0, 15.0, 20.0, 25.0, 26.0, 29.0, 32.0, 45.0, 48.0, 48.0, 61.0, 62.0, 58.0, 74.0, 74.0, 61.0, 57.0, 45.0, 42.0, 30.0, 32.0, 28.0, 17.0, 16.0, 10.0, 8.0, 8.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.311134338378906, -54.782867431640625, -53.254600524902344, -51.72633361816406, -50.19806671142578, -48.6697998046875, -47.14153289794922, -45.61326599121094, -44.084999084472656, -42.556732177734375, -41.028465270996094, -39.50019836425781, -37.97193145751953, -36.44366455078125, -34.91539764404297, -33.38713073730469, -31.85886573791504, -30.330598831176758, -28.802331924438477, -27.274065017700195, -25.745798110961914, -24.217531204223633, -22.689266204833984, -21.160999298095703, -19.632732391357422, -18.10446548461914, -16.57619857788086, -15.047931671142578, -13.519664764404297, -11.991397857666016, -10.46313190460205, -8.93486499786377, -7.406597137451172, -5.878330230712891, -4.350063323974609, -2.8217968940734863, -1.293529987335205, 0.23473691940307617, 1.7630033493041992, 3.2912702560424805, 4.819537162780762, 6.347804069519043, 7.876070976257324, 9.404336929321289, 10.93260383605957, 12.460870742797852, 13.989137649536133, 15.517404556274414, 17.045671463012695, 18.573938369750977, 20.102205276489258, 21.63047218322754, 23.15873908996582, 24.6870059967041, 26.21527099609375, 27.74353790283203, 29.271804809570312, 30.800071716308594, 32.328338623046875, 33.856605529785156, 35.38487243652344, 36.91313934326172, 38.44140625, 39.96967315673828, 41.49794006347656]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 4.0, 6.0, 4.0, 5.0, 8.0, 12.0, 8.0, 12.0, 22.0, 18.0, 18.0, 19.0, 22.0, 20.0, 25.0, 27.0, 36.0, 37.0, 29.0, 32.0, 31.0, 49.0, 35.0, 47.0, 31.0, 41.0, 42.0, 30.0, 32.0, 37.0, 36.0, 28.0, 31.0, 23.0, 15.0, 22.0, 16.0, 22.0, 11.0, 14.0, 12.0, 3.0, 4.0, 10.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.771484375, -1.717926025390625, -1.66436767578125, -1.610809326171875, -1.5572509765625, -1.503692626953125, -1.45013427734375, -1.396575927734375, -1.343017578125, -1.289459228515625, -1.23590087890625, -1.182342529296875, -1.1287841796875, -1.075225830078125, -1.02166748046875, -0.968109130859375, -0.91455078125, -0.860992431640625, -0.80743408203125, -0.753875732421875, -0.7003173828125, -0.646759033203125, -0.59320068359375, -0.539642333984375, -0.486083984375, -0.432525634765625, -0.37896728515625, -0.325408935546875, -0.2718505859375, -0.218292236328125, -0.16473388671875, -0.111175537109375, -0.0576171875, -0.004058837890625, 0.04949951171875, 0.103057861328125, 0.1566162109375, 0.210174560546875, 0.26373291015625, 0.317291259765625, 0.370849609375, 0.424407958984375, 0.47796630859375, 0.531524658203125, 0.5850830078125, 0.638641357421875, 0.69219970703125, 0.745758056640625, 0.79931640625, 0.852874755859375, 0.90643310546875, 0.959991455078125, 1.0135498046875, 1.067108154296875, 1.12066650390625, 1.174224853515625, 1.227783203125, 1.281341552734375, 1.33489990234375, 1.388458251953125, 1.4420166015625, 1.495574951171875, 1.54913330078125, 1.602691650390625, 1.65625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 9.0, 18.0, 21.0, 34.0, 38.0, 64.0, 92.0, 137.0, 190.0, 302.0, 368.0, 608.0, 833.0, 1344.0, 1884.0, 2947.0, 4315.0, 6756.0, 10448.0, 16068.0, 24776.0, 39014.0, 60683.0, 93016.0, 137368.0, 178796.0, 155979.0, 109966.0, 71956.0, 46150.0, 29586.0, 19178.0, 11938.0, 7947.0, 5279.0, 3415.0, 2324.0, 1537.0, 1019.0, 700.0, 457.0, 320.0, 222.0, 117.0, 118.0, 63.0, 55.0, 43.0, 26.0, 17.0, 9.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1435546875, -0.13916397094726562, -0.13477325439453125, -0.13038253784179688, -0.1259918212890625, -0.12160110473632812, -0.11721038818359375, -0.11281967163085938, -0.108428955078125, -0.10403823852539062, -0.09964752197265625, -0.09525680541992188, -0.0908660888671875, -0.08647537231445312, -0.08208465576171875, -0.07769393920898438, -0.07330322265625, -0.06891250610351562, -0.06452178955078125, -0.060131072998046875, -0.0557403564453125, -0.051349639892578125, -0.04695892333984375, -0.042568206787109375, -0.038177490234375, -0.033786773681640625, -0.02939605712890625, -0.025005340576171875, -0.0206146240234375, -0.016223907470703125, -0.01183319091796875, -0.007442474365234375, -0.0030517578125, 0.001338958740234375, 0.00572967529296875, 0.010120391845703125, 0.0145111083984375, 0.018901824951171875, 0.02329254150390625, 0.027683258056640625, 0.032073974609375, 0.036464691162109375, 0.04085540771484375, 0.045246124267578125, 0.0496368408203125, 0.054027557373046875, 0.05841827392578125, 0.06280899047851562, 0.06719970703125, 0.07159042358398438, 0.07598114013671875, 0.08037185668945312, 0.0847625732421875, 0.08915328979492188, 0.09354400634765625, 0.09793472290039062, 0.102325439453125, 0.10671615600585938, 0.11110687255859375, 0.11549758911132812, 0.1198883056640625, 0.12427902221679688, 0.12866973876953125, 0.13306045532226562, 0.137451171875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 8.0, 7.0, 11.0, 13.0, 13.0, 14.0, 23.0, 17.0, 19.0, 16.0, 29.0, 21.0, 33.0, 35.0, 29.0, 37.0, 22.0, 35.0, 44.0, 38.0, 1060.0, 35.0, 36.0, 34.0, 42.0, 34.0, 31.0, 32.0, 37.0, 18.0, 26.0, 13.0, 25.0, 16.0, 23.0, 11.0, 15.0, 9.0, 9.0, 8.0, 15.0, 4.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.1064453125, -1.072662353515625, -1.03887939453125, -1.005096435546875, -0.9713134765625, -0.937530517578125, -0.90374755859375, -0.869964599609375, -0.836181640625, -0.802398681640625, -0.76861572265625, -0.734832763671875, -0.7010498046875, -0.667266845703125, -0.63348388671875, -0.599700927734375, -0.56591796875, -0.532135009765625, -0.49835205078125, -0.464569091796875, -0.4307861328125, -0.397003173828125, -0.36322021484375, -0.329437255859375, -0.295654296875, -0.261871337890625, -0.22808837890625, -0.194305419921875, -0.1605224609375, -0.126739501953125, -0.09295654296875, -0.059173583984375, -0.025390625, 0.008392333984375, 0.04217529296875, 0.075958251953125, 0.1097412109375, 0.143524169921875, 0.17730712890625, 0.211090087890625, 0.244873046875, 0.278656005859375, 0.31243896484375, 0.346221923828125, 0.3800048828125, 0.413787841796875, 0.44757080078125, 0.481353759765625, 0.51513671875, 0.548919677734375, 0.58270263671875, 0.616485595703125, 0.6502685546875, 0.684051513671875, 0.71783447265625, 0.751617431640625, 0.785400390625, 0.819183349609375, 0.85296630859375, 0.886749267578125, 0.9205322265625, 0.954315185546875, 0.98809814453125, 1.021881103515625, 1.0556640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 6.0, 4.0, 10.0, 6.0, 11.0, 20.0, 26.0, 41.0, 59.0, 90.0, 124.0, 165.0, 296.0, 388.0, 599.0, 903.0, 1322.0, 2070.0, 3231.0, 4965.0, 7650.0, 11672.0, 18476.0, 27734.0, 42064.0, 62696.0, 89930.0, 121550.0, 979118.0, 348097.0, 115483.0, 85317.0, 58969.0, 39578.0, 26107.0, 16836.0, 11080.0, 7076.0, 4592.0, 2938.0, 1968.0, 1263.0, 883.0, 563.0, 373.0, 258.0, 174.0, 122.0, 78.0, 38.0, 35.0, 28.0, 18.0, 12.0, 8.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.0828857421875, -0.08028888702392578, -0.07769203186035156, -0.07509517669677734, -0.07249832153320312, -0.0699014663696289, -0.06730461120605469, -0.06470775604248047, -0.06211090087890625, -0.05951404571533203, -0.05691719055175781, -0.054320335388183594, -0.051723480224609375, -0.049126625061035156, -0.04652976989746094, -0.04393291473388672, -0.0413360595703125, -0.03873920440673828, -0.03614234924316406, -0.033545494079589844, -0.030948638916015625, -0.028351783752441406, -0.025754928588867188, -0.02315807342529297, -0.02056121826171875, -0.01796436309814453, -0.015367507934570312, -0.012770652770996094, -0.010173797607421875, -0.007576942443847656, -0.0049800872802734375, -0.0023832321166992188, 0.000213623046875, 0.0028104782104492188, 0.0054073333740234375, 0.008004188537597656, 0.010601043701171875, 0.013197898864746094, 0.015794754028320312, 0.01839160919189453, 0.02098846435546875, 0.02358531951904297, 0.026182174682617188, 0.028779029846191406, 0.031375885009765625, 0.033972740173339844, 0.03656959533691406, 0.03916645050048828, 0.0417633056640625, 0.04436016082763672, 0.04695701599121094, 0.049553871154785156, 0.052150726318359375, 0.054747581481933594, 0.05734443664550781, 0.05994129180908203, 0.06253814697265625, 0.06513500213623047, 0.06773185729980469, 0.0703287124633789, 0.07292556762695312, 0.07552242279052734, 0.07811927795410156, 0.08071613311767578, 0.08331298828125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 1.0, 6.0, 4.0, 11.0, 10.0, 6.0, 9.0, 8.0, 11.0, 13.0, 23.0, 23.0, 27.0, 45.0, 37.0, 59.0, 75.0, 70.0, 99.0, 88.0, 67.0, 46.0, 44.0, 32.0, 31.0, 23.0, 26.0, 21.0, 16.0, 10.0, 12.0, 7.0, 4.0, 2.0, 6.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00447845458984375, -0.004344522953033447, -0.0042105913162231445, -0.004076659679412842, -0.003942728042602539, -0.0038087964057922363, -0.0036748647689819336, -0.003540933132171631, -0.003407001495361328, -0.0032730698585510254, -0.0031391382217407227, -0.00300520658493042, -0.002871274948120117, -0.0027373433113098145, -0.0026034116744995117, -0.002469480037689209, -0.0023355484008789062, -0.0022016167640686035, -0.0020676851272583008, -0.001933753490447998, -0.0017998218536376953, -0.0016658902168273926, -0.0015319585800170898, -0.0013980269432067871, -0.0012640953063964844, -0.0011301636695861816, -0.000996232032775879, -0.0008623003959655762, -0.0007283687591552734, -0.0005944371223449707, -0.00046050548553466797, -0.00032657384872436523, -0.0001926422119140625, -5.8710575103759766e-05, 7.522106170654297e-05, 0.0002091526985168457, 0.00034308433532714844, 0.00047701597213745117, 0.0006109476089477539, 0.0007448792457580566, 0.0008788108825683594, 0.0010127425193786621, 0.0011466741561889648, 0.0012806057929992676, 0.0014145374298095703, 0.001548469066619873, 0.0016824007034301758, 0.0018163323402404785, 0.0019502639770507812, 0.002084195613861084, 0.0022181272506713867, 0.0023520588874816895, 0.002485990524291992, 0.002619922161102295, 0.0027538537979125977, 0.0028877854347229004, 0.003021717071533203, 0.003155648708343506, 0.0032895803451538086, 0.0034235119819641113, 0.003557443618774414, 0.003691375255584717, 0.0038253068923950195, 0.003959238529205322, 0.004093170166015625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 11.0, 11.0, 7.0, 15.0, 19.0, 18.0, 21.0, 19.0, 29.0, 53.0, 43.0, 86.0, 92.0, 126.0, 211.0, 289.0, 490.0, 1299.0, 944716.0, 98725.0, 851.0, 475.0, 252.0, 197.0, 108.0, 101.0, 56.0, 37.0, 33.0, 24.0, 25.0, 14.0, 19.0, 13.0, 14.0, 7.0, 11.0, 12.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08233642578125, -0.07957935333251953, -0.07682228088378906, -0.0740652084350586, -0.07130813598632812, -0.06855106353759766, -0.06579399108886719, -0.06303691864013672, -0.06027984619140625, -0.05752277374267578, -0.05476570129394531, -0.052008628845214844, -0.049251556396484375, -0.046494483947753906, -0.04373741149902344, -0.04098033905029297, -0.0382232666015625, -0.03546619415283203, -0.03270912170410156, -0.029952049255371094, -0.027194976806640625, -0.024437904357910156, -0.021680831909179688, -0.01892375946044922, -0.01616668701171875, -0.013409614562988281, -0.010652542114257812, -0.007895469665527344, -0.005138397216796875, -0.0023813247680664062, 0.0003757476806640625, 0.0031328201293945312, 0.005889892578125, 0.008646965026855469, 0.011404037475585938, 0.014161109924316406, 0.016918182373046875, 0.019675254821777344, 0.022432327270507812, 0.02518939971923828, 0.02794647216796875, 0.03070354461669922, 0.03346061706542969, 0.036217689514160156, 0.038974761962890625, 0.041731834411621094, 0.04448890686035156, 0.04724597930908203, 0.0500030517578125, 0.05276012420654297, 0.05551719665527344, 0.058274269104003906, 0.061031341552734375, 0.06378841400146484, 0.06654548645019531, 0.06930255889892578, 0.07205963134765625, 0.07481670379638672, 0.07757377624511719, 0.08033084869384766, 0.08308792114257812, 0.0858449935913086, 0.08860206604003906, 0.09135913848876953, 0.0941162109375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 223.0, 794.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10006608814001083, -0.09713046997785568, -0.09419485181570053, -0.09125923365354538, -0.08832362294197083, -0.08538800477981567, -0.08245238661766052, -0.07951676845550537, -0.07658115029335022, -0.07364553213119507, -0.07070991396903992, -0.06777429580688477, -0.06483867764472961, -0.06190306320786476, -0.05896744877099991, -0.05603183060884476, -0.053096212446689606, -0.050160594284534454, -0.0472249761223793, -0.04428936168551445, -0.0413537435233593, -0.03841812536120415, -0.035482510924339294, -0.03254689276218414, -0.02961127460002899, -0.02667565643787384, -0.023740040138363838, -0.020804423838853836, -0.017868805676698685, -0.014933188445866108, -0.011997571215033531, -0.009061954915523529, -0.006126329302787781, -0.003190712071955204, -0.00025509484112262726, 0.0026805223897099495, 0.005616139620542526, 0.008551756851375103, 0.01148737408220768, 0.014422990381717682, 0.017358608543872833, 0.020294226706027985, 0.023229843005537987, 0.02616545930504799, 0.02910107746720314, 0.03203669562935829, 0.034972310066223145, 0.037907928228378296, 0.04084354639053345, 0.0437791645526886, 0.04671478271484375, 0.0496503971517086, 0.052586015313863754, 0.055521633476018906, 0.05845724791288376, 0.06139286607503891, 0.06432848423719406, 0.06726410239934921, 0.07019972056150436, 0.07313533872365952, 0.07607094943523407, 0.07900656759738922, 0.08194218575954437, 0.08487780392169952, 0.08781342208385468]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 13.0, 15.0, 31.0, 25.0, 34.0, 36.0, 42.0, 49.0, 68.0, 82.0, 87.0, 73.0, 63.0, 68.0, 48.0, 53.0, 41.0, 42.0, 32.0, 23.0, 24.0, 19.0, 7.0, 8.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004254341125488281, -0.004040941596031189, -0.0038275420665740967, -0.0036141425371170044, -0.003400743007659912, -0.00318734347820282, -0.0029739439487457275, -0.0027605444192886353, -0.002547144889831543, -0.0023337453603744507, -0.0021203458309173584, -0.0019069463014602661, -0.0016935467720031738, -0.0014801472425460815, -0.0012667477130889893, -0.001053348183631897, -0.0008399486541748047, -0.0006265491247177124, -0.0004131495952606201, -0.00019975006580352783, 1.3649463653564453e-05, 0.00022704899311065674, 0.000440448522567749, 0.0006538480520248413, 0.0008672475814819336, 0.0010806471109390259, 0.0012940466403961182, 0.0015074461698532104, 0.0017208456993103027, 0.001934245228767395, 0.0021476447582244873, 0.0023610442876815796, 0.002574443817138672, 0.002787843346595764, 0.0030012428760528564, 0.0032146424055099487, 0.003428041934967041, 0.0036414414644241333, 0.0038548409938812256, 0.004068240523338318, 0.00428164005279541, 0.0044950395822525024, 0.004708439111709595, 0.004921838641166687, 0.005135238170623779, 0.005348637700080872, 0.005562037229537964, 0.005775436758995056, 0.0059888362884521484, 0.006202235817909241, 0.006415635347366333, 0.006629034876823425, 0.006842434406280518, 0.00705583393573761, 0.007269233465194702, 0.007482632994651794, 0.007696032524108887, 0.007909432053565979, 0.008122831583023071, 0.008336231112480164, 0.008549630641937256, 0.008763030171394348, 0.00897642970085144, 0.009189829230308533, 0.009403228759765625]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 4.0, 6.0, 4.0, 5.0, 8.0, 12.0, 8.0, 12.0, 22.0, 18.0, 18.0, 19.0, 22.0, 20.0, 25.0, 27.0, 36.0, 37.0, 29.0, 32.0, 31.0, 50.0, 34.0, 47.0, 31.0, 41.0, 42.0, 30.0, 32.0, 38.0, 35.0, 28.0, 31.0, 23.0, 15.0, 22.0, 16.0, 21.0, 12.0, 14.0, 12.0, 3.0, 4.0, 10.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.771484375, -1.717926025390625, -1.66436767578125, -1.610809326171875, -1.5572509765625, -1.503692626953125, -1.45013427734375, -1.396575927734375, -1.343017578125, -1.289459228515625, -1.23590087890625, -1.182342529296875, -1.1287841796875, -1.075225830078125, -1.02166748046875, -0.968109130859375, -0.91455078125, -0.860992431640625, -0.80743408203125, -0.753875732421875, -0.7003173828125, -0.646759033203125, -0.59320068359375, -0.539642333984375, -0.486083984375, -0.432525634765625, -0.37896728515625, -0.325408935546875, -0.2718505859375, -0.218292236328125, -0.16473388671875, -0.111175537109375, -0.0576171875, -0.004058837890625, 0.04949951171875, 0.103057861328125, 0.1566162109375, 0.210174560546875, 0.26373291015625, 0.317291259765625, 0.370849609375, 0.424407958984375, 0.47796630859375, 0.531524658203125, 0.5850830078125, 0.638641357421875, 0.69219970703125, 0.745758056640625, 0.79931640625, 0.852874755859375, 0.90643310546875, 0.959991455078125, 1.0135498046875, 1.067108154296875, 1.12066650390625, 1.174224853515625, 1.227783203125, 1.281341552734375, 1.33489990234375, 1.388458251953125, 1.4420166015625, 1.495574951171875, 1.54913330078125, 1.602691650390625, 1.65625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 20.0, 31.0, 21.0, 34.0, 47.0, 54.0, 74.0, 98.0, 153.0, 186.0, 232.0, 319.0, 486.0, 627.0, 853.0, 1198.0, 1703.0, 2583.0, 3726.0, 5796.0, 9347.0, 16432.0, 34837.0, 92764.0, 262451.0, 352889.0, 152828.0, 52539.0, 22456.0, 11931.0, 7066.0, 4491.0, 2947.0, 2084.0, 1505.0, 1044.0, 702.0, 537.0, 364.0, 293.0, 218.0, 162.0, 117.0, 77.0, 61.0, 46.0, 41.0, 20.0, 21.0, 14.0, 11.0, 9.0, 7.0, 2.0, 4.0, 1.0], "bins": [-4.81640625, -4.67144775390625, -4.5264892578125, -4.38153076171875, -4.236572265625, -4.09161376953125, -3.9466552734375, -3.80169677734375, -3.65673828125, -3.51177978515625, -3.3668212890625, -3.22186279296875, -3.076904296875, -2.93194580078125, -2.7869873046875, -2.64202880859375, -2.4970703125, -2.35211181640625, -2.2071533203125, -2.06219482421875, -1.917236328125, -1.77227783203125, -1.6273193359375, -1.48236083984375, -1.33740234375, -1.19244384765625, -1.0474853515625, -0.90252685546875, -0.757568359375, -0.61260986328125, -0.4676513671875, -0.32269287109375, -0.177734375, -0.03277587890625, 0.1121826171875, 0.25714111328125, 0.402099609375, 0.54705810546875, 0.6920166015625, 0.83697509765625, 0.98193359375, 1.12689208984375, 1.2718505859375, 1.41680908203125, 1.561767578125, 1.70672607421875, 1.8516845703125, 1.99664306640625, 2.1416015625, 2.28656005859375, 2.4315185546875, 2.57647705078125, 2.721435546875, 2.86639404296875, 3.0113525390625, 3.15631103515625, 3.30126953125, 3.44622802734375, 3.5911865234375, 3.73614501953125, 3.881103515625, 4.02606201171875, 4.1710205078125, 4.31597900390625, 4.4609375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 2.0, 4.0, 6.0, 10.0, 10.0, 5.0, 12.0, 8.0, 21.0, 13.0, 18.0, 25.0, 36.0, 30.0, 35.0, 33.0, 60.0, 60.0, 93.0, 203.0, 281.0, 1295.0, 193.0, 136.0, 85.0, 65.0, 54.0, 39.0, 39.0, 31.0, 23.0, 28.0, 21.0, 7.0, 13.0, 14.0, 13.0, 10.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7734375, -5.5811767578125, -5.388916015625, -5.1966552734375, -5.00439453125, -4.8121337890625, -4.619873046875, -4.4276123046875, -4.2353515625, -4.0430908203125, -3.850830078125, -3.6585693359375, -3.46630859375, -3.2740478515625, -3.081787109375, -2.8895263671875, -2.697265625, -2.5050048828125, -2.312744140625, -2.1204833984375, -1.92822265625, -1.7359619140625, -1.543701171875, -1.3514404296875, -1.1591796875, -0.9669189453125, -0.774658203125, -0.5823974609375, -0.39013671875, -0.1978759765625, -0.005615234375, 0.1866455078125, 0.37890625, 0.5711669921875, 0.763427734375, 0.9556884765625, 1.14794921875, 1.3402099609375, 1.532470703125, 1.7247314453125, 1.9169921875, 2.1092529296875, 2.301513671875, 2.4937744140625, 2.68603515625, 2.8782958984375, 3.070556640625, 3.2628173828125, 3.455078125, 3.6473388671875, 3.839599609375, 4.0318603515625, 4.22412109375, 4.4163818359375, 4.608642578125, 4.8009033203125, 4.9931640625, 5.1854248046875, 5.377685546875, 5.5699462890625, 5.76220703125, 5.9544677734375, 6.146728515625, 6.3389892578125, 6.53125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 8.0, 4.0, 4.0, 12.0, 8.0, 13.0, 16.0, 21.0, 19.0, 16.0, 20.0, 34.0, 54.0, 64.0, 104.0, 177.0, 458.0, 1468.0, 45252.0, 3068675.0, 27089.0, 1273.0, 373.0, 168.0, 94.0, 54.0, 44.0, 25.0, 36.0, 21.0, 14.0, 16.0, 8.0, 7.0, 12.0, 8.0, 3.0, 7.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.375, -20.6494140625, -19.923828125, -19.1982421875, -18.47265625, -17.7470703125, -17.021484375, -16.2958984375, -15.5703125, -14.8447265625, -14.119140625, -13.3935546875, -12.66796875, -11.9423828125, -11.216796875, -10.4912109375, -9.765625, -9.0400390625, -8.314453125, -7.5888671875, -6.86328125, -6.1376953125, -5.412109375, -4.6865234375, -3.9609375, -3.2353515625, -2.509765625, -1.7841796875, -1.05859375, -0.3330078125, 0.392578125, 1.1181640625, 1.84375, 2.5693359375, 3.294921875, 4.0205078125, 4.74609375, 5.4716796875, 6.197265625, 6.9228515625, 7.6484375, 8.3740234375, 9.099609375, 9.8251953125, 10.55078125, 11.2763671875, 12.001953125, 12.7275390625, 13.453125, 14.1787109375, 14.904296875, 15.6298828125, 16.35546875, 17.0810546875, 17.806640625, 18.5322265625, 19.2578125, 19.9833984375, 20.708984375, 21.4345703125, 22.16015625, 22.8857421875, 23.611328125, 24.3369140625, 25.0625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 16.0, 990.0, 11.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.18864440917969, -31.492420196533203, -25.79619598388672, -20.099971771240234, -14.40374755859375, -8.707523345947266, -3.0112991333007812, 2.684925079345703, 8.381149291992188, 14.077373504638672, 19.773597717285156, 25.46982192993164, 31.166046142578125, 36.86227035522461, 42.558494567871094, 48.25471878051758, 53.95094299316406, 59.64716720581055, 65.34339141845703, 71.03961181640625, 76.73583984375, 82.43206787109375, 88.12828826904297, 93.82450866699219, 99.52073669433594, 105.21696472167969, 110.9131851196289, 116.60940551757812, 122.30563354492188, 128.00186157226562, 133.69808959960938, 139.39430236816406, 145.09054565429688, 150.78677368164062, 156.48300170898438, 162.17921447753906, 167.8754425048828, 173.57167053222656, 179.26788330078125, 184.964111328125, 190.66033935546875, 196.3565673828125, 202.05279541015625, 207.74900817871094, 213.4452362060547, 219.14146423339844, 224.83767700195312, 230.53390502929688, 236.23013305664062, 241.92636108398438, 247.62258911132812, 253.3188018798828, 259.0150146484375, 264.71124267578125, 270.407470703125, 276.10369873046875, 281.7999267578125, 287.49615478515625, 293.1923828125, 298.88861083984375, 304.5848388671875, 310.2810363769531, 315.9772644042969, 321.6734924316406, 327.3697204589844]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 1.0, 8.0, 8.0, 3.0, 8.0, 8.0, 17.0, 9.0, 15.0, 12.0, 14.0, 21.0, 18.0, 25.0, 27.0, 27.0, 37.0, 43.0, 45.0, 46.0, 43.0, 40.0, 54.0, 38.0, 38.0, 40.0, 39.0, 32.0, 30.0, 30.0, 27.0, 21.0, 18.0, 25.0, 23.0, 13.0, 15.0, 15.0, 11.0, 10.0, 16.0, 4.0, 9.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-17.912866592407227, -17.33602523803711, -16.759183883666992, -16.182342529296875, -15.605502128601074, -15.028660774230957, -14.451820373535156, -13.874979019165039, -13.298137664794922, -12.721296310424805, -12.144454956054688, -11.567614555358887, -10.99077320098877, -10.413931846618652, -9.837091445922852, -9.260250091552734, -8.683408737182617, -8.1065673828125, -7.529726505279541, -6.952885627746582, -6.376044273376465, -5.799202919006348, -5.222362041473389, -4.64552116394043, -4.0686798095703125, -3.4918386936187744, -2.9149975776672363, -2.3381564617156982, -1.7613153457641602, -1.184474229812622, -0.607633113861084, -0.030792236328125, 0.5460491180419922, 1.1228902339935303, 1.6997313499450684, 2.2765724658966064, 2.8534135818481445, 3.4302546977996826, 4.007095813751221, 4.58393669128418, 5.160778045654297, 5.737619400024414, 6.314460277557373, 6.891301155090332, 7.468142509460449, 8.044983863830566, 8.621824264526367, 9.198665618896484, 9.775506973266602, 10.352348327636719, 10.929189682006836, 11.506030082702637, 12.082871437072754, 12.659712791442871, 13.236553192138672, 13.813394546508789, 14.390235900878906, 14.967077255249023, 15.54391860961914, 16.120759963989258, 16.697601318359375, 17.27444076538086, 17.851282119750977, 18.428123474121094, 19.00496482849121]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 5.0, 4.0, 9.0, 11.0, 11.0, 12.0, 16.0, 14.0, 13.0, 17.0, 21.0, 21.0, 30.0, 30.0, 33.0, 33.0, 31.0, 45.0, 42.0, 46.0, 45.0, 36.0, 36.0, 29.0, 43.0, 43.0, 34.0, 44.0, 28.0, 42.0, 21.0, 21.0, 17.0, 24.0, 11.0, 18.0, 13.0, 13.0, 10.0, 5.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.056640625, -1.9964141845703125, -1.936187744140625, -1.8759613037109375, -1.81573486328125, -1.7555084228515625, -1.695281982421875, -1.6350555419921875, -1.5748291015625, -1.5146026611328125, -1.454376220703125, -1.3941497802734375, -1.33392333984375, -1.2736968994140625, -1.213470458984375, -1.1532440185546875, -1.093017578125, -1.0327911376953125, -0.972564697265625, -0.9123382568359375, -0.85211181640625, -0.7918853759765625, -0.731658935546875, -0.6714324951171875, -0.6112060546875, -0.5509796142578125, -0.490753173828125, -0.4305267333984375, -0.37030029296875, -0.3100738525390625, -0.249847412109375, -0.1896209716796875, -0.12939453125, -0.0691680908203125, -0.008941650390625, 0.0512847900390625, 0.11151123046875, 0.1717376708984375, 0.231964111328125, 0.2921905517578125, 0.3524169921875, 0.4126434326171875, 0.472869873046875, 0.5330963134765625, 0.59332275390625, 0.6535491943359375, 0.713775634765625, 0.7740020751953125, 0.834228515625, 0.8944549560546875, 0.954681396484375, 1.0149078369140625, 1.07513427734375, 1.1353607177734375, 1.195587158203125, 1.2558135986328125, 1.3160400390625, 1.3762664794921875, 1.436492919921875, 1.4967193603515625, 1.55694580078125, 1.6171722412109375, 1.677398681640625, 1.7376251220703125, 1.7978515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 4.0, 9.0, 9.0, 10.0, 14.0, 25.0, 16.0, 33.0, 38.0, 53.0, 56.0, 76.0, 114.0, 136.0, 190.0, 239.0, 372.0, 667.0, 1309.0, 3744.0, 14348.0, 86752.0, 1009503.0, 2735835.0, 293498.0, 34926.0, 7347.0, 2291.0, 956.0, 499.0, 321.0, 226.0, 164.0, 107.0, 95.0, 63.0, 58.0, 55.0, 25.0, 16.0, 12.0, 14.0, 15.0, 8.0, 5.0, 4.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.296875, -7.0557861328125, -6.814697265625, -6.5736083984375, -6.33251953125, -6.0914306640625, -5.850341796875, -5.6092529296875, -5.3681640625, -5.1270751953125, -4.885986328125, -4.6448974609375, -4.40380859375, -4.1627197265625, -3.921630859375, -3.6805419921875, -3.439453125, -3.1983642578125, -2.957275390625, -2.7161865234375, -2.47509765625, -2.2340087890625, -1.992919921875, -1.7518310546875, -1.5107421875, -1.2696533203125, -1.028564453125, -0.7874755859375, -0.54638671875, -0.3052978515625, -0.064208984375, 0.1768798828125, 0.41796875, 0.6590576171875, 0.900146484375, 1.1412353515625, 1.38232421875, 1.6234130859375, 1.864501953125, 2.1055908203125, 2.3466796875, 2.5877685546875, 2.828857421875, 3.0699462890625, 3.31103515625, 3.5521240234375, 3.793212890625, 4.0343017578125, 4.275390625, 4.5164794921875, 4.757568359375, 4.9986572265625, 5.23974609375, 5.4808349609375, 5.721923828125, 5.9630126953125, 6.2041015625, 6.4451904296875, 6.686279296875, 6.9273681640625, 7.16845703125, 7.4095458984375, 7.650634765625, 7.8917236328125, 8.1328125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 16.0, 14.0, 27.0, 33.0, 58.0, 54.0, 119.0, 163.0, 187.0, 309.0, 424.0, 480.0, 552.0, 454.0, 335.0, 261.0, 173.0, 136.0, 82.0, 60.0, 33.0, 26.0, 23.0, 15.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.30743408203125, -7.0797119140625, -6.85198974609375, -6.624267578125, -6.39654541015625, -6.1688232421875, -5.94110107421875, -5.71337890625, -5.48565673828125, -5.2579345703125, -5.03021240234375, -4.802490234375, -4.57476806640625, -4.3470458984375, -4.11932373046875, -3.8916015625, -3.66387939453125, -3.4361572265625, -3.20843505859375, -2.980712890625, -2.75299072265625, -2.5252685546875, -2.29754638671875, -2.06982421875, -1.84210205078125, -1.6143798828125, -1.38665771484375, -1.158935546875, -0.93121337890625, -0.7034912109375, -0.47576904296875, -0.248046875, -0.02032470703125, 0.2073974609375, 0.43511962890625, 0.662841796875, 0.89056396484375, 1.1182861328125, 1.34600830078125, 1.57373046875, 1.80145263671875, 2.0291748046875, 2.25689697265625, 2.484619140625, 2.71234130859375, 2.9400634765625, 3.16778564453125, 3.3955078125, 3.62322998046875, 3.8509521484375, 4.07867431640625, 4.306396484375, 4.53411865234375, 4.7618408203125, 4.98956298828125, 5.21728515625, 5.44500732421875, 5.6727294921875, 5.90045166015625, 6.128173828125, 6.35589599609375, 6.5836181640625, 6.81134033203125, 7.0390625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 11.0, 17.0, 26.0, 39.0, 104.0, 139.0, 310.0, 635.0, 1623.0, 4740.0, 34518.0, 791175.0, 3156677.0, 186934.0, 12707.0, 2775.0, 987.0, 428.0, 201.0, 103.0, 64.0, 29.0, 15.0, 8.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8984375, -15.3902587890625, -14.882080078125, -14.3739013671875, -13.86572265625, -13.3575439453125, -12.849365234375, -12.3411865234375, -11.8330078125, -11.3248291015625, -10.816650390625, -10.3084716796875, -9.80029296875, -9.2921142578125, -8.783935546875, -8.2757568359375, -7.767578125, -7.2593994140625, -6.751220703125, -6.2430419921875, -5.73486328125, -5.2266845703125, -4.718505859375, -4.2103271484375, -3.7021484375, -3.1939697265625, -2.685791015625, -2.1776123046875, -1.66943359375, -1.1612548828125, -0.653076171875, -0.1448974609375, 0.36328125, 0.8714599609375, 1.379638671875, 1.8878173828125, 2.39599609375, 2.9041748046875, 3.412353515625, 3.9205322265625, 4.4287109375, 4.9368896484375, 5.445068359375, 5.9532470703125, 6.46142578125, 6.9696044921875, 7.477783203125, 7.9859619140625, 8.494140625, 9.0023193359375, 9.510498046875, 10.0186767578125, 10.52685546875, 11.0350341796875, 11.543212890625, 12.0513916015625, 12.5595703125, 13.0677490234375, 13.575927734375, 14.0841064453125, 14.59228515625, 15.1004638671875, 15.608642578125, 16.1168212890625, 16.625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 9.0, 185.0, 564.0, 234.0, 23.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.34942626953125, -60.21497344970703, -56.08051681518555, -51.94606399536133, -47.811607360839844, -43.677154541015625, -39.542701721191406, -35.40824890136719, -31.273792266845703, -27.13933753967285, -23.0048828125, -18.87042999267578, -14.73597526550293, -10.601520538330078, -6.467067718505859, -2.332612991333008, 1.8018417358398438, 5.936295986175537, 10.07075023651123, 14.205204010009766, 18.339658737182617, 22.47411346435547, 26.608566284179688, 30.74302101135254, 34.87747573852539, 39.01192855834961, 43.146385192871094, 47.28083801269531, 51.41529083251953, 55.549747467041016, 59.684200286865234, 63.81865692138672, 67.95310974121094, 72.08756256103516, 76.22201538085938, 80.35647583007812, 84.49092864990234, 88.62538146972656, 92.75983428955078, 96.894287109375, 101.02874755859375, 105.16320037841797, 109.29765319824219, 113.43211364746094, 117.56656646728516, 121.70101928710938, 125.8354721069336, 129.9699249267578, 134.1043701171875, 138.23883056640625, 142.37327575683594, 146.5077362060547, 150.64218139648438, 154.77664184570312, 158.91110229492188, 163.04554748535156, 167.1800079345703, 171.31446838378906, 175.44891357421875, 179.5833740234375, 183.7178192138672, 187.85227966308594, 191.98672485351562, 196.12118530273438, 200.25564575195312]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 10.0, 9.0, 10.0, 10.0, 12.0, 12.0, 16.0, 24.0, 25.0, 18.0, 21.0, 24.0, 28.0, 30.0, 21.0, 36.0, 35.0, 39.0, 33.0, 44.0, 34.0, 48.0, 46.0, 40.0, 38.0, 32.0, 37.0, 36.0, 23.0, 24.0, 29.0, 24.0, 24.0, 18.0, 17.0, 19.0, 15.0, 6.0, 11.0, 6.0, 7.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.43444061279297, -17.770204544067383, -17.105968475341797, -16.44173240661621, -15.777497291564941, -15.113261222839355, -14.449026107788086, -13.7847900390625, -13.120553970336914, -12.456317901611328, -11.792081832885742, -11.127846717834473, -10.463610649108887, -9.7993745803833, -9.135139465332031, -8.470903396606445, -7.806667327880859, -7.142431259155273, -6.478195667266846, -5.813960075378418, -5.149724006652832, -4.485487937927246, -3.8212523460388184, -3.1570167541503906, -2.4927806854248047, -1.8285448551177979, -1.164309024810791, -0.5000731945037842, 0.16416263580322266, 0.8283984661102295, 1.4926342964172363, 2.156869888305664, 2.82110595703125, 3.485341787338257, 4.149577617645264, 4.813813209533691, 5.478049278259277, 6.142285346984863, 6.806520938873291, 7.470756530761719, 8.134992599487305, 8.79922866821289, 9.463464736938477, 10.127699851989746, 10.791935920715332, 11.456171989440918, 12.120407104492188, 12.784643173217773, 13.44887924194336, 14.113115310668945, 14.777351379394531, 15.4415864944458, 16.105823516845703, 16.770057678222656, 17.434293746948242, 18.098529815673828, 18.762765884399414, 19.427001953125, 20.091238021850586, 20.755474090576172, 21.419708251953125, 22.08394432067871, 22.748180389404297, 23.412416458129883, 24.07665252685547]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 8.0, 5.0, 6.0, 7.0, 4.0, 13.0, 17.0, 19.0, 16.0, 17.0, 19.0, 24.0, 25.0, 30.0, 30.0, 36.0, 34.0, 42.0, 31.0, 49.0, 43.0, 36.0, 45.0, 40.0, 28.0, 34.0, 40.0, 43.0, 36.0, 33.0, 26.0, 27.0, 22.0, 17.0, 19.0, 15.0, 11.0, 12.0, 10.0, 12.0, 7.0, 4.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-2.1484375, -2.0880889892578125, -2.027740478515625, -1.9673919677734375, -1.90704345703125, -1.8466949462890625, -1.786346435546875, -1.7259979248046875, -1.6656494140625, -1.6053009033203125, -1.544952392578125, -1.4846038818359375, -1.42425537109375, -1.3639068603515625, -1.303558349609375, -1.2432098388671875, -1.182861328125, -1.1225128173828125, -1.062164306640625, -1.0018157958984375, -0.94146728515625, -0.8811187744140625, -0.820770263671875, -0.7604217529296875, -0.7000732421875, -0.6397247314453125, -0.579376220703125, -0.5190277099609375, -0.45867919921875, -0.3983306884765625, -0.337982177734375, -0.2776336669921875, -0.21728515625, -0.1569366455078125, -0.096588134765625, -0.0362396240234375, 0.02410888671875, 0.0844573974609375, 0.144805908203125, 0.2051544189453125, 0.2655029296875, 0.3258514404296875, 0.386199951171875, 0.4465484619140625, 0.50689697265625, 0.5672454833984375, 0.627593994140625, 0.6879425048828125, 0.748291015625, 0.8086395263671875, 0.868988037109375, 0.9293365478515625, 0.98968505859375, 1.0500335693359375, 1.110382080078125, 1.1707305908203125, 1.2310791015625, 1.2914276123046875, 1.351776123046875, 1.4121246337890625, 1.47247314453125, 1.5328216552734375, 1.593170166015625, 1.6535186767578125, 1.7138671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 3.0, 7.0, 13.0, 13.0, 16.0, 32.0, 52.0, 62.0, 116.0, 164.0, 247.0, 352.0, 591.0, 852.0, 1297.0, 1962.0, 3019.0, 4765.0, 7474.0, 12053.0, 18645.0, 29798.0, 46195.0, 72207.0, 108329.0, 150231.0, 174010.0, 139787.0, 97493.0, 64958.0, 41244.0, 26483.0, 16597.0, 10596.0, 6726.0, 4348.0, 2747.0, 1777.0, 1087.0, 755.0, 473.0, 312.0, 213.0, 152.0, 97.0, 70.0, 51.0, 23.0, 29.0, 10.0, 9.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.1514892578125, -0.14694976806640625, -0.1424102783203125, -0.13787078857421875, -0.133331298828125, -0.12879180908203125, -0.1242523193359375, -0.11971282958984375, -0.11517333984375, -0.11063385009765625, -0.1060943603515625, -0.10155487060546875, -0.097015380859375, -0.09247589111328125, -0.0879364013671875, -0.08339691162109375, -0.078857421875, -0.07431793212890625, -0.0697784423828125, -0.06523895263671875, -0.060699462890625, -0.05615997314453125, -0.0516204833984375, -0.04708099365234375, -0.04254150390625, -0.03800201416015625, -0.0334625244140625, -0.02892303466796875, -0.024383544921875, -0.01984405517578125, -0.0153045654296875, -0.01076507568359375, -0.0062255859375, -0.00168609619140625, 0.0028533935546875, 0.00739288330078125, 0.011932373046875, 0.01647186279296875, 0.0210113525390625, 0.02555084228515625, 0.03009033203125, 0.03462982177734375, 0.0391693115234375, 0.04370880126953125, 0.048248291015625, 0.05278778076171875, 0.0573272705078125, 0.06186676025390625, 0.06640625, 0.07094573974609375, 0.0754852294921875, 0.08002471923828125, 0.084564208984375, 0.08910369873046875, 0.0936431884765625, 0.09818267822265625, 0.10272216796875, 0.10726165771484375, 0.1118011474609375, 0.11634063720703125, 0.120880126953125, 0.12541961669921875, 0.1299591064453125, 0.13449859619140625, 0.1390380859375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 1.0, 6.0, 9.0, 7.0, 11.0, 11.0, 20.0, 14.0, 14.0, 22.0, 24.0, 27.0, 32.0, 31.0, 32.0, 26.0, 37.0, 41.0, 41.0, 46.0, 40.0, 1059.0, 41.0, 54.0, 41.0, 30.0, 41.0, 23.0, 23.0, 34.0, 24.0, 22.0, 22.0, 16.0, 8.0, 16.0, 15.0, 13.0, 12.0, 8.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.15234375, -1.1144866943359375, -1.076629638671875, -1.0387725830078125, -1.00091552734375, -0.9630584716796875, -0.925201416015625, -0.8873443603515625, -0.8494873046875, -0.8116302490234375, -0.773773193359375, -0.7359161376953125, -0.69805908203125, -0.6602020263671875, -0.622344970703125, -0.5844879150390625, -0.546630859375, -0.5087738037109375, -0.470916748046875, -0.4330596923828125, -0.39520263671875, -0.3573455810546875, -0.319488525390625, -0.2816314697265625, -0.2437744140625, -0.2059173583984375, -0.168060302734375, -0.1302032470703125, -0.09234619140625, -0.0544891357421875, -0.016632080078125, 0.0212249755859375, 0.05908203125, 0.0969390869140625, 0.134796142578125, 0.1726531982421875, 0.21051025390625, 0.2483673095703125, 0.286224365234375, 0.3240814208984375, 0.3619384765625, 0.3997955322265625, 0.437652587890625, 0.4755096435546875, 0.51336669921875, 0.5512237548828125, 0.589080810546875, 0.6269378662109375, 0.664794921875, 0.7026519775390625, 0.740509033203125, 0.7783660888671875, 0.81622314453125, 0.8540802001953125, 0.891937255859375, 0.9297943115234375, 0.9676513671875, 1.0055084228515625, 1.043365478515625, 1.0812225341796875, 1.11907958984375, 1.1569366455078125, 1.194793701171875, 1.2326507568359375, 1.2705078125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 8.0, 16.0, 23.0, 47.0, 49.0, 87.0, 121.0, 196.0, 259.0, 441.0, 663.0, 953.0, 1463.0, 2219.0, 3434.0, 5250.0, 8079.0, 12198.0, 18608.0, 28453.0, 42461.0, 62764.0, 89319.0, 121533.0, 962313.0, 359881.0, 115088.0, 84708.0, 59468.0, 39972.0, 26812.0, 17309.0, 11500.0, 7359.0, 4858.0, 3186.0, 2015.0, 1292.0, 913.0, 601.0, 376.0, 237.0, 185.0, 145.0, 97.0, 59.0, 34.0, 22.0, 26.0, 13.0, 8.0, 7.0, 2.0, 2.0], "bins": [-0.09521484375, -0.09248828887939453, -0.08976173400878906, -0.0870351791381836, -0.08430862426757812, -0.08158206939697266, -0.07885551452636719, -0.07612895965576172, -0.07340240478515625, -0.07067584991455078, -0.06794929504394531, -0.06522274017333984, -0.062496185302734375, -0.059769630432128906, -0.05704307556152344, -0.05431652069091797, -0.0515899658203125, -0.04886341094970703, -0.04613685607910156, -0.043410301208496094, -0.040683746337890625, -0.037957191467285156, -0.03523063659667969, -0.03250408172607422, -0.02977752685546875, -0.02705097198486328, -0.024324417114257812, -0.021597862243652344, -0.018871307373046875, -0.016144752502441406, -0.013418197631835938, -0.010691642761230469, -0.007965087890625, -0.005238533020019531, -0.0025119781494140625, 0.00021457672119140625, 0.002941131591796875, 0.005667686462402344, 0.008394241333007812, 0.011120796203613281, 0.01384735107421875, 0.01657390594482422, 0.019300460815429688, 0.022027015686035156, 0.024753570556640625, 0.027480125427246094, 0.030206680297851562, 0.03293323516845703, 0.0356597900390625, 0.03838634490966797, 0.04111289978027344, 0.043839454650878906, 0.046566009521484375, 0.049292564392089844, 0.05201911926269531, 0.05474567413330078, 0.05747222900390625, 0.06019878387451172, 0.06292533874511719, 0.06565189361572266, 0.06837844848632812, 0.0711050033569336, 0.07383155822753906, 0.07655811309814453, 0.07928466796875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 8.0, 6.0, 6.0, 6.0, 6.0, 7.0, 12.0, 24.0, 33.0, 29.0, 46.0, 59.0, 115.0, 113.0, 113.0, 104.0, 94.0, 41.0, 51.0, 27.0, 27.0, 21.0, 13.0, 6.0, 6.0, 5.0, 6.0, 4.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009185791015625, -0.008950889110565186, -0.008715987205505371, -0.008481085300445557, -0.008246183395385742, -0.008011281490325928, -0.007776379585266113, -0.007541477680206299, -0.007306575775146484, -0.00707167387008667, -0.0068367719650268555, -0.006601870059967041, -0.0063669681549072266, -0.006132066249847412, -0.005897164344787598, -0.005662262439727783, -0.005427360534667969, -0.005192458629608154, -0.00495755672454834, -0.004722654819488525, -0.004487752914428711, -0.0042528510093688965, -0.004017949104309082, -0.0037830471992492676, -0.003548145294189453, -0.0033132433891296387, -0.0030783414840698242, -0.0028434395790100098, -0.0026085376739501953, -0.002373635768890381, -0.0021387338638305664, -0.001903831958770752, -0.0016689300537109375, -0.001434028148651123, -0.0011991262435913086, -0.0009642243385314941, -0.0007293224334716797, -0.0004944205284118652, -0.0002595186233520508, -2.4616718292236328e-05, 0.00021028518676757812, 0.0004451870918273926, 0.000680088996887207, 0.0009149909019470215, 0.001149892807006836, 0.0013847947120666504, 0.0016196966171264648, 0.0018545985221862793, 0.0020895004272460938, 0.002324402332305908, 0.0025593042373657227, 0.002794206142425537, 0.0030291080474853516, 0.003264009952545166, 0.0034989118576049805, 0.003733813762664795, 0.003968715667724609, 0.004203617572784424, 0.004438519477844238, 0.004673421382904053, 0.004908323287963867, 0.005143225193023682, 0.005378127098083496, 0.0056130290031433105, 0.005847930908203125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 7.0, 5.0, 3.0, 7.0, 4.0, 13.0, 11.0, 22.0, 24.0, 23.0, 31.0, 46.0, 71.0, 97.0, 189.0, 408.0, 1771.0, 1042453.0, 2436.0, 405.0, 187.0, 98.0, 62.0, 44.0, 42.0, 17.0, 14.0, 13.0, 11.0, 7.0, 13.0, 6.0, 1.0, 6.0, 1.0, 0.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138916015625, -0.1336822509765625, -0.128448486328125, -0.1232147216796875, -0.11798095703125, -0.1127471923828125, -0.107513427734375, -0.1022796630859375, -0.0970458984375, -0.0918121337890625, -0.086578369140625, -0.0813446044921875, -0.07611083984375, -0.0708770751953125, -0.065643310546875, -0.0604095458984375, -0.05517578125, -0.0499420166015625, -0.044708251953125, -0.0394744873046875, -0.03424072265625, -0.0290069580078125, -0.023773193359375, -0.0185394287109375, -0.0133056640625, -0.0080718994140625, -0.002838134765625, 0.0023956298828125, 0.00762939453125, 0.0128631591796875, 0.018096923828125, 0.0233306884765625, 0.028564453125, 0.0337982177734375, 0.039031982421875, 0.0442657470703125, 0.04949951171875, 0.0547332763671875, 0.059967041015625, 0.0652008056640625, 0.0704345703125, 0.0756683349609375, 0.080902099609375, 0.0861358642578125, 0.09136962890625, 0.0966033935546875, 0.101837158203125, 0.1070709228515625, 0.1123046875, 0.1175384521484375, 0.122772216796875, 0.1280059814453125, 0.13323974609375, 0.1384735107421875, 0.143707275390625, 0.1489410400390625, 0.1541748046875, 0.1594085693359375, 0.164642333984375, 0.1698760986328125, 0.17510986328125, 0.1803436279296875, 0.185577392578125, 0.1908111572265625, 0.196044921875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1009.0, 7.0, 0.0, 0.0, 1.0], "bins": [-0.2553044557571411, -0.2510179281234741, -0.24673143029212952, -0.24244491755962372, -0.23815840482711792, -0.23387187719345093, -0.22958537936210632, -0.22529885172843933, -0.22101233899593353, -0.21672582626342773, -0.21243931353092194, -0.20815280079841614, -0.20386628806591034, -0.19957977533340454, -0.19529324769973755, -0.19100673496723175, -0.18672022223472595, -0.18243370950222015, -0.17814719676971436, -0.17386068403720856, -0.16957417130470276, -0.16528764367103577, -0.16100114583969116, -0.15671461820602417, -0.15242812037467957, -0.14814160764217377, -0.14385509490966797, -0.13956858217716217, -0.13528206944465637, -0.13099554181098938, -0.12670904397964478, -0.12242252379655838, -0.11813601106405258, -0.11384949833154678, -0.10956298559904099, -0.10527646541595459, -0.10098995268344879, -0.096703439950943, -0.0924169272184372, -0.0881304144859314, -0.0838439017534256, -0.0795573890209198, -0.075270876288414, -0.0709843635559082, -0.06669784337282181, -0.06241133064031601, -0.05812481790781021, -0.05383830517530441, -0.04955178499221802, -0.04526527225971222, -0.04097875580191612, -0.036692243069410324, -0.03240572661161423, -0.02811921387910843, -0.02383270114660263, -0.019546186551451683, -0.015259671956300735, -0.010973157361149788, -0.006686643697321415, -0.002400130033493042, 0.0018863845616579056, 0.006172899156808853, 0.010459411889314651, 0.014745926484465599, 0.019032441079616547]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 10.0, 12.0, 12.0, 25.0, 23.0, 35.0, 47.0, 40.0, 46.0, 68.0, 62.0, 58.0, 67.0, 57.0, 51.0, 50.0, 48.0, 45.0, 41.0, 24.0, 29.0, 32.0, 28.0, 16.0, 23.0, 14.0, 9.0, 11.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005879044532775879, -0.005641903728246689, -0.005404762923717499, -0.005167622119188309, -0.004930481314659119, -0.004693340510129929, -0.0044561997056007385, -0.0042190589010715485, -0.003981918096542358, -0.0037447772920131683, -0.0035076364874839783, -0.003270495682954788, -0.003033354878425598, -0.002796214073896408, -0.002559073269367218, -0.002321932464838028, -0.002084791660308838, -0.0018476508557796478, -0.0016105100512504578, -0.0013733692467212677, -0.0011362284421920776, -0.0008990876376628876, -0.0006619468331336975, -0.00042480602860450745, -0.00018766522407531738, 4.947558045387268e-05, 0.00028661638498306274, 0.0005237571895122528, 0.0007608979940414429, 0.000998038798570633, 0.001235179603099823, 0.001472320407629013, 0.0017094612121582031, 0.0019466020166873932, 0.0021837428212165833, 0.0024208836257457733, 0.0026580244302749634, 0.0028951652348041534, 0.0031323060393333435, 0.0033694468438625336, 0.0036065876483917236, 0.0038437284529209137, 0.004080869257450104, 0.004318010061979294, 0.004555150866508484, 0.004792291671037674, 0.005029432475566864, 0.005266573280096054, 0.005503714084625244, 0.005740854889154434, 0.005977995693683624, 0.006215136498212814, 0.006452277302742004, 0.0066894181072711945, 0.0069265589118003845, 0.007163699716329575, 0.007400840520858765, 0.007637981325387955, 0.007875122129917145, 0.008112262934446335, 0.008349403738975525, 0.008586544543504715, 0.008823685348033905, 0.009060826152563095, 0.009297966957092285]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 8.0, 5.0, 6.0, 7.0, 4.0, 13.0, 17.0, 19.0, 16.0, 17.0, 19.0, 24.0, 25.0, 30.0, 30.0, 36.0, 34.0, 42.0, 31.0, 49.0, 43.0, 36.0, 45.0, 40.0, 28.0, 34.0, 41.0, 42.0, 36.0, 33.0, 26.0, 27.0, 22.0, 17.0, 19.0, 15.0, 11.0, 12.0, 10.0, 12.0, 7.0, 4.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-2.1484375, -2.0880889892578125, -2.027740478515625, -1.9673919677734375, -1.90704345703125, -1.8466949462890625, -1.786346435546875, -1.7259979248046875, -1.6656494140625, -1.6053009033203125, -1.544952392578125, -1.4846038818359375, -1.42425537109375, -1.3639068603515625, -1.303558349609375, -1.2432098388671875, -1.182861328125, -1.1225128173828125, -1.062164306640625, -1.0018157958984375, -0.94146728515625, -0.8811187744140625, -0.820770263671875, -0.7604217529296875, -0.7000732421875, -0.6397247314453125, -0.579376220703125, -0.5190277099609375, -0.45867919921875, -0.3983306884765625, -0.337982177734375, -0.2776336669921875, -0.21728515625, -0.1569366455078125, -0.096588134765625, -0.0362396240234375, 0.02410888671875, 0.0844573974609375, 0.144805908203125, 0.2051544189453125, 0.2655029296875, 0.3258514404296875, 0.386199951171875, 0.4465484619140625, 0.50689697265625, 0.5672454833984375, 0.627593994140625, 0.6879425048828125, 0.748291015625, 0.8086395263671875, 0.868988037109375, 0.9293365478515625, 0.98968505859375, 1.0500335693359375, 1.110382080078125, 1.1707305908203125, 1.2310791015625, 1.2914276123046875, 1.351776123046875, 1.4121246337890625, 1.47247314453125, 1.5328216552734375, 1.593170166015625, 1.6535186767578125, 1.7138671875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 15.0, 6.0, 10.0, 25.0, 31.0, 34.0, 38.0, 69.0, 95.0, 142.0, 190.0, 308.0, 444.0, 690.0, 1130.0, 2149.0, 4236.0, 9189.0, 20676.0, 47248.0, 108628.0, 219055.0, 288835.0, 186593.0, 88453.0, 38236.0, 16556.0, 7320.0, 3550.0, 1757.0, 1008.0, 633.0, 395.0, 256.0, 164.0, 109.0, 73.0, 56.0, 44.0, 36.0, 25.0, 21.0, 7.0, 10.0, 3.0, 5.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0], "bins": [-2.39453125, -2.324859619140625, -2.25518798828125, -2.185516357421875, -2.1158447265625, -2.046173095703125, -1.97650146484375, -1.906829833984375, -1.837158203125, -1.767486572265625, -1.69781494140625, -1.628143310546875, -1.5584716796875, -1.488800048828125, -1.41912841796875, -1.349456787109375, -1.27978515625, -1.210113525390625, -1.14044189453125, -1.070770263671875, -1.0010986328125, -0.931427001953125, -0.86175537109375, -0.792083740234375, -0.722412109375, -0.652740478515625, -0.58306884765625, -0.513397216796875, -0.4437255859375, -0.374053955078125, -0.30438232421875, -0.234710693359375, -0.1650390625, -0.095367431640625, -0.02569580078125, 0.043975830078125, 0.1136474609375, 0.183319091796875, 0.25299072265625, 0.322662353515625, 0.392333984375, 0.462005615234375, 0.53167724609375, 0.601348876953125, 0.6710205078125, 0.740692138671875, 0.81036376953125, 0.880035400390625, 0.94970703125, 1.019378662109375, 1.08905029296875, 1.158721923828125, 1.2283935546875, 1.298065185546875, 1.36773681640625, 1.437408447265625, 1.507080078125, 1.576751708984375, 1.64642333984375, 1.716094970703125, 1.7857666015625, 1.855438232421875, 1.92510986328125, 1.994781494140625, 2.064453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 13.0, 11.0, 15.0, 17.0, 17.0, 22.0, 23.0, 31.0, 28.0, 43.0, 37.0, 55.0, 71.0, 99.0, 145.0, 236.0, 1339.0, 218.0, 125.0, 86.0, 56.0, 40.0, 39.0, 42.0, 31.0, 30.0, 17.0, 27.0, 21.0, 11.0, 20.0, 8.0, 16.0, 7.0, 8.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.8671875, -6.6549072265625, -6.442626953125, -6.2303466796875, -6.01806640625, -5.8057861328125, -5.593505859375, -5.3812255859375, -5.1689453125, -4.9566650390625, -4.744384765625, -4.5321044921875, -4.31982421875, -4.1075439453125, -3.895263671875, -3.6829833984375, -3.470703125, -3.2584228515625, -3.046142578125, -2.8338623046875, -2.62158203125, -2.4093017578125, -2.197021484375, -1.9847412109375, -1.7724609375, -1.5601806640625, -1.347900390625, -1.1356201171875, -0.92333984375, -0.7110595703125, -0.498779296875, -0.2864990234375, -0.07421875, 0.1380615234375, 0.350341796875, 0.5626220703125, 0.77490234375, 0.9871826171875, 1.199462890625, 1.4117431640625, 1.6240234375, 1.8363037109375, 2.048583984375, 2.2608642578125, 2.47314453125, 2.6854248046875, 2.897705078125, 3.1099853515625, 3.322265625, 3.5345458984375, 3.746826171875, 3.9591064453125, 4.17138671875, 4.3836669921875, 4.595947265625, 4.8082275390625, 5.0205078125, 5.2327880859375, 5.445068359375, 5.6573486328125, 5.86962890625, 6.0819091796875, 6.294189453125, 6.5064697265625, 6.71875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 9.0, 12.0, 5.0, 23.0, 10.0, 20.0, 16.0, 38.0, 40.0, 49.0, 53.0, 81.0, 146.0, 239.0, 440.0, 1196.0, 5456.0, 161564.0, 2896274.0, 74126.0, 3914.0, 931.0, 372.0, 201.0, 114.0, 64.0, 64.0, 51.0, 47.0, 24.0, 17.0, 21.0, 11.0, 14.0, 13.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-14.0, -13.568115234375, -13.13623046875, -12.704345703125, -12.2724609375, -11.840576171875, -11.40869140625, -10.976806640625, -10.544921875, -10.113037109375, -9.68115234375, -9.249267578125, -8.8173828125, -8.385498046875, -7.95361328125, -7.521728515625, -7.08984375, -6.657958984375, -6.22607421875, -5.794189453125, -5.3623046875, -4.930419921875, -4.49853515625, -4.066650390625, -3.634765625, -3.202880859375, -2.77099609375, -2.339111328125, -1.9072265625, -1.475341796875, -1.04345703125, -0.611572265625, -0.1796875, 0.252197265625, 0.68408203125, 1.115966796875, 1.5478515625, 1.979736328125, 2.41162109375, 2.843505859375, 3.275390625, 3.707275390625, 4.13916015625, 4.571044921875, 5.0029296875, 5.434814453125, 5.86669921875, 6.298583984375, 6.73046875, 7.162353515625, 7.59423828125, 8.026123046875, 8.4580078125, 8.889892578125, 9.32177734375, 9.753662109375, 10.185546875, 10.617431640625, 11.04931640625, 11.481201171875, 11.9130859375, 12.344970703125, 12.77685546875, 13.208740234375, 13.640625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 12.0, 333.0, 617.0, 51.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.640289306640625, -40.293643951416016, -37.946998596191406, -35.60034942626953, -33.25370407104492, -30.907058715820312, -28.56041145324707, -26.213764190673828, -23.86711883544922, -21.52047348022461, -19.173826217651367, -16.827178955078125, -14.480533599853516, -12.13388729095459, -9.787240982055664, -7.440593719482422, -5.0939483642578125, -2.7473020553588867, -0.40065574645996094, 1.9459905624389648, 4.292636871337891, 6.639283180236816, 8.985929489135742, 11.332576751708984, 13.679222106933594, 16.025867462158203, 18.372514724731445, 20.719161987304688, 23.065807342529297, 25.412452697753906, 27.75909996032715, 30.10574722290039, 32.452392578125, 34.79903793334961, 37.14568328857422, 39.492332458496094, 41.8389778137207, 44.18562316894531, 46.53227233886719, 48.8789176940918, 51.225563049316406, 53.572208404541016, 55.918853759765625, 58.2655029296875, 60.61214828491211, 62.95879364013672, 65.3054428100586, 67.65208435058594, 69.99873352050781, 72.34538269042969, 74.69202423095703, 77.0386734008789, 79.38531494140625, 81.73196411132812, 84.07861328125, 86.42526245117188, 88.77190399169922, 91.1185531616211, 93.46519470214844, 95.81184387207031, 98.15849304199219, 100.50513458251953, 102.8517837524414, 105.19842529296875, 107.54507446289062]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 6.0, 5.0, 5.0, 12.0, 9.0, 14.0, 12.0, 20.0, 20.0, 20.0, 20.0, 33.0, 31.0, 28.0, 41.0, 28.0, 36.0, 34.0, 44.0, 34.0, 41.0, 43.0, 39.0, 50.0, 38.0, 37.0, 35.0, 35.0, 31.0, 34.0, 24.0, 18.0, 20.0, 18.0, 21.0, 10.0, 10.0, 4.0, 6.0, 12.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.50856590270996, -22.797746658325195, -22.086929321289062, -21.376110076904297, -20.665292739868164, -19.9544734954834, -19.243656158447266, -18.5328369140625, -17.822017669677734, -17.11119842529297, -16.400381088256836, -15.68956184387207, -14.978744506835938, -14.267925262451172, -13.557106971740723, -12.846288681030273, -12.13547134399414, -11.424653053283691, -10.713834762573242, -10.003015518188477, -9.292198181152344, -8.581378936767578, -7.870560646057129, -7.15974235534668, -6.4489240646362305, -5.738105773925781, -5.027287483215332, -4.316468715667725, -3.6056504249572754, -2.894832134246826, -2.1840133666992188, -1.4731950759887695, -0.7623748779296875, -0.05155646800994873, 0.65926194190979, 1.3700804710388184, 2.0808987617492676, 2.791717052459717, 3.502535820007324, 4.213354110717773, 4.924172401428223, 5.634990692138672, 6.345808982849121, 7.0566277503967285, 7.767446041107178, 8.478263854980469, 9.189083099365234, 9.899901390075684, 10.610719680786133, 11.321537971496582, 12.032356262207031, 12.743175506591797, 13.45399284362793, 14.164812088012695, 14.875630378723145, 15.586448669433594, 16.29726791381836, 17.008087158203125, 17.718904495239258, 18.429723739624023, 19.140541076660156, 19.851360321044922, 20.562179565429688, 21.27299690246582, 21.983814239501953]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 5.0, 8.0, 14.0, 15.0, 15.0, 15.0, 26.0, 25.0, 14.0, 32.0, 22.0, 47.0, 25.0, 33.0, 42.0, 42.0, 39.0, 52.0, 39.0, 38.0, 43.0, 38.0, 33.0, 40.0, 27.0, 38.0, 36.0, 28.0, 22.0, 24.0, 17.0, 15.0, 21.0, 12.0, 8.0, 12.0, 9.0, 11.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2265625, -2.1622314453125, -2.097900390625, -2.0335693359375, -1.96923828125, -1.9049072265625, -1.840576171875, -1.7762451171875, -1.7119140625, -1.6475830078125, -1.583251953125, -1.5189208984375, -1.45458984375, -1.3902587890625, -1.325927734375, -1.2615966796875, -1.197265625, -1.1329345703125, -1.068603515625, -1.0042724609375, -0.93994140625, -0.8756103515625, -0.811279296875, -0.7469482421875, -0.6826171875, -0.6182861328125, -0.553955078125, -0.4896240234375, -0.42529296875, -0.3609619140625, -0.296630859375, -0.2322998046875, -0.16796875, -0.1036376953125, -0.039306640625, 0.0250244140625, 0.08935546875, 0.1536865234375, 0.218017578125, 0.2823486328125, 0.3466796875, 0.4110107421875, 0.475341796875, 0.5396728515625, 0.60400390625, 0.6683349609375, 0.732666015625, 0.7969970703125, 0.861328125, 0.9256591796875, 0.989990234375, 1.0543212890625, 1.11865234375, 1.1829833984375, 1.247314453125, 1.3116455078125, 1.3759765625, 1.4403076171875, 1.504638671875, 1.5689697265625, 1.63330078125, 1.6976318359375, 1.761962890625, 1.8262939453125, 1.890625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 10.0, 1.0, 9.0, 4.0, 10.0, 10.0, 7.0, 15.0, 22.0, 27.0, 31.0, 42.0, 42.0, 53.0, 63.0, 90.0, 101.0, 177.0, 360.0, 729.0, 1995.0, 7463.0, 34270.0, 219243.0, 1903308.0, 1781364.0, 201846.0, 32184.0, 6980.0, 1997.0, 763.0, 317.0, 191.0, 128.0, 74.0, 52.0, 58.0, 38.0, 43.0, 36.0, 30.0, 20.0, 17.0, 12.0, 13.0, 8.0, 7.0, 4.0, 8.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0], "bins": [-6.97265625, -6.7674560546875, -6.562255859375, -6.3570556640625, -6.15185546875, -5.9466552734375, -5.741455078125, -5.5362548828125, -5.3310546875, -5.1258544921875, -4.920654296875, -4.7154541015625, -4.51025390625, -4.3050537109375, -4.099853515625, -3.8946533203125, -3.689453125, -3.4842529296875, -3.279052734375, -3.0738525390625, -2.86865234375, -2.6634521484375, -2.458251953125, -2.2530517578125, -2.0478515625, -1.8426513671875, -1.637451171875, -1.4322509765625, -1.22705078125, -1.0218505859375, -0.816650390625, -0.6114501953125, -0.40625, -0.2010498046875, 0.004150390625, 0.2093505859375, 0.41455078125, 0.6197509765625, 0.824951171875, 1.0301513671875, 1.2353515625, 1.4405517578125, 1.645751953125, 1.8509521484375, 2.05615234375, 2.2613525390625, 2.466552734375, 2.6717529296875, 2.876953125, 3.0821533203125, 3.287353515625, 3.4925537109375, 3.69775390625, 3.9029541015625, 4.108154296875, 4.3133544921875, 4.5185546875, 4.7237548828125, 4.928955078125, 5.1341552734375, 5.33935546875, 5.5445556640625, 5.749755859375, 5.9549560546875, 6.16015625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 10.0, 10.0, 6.0, 24.0, 16.0, 40.0, 43.0, 59.0, 81.0, 151.0, 188.0, 267.0, 393.0, 422.0, 487.0, 475.0, 354.0, 300.0, 234.0, 151.0, 116.0, 72.0, 56.0, 33.0, 24.0, 16.0, 16.0, 7.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.41796875, -7.203857421875, -6.98974609375, -6.775634765625, -6.5615234375, -6.347412109375, -6.13330078125, -5.919189453125, -5.705078125, -5.490966796875, -5.27685546875, -5.062744140625, -4.8486328125, -4.634521484375, -4.42041015625, -4.206298828125, -3.9921875, -3.778076171875, -3.56396484375, -3.349853515625, -3.1357421875, -2.921630859375, -2.70751953125, -2.493408203125, -2.279296875, -2.065185546875, -1.85107421875, -1.636962890625, -1.4228515625, -1.208740234375, -0.99462890625, -0.780517578125, -0.56640625, -0.352294921875, -0.13818359375, 0.075927734375, 0.2900390625, 0.504150390625, 0.71826171875, 0.932373046875, 1.146484375, 1.360595703125, 1.57470703125, 1.788818359375, 2.0029296875, 2.217041015625, 2.43115234375, 2.645263671875, 2.859375, 3.073486328125, 3.28759765625, 3.501708984375, 3.7158203125, 3.929931640625, 4.14404296875, 4.358154296875, 4.572265625, 4.786376953125, 5.00048828125, 5.214599609375, 5.4287109375, 5.642822265625, 5.85693359375, 6.071044921875, 6.28515625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 1.0, 8.0, 6.0, 13.0, 21.0, 41.0, 63.0, 83.0, 129.0, 237.0, 445.0, 951.0, 2098.0, 6399.0, 28303.0, 163798.0, 1136871.0, 2321547.0, 445705.0, 67888.0, 13294.0, 3548.0, 1405.0, 647.0, 314.0, 166.0, 96.0, 78.0, 35.0, 26.0, 21.0, 8.0, 7.0, 6.0, 10.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.75, -9.44775390625, -9.1455078125, -8.84326171875, -8.541015625, -8.23876953125, -7.9365234375, -7.63427734375, -7.33203125, -7.02978515625, -6.7275390625, -6.42529296875, -6.123046875, -5.82080078125, -5.5185546875, -5.21630859375, -4.9140625, -4.61181640625, -4.3095703125, -4.00732421875, -3.705078125, -3.40283203125, -3.1005859375, -2.79833984375, -2.49609375, -2.19384765625, -1.8916015625, -1.58935546875, -1.287109375, -0.98486328125, -0.6826171875, -0.38037109375, -0.078125, 0.22412109375, 0.5263671875, 0.82861328125, 1.130859375, 1.43310546875, 1.7353515625, 2.03759765625, 2.33984375, 2.64208984375, 2.9443359375, 3.24658203125, 3.548828125, 3.85107421875, 4.1533203125, 4.45556640625, 4.7578125, 5.06005859375, 5.3623046875, 5.66455078125, 5.966796875, 6.26904296875, 6.5712890625, 6.87353515625, 7.17578125, 7.47802734375, 7.7802734375, 8.08251953125, 8.384765625, 8.68701171875, 8.9892578125, 9.29150390625, 9.59375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 25.0, 98.0, 258.0, 326.0, 219.0, 72.0, 13.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.46650695800781, -58.83403778076172, -56.201568603515625, -53.569095611572266, -50.93662643432617, -48.30415725708008, -45.67168426513672, -43.039215087890625, -40.40674591064453, -37.77427673339844, -35.141807556152344, -32.509334564208984, -29.87686538696289, -27.244396209716797, -24.61192512512207, -21.979454040527344, -19.34698486328125, -16.714515686035156, -14.08204460144043, -11.44957447052002, -8.81710433959961, -6.184634208679199, -3.552164077758789, -0.9196929931640625, 1.7127761840820312, 4.345246315002441, 6.977716445922852, 9.610186576843262, 12.242656707763672, 14.875126838684082, 17.507596969604492, 20.14006805419922, 22.77252960205078, 25.404998779296875, 28.0374698638916, 30.669940948486328, 33.30241012573242, 35.934879302978516, 38.567352294921875, 41.19982147216797, 43.83229064941406, 46.464759826660156, 49.09722900390625, 51.72970199584961, 54.3621711730957, 56.9946403503418, 59.627113342285156, 62.25958251953125, 64.89205169677734, 67.52452087402344, 70.15699005126953, 72.78945922851562, 75.42193603515625, 78.05440521240234, 80.68687438964844, 83.31934356689453, 85.95181274414062, 88.58428192138672, 91.21675109863281, 93.8492202758789, 96.481689453125, 99.11416625976562, 101.74663543701172, 104.37910461425781, 107.0115737915039]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 6.0, 4.0, 10.0, 12.0, 9.0, 12.0, 26.0, 20.0, 20.0, 31.0, 21.0, 16.0, 31.0, 37.0, 38.0, 48.0, 32.0, 33.0, 41.0, 48.0, 33.0, 35.0, 59.0, 49.0, 40.0, 31.0, 42.0, 42.0, 25.0, 24.0, 31.0, 24.0, 12.0, 13.0, 10.0, 10.0, 7.0, 5.0, 8.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.72806739807129, -19.070178985595703, -18.412290573120117, -17.75440216064453, -17.096513748168945, -16.43862533569336, -15.78073787689209, -15.122849464416504, -14.464961051940918, -13.807072639465332, -13.149184226989746, -12.49129581451416, -11.83340835571289, -11.175519943237305, -10.517631530761719, -9.859743118286133, -9.201854705810547, -8.543966293334961, -7.886077880859375, -7.228189945220947, -6.570301532745361, -5.912413120269775, -5.254525184631348, -4.596636772155762, -3.938748359680176, -3.28085994720459, -2.622971773147583, -1.9650834798812866, -1.3071951866149902, -0.6493067741394043, 0.008581399917602539, 0.6664695739746094, 1.3243560791015625, 1.9822443723678589, 2.6401326656341553, 3.298020839691162, 3.955909252166748, 4.613797664642334, 5.271685600280762, 5.929574012756348, 6.587462425231934, 7.2453508377075195, 7.9032392501831055, 8.561127662658691, 9.219015121459961, 9.876903533935547, 10.534791946411133, 11.192680358886719, 11.850568771362305, 12.50845718383789, 13.166345596313477, 13.824234008789062, 14.482122421264648, 15.140010833740234, 15.797898292541504, 16.455787658691406, 17.11367416381836, 17.771562576293945, 18.42945098876953, 19.087339401245117, 19.745227813720703, 20.40311622619629, 21.061004638671875, 21.718891143798828, 22.376781463623047]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 4.0, 4.0, 4.0, 7.0, 12.0, 11.0, 12.0, 18.0, 17.0, 21.0, 21.0, 25.0, 31.0, 30.0, 31.0, 22.0, 31.0, 34.0, 36.0, 41.0, 28.0, 34.0, 37.0, 40.0, 38.0, 43.0, 40.0, 28.0, 37.0, 37.0, 28.0, 30.0, 20.0, 26.0, 20.0, 17.0, 12.0, 15.0, 9.0, 7.0, 10.0, 3.0, 14.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-2.142578125, -2.08154296875, -2.0205078125, -1.95947265625, -1.8984375, -1.83740234375, -1.7763671875, -1.71533203125, -1.654296875, -1.59326171875, -1.5322265625, -1.47119140625, -1.41015625, -1.34912109375, -1.2880859375, -1.22705078125, -1.166015625, -1.10498046875, -1.0439453125, -0.98291015625, -0.921875, -0.86083984375, -0.7998046875, -0.73876953125, -0.677734375, -0.61669921875, -0.5556640625, -0.49462890625, -0.43359375, -0.37255859375, -0.3115234375, -0.25048828125, -0.189453125, -0.12841796875, -0.0673828125, -0.00634765625, 0.0546875, 0.11572265625, 0.1767578125, 0.23779296875, 0.298828125, 0.35986328125, 0.4208984375, 0.48193359375, 0.54296875, 0.60400390625, 0.6650390625, 0.72607421875, 0.787109375, 0.84814453125, 0.9091796875, 0.97021484375, 1.03125, 1.09228515625, 1.1533203125, 1.21435546875, 1.275390625, 1.33642578125, 1.3974609375, 1.45849609375, 1.51953125, 1.58056640625, 1.6416015625, 1.70263671875, 1.763671875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 19.0, 33.0, 23.0, 50.0, 61.0, 95.0, 125.0, 183.0, 289.0, 403.0, 570.0, 909.0, 1426.0, 2156.0, 3420.0, 5263.0, 8540.0, 13568.0, 21859.0, 35456.0, 58108.0, 93199.0, 141067.0, 185834.0, 165895.0, 115909.0, 73661.0, 45489.0, 27867.0, 17350.0, 10715.0, 6789.0, 4159.0, 2723.0, 1798.0, 1135.0, 759.0, 541.0, 333.0, 220.0, 153.0, 117.0, 78.0, 50.0, 41.0, 27.0, 17.0, 15.0, 13.0, 9.0, 7.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.1781005859375, -0.17266273498535156, -0.16722488403320312, -0.1617870330810547, -0.15634918212890625, -0.1509113311767578, -0.14547348022460938, -0.14003562927246094, -0.1345977783203125, -0.12915992736816406, -0.12372207641601562, -0.11828422546386719, -0.11284637451171875, -0.10740852355957031, -0.10197067260742188, -0.09653282165527344, -0.091094970703125, -0.08565711975097656, -0.08021926879882812, -0.07478141784667969, -0.06934356689453125, -0.06390571594238281, -0.058467864990234375, -0.05303001403808594, -0.0475921630859375, -0.04215431213378906, -0.036716461181640625, -0.03127861022949219, -0.02584075927734375, -0.020402908325195312, -0.014965057373046875, -0.009527206420898438, -0.00408935546875, 0.0013484954833984375, 0.006786346435546875, 0.012224197387695312, 0.01766204833984375, 0.023099899291992188, 0.028537750244140625, 0.03397560119628906, 0.0394134521484375, 0.04485130310058594, 0.050289154052734375, 0.05572700500488281, 0.06116485595703125, 0.06660270690917969, 0.07204055786132812, 0.07747840881347656, 0.082916259765625, 0.08835411071777344, 0.09379196166992188, 0.09922981262207031, 0.10466766357421875, 0.11010551452636719, 0.11554336547851562, 0.12098121643066406, 0.1264190673828125, 0.13185691833496094, 0.13729476928710938, 0.1427326202392578, 0.14817047119140625, 0.1536083221435547, 0.15904617309570312, 0.16448402404785156, 0.169921875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 0.0, 7.0, 5.0, 9.0, 3.0, 15.0, 11.0, 14.0, 13.0, 17.0, 21.0, 18.0, 21.0, 30.0, 38.0, 24.0, 33.0, 38.0, 37.0, 33.0, 35.0, 35.0, 1067.0, 39.0, 43.0, 43.0, 33.0, 30.0, 39.0, 20.0, 34.0, 27.0, 28.0, 28.0, 16.0, 25.0, 22.0, 10.0, 9.0, 10.0, 7.0, 14.0, 4.0, 7.0, 2.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.3251953125, -1.285980224609375, -1.24676513671875, -1.207550048828125, -1.1683349609375, -1.129119873046875, -1.08990478515625, -1.050689697265625, -1.011474609375, -0.972259521484375, -0.93304443359375, -0.893829345703125, -0.8546142578125, -0.815399169921875, -0.77618408203125, -0.736968994140625, -0.69775390625, -0.658538818359375, -0.61932373046875, -0.580108642578125, -0.5408935546875, -0.501678466796875, -0.46246337890625, -0.423248291015625, -0.384033203125, -0.344818115234375, -0.30560302734375, -0.266387939453125, -0.2271728515625, -0.187957763671875, -0.14874267578125, -0.109527587890625, -0.0703125, -0.031097412109375, 0.00811767578125, 0.047332763671875, 0.0865478515625, 0.125762939453125, 0.16497802734375, 0.204193115234375, 0.243408203125, 0.282623291015625, 0.32183837890625, 0.361053466796875, 0.4002685546875, 0.439483642578125, 0.47869873046875, 0.517913818359375, 0.55712890625, 0.596343994140625, 0.63555908203125, 0.674774169921875, 0.7139892578125, 0.753204345703125, 0.79241943359375, 0.831634521484375, 0.870849609375, 0.910064697265625, 0.94927978515625, 0.988494873046875, 1.0277099609375, 1.066925048828125, 1.10614013671875, 1.145355224609375, 1.1845703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 14.0, 6.0, 11.0, 17.0, 30.0, 46.0, 63.0, 85.0, 125.0, 171.0, 244.0, 380.0, 535.0, 784.0, 1187.0, 1759.0, 2761.0, 4036.0, 6308.0, 9897.0, 14883.0, 22735.0, 34770.0, 51569.0, 73868.0, 102172.0, 143104.0, 1160210.0, 140182.0, 101772.0, 73388.0, 50689.0, 34267.0, 22324.0, 14631.0, 9461.0, 6316.0, 4090.0, 2750.0, 1779.0, 1235.0, 794.0, 539.0, 362.0, 262.0, 181.0, 124.0, 84.0, 45.0, 26.0, 18.0, 17.0, 10.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0], "bins": [-0.09136962890625, -0.08846759796142578, -0.08556556701660156, -0.08266353607177734, -0.07976150512695312, -0.0768594741821289, -0.07395744323730469, -0.07105541229248047, -0.06815338134765625, -0.06525135040283203, -0.06234931945800781, -0.059447288513183594, -0.056545257568359375, -0.053643226623535156, -0.05074119567871094, -0.04783916473388672, -0.0449371337890625, -0.04203510284423828, -0.03913307189941406, -0.036231040954589844, -0.033329010009765625, -0.030426979064941406, -0.027524948120117188, -0.02462291717529297, -0.02172088623046875, -0.01881885528564453, -0.015916824340820312, -0.013014793395996094, -0.010112762451171875, -0.007210731506347656, -0.0043087005615234375, -0.0014066696166992188, 0.001495361328125, 0.004397392272949219, 0.0072994232177734375, 0.010201454162597656, 0.013103485107421875, 0.016005516052246094, 0.018907546997070312, 0.02180957794189453, 0.02471160888671875, 0.02761363983154297, 0.030515670776367188, 0.033417701721191406, 0.036319732666015625, 0.039221763610839844, 0.04212379455566406, 0.04502582550048828, 0.0479278564453125, 0.05082988739013672, 0.05373191833496094, 0.056633949279785156, 0.059535980224609375, 0.062438011169433594, 0.06534004211425781, 0.06824207305908203, 0.07114410400390625, 0.07404613494873047, 0.07694816589355469, 0.0798501968383789, 0.08275222778320312, 0.08565425872802734, 0.08855628967285156, 0.09145832061767578, 0.0943603515625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 6.0, 6.0, 5.0, 10.0, 9.0, 14.0, 13.0, 18.0, 19.0, 29.0, 22.0, 37.0, 36.0, 64.0, 108.0, 107.0, 146.0, 98.0, 56.0, 40.0, 32.0, 21.0, 23.0, 19.0, 14.0, 10.0, 10.0, 8.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00475311279296875, -0.0045830607414245605, -0.004413008689880371, -0.004242956638336182, -0.004072904586791992, -0.0039028525352478027, -0.0037328004837036133, -0.003562748432159424, -0.0033926963806152344, -0.003222644329071045, -0.0030525922775268555, -0.002882540225982666, -0.0027124881744384766, -0.002542436122894287, -0.0023723840713500977, -0.002202332019805908, -0.0020322799682617188, -0.0018622279167175293, -0.0016921758651733398, -0.0015221238136291504, -0.001352071762084961, -0.0011820197105407715, -0.001011967658996582, -0.0008419156074523926, -0.0006718635559082031, -0.0005018115043640137, -0.0003317594528198242, -0.00016170740127563477, 8.344650268554688e-06, 0.00017839670181274414, 0.0003484487533569336, 0.000518500804901123, 0.0006885528564453125, 0.000858604907989502, 0.0010286569595336914, 0.0011987090110778809, 0.0013687610626220703, 0.0015388131141662598, 0.0017088651657104492, 0.0018789172172546387, 0.002048969268798828, 0.0022190213203430176, 0.002389073371887207, 0.0025591254234313965, 0.002729177474975586, 0.0028992295265197754, 0.003069281578063965, 0.0032393336296081543, 0.0034093856811523438, 0.003579437732696533, 0.0037494897842407227, 0.003919541835784912, 0.0040895938873291016, 0.004259645938873291, 0.0044296979904174805, 0.00459975004196167, 0.004769802093505859, 0.004939854145050049, 0.005109906196594238, 0.005279958248138428, 0.005450010299682617, 0.005620062351226807, 0.005790114402770996, 0.0059601664543151855, 0.006130218505859375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 6.0, 13.0, 15.0, 13.0, 10.0, 14.0, 25.0, 27.0, 38.0, 57.0, 78.0, 141.0, 262.0, 718.0, 39117.0, 1002712.0, 4178.0, 460.0, 168.0, 145.0, 80.0, 64.0, 57.0, 32.0, 25.0, 22.0, 10.0, 19.0, 8.0, 10.0, 10.0, 1.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1676025390625, -0.16298484802246094, -0.15836715698242188, -0.1537494659423828, -0.14913177490234375, -0.1445140838623047, -0.13989639282226562, -0.13527870178222656, -0.1306610107421875, -0.12604331970214844, -0.12142562866210938, -0.11680793762207031, -0.11219024658203125, -0.10757255554199219, -0.10295486450195312, -0.09833717346191406, -0.093719482421875, -0.08910179138183594, -0.08448410034179688, -0.07986640930175781, -0.07524871826171875, -0.07063102722167969, -0.06601333618164062, -0.06139564514160156, -0.0567779541015625, -0.05216026306152344, -0.047542572021484375, -0.04292488098144531, -0.03830718994140625, -0.03368949890136719, -0.029071807861328125, -0.024454116821289062, -0.01983642578125, -0.015218734741210938, -0.010601043701171875, -0.0059833526611328125, -0.00136566162109375, 0.0032520294189453125, 0.007869720458984375, 0.012487411499023438, 0.0171051025390625, 0.021722793579101562, 0.026340484619140625, 0.030958175659179688, 0.03557586669921875, 0.04019355773925781, 0.044811248779296875, 0.04942893981933594, 0.054046630859375, 0.05866432189941406, 0.06328201293945312, 0.06789970397949219, 0.07251739501953125, 0.07713508605957031, 0.08175277709960938, 0.08637046813964844, 0.0909881591796875, 0.09560585021972656, 0.10022354125976562, 0.10484123229980469, 0.10945892333984375, 0.11407661437988281, 0.11869430541992188, 0.12331199645996094, 0.1279296875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 30.0, 860.0, 128.0], "bins": [-0.20568373799324036, -0.20240294933319092, -0.19912216067314148, -0.19584137201309204, -0.1925605684518814, -0.18927977979183197, -0.18599899113178253, -0.1827182024717331, -0.17943741381168365, -0.17615662515163422, -0.17287583649158478, -0.16959503293037415, -0.1663142442703247, -0.16303345561027527, -0.15975266695022583, -0.1564718782901764, -0.15319107472896576, -0.14991028606891632, -0.14662949740886688, -0.14334869384765625, -0.1400679051876068, -0.13678711652755737, -0.13350632786750793, -0.1302255392074585, -0.12694475054740906, -0.12366396188735962, -0.12038316577672958, -0.11710237711668015, -0.1138215884566307, -0.11054079234600067, -0.10726000368595123, -0.1039792150259018, -0.10069841146469116, -0.09741762280464172, -0.09413682669401169, -0.09085603803396225, -0.08757524937391281, -0.08429445326328278, -0.08101366460323334, -0.0777328759431839, -0.07445207983255386, -0.07117129117250443, -0.06789049506187439, -0.06460970640182495, -0.061328914016485214, -0.05804812163114548, -0.05476733297109604, -0.0514865405857563, -0.04820575192570686, -0.044924959540367126, -0.04164417088031769, -0.03836337849497795, -0.035082586109638214, -0.031801797449588776, -0.02852100506424904, -0.025240212678909302, -0.021959422156214714, -0.018678631633520126, -0.01539783924818039, -0.012117048725485802, -0.00883625727146864, -0.005555465817451477, -0.0022746752947568893, 0.0010061170905828476, 0.004286907147616148]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 4.0, 10.0, 14.0, 11.0, 13.0, 10.0, 18.0, 19.0, 33.0, 41.0, 31.0, 39.0, 39.0, 50.0, 42.0, 48.0, 56.0, 51.0, 51.0, 41.0, 41.0, 40.0, 30.0, 42.0, 25.0, 29.0, 29.0, 30.0, 27.0, 15.0, 14.0, 13.0, 10.0, 6.0, 8.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004167735576629639, -0.0040216511115431786, -0.0038755666464567184, -0.0037294821813702583, -0.0035833977162837982, -0.003437313251197338, -0.003291228786110878, -0.003145144321024418, -0.0029990598559379578, -0.0028529753908514977, -0.0027068909257650375, -0.0025608064606785774, -0.0024147219955921173, -0.002268637530505657, -0.002122553065419197, -0.001976468600332737, -0.0018303841352462769, -0.0016842996701598167, -0.0015382152050733566, -0.0013921307399868965, -0.0012460462749004364, -0.0010999618098139763, -0.0009538773447275162, -0.0008077928796410561, -0.000661708414554596, -0.0005156239494681358, -0.0003695394843816757, -0.0002234550192952156, -7.737055420875549e-05, 6.871391087770462e-05, 0.00021479837596416473, 0.00036088284105062485, 0.000506967306137085, 0.0006530517712235451, 0.0007991362363100052, 0.0009452207013964653, 0.0010913051664829254, 0.0012373896315693855, 0.0013834740966558456, 0.0015295585617423058, 0.0016756430268287659, 0.001821727491915226, 0.001967811957001686, 0.002113896422088146, 0.0022599808871746063, 0.0024060653522610664, 0.0025521498173475266, 0.0026982342824339867, 0.0028443187475204468, 0.002990403212606907, 0.003136487677693367, 0.003282572142779827, 0.0034286566078662872, 0.0035747410729527473, 0.0037208255380392075, 0.0038669100031256676, 0.004012994468212128, 0.004159078933298588, 0.004305163398385048, 0.004451247863471508, 0.004597332328557968, 0.004743416793644428, 0.004889501258730888, 0.0050355857238173485, 0.005181670188903809]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 4.0, 4.0, 4.0, 7.0, 12.0, 11.0, 12.0, 18.0, 17.0, 21.0, 21.0, 25.0, 31.0, 30.0, 31.0, 22.0, 31.0, 34.0, 36.0, 41.0, 28.0, 34.0, 37.0, 40.0, 38.0, 42.0, 41.0, 28.0, 37.0, 37.0, 28.0, 30.0, 20.0, 26.0, 20.0, 17.0, 12.0, 15.0, 9.0, 7.0, 10.0, 3.0, 14.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-2.142578125, -2.08154296875, -2.0205078125, -1.95947265625, -1.8984375, -1.83740234375, -1.7763671875, -1.71533203125, -1.654296875, -1.59326171875, -1.5322265625, -1.47119140625, -1.41015625, -1.34912109375, -1.2880859375, -1.22705078125, -1.166015625, -1.10498046875, -1.0439453125, -0.98291015625, -0.921875, -0.86083984375, -0.7998046875, -0.73876953125, -0.677734375, -0.61669921875, -0.5556640625, -0.49462890625, -0.43359375, -0.37255859375, -0.3115234375, -0.25048828125, -0.189453125, -0.12841796875, -0.0673828125, -0.00634765625, 0.0546875, 0.11572265625, 0.1767578125, 0.23779296875, 0.298828125, 0.35986328125, 0.4208984375, 0.48193359375, 0.54296875, 0.60400390625, 0.6650390625, 0.72607421875, 0.787109375, 0.84814453125, 0.9091796875, 0.97021484375, 1.03125, 1.09228515625, 1.1533203125, 1.21435546875, 1.275390625, 1.33642578125, 1.3974609375, 1.45849609375, 1.51953125, 1.58056640625, 1.6416015625, 1.70263671875, 1.763671875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [6.0, 3.0, 3.0, 1.0, 15.0, 12.0, 25.0, 8.0, 25.0, 30.0, 44.0, 70.0, 113.0, 115.0, 161.0, 229.0, 354.0, 529.0, 732.0, 1190.0, 1913.0, 2933.0, 4782.0, 7807.0, 13144.0, 23014.0, 41011.0, 76952.0, 145981.0, 262305.0, 213285.0, 113387.0, 59613.0, 32331.0, 18260.0, 10701.0, 6350.0, 3910.0, 2447.0, 1550.0, 1035.0, 670.0, 476.0, 313.0, 221.0, 166.0, 104.0, 62.0, 57.0, 30.0, 28.0, 26.0, 16.0, 5.0, 7.0, 8.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.521484375, -1.470428466796875, -1.41937255859375, -1.368316650390625, -1.3172607421875, -1.266204833984375, -1.21514892578125, -1.164093017578125, -1.113037109375, -1.061981201171875, -1.01092529296875, -0.959869384765625, -0.9088134765625, -0.857757568359375, -0.80670166015625, -0.755645751953125, -0.70458984375, -0.653533935546875, -0.60247802734375, -0.551422119140625, -0.5003662109375, -0.449310302734375, -0.39825439453125, -0.347198486328125, -0.296142578125, -0.245086669921875, -0.19403076171875, -0.142974853515625, -0.0919189453125, -0.040863037109375, 0.01019287109375, 0.061248779296875, 0.1123046875, 0.163360595703125, 0.21441650390625, 0.265472412109375, 0.3165283203125, 0.367584228515625, 0.41864013671875, 0.469696044921875, 0.520751953125, 0.571807861328125, 0.62286376953125, 0.673919677734375, 0.7249755859375, 0.776031494140625, 0.82708740234375, 0.878143310546875, 0.92919921875, 0.980255126953125, 1.03131103515625, 1.082366943359375, 1.1334228515625, 1.184478759765625, 1.23553466796875, 1.286590576171875, 1.337646484375, 1.388702392578125, 1.43975830078125, 1.490814208984375, 1.5418701171875, 1.592926025390625, 1.64398193359375, 1.695037841796875, 1.74609375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 8.0, 2.0, 6.0, 3.0, 3.0, 10.0, 10.0, 18.0, 21.0, 19.0, 21.0, 23.0, 25.0, 28.0, 34.0, 35.0, 46.0, 41.0, 54.0, 65.0, 125.0, 249.0, 1483.0, 185.0, 91.0, 73.0, 54.0, 40.0, 33.0, 38.0, 31.0, 33.0, 24.0, 23.0, 22.0, 17.0, 14.0, 8.0, 13.0, 7.0, 3.0, 2.0, 5.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.49609375, -7.26422119140625, -7.0323486328125, -6.80047607421875, -6.568603515625, -6.33673095703125, -6.1048583984375, -5.87298583984375, -5.64111328125, -5.40924072265625, -5.1773681640625, -4.94549560546875, -4.713623046875, -4.48175048828125, -4.2498779296875, -4.01800537109375, -3.7861328125, -3.55426025390625, -3.3223876953125, -3.09051513671875, -2.858642578125, -2.62677001953125, -2.3948974609375, -2.16302490234375, -1.93115234375, -1.69927978515625, -1.4674072265625, -1.23553466796875, -1.003662109375, -0.77178955078125, -0.5399169921875, -0.30804443359375, -0.076171875, 0.15570068359375, 0.3875732421875, 0.61944580078125, 0.851318359375, 1.08319091796875, 1.3150634765625, 1.54693603515625, 1.77880859375, 2.01068115234375, 2.2425537109375, 2.47442626953125, 2.706298828125, 2.93817138671875, 3.1700439453125, 3.40191650390625, 3.6337890625, 3.86566162109375, 4.0975341796875, 4.32940673828125, 4.561279296875, 4.79315185546875, 5.0250244140625, 5.25689697265625, 5.48876953125, 5.72064208984375, 5.9525146484375, 6.18438720703125, 6.416259765625, 6.64813232421875, 6.8800048828125, 7.11187744140625, 7.34375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 11.0, 10.0, 14.0, 15.0, 22.0, 21.0, 26.0, 57.0, 53.0, 90.0, 106.0, 148.0, 240.0, 540.0, 1347.0, 7412.0, 128309.0, 2867335.0, 129520.0, 7669.0, 1406.0, 505.0, 282.0, 123.0, 94.0, 68.0, 52.0, 44.0, 34.0, 37.0, 23.0, 23.0, 14.0, 11.0, 9.0, 6.0, 3.0, 3.0, 6.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.765625, -11.3798828125, -10.994140625, -10.6083984375, -10.22265625, -9.8369140625, -9.451171875, -9.0654296875, -8.6796875, -8.2939453125, -7.908203125, -7.5224609375, -7.13671875, -6.7509765625, -6.365234375, -5.9794921875, -5.59375, -5.2080078125, -4.822265625, -4.4365234375, -4.05078125, -3.6650390625, -3.279296875, -2.8935546875, -2.5078125, -2.1220703125, -1.736328125, -1.3505859375, -0.96484375, -0.5791015625, -0.193359375, 0.1923828125, 0.578125, 0.9638671875, 1.349609375, 1.7353515625, 2.12109375, 2.5068359375, 2.892578125, 3.2783203125, 3.6640625, 4.0498046875, 4.435546875, 4.8212890625, 5.20703125, 5.5927734375, 5.978515625, 6.3642578125, 6.75, 7.1357421875, 7.521484375, 7.9072265625, 8.29296875, 8.6787109375, 9.064453125, 9.4501953125, 9.8359375, 10.2216796875, 10.607421875, 10.9931640625, 11.37890625, 11.7646484375, 12.150390625, 12.5361328125, 12.921875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [329.0, 683.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.175058841705322, -0.6615290641784668, 3.8520007133483887, 8.365530014038086, 12.879060745239258, 17.39259147644043, 21.90612030029297, 26.419649124145508, 30.93317985534668, 35.44670867919922, 39.96023941040039, 44.47377014160156, 48.98729705810547, 53.500831604003906, 58.01435852050781, 62.52788543701172, 67.04141998291016, 71.55494689941406, 76.0684814453125, 80.5820083618164, 85.09553527832031, 89.60906982421875, 94.12259674072266, 98.63612365722656, 103.149658203125, 107.6631851196289, 112.17671966552734, 116.69024658203125, 121.20378112792969, 125.7173080444336, 130.2308349609375, 134.74436950683594, 139.25790405273438, 143.7714385986328, 148.2849578857422, 152.79849243164062, 157.31202697753906, 161.8255615234375, 166.33908081054688, 170.8526153564453, 175.36614990234375, 179.8796844482422, 184.39320373535156, 188.90673828125, 193.42027282714844, 197.93380737304688, 202.44732666015625, 206.9608612060547, 211.47438049316406, 215.9879150390625, 220.50143432617188, 225.0149688720703, 229.52850341796875, 234.04202270507812, 238.55555725097656, 243.069091796875, 247.58261108398438, 252.0961456298828, 256.60968017578125, 261.1231994628906, 265.63671875, 270.1502685546875, 274.6637878417969, 279.17730712890625, 283.69085693359375]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 4.0, 6.0, 5.0, 8.0, 10.0, 9.0, 9.0, 22.0, 21.0, 23.0, 21.0, 27.0, 33.0, 32.0, 36.0, 33.0, 27.0, 33.0, 38.0, 49.0, 42.0, 44.0, 40.0, 41.0, 27.0, 29.0, 34.0, 29.0, 27.0, 37.0, 21.0, 31.0, 25.0, 18.0, 17.0, 15.0, 16.0, 13.0, 8.0, 11.0, 5.0, 10.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.62816047668457, -21.891433715820312, -21.154705047607422, -20.417978286743164, -19.681249618530273, -18.944522857666016, -18.207794189453125, -17.471067428588867, -16.73434066772461, -15.997612953186035, -15.260885238647461, -14.524158477783203, -13.787429809570312, -13.050703048706055, -12.31397533416748, -11.577247619628906, -10.840518951416016, -10.103791236877441, -9.367063522338867, -8.63033676147461, -7.893608570098877, -7.156880855560303, -6.420153617858887, -5.6834259033203125, -4.946698188781738, -4.209970474243164, -3.473242998123169, -2.736515522003174, -1.9997878074645996, -1.2630600929260254, -0.5263328552246094, 0.21039485931396484, 0.9471244812011719, 1.6838520765304565, 2.420579671859741, 3.1573071479797363, 3.8940348625183105, 4.630762577056885, 5.367489814758301, 6.104217529296875, 6.840945243835449, 7.577672958374023, 8.314400672912598, 9.051128387451172, 9.78785514831543, 10.52458381652832, 11.261310577392578, 11.998038291931152, 12.734766006469727, 13.4714937210083, 14.208221435546875, 14.944948196411133, 15.681676864624023, 16.41840362548828, 17.155132293701172, 17.89185905456543, 18.628585815429688, 19.365312576293945, 20.102041244506836, 20.838768005371094, 21.575496673583984, 22.312223434448242, 23.0489501953125, 23.78567886352539, 24.52240753173828]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 5.0, 10.0, 12.0, 13.0, 8.0, 17.0, 26.0, 20.0, 28.0, 22.0, 38.0, 32.0, 21.0, 32.0, 32.0, 29.0, 41.0, 42.0, 31.0, 44.0, 46.0, 32.0, 45.0, 40.0, 30.0, 32.0, 34.0, 43.0, 26.0, 21.0, 15.0, 21.0, 26.0, 10.0, 15.0, 6.0, 7.0, 12.0, 4.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.271484375, -2.204864501953125, -2.13824462890625, -2.071624755859375, -2.0050048828125, -1.938385009765625, -1.87176513671875, -1.805145263671875, -1.738525390625, -1.671905517578125, -1.60528564453125, -1.538665771484375, -1.4720458984375, -1.405426025390625, -1.33880615234375, -1.272186279296875, -1.20556640625, -1.138946533203125, -1.07232666015625, -1.005706787109375, -0.9390869140625, -0.872467041015625, -0.80584716796875, -0.739227294921875, -0.672607421875, -0.605987548828125, -0.53936767578125, -0.472747802734375, -0.4061279296875, -0.339508056640625, -0.27288818359375, -0.206268310546875, -0.1396484375, -0.073028564453125, -0.00640869140625, 0.060211181640625, 0.1268310546875, 0.193450927734375, 0.26007080078125, 0.326690673828125, 0.393310546875, 0.459930419921875, 0.52655029296875, 0.593170166015625, 0.6597900390625, 0.726409912109375, 0.79302978515625, 0.859649658203125, 0.92626953125, 0.992889404296875, 1.05950927734375, 1.126129150390625, 1.1927490234375, 1.259368896484375, 1.32598876953125, 1.392608642578125, 1.459228515625, 1.525848388671875, 1.59246826171875, 1.659088134765625, 1.7257080078125, 1.792327880859375, 1.85894775390625, 1.925567626953125, 1.9921875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 8.0, 7.0, 11.0, 17.0, 16.0, 14.0, 27.0, 20.0, 31.0, 35.0, 42.0, 55.0, 53.0, 115.0, 176.0, 423.0, 1101.0, 4434.0, 23342.0, 196136.0, 2258493.0, 1562776.0, 125082.0, 16731.0, 3262.0, 929.0, 350.0, 152.0, 94.0, 71.0, 47.0, 40.0, 29.0, 23.0, 34.0, 18.0, 14.0, 8.0, 16.0, 6.0, 9.0, 7.0, 10.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.5546875, -8.3023681640625, -8.050048828125, -7.7977294921875, -7.54541015625, -7.2930908203125, -7.040771484375, -6.7884521484375, -6.5361328125, -6.2838134765625, -6.031494140625, -5.7791748046875, -5.52685546875, -5.2745361328125, -5.022216796875, -4.7698974609375, -4.517578125, -4.2652587890625, -4.012939453125, -3.7606201171875, -3.50830078125, -3.2559814453125, -3.003662109375, -2.7513427734375, -2.4990234375, -2.2467041015625, -1.994384765625, -1.7420654296875, -1.48974609375, -1.2374267578125, -0.985107421875, -0.7327880859375, -0.48046875, -0.2281494140625, 0.024169921875, 0.2764892578125, 0.52880859375, 0.7811279296875, 1.033447265625, 1.2857666015625, 1.5380859375, 1.7904052734375, 2.042724609375, 2.2950439453125, 2.54736328125, 2.7996826171875, 3.052001953125, 3.3043212890625, 3.556640625, 3.8089599609375, 4.061279296875, 4.3135986328125, 4.56591796875, 4.8182373046875, 5.070556640625, 5.3228759765625, 5.5751953125, 5.8275146484375, 6.079833984375, 6.3321533203125, 6.58447265625, 6.8367919921875, 7.089111328125, 7.3414306640625, 7.59375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 12.0, 16.0, 14.0, 25.0, 39.0, 50.0, 86.0, 110.0, 146.0, 227.0, 328.0, 463.0, 512.0, 514.0, 429.0, 364.0, 218.0, 168.0, 93.0, 82.0, 44.0, 26.0, 26.0, 20.0, 22.0, 14.0, 9.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5390625, -9.30059814453125, -9.0621337890625, -8.82366943359375, -8.585205078125, -8.34674072265625, -8.1082763671875, -7.86981201171875, -7.63134765625, -7.39288330078125, -7.1544189453125, -6.91595458984375, -6.677490234375, -6.43902587890625, -6.2005615234375, -5.96209716796875, -5.7236328125, -5.48516845703125, -5.2467041015625, -5.00823974609375, -4.769775390625, -4.53131103515625, -4.2928466796875, -4.05438232421875, -3.81591796875, -3.57745361328125, -3.3389892578125, -3.10052490234375, -2.862060546875, -2.62359619140625, -2.3851318359375, -2.14666748046875, -1.908203125, -1.66973876953125, -1.4312744140625, -1.19281005859375, -0.954345703125, -0.71588134765625, -0.4774169921875, -0.23895263671875, -0.00048828125, 0.23797607421875, 0.4764404296875, 0.71490478515625, 0.953369140625, 1.19183349609375, 1.4302978515625, 1.66876220703125, 1.9072265625, 2.14569091796875, 2.3841552734375, 2.62261962890625, 2.861083984375, 3.09954833984375, 3.3380126953125, 3.57647705078125, 3.81494140625, 4.05340576171875, 4.2918701171875, 4.53033447265625, 4.768798828125, 5.00726318359375, 5.2457275390625, 5.48419189453125, 5.72265625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 15.0, 13.0, 27.0, 32.0, 36.0, 65.0, 121.0, 220.0, 443.0, 1115.0, 3871.0, 22346.0, 259739.0, 2821632.0, 1005699.0, 67540.0, 8075.0, 1950.0, 657.0, 302.0, 142.0, 84.0, 47.0, 46.0, 22.0, 16.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.921875, -11.458740234375, -10.99560546875, -10.532470703125, -10.0693359375, -9.606201171875, -9.14306640625, -8.679931640625, -8.216796875, -7.753662109375, -7.29052734375, -6.827392578125, -6.3642578125, -5.901123046875, -5.43798828125, -4.974853515625, -4.51171875, -4.048583984375, -3.58544921875, -3.122314453125, -2.6591796875, -2.196044921875, -1.73291015625, -1.269775390625, -0.806640625, -0.343505859375, 0.11962890625, 0.582763671875, 1.0458984375, 1.509033203125, 1.97216796875, 2.435302734375, 2.8984375, 3.361572265625, 3.82470703125, 4.287841796875, 4.7509765625, 5.214111328125, 5.67724609375, 6.140380859375, 6.603515625, 7.066650390625, 7.52978515625, 7.992919921875, 8.4560546875, 8.919189453125, 9.38232421875, 9.845458984375, 10.30859375, 10.771728515625, 11.23486328125, 11.697998046875, 12.1611328125, 12.624267578125, 13.08740234375, 13.550537109375, 14.013671875, 14.476806640625, 14.93994140625, 15.403076171875, 15.8662109375, 16.329345703125, 16.79248046875, 17.255615234375, 17.71875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 8.0, 14.0, 28.0, 51.0, 53.0, 73.0, 119.0, 116.0, 118.0, 106.0, 92.0, 76.0, 58.0, 37.0, 29.0, 14.0, 8.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.619972229003906, -32.55096435546875, -31.48195457458496, -30.412946701049805, -29.343936920166016, -28.27492904663086, -27.205921173095703, -26.136913299560547, -25.067903518676758, -23.9988956451416, -22.929885864257812, -21.860877990722656, -20.7918701171875, -19.72286033630371, -18.653852462768555, -17.584842681884766, -16.51583480834961, -15.446825981140137, -14.377817153930664, -13.308809280395508, -12.239800453186035, -11.170791625976562, -10.101783752441406, -9.032774925231934, -7.963766098022461, -6.894757270812988, -5.825748920440674, -4.756740570068359, -3.6877317428588867, -2.618722915649414, -1.5497145652770996, -0.48070621490478516, 0.5882987976074219, 1.6573073863983154, 2.726315975189209, 3.7953245639801025, 4.864333152770996, 5.933341979980469, 7.002350330352783, 8.071358680725098, 9.14036750793457, 10.209376335144043, 11.278385162353516, 12.347393035888672, 13.416401863098145, 14.485410690307617, 15.554418563842773, 16.623428344726562, 17.69243621826172, 18.761444091796875, 19.830453872680664, 20.89946174621582, 21.96847152709961, 23.037479400634766, 24.106487274169922, 25.175495147705078, 26.244504928588867, 27.313512802124023, 28.382522583007812, 29.45153045654297, 30.520538330078125, 31.589548110961914, 32.6585578918457, 33.72756576538086, 34.796573638916016]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 5.0, 10.0, 9.0, 12.0, 18.0, 25.0, 17.0, 14.0, 28.0, 21.0, 31.0, 38.0, 24.0, 31.0, 34.0, 27.0, 37.0, 48.0, 29.0, 44.0, 39.0, 36.0, 28.0, 50.0, 39.0, 36.0, 26.0, 33.0, 19.0, 20.0, 21.0, 16.0, 17.0, 17.0, 13.0, 12.0, 9.0, 15.0, 9.0, 4.0, 6.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.896915435791016, -17.28498077392578, -16.673046112060547, -16.061113357543945, -15.449178695678711, -14.837244033813477, -14.225310325622559, -13.61337661743164, -13.001441955566406, -12.389507293701172, -11.777573585510254, -11.165639877319336, -10.553705215454102, -9.941770553588867, -9.32983684539795, -8.717903137207031, -8.105968475341797, -7.494034290313721, -6.8821001052856445, -6.270165920257568, -5.658231735229492, -5.046297550201416, -4.43436336517334, -3.8224291801452637, -3.2104949951171875, -2.5985608100891113, -1.9866266250610352, -1.374692440032959, -0.7627582550048828, -0.15082406997680664, 0.46111011505126953, 1.0730443000793457, 1.6849784851074219, 2.296912670135498, 2.908846855163574, 3.5207810401916504, 4.132715225219727, 4.744649410247803, 5.356583595275879, 5.968517780303955, 6.580451965332031, 7.192386150360107, 7.804320335388184, 8.416254043579102, 9.028188705444336, 9.64012336730957, 10.252057075500488, 10.863990783691406, 11.47592544555664, 12.087860107421875, 12.699793815612793, 13.311727523803711, 13.923662185668945, 14.53559684753418, 15.147530555725098, 15.759464263916016, 16.37139892578125, 16.983333587646484, 17.59526824951172, 18.20720100402832, 18.819135665893555, 19.43107032775879, 20.04300308227539, 20.654937744140625, 21.26687240600586]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 5.0, 8.0, 6.0, 7.0, 9.0, 9.0, 13.0, 12.0, 10.0, 22.0, 24.0, 28.0, 16.0, 25.0, 25.0, 24.0, 38.0, 34.0, 36.0, 32.0, 32.0, 42.0, 43.0, 39.0, 36.0, 38.0, 42.0, 42.0, 39.0, 38.0, 30.0, 36.0, 21.0, 20.0, 19.0, 8.0, 21.0, 12.0, 10.0, 15.0, 8.0, 6.0, 8.0, 3.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0546875, -1.98779296875, -1.9208984375, -1.85400390625, -1.787109375, -1.72021484375, -1.6533203125, -1.58642578125, -1.51953125, -1.45263671875, -1.3857421875, -1.31884765625, -1.251953125, -1.18505859375, -1.1181640625, -1.05126953125, -0.984375, -0.91748046875, -0.8505859375, -0.78369140625, -0.716796875, -0.64990234375, -0.5830078125, -0.51611328125, -0.44921875, -0.38232421875, -0.3154296875, -0.24853515625, -0.181640625, -0.11474609375, -0.0478515625, 0.01904296875, 0.0859375, 0.15283203125, 0.2197265625, 0.28662109375, 0.353515625, 0.42041015625, 0.4873046875, 0.55419921875, 0.62109375, 0.68798828125, 0.7548828125, 0.82177734375, 0.888671875, 0.95556640625, 1.0224609375, 1.08935546875, 1.15625, 1.22314453125, 1.2900390625, 1.35693359375, 1.423828125, 1.49072265625, 1.5576171875, 1.62451171875, 1.69140625, 1.75830078125, 1.8251953125, 1.89208984375, 1.958984375, 2.02587890625, 2.0927734375, 2.15966796875, 2.2265625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 5.0, 7.0, 6.0, 10.0, 10.0, 8.0, 21.0, 28.0, 48.0, 73.0, 92.0, 152.0, 204.0, 285.0, 434.0, 658.0, 980.0, 1482.0, 2379.0, 3783.0, 5842.0, 9769.0, 16207.0, 26892.0, 44298.0, 72399.0, 114122.0, 165984.0, 188432.0, 145525.0, 95994.0, 59206.0, 36125.0, 21946.0, 13157.0, 8198.0, 4932.0, 3060.0, 1972.0, 1295.0, 845.0, 521.0, 391.0, 238.0, 171.0, 105.0, 83.0, 55.0, 43.0, 26.0, 15.0, 17.0, 10.0, 10.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.1907958984375, -0.1848888397216797, -0.17898178100585938, -0.17307472229003906, -0.16716766357421875, -0.16126060485839844, -0.15535354614257812, -0.1494464874267578, -0.1435394287109375, -0.1376323699951172, -0.13172531127929688, -0.12581825256347656, -0.11991119384765625, -0.11400413513183594, -0.10809707641601562, -0.10219001770019531, -0.096282958984375, -0.09037590026855469, -0.08446884155273438, -0.07856178283691406, -0.07265472412109375, -0.06674766540527344, -0.060840606689453125, -0.05493354797363281, -0.0490264892578125, -0.04311943054199219, -0.037212371826171875, -0.03130531311035156, -0.02539825439453125, -0.019491195678710938, -0.013584136962890625, -0.0076770782470703125, -0.00177001953125, 0.0041370391845703125, 0.010044097900390625, 0.015951156616210938, 0.02185821533203125, 0.027765274047851562, 0.033672332763671875, 0.03957939147949219, 0.0454864501953125, 0.05139350891113281, 0.057300567626953125, 0.06320762634277344, 0.06911468505859375, 0.07502174377441406, 0.08092880249023438, 0.08683586120605469, 0.092742919921875, 0.09864997863769531, 0.10455703735351562, 0.11046409606933594, 0.11637115478515625, 0.12227821350097656, 0.12818527221679688, 0.1340923309326172, 0.1399993896484375, 0.1459064483642578, 0.15181350708007812, 0.15772056579589844, 0.16362762451171875, 0.16953468322753906, 0.17544174194335938, 0.1813488006591797, 0.187255859375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 1.0, 7.0, 7.0, 8.0, 8.0, 12.0, 7.0, 9.0, 21.0, 12.0, 26.0, 24.0, 25.0, 34.0, 28.0, 43.0, 37.0, 44.0, 36.0, 51.0, 41.0, 1071.0, 45.0, 41.0, 44.0, 39.0, 35.0, 39.0, 43.0, 20.0, 21.0, 18.0, 17.0, 11.0, 13.0, 17.0, 21.0, 10.0, 9.0, 11.0, 2.0, 2.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0], "bins": [-1.705078125, -1.6590423583984375, -1.613006591796875, -1.5669708251953125, -1.52093505859375, -1.4748992919921875, -1.428863525390625, -1.3828277587890625, -1.3367919921875, -1.2907562255859375, -1.244720458984375, -1.1986846923828125, -1.15264892578125, -1.1066131591796875, -1.060577392578125, -1.0145416259765625, -0.968505859375, -0.9224700927734375, -0.876434326171875, -0.8303985595703125, -0.78436279296875, -0.7383270263671875, -0.692291259765625, -0.6462554931640625, -0.6002197265625, -0.5541839599609375, -0.508148193359375, -0.4621124267578125, -0.41607666015625, -0.3700408935546875, -0.324005126953125, -0.2779693603515625, -0.23193359375, -0.1858978271484375, -0.139862060546875, -0.0938262939453125, -0.04779052734375, -0.0017547607421875, 0.044281005859375, 0.0903167724609375, 0.1363525390625, 0.1823883056640625, 0.228424072265625, 0.2744598388671875, 0.32049560546875, 0.3665313720703125, 0.412567138671875, 0.4586029052734375, 0.504638671875, 0.5506744384765625, 0.596710205078125, 0.6427459716796875, 0.68878173828125, 0.7348175048828125, 0.780853271484375, 0.8268890380859375, 0.8729248046875, 0.9189605712890625, 0.964996337890625, 1.0110321044921875, 1.05706787109375, 1.1031036376953125, 1.149139404296875, 1.1951751708984375, 1.2412109375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 4.0, 6.0, 15.0, 23.0, 36.0, 63.0, 77.0, 157.0, 258.0, 463.0, 725.0, 1355.0, 2339.0, 4050.0, 7419.0, 13520.0, 24887.0, 43629.0, 75350.0, 121922.0, 195773.0, 1219874.0, 153440.0, 98042.0, 58384.0, 33396.0, 18734.0, 10296.0, 5570.0, 3251.0, 1769.0, 970.0, 528.0, 303.0, 199.0, 119.0, 72.0, 37.0, 22.0, 14.0, 8.0, 14.0, 5.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1339111328125, -0.1293354034423828, -0.12475967407226562, -0.12018394470214844, -0.11560821533203125, -0.11103248596191406, -0.10645675659179688, -0.10188102722167969, -0.0973052978515625, -0.09272956848144531, -0.08815383911132812, -0.08357810974121094, -0.07900238037109375, -0.07442665100097656, -0.06985092163085938, -0.06527519226074219, -0.060699462890625, -0.05612373352050781, -0.051548004150390625, -0.04697227478027344, -0.04239654541015625, -0.03782081604003906, -0.033245086669921875, -0.028669357299804688, -0.0240936279296875, -0.019517898559570312, -0.014942169189453125, -0.010366439819335938, -0.00579071044921875, -0.0012149810791015625, 0.003360748291015625, 0.007936477661132812, 0.01251220703125, 0.017087936401367188, 0.021663665771484375, 0.026239395141601562, 0.03081512451171875, 0.03539085388183594, 0.039966583251953125, 0.04454231262207031, 0.0491180419921875, 0.05369377136230469, 0.058269500732421875, 0.06284523010253906, 0.06742095947265625, 0.07199668884277344, 0.07657241821289062, 0.08114814758300781, 0.085723876953125, 0.09029960632324219, 0.09487533569335938, 0.09945106506347656, 0.10402679443359375, 0.10860252380371094, 0.11317825317382812, 0.11775398254394531, 0.1223297119140625, 0.1269054412841797, 0.13148117065429688, 0.13605690002441406, 0.14063262939453125, 0.14520835876464844, 0.14978408813476562, 0.1543598175048828, 0.158935546875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 8.0, 8.0, 10.0, 11.0, 14.0, 20.0, 19.0, 32.0, 46.0, 30.0, 39.0, 56.0, 73.0, 88.0, 80.0, 78.0, 71.0, 61.0, 44.0, 45.0, 34.0, 20.0, 10.0, 19.0, 15.0, 8.0, 10.0, 7.0, 7.0, 7.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00803375244140625, -0.007800281047821045, -0.00756680965423584, -0.007333338260650635, -0.00709986686706543, -0.006866395473480225, -0.0066329240798950195, -0.0063994526863098145, -0.006165981292724609, -0.005932509899139404, -0.005699038505554199, -0.005465567111968994, -0.005232095718383789, -0.004998624324798584, -0.004765152931213379, -0.004531681537628174, -0.004298210144042969, -0.004064738750457764, -0.0038312673568725586, -0.0035977959632873535, -0.0033643245697021484, -0.0031308531761169434, -0.0028973817825317383, -0.002663910388946533, -0.002430438995361328, -0.002196967601776123, -0.001963496208190918, -0.0017300248146057129, -0.0014965534210205078, -0.0012630820274353027, -0.0010296106338500977, -0.0007961392402648926, -0.0005626678466796875, -0.0003291964530944824, -9.572505950927734e-05, 0.00013774633407592773, 0.0003712177276611328, 0.0006046891212463379, 0.000838160514831543, 0.001071631908416748, 0.0013051033020019531, 0.0015385746955871582, 0.0017720460891723633, 0.0020055174827575684, 0.0022389888763427734, 0.0024724602699279785, 0.0027059316635131836, 0.0029394030570983887, 0.0031728744506835938, 0.003406345844268799, 0.003639817237854004, 0.003873288631439209, 0.004106760025024414, 0.004340231418609619, 0.004573702812194824, 0.004807174205780029, 0.005040645599365234, 0.0052741169929504395, 0.0055075883865356445, 0.00574105978012085, 0.005974531173706055, 0.00620800256729126, 0.006441473960876465, 0.00667494535446167, 0.006908416748046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 8.0, 5.0, 6.0, 10.0, 11.0, 12.0, 22.0, 17.0, 31.0, 34.0, 33.0, 63.0, 63.0, 97.0, 126.0, 216.0, 560.0, 8035.0, 1004614.0, 32927.0, 789.0, 291.0, 126.0, 77.0, 68.0, 54.0, 38.0, 31.0, 32.0, 25.0, 27.0, 18.0, 12.0, 18.0, 4.0, 6.0, 4.0, 5.0, 6.0, 1.0, 2.0, 4.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1312255859375, -0.12679672241210938, -0.12236785888671875, -0.11793899536132812, -0.1135101318359375, -0.10908126831054688, -0.10465240478515625, -0.10022354125976562, -0.095794677734375, -0.09136581420898438, -0.08693695068359375, -0.08250808715820312, -0.0780792236328125, -0.07365036010742188, -0.06922149658203125, -0.06479263305664062, -0.06036376953125, -0.055934906005859375, -0.05150604248046875, -0.047077178955078125, -0.0426483154296875, -0.038219451904296875, -0.03379058837890625, -0.029361724853515625, -0.024932861328125, -0.020503997802734375, -0.01607513427734375, -0.011646270751953125, -0.0072174072265625, -0.002788543701171875, 0.00164031982421875, 0.006069183349609375, 0.010498046875, 0.014926910400390625, 0.01935577392578125, 0.023784637451171875, 0.0282135009765625, 0.032642364501953125, 0.03707122802734375, 0.041500091552734375, 0.045928955078125, 0.050357818603515625, 0.05478668212890625, 0.059215545654296875, 0.0636444091796875, 0.06807327270507812, 0.07250213623046875, 0.07693099975585938, 0.08135986328125, 0.08578872680664062, 0.09021759033203125, 0.09464645385742188, 0.0990753173828125, 0.10350418090820312, 0.10793304443359375, 0.11236190795898438, 0.116790771484375, 0.12121963500976562, 0.12564849853515625, 0.13007736206054688, 0.1345062255859375, 0.13893508911132812, 0.14336395263671875, 0.14779281616210938, 0.1522216796875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 895.0, 97.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.22215846180915833, -0.21793340146541595, -0.21370834112167358, -0.20948326587677002, -0.20525820553302765, -0.20103314518928528, -0.1968080699443817, -0.19258300960063934, -0.18835794925689697, -0.1841328889131546, -0.17990782856941223, -0.17568275332450867, -0.1714576929807663, -0.16723263263702393, -0.16300755739212036, -0.158782497048378, -0.15455743670463562, -0.15033237636089325, -0.14610731601715088, -0.14188224077224731, -0.13765718042850494, -0.13343212008476257, -0.129207044839859, -0.12498198449611664, -0.12075692415237427, -0.1165318638086319, -0.11230679601430893, -0.10808172821998596, -0.10385666787624359, -0.09963160753250122, -0.09540653973817825, -0.09118147194385529, -0.08695642650127411, -0.08273136615753174, -0.07850629836320877, -0.0742812305688858, -0.07005617022514343, -0.06583110988140106, -0.061606042087078094, -0.057380978018045425, -0.053155913949012756, -0.04893084987998009, -0.04470578581094742, -0.04048072174191475, -0.03625565767288208, -0.03203059360384941, -0.027805529534816742, -0.023580465465784073, -0.019355401396751404, -0.015130337327718735, -0.010905273258686066, -0.006680209189653397, -0.0024551451206207275, 0.0017699189484119415, 0.005994983017444611, 0.01022004708647728, 0.014445111155509949, 0.018670175224542618, 0.022895239293575287, 0.027120303362607956, 0.031345367431640625, 0.035570431500673294, 0.03979549556970596, 0.04402055963873863, 0.0482456237077713]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 2.0, 4.0, 5.0, 5.0, 8.0, 11.0, 17.0, 21.0, 18.0, 21.0, 17.0, 38.0, 28.0, 36.0, 36.0, 45.0, 42.0, 47.0, 38.0, 65.0, 38.0, 43.0, 38.0, 40.0, 39.0, 25.0, 38.0, 28.0, 29.0, 33.0, 29.0, 20.0, 21.0, 14.0, 20.0, 9.0, 6.0, 7.0, 7.0, 5.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.010283708572387695, -0.009949051775038242, -0.00961439497768879, -0.009279738180339336, -0.008945081382989883, -0.00861042458564043, -0.008275767788290977, -0.007941110990941525, -0.0076064541935920715, -0.0072717973962426186, -0.006937140598893166, -0.006602483801543713, -0.00626782700419426, -0.005933170206844807, -0.005598513409495354, -0.005263856612145901, -0.004929199814796448, -0.004594543017446995, -0.004259886220097542, -0.003925229422748089, -0.003590572625398636, -0.003255915828049183, -0.00292125903069973, -0.002586602233350277, -0.002251945436000824, -0.001917288638651371, -0.001582631841301918, -0.001247975043952465, -0.0009133182466030121, -0.0005786614492535591, -0.00024400465190410614, 9.065214544534683e-05, 0.0004253089427947998, 0.0007599657401442528, 0.0010946225374937057, 0.0014292793348431587, 0.0017639361321926117, 0.0020985929295420647, 0.0024332497268915176, 0.0027679065242409706, 0.0031025633215904236, 0.0034372201189398766, 0.0037718769162893295, 0.0041065337136387825, 0.0044411905109882355, 0.0047758473083376884, 0.005110504105687141, 0.005445160903036594, 0.005779817700386047, 0.0061144744977355, 0.006449131295084953, 0.006783788092434406, 0.007118444889783859, 0.007453101687133312, 0.007787758484482765, 0.008122415281832218, 0.008457072079181671, 0.008791728876531124, 0.009126385673880577, 0.00946104247123003, 0.009795699268579483, 0.010130356065928936, 0.010465012863278389, 0.010799669660627842, 0.011134326457977295]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 5.0, 8.0, 6.0, 7.0, 9.0, 9.0, 13.0, 12.0, 10.0, 22.0, 24.0, 28.0, 16.0, 25.0, 25.0, 24.0, 38.0, 34.0, 36.0, 32.0, 32.0, 42.0, 43.0, 39.0, 36.0, 38.0, 42.0, 42.0, 39.0, 38.0, 30.0, 36.0, 21.0, 20.0, 19.0, 8.0, 21.0, 12.0, 10.0, 15.0, 8.0, 6.0, 8.0, 3.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0546875, -1.98779296875, -1.9208984375, -1.85400390625, -1.787109375, -1.72021484375, -1.6533203125, -1.58642578125, -1.51953125, -1.45263671875, -1.3857421875, -1.31884765625, -1.251953125, -1.18505859375, -1.1181640625, -1.05126953125, -0.984375, -0.91748046875, -0.8505859375, -0.78369140625, -0.716796875, -0.64990234375, -0.5830078125, -0.51611328125, -0.44921875, -0.38232421875, -0.3154296875, -0.24853515625, -0.181640625, -0.11474609375, -0.0478515625, 0.01904296875, 0.0859375, 0.15283203125, 0.2197265625, 0.28662109375, 0.353515625, 0.42041015625, 0.4873046875, 0.55419921875, 0.62109375, 0.68798828125, 0.7548828125, 0.82177734375, 0.888671875, 0.95556640625, 1.0224609375, 1.08935546875, 1.15625, 1.22314453125, 1.2900390625, 1.35693359375, 1.423828125, 1.49072265625, 1.5576171875, 1.62451171875, 1.69140625, 1.75830078125, 1.8251953125, 1.89208984375, 1.958984375, 2.02587890625, 2.0927734375, 2.15966796875, 2.2265625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 8.0, 6.0, 8.0, 10.0, 14.0, 16.0, 33.0, 40.0, 58.0, 58.0, 103.0, 137.0, 196.0, 301.0, 478.0, 822.0, 1469.0, 2666.0, 5342.0, 11377.0, 25467.0, 63730.0, 167096.0, 347237.0, 251767.0, 99508.0, 38343.0, 16237.0, 7622.0, 3749.0, 1890.0, 1034.0, 586.0, 379.0, 241.0, 158.0, 102.0, 59.0, 59.0, 40.0, 34.0, 20.0, 17.0, 11.0, 11.0, 9.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.119140625, -2.045379638671875, -1.97161865234375, -1.897857666015625, -1.8240966796875, -1.750335693359375, -1.67657470703125, -1.602813720703125, -1.529052734375, -1.455291748046875, -1.38153076171875, -1.307769775390625, -1.2340087890625, -1.160247802734375, -1.08648681640625, -1.012725830078125, -0.93896484375, -0.865203857421875, -0.79144287109375, -0.717681884765625, -0.6439208984375, -0.570159912109375, -0.49639892578125, -0.422637939453125, -0.348876953125, -0.275115966796875, -0.20135498046875, -0.127593994140625, -0.0538330078125, 0.019927978515625, 0.09368896484375, 0.167449951171875, 0.2412109375, 0.314971923828125, 0.38873291015625, 0.462493896484375, 0.5362548828125, 0.610015869140625, 0.68377685546875, 0.757537841796875, 0.831298828125, 0.905059814453125, 0.97882080078125, 1.052581787109375, 1.1263427734375, 1.200103759765625, 1.27386474609375, 1.347625732421875, 1.42138671875, 1.495147705078125, 1.56890869140625, 1.642669677734375, 1.7164306640625, 1.790191650390625, 1.86395263671875, 1.937713623046875, 2.011474609375, 2.085235595703125, 2.15899658203125, 2.232757568359375, 2.3065185546875, 2.380279541015625, 2.45404052734375, 2.527801513671875, 2.6015625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 6.0, 6.0, 14.0, 12.0, 11.0, 13.0, 29.0, 24.0, 30.0, 36.0, 34.0, 43.0, 35.0, 56.0, 69.0, 98.0, 195.0, 1553.0, 229.0, 100.0, 72.0, 44.0, 45.0, 43.0, 38.0, 30.0, 31.0, 24.0, 24.0, 16.0, 13.0, 15.0, 11.0, 10.0, 9.0, 5.0, 8.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7109375, -8.4439697265625, -8.177001953125, -7.9100341796875, -7.64306640625, -7.3760986328125, -7.109130859375, -6.8421630859375, -6.5751953125, -6.3082275390625, -6.041259765625, -5.7742919921875, -5.50732421875, -5.2403564453125, -4.973388671875, -4.7064208984375, -4.439453125, -4.1724853515625, -3.905517578125, -3.6385498046875, -3.37158203125, -3.1046142578125, -2.837646484375, -2.5706787109375, -2.3037109375, -2.0367431640625, -1.769775390625, -1.5028076171875, -1.23583984375, -0.9688720703125, -0.701904296875, -0.4349365234375, -0.16796875, 0.0989990234375, 0.365966796875, 0.6329345703125, 0.89990234375, 1.1668701171875, 1.433837890625, 1.7008056640625, 1.9677734375, 2.2347412109375, 2.501708984375, 2.7686767578125, 3.03564453125, 3.3026123046875, 3.569580078125, 3.8365478515625, 4.103515625, 4.3704833984375, 4.637451171875, 4.9044189453125, 5.17138671875, 5.4383544921875, 5.705322265625, 5.9722900390625, 6.2392578125, 6.5062255859375, 6.773193359375, 7.0401611328125, 7.30712890625, 7.5740966796875, 7.841064453125, 8.1080322265625, 8.375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 8.0, 9.0, 12.0, 13.0, 14.0, 20.0, 24.0, 32.0, 32.0, 43.0, 56.0, 72.0, 121.0, 178.0, 316.0, 682.0, 1975.0, 13238.0, 404542.0, 2673631.0, 44383.0, 4003.0, 1127.0, 430.0, 205.0, 133.0, 93.0, 60.0, 51.0, 43.0, 29.0, 28.0, 12.0, 18.0, 18.0, 11.0, 8.0, 6.0, 4.0, 9.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.6796875, -11.293212890625, -10.90673828125, -10.520263671875, -10.1337890625, -9.747314453125, -9.36083984375, -8.974365234375, -8.587890625, -8.201416015625, -7.81494140625, -7.428466796875, -7.0419921875, -6.655517578125, -6.26904296875, -5.882568359375, -5.49609375, -5.109619140625, -4.72314453125, -4.336669921875, -3.9501953125, -3.563720703125, -3.17724609375, -2.790771484375, -2.404296875, -2.017822265625, -1.63134765625, -1.244873046875, -0.8583984375, -0.471923828125, -0.08544921875, 0.301025390625, 0.6875, 1.073974609375, 1.46044921875, 1.846923828125, 2.2333984375, 2.619873046875, 3.00634765625, 3.392822265625, 3.779296875, 4.165771484375, 4.55224609375, 4.938720703125, 5.3251953125, 5.711669921875, 6.09814453125, 6.484619140625, 6.87109375, 7.257568359375, 7.64404296875, 8.030517578125, 8.4169921875, 8.803466796875, 9.18994140625, 9.576416015625, 9.962890625, 10.349365234375, 10.73583984375, 11.122314453125, 11.5087890625, 11.895263671875, 12.28173828125, 12.668212890625, 13.0546875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [2.0, 19.0, 634.0, 362.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.162151336669922, -6.605534076690674, -3.048916816711426, 0.5076999664306641, 4.06431770324707, 7.620935440063477, 11.17755126953125, 14.734169006347656, 18.290786743164062, 21.84740447998047, 25.404022216796875, 28.96063804626465, 32.51725769042969, 36.073875427246094, 39.630489349365234, 43.18710708618164, 46.74372482299805, 50.30034255981445, 53.85696029663086, 57.41357421875, 60.970191955566406, 64.52680969238281, 68.08342742919922, 71.64004516601562, 75.19666290283203, 78.75328063964844, 82.30989837646484, 85.86651611328125, 89.42313385009766, 92.97975158691406, 96.53636169433594, 100.09298706054688, 103.64959716796875, 107.20621490478516, 110.76283264160156, 114.31945037841797, 117.87606811523438, 121.43268585205078, 124.98930358886719, 128.54591369628906, 132.1025390625, 135.65914916992188, 139.2157745361328, 142.7723846435547, 146.32901000976562, 149.8856201171875, 153.44224548339844, 156.9988555908203, 160.55548095703125, 164.11209106445312, 167.66871643066406, 171.22532653808594, 174.78195190429688, 178.33856201171875, 181.8951873779297, 185.45179748535156, 189.00840759277344, 192.5650177001953, 196.12164306640625, 199.67825317382812, 203.23487854003906, 206.79148864746094, 210.34811401367188, 213.90472412109375, 217.4613494873047]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 8.0, 7.0, 18.0, 13.0, 7.0, 13.0, 18.0, 22.0, 23.0, 24.0, 23.0, 29.0, 33.0, 39.0, 33.0, 39.0, 39.0, 33.0, 51.0, 43.0, 40.0, 42.0, 37.0, 43.0, 31.0, 47.0, 43.0, 24.0, 27.0, 20.0, 16.0, 32.0, 12.0, 12.0, 14.0, 10.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.91610336303711, -24.085018157958984, -23.253931045532227, -22.4228458404541, -21.591760635375977, -20.76067352294922, -19.929588317871094, -19.09850311279297, -18.267417907714844, -17.43633270263672, -16.60524559020996, -15.774160385131836, -14.943075180053711, -14.11198902130127, -13.280902862548828, -12.449817657470703, -11.618730545043945, -10.787644386291504, -9.956559181213379, -9.125473022460938, -8.294387817382812, -7.463301658630371, -6.63221549987793, -5.8011298179626465, -4.970044136047363, -4.13895845413208, -3.3078725337982178, -2.4767866134643555, -1.6457009315490723, -0.8146152496337891, 0.016470909118652344, 0.8475565910339355, 1.6786422729492188, 2.509727954864502, 3.3408138751983643, 4.171899795532227, 5.00298547744751, 5.834071159362793, 6.665157318115234, 7.496243000030518, 8.3273286819458, 9.158414840698242, 9.989500045776367, 10.820586204528809, 11.65167236328125, 12.482757568359375, 13.313843727111816, 14.144929885864258, 14.976015090942383, 15.807101249694824, 16.638187408447266, 17.46927261352539, 18.300357818603516, 19.13144302368164, 19.9625301361084, 20.793615341186523, 21.62470245361328, 22.455787658691406, 23.286874771118164, 24.11795997619629, 24.949045181274414, 25.780132293701172, 26.611217498779297, 27.442302703857422, 28.273387908935547]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 7.0, 5.0, 5.0, 8.0, 8.0, 12.0, 14.0, 17.0, 23.0, 18.0, 23.0, 24.0, 23.0, 27.0, 27.0, 32.0, 33.0, 33.0, 35.0, 37.0, 28.0, 44.0, 40.0, 47.0, 42.0, 46.0, 37.0, 39.0, 38.0, 27.0, 35.0, 24.0, 23.0, 14.0, 19.0, 13.0, 8.0, 7.0, 14.0, 12.0, 7.0, 3.0, 6.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.22265625, -2.152618408203125, -2.08258056640625, -2.012542724609375, -1.9425048828125, -1.872467041015625, -1.80242919921875, -1.732391357421875, -1.662353515625, -1.592315673828125, -1.52227783203125, -1.452239990234375, -1.3822021484375, -1.312164306640625, -1.24212646484375, -1.172088623046875, -1.10205078125, -1.032012939453125, -0.96197509765625, -0.891937255859375, -0.8218994140625, -0.751861572265625, -0.68182373046875, -0.611785888671875, -0.541748046875, -0.471710205078125, -0.40167236328125, -0.331634521484375, -0.2615966796875, -0.191558837890625, -0.12152099609375, -0.051483154296875, 0.0185546875, 0.088592529296875, 0.15863037109375, 0.228668212890625, 0.2987060546875, 0.368743896484375, 0.43878173828125, 0.508819580078125, 0.578857421875, 0.648895263671875, 0.71893310546875, 0.788970947265625, 0.8590087890625, 0.929046630859375, 0.99908447265625, 1.069122314453125, 1.13916015625, 1.209197998046875, 1.27923583984375, 1.349273681640625, 1.4193115234375, 1.489349365234375, 1.55938720703125, 1.629425048828125, 1.699462890625, 1.769500732421875, 1.83953857421875, 1.909576416015625, 1.9796142578125, 2.049652099609375, 2.11968994140625, 2.189727783203125, 2.259765625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 5.0, 6.0, 15.0, 12.0, 16.0, 19.0, 31.0, 40.0, 50.0, 78.0, 107.0, 193.0, 448.0, 1152.0, 3319.0, 11078.0, 39039.0, 172611.0, 953324.0, 2172041.0, 673412.0, 124226.0, 29815.0, 8660.0, 2716.0, 959.0, 350.0, 203.0, 82.0, 77.0, 37.0, 32.0, 26.0, 11.0, 25.0, 14.0, 6.0, 8.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03515625, -4.8695068359375, -4.703857421875, -4.5382080078125, -4.37255859375, -4.2069091796875, -4.041259765625, -3.8756103515625, -3.7099609375, -3.5443115234375, -3.378662109375, -3.2130126953125, -3.04736328125, -2.8817138671875, -2.716064453125, -2.5504150390625, -2.384765625, -2.2191162109375, -2.053466796875, -1.8878173828125, -1.72216796875, -1.5565185546875, -1.390869140625, -1.2252197265625, -1.0595703125, -0.8939208984375, -0.728271484375, -0.5626220703125, -0.39697265625, -0.2313232421875, -0.065673828125, 0.0999755859375, 0.265625, 0.4312744140625, 0.596923828125, 0.7625732421875, 0.92822265625, 1.0938720703125, 1.259521484375, 1.4251708984375, 1.5908203125, 1.7564697265625, 1.922119140625, 2.0877685546875, 2.25341796875, 2.4190673828125, 2.584716796875, 2.7503662109375, 2.916015625, 3.0816650390625, 3.247314453125, 3.4129638671875, 3.57861328125, 3.7442626953125, 3.909912109375, 4.0755615234375, 4.2412109375, 4.4068603515625, 4.572509765625, 4.7381591796875, 4.90380859375, 5.0694580078125, 5.235107421875, 5.4007568359375, 5.56640625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 12.0, 16.0, 16.0, 31.0, 47.0, 53.0, 58.0, 124.0, 131.0, 179.0, 256.0, 351.0, 414.0, 454.0, 451.0, 364.0, 282.0, 232.0, 155.0, 125.0, 86.0, 68.0, 43.0, 31.0, 24.0, 13.0, 12.0, 10.0, 5.0, 7.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.08203125, -6.87188720703125, -6.6617431640625, -6.45159912109375, -6.241455078125, -6.03131103515625, -5.8211669921875, -5.61102294921875, -5.40087890625, -5.19073486328125, -4.9805908203125, -4.77044677734375, -4.560302734375, -4.35015869140625, -4.1400146484375, -3.92987060546875, -3.7197265625, -3.50958251953125, -3.2994384765625, -3.08929443359375, -2.879150390625, -2.66900634765625, -2.4588623046875, -2.24871826171875, -2.03857421875, -1.82843017578125, -1.6182861328125, -1.40814208984375, -1.197998046875, -0.98785400390625, -0.7777099609375, -0.56756591796875, -0.357421875, -0.14727783203125, 0.0628662109375, 0.27301025390625, 0.483154296875, 0.69329833984375, 0.9034423828125, 1.11358642578125, 1.32373046875, 1.53387451171875, 1.7440185546875, 1.95416259765625, 2.164306640625, 2.37445068359375, 2.5845947265625, 2.79473876953125, 3.0048828125, 3.21502685546875, 3.4251708984375, 3.63531494140625, 3.845458984375, 4.05560302734375, 4.2657470703125, 4.47589111328125, 4.68603515625, 4.89617919921875, 5.1063232421875, 5.31646728515625, 5.526611328125, 5.73675537109375, 5.9468994140625, 6.15704345703125, 6.3671875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 5.0, 10.0, 18.0, 31.0, 50.0, 84.0, 119.0, 254.0, 446.0, 995.0, 2723.0, 9769.0, 52805.0, 363705.0, 2209649.0, 1333006.0, 182813.0, 28296.0, 5994.0, 1896.0, 779.0, 364.0, 176.0, 114.0, 62.0, 40.0, 24.0, 21.0, 11.0, 3.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.2578125, -12.9249267578125, -12.592041015625, -12.2591552734375, -11.92626953125, -11.5933837890625, -11.260498046875, -10.9276123046875, -10.5947265625, -10.2618408203125, -9.928955078125, -9.5960693359375, -9.26318359375, -8.9302978515625, -8.597412109375, -8.2645263671875, -7.931640625, -7.5987548828125, -7.265869140625, -6.9329833984375, -6.60009765625, -6.2672119140625, -5.934326171875, -5.6014404296875, -5.2685546875, -4.9356689453125, -4.602783203125, -4.2698974609375, -3.93701171875, -3.6041259765625, -3.271240234375, -2.9383544921875, -2.60546875, -2.2725830078125, -1.939697265625, -1.6068115234375, -1.27392578125, -0.9410400390625, -0.608154296875, -0.2752685546875, 0.0576171875, 0.3905029296875, 0.723388671875, 1.0562744140625, 1.38916015625, 1.7220458984375, 2.054931640625, 2.3878173828125, 2.720703125, 3.0535888671875, 3.386474609375, 3.7193603515625, 4.05224609375, 4.3851318359375, 4.718017578125, 5.0509033203125, 5.3837890625, 5.7166748046875, 6.049560546875, 6.3824462890625, 6.71533203125, 7.0482177734375, 7.381103515625, 7.7139892578125, 8.046875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 24.0, 62.0, 144.0, 214.0, 227.0, 182.0, 104.0, 33.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.97291564941406, -92.60398864746094, -90.23506164550781, -87.86613464355469, -85.4972152709961, -83.12828826904297, -80.75936126708984, -78.39043426513672, -76.0215072631836, -73.65258026123047, -71.28365325927734, -68.91473388671875, -66.54580688476562, -64.1768798828125, -61.807952880859375, -59.43902587890625, -57.07010269165039, -54.701175689697266, -52.332252502441406, -49.96332550048828, -47.594398498535156, -45.22547149658203, -42.85654830932617, -40.48762130737305, -38.11869812011719, -35.74977111816406, -33.3808479309082, -31.011920928955078, -28.642993927001953, -26.27406883239746, -23.90514373779297, -21.536216735839844, -19.167293548583984, -16.798368453979492, -14.429441452026367, -12.060516357421875, -9.691590309143066, -7.322664260864258, -4.953739166259766, -2.5848121643066406, -0.21588706970214844, 2.153038740158081, 4.5219645500183105, 6.890890121459961, 9.25981616973877, 11.628742218017578, 13.99766731262207, 16.366594314575195, 18.735519409179688, 21.10444450378418, 23.473371505737305, 25.842296600341797, 28.211223602294922, 30.580148696899414, 32.949073791503906, 35.31800079345703, 37.686927795410156, 40.05585479736328, 42.42477798461914, 44.793704986572266, 47.16263198852539, 49.53155517578125, 51.900482177734375, 54.2694091796875, 56.63833236694336]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 7.0, 9.0, 9.0, 6.0, 15.0, 12.0, 19.0, 19.0, 11.0, 22.0, 27.0, 25.0, 31.0, 29.0, 38.0, 38.0, 39.0, 43.0, 36.0, 43.0, 52.0, 39.0, 37.0, 46.0, 36.0, 28.0, 32.0, 43.0, 31.0, 23.0, 24.0, 24.0, 17.0, 24.0, 21.0, 15.0, 4.0, 10.0, 5.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.37346839904785, -19.657672882080078, -18.941877365112305, -18.22608184814453, -17.510286331176758, -16.794490814208984, -16.07869529724121, -15.362899780273438, -14.647104263305664, -13.93130874633789, -13.215513229370117, -12.499717712402344, -11.78392219543457, -11.068126678466797, -10.352331161499023, -9.63653564453125, -8.920741081237793, -8.20494556427002, -7.489150047302246, -6.773354530334473, -6.057559013366699, -5.341763496398926, -4.6259684562683105, -3.910172939300537, -3.1943774223327637, -2.4785819053649902, -1.7627865076065063, -1.0469911098480225, -0.331195592880249, 0.3845999240875244, 1.1003952026367188, 1.8161907196044922, 2.5319862365722656, 3.247781753540039, 3.9635772705078125, 4.679372787475586, 5.395168304443359, 6.110963821411133, 6.826758861541748, 7.5425543785095215, 8.258350372314453, 8.974145889282227, 9.68994140625, 10.405736923217773, 11.121532440185547, 11.83732795715332, 12.553123474121094, 13.268918991088867, 13.984713554382324, 14.700509071350098, 15.416304588317871, 16.132099151611328, 16.8478946685791, 17.563690185546875, 18.27948570251465, 18.995281219482422, 19.711076736450195, 20.42687225341797, 21.142667770385742, 21.858463287353516, 22.57425880432129, 23.290054321289062, 24.005849838256836, 24.72164535522461, 25.437440872192383]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 7.0, 4.0, 9.0, 10.0, 14.0, 16.0, 10.0, 11.0, 27.0, 19.0, 15.0, 29.0, 34.0, 30.0, 21.0, 37.0, 40.0, 33.0, 30.0, 46.0, 33.0, 51.0, 51.0, 40.0, 30.0, 42.0, 33.0, 37.0, 33.0, 25.0, 26.0, 18.0, 22.0, 26.0, 21.0, 12.0, 10.0, 6.0, 7.0, 4.0, 7.0, 10.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.2578125, -2.184661865234375, -2.11151123046875, -2.038360595703125, -1.9652099609375, -1.892059326171875, -1.81890869140625, -1.745758056640625, -1.672607421875, -1.599456787109375, -1.52630615234375, -1.453155517578125, -1.3800048828125, -1.306854248046875, -1.23370361328125, -1.160552978515625, -1.08740234375, -1.014251708984375, -0.94110107421875, -0.867950439453125, -0.7947998046875, -0.721649169921875, -0.64849853515625, -0.575347900390625, -0.502197265625, -0.429046630859375, -0.35589599609375, -0.282745361328125, -0.2095947265625, -0.136444091796875, -0.06329345703125, 0.009857177734375, 0.0830078125, 0.156158447265625, 0.22930908203125, 0.302459716796875, 0.3756103515625, 0.448760986328125, 0.52191162109375, 0.595062255859375, 0.668212890625, 0.741363525390625, 0.81451416015625, 0.887664794921875, 0.9608154296875, 1.033966064453125, 1.10711669921875, 1.180267333984375, 1.25341796875, 1.326568603515625, 1.39971923828125, 1.472869873046875, 1.5460205078125, 1.619171142578125, 1.69232177734375, 1.765472412109375, 1.838623046875, 1.911773681640625, 1.98492431640625, 2.058074951171875, 2.1312255859375, 2.204376220703125, 2.27752685546875, 2.350677490234375, 2.423828125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 8.0, 9.0, 13.0, 27.0, 19.0, 27.0, 71.0, 105.0, 144.0, 192.0, 332.0, 466.0, 741.0, 1089.0, 1574.0, 2535.0, 3819.0, 5804.0, 9192.0, 14680.0, 23061.0, 37495.0, 60412.0, 95226.0, 140454.0, 177090.0, 159786.0, 114495.0, 74387.0, 46912.0, 28758.0, 17873.0, 11198.0, 7166.0, 4613.0, 2928.0, 2007.0, 1259.0, 875.0, 546.0, 394.0, 246.0, 161.0, 124.0, 78.0, 59.0, 53.0, 25.0, 13.0, 12.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1962890625, -0.19010162353515625, -0.1839141845703125, -0.17772674560546875, -0.171539306640625, -0.16535186767578125, -0.1591644287109375, -0.15297698974609375, -0.14678955078125, -0.14060211181640625, -0.1344146728515625, -0.12822723388671875, -0.122039794921875, -0.11585235595703125, -0.1096649169921875, -0.10347747802734375, -0.0972900390625, -0.09110260009765625, -0.0849151611328125, -0.07872772216796875, -0.072540283203125, -0.06635284423828125, -0.0601654052734375, -0.05397796630859375, -0.04779052734375, -0.04160308837890625, -0.0354156494140625, -0.02922821044921875, -0.023040771484375, -0.01685333251953125, -0.0106658935546875, -0.00447845458984375, 0.001708984375, 0.00789642333984375, 0.0140838623046875, 0.02027130126953125, 0.026458740234375, 0.03264617919921875, 0.0388336181640625, 0.04502105712890625, 0.05120849609375, 0.05739593505859375, 0.0635833740234375, 0.06977081298828125, 0.075958251953125, 0.08214569091796875, 0.0883331298828125, 0.09452056884765625, 0.1007080078125, 0.10689544677734375, 0.1130828857421875, 0.11927032470703125, 0.125457763671875, 0.13164520263671875, 0.1378326416015625, 0.14402008056640625, 0.15020751953125, 0.15639495849609375, 0.1625823974609375, 0.16876983642578125, 0.174957275390625, 0.18114471435546875, 0.1873321533203125, 0.19351959228515625, 0.19970703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 8.0, 8.0, 9.0, 6.0, 5.0, 4.0, 6.0, 13.0, 8.0, 14.0, 21.0, 26.0, 23.0, 33.0, 34.0, 30.0, 27.0, 43.0, 44.0, 37.0, 42.0, 36.0, 1071.0, 39.0, 40.0, 44.0, 30.0, 37.0, 34.0, 32.0, 32.0, 24.0, 19.0, 30.0, 15.0, 22.0, 18.0, 8.0, 9.0, 6.0, 10.0, 3.0, 8.0, 7.0, 0.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4228515625, -1.3766937255859375, -1.330535888671875, -1.2843780517578125, -1.23822021484375, -1.1920623779296875, -1.145904541015625, -1.0997467041015625, -1.0535888671875, -1.0074310302734375, -0.961273193359375, -0.9151153564453125, -0.86895751953125, -0.8227996826171875, -0.776641845703125, -0.7304840087890625, -0.684326171875, -0.6381683349609375, -0.592010498046875, -0.5458526611328125, -0.49969482421875, -0.4535369873046875, -0.407379150390625, -0.3612213134765625, -0.3150634765625, -0.2689056396484375, -0.222747802734375, -0.1765899658203125, -0.13043212890625, -0.0842742919921875, -0.038116455078125, 0.0080413818359375, 0.05419921875, 0.1003570556640625, 0.146514892578125, 0.1926727294921875, 0.23883056640625, 0.2849884033203125, 0.331146240234375, 0.3773040771484375, 0.4234619140625, 0.4696197509765625, 0.515777587890625, 0.5619354248046875, 0.60809326171875, 0.6542510986328125, 0.700408935546875, 0.7465667724609375, 0.792724609375, 0.8388824462890625, 0.885040283203125, 0.9311981201171875, 0.97735595703125, 1.0235137939453125, 1.069671630859375, 1.1158294677734375, 1.1619873046875, 1.2081451416015625, 1.254302978515625, 1.3004608154296875, 1.34661865234375, 1.3927764892578125, 1.438934326171875, 1.4850921630859375, 1.53125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 15.0, 29.0, 32.0, 63.0, 74.0, 118.0, 183.0, 259.0, 373.0, 577.0, 972.0, 1470.0, 2260.0, 3711.0, 5808.0, 8985.0, 14200.0, 23203.0, 37282.0, 57715.0, 87216.0, 124018.0, 505971.0, 845924.0, 125516.0, 89557.0, 59511.0, 38154.0, 23803.0, 15025.0, 9376.0, 5675.0, 3587.0, 2273.0, 1441.0, 963.0, 604.0, 413.0, 247.0, 174.0, 81.0, 85.0, 68.0, 42.0, 19.0, 17.0, 14.0, 13.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1163330078125, -0.11245918273925781, -0.10858535766601562, -0.10471153259277344, -0.10083770751953125, -0.09696388244628906, -0.09309005737304688, -0.08921623229980469, -0.0853424072265625, -0.08146858215332031, -0.07759475708007812, -0.07372093200683594, -0.06984710693359375, -0.06597328186035156, -0.062099456787109375, -0.05822563171386719, -0.054351806640625, -0.05047798156738281, -0.046604156494140625, -0.04273033142089844, -0.03885650634765625, -0.03498268127441406, -0.031108856201171875, -0.027235031127929688, -0.0233612060546875, -0.019487380981445312, -0.015613555908203125, -0.011739730834960938, -0.00786590576171875, -0.0039920806884765625, -0.000118255615234375, 0.0037555694580078125, 0.00762939453125, 0.011503219604492188, 0.015377044677734375, 0.019250869750976562, 0.02312469482421875, 0.026998519897460938, 0.030872344970703125, 0.03474617004394531, 0.0386199951171875, 0.04249382019042969, 0.046367645263671875, 0.05024147033691406, 0.05411529541015625, 0.05798912048339844, 0.061862945556640625, 0.06573677062988281, 0.069610595703125, 0.07348442077636719, 0.07735824584960938, 0.08123207092285156, 0.08510589599609375, 0.08897972106933594, 0.09285354614257812, 0.09672737121582031, 0.1006011962890625, 0.10447502136230469, 0.10834884643554688, 0.11222267150878906, 0.11609649658203125, 0.11997032165527344, 0.12384414672851562, 0.1277179718017578, 0.131591796875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 10.0, 6.0, 8.0, 9.0, 17.0, 20.0, 17.0, 39.0, 30.0, 64.0, 85.0, 135.0, 125.0, 95.0, 77.0, 52.0, 40.0, 32.0, 18.0, 16.0, 18.0, 13.0, 11.0, 6.0, 7.0, 1.0, 2.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0074920654296875, -0.007260143756866455, -0.00702822208404541, -0.006796300411224365, -0.00656437873840332, -0.006332457065582275, -0.0061005353927612305, -0.0058686137199401855, -0.005636692047119141, -0.005404770374298096, -0.005172848701477051, -0.004940927028656006, -0.004709005355834961, -0.004477083683013916, -0.004245162010192871, -0.004013240337371826, -0.0037813186645507812, -0.0035493969917297363, -0.0033174753189086914, -0.0030855536460876465, -0.0028536319732666016, -0.0026217103004455566, -0.0023897886276245117, -0.002157866954803467, -0.0019259452819824219, -0.001694023609161377, -0.001462101936340332, -0.0012301802635192871, -0.0009982585906982422, -0.0007663369178771973, -0.0005344152450561523, -0.0003024935722351074, -7.05718994140625e-05, 0.00016134977340698242, 0.00039327144622802734, 0.0006251931190490723, 0.0008571147918701172, 0.0010890364646911621, 0.001320958137512207, 0.001552879810333252, 0.0017848014831542969, 0.002016723155975342, 0.0022486448287963867, 0.0024805665016174316, 0.0027124881744384766, 0.0029444098472595215, 0.0031763315200805664, 0.0034082531929016113, 0.0036401748657226562, 0.003872096538543701, 0.004104018211364746, 0.004335939884185791, 0.004567861557006836, 0.004799783229827881, 0.005031704902648926, 0.005263626575469971, 0.005495548248291016, 0.0057274699211120605, 0.0059593915939331055, 0.00619131326675415, 0.006423234939575195, 0.00665515661239624, 0.006887078285217285, 0.00711899995803833, 0.007350921630859375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 3.0, 1.0, 4.0, 9.0, 12.0, 8.0, 12.0, 27.0, 27.0, 51.0, 97.0, 163.0, 287.0, 962.0, 92947.0, 949834.0, 3199.0, 391.0, 173.0, 104.0, 69.0, 47.0, 26.0, 18.0, 11.0, 14.0, 6.0, 4.0, 12.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1748046875, -0.16920089721679688, -0.16359710693359375, -0.15799331665039062, -0.1523895263671875, -0.14678573608398438, -0.14118194580078125, -0.13557815551757812, -0.129974365234375, -0.12437057495117188, -0.11876678466796875, -0.11316299438476562, -0.1075592041015625, -0.10195541381835938, -0.09635162353515625, -0.09074783325195312, -0.08514404296875, -0.07954025268554688, -0.07393646240234375, -0.06833267211914062, -0.0627288818359375, -0.057125091552734375, -0.05152130126953125, -0.045917510986328125, -0.040313720703125, -0.034709930419921875, -0.02910614013671875, -0.023502349853515625, -0.0178985595703125, -0.012294769287109375, -0.00669097900390625, -0.001087188720703125, 0.0045166015625, 0.010120391845703125, 0.01572418212890625, 0.021327972412109375, 0.0269317626953125, 0.032535552978515625, 0.03813934326171875, 0.043743133544921875, 0.049346923828125, 0.054950714111328125, 0.06055450439453125, 0.06615829467773438, 0.0717620849609375, 0.07736587524414062, 0.08296966552734375, 0.08857345581054688, 0.09417724609375, 0.09978103637695312, 0.10538482666015625, 0.11098861694335938, 0.1165924072265625, 0.12219619750976562, 0.12779998779296875, 0.13340377807617188, 0.139007568359375, 0.14461135864257812, 0.15021514892578125, 0.15581893920898438, 0.1614227294921875, 0.16702651977539062, 0.17263031005859375, 0.17823410034179688, 0.183837890625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 12.0, 123.0, 734.0, 127.0, 16.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13747811317443848, -0.1349993646144867, -0.1325206160545349, -0.13004186749458313, -0.12756311893463135, -0.12508437037467957, -0.12260562181472778, -0.120126873254776, -0.11764812469482422, -0.11516937613487244, -0.11269062757492065, -0.11021187901496887, -0.10773313045501709, -0.10525438189506531, -0.10277563333511353, -0.10029688477516174, -0.09781814366579056, -0.09533939510583878, -0.092860646545887, -0.09038189798593521, -0.08790314942598343, -0.08542440086603165, -0.08294565230607986, -0.08046691119670868, -0.0779881626367569, -0.07550941407680511, -0.07303066551685333, -0.07055191695690155, -0.06807316839694977, -0.06559441983699799, -0.0631156712770462, -0.06063692644238472, -0.05815816670656204, -0.05567941814661026, -0.05320066958665848, -0.050721921026706696, -0.04824317246675491, -0.04576442390680313, -0.04328567907214165, -0.040806930512189865, -0.03832818567752838, -0.0358494371175766, -0.03337068855762482, -0.030891941860318184, -0.0284131933003664, -0.02593444474041462, -0.023455698043107986, -0.020976949483156204, -0.018498199060559273, -0.01601945050060749, -0.013540702871978283, -0.011061955243349075, -0.008583206683397293, -0.006104458123445511, -0.0036257104948163033, -0.0011469628661870956, 0.0013317856937646866, 0.0038105337880551815, 0.006289281882345676, 0.008768029510974884, 0.011246778070926666, 0.013725526630878448, 0.01620427519083023, 0.018683021888136864, 0.021161770448088646]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 13.0, 14.0, 9.0, 7.0, 19.0, 17.0, 23.0, 22.0, 31.0, 27.0, 29.0, 32.0, 43.0, 41.0, 43.0, 47.0, 46.0, 39.0, 38.0, 41.0, 43.0, 42.0, 39.0, 33.0, 34.0, 45.0, 22.0, 24.0, 15.0, 31.0, 18.0, 13.0, 9.0, 13.0, 6.0, 5.0, 6.0, 5.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.006684482097625732, -0.00648366566747427, -0.006282849237322807, -0.006082032807171345, -0.005881216377019882, -0.00568039994686842, -0.005479583516716957, -0.0052787670865654945, -0.005077950656414032, -0.004877134226262569, -0.004676317796111107, -0.004475501365959644, -0.004274684935808182, -0.004073868505656719, -0.0038730520755052567, -0.003672235645353794, -0.0034714192152023315, -0.003270602785050869, -0.0030697863548994064, -0.002868969924747944, -0.0026681534945964813, -0.0024673370644450188, -0.002266520634293556, -0.0020657042041420937, -0.001864887773990631, -0.0016640713438391685, -0.001463254913687706, -0.0012624384835362434, -0.0010616220533847809, -0.0008608056232333183, -0.0006599891930818558, -0.0004591727629303932, -0.00025835633277893066, -5.753990262746811e-05, 0.00014327652752399445, 0.000344092957675457, 0.0005449093878269196, 0.0007457258179783821, 0.0009465422481298447, 0.0011473586782813072, 0.0013481751084327698, 0.0015489915385842323, 0.0017498079687356949, 0.0019506243988871574, 0.00215144082903862, 0.0023522572591900826, 0.002553073689341545, 0.0027538901194930077, 0.00295470654964447, 0.0031555229797959328, 0.0033563394099473953, 0.003557155840098858, 0.0037579722702503204, 0.003958788700401783, 0.0041596051305532455, 0.004360421560704708, 0.004561237990856171, 0.004762054421007633, 0.004962870851159096, 0.005163687281310558, 0.005364503711462021, 0.005565320141613483, 0.005766136571764946, 0.0059669530019164085, 0.006167769432067871]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 7.0, 4.0, 9.0, 10.0, 15.0, 15.0, 10.0, 12.0, 26.0, 19.0, 16.0, 29.0, 34.0, 30.0, 20.0, 38.0, 40.0, 32.0, 31.0, 45.0, 33.0, 52.0, 50.0, 41.0, 29.0, 42.0, 33.0, 37.0, 33.0, 26.0, 25.0, 18.0, 23.0, 25.0, 21.0, 12.0, 10.0, 6.0, 7.0, 4.0, 7.0, 10.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.255859375, -2.1827392578125, -2.109619140625, -2.0364990234375, -1.96337890625, -1.8902587890625, -1.817138671875, -1.7440185546875, -1.6708984375, -1.5977783203125, -1.524658203125, -1.4515380859375, -1.37841796875, -1.3052978515625, -1.232177734375, -1.1590576171875, -1.0859375, -1.0128173828125, -0.939697265625, -0.8665771484375, -0.79345703125, -0.7203369140625, -0.647216796875, -0.5740966796875, -0.5009765625, -0.4278564453125, -0.354736328125, -0.2816162109375, -0.20849609375, -0.1353759765625, -0.062255859375, 0.0108642578125, 0.083984375, 0.1571044921875, 0.230224609375, 0.3033447265625, 0.37646484375, 0.4495849609375, 0.522705078125, 0.5958251953125, 0.6689453125, 0.7420654296875, 0.815185546875, 0.8883056640625, 0.96142578125, 1.0345458984375, 1.107666015625, 1.1807861328125, 1.25390625, 1.3270263671875, 1.400146484375, 1.4732666015625, 1.54638671875, 1.6195068359375, 1.692626953125, 1.7657470703125, 1.8388671875, 1.9119873046875, 1.985107421875, 2.0582275390625, 2.13134765625, 2.2044677734375, 2.277587890625, 2.3507080078125, 2.423828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 10.0, 17.0, 23.0, 36.0, 52.0, 92.0, 118.0, 201.0, 234.0, 403.0, 678.0, 956.0, 1668.0, 2774.0, 4763.0, 8594.0, 16666.0, 32820.0, 65263.0, 125342.0, 210439.0, 237904.0, 160783.0, 86517.0, 43749.0, 22184.0, 11279.0, 6123.0, 3301.0, 2043.0, 1213.0, 831.0, 495.0, 319.0, 230.0, 135.0, 101.0, 59.0, 39.0, 25.0, 30.0, 11.0, 6.0, 6.0, 5.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8544921875, -1.7931060791015625, -1.731719970703125, -1.6703338623046875, -1.60894775390625, -1.5475616455078125, -1.486175537109375, -1.4247894287109375, -1.3634033203125, -1.3020172119140625, -1.240631103515625, -1.1792449951171875, -1.11785888671875, -1.0564727783203125, -0.995086669921875, -0.9337005615234375, -0.872314453125, -0.8109283447265625, -0.749542236328125, -0.6881561279296875, -0.62677001953125, -0.5653839111328125, -0.503997802734375, -0.4426116943359375, -0.3812255859375, -0.3198394775390625, -0.258453369140625, -0.1970672607421875, -0.13568115234375, -0.0742950439453125, -0.012908935546875, 0.0484771728515625, 0.10986328125, 0.1712493896484375, 0.232635498046875, 0.2940216064453125, 0.35540771484375, 0.4167938232421875, 0.478179931640625, 0.5395660400390625, 0.6009521484375, 0.6623382568359375, 0.723724365234375, 0.7851104736328125, 0.84649658203125, 0.9078826904296875, 0.969268798828125, 1.0306549072265625, 1.092041015625, 1.1534271240234375, 1.214813232421875, 1.2761993408203125, 1.33758544921875, 1.3989715576171875, 1.460357666015625, 1.5217437744140625, 1.5831298828125, 1.6445159912109375, 1.705902099609375, 1.7672882080078125, 1.82867431640625, 1.8900604248046875, 1.951446533203125, 2.0128326416015625, 2.07421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 7.0, 17.0, 14.0, 10.0, 23.0, 33.0, 30.0, 32.0, 32.0, 37.0, 46.0, 35.0, 71.0, 125.0, 222.0, 1413.0, 294.0, 125.0, 69.0, 60.0, 50.0, 46.0, 35.0, 39.0, 33.0, 23.0, 21.0, 18.0, 19.0, 7.0, 14.0, 12.0, 3.0, 7.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.3726806640625, -8.081298828125, -7.7899169921875, -7.49853515625, -7.2071533203125, -6.915771484375, -6.6243896484375, -6.3330078125, -6.0416259765625, -5.750244140625, -5.4588623046875, -5.16748046875, -4.8760986328125, -4.584716796875, -4.2933349609375, -4.001953125, -3.7105712890625, -3.419189453125, -3.1278076171875, -2.83642578125, -2.5450439453125, -2.253662109375, -1.9622802734375, -1.6708984375, -1.3795166015625, -1.088134765625, -0.7967529296875, -0.50537109375, -0.2139892578125, 0.077392578125, 0.3687744140625, 0.66015625, 0.9515380859375, 1.242919921875, 1.5343017578125, 1.82568359375, 2.1170654296875, 2.408447265625, 2.6998291015625, 2.9912109375, 3.2825927734375, 3.573974609375, 3.8653564453125, 4.15673828125, 4.4481201171875, 4.739501953125, 5.0308837890625, 5.322265625, 5.6136474609375, 5.905029296875, 6.1964111328125, 6.48779296875, 6.7791748046875, 7.070556640625, 7.3619384765625, 7.6533203125, 7.9447021484375, 8.236083984375, 8.5274658203125, 8.81884765625, 9.1102294921875, 9.401611328125, 9.6929931640625, 9.984375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 9.0, 5.0, 11.0, 12.0, 18.0, 20.0, 25.0, 20.0, 49.0, 58.0, 78.0, 78.0, 137.0, 226.0, 407.0, 1128.0, 6031.0, 101640.0, 2803999.0, 219760.0, 9261.0, 1369.0, 515.0, 239.0, 173.0, 105.0, 71.0, 57.0, 50.0, 31.0, 30.0, 20.0, 14.0, 13.0, 13.0, 7.0, 6.0, 6.0, 5.0, 1.0, 3.0, 6.0, 0.0, 1.0, 1.0, 3.0], "bins": [-16.171875, -15.72998046875, -15.2880859375, -14.84619140625, -14.404296875, -13.96240234375, -13.5205078125, -13.07861328125, -12.63671875, -12.19482421875, -11.7529296875, -11.31103515625, -10.869140625, -10.42724609375, -9.9853515625, -9.54345703125, -9.1015625, -8.65966796875, -8.2177734375, -7.77587890625, -7.333984375, -6.89208984375, -6.4501953125, -6.00830078125, -5.56640625, -5.12451171875, -4.6826171875, -4.24072265625, -3.798828125, -3.35693359375, -2.9150390625, -2.47314453125, -2.03125, -1.58935546875, -1.1474609375, -0.70556640625, -0.263671875, 0.17822265625, 0.6201171875, 1.06201171875, 1.50390625, 1.94580078125, 2.3876953125, 2.82958984375, 3.271484375, 3.71337890625, 4.1552734375, 4.59716796875, 5.0390625, 5.48095703125, 5.9228515625, 6.36474609375, 6.806640625, 7.24853515625, 7.6904296875, 8.13232421875, 8.57421875, 9.01611328125, 9.4580078125, 9.89990234375, 10.341796875, 10.78369140625, 11.2255859375, 11.66748046875, 12.109375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 89.0, 562.0, 339.0, 27.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.015636444091797, -17.07900619506836, -14.142375946044922, -11.205745697021484, -8.269115447998047, -5.332485198974609, -2.395854949951172, 0.5407752990722656, 3.477405548095703, 6.414035797119141, 9.350666046142578, 12.287296295166016, 15.223926544189453, 18.16055679321289, 21.097187042236328, 24.033817291259766, 26.970447540283203, 29.90707778930664, 32.84370803833008, 35.780338287353516, 38.71696853637695, 41.65359878540039, 44.59022903442383, 47.526859283447266, 50.4634895324707, 53.40011978149414, 56.33675003051758, 59.273380279541016, 62.21001052856445, 65.14663696289062, 68.08326721191406, 71.0198974609375, 73.95652770996094, 76.89315795898438, 79.82978820800781, 82.76641845703125, 85.70304870605469, 88.63967895507812, 91.57630920410156, 94.512939453125, 97.44956970214844, 100.38619995117188, 103.32283020019531, 106.25946044921875, 109.19609069824219, 112.13272094726562, 115.06935119628906, 118.0059814453125, 120.94261169433594, 123.87924194335938, 126.81587219238281, 129.75250244140625, 132.6891326904297, 135.62576293945312, 138.56239318847656, 141.4990234375, 144.43565368652344, 147.37228393554688, 150.3089141845703, 153.24554443359375, 156.1821746826172, 159.11880493164062, 162.05543518066406, 164.9920654296875, 167.92869567871094]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 2.0, 5.0, 7.0, 5.0, 6.0, 10.0, 15.0, 23.0, 13.0, 17.0, 36.0, 26.0, 31.0, 30.0, 31.0, 31.0, 37.0, 40.0, 42.0, 42.0, 44.0, 43.0, 37.0, 47.0, 35.0, 33.0, 34.0, 37.0, 31.0, 34.0, 29.0, 20.0, 26.0, 17.0, 13.0, 8.0, 10.0, 10.0, 8.0, 3.0, 6.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.738584518432617, -24.90179443359375, -24.06500244140625, -23.228212356567383, -22.391422271728516, -21.554630279541016, -20.71784019470215, -19.88105010986328, -19.04425811767578, -18.207468032836914, -17.370676040649414, -16.533885955810547, -15.69709587097168, -14.860304832458496, -14.023513793945312, -13.186723709106445, -12.349933624267578, -11.513142585754395, -10.676352500915527, -9.839561462402344, -9.002771377563477, -8.165980339050293, -7.329189300537109, -6.492398738861084, -5.655608177185059, -4.818817615509033, -3.9820268154144287, -3.145236015319824, -2.308445453643799, -1.4716548919677734, -0.6348638534545898, 0.20192670822143555, 1.038717269897461, 1.8755079507827759, 2.712298631668091, 3.5490894317626953, 4.385879993438721, 5.222670555114746, 6.05946159362793, 6.896252155303955, 7.7330427169799805, 8.569833755493164, 9.406623840332031, 10.243414878845215, 11.080205917358398, 11.916996002197266, 12.75378704071045, 13.590578079223633, 14.4273681640625, 15.264159202575684, 16.100950241088867, 16.937740325927734, 17.7745304107666, 18.61132049560547, 19.44811248779297, 20.284902572631836, 21.121692657470703, 21.95848274230957, 22.79527473449707, 23.632064819335938, 24.468854904174805, 25.305644989013672, 26.142436981201172, 26.97922706604004, 27.81601905822754]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 6.0, 5.0, 19.0, 20.0, 14.0, 16.0, 14.0, 18.0, 26.0, 32.0, 25.0, 30.0, 31.0, 31.0, 35.0, 38.0, 44.0, 37.0, 43.0, 41.0, 45.0, 33.0, 55.0, 36.0, 28.0, 39.0, 32.0, 31.0, 24.0, 23.0, 22.0, 18.0, 19.0, 11.0, 3.0, 12.0, 9.0, 5.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.578125, -2.499237060546875, -2.42034912109375, -2.341461181640625, -2.2625732421875, -2.183685302734375, -2.10479736328125, -2.025909423828125, -1.947021484375, -1.868133544921875, -1.78924560546875, -1.710357666015625, -1.6314697265625, -1.552581787109375, -1.47369384765625, -1.394805908203125, -1.31591796875, -1.237030029296875, -1.15814208984375, -1.079254150390625, -1.0003662109375, -0.921478271484375, -0.84259033203125, -0.763702392578125, -0.684814453125, -0.605926513671875, -0.52703857421875, -0.448150634765625, -0.3692626953125, -0.290374755859375, -0.21148681640625, -0.132598876953125, -0.0537109375, 0.025177001953125, 0.10406494140625, 0.182952880859375, 0.2618408203125, 0.340728759765625, 0.41961669921875, 0.498504638671875, 0.577392578125, 0.656280517578125, 0.73516845703125, 0.814056396484375, 0.8929443359375, 0.971832275390625, 1.05072021484375, 1.129608154296875, 1.20849609375, 1.287384033203125, 1.36627197265625, 1.445159912109375, 1.5240478515625, 1.602935791015625, 1.68182373046875, 1.760711669921875, 1.839599609375, 1.918487548828125, 1.99737548828125, 2.076263427734375, 2.1551513671875, 2.234039306640625, 2.31292724609375, 2.391815185546875, 2.470703125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 6.0, 9.0, 6.0, 7.0, 9.0, 13.0, 14.0, 19.0, 24.0, 29.0, 37.0, 53.0, 52.0, 105.0, 192.0, 403.0, 998.0, 3154.0, 11117.0, 47003.0, 245104.0, 1357564.0, 1968413.0, 453878.0, 80718.0, 17799.0, 4777.0, 1497.0, 588.0, 230.0, 144.0, 78.0, 70.0, 39.0, 25.0, 16.0, 18.0, 19.0, 7.0, 4.0, 11.0, 8.0, 5.0, 8.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.02734375, -5.84564208984375, -5.6639404296875, -5.48223876953125, -5.300537109375, -5.11883544921875, -4.9371337890625, -4.75543212890625, -4.57373046875, -4.39202880859375, -4.2103271484375, -4.02862548828125, -3.846923828125, -3.66522216796875, -3.4835205078125, -3.30181884765625, -3.1201171875, -2.93841552734375, -2.7567138671875, -2.57501220703125, -2.393310546875, -2.21160888671875, -2.0299072265625, -1.84820556640625, -1.66650390625, -1.48480224609375, -1.3031005859375, -1.12139892578125, -0.939697265625, -0.75799560546875, -0.5762939453125, -0.39459228515625, -0.212890625, -0.03118896484375, 0.1505126953125, 0.33221435546875, 0.513916015625, 0.69561767578125, 0.8773193359375, 1.05902099609375, 1.24072265625, 1.42242431640625, 1.6041259765625, 1.78582763671875, 1.967529296875, 2.14923095703125, 2.3309326171875, 2.51263427734375, 2.6943359375, 2.87603759765625, 3.0577392578125, 3.23944091796875, 3.421142578125, 3.60284423828125, 3.7845458984375, 3.96624755859375, 4.14794921875, 4.32965087890625, 4.5113525390625, 4.69305419921875, 4.874755859375, 5.05645751953125, 5.2381591796875, 5.41986083984375, 5.6015625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 4.0, 7.0, 15.0, 9.0, 8.0, 11.0, 19.0, 31.0, 34.0, 50.0, 70.0, 83.0, 90.0, 148.0, 187.0, 241.0, 285.0, 380.0, 377.0, 395.0, 346.0, 300.0, 235.0, 181.0, 123.0, 108.0, 76.0, 69.0, 47.0, 38.0, 22.0, 26.0, 11.0, 14.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.515625, -6.31732177734375, -6.1190185546875, -5.92071533203125, -5.722412109375, -5.52410888671875, -5.3258056640625, -5.12750244140625, -4.92919921875, -4.73089599609375, -4.5325927734375, -4.33428955078125, -4.135986328125, -3.93768310546875, -3.7393798828125, -3.54107666015625, -3.3427734375, -3.14447021484375, -2.9461669921875, -2.74786376953125, -2.549560546875, -2.35125732421875, -2.1529541015625, -1.95465087890625, -1.75634765625, -1.55804443359375, -1.3597412109375, -1.16143798828125, -0.963134765625, -0.76483154296875, -0.5665283203125, -0.36822509765625, -0.169921875, 0.02838134765625, 0.2266845703125, 0.42498779296875, 0.623291015625, 0.82159423828125, 1.0198974609375, 1.21820068359375, 1.41650390625, 1.61480712890625, 1.8131103515625, 2.01141357421875, 2.209716796875, 2.40802001953125, 2.6063232421875, 2.80462646484375, 3.0029296875, 3.20123291015625, 3.3995361328125, 3.59783935546875, 3.796142578125, 3.99444580078125, 4.1927490234375, 4.39105224609375, 4.58935546875, 4.78765869140625, 4.9859619140625, 5.18426513671875, 5.382568359375, 5.58087158203125, 5.7791748046875, 5.97747802734375, 6.17578125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 7.0, 14.0, 10.0, 27.0, 36.0, 54.0, 104.0, 118.0, 203.0, 343.0, 611.0, 1309.0, 3211.0, 9470.0, 37117.0, 183433.0, 967620.0, 2176440.0, 653187.0, 123001.0, 25862.0, 7111.0, 2478.0, 1090.0, 562.0, 293.0, 212.0, 121.0, 66.0, 45.0, 25.0, 17.0, 29.0, 10.0, 9.0, 6.0, 3.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.40625, -8.1201171875, -7.833984375, -7.5478515625, -7.26171875, -6.9755859375, -6.689453125, -6.4033203125, -6.1171875, -5.8310546875, -5.544921875, -5.2587890625, -4.97265625, -4.6865234375, -4.400390625, -4.1142578125, -3.828125, -3.5419921875, -3.255859375, -2.9697265625, -2.68359375, -2.3974609375, -2.111328125, -1.8251953125, -1.5390625, -1.2529296875, -0.966796875, -0.6806640625, -0.39453125, -0.1083984375, 0.177734375, 0.4638671875, 0.75, 1.0361328125, 1.322265625, 1.6083984375, 1.89453125, 2.1806640625, 2.466796875, 2.7529296875, 3.0390625, 3.3251953125, 3.611328125, 3.8974609375, 4.18359375, 4.4697265625, 4.755859375, 5.0419921875, 5.328125, 5.6142578125, 5.900390625, 6.1865234375, 6.47265625, 6.7587890625, 7.044921875, 7.3310546875, 7.6171875, 7.9033203125, 8.189453125, 8.4755859375, 8.76171875, 9.0478515625, 9.333984375, 9.6201171875, 9.90625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 5.0, 32.0, 68.0, 119.0, 181.0, 218.0, 177.0, 123.0, 53.0, 20.0, 14.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.094093322753906, -18.868501663208008, -16.64291000366211, -14.417318344116211, -12.191726684570312, -9.966135025024414, -7.740543365478516, -5.514951705932617, -3.2893600463867188, -1.0637683868408203, 1.1618232727050781, 3.3874149322509766, 5.613006591796875, 7.838598251342773, 10.064189910888672, 12.28978157043457, 14.515373229980469, 16.740964889526367, 18.966556549072266, 21.192148208618164, 23.417739868164062, 25.64333152770996, 27.86892318725586, 30.094514846801758, 32.320106506347656, 34.54570007324219, 36.77128982543945, 38.99687957763672, 41.22247314453125, 43.44806671142578, 45.67365646362305, 47.89924621582031, 50.124847412109375, 52.350440979003906, 54.57603073120117, 56.80162048339844, 59.02721405029297, 61.2528076171875, 63.478397369384766, 65.70398712158203, 67.92958068847656, 70.1551742553711, 72.38076782226562, 74.60635375976562, 76.83194732666016, 79.05754089355469, 81.28312683105469, 83.50872039794922, 85.73431396484375, 87.95990753173828, 90.18550109863281, 92.41108703613281, 94.63668060302734, 96.86227416992188, 99.08786010742188, 101.3134536743164, 103.53904724121094, 105.76464080810547, 107.990234375, 110.2158203125, 112.44141387939453, 114.66700744628906, 116.89259338378906, 119.1181869506836, 121.34378051757812]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 7.0, 4.0, 4.0, 9.0, 4.0, 7.0, 9.0, 9.0, 20.0, 7.0, 9.0, 17.0, 17.0, 18.0, 19.0, 19.0, 19.0, 32.0, 25.0, 22.0, 32.0, 27.0, 33.0, 42.0, 34.0, 38.0, 46.0, 41.0, 36.0, 36.0, 35.0, 30.0, 32.0, 26.0, 31.0, 20.0, 16.0, 18.0, 20.0, 16.0, 18.0, 19.0, 8.0, 11.0, 8.0, 15.0, 5.0, 6.0, 5.0, 3.0, 7.0, 7.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-17.83978271484375, -17.23238754272461, -16.624990463256836, -16.017595291137695, -15.410199165344238, -14.802803039550781, -14.195406913757324, -13.588010787963867, -12.980615615844727, -12.37321949005127, -11.765823364257812, -11.158428192138672, -10.551032066345215, -9.943635940551758, -9.3362398147583, -8.728843688964844, -8.121447563171387, -7.51405143737793, -6.906655788421631, -6.299259662628174, -5.691864013671875, -5.084467887878418, -4.477071762084961, -3.869676113128662, -3.262279987335205, -2.654884099960327, -2.047488212585449, -1.4400920867919922, -0.8326961994171143, -0.22530031204223633, 0.3820958137512207, 0.9894914627075195, 1.5968875885009766, 2.2042834758758545, 2.8116793632507324, 3.4190754890441895, 4.026471138000488, 4.633867263793945, 5.241263389587402, 5.848659038543701, 6.456055164337158, 7.063451290130615, 7.670846939086914, 8.278243064880371, 8.885639190673828, 9.493034362792969, 10.100431442260742, 10.707826614379883, 11.31522274017334, 11.922618865966797, 12.530014991760254, 13.137411117553711, 13.744806289672852, 14.352202415466309, 14.959598541259766, 15.566993713378906, 16.17439079284668, 16.78178596496582, 17.389183044433594, 17.996578216552734, 18.603975296020508, 19.21137046813965, 19.818767547607422, 20.426162719726562, 21.033557891845703]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 5.0, 11.0, 10.0, 11.0, 13.0, 16.0, 19.0, 21.0, 24.0, 20.0, 16.0, 45.0, 24.0, 30.0, 38.0, 33.0, 37.0, 31.0, 52.0, 50.0, 44.0, 43.0, 47.0, 44.0, 37.0, 46.0, 26.0, 24.0, 28.0, 29.0, 15.0, 14.0, 11.0, 16.0, 12.0, 12.0, 14.0, 10.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.76171875, -2.67889404296875, -2.5960693359375, -2.51324462890625, -2.430419921875, -2.34759521484375, -2.2647705078125, -2.18194580078125, -2.09912109375, -2.01629638671875, -1.9334716796875, -1.85064697265625, -1.767822265625, -1.68499755859375, -1.6021728515625, -1.51934814453125, -1.4365234375, -1.35369873046875, -1.2708740234375, -1.18804931640625, -1.105224609375, -1.02239990234375, -0.9395751953125, -0.85675048828125, -0.77392578125, -0.69110107421875, -0.6082763671875, -0.52545166015625, -0.442626953125, -0.35980224609375, -0.2769775390625, -0.19415283203125, -0.111328125, -0.02850341796875, 0.0543212890625, 0.13714599609375, 0.219970703125, 0.30279541015625, 0.3856201171875, 0.46844482421875, 0.55126953125, 0.63409423828125, 0.7169189453125, 0.79974365234375, 0.882568359375, 0.96539306640625, 1.0482177734375, 1.13104248046875, 1.2138671875, 1.29669189453125, 1.3795166015625, 1.46234130859375, 1.545166015625, 1.62799072265625, 1.7108154296875, 1.79364013671875, 1.87646484375, 1.95928955078125, 2.0421142578125, 2.12493896484375, 2.207763671875, 2.29058837890625, 2.3734130859375, 2.45623779296875, 2.5390625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 19.0, 34.0, 37.0, 71.0, 81.0, 138.0, 173.0, 261.0, 430.0, 589.0, 915.0, 1306.0, 1954.0, 3041.0, 4488.0, 6735.0, 10650.0, 16347.0, 24982.0, 38282.0, 59527.0, 90353.0, 131444.0, 170961.0, 156703.0, 112210.0, 75622.0, 49315.0, 31810.0, 20720.0, 13498.0, 8779.0, 5732.0, 3858.0, 2553.0, 1602.0, 1098.0, 714.0, 485.0, 352.0, 222.0, 147.0, 79.0, 70.0, 49.0, 36.0, 14.0, 17.0, 8.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.222412109375, -0.21541404724121094, -0.20841598510742188, -0.2014179229736328, -0.19441986083984375, -0.1874217987060547, -0.18042373657226562, -0.17342567443847656, -0.1664276123046875, -0.15942955017089844, -0.15243148803710938, -0.1454334259033203, -0.13843536376953125, -0.1314373016357422, -0.12443923950195312, -0.11744117736816406, -0.110443115234375, -0.10344505310058594, -0.09644699096679688, -0.08944892883300781, -0.08245086669921875, -0.07545280456542969, -0.06845474243164062, -0.06145668029785156, -0.0544586181640625, -0.04746055603027344, -0.040462493896484375, -0.03346443176269531, -0.02646636962890625, -0.019468307495117188, -0.012470245361328125, -0.0054721832275390625, 0.00152587890625, 0.008523941040039062, 0.015522003173828125, 0.022520065307617188, 0.02951812744140625, 0.03651618957519531, 0.043514251708984375, 0.05051231384277344, 0.0575103759765625, 0.06450843811035156, 0.07150650024414062, 0.07850456237792969, 0.08550262451171875, 0.09250068664550781, 0.09949874877929688, 0.10649681091308594, 0.113494873046875, 0.12049293518066406, 0.12749099731445312, 0.1344890594482422, 0.14148712158203125, 0.1484851837158203, 0.15548324584960938, 0.16248130798339844, 0.1694793701171875, 0.17647743225097656, 0.18347549438476562, 0.1904735565185547, 0.19747161865234375, 0.2044696807861328, 0.21146774291992188, 0.21846580505371094, 0.2254638671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 4.0, 6.0, 8.0, 4.0, 10.0, 11.0, 12.0, 15.0, 19.0, 17.0, 26.0, 31.0, 21.0, 19.0, 40.0, 35.0, 44.0, 42.0, 32.0, 43.0, 35.0, 1073.0, 41.0, 43.0, 33.0, 25.0, 47.0, 32.0, 33.0, 36.0, 27.0, 27.0, 21.0, 15.0, 14.0, 18.0, 8.0, 8.0, 8.0, 7.0, 9.0, 8.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.640625, -1.588775634765625, -1.53692626953125, -1.485076904296875, -1.4332275390625, -1.381378173828125, -1.32952880859375, -1.277679443359375, -1.225830078125, -1.173980712890625, -1.12213134765625, -1.070281982421875, -1.0184326171875, -0.966583251953125, -0.91473388671875, -0.862884521484375, -0.81103515625, -0.759185791015625, -0.70733642578125, -0.655487060546875, -0.6036376953125, -0.551788330078125, -0.49993896484375, -0.448089599609375, -0.396240234375, -0.344390869140625, -0.29254150390625, -0.240692138671875, -0.1888427734375, -0.136993408203125, -0.08514404296875, -0.033294677734375, 0.0185546875, 0.070404052734375, 0.12225341796875, 0.174102783203125, 0.2259521484375, 0.277801513671875, 0.32965087890625, 0.381500244140625, 0.433349609375, 0.485198974609375, 0.53704833984375, 0.588897705078125, 0.6407470703125, 0.692596435546875, 0.74444580078125, 0.796295166015625, 0.84814453125, 0.899993896484375, 0.95184326171875, 1.003692626953125, 1.0555419921875, 1.107391357421875, 1.15924072265625, 1.211090087890625, 1.262939453125, 1.314788818359375, 1.36663818359375, 1.418487548828125, 1.4703369140625, 1.522186279296875, 1.57403564453125, 1.625885009765625, 1.677734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 7.0, 15.0, 17.0, 38.0, 48.0, 77.0, 82.0, 161.0, 260.0, 344.0, 530.0, 880.0, 1328.0, 2085.0, 3224.0, 5209.0, 8292.0, 13242.0, 20746.0, 32162.0, 49002.0, 72762.0, 102600.0, 138708.0, 1171127.0, 147560.0, 105952.0, 75965.0, 51445.0, 33910.0, 21752.0, 13734.0, 8825.0, 5437.0, 3492.0, 2196.0, 1386.0, 848.0, 620.0, 353.0, 244.0, 164.0, 97.0, 81.0, 47.0, 25.0, 20.0, 15.0, 4.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0], "bins": [-0.1328125, -0.1286029815673828, -0.12439346313476562, -0.12018394470214844, -0.11597442626953125, -0.11176490783691406, -0.10755538940429688, -0.10334587097167969, -0.0991363525390625, -0.09492683410644531, -0.09071731567382812, -0.08650779724121094, -0.08229827880859375, -0.07808876037597656, -0.07387924194335938, -0.06966972351074219, -0.065460205078125, -0.06125068664550781, -0.057041168212890625, -0.05283164978027344, -0.04862213134765625, -0.04441261291503906, -0.040203094482421875, -0.03599357604980469, -0.0317840576171875, -0.027574539184570312, -0.023365020751953125, -0.019155502319335938, -0.01494598388671875, -0.010736465454101562, -0.006526947021484375, -0.0023174285888671875, 0.00189208984375, 0.0061016082763671875, 0.010311126708984375, 0.014520645141601562, 0.01873016357421875, 0.022939682006835938, 0.027149200439453125, 0.03135871887207031, 0.0355682373046875, 0.03977775573730469, 0.043987274169921875, 0.04819679260253906, 0.05240631103515625, 0.05661582946777344, 0.060825347900390625, 0.06503486633300781, 0.069244384765625, 0.07345390319824219, 0.07766342163085938, 0.08187294006347656, 0.08608245849609375, 0.09029197692871094, 0.09450149536132812, 0.09871101379394531, 0.1029205322265625, 0.10713005065917969, 0.11133956909179688, 0.11554908752441406, 0.11975860595703125, 0.12396812438964844, 0.12817764282226562, 0.1323871612548828, 0.1365966796875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 8.0, 8.0, 4.0, 9.0, 26.0, 21.0, 13.0, 34.0, 49.0, 36.0, 64.0, 76.0, 79.0, 89.0, 88.0, 83.0, 72.0, 49.0, 36.0, 34.0, 22.0, 20.0, 14.0, 11.0, 6.0, 9.0, 2.0, 6.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00914764404296875, -0.008875608444213867, -0.008603572845458984, -0.008331537246704102, -0.008059501647949219, -0.007787466049194336, -0.007515430450439453, -0.00724339485168457, -0.0069713592529296875, -0.006699323654174805, -0.006427288055419922, -0.006155252456665039, -0.005883216857910156, -0.0056111812591552734, -0.005339145660400391, -0.005067110061645508, -0.004795074462890625, -0.004523038864135742, -0.004251003265380859, -0.0039789676666259766, -0.0037069320678710938, -0.003434896469116211, -0.003162860870361328, -0.0028908252716064453, -0.0026187896728515625, -0.0023467540740966797, -0.002074718475341797, -0.001802682876586914, -0.0015306472778320312, -0.0012586116790771484, -0.0009865760803222656, -0.0007145404815673828, -0.0004425048828125, -0.0001704692840576172, 0.00010156631469726562, 0.00037360191345214844, 0.0006456375122070312, 0.0009176731109619141, 0.0011897087097167969, 0.0014617443084716797, 0.0017337799072265625, 0.0020058155059814453, 0.002277851104736328, 0.002549886703491211, 0.0028219223022460938, 0.0030939579010009766, 0.0033659934997558594, 0.003638029098510742, 0.003910064697265625, 0.004182100296020508, 0.004454135894775391, 0.0047261714935302734, 0.004998207092285156, 0.005270242691040039, 0.005542278289794922, 0.005814313888549805, 0.0060863494873046875, 0.00635838508605957, 0.006630420684814453, 0.006902456283569336, 0.007174491882324219, 0.0074465274810791016, 0.007718563079833984, 0.007990598678588867, 0.00826263427734375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 7.0, 13.0, 10.0, 10.0, 9.0, 13.0, 21.0, 26.0, 29.0, 54.0, 58.0, 75.0, 147.0, 246.0, 762.0, 10159.0, 921639.0, 111874.0, 2407.0, 424.0, 153.0, 102.0, 79.0, 56.0, 32.0, 31.0, 23.0, 17.0, 20.0, 15.0, 3.0, 5.0, 6.0, 3.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.1581401824951172, -0.15282821655273438, -0.14751625061035156, -0.14220428466796875, -0.13689231872558594, -0.13158035278320312, -0.1262683868408203, -0.1209564208984375, -0.11564445495605469, -0.11033248901367188, -0.10502052307128906, -0.09970855712890625, -0.09439659118652344, -0.08908462524414062, -0.08377265930175781, -0.078460693359375, -0.07314872741699219, -0.06783676147460938, -0.06252479553222656, -0.05721282958984375, -0.05190086364746094, -0.046588897705078125, -0.04127693176269531, -0.0359649658203125, -0.030652999877929688, -0.025341033935546875, -0.020029067993164062, -0.01471710205078125, -0.009405136108398438, -0.004093170166015625, 0.0012187957763671875, 0.00653076171875, 0.011842727661132812, 0.017154693603515625, 0.022466659545898438, 0.02777862548828125, 0.03309059143066406, 0.038402557373046875, 0.04371452331542969, 0.0490264892578125, 0.05433845520019531, 0.059650421142578125, 0.06496238708496094, 0.07027435302734375, 0.07558631896972656, 0.08089828491210938, 0.08621025085449219, 0.091522216796875, 0.09683418273925781, 0.10214614868164062, 0.10745811462402344, 0.11277008056640625, 0.11808204650878906, 0.12339401245117188, 0.1287059783935547, 0.1340179443359375, 0.1393299102783203, 0.14464187622070312, 0.14995384216308594, 0.15526580810546875, 0.16057777404785156, 0.16588973999023438, 0.1712017059326172, 0.176513671875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 14.0, 160.0, 642.0, 152.0, 40.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13771268725395203, -0.13492564857006073, -0.13213860988616943, -0.12935155630111694, -0.12656451761722565, -0.12377747893333435, -0.12099044024944305, -0.11820340156555176, -0.11541636288166046, -0.11262932419776917, -0.10984227806329727, -0.10705523937940598, -0.10426820069551468, -0.10148115456104279, -0.09869411587715149, -0.09590707719326019, -0.0931200310587883, -0.090332992374897, -0.08754594624042511, -0.08475890755653381, -0.08197186887264252, -0.07918483018875122, -0.07639778405427933, -0.07361074537038803, -0.07082369923591614, -0.06803666055202484, -0.06524961441755295, -0.06246257573366165, -0.059675537049770355, -0.05688849464058876, -0.054101452231407166, -0.05131441354751587, -0.048527367413043976, -0.04574032500386238, -0.042953286319971085, -0.04016624391078949, -0.03737920522689819, -0.0345921628177166, -0.031805120408535004, -0.029018079861998558, -0.026231039315462112, -0.023443998768925667, -0.02065695822238922, -0.017869915813207626, -0.01508287526667118, -0.012295834720134735, -0.00950879231095314, -0.006721751764416695, -0.003934711217880249, -0.001147670205682516, 0.0016393708065152168, 0.004426412284374237, 0.007213452830910683, 0.010000493377447128, 0.012787535786628723, 0.015574576333165169, 0.018361616879701614, 0.02114865742623806, 0.023935697972774506, 0.0267227403819561, 0.029509780928492546, 0.03229682147502899, 0.03508386388421059, 0.03787090629339218, 0.04065794497728348]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 6.0, 9.0, 13.0, 8.0, 16.0, 22.0, 17.0, 19.0, 21.0, 24.0, 35.0, 30.0, 28.0, 30.0, 30.0, 36.0, 39.0, 35.0, 35.0, 40.0, 46.0, 43.0, 34.0, 40.0, 36.0, 33.0, 32.0, 23.0, 28.0, 31.0, 21.0, 21.0, 22.0, 16.0, 16.0, 8.0, 9.0, 9.0, 6.0, 3.0, 6.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.008411288261413574, -0.008155453018844128, -0.007899617776274681, -0.0076437825337052345, -0.007387947291135788, -0.007132112048566341, -0.006876276805996895, -0.006620441563427448, -0.006364606320858002, -0.006108771078288555, -0.005852935835719109, -0.005597100593149662, -0.0053412653505802155, -0.005085430108010769, -0.004829594865441322, -0.004573759622871876, -0.004317924380302429, -0.004062089137732983, -0.003806253895163536, -0.0035504186525940895, -0.003294583410024643, -0.0030387481674551964, -0.00278291292488575, -0.0025270776823163033, -0.0022712424397468567, -0.00201540719717741, -0.0017595719546079636, -0.001503736712038517, -0.0012479014694690704, -0.0009920662268996239, -0.0007362309843301773, -0.00048039574176073074, -0.00022456049919128418, 3.1274743378162384e-05, 0.00028710998594760895, 0.0005429452285170555, 0.0007987804710865021, 0.0010546157136559486, 0.0013104509562253952, 0.0015662861987948418, 0.0018221214413642883, 0.002077956683933735, 0.0023337919265031815, 0.002589627169072628, 0.0028454624116420746, 0.003101297654211521, 0.0033571328967809677, 0.0036129681393504143, 0.003868803381919861, 0.004124638624489307, 0.004380473867058754, 0.0046363091096282005, 0.004892144352197647, 0.005147979594767094, 0.00540381483733654, 0.005659650079905987, 0.005915485322475433, 0.00617132056504488, 0.0064271558076143265, 0.006682991050183773, 0.00693882629275322, 0.007194661535322666, 0.007450496777892113, 0.007706332020461559, 0.007962167263031006]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 5.0, 11.0, 10.0, 11.0, 13.0, 16.0, 19.0, 21.0, 24.0, 20.0, 16.0, 45.0, 24.0, 30.0, 38.0, 33.0, 37.0, 31.0, 52.0, 50.0, 44.0, 43.0, 47.0, 44.0, 37.0, 46.0, 26.0, 24.0, 28.0, 29.0, 15.0, 14.0, 11.0, 16.0, 12.0, 12.0, 14.0, 10.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.76171875, -2.67889404296875, -2.5960693359375, -2.51324462890625, -2.430419921875, -2.34759521484375, -2.2647705078125, -2.18194580078125, -2.09912109375, -2.01629638671875, -1.9334716796875, -1.85064697265625, -1.767822265625, -1.68499755859375, -1.6021728515625, -1.51934814453125, -1.4365234375, -1.35369873046875, -1.2708740234375, -1.18804931640625, -1.105224609375, -1.02239990234375, -0.9395751953125, -0.85675048828125, -0.77392578125, -0.69110107421875, -0.6082763671875, -0.52545166015625, -0.442626953125, -0.35980224609375, -0.2769775390625, -0.19415283203125, -0.111328125, -0.02850341796875, 0.0543212890625, 0.13714599609375, 0.219970703125, 0.30279541015625, 0.3856201171875, 0.46844482421875, 0.55126953125, 0.63409423828125, 0.7169189453125, 0.79974365234375, 0.882568359375, 0.96539306640625, 1.0482177734375, 1.13104248046875, 1.2138671875, 1.29669189453125, 1.3795166015625, 1.46234130859375, 1.545166015625, 1.62799072265625, 1.7108154296875, 1.79364013671875, 1.87646484375, 1.95928955078125, 2.0421142578125, 2.12493896484375, 2.207763671875, 2.29058837890625, 2.3734130859375, 2.45623779296875, 2.5390625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 8.0, 9.0, 11.0, 31.0, 38.0, 49.0, 75.0, 104.0, 160.0, 224.0, 459.0, 714.0, 1261.0, 2391.0, 4287.0, 8488.0, 19145.0, 48207.0, 140689.0, 405684.0, 269722.0, 87865.0, 31830.0, 13232.0, 6200.0, 3331.0, 1715.0, 1041.0, 592.0, 373.0, 196.0, 126.0, 96.0, 50.0, 35.0, 27.0, 24.0, 14.0, 14.0, 12.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.046875, -3.9195556640625, -3.792236328125, -3.6649169921875, -3.53759765625, -3.4102783203125, -3.282958984375, -3.1556396484375, -3.0283203125, -2.9010009765625, -2.773681640625, -2.6463623046875, -2.51904296875, -2.3917236328125, -2.264404296875, -2.1370849609375, -2.009765625, -1.8824462890625, -1.755126953125, -1.6278076171875, -1.50048828125, -1.3731689453125, -1.245849609375, -1.1185302734375, -0.9912109375, -0.8638916015625, -0.736572265625, -0.6092529296875, -0.48193359375, -0.3546142578125, -0.227294921875, -0.0999755859375, 0.02734375, 0.1546630859375, 0.281982421875, 0.4093017578125, 0.53662109375, 0.6639404296875, 0.791259765625, 0.9185791015625, 1.0458984375, 1.1732177734375, 1.300537109375, 1.4278564453125, 1.55517578125, 1.6824951171875, 1.809814453125, 1.9371337890625, 2.064453125, 2.1917724609375, 2.319091796875, 2.4464111328125, 2.57373046875, 2.7010498046875, 2.828369140625, 2.9556884765625, 3.0830078125, 3.2103271484375, 3.337646484375, 3.4649658203125, 3.59228515625, 3.7196044921875, 3.846923828125, 3.9742431640625, 4.1015625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 11.0, 10.0, 11.0, 11.0, 10.0, 20.0, 19.0, 18.0, 22.0, 27.0, 35.0, 51.0, 61.0, 68.0, 91.0, 152.0, 284.0, 1391.0, 235.0, 113.0, 75.0, 50.0, 41.0, 42.0, 31.0, 33.0, 23.0, 21.0, 17.0, 16.0, 11.0, 11.0, 16.0, 8.0, 4.0, 0.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.625, -10.285400390625, -9.94580078125, -9.606201171875, -9.2666015625, -8.927001953125, -8.58740234375, -8.247802734375, -7.908203125, -7.568603515625, -7.22900390625, -6.889404296875, -6.5498046875, -6.210205078125, -5.87060546875, -5.531005859375, -5.19140625, -4.851806640625, -4.51220703125, -4.172607421875, -3.8330078125, -3.493408203125, -3.15380859375, -2.814208984375, -2.474609375, -2.135009765625, -1.79541015625, -1.455810546875, -1.1162109375, -0.776611328125, -0.43701171875, -0.097412109375, 0.2421875, 0.581787109375, 0.92138671875, 1.260986328125, 1.6005859375, 1.940185546875, 2.27978515625, 2.619384765625, 2.958984375, 3.298583984375, 3.63818359375, 3.977783203125, 4.3173828125, 4.656982421875, 4.99658203125, 5.336181640625, 5.67578125, 6.015380859375, 6.35498046875, 6.694580078125, 7.0341796875, 7.373779296875, 7.71337890625, 8.052978515625, 8.392578125, 8.732177734375, 9.07177734375, 9.411376953125, 9.7509765625, 10.090576171875, 10.43017578125, 10.769775390625, 11.109375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 4.0, 11.0, 13.0, 14.0, 24.0, 23.0, 43.0, 49.0, 77.0, 123.0, 183.0, 356.0, 978.0, 7536.0, 1139258.0, 1985471.0, 9472.0, 1061.0, 397.0, 211.0, 112.0, 84.0, 52.0, 47.0, 29.0, 25.0, 17.0, 7.0, 8.0, 8.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.640625, -28.769775390625, -27.89892578125, -27.028076171875, -26.1572265625, -25.286376953125, -24.41552734375, -23.544677734375, -22.673828125, -21.802978515625, -20.93212890625, -20.061279296875, -19.1904296875, -18.319580078125, -17.44873046875, -16.577880859375, -15.70703125, -14.836181640625, -13.96533203125, -13.094482421875, -12.2236328125, -11.352783203125, -10.48193359375, -9.611083984375, -8.740234375, -7.869384765625, -6.99853515625, -6.127685546875, -5.2568359375, -4.385986328125, -3.51513671875, -2.644287109375, -1.7734375, -0.902587890625, -0.03173828125, 0.839111328125, 1.7099609375, 2.580810546875, 3.45166015625, 4.322509765625, 5.193359375, 6.064208984375, 6.93505859375, 7.805908203125, 8.6767578125, 9.547607421875, 10.41845703125, 11.289306640625, 12.16015625, 13.031005859375, 13.90185546875, 14.772705078125, 15.6435546875, 16.514404296875, 17.38525390625, 18.256103515625, 19.126953125, 19.997802734375, 20.86865234375, 21.739501953125, 22.6103515625, 23.481201171875, 24.35205078125, 25.222900390625, 26.09375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 20.0, 62.0, 105.0, 190.0, 232.0, 173.0, 119.0, 62.0, 29.0, 9.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.874847412109375, -47.75250244140625, -46.63016128540039, -45.507816314697266, -44.385475158691406, -43.26313018798828, -42.14078903198242, -41.0184440612793, -39.89610290527344, -38.77375793457031, -37.65141677856445, -36.52907180786133, -35.40673065185547, -34.284385681152344, -33.162044525146484, -32.03969955444336, -30.917354583740234, -29.795011520385742, -28.67266845703125, -27.550325393676758, -26.427982330322266, -25.30563735961914, -24.18329429626465, -23.060951232910156, -21.938608169555664, -20.816265106201172, -19.69392204284668, -18.571578979492188, -17.449234008789062, -16.326892852783203, -15.204547882080078, -14.082204818725586, -12.95986557006836, -11.837522506713867, -10.715179443359375, -9.592835426330566, -8.470492362976074, -7.348149299621582, -6.225805759429932, -5.103462219238281, -3.981119155883789, -2.8587758541107178, -1.7364325523376465, -0.6140892505645752, 0.5082540512084961, 1.6305971145629883, 2.7529406547546387, 3.875284194946289, 4.997627258300781, 6.119970321655273, 7.242313861846924, 8.364657402038574, 9.487000465393066, 10.609343528747559, 11.731687545776367, 12.85403060913086, 13.976373672485352, 15.098716735839844, 16.221059799194336, 17.343402862548828, 18.465747833251953, 19.588088989257812, 20.710433959960938, 21.83277702331543, 22.955120086669922]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 8.0, 6.0, 7.0, 2.0, 5.0, 18.0, 10.0, 18.0, 12.0, 16.0, 20.0, 23.0, 20.0, 22.0, 29.0, 25.0, 27.0, 25.0, 37.0, 29.0, 43.0, 37.0, 42.0, 40.0, 23.0, 32.0, 29.0, 28.0, 32.0, 40.0, 36.0, 42.0, 29.0, 24.0, 24.0, 18.0, 22.0, 12.0, 18.0, 14.0, 7.0, 6.0, 9.0, 5.0, 6.0, 10.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.633089065551758, -23.84441375732422, -23.055740356445312, -22.267065048217773, -21.478389739990234, -20.689716339111328, -19.90104103088379, -19.11236572265625, -18.323692321777344, -17.535017013549805, -16.7463436126709, -15.95766830444336, -15.168993949890137, -14.380319595336914, -13.591644287109375, -12.802969932556152, -12.01429557800293, -11.225621223449707, -10.436946868896484, -9.648271560668945, -8.859597206115723, -8.0709228515625, -7.282248020172119, -6.493573188781738, -5.704898834228516, -4.916224479675293, -4.127549648284912, -3.3388750553131104, -2.5502004623413086, -1.7615258693695068, -0.9728512763977051, -0.18417644500732422, 0.6044998168945312, 1.393174409866333, 2.1818490028381348, 2.9705235958099365, 3.7591981887817383, 4.547872543334961, 5.336547374725342, 6.125222206115723, 6.913896560668945, 7.702570915222168, 8.49124526977539, 9.27992057800293, 10.068594932556152, 10.857269287109375, 11.645944595336914, 12.434618949890137, 13.22329330444336, 14.011967658996582, 14.800642013549805, 15.589317321777344, 16.37799072265625, 17.16666603088379, 17.955341339111328, 18.744014739990234, 19.532690048217773, 20.321365356445312, 21.11003875732422, 21.898714065551758, 22.687389373779297, 23.476062774658203, 24.264738082885742, 25.05341339111328, 25.842086791992188]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 9.0, 11.0, 12.0, 5.0, 11.0, 15.0, 15.0, 16.0, 20.0, 28.0, 24.0, 21.0, 44.0, 27.0, 31.0, 31.0, 45.0, 34.0, 37.0, 51.0, 43.0, 44.0, 44.0, 43.0, 26.0, 41.0, 34.0, 33.0, 28.0, 26.0, 30.0, 21.0, 8.0, 15.0, 9.0, 18.0, 9.0, 13.0, 5.0, 7.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.939453125, -2.852752685546875, -2.76605224609375, -2.679351806640625, -2.5926513671875, -2.505950927734375, -2.41925048828125, -2.332550048828125, -2.245849609375, -2.159149169921875, -2.07244873046875, -1.985748291015625, -1.8990478515625, -1.812347412109375, -1.72564697265625, -1.638946533203125, -1.55224609375, -1.465545654296875, -1.37884521484375, -1.292144775390625, -1.2054443359375, -1.118743896484375, -1.03204345703125, -0.945343017578125, -0.858642578125, -0.771942138671875, -0.68524169921875, -0.598541259765625, -0.5118408203125, -0.425140380859375, -0.33843994140625, -0.251739501953125, -0.1650390625, -0.078338623046875, 0.00836181640625, 0.095062255859375, 0.1817626953125, 0.268463134765625, 0.35516357421875, 0.441864013671875, 0.528564453125, 0.615264892578125, 0.70196533203125, 0.788665771484375, 0.8753662109375, 0.962066650390625, 1.04876708984375, 1.135467529296875, 1.22216796875, 1.308868408203125, 1.39556884765625, 1.482269287109375, 1.5689697265625, 1.655670166015625, 1.74237060546875, 1.829071044921875, 1.915771484375, 2.002471923828125, 2.08917236328125, 2.175872802734375, 2.2625732421875, 2.349273681640625, 2.43597412109375, 2.522674560546875, 2.609375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 9.0, 17.0, 18.0, 20.0, 30.0, 29.0, 46.0, 74.0, 97.0, 153.0, 261.0, 487.0, 745.0, 1460.0, 2856.0, 6003.0, 12776.0, 30041.0, 72836.0, 186324.0, 480845.0, 1034169.0, 1222286.0, 681906.0, 277017.0, 106658.0, 42627.0, 17995.0, 8032.0, 3839.0, 1979.0, 1040.0, 603.0, 339.0, 225.0, 127.0, 94.0, 60.0, 41.0, 30.0, 19.0, 17.0, 18.0, 5.0, 5.0, 10.0, 2.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.074005126953125, -2.97222900390625, -2.870452880859375, -2.7686767578125, -2.666900634765625, -2.56512451171875, -2.463348388671875, -2.361572265625, -2.259796142578125, -2.15802001953125, -2.056243896484375, -1.9544677734375, -1.852691650390625, -1.75091552734375, -1.649139404296875, -1.54736328125, -1.445587158203125, -1.34381103515625, -1.242034912109375, -1.1402587890625, -1.038482666015625, -0.93670654296875, -0.834930419921875, -0.733154296875, -0.631378173828125, -0.52960205078125, -0.427825927734375, -0.3260498046875, -0.224273681640625, -0.12249755859375, -0.020721435546875, 0.0810546875, 0.182830810546875, 0.28460693359375, 0.386383056640625, 0.4881591796875, 0.589935302734375, 0.69171142578125, 0.793487548828125, 0.895263671875, 0.997039794921875, 1.09881591796875, 1.200592041015625, 1.3023681640625, 1.404144287109375, 1.50592041015625, 1.607696533203125, 1.70947265625, 1.811248779296875, 1.91302490234375, 2.014801025390625, 2.1165771484375, 2.218353271484375, 2.32012939453125, 2.421905517578125, 2.523681640625, 2.625457763671875, 2.72723388671875, 2.829010009765625, 2.9307861328125, 3.032562255859375, 3.13433837890625, 3.236114501953125, 3.337890625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 13.0, 11.0, 16.0, 35.0, 39.0, 56.0, 69.0, 91.0, 132.0, 181.0, 236.0, 298.0, 393.0, 436.0, 447.0, 372.0, 310.0, 215.0, 189.0, 137.0, 120.0, 73.0, 57.0, 41.0, 28.0, 18.0, 14.0, 12.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.92578125, -5.69842529296875, -5.4710693359375, -5.24371337890625, -5.016357421875, -4.78900146484375, -4.5616455078125, -4.33428955078125, -4.10693359375, -3.87957763671875, -3.6522216796875, -3.42486572265625, -3.197509765625, -2.97015380859375, -2.7427978515625, -2.51544189453125, -2.2880859375, -2.06072998046875, -1.8333740234375, -1.60601806640625, -1.378662109375, -1.15130615234375, -0.9239501953125, -0.69659423828125, -0.46923828125, -0.24188232421875, -0.0145263671875, 0.21282958984375, 0.440185546875, 0.66754150390625, 0.8948974609375, 1.12225341796875, 1.349609375, 1.57696533203125, 1.8043212890625, 2.03167724609375, 2.259033203125, 2.48638916015625, 2.7137451171875, 2.94110107421875, 3.16845703125, 3.39581298828125, 3.6231689453125, 3.85052490234375, 4.077880859375, 4.30523681640625, 4.5325927734375, 4.75994873046875, 4.9873046875, 5.21466064453125, 5.4420166015625, 5.66937255859375, 5.896728515625, 6.12408447265625, 6.3514404296875, 6.57879638671875, 6.80615234375, 7.03350830078125, 7.2608642578125, 7.48822021484375, 7.715576171875, 7.94293212890625, 8.1702880859375, 8.39764404296875, 8.625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 12.0, 12.0, 19.0, 32.0, 39.0, 58.0, 132.0, 219.0, 440.0, 897.0, 2352.0, 7944.0, 36588.0, 197951.0, 1084186.0, 2145648.0, 585874.0, 104005.0, 19941.0, 4949.0, 1529.0, 638.0, 330.0, 192.0, 109.0, 58.0, 42.0, 22.0, 23.0, 12.0, 7.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.8203125, -10.5223388671875, -10.224365234375, -9.9263916015625, -9.62841796875, -9.3304443359375, -9.032470703125, -8.7344970703125, -8.4365234375, -8.1385498046875, -7.840576171875, -7.5426025390625, -7.24462890625, -6.9466552734375, -6.648681640625, -6.3507080078125, -6.052734375, -5.7547607421875, -5.456787109375, -5.1588134765625, -4.86083984375, -4.5628662109375, -4.264892578125, -3.9669189453125, -3.6689453125, -3.3709716796875, -3.072998046875, -2.7750244140625, -2.47705078125, -2.1790771484375, -1.881103515625, -1.5831298828125, -1.28515625, -0.9871826171875, -0.689208984375, -0.3912353515625, -0.09326171875, 0.2047119140625, 0.502685546875, 0.8006591796875, 1.0986328125, 1.3966064453125, 1.694580078125, 1.9925537109375, 2.29052734375, 2.5885009765625, 2.886474609375, 3.1844482421875, 3.482421875, 3.7803955078125, 4.078369140625, 4.3763427734375, 4.67431640625, 4.9722900390625, 5.270263671875, 5.5682373046875, 5.8662109375, 6.1641845703125, 6.462158203125, 6.7601318359375, 7.05810546875, 7.3560791015625, 7.654052734375, 7.9520263671875, 8.25]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 11.0, 32.0, 55.0, 78.0, 118.0, 135.0, 153.0, 163.0, 121.0, 66.0, 43.0, 23.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.18747901916504, -24.4775390625, -22.76759910583496, -21.057659149169922, -19.347719192504883, -17.637779235839844, -15.927839279174805, -14.217899322509766, -12.507959365844727, -10.798019409179688, -9.088079452514648, -7.378139495849609, -5.66819953918457, -3.9582595825195312, -2.248319625854492, -0.5383796691894531, 1.171560287475586, 2.881500244140625, 4.591440200805664, 6.301380157470703, 8.011320114135742, 9.721260070800781, 11.43120002746582, 13.14113998413086, 14.851079940795898, 16.561019897460938, 18.270959854125977, 19.980899810791016, 21.690839767456055, 23.400779724121094, 25.110719680786133, 26.820659637451172, 28.530601501464844, 30.240541458129883, 31.950481414794922, 33.660423278808594, 35.370361328125, 37.080299377441406, 38.79024124145508, 40.50018310546875, 42.210121154785156, 43.92005920410156, 45.630001068115234, 47.339942932128906, 49.04988098144531, 50.75981903076172, 52.46976089477539, 54.17970275878906, 55.88964080810547, 57.599578857421875, 59.30952072143555, 61.01946258544922, 62.729400634765625, 64.43933868408203, 66.14927673339844, 67.85922241210938, 69.56916046142578, 71.27909851074219, 72.98904418945312, 74.69898223876953, 76.40892028808594, 78.11885833740234, 79.82879638671875, 81.53874206542969, 83.2486801147461]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 9.0, 5.0, 6.0, 6.0, 12.0, 7.0, 12.0, 16.0, 12.0, 24.0, 18.0, 32.0, 33.0, 32.0, 28.0, 28.0, 27.0, 42.0, 44.0, 39.0, 30.0, 37.0, 43.0, 39.0, 40.0, 31.0, 39.0, 48.0, 33.0, 35.0, 20.0, 29.0, 19.0, 16.0, 20.0, 15.0, 22.0, 11.0, 8.0, 6.0, 12.0, 4.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-24.491764068603516, -23.77920150756836, -23.06663703918457, -22.354074478149414, -21.641511917114258, -20.9289493560791, -20.216384887695312, -19.503822326660156, -18.791259765625, -18.078697204589844, -17.366132736206055, -16.6535701751709, -15.941007614135742, -15.22844409942627, -14.515880584716797, -13.80331802368164, -13.090754508972168, -12.378190994262695, -11.665628433227539, -10.953064918518066, -10.24050235748291, -9.527938842773438, -8.815376281738281, -8.102812767028809, -7.390249729156494, -6.67768669128418, -5.965123653411865, -5.252560615539551, -4.539997100830078, -3.8274343013763428, -3.114871025085449, -2.4023079872131348, -1.6897449493408203, -0.9771818518638611, -0.26461875438690186, 0.44794440269470215, 1.1605074405670166, 1.873070478439331, 2.5856337547302246, 3.298196792602539, 4.0107598304748535, 4.723322868347168, 5.435885906219482, 6.148448944091797, 6.8610124588012695, 7.573575019836426, 8.286138534545898, 8.998701095581055, 9.711264610290527, 10.423828125, 11.136390686035156, 11.848954200744629, 12.561516761779785, 13.274080276489258, 13.986642837524414, 14.699206352233887, 15.41176986694336, 16.124332427978516, 16.836896896362305, 17.54945945739746, 18.262022018432617, 18.974584579467773, 19.687149047851562, 20.39971160888672, 21.112274169921875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 12.0, 12.0, 9.0, 10.0, 17.0, 18.0, 19.0, 19.0, 24.0, 22.0, 41.0, 25.0, 41.0, 37.0, 42.0, 52.0, 30.0, 52.0, 43.0, 46.0, 43.0, 45.0, 44.0, 39.0, 37.0, 31.0, 25.0, 20.0, 12.0, 19.0, 26.0, 16.0, 20.0, 12.0, 7.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.142578125, -3.04754638671875, -2.9525146484375, -2.85748291015625, -2.762451171875, -2.66741943359375, -2.5723876953125, -2.47735595703125, -2.38232421875, -2.28729248046875, -2.1922607421875, -2.09722900390625, -2.002197265625, -1.90716552734375, -1.8121337890625, -1.71710205078125, -1.6220703125, -1.52703857421875, -1.4320068359375, -1.33697509765625, -1.241943359375, -1.14691162109375, -1.0518798828125, -0.95684814453125, -0.86181640625, -0.76678466796875, -0.6717529296875, -0.57672119140625, -0.481689453125, -0.38665771484375, -0.2916259765625, -0.19659423828125, -0.1015625, -0.00653076171875, 0.0885009765625, 0.18353271484375, 0.278564453125, 0.37359619140625, 0.4686279296875, 0.56365966796875, 0.65869140625, 0.75372314453125, 0.8487548828125, 0.94378662109375, 1.038818359375, 1.13385009765625, 1.2288818359375, 1.32391357421875, 1.4189453125, 1.51397705078125, 1.6090087890625, 1.70404052734375, 1.799072265625, 1.89410400390625, 1.9891357421875, 2.08416748046875, 2.17919921875, 2.27423095703125, 2.3692626953125, 2.46429443359375, 2.559326171875, 2.65435791015625, 2.7493896484375, 2.84442138671875, 2.939453125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 9.0, 25.0, 28.0, 41.0, 53.0, 95.0, 118.0, 182.0, 298.0, 455.0, 695.0, 1027.0, 1477.0, 2335.0, 3669.0, 5671.0, 8913.0, 13946.0, 21861.0, 35462.0, 57322.0, 91814.0, 142676.0, 190265.0, 167866.0, 112792.0, 70951.0, 43667.0, 27396.0, 17117.0, 10762.0, 6853.0, 4486.0, 2833.0, 1829.0, 1149.0, 826.0, 483.0, 344.0, 264.0, 171.0, 113.0, 76.0, 52.0, 40.0, 22.0, 13.0, 3.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29345703125, -0.2842063903808594, -0.27495574951171875, -0.2657051086425781, -0.2564544677734375, -0.24720382690429688, -0.23795318603515625, -0.22870254516601562, -0.219451904296875, -0.21020126342773438, -0.20095062255859375, -0.19169998168945312, -0.1824493408203125, -0.17319869995117188, -0.16394805908203125, -0.15469741821289062, -0.14544677734375, -0.13619613647460938, -0.12694549560546875, -0.11769485473632812, -0.1084442138671875, -0.09919357299804688, -0.08994293212890625, -0.08069229125976562, -0.071441650390625, -0.062191009521484375, -0.05294036865234375, -0.043689727783203125, -0.0344390869140625, -0.025188446044921875, -0.01593780517578125, -0.006687164306640625, 0.0025634765625, 0.011814117431640625, 0.02106475830078125, 0.030315399169921875, 0.0395660400390625, 0.048816680908203125, 0.05806732177734375, 0.06731796264648438, 0.076568603515625, 0.08581924438476562, 0.09506988525390625, 0.10432052612304688, 0.1135711669921875, 0.12282180786132812, 0.13207244873046875, 0.14132308959960938, 0.15057373046875, 0.15982437133789062, 0.16907501220703125, 0.17832565307617188, 0.1875762939453125, 0.19682693481445312, 0.20607757568359375, 0.21532821655273438, 0.224578857421875, 0.23382949829101562, 0.24308013916015625, 0.2523307800292969, 0.2615814208984375, 0.2708320617675781, 0.28008270263671875, 0.2893333435058594, 0.298583984375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 10.0, 7.0, 8.0, 8.0, 10.0, 14.0, 19.0, 24.0, 23.0, 21.0, 25.0, 36.0, 37.0, 38.0, 34.0, 55.0, 46.0, 48.0, 1057.0, 47.0, 56.0, 35.0, 37.0, 39.0, 31.0, 36.0, 37.0, 25.0, 29.0, 19.0, 23.0, 15.0, 12.0, 13.0, 14.0, 12.0, 5.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0], "bins": [-2.341796875, -2.278778076171875, -2.21575927734375, -2.152740478515625, -2.0897216796875, -2.026702880859375, -1.96368408203125, -1.900665283203125, -1.837646484375, -1.774627685546875, -1.71160888671875, -1.648590087890625, -1.5855712890625, -1.522552490234375, -1.45953369140625, -1.396514892578125, -1.33349609375, -1.270477294921875, -1.20745849609375, -1.144439697265625, -1.0814208984375, -1.018402099609375, -0.95538330078125, -0.892364501953125, -0.829345703125, -0.766326904296875, -0.70330810546875, -0.640289306640625, -0.5772705078125, -0.514251708984375, -0.45123291015625, -0.388214111328125, -0.3251953125, -0.262176513671875, -0.19915771484375, -0.136138916015625, -0.0731201171875, -0.010101318359375, 0.05291748046875, 0.115936279296875, 0.178955078125, 0.241973876953125, 0.30499267578125, 0.368011474609375, 0.4310302734375, 0.494049072265625, 0.55706787109375, 0.620086669921875, 0.68310546875, 0.746124267578125, 0.80914306640625, 0.872161865234375, 0.9351806640625, 0.998199462890625, 1.06121826171875, 1.124237060546875, 1.187255859375, 1.250274658203125, 1.31329345703125, 1.376312255859375, 1.4393310546875, 1.502349853515625, 1.56536865234375, 1.628387451171875, 1.69140625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 10.0, 11.0, 15.0, 20.0, 47.0, 61.0, 61.0, 86.0, 155.0, 167.0, 306.0, 474.0, 699.0, 1163.0, 1865.0, 2961.0, 4606.0, 7471.0, 12099.0, 19806.0, 31854.0, 49365.0, 75284.0, 108892.0, 166523.0, 1171016.0, 147207.0, 102344.0, 70202.0, 45524.0, 28907.0, 18049.0, 11200.0, 6888.0, 4259.0, 2619.0, 1643.0, 1100.0, 743.0, 448.0, 324.0, 241.0, 136.0, 78.0, 72.0, 51.0, 27.0, 15.0, 18.0, 4.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.1578369140625, -0.15281295776367188, -0.14778900146484375, -0.14276504516601562, -0.1377410888671875, -0.13271713256835938, -0.12769317626953125, -0.12266921997070312, -0.117645263671875, -0.11262130737304688, -0.10759735107421875, -0.10257339477539062, -0.0975494384765625, -0.09252548217773438, -0.08750152587890625, -0.08247756958007812, -0.07745361328125, -0.07242965698242188, -0.06740570068359375, -0.062381744384765625, -0.0573577880859375, -0.052333831787109375, -0.04730987548828125, -0.042285919189453125, -0.037261962890625, -0.032238006591796875, -0.02721405029296875, -0.022190093994140625, -0.0171661376953125, -0.012142181396484375, -0.00711822509765625, -0.002094268798828125, 0.0029296875, 0.007953643798828125, 0.01297760009765625, 0.018001556396484375, 0.0230255126953125, 0.028049468994140625, 0.03307342529296875, 0.038097381591796875, 0.043121337890625, 0.048145294189453125, 0.05316925048828125, 0.058193206787109375, 0.0632171630859375, 0.06824111938476562, 0.07326507568359375, 0.07828903198242188, 0.08331298828125, 0.08833694458007812, 0.09336090087890625, 0.09838485717773438, 0.1034088134765625, 0.10843276977539062, 0.11345672607421875, 0.11848068237304688, 0.123504638671875, 0.12852859497070312, 0.13355255126953125, 0.13857650756835938, 0.1436004638671875, 0.14862442016601562, 0.15364837646484375, 0.15867233276367188, 0.1636962890625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 6.0, 9.0, 7.0, 14.0, 2.0, 11.0, 10.0, 14.0, 19.0, 18.0, 30.0, 39.0, 27.0, 56.0, 87.0, 123.0, 122.0, 94.0, 62.0, 36.0, 33.0, 28.0, 20.0, 13.0, 18.0, 13.0, 10.0, 11.0, 6.0, 9.0, 5.0, 10.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0130462646484375, -0.012595653533935547, -0.012145042419433594, -0.01169443130493164, -0.011243820190429688, -0.010793209075927734, -0.010342597961425781, -0.009891986846923828, -0.009441375732421875, -0.008990764617919922, -0.008540153503417969, -0.008089542388916016, -0.0076389312744140625, -0.007188320159912109, -0.006737709045410156, -0.006287097930908203, -0.00583648681640625, -0.005385875701904297, -0.004935264587402344, -0.004484653472900391, -0.0040340423583984375, -0.0035834312438964844, -0.0031328201293945312, -0.002682209014892578, -0.002231597900390625, -0.0017809867858886719, -0.0013303756713867188, -0.0008797645568847656, -0.0004291534423828125, 2.1457672119140625e-05, 0.00047206878662109375, 0.0009226799011230469, 0.001373291015625, 0.0018239021301269531, 0.0022745132446289062, 0.0027251243591308594, 0.0031757354736328125, 0.0036263465881347656, 0.004076957702636719, 0.004527568817138672, 0.004978179931640625, 0.005428791046142578, 0.005879402160644531, 0.006330013275146484, 0.0067806243896484375, 0.007231235504150391, 0.007681846618652344, 0.008132457733154297, 0.00858306884765625, 0.009033679962158203, 0.009484291076660156, 0.00993490219116211, 0.010385513305664062, 0.010836124420166016, 0.011286735534667969, 0.011737346649169922, 0.012187957763671875, 0.012638568878173828, 0.013089179992675781, 0.013539791107177734, 0.013990402221679688, 0.01444101333618164, 0.014891624450683594, 0.015342235565185547, 0.0157928466796875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 10.0, 13.0, 6.0, 7.0, 8.0, 8.0, 11.0, 14.0, 22.0, 26.0, 41.0, 64.0, 93.0, 148.0, 257.0, 783.0, 26223.0, 1002965.0, 16487.0, 680.0, 245.0, 109.0, 90.0, 69.0, 45.0, 19.0, 18.0, 20.0, 6.0, 7.0, 8.0, 13.0, 6.0, 6.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.351806640625, -0.34215545654296875, -0.3325042724609375, -0.32285308837890625, -0.313201904296875, -0.30355072021484375, -0.2938995361328125, -0.28424835205078125, -0.27459716796875, -0.26494598388671875, -0.2552947998046875, -0.24564361572265625, -0.235992431640625, -0.22634124755859375, -0.2166900634765625, -0.20703887939453125, -0.1973876953125, -0.18773651123046875, -0.1780853271484375, -0.16843414306640625, -0.158782958984375, -0.14913177490234375, -0.1394805908203125, -0.12982940673828125, -0.12017822265625, -0.11052703857421875, -0.1008758544921875, -0.09122467041015625, -0.081573486328125, -0.07192230224609375, -0.0622711181640625, -0.05261993408203125, -0.04296875, -0.03331756591796875, -0.0236663818359375, -0.01401519775390625, -0.004364013671875, 0.00528717041015625, 0.0149383544921875, 0.02458953857421875, 0.03424072265625, 0.04389190673828125, 0.0535430908203125, 0.06319427490234375, 0.072845458984375, 0.08249664306640625, 0.0921478271484375, 0.10179901123046875, 0.1114501953125, 0.12110137939453125, 0.1307525634765625, 0.14040374755859375, 0.150054931640625, 0.15970611572265625, 0.1693572998046875, 0.17900848388671875, 0.18865966796875, 0.19831085205078125, 0.2079620361328125, 0.21761322021484375, 0.227264404296875, 0.23691558837890625, 0.2465667724609375, 0.25621795654296875, 0.265869140625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 17.0, 426.0, 535.0, 34.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.4404247999191284, -0.4326992332935333, -0.42497366666793823, -0.41724810004234314, -0.40952253341674805, -0.40179696679115295, -0.39407140016555786, -0.38634583353996277, -0.3786202669143677, -0.3708947002887726, -0.3631691336631775, -0.3554435670375824, -0.3477180004119873, -0.3399924337863922, -0.3322668671607971, -0.324541300535202, -0.31681573390960693, -0.30909016728401184, -0.30136460065841675, -0.29363903403282166, -0.28591346740722656, -0.27818790078163147, -0.2704623341560364, -0.2627367675304413, -0.2550112009048462, -0.2472856342792511, -0.239560067653656, -0.2318345010280609, -0.22410893440246582, -0.21638336777687073, -0.20865780115127563, -0.20093223452568054, -0.19320665299892426, -0.18548108637332916, -0.17775551974773407, -0.17002995312213898, -0.16230438649654388, -0.1545788198709488, -0.1468532532453537, -0.1391276866197586, -0.1314021199941635, -0.12367655336856842, -0.11595098674297333, -0.10822542011737823, -0.10049985349178314, -0.09277428686618805, -0.08504872024059296, -0.07732315361499786, -0.06959757953882217, -0.06187201291322708, -0.05414644628763199, -0.046420879662036896, -0.0386953130364418, -0.030969742685556412, -0.02324417605996132, -0.015518609434366226, -0.007793042808771133, -6.747571751475334e-05, 0.007658091373741627, 0.015383658930659294, 0.023109225556254387, 0.03083479404449463, 0.03856036067008972, 0.046285927295684814, 0.05401149392127991]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 2.0, 7.0, 5.0, 5.0, 4.0, 10.0, 8.0, 12.0, 23.0, 20.0, 18.0, 23.0, 21.0, 20.0, 24.0, 33.0, 37.0, 36.0, 33.0, 35.0, 41.0, 41.0, 46.0, 48.0, 46.0, 30.0, 40.0, 33.0, 31.0, 36.0, 29.0, 21.0, 26.0, 27.0, 23.0, 15.0, 18.0, 10.0, 15.0, 15.0, 8.0, 3.0, 6.0, 4.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01959174871444702, -0.018993398174643517, -0.01839504763484001, -0.017796697095036507, -0.017198346555233, -0.016599996015429497, -0.016001645475625992, -0.015403294935822487, -0.014804944396018982, -0.014206593856215477, -0.013608243316411972, -0.013009892776608467, -0.012411542236804962, -0.011813191697001457, -0.011214841157197952, -0.010616490617394447, -0.010018140077590942, -0.009419789537787437, -0.008821438997983932, -0.008223088458180428, -0.007624737918376923, -0.007026387378573418, -0.006428036838769913, -0.005829686298966408, -0.005231335759162903, -0.004632985219359398, -0.004034634679555893, -0.003436284139752388, -0.002837933599948883, -0.002239583060145378, -0.0016412325203418732, -0.0010428819805383682, -0.0004445314407348633, 0.00015381909906864166, 0.0007521696388721466, 0.0013505201786756516, 0.0019488707184791565, 0.0025472212582826614, 0.0031455717980861664, 0.0037439223378896713, 0.004342272877693176, 0.004940623417496681, 0.005538973957300186, 0.006137324497103691, 0.006735675036907196, 0.007334025576710701, 0.007932376116514206, 0.008530726656317711, 0.009129077196121216, 0.00972742773592472, 0.010325778275728226, 0.01092412881553173, 0.011522479355335236, 0.01212082989513874, 0.012719180434942245, 0.01331753097474575, 0.013915881514549255, 0.01451423205435276, 0.015112582594156265, 0.01571093313395977, 0.016309283673763275, 0.01690763421356678, 0.017505984753370285, 0.01810433529317379, 0.018702685832977295]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 12.0, 12.0, 9.0, 10.0, 17.0, 18.0, 19.0, 19.0, 24.0, 22.0, 41.0, 25.0, 40.0, 38.0, 42.0, 52.0, 30.0, 52.0, 43.0, 46.0, 43.0, 45.0, 44.0, 39.0, 37.0, 31.0, 26.0, 19.0, 12.0, 19.0, 26.0, 16.0, 20.0, 12.0, 7.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.142578125, -3.04754638671875, -2.9525146484375, -2.85748291015625, -2.762451171875, -2.66741943359375, -2.5723876953125, -2.47735595703125, -2.38232421875, -2.28729248046875, -2.1922607421875, -2.09722900390625, -2.002197265625, -1.90716552734375, -1.8121337890625, -1.71710205078125, -1.6220703125, -1.52703857421875, -1.4320068359375, -1.33697509765625, -1.241943359375, -1.14691162109375, -1.0518798828125, -0.95684814453125, -0.86181640625, -0.76678466796875, -0.6717529296875, -0.57672119140625, -0.481689453125, -0.38665771484375, -0.2916259765625, -0.19659423828125, -0.1015625, -0.00653076171875, 0.0885009765625, 0.18353271484375, 0.278564453125, 0.37359619140625, 0.4686279296875, 0.56365966796875, 0.65869140625, 0.75372314453125, 0.8487548828125, 0.94378662109375, 1.038818359375, 1.13385009765625, 1.2288818359375, 1.32391357421875, 1.4189453125, 1.51397705078125, 1.6090087890625, 1.70404052734375, 1.799072265625, 1.89410400390625, 1.9891357421875, 2.08416748046875, 2.17919921875, 2.27423095703125, 2.3692626953125, 2.46429443359375, 2.559326171875, 2.65435791015625, 2.7493896484375, 2.84442138671875, 2.939453125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 7.0, 7.0, 7.0, 16.0, 18.0, 21.0, 44.0, 54.0, 71.0, 123.0, 158.0, 241.0, 372.0, 570.0, 831.0, 1329.0, 2152.0, 3603.0, 5785.0, 9907.0, 18679.0, 41085.0, 103932.0, 268324.0, 337706.0, 143822.0, 55215.0, 24046.0, 12325.0, 7010.0, 4109.0, 2412.0, 1629.0, 1009.0, 663.0, 400.0, 281.0, 170.0, 119.0, 99.0, 61.0, 42.0, 36.0, 16.0, 22.0, 9.0, 4.0, 3.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.291015625, -3.1854248046875, -3.079833984375, -2.9742431640625, -2.86865234375, -2.7630615234375, -2.657470703125, -2.5518798828125, -2.4462890625, -2.3406982421875, -2.235107421875, -2.1295166015625, -2.02392578125, -1.9183349609375, -1.812744140625, -1.7071533203125, -1.6015625, -1.4959716796875, -1.390380859375, -1.2847900390625, -1.17919921875, -1.0736083984375, -0.968017578125, -0.8624267578125, -0.7568359375, -0.6512451171875, -0.545654296875, -0.4400634765625, -0.33447265625, -0.2288818359375, -0.123291015625, -0.0177001953125, 0.087890625, 0.1934814453125, 0.299072265625, 0.4046630859375, 0.51025390625, 0.6158447265625, 0.721435546875, 0.8270263671875, 0.9326171875, 1.0382080078125, 1.143798828125, 1.2493896484375, 1.35498046875, 1.4605712890625, 1.566162109375, 1.6717529296875, 1.77734375, 1.8829345703125, 1.988525390625, 2.0941162109375, 2.19970703125, 2.3052978515625, 2.410888671875, 2.5164794921875, 2.6220703125, 2.7276611328125, 2.833251953125, 2.9388427734375, 3.04443359375, 3.1500244140625, 3.255615234375, 3.3612060546875, 3.466796875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 5.0, 6.0, 4.0, 6.0, 9.0, 8.0, 6.0, 9.0, 17.0, 18.0, 20.0, 22.0, 37.0, 31.0, 39.0, 51.0, 59.0, 76.0, 98.0, 166.0, 1372.0, 329.0, 157.0, 73.0, 74.0, 65.0, 45.0, 27.0, 37.0, 34.0, 37.0, 25.0, 13.0, 13.0, 11.0, 11.0, 9.0, 7.0, 8.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.1171875, -10.745849609375, -10.37451171875, -10.003173828125, -9.6318359375, -9.260498046875, -8.88916015625, -8.517822265625, -8.146484375, -7.775146484375, -7.40380859375, -7.032470703125, -6.6611328125, -6.289794921875, -5.91845703125, -5.547119140625, -5.17578125, -4.804443359375, -4.43310546875, -4.061767578125, -3.6904296875, -3.319091796875, -2.94775390625, -2.576416015625, -2.205078125, -1.833740234375, -1.46240234375, -1.091064453125, -0.7197265625, -0.348388671875, 0.02294921875, 0.394287109375, 0.765625, 1.136962890625, 1.50830078125, 1.879638671875, 2.2509765625, 2.622314453125, 2.99365234375, 3.364990234375, 3.736328125, 4.107666015625, 4.47900390625, 4.850341796875, 5.2216796875, 5.593017578125, 5.96435546875, 6.335693359375, 6.70703125, 7.078369140625, 7.44970703125, 7.821044921875, 8.1923828125, 8.563720703125, 8.93505859375, 9.306396484375, 9.677734375, 10.049072265625, 10.42041015625, 10.791748046875, 11.1630859375, 11.534423828125, 11.90576171875, 12.277099609375, 12.6484375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 7.0, 7.0, 15.0, 19.0, 37.0, 34.0, 62.0, 111.0, 156.0, 317.0, 836.0, 7056.0, 3028174.0, 106306.0, 1499.0, 479.0, 226.0, 127.0, 79.0, 51.0, 29.0, 19.0, 18.0, 10.0, 5.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-55.65625, -54.322998046875, -52.98974609375, -51.656494140625, -50.3232421875, -48.989990234375, -47.65673828125, -46.323486328125, -44.990234375, -43.656982421875, -42.32373046875, -40.990478515625, -39.6572265625, -38.323974609375, -36.99072265625, -35.657470703125, -34.32421875, -32.990966796875, -31.65771484375, -30.324462890625, -28.9912109375, -27.657958984375, -26.32470703125, -24.991455078125, -23.658203125, -22.324951171875, -20.99169921875, -19.658447265625, -18.3251953125, -16.991943359375, -15.65869140625, -14.325439453125, -12.9921875, -11.658935546875, -10.32568359375, -8.992431640625, -7.6591796875, -6.325927734375, -4.99267578125, -3.659423828125, -2.326171875, -0.992919921875, 0.34033203125, 1.673583984375, 3.0068359375, 4.340087890625, 5.67333984375, 7.006591796875, 8.33984375, 9.673095703125, 11.00634765625, 12.339599609375, 13.6728515625, 15.006103515625, 16.33935546875, 17.672607421875, 19.005859375, 20.339111328125, 21.67236328125, 23.005615234375, 24.3388671875, 25.672119140625, 27.00537109375, 28.338623046875, 29.671875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [967.0, 49.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.791018486022949, 3.4811325073242188, 14.753283500671387, 26.025432586669922, 37.297584533691406, 48.56973648071289, 59.84188461303711, 71.11404418945312, 82.38619232177734, 93.65834045410156, 104.93049621582031, 116.20264434814453, 127.47479248046875, 138.7469482421875, 150.01910400390625, 161.291259765625, 172.5634002685547, 183.83555603027344, 195.10769653320312, 206.37985229492188, 217.65200805664062, 228.92416381835938, 240.19630432128906, 251.4684600830078, 262.7406005859375, 274.01275634765625, 285.284912109375, 296.55706787109375, 307.8291931152344, 319.1013488769531, 330.3735046386719, 341.6456604003906, 352.9178161621094, 364.1899719238281, 375.4621276855469, 386.7342529296875, 398.00640869140625, 409.278564453125, 420.55072021484375, 431.8228759765625, 443.09503173828125, 454.3671875, 465.63934326171875, 476.9114990234375, 488.1836242675781, 499.4557800292969, 510.7279357910156, 522.0001220703125, 533.272216796875, 544.5443725585938, 555.8165283203125, 567.0886840820312, 578.36083984375, 589.6329956054688, 600.9051513671875, 612.17724609375, 623.449462890625, 634.7216186523438, 645.9937744140625, 657.2659301757812, 668.5380859375, 679.8102416992188, 691.0823974609375, 702.3544921875, 713.6266479492188]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 8.0, 9.0, 15.0, 12.0, 16.0, 17.0, 20.0, 25.0, 18.0, 24.0, 22.0, 34.0, 33.0, 40.0, 32.0, 36.0, 39.0, 50.0, 48.0, 49.0, 38.0, 30.0, 38.0, 34.0, 33.0, 40.0, 28.0, 17.0, 29.0, 30.0, 19.0, 16.0, 20.0, 12.0, 7.0, 10.0, 11.0, 9.0, 7.0, 6.0, 8.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.962600708007812, -27.07193374633789, -26.18126678466797, -25.290599822998047, -24.399932861328125, -23.509265899658203, -22.61859703063965, -21.727930068969727, -20.837263107299805, -19.946596145629883, -19.05592918395996, -18.16526222229004, -17.274593353271484, -16.383926391601562, -15.49325942993164, -14.602592468261719, -13.711925506591797, -12.821258544921875, -11.930591583251953, -11.039923667907715, -10.149256706237793, -9.258589744567871, -8.367921829223633, -7.477254867553711, -6.586587905883789, -5.695920944213867, -4.805253505706787, -3.914586305618286, -3.023919105529785, -2.1332521438598633, -1.2425847053527832, -0.3519172668457031, 0.5387516021728516, 1.4294188022613525, 2.3200860023498535, 3.2107532024383545, 4.1014204025268555, 4.992087364196777, 5.882754802703857, 6.7734222412109375, 7.664089202880859, 8.554756164550781, 9.445423126220703, 10.336091041564941, 11.226758003234863, 12.117424964904785, 13.008092880249023, 13.898759841918945, 14.789426803588867, 15.680093765258789, 16.57076072692871, 17.461427688598633, 18.352096557617188, 19.24276351928711, 20.13343048095703, 21.024097442626953, 21.914764404296875, 22.805431365966797, 23.69609832763672, 24.58676528930664, 25.477432250976562, 26.368099212646484, 27.25876808166504, 28.14943504333496, 29.040102005004883]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 10.0, 11.0, 7.0, 11.0, 17.0, 21.0, 16.0, 20.0, 27.0, 19.0, 25.0, 34.0, 33.0, 41.0, 29.0, 32.0, 44.0, 46.0, 43.0, 38.0, 37.0, 38.0, 42.0, 45.0, 41.0, 32.0, 29.0, 23.0, 31.0, 22.0, 16.0, 15.0, 16.0, 8.0, 20.0, 16.0, 4.0, 3.0, 11.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.1875, -3.0914306640625, -2.995361328125, -2.8992919921875, -2.80322265625, -2.7071533203125, -2.611083984375, -2.5150146484375, -2.4189453125, -2.3228759765625, -2.226806640625, -2.1307373046875, -2.03466796875, -1.9385986328125, -1.842529296875, -1.7464599609375, -1.650390625, -1.5543212890625, -1.458251953125, -1.3621826171875, -1.26611328125, -1.1700439453125, -1.073974609375, -0.9779052734375, -0.8818359375, -0.7857666015625, -0.689697265625, -0.5936279296875, -0.49755859375, -0.4014892578125, -0.305419921875, -0.2093505859375, -0.11328125, -0.0172119140625, 0.078857421875, 0.1749267578125, 0.27099609375, 0.3670654296875, 0.463134765625, 0.5592041015625, 0.6552734375, 0.7513427734375, 0.847412109375, 0.9434814453125, 1.03955078125, 1.1356201171875, 1.231689453125, 1.3277587890625, 1.423828125, 1.5198974609375, 1.615966796875, 1.7120361328125, 1.80810546875, 1.9041748046875, 2.000244140625, 2.0963134765625, 2.1923828125, 2.2884521484375, 2.384521484375, 2.4805908203125, 2.57666015625, 2.6727294921875, 2.768798828125, 2.8648681640625, 2.9609375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 9.0, 11.0, 19.0, 11.0, 18.0, 21.0, 38.0, 30.0, 43.0, 46.0, 55.0, 61.0, 80.0, 105.0, 164.0, 451.0, 1588.0, 9920.0, 122013.0, 1906478.0, 2007818.0, 131806.0, 10558.0, 1664.0, 494.0, 216.0, 98.0, 76.0, 67.0, 52.0, 30.0, 35.0, 41.0, 23.0, 25.0, 24.0, 14.0, 17.0, 5.0, 10.0, 8.0, 10.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.1953125, -10.856201171875, -10.51708984375, -10.177978515625, -9.8388671875, -9.499755859375, -9.16064453125, -8.821533203125, -8.482421875, -8.143310546875, -7.80419921875, -7.465087890625, -7.1259765625, -6.786865234375, -6.44775390625, -6.108642578125, -5.76953125, -5.430419921875, -5.09130859375, -4.752197265625, -4.4130859375, -4.073974609375, -3.73486328125, -3.395751953125, -3.056640625, -2.717529296875, -2.37841796875, -2.039306640625, -1.7001953125, -1.361083984375, -1.02197265625, -0.682861328125, -0.34375, -0.004638671875, 0.33447265625, 0.673583984375, 1.0126953125, 1.351806640625, 1.69091796875, 2.030029296875, 2.369140625, 2.708251953125, 3.04736328125, 3.386474609375, 3.7255859375, 4.064697265625, 4.40380859375, 4.742919921875, 5.08203125, 5.421142578125, 5.76025390625, 6.099365234375, 6.4384765625, 6.777587890625, 7.11669921875, 7.455810546875, 7.794921875, 8.134033203125, 8.47314453125, 8.812255859375, 9.1513671875, 9.490478515625, 9.82958984375, 10.168701171875, 10.5078125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 17.0, 19.0, 30.0, 64.0, 86.0, 127.0, 218.0, 356.0, 474.0, 630.0, 633.0, 508.0, 342.0, 206.0, 133.0, 96.0, 51.0, 37.0, 19.0, 11.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5390625, -11.1658935546875, -10.792724609375, -10.4195556640625, -10.04638671875, -9.6732177734375, -9.300048828125, -8.9268798828125, -8.5537109375, -8.1805419921875, -7.807373046875, -7.4342041015625, -7.06103515625, -6.6878662109375, -6.314697265625, -5.9415283203125, -5.568359375, -5.1951904296875, -4.822021484375, -4.4488525390625, -4.07568359375, -3.7025146484375, -3.329345703125, -2.9561767578125, -2.5830078125, -2.2098388671875, -1.836669921875, -1.4635009765625, -1.09033203125, -0.7171630859375, -0.343994140625, 0.0291748046875, 0.40234375, 0.7755126953125, 1.148681640625, 1.5218505859375, 1.89501953125, 2.2681884765625, 2.641357421875, 3.0145263671875, 3.3876953125, 3.7608642578125, 4.134033203125, 4.5072021484375, 4.88037109375, 5.2535400390625, 5.626708984375, 5.9998779296875, 6.373046875, 6.7462158203125, 7.119384765625, 7.4925537109375, 7.86572265625, 8.2388916015625, 8.612060546875, 8.9852294921875, 9.3583984375, 9.7315673828125, 10.104736328125, 10.4779052734375, 10.85107421875, 11.2242431640625, 11.597412109375, 11.9705810546875, 12.34375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 10.0, 17.0, 34.0, 44.0, 83.0, 133.0, 231.0, 555.0, 2354.0, 107401.0, 3842528.0, 236330.0, 3361.0, 622.0, 252.0, 114.0, 85.0, 55.0, 31.0, 18.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.5, -31.531982421875, -30.56396484375, -29.595947265625, -28.6279296875, -27.659912109375, -26.69189453125, -25.723876953125, -24.755859375, -23.787841796875, -22.81982421875, -21.851806640625, -20.8837890625, -19.915771484375, -18.94775390625, -17.979736328125, -17.01171875, -16.043701171875, -15.07568359375, -14.107666015625, -13.1396484375, -12.171630859375, -11.20361328125, -10.235595703125, -9.267578125, -8.299560546875, -7.33154296875, -6.363525390625, -5.3955078125, -4.427490234375, -3.45947265625, -2.491455078125, -1.5234375, -0.555419921875, 0.41259765625, 1.380615234375, 2.3486328125, 3.316650390625, 4.28466796875, 5.252685546875, 6.220703125, 7.188720703125, 8.15673828125, 9.124755859375, 10.0927734375, 11.060791015625, 12.02880859375, 12.996826171875, 13.96484375, 14.932861328125, 15.90087890625, 16.868896484375, 17.8369140625, 18.804931640625, 19.77294921875, 20.740966796875, 21.708984375, 22.677001953125, 23.64501953125, 24.613037109375, 25.5810546875, 26.549072265625, 27.51708984375, 28.485107421875, 29.453125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 55.0, 397.0, 493.0, 69.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-305.763671875, -298.3138122558594, -290.86395263671875, -283.4140930175781, -275.9642333984375, -268.5143737792969, -261.06451416015625, -253.61463928222656, -246.16477966308594, -238.7149200439453, -231.2650604248047, -223.81520080566406, -216.36532592773438, -208.91546630859375, -201.46560668945312, -194.0157470703125, -186.56588745117188, -179.11602783203125, -171.66616821289062, -164.21630859375, -156.76644897460938, -149.31658935546875, -141.86671447753906, -134.41685485839844, -126.96699523925781, -119.51713562011719, -112.06727600097656, -104.6174087524414, -97.16754913330078, -89.71768951416016, -82.267822265625, -74.81796264648438, -67.36810302734375, -59.918243408203125, -52.468379974365234, -45.018516540527344, -37.56865692138672, -30.118797302246094, -22.668933868408203, -15.219070434570312, -7.7692108154296875, -0.3193492889404297, 7.130512237548828, 14.580373764038086, 22.030235290527344, 29.48009490966797, 36.92995834350586, 44.37982177734375, 51.829681396484375, 59.279541015625, 66.72940063476562, 74.17926788330078, 81.6291275024414, 89.07898712158203, 96.52885437011719, 103.97871398925781, 111.42857360839844, 118.87843322753906, 126.32829284667969, 133.7781524658203, 141.22802734375, 148.67788696289062, 156.12774658203125, 163.57760620117188, 171.0274658203125]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 12.0, 16.0, 13.0, 25.0, 20.0, 22.0, 25.0, 31.0, 34.0, 33.0, 32.0, 47.0, 42.0, 50.0, 45.0, 58.0, 43.0, 35.0, 53.0, 43.0, 41.0, 36.0, 36.0, 37.0, 27.0, 24.0, 24.0, 17.0, 17.0, 9.0, 16.0, 7.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.787200927734375, -25.8486328125, -24.910062789916992, -23.971494674682617, -23.03292465209961, -22.094356536865234, -21.15578842163086, -20.21721839904785, -19.278648376464844, -18.34008026123047, -17.40151023864746, -16.462942123413086, -15.524372100830078, -14.585803985595703, -13.647234916687012, -12.70866584777832, -11.770097732543945, -10.831528663635254, -9.892959594726562, -8.954391479492188, -8.01582145690918, -7.0772528648376465, -6.138684272766113, -5.200115203857422, -4.2615461349487305, -3.322977066040039, -2.3844082355499268, -1.4458394050598145, -0.507270336151123, 0.43129873275756836, 1.3698673248291016, 2.308436393737793, 3.2470054626464844, 4.185574531555176, 5.124143600463867, 6.0627121925354, 7.001281261444092, 7.939850330352783, 8.878418922424316, 9.816987991333008, 10.7555570602417, 11.69412612915039, 12.632695198059082, 13.571264266967773, 14.509832382202148, 15.448402404785156, 16.38697052001953, 17.325538635253906, 18.264108657836914, 19.20267677307129, 20.141246795654297, 21.079814910888672, 22.01838493347168, 22.956953048706055, 23.895523071289062, 24.834091186523438, 25.772659301757812, 26.711227416992188, 27.649797439575195, 28.58836555480957, 29.526935577392578, 30.465503692626953, 31.404071807861328, 32.34264373779297, 33.281211853027344]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 9.0, 9.0, 13.0, 15.0, 8.0, 11.0, 21.0, 10.0, 25.0, 14.0, 21.0, 36.0, 34.0, 27.0, 27.0, 36.0, 43.0, 39.0, 35.0, 36.0, 57.0, 43.0, 37.0, 46.0, 36.0, 32.0, 32.0, 34.0, 24.0, 27.0, 16.0, 27.0, 20.0, 21.0, 8.0, 14.0, 4.0, 7.0, 8.0, 5.0, 10.0, 6.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.744140625, -2.650238037109375, -2.55633544921875, -2.462432861328125, -2.3685302734375, -2.274627685546875, -2.18072509765625, -2.086822509765625, -1.992919921875, -1.899017333984375, -1.80511474609375, -1.711212158203125, -1.6173095703125, -1.523406982421875, -1.42950439453125, -1.335601806640625, -1.24169921875, -1.147796630859375, -1.05389404296875, -0.959991455078125, -0.8660888671875, -0.772186279296875, -0.67828369140625, -0.584381103515625, -0.490478515625, -0.396575927734375, -0.30267333984375, -0.208770751953125, -0.1148681640625, -0.020965576171875, 0.07293701171875, 0.166839599609375, 0.2607421875, 0.354644775390625, 0.44854736328125, 0.542449951171875, 0.6363525390625, 0.730255126953125, 0.82415771484375, 0.918060302734375, 1.011962890625, 1.105865478515625, 1.19976806640625, 1.293670654296875, 1.3875732421875, 1.481475830078125, 1.57537841796875, 1.669281005859375, 1.76318359375, 1.857086181640625, 1.95098876953125, 2.044891357421875, 2.1387939453125, 2.232696533203125, 2.32659912109375, 2.420501708984375, 2.514404296875, 2.608306884765625, 2.70220947265625, 2.796112060546875, 2.8900146484375, 2.983917236328125, 3.07781982421875, 3.171722412109375, 3.265625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 7.0, 8.0, 19.0, 17.0, 25.0, 53.0, 61.0, 89.0, 141.0, 200.0, 269.0, 401.0, 557.0, 854.0, 1230.0, 1799.0, 2672.0, 3996.0, 5767.0, 8602.0, 12779.0, 18826.0, 28506.0, 41834.0, 62466.0, 90332.0, 122976.0, 149078.0, 141687.0, 110418.0, 79138.0, 53766.0, 35862.0, 24284.0, 16209.0, 10857.0, 7182.0, 4901.0, 3378.0, 2279.0, 1585.0, 1093.0, 757.0, 504.0, 340.0, 223.0, 163.0, 107.0, 96.0, 62.0, 39.0, 28.0, 21.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.2344970703125, -0.2268848419189453, -0.21927261352539062, -0.21166038513183594, -0.20404815673828125, -0.19643592834472656, -0.18882369995117188, -0.1812114715576172, -0.1735992431640625, -0.1659870147705078, -0.15837478637695312, -0.15076255798339844, -0.14315032958984375, -0.13553810119628906, -0.12792587280273438, -0.12031364440917969, -0.112701416015625, -0.10508918762207031, -0.09747695922851562, -0.08986473083496094, -0.08225250244140625, -0.07464027404785156, -0.06702804565429688, -0.05941581726074219, -0.0518035888671875, -0.04419136047363281, -0.036579132080078125, -0.028966903686523438, -0.02135467529296875, -0.013742446899414062, -0.006130218505859375, 0.0014820098876953125, 0.00909423828125, 0.016706466674804688, 0.024318695068359375, 0.03193092346191406, 0.03954315185546875, 0.04715538024902344, 0.054767608642578125, 0.06237983703613281, 0.0699920654296875, 0.07760429382324219, 0.08521652221679688, 0.09282875061035156, 0.10044097900390625, 0.10805320739746094, 0.11566543579101562, 0.12327766418457031, 0.130889892578125, 0.1385021209716797, 0.14611434936523438, 0.15372657775878906, 0.16133880615234375, 0.16895103454589844, 0.17656326293945312, 0.1841754913330078, 0.1917877197265625, 0.1993999481201172, 0.20701217651367188, 0.21462440490722656, 0.22223663330078125, 0.22984886169433594, 0.23746109008789062, 0.2450733184814453, 0.252685546875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 1.0, 9.0, 6.0, 6.0, 12.0, 13.0, 14.0, 16.0, 16.0, 15.0, 22.0, 27.0, 23.0, 26.0, 30.0, 37.0, 46.0, 42.0, 40.0, 39.0, 35.0, 41.0, 1060.0, 40.0, 40.0, 35.0, 33.0, 35.0, 31.0, 34.0, 30.0, 18.0, 26.0, 24.0, 17.0, 12.0, 20.0, 11.0, 9.0, 9.0, 7.0, 8.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.142578125, -2.079803466796875, -2.01702880859375, -1.954254150390625, -1.8914794921875, -1.828704833984375, -1.76593017578125, -1.703155517578125, -1.640380859375, -1.577606201171875, -1.51483154296875, -1.452056884765625, -1.3892822265625, -1.326507568359375, -1.26373291015625, -1.200958251953125, -1.13818359375, -1.075408935546875, -1.01263427734375, -0.949859619140625, -0.8870849609375, -0.824310302734375, -0.76153564453125, -0.698760986328125, -0.635986328125, -0.573211669921875, -0.51043701171875, -0.447662353515625, -0.3848876953125, -0.322113037109375, -0.25933837890625, -0.196563720703125, -0.1337890625, -0.071014404296875, -0.00823974609375, 0.054534912109375, 0.1173095703125, 0.180084228515625, 0.24285888671875, 0.305633544921875, 0.368408203125, 0.431182861328125, 0.49395751953125, 0.556732177734375, 0.6195068359375, 0.682281494140625, 0.74505615234375, 0.807830810546875, 0.87060546875, 0.933380126953125, 0.99615478515625, 1.058929443359375, 1.1217041015625, 1.184478759765625, 1.24725341796875, 1.310028076171875, 1.372802734375, 1.435577392578125, 1.49835205078125, 1.561126708984375, 1.6239013671875, 1.686676025390625, 1.74945068359375, 1.812225341796875, 1.875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 11.0, 12.0, 19.0, 29.0, 35.0, 63.0, 82.0, 137.0, 217.0, 316.0, 511.0, 740.0, 1220.0, 1866.0, 3008.0, 4823.0, 7652.0, 12497.0, 20283.0, 31912.0, 50730.0, 77055.0, 111848.0, 167424.0, 1181083.0, 138485.0, 100136.0, 67785.0, 43622.0, 27685.0, 17437.0, 10592.0, 6673.0, 4196.0, 2502.0, 1570.0, 1007.0, 663.0, 404.0, 294.0, 173.0, 118.0, 75.0, 52.0, 37.0, 21.0, 12.0, 13.0, 7.0, 3.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.1842041015625, -0.17883872985839844, -0.17347335815429688, -0.1681079864501953, -0.16274261474609375, -0.1573772430419922, -0.15201187133789062, -0.14664649963378906, -0.1412811279296875, -0.13591575622558594, -0.13055038452148438, -0.1251850128173828, -0.11981964111328125, -0.11445426940917969, -0.10908889770507812, -0.10372352600097656, -0.098358154296875, -0.09299278259277344, -0.08762741088867188, -0.08226203918457031, -0.07689666748046875, -0.07153129577636719, -0.06616592407226562, -0.06080055236816406, -0.0554351806640625, -0.05006980895996094, -0.044704437255859375, -0.03933906555175781, -0.03397369384765625, -0.028608322143554688, -0.023242950439453125, -0.017877578735351562, -0.01251220703125, -0.0071468353271484375, -0.001781463623046875, 0.0035839080810546875, 0.00894927978515625, 0.014314651489257812, 0.019680023193359375, 0.025045394897460938, 0.0304107666015625, 0.03577613830566406, 0.041141510009765625, 0.04650688171386719, 0.05187225341796875, 0.05723762512207031, 0.06260299682617188, 0.06796836853027344, 0.073333740234375, 0.07869911193847656, 0.08406448364257812, 0.08942985534667969, 0.09479522705078125, 0.10016059875488281, 0.10552597045898438, 0.11089134216308594, 0.1162567138671875, 0.12162208557128906, 0.12698745727539062, 0.1323528289794922, 0.13771820068359375, 0.1430835723876953, 0.14844894409179688, 0.15381431579589844, 0.1591796875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 8.0, 11.0, 9.0, 9.0, 20.0, 19.0, 31.0, 43.0, 46.0, 45.0, 56.0, 54.0, 61.0, 85.0, 70.0, 61.0, 54.0, 67.0, 43.0, 51.0, 30.0, 32.0, 24.0, 18.0, 13.0, 9.0, 8.0, 7.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0127105712890625, -0.01234745979309082, -0.01198434829711914, -0.011621236801147461, -0.011258125305175781, -0.010895013809204102, -0.010531902313232422, -0.010168790817260742, -0.009805679321289062, -0.009442567825317383, -0.009079456329345703, -0.008716344833374023, -0.008353233337402344, -0.007990121841430664, -0.007627010345458984, -0.007263898849487305, -0.006900787353515625, -0.006537675857543945, -0.006174564361572266, -0.005811452865600586, -0.005448341369628906, -0.0050852298736572266, -0.004722118377685547, -0.004359006881713867, -0.0039958953857421875, -0.003632783889770508, -0.003269672393798828, -0.0029065608978271484, -0.0025434494018554688, -0.002180337905883789, -0.0018172264099121094, -0.0014541149139404297, -0.00109100341796875, -0.0007278919219970703, -0.0003647804260253906, -1.6689300537109375e-06, 0.00036144256591796875, 0.0007245540618896484, 0.0010876655578613281, 0.0014507770538330078, 0.0018138885498046875, 0.002177000045776367, 0.002540111541748047, 0.0029032230377197266, 0.0032663345336914062, 0.003629446029663086, 0.003992557525634766, 0.004355669021606445, 0.004718780517578125, 0.005081892013549805, 0.005445003509521484, 0.005808115005493164, 0.006171226501464844, 0.0065343379974365234, 0.006897449493408203, 0.007260560989379883, 0.0076236724853515625, 0.007986783981323242, 0.008349895477294922, 0.008713006973266602, 0.009076118469238281, 0.009439229965209961, 0.00980234146118164, 0.01016545295715332, 0.010528564453125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 19.0, 15.0, 24.0, 32.0, 40.0, 52.0, 58.0, 84.0, 140.0, 382.0, 2731.0, 851488.0, 191134.0, 1597.0, 278.0, 128.0, 79.0, 58.0, 60.0, 31.0, 22.0, 26.0, 12.0, 12.0, 13.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.232177734375, -0.22414398193359375, -0.2161102294921875, -0.20807647705078125, -0.200042724609375, -0.19200897216796875, -0.1839752197265625, -0.17594146728515625, -0.16790771484375, -0.15987396240234375, -0.1518402099609375, -0.14380645751953125, -0.135772705078125, -0.12773895263671875, -0.1197052001953125, -0.11167144775390625, -0.1036376953125, -0.09560394287109375, -0.0875701904296875, -0.07953643798828125, -0.071502685546875, -0.06346893310546875, -0.0554351806640625, -0.04740142822265625, -0.03936767578125, -0.03133392333984375, -0.0233001708984375, -0.01526641845703125, -0.007232666015625, 0.00080108642578125, 0.0088348388671875, 0.01686859130859375, 0.02490234375, 0.03293609619140625, 0.0409698486328125, 0.04900360107421875, 0.057037353515625, 0.06507110595703125, 0.0731048583984375, 0.08113861083984375, 0.08917236328125, 0.09720611572265625, 0.1052398681640625, 0.11327362060546875, 0.121307373046875, 0.12934112548828125, 0.1373748779296875, 0.14540863037109375, 0.1534423828125, 0.16147613525390625, 0.1695098876953125, 0.17754364013671875, 0.185577392578125, 0.19361114501953125, 0.2016448974609375, 0.20967864990234375, 0.21771240234375, 0.22574615478515625, 0.2337799072265625, 0.24181365966796875, 0.249847412109375, 0.25788116455078125, 0.2659149169921875, 0.27394866943359375, 0.281982421875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 22.0, 98.0, 463.0, 300.0, 76.0, 26.0, 14.0, 11.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02557823807001114, -0.023577380925416946, -0.021576521918177605, -0.019575662910938263, -0.01757480576634407, -0.015573947690427303, -0.013573089614510536, -0.011572231538593769, -0.009571373462677002, -0.007570515386760235, -0.005569657310843468, -0.0035687992349267006, -0.0015679411590099335, 0.00043291691690683365, 0.0024337749928236008, 0.004434633068740368, 0.006435491144657135, 0.008436349220573902, 0.01043720729649067, 0.012438065372407436, 0.014438923448324203, 0.016439780592918396, 0.018440639600157738, 0.02044149860739708, 0.022442355751991272, 0.024443212896585464, 0.026444071903824806, 0.028444930911064148, 0.03044578805565834, 0.03244664520025253, 0.034447506070137024, 0.036448363214731216, 0.038449227809906006, 0.0404500849545002, 0.04245094209909439, 0.04445180296897888, 0.046452660113573074, 0.04845351725816727, 0.05045437812805176, 0.05245523527264595, 0.05445609241724014, 0.056456949561834335, 0.05845780670642853, 0.06045866757631302, 0.06245952472090721, 0.0644603818655014, 0.0664612427353859, 0.06846209615468979, 0.07046295702457428, 0.07246381789445877, 0.07446467131376266, 0.07646553218364716, 0.07846638560295105, 0.08046724647283554, 0.08246810734272003, 0.08446896076202393, 0.08646982163190842, 0.08847068250179291, 0.0904715359210968, 0.09247239679098129, 0.09447325766086578, 0.09647411108016968, 0.09847497195005417, 0.10047582536935806, 0.10247668623924255]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 9.0, 7.0, 6.0, 7.0, 16.0, 11.0, 17.0, 30.0, 35.0, 40.0, 29.0, 22.0, 27.0, 34.0, 47.0, 35.0, 61.0, 48.0, 45.0, 57.0, 47.0, 45.0, 41.0, 36.0, 26.0, 36.0, 28.0, 24.0, 22.0, 21.0, 23.0, 13.0, 17.0, 10.0, 12.0, 4.0, 7.0, 3.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01805245876312256, -0.017528370022773743, -0.017004279419779778, -0.016480188816785812, -0.015956100076436996, -0.015432010404765606, -0.014907920733094215, -0.014383831061422825, -0.013859741389751434, -0.013335651718080044, -0.012811562046408653, -0.012287472374737263, -0.011763382703065872, -0.011239293031394482, -0.010715203359723091, -0.0101911136880517, -0.00966702401638031, -0.00914293434470892, -0.008618844673037529, -0.008094755001366138, -0.007570665329694748, -0.007046575658023357, -0.006522485986351967, -0.005998396314680576, -0.005474306643009186, -0.004950216971337795, -0.004426127299666405, -0.003902037627995014, -0.0033779479563236237, -0.002853858284652233, -0.0023297686129808426, -0.001805678941309452, -0.0012815892696380615, -0.000757499597966671, -0.00023340992629528046, 0.0002906797453761101, 0.0008147694170475006, 0.0013388590887188911, 0.0018629487603902817, 0.002387038432061672, 0.0029111281037330627, 0.0034352177754044533, 0.003959307447075844, 0.004483397118747234, 0.005007486790418625, 0.005531576462090015, 0.006055666133761406, 0.0065797558054327965, 0.007103845477104187, 0.0076279351487755775, 0.008152024820446968, 0.008676114492118359, 0.00920020416378975, 0.00972429383546114, 0.01024838350713253, 0.01077247317880392, 0.011296562850475311, 0.011820652522146702, 0.012344742193818092, 0.012868831865489483, 0.013392921537160873, 0.013917011208832264, 0.014441100880503654, 0.014965190552175045, 0.015489280223846436]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 9.0, 9.0, 13.0, 16.0, 7.0, 11.0, 21.0, 10.0, 25.0, 14.0, 21.0, 36.0, 34.0, 27.0, 27.0, 35.0, 43.0, 40.0, 35.0, 36.0, 57.0, 43.0, 36.0, 47.0, 36.0, 32.0, 32.0, 34.0, 24.0, 27.0, 16.0, 27.0, 22.0, 19.0, 8.0, 14.0, 4.0, 7.0, 8.0, 5.0, 10.0, 6.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.744140625, -2.650238037109375, -2.55633544921875, -2.462432861328125, -2.3685302734375, -2.274627685546875, -2.18072509765625, -2.086822509765625, -1.992919921875, -1.899017333984375, -1.80511474609375, -1.711212158203125, -1.6173095703125, -1.523406982421875, -1.42950439453125, -1.335601806640625, -1.24169921875, -1.147796630859375, -1.05389404296875, -0.959991455078125, -0.8660888671875, -0.772186279296875, -0.67828369140625, -0.584381103515625, -0.490478515625, -0.396575927734375, -0.30267333984375, -0.208770751953125, -0.1148681640625, -0.020965576171875, 0.07293701171875, 0.166839599609375, 0.2607421875, 0.354644775390625, 0.44854736328125, 0.542449951171875, 0.6363525390625, 0.730255126953125, 0.82415771484375, 0.918060302734375, 1.011962890625, 1.105865478515625, 1.19976806640625, 1.293670654296875, 1.3875732421875, 1.481475830078125, 1.57537841796875, 1.669281005859375, 1.76318359375, 1.857086181640625, 1.95098876953125, 2.044891357421875, 2.1387939453125, 2.232696533203125, 2.32659912109375, 2.420501708984375, 2.514404296875, 2.608306884765625, 2.70220947265625, 2.796112060546875, 2.8900146484375, 2.983917236328125, 3.07781982421875, 3.171722412109375, 3.265625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 15.0, 18.0, 33.0, 53.0, 81.0, 140.0, 291.0, 545.0, 1094.0, 2312.0, 4734.0, 9793.0, 19101.0, 36927.0, 78115.0, 218287.0, 369967.0, 175555.0, 65885.0, 32360.0, 16681.0, 8465.0, 4207.0, 1980.0, 878.0, 478.0, 204.0, 124.0, 80.0, 44.0, 29.0, 20.0, 22.0, 13.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.494140625, -3.38629150390625, -3.2784423828125, -3.17059326171875, -3.062744140625, -2.95489501953125, -2.8470458984375, -2.73919677734375, -2.63134765625, -2.52349853515625, -2.4156494140625, -2.30780029296875, -2.199951171875, -2.09210205078125, -1.9842529296875, -1.87640380859375, -1.7685546875, -1.66070556640625, -1.5528564453125, -1.44500732421875, -1.337158203125, -1.22930908203125, -1.1214599609375, -1.01361083984375, -0.90576171875, -0.79791259765625, -0.6900634765625, -0.58221435546875, -0.474365234375, -0.36651611328125, -0.2586669921875, -0.15081787109375, -0.04296875, 0.06488037109375, 0.1727294921875, 0.28057861328125, 0.388427734375, 0.49627685546875, 0.6041259765625, 0.71197509765625, 0.81982421875, 0.92767333984375, 1.0355224609375, 1.14337158203125, 1.251220703125, 1.35906982421875, 1.4669189453125, 1.57476806640625, 1.6826171875, 1.79046630859375, 1.8983154296875, 2.00616455078125, 2.114013671875, 2.22186279296875, 2.3297119140625, 2.43756103515625, 2.54541015625, 2.65325927734375, 2.7611083984375, 2.86895751953125, 2.976806640625, 3.08465576171875, 3.1925048828125, 3.30035400390625, 3.408203125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 4.0, 8.0, 6.0, 9.0, 14.0, 11.0, 16.0, 20.0, 27.0, 31.0, 33.0, 35.0, 35.0, 36.0, 40.0, 57.0, 68.0, 92.0, 159.0, 1387.0, 299.0, 140.0, 90.0, 62.0, 47.0, 37.0, 28.0, 42.0, 27.0, 25.0, 28.0, 18.0, 13.0, 11.0, 9.0, 12.0, 11.0, 11.0, 5.0, 8.0, 4.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.5546875, -11.2022705078125, -10.849853515625, -10.4974365234375, -10.14501953125, -9.7926025390625, -9.440185546875, -9.0877685546875, -8.7353515625, -8.3829345703125, -8.030517578125, -7.6781005859375, -7.32568359375, -6.9732666015625, -6.620849609375, -6.2684326171875, -5.916015625, -5.5635986328125, -5.211181640625, -4.8587646484375, -4.50634765625, -4.1539306640625, -3.801513671875, -3.4490966796875, -3.0966796875, -2.7442626953125, -2.391845703125, -2.0394287109375, -1.68701171875, -1.3345947265625, -0.982177734375, -0.6297607421875, -0.27734375, 0.0750732421875, 0.427490234375, 0.7799072265625, 1.13232421875, 1.4847412109375, 1.837158203125, 2.1895751953125, 2.5419921875, 2.8944091796875, 3.246826171875, 3.5992431640625, 3.95166015625, 4.3040771484375, 4.656494140625, 5.0089111328125, 5.361328125, 5.7137451171875, 6.066162109375, 6.4185791015625, 6.77099609375, 7.1234130859375, 7.475830078125, 7.8282470703125, 8.1806640625, 8.5330810546875, 8.885498046875, 9.2379150390625, 9.59033203125, 9.9427490234375, 10.295166015625, 10.6475830078125, 11.0]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 1.0, 4.0, 2.0, 7.0, 13.0, 6.0, 10.0, 19.0, 18.0, 25.0, 35.0, 37.0, 59.0, 76.0, 116.0, 180.0, 316.0, 579.0, 2127.0, 69516.0, 3049432.0, 20369.0, 1415.0, 488.0, 258.0, 172.0, 113.0, 81.0, 51.0, 44.0, 20.0, 26.0, 10.0, 17.0, 10.0, 13.0, 8.0, 7.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.09375, -31.96728515625, -30.8408203125, -29.71435546875, -28.587890625, -27.46142578125, -26.3349609375, -25.20849609375, -24.08203125, -22.95556640625, -21.8291015625, -20.70263671875, -19.576171875, -18.44970703125, -17.3232421875, -16.19677734375, -15.0703125, -13.94384765625, -12.8173828125, -11.69091796875, -10.564453125, -9.43798828125, -8.3115234375, -7.18505859375, -6.05859375, -4.93212890625, -3.8056640625, -2.67919921875, -1.552734375, -0.42626953125, 0.7001953125, 1.82666015625, 2.953125, 4.07958984375, 5.2060546875, 6.33251953125, 7.458984375, 8.58544921875, 9.7119140625, 10.83837890625, 11.96484375, 13.09130859375, 14.2177734375, 15.34423828125, 16.470703125, 17.59716796875, 18.7236328125, 19.85009765625, 20.9765625, 22.10302734375, 23.2294921875, 24.35595703125, 25.482421875, 26.60888671875, 27.7353515625, 28.86181640625, 29.98828125, 31.11474609375, 32.2412109375, 33.36767578125, 34.494140625, 35.62060546875, 36.7470703125, 37.87353515625, 39.0]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 10.0, 273.0, 652.0, 80.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.60725784301758, -38.02503967285156, -33.44282150268555, -28.86060333251953, -24.278385162353516, -19.6961669921875, -15.113948822021484, -10.531730651855469, -5.949512481689453, -1.3672943115234375, 3.214923858642578, 7.797142028808594, 12.37936019897461, 16.961578369140625, 21.54379653930664, 26.126014709472656, 30.708232879638672, 35.29045104980469, 39.8726692199707, 44.45488739013672, 49.037105560302734, 53.61932373046875, 58.201541900634766, 62.78376007080078, 67.36598205566406, 71.94819641113281, 76.5304183959961, 81.11264038085938, 85.69485473632812, 90.27706909179688, 94.85929107666016, 99.44151306152344, 104.02372741699219, 108.60594177246094, 113.18816375732422, 117.7703857421875, 122.35260009765625, 126.934814453125, 131.51702880859375, 136.09925842285156, 140.6814727783203, 145.26368713378906, 149.84591674804688, 154.42813110351562, 159.01034545898438, 163.59255981445312, 168.17477416992188, 172.7570037841797, 177.33921813964844, 181.9214324951172, 186.503662109375, 191.08587646484375, 195.6680908203125, 200.25030517578125, 204.83251953125, 209.4147491455078, 213.99696350097656, 218.5791778564453, 223.16140747070312, 227.74362182617188, 232.32583618164062, 236.90805053710938, 241.49026489257812, 246.07249450683594, 250.6547088623047]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 9.0, 11.0, 13.0, 19.0, 20.0, 21.0, 18.0, 26.0, 31.0, 28.0, 25.0, 23.0, 33.0, 34.0, 30.0, 48.0, 55.0, 34.0, 36.0, 33.0, 43.0, 33.0, 39.0, 34.0, 40.0, 27.0, 32.0, 37.0, 26.0, 26.0, 17.0, 22.0, 13.0, 14.0, 9.0, 8.0, 3.0, 6.0, 7.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.59071350097656, -33.52473831176758, -32.458763122558594, -31.392789840698242, -30.326814651489258, -29.260839462280273, -28.194866180419922, -27.128890991210938, -26.062915802001953, -24.99694061279297, -23.930965423583984, -22.864992141723633, -21.79901695251465, -20.733041763305664, -19.667068481445312, -18.601093292236328, -17.535118103027344, -16.46914291381836, -15.403168678283691, -14.337194442749023, -13.271219253540039, -12.205244064331055, -11.139269828796387, -10.073295593261719, -9.007320404052734, -7.941345691680908, -6.875370979309082, -5.809396266937256, -4.74342155456543, -3.6774468421936035, -2.6114721298217773, -1.5454974174499512, -0.4795188903808594, 0.5864558219909668, 1.652430534362793, 2.718405246734619, 3.7843799591064453, 4.8503546714782715, 5.916329383850098, 6.982304096221924, 8.04827880859375, 9.114253997802734, 10.180228233337402, 11.24620246887207, 12.312177658081055, 13.378152847290039, 14.444127082824707, 15.510101318359375, 16.57607650756836, 17.642051696777344, 18.708026885986328, 19.77400016784668, 20.839975357055664, 21.90595054626465, 22.971923828125, 24.037899017333984, 25.10387420654297, 26.169849395751953, 27.235824584960938, 28.30179786682129, 29.367773056030273, 30.433748245239258, 31.49972152709961, 32.565696716308594, 33.63167190551758]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 7.0, 6.0, 4.0, 8.0, 11.0, 12.0, 19.0, 9.0, 14.0, 15.0, 29.0, 24.0, 28.0, 38.0, 28.0, 45.0, 17.0, 34.0, 37.0, 37.0, 47.0, 39.0, 58.0, 42.0, 46.0, 34.0, 34.0, 28.0, 27.0, 28.0, 23.0, 24.0, 27.0, 22.0, 12.0, 16.0, 10.0, 9.0, 5.0, 7.0, 5.0, 6.0, 9.0, 5.0, 5.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.12109375, -3.0181884765625, -2.915283203125, -2.8123779296875, -2.70947265625, -2.6065673828125, -2.503662109375, -2.4007568359375, -2.2978515625, -2.1949462890625, -2.092041015625, -1.9891357421875, -1.88623046875, -1.7833251953125, -1.680419921875, -1.5775146484375, -1.474609375, -1.3717041015625, -1.268798828125, -1.1658935546875, -1.06298828125, -0.9600830078125, -0.857177734375, -0.7542724609375, -0.6513671875, -0.5484619140625, -0.445556640625, -0.3426513671875, -0.23974609375, -0.1368408203125, -0.033935546875, 0.0689697265625, 0.171875, 0.2747802734375, 0.377685546875, 0.4805908203125, 0.58349609375, 0.6864013671875, 0.789306640625, 0.8922119140625, 0.9951171875, 1.0980224609375, 1.200927734375, 1.3038330078125, 1.40673828125, 1.5096435546875, 1.612548828125, 1.7154541015625, 1.818359375, 1.9212646484375, 2.024169921875, 2.1270751953125, 2.22998046875, 2.3328857421875, 2.435791015625, 2.5386962890625, 2.6416015625, 2.7445068359375, 2.847412109375, 2.9503173828125, 3.05322265625, 3.1561279296875, 3.259033203125, 3.3619384765625, 3.46484375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 9.0, 6.0, 5.0, 9.0, 11.0, 14.0, 8.0, 17.0, 32.0, 37.0, 48.0, 104.0, 155.0, 346.0, 767.0, 2102.0, 7504.0, 33472.0, 175655.0, 877574.0, 1964520.0, 904873.0, 180829.0, 34418.0, 7845.0, 2157.0, 857.0, 393.0, 170.0, 115.0, 81.0, 30.0, 25.0, 31.0, 12.0, 15.0, 5.0, 13.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.19921875, -5.99603271484375, -5.7928466796875, -5.58966064453125, -5.386474609375, -5.18328857421875, -4.9801025390625, -4.77691650390625, -4.57373046875, -4.37054443359375, -4.1673583984375, -3.96417236328125, -3.760986328125, -3.55780029296875, -3.3546142578125, -3.15142822265625, -2.9482421875, -2.74505615234375, -2.5418701171875, -2.33868408203125, -2.135498046875, -1.93231201171875, -1.7291259765625, -1.52593994140625, -1.32275390625, -1.11956787109375, -0.9163818359375, -0.71319580078125, -0.510009765625, -0.30682373046875, -0.1036376953125, 0.09954833984375, 0.302734375, 0.50592041015625, 0.7091064453125, 0.91229248046875, 1.115478515625, 1.31866455078125, 1.5218505859375, 1.72503662109375, 1.92822265625, 2.13140869140625, 2.3345947265625, 2.53778076171875, 2.740966796875, 2.94415283203125, 3.1473388671875, 3.35052490234375, 3.5537109375, 3.75689697265625, 3.9600830078125, 4.16326904296875, 4.366455078125, 4.56964111328125, 4.7728271484375, 4.97601318359375, 5.17919921875, 5.38238525390625, 5.5855712890625, 5.78875732421875, 5.991943359375, 6.19512939453125, 6.3983154296875, 6.60150146484375, 6.8046875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 15.0, 25.0, 22.0, 37.0, 73.0, 94.0, 139.0, 220.0, 296.0, 404.0, 495.0, 547.0, 478.0, 355.0, 292.0, 169.0, 157.0, 85.0, 59.0, 42.0, 25.0, 14.0, 11.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.609375, -9.269775390625, -8.93017578125, -8.590576171875, -8.2509765625, -7.911376953125, -7.57177734375, -7.232177734375, -6.892578125, -6.552978515625, -6.21337890625, -5.873779296875, -5.5341796875, -5.194580078125, -4.85498046875, -4.515380859375, -4.17578125, -3.836181640625, -3.49658203125, -3.156982421875, -2.8173828125, -2.477783203125, -2.13818359375, -1.798583984375, -1.458984375, -1.119384765625, -0.77978515625, -0.440185546875, -0.1005859375, 0.239013671875, 0.57861328125, 0.918212890625, 1.2578125, 1.597412109375, 1.93701171875, 2.276611328125, 2.6162109375, 2.955810546875, 3.29541015625, 3.635009765625, 3.974609375, 4.314208984375, 4.65380859375, 4.993408203125, 5.3330078125, 5.672607421875, 6.01220703125, 6.351806640625, 6.69140625, 7.031005859375, 7.37060546875, 7.710205078125, 8.0498046875, 8.389404296875, 8.72900390625, 9.068603515625, 9.408203125, 9.747802734375, 10.08740234375, 10.427001953125, 10.7666015625, 11.106201171875, 11.44580078125, 11.785400390625, 12.125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 16.0, 16.0, 18.0, 44.0, 57.0, 107.0, 184.0, 291.0, 611.0, 1855.0, 18550.0, 479145.0, 3256708.0, 417382.0, 16421.0, 1623.0, 555.0, 273.0, 181.0, 88.0, 58.0, 38.0, 22.0, 16.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.890625, -21.29052734375, -20.6904296875, -20.09033203125, -19.490234375, -18.89013671875, -18.2900390625, -17.68994140625, -17.08984375, -16.48974609375, -15.8896484375, -15.28955078125, -14.689453125, -14.08935546875, -13.4892578125, -12.88916015625, -12.2890625, -11.68896484375, -11.0888671875, -10.48876953125, -9.888671875, -9.28857421875, -8.6884765625, -8.08837890625, -7.48828125, -6.88818359375, -6.2880859375, -5.68798828125, -5.087890625, -4.48779296875, -3.8876953125, -3.28759765625, -2.6875, -2.08740234375, -1.4873046875, -0.88720703125, -0.287109375, 0.31298828125, 0.9130859375, 1.51318359375, 2.11328125, 2.71337890625, 3.3134765625, 3.91357421875, 4.513671875, 5.11376953125, 5.7138671875, 6.31396484375, 6.9140625, 7.51416015625, 8.1142578125, 8.71435546875, 9.314453125, 9.91455078125, 10.5146484375, 11.11474609375, 11.71484375, 12.31494140625, 12.9150390625, 13.51513671875, 14.115234375, 14.71533203125, 15.3154296875, 15.91552734375, 16.515625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 9.0, 41.0, 93.0, 188.0, 217.0, 211.0, 151.0, 62.0, 29.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.044071197509766, -57.2835807800293, -54.523094177246094, -51.762603759765625, -49.002113342285156, -46.24162292480469, -43.481136322021484, -40.720645904541016, -37.96015930175781, -35.199668884277344, -32.43918228149414, -29.678691864013672, -26.918201446533203, -24.157712936401367, -21.39722442626953, -18.636734008789062, -15.876243591308594, -13.115754127502441, -10.355264663696289, -7.594776153564453, -4.834286689758301, -2.0737972259521484, 0.6866912841796875, 3.4471817016601562, 6.207670211791992, 8.968159675598145, 11.728649139404297, 14.489137649536133, 17.24962615966797, 20.010116577148438, 22.770605087280273, 25.531095504760742, 28.291587829589844, 31.05207633972168, 33.812564849853516, 36.573055267333984, 39.33354568481445, 42.094032287597656, 44.854522705078125, 47.615013122558594, 50.37550354003906, 53.13599395751953, 55.896480560302734, 58.6569709777832, 61.41746139526367, 64.17794799804688, 66.93843841552734, 69.69892883300781, 72.45941162109375, 75.21990203857422, 77.98039245605469, 80.74087524414062, 83.5013656616211, 86.26185607910156, 89.02234649658203, 91.7828369140625, 94.54332733154297, 97.30381774902344, 100.0643081665039, 102.82479858398438, 105.58528137207031, 108.34577178955078, 111.10626220703125, 113.86675262451172, 116.62724304199219]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 2.0, 2.0, 13.0, 6.0, 12.0, 15.0, 21.0, 25.0, 19.0, 30.0, 24.0, 32.0, 30.0, 37.0, 36.0, 58.0, 59.0, 48.0, 45.0, 36.0, 41.0, 41.0, 32.0, 30.0, 37.0, 30.0, 32.0, 33.0, 25.0, 27.0, 23.0, 22.0, 10.0, 13.0, 12.0, 9.0, 10.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.402509689331055, -29.45628547668457, -28.51006317138672, -27.563838958740234, -26.617616653442383, -25.6713924407959, -24.725170135498047, -23.778945922851562, -22.83272361755371, -21.886499404907227, -20.940277099609375, -19.99405288696289, -19.04783058166504, -18.101606369018555, -17.155384063720703, -16.20915985107422, -15.26293659210205, -14.316713333129883, -13.370490074157715, -12.424266815185547, -11.478043556213379, -10.531820297241211, -9.585596084594727, -8.639373779296875, -7.693150043487549, -6.746926784515381, -5.800703525543213, -4.854479789733887, -3.908256769180298, -2.962033271789551, -2.015810012817383, -1.0695867538452148, -0.12336349487304688, 0.8228598237037659, 1.7690831422805786, 2.715306520462036, 3.661529779434204, 4.607753276824951, 5.553976535797119, 6.500199794769287, 7.446423053741455, 8.392646789550781, 9.33887004852295, 10.285093307495117, 11.231316566467285, 12.177539825439453, 13.123763084411621, 14.069986343383789, 15.016209602355957, 15.962432861328125, 16.90865707397461, 17.85487937927246, 18.801103591918945, 19.747325897216797, 20.69355010986328, 21.639772415161133, 22.585996627807617, 23.5322208404541, 24.478443145751953, 25.424667358398438, 26.37088966369629, 27.317113876342773, 28.263336181640625, 29.20956039428711, 30.15578269958496]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 10.0, 6.0, 7.0, 10.0, 11.0, 16.0, 23.0, 23.0, 29.0, 25.0, 33.0, 27.0, 20.0, 28.0, 34.0, 31.0, 33.0, 45.0, 53.0, 37.0, 59.0, 40.0, 43.0, 34.0, 35.0, 33.0, 26.0, 32.0, 23.0, 24.0, 22.0, 13.0, 19.0, 15.0, 16.0, 17.0, 7.0, 8.0, 13.0, 9.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.359375, -3.25341796875, -3.1474609375, -3.04150390625, -2.935546875, -2.82958984375, -2.7236328125, -2.61767578125, -2.51171875, -2.40576171875, -2.2998046875, -2.19384765625, -2.087890625, -1.98193359375, -1.8759765625, -1.77001953125, -1.6640625, -1.55810546875, -1.4521484375, -1.34619140625, -1.240234375, -1.13427734375, -1.0283203125, -0.92236328125, -0.81640625, -0.71044921875, -0.6044921875, -0.49853515625, -0.392578125, -0.28662109375, -0.1806640625, -0.07470703125, 0.03125, 0.13720703125, 0.2431640625, 0.34912109375, 0.455078125, 0.56103515625, 0.6669921875, 0.77294921875, 0.87890625, 0.98486328125, 1.0908203125, 1.19677734375, 1.302734375, 1.40869140625, 1.5146484375, 1.62060546875, 1.7265625, 1.83251953125, 1.9384765625, 2.04443359375, 2.150390625, 2.25634765625, 2.3623046875, 2.46826171875, 2.57421875, 2.68017578125, 2.7861328125, 2.89208984375, 2.998046875, 3.10400390625, 3.2099609375, 3.31591796875, 3.421875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 7.0, 3.0, 7.0, 11.0, 11.0, 8.0, 16.0, 27.0, 54.0, 68.0, 93.0, 184.0, 303.0, 427.0, 688.0, 1003.0, 1597.0, 2472.0, 3911.0, 6070.0, 9863.0, 15873.0, 26030.0, 40967.0, 66148.0, 105822.0, 157698.0, 187558.0, 152367.0, 101001.0, 63406.0, 39354.0, 24681.0, 15097.0, 9594.0, 5874.0, 3676.0, 2421.0, 1523.0, 943.0, 634.0, 368.0, 269.0, 159.0, 105.0, 72.0, 30.0, 23.0, 17.0, 8.0, 7.0, 5.0, 1.0, 2.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3095703125, -0.2994041442871094, -0.28923797607421875, -0.2790718078613281, -0.2689056396484375, -0.2587394714355469, -0.24857330322265625, -0.23840713500976562, -0.228240966796875, -0.21807479858398438, -0.20790863037109375, -0.19774246215820312, -0.1875762939453125, -0.17741012573242188, -0.16724395751953125, -0.15707778930664062, -0.14691162109375, -0.13674545288085938, -0.12657928466796875, -0.11641311645507812, -0.1062469482421875, -0.09608078002929688, -0.08591461181640625, -0.07574844360351562, -0.065582275390625, -0.055416107177734375, -0.04524993896484375, -0.035083770751953125, -0.0249176025390625, -0.014751434326171875, -0.00458526611328125, 0.005580902099609375, 0.0157470703125, 0.025913238525390625, 0.03607940673828125, 0.046245574951171875, 0.0564117431640625, 0.06657791137695312, 0.07674407958984375, 0.08691024780273438, 0.097076416015625, 0.10724258422851562, 0.11740875244140625, 0.12757492065429688, 0.1377410888671875, 0.14790725708007812, 0.15807342529296875, 0.16823959350585938, 0.17840576171875, 0.18857192993164062, 0.19873809814453125, 0.20890426635742188, 0.2190704345703125, 0.22923660278320312, 0.23940277099609375, 0.24956893920898438, 0.259735107421875, 0.2699012756347656, 0.28006744384765625, 0.2902336120605469, 0.3003997802734375, 0.3105659484863281, 0.32073211669921875, 0.3308982849121094, 0.341064453125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 8.0, 12.0, 20.0, 14.0, 18.0, 18.0, 23.0, 24.0, 23.0, 30.0, 36.0, 36.0, 47.0, 41.0, 48.0, 39.0, 1066.0, 45.0, 52.0, 48.0, 37.0, 31.0, 34.0, 23.0, 35.0, 35.0, 36.0, 22.0, 12.0, 16.0, 18.0, 10.0, 16.0, 2.0, 5.0, 12.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.115234375, -2.044219970703125, -1.97320556640625, -1.902191162109375, -1.8311767578125, -1.760162353515625, -1.68914794921875, -1.618133544921875, -1.547119140625, -1.476104736328125, -1.40509033203125, -1.334075927734375, -1.2630615234375, -1.192047119140625, -1.12103271484375, -1.050018310546875, -0.97900390625, -0.907989501953125, -0.83697509765625, -0.765960693359375, -0.6949462890625, -0.623931884765625, -0.55291748046875, -0.481903076171875, -0.410888671875, -0.339874267578125, -0.26885986328125, -0.197845458984375, -0.1268310546875, -0.055816650390625, 0.01519775390625, 0.086212158203125, 0.1572265625, 0.228240966796875, 0.29925537109375, 0.370269775390625, 0.4412841796875, 0.512298583984375, 0.58331298828125, 0.654327392578125, 0.725341796875, 0.796356201171875, 0.86737060546875, 0.938385009765625, 1.0093994140625, 1.080413818359375, 1.15142822265625, 1.222442626953125, 1.29345703125, 1.364471435546875, 1.43548583984375, 1.506500244140625, 1.5775146484375, 1.648529052734375, 1.71954345703125, 1.790557861328125, 1.861572265625, 1.932586669921875, 2.00360107421875, 2.074615478515625, 2.1456298828125, 2.216644287109375, 2.28765869140625, 2.358673095703125, 2.4296875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 7.0, 14.0, 18.0, 44.0, 63.0, 89.0, 119.0, 191.0, 245.0, 439.0, 597.0, 904.0, 1522.0, 2322.0, 3593.0, 5687.0, 9153.0, 14845.0, 23644.0, 37588.0, 58439.0, 86845.0, 120606.0, 376570.0, 971600.0, 124973.0, 89739.0, 60798.0, 39509.0, 25103.0, 15639.0, 9737.0, 5973.0, 3764.0, 2359.0, 1517.0, 958.0, 651.0, 429.0, 272.0, 190.0, 123.0, 88.0, 58.0, 35.0, 21.0, 18.0, 12.0, 10.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1851806640625, -0.1795787811279297, -0.17397689819335938, -0.16837501525878906, -0.16277313232421875, -0.15717124938964844, -0.15156936645507812, -0.1459674835205078, -0.1403656005859375, -0.1347637176513672, -0.12916183471679688, -0.12355995178222656, -0.11795806884765625, -0.11235618591308594, -0.10675430297851562, -0.10115242004394531, -0.095550537109375, -0.08994865417480469, -0.08434677124023438, -0.07874488830566406, -0.07314300537109375, -0.06754112243652344, -0.061939239501953125, -0.05633735656738281, -0.0507354736328125, -0.04513359069824219, -0.039531707763671875, -0.03392982482910156, -0.02832794189453125, -0.022726058959960938, -0.017124176025390625, -0.011522293090820312, -0.00592041015625, -0.0003185272216796875, 0.005283355712890625, 0.010885238647460938, 0.01648712158203125, 0.022089004516601562, 0.027690887451171875, 0.03329277038574219, 0.0388946533203125, 0.04449653625488281, 0.050098419189453125, 0.05570030212402344, 0.06130218505859375, 0.06690406799316406, 0.07250595092773438, 0.07810783386230469, 0.083709716796875, 0.08931159973144531, 0.09491348266601562, 0.10051536560058594, 0.10611724853515625, 0.11171913146972656, 0.11732101440429688, 0.12292289733886719, 0.1285247802734375, 0.1341266632080078, 0.13972854614257812, 0.14533042907714844, 0.15093231201171875, 0.15653419494628906, 0.16213607788085938, 0.1677379608154297, 0.17333984375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 10.0, 16.0, 14.0, 15.0, 16.0, 20.0, 21.0, 32.0, 32.0, 47.0, 37.0, 51.0, 73.0, 113.0, 98.0, 88.0, 45.0, 26.0, 35.0, 37.0, 24.0, 19.0, 20.0, 17.0, 16.0, 24.0, 10.0, 5.0, 6.0, 6.0, 1.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.007534027099609375, -0.007284224033355713, -0.007034420967102051, -0.006784617900848389, -0.0065348148345947266, -0.0062850117683410645, -0.006035208702087402, -0.00578540563583374, -0.005535602569580078, -0.005285799503326416, -0.005035996437072754, -0.004786193370819092, -0.00453639030456543, -0.004286587238311768, -0.0040367841720581055, -0.0037869811058044434, -0.0035371780395507812, -0.003287374973297119, -0.003037571907043457, -0.002787768840789795, -0.002537965774536133, -0.0022881627082824707, -0.0020383596420288086, -0.0017885565757751465, -0.0015387535095214844, -0.0012889504432678223, -0.0010391473770141602, -0.000789344310760498, -0.0005395412445068359, -0.00028973817825317383, -3.993511199951172e-05, 0.0002098679542541504, 0.0004596710205078125, 0.0007094740867614746, 0.0009592771530151367, 0.0012090802192687988, 0.001458883285522461, 0.001708686351776123, 0.001958489418029785, 0.0022082924842834473, 0.0024580955505371094, 0.0027078986167907715, 0.0029577016830444336, 0.0032075047492980957, 0.003457307815551758, 0.00370711088180542, 0.003956913948059082, 0.004206717014312744, 0.004456520080566406, 0.004706323146820068, 0.0049561262130737305, 0.005205929279327393, 0.005455732345581055, 0.005705535411834717, 0.005955338478088379, 0.006205141544342041, 0.006454944610595703, 0.006704747676849365, 0.006954550743103027, 0.0072043538093566895, 0.0074541568756103516, 0.007703959941864014, 0.007953763008117676, 0.008203566074371338, 0.008453369140625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 1.0, 4.0, 7.0, 3.0, 8.0, 18.0, 18.0, 23.0, 15.0, 28.0, 26.0, 45.0, 63.0, 88.0, 269.0, 1329.0, 43504.0, 987592.0, 14111.0, 823.0, 216.0, 101.0, 56.0, 45.0, 26.0, 30.0, 19.0, 16.0, 12.0, 11.0, 10.0, 17.0, 2.0, 3.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1876220703125, -0.1816425323486328, -0.17566299438476562, -0.16968345642089844, -0.16370391845703125, -0.15772438049316406, -0.15174484252929688, -0.1457653045654297, -0.1397857666015625, -0.1338062286376953, -0.12782669067382812, -0.12184715270996094, -0.11586761474609375, -0.10988807678222656, -0.10390853881835938, -0.09792900085449219, -0.091949462890625, -0.08596992492675781, -0.07999038696289062, -0.07401084899902344, -0.06803131103515625, -0.06205177307128906, -0.056072235107421875, -0.05009269714355469, -0.0441131591796875, -0.03813362121582031, -0.032154083251953125, -0.026174545288085938, -0.02019500732421875, -0.014215469360351562, -0.008235931396484375, -0.0022563934326171875, 0.00372314453125, 0.009702682495117188, 0.015682220458984375, 0.021661758422851562, 0.02764129638671875, 0.03362083435058594, 0.039600372314453125, 0.04557991027832031, 0.0515594482421875, 0.05753898620605469, 0.06351852416992188, 0.06949806213378906, 0.07547760009765625, 0.08145713806152344, 0.08743667602539062, 0.09341621398925781, 0.099395751953125, 0.10537528991699219, 0.11135482788085938, 0.11733436584472656, 0.12331390380859375, 0.12929344177246094, 0.13527297973632812, 0.1412525177001953, 0.1472320556640625, 0.1532115936279297, 0.15919113159179688, 0.16517066955566406, 0.17115020751953125, 0.17712974548339844, 0.18310928344726562, 0.1890888214111328, 0.195068359375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 22.0, 55.0, 180.0, 443.0, 193.0, 62.0, 30.0, 7.0, 9.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047456078231334686, -0.04594796150922775, -0.04443984851241112, -0.04293173551559448, -0.04142361879348755, -0.039915502071380615, -0.03840738907456398, -0.036899276077747345, -0.03539115935564041, -0.03388304263353348, -0.03237492963671684, -0.03086681477725506, -0.029358699917793274, -0.02785058505833149, -0.026342470198869705, -0.02483435533940792, -0.023326240479946136, -0.021818125620484352, -0.020310010761022568, -0.018801895901560783, -0.017293781042099, -0.015785666182637215, -0.01427755132317543, -0.012769436463713646, -0.011261321604251862, -0.009753206744790077, -0.008245091885328293, -0.0067369770258665085, -0.005228862166404724, -0.0037207473069429398, -0.0022126324474811554, -0.000704517588019371, 0.0008035972714424133, 0.0023117121309041977, 0.003819826990365982, 0.005327941849827766, 0.006836056709289551, 0.008344171568751335, 0.00985228642821312, 0.011360401287674904, 0.012868516147136688, 0.014376631006598473, 0.015884745866060257, 0.01739286072552204, 0.018900975584983826, 0.02040909044444561, 0.021917205303907394, 0.02342532016336918, 0.024933435022830963, 0.026441549882292747, 0.027949664741754532, 0.029457779601216316, 0.0309658944606781, 0.032474011182785034, 0.03398212417960167, 0.035490237176418304, 0.03699835389852524, 0.03850647062063217, 0.04001458361744881, 0.04152269661426544, 0.043030813336372375, 0.04453893005847931, 0.046047043055295944, 0.04755515605211258, 0.04906327277421951]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 7.0, 5.0, 10.0, 8.0, 8.0, 13.0, 20.0, 13.0, 14.0, 23.0, 20.0, 21.0, 37.0, 29.0, 31.0, 35.0, 25.0, 27.0, 46.0, 52.0, 38.0, 37.0, 37.0, 41.0, 31.0, 31.0, 44.0, 27.0, 33.0, 30.0, 23.0, 22.0, 19.0, 26.0, 19.0, 15.0, 14.0, 15.0, 13.0, 6.0, 8.0, 3.0, 5.0, 3.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.009925782680511475, -0.00963624007999897, -0.009346697479486465, -0.009057154878973961, -0.008767612278461456, -0.008478069677948952, -0.008188527077436447, -0.007898984476923943, -0.007609441876411438, -0.007319899275898933, -0.007030356675386429, -0.006740814074873924, -0.00645127147436142, -0.006161728873848915, -0.0058721862733364105, -0.005582643672823906, -0.005293101072311401, -0.005003558471798897, -0.004714015871286392, -0.004424473270773888, -0.004134930670261383, -0.0038453880697488785, -0.003555845469236374, -0.0032663028687238693, -0.0029767602682113647, -0.00268721766769886, -0.0023976750671863556, -0.002108132466673851, -0.0018185898661613464, -0.0015290472656488419, -0.0012395046651363373, -0.0009499620646238327, -0.0006604194641113281, -0.00037087686359882355, -8.133426308631897e-05, 0.0002082083374261856, 0.0004977509379386902, 0.0007872935384511948, 0.0010768361389636993, 0.001366378739476204, 0.0016559213399887085, 0.001945463940501213, 0.0022350065410137177, 0.0025245491415262222, 0.002814091742038727, 0.0031036343425512314, 0.003393176943063736, 0.0036827195435762405, 0.003972262144088745, 0.00426180474460125, 0.004551347345113754, 0.004840889945626259, 0.005130432546138763, 0.005419975146651268, 0.005709517747163773, 0.005999060347676277, 0.006288602948188782, 0.006578145548701286, 0.006867688149213791, 0.0071572307497262955, 0.0074467733502388, 0.007736315950751305, 0.00802585855126381, 0.008315401151776314, 0.008604943752288818]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 10.0, 6.0, 8.0, 9.0, 10.0, 17.0, 23.0, 24.0, 28.0, 25.0, 33.0, 27.0, 20.0, 28.0, 34.0, 31.0, 33.0, 45.0, 53.0, 37.0, 59.0, 40.0, 43.0, 34.0, 35.0, 33.0, 26.0, 32.0, 23.0, 24.0, 22.0, 13.0, 19.0, 15.0, 16.0, 17.0, 7.0, 8.0, 13.0, 9.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.359375, -3.25341796875, -3.1474609375, -3.04150390625, -2.935546875, -2.82958984375, -2.7236328125, -2.61767578125, -2.51171875, -2.40576171875, -2.2998046875, -2.19384765625, -2.087890625, -1.98193359375, -1.8759765625, -1.77001953125, -1.6640625, -1.55810546875, -1.4521484375, -1.34619140625, -1.240234375, -1.13427734375, -1.0283203125, -0.92236328125, -0.81640625, -0.71044921875, -0.6044921875, -0.49853515625, -0.392578125, -0.28662109375, -0.1806640625, -0.07470703125, 0.03125, 0.13720703125, 0.2431640625, 0.34912109375, 0.455078125, 0.56103515625, 0.6669921875, 0.77294921875, 0.87890625, 0.98486328125, 1.0908203125, 1.19677734375, 1.302734375, 1.40869140625, 1.5146484375, 1.62060546875, 1.7265625, 1.83251953125, 1.9384765625, 2.04443359375, 2.150390625, 2.25634765625, 2.3623046875, 2.46826171875, 2.57421875, 2.68017578125, 2.7861328125, 2.89208984375, 2.998046875, 3.10400390625, 3.2099609375, 3.31591796875, 3.421875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 8.0, 9.0, 16.0, 19.0, 33.0, 44.0, 47.0, 85.0, 139.0, 257.0, 442.0, 689.0, 1307.0, 2382.0, 4517.0, 8227.0, 15233.0, 27502.0, 49429.0, 90121.0, 161495.0, 243694.0, 195244.0, 111222.0, 60923.0, 33876.0, 18864.0, 10300.0, 5620.0, 3009.0, 1660.0, 886.0, 466.0, 310.0, 172.0, 99.0, 67.0, 39.0, 27.0, 22.0, 12.0, 11.0, 11.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.78125, -2.68426513671875, -2.5872802734375, -2.49029541015625, -2.393310546875, -2.29632568359375, -2.1993408203125, -2.10235595703125, -2.00537109375, -1.90838623046875, -1.8114013671875, -1.71441650390625, -1.617431640625, -1.52044677734375, -1.4234619140625, -1.32647705078125, -1.2294921875, -1.13250732421875, -1.0355224609375, -0.93853759765625, -0.841552734375, -0.74456787109375, -0.6475830078125, -0.55059814453125, -0.45361328125, -0.35662841796875, -0.2596435546875, -0.16265869140625, -0.065673828125, 0.03131103515625, 0.1282958984375, 0.22528076171875, 0.322265625, 0.41925048828125, 0.5162353515625, 0.61322021484375, 0.710205078125, 0.80718994140625, 0.9041748046875, 1.00115966796875, 1.09814453125, 1.19512939453125, 1.2921142578125, 1.38909912109375, 1.486083984375, 1.58306884765625, 1.6800537109375, 1.77703857421875, 1.8740234375, 1.97100830078125, 2.0679931640625, 2.16497802734375, 2.261962890625, 2.35894775390625, 2.4559326171875, 2.55291748046875, 2.64990234375, 2.74688720703125, 2.8438720703125, 2.94085693359375, 3.037841796875, 3.13482666015625, 3.2318115234375, 3.32879638671875, 3.42578125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 7.0, 6.0, 11.0, 10.0, 19.0, 16.0, 24.0, 36.0, 39.0, 35.0, 53.0, 51.0, 75.0, 128.0, 247.0, 1461.0, 291.0, 141.0, 82.0, 56.0, 55.0, 36.0, 42.0, 30.0, 17.0, 26.0, 19.0, 9.0, 9.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.921875, -22.3431396484375, -21.764404296875, -21.1856689453125, -20.60693359375, -20.0281982421875, -19.449462890625, -18.8707275390625, -18.2919921875, -17.7132568359375, -17.134521484375, -16.5557861328125, -15.97705078125, -15.3983154296875, -14.819580078125, -14.2408447265625, -13.662109375, -13.0833740234375, -12.504638671875, -11.9259033203125, -11.34716796875, -10.7684326171875, -10.189697265625, -9.6109619140625, -9.0322265625, -8.4534912109375, -7.874755859375, -7.2960205078125, -6.71728515625, -6.1385498046875, -5.559814453125, -4.9810791015625, -4.40234375, -3.8236083984375, -3.244873046875, -2.6661376953125, -2.08740234375, -1.5086669921875, -0.929931640625, -0.3511962890625, 0.2275390625, 0.8062744140625, 1.385009765625, 1.9637451171875, 2.54248046875, 3.1212158203125, 3.699951171875, 4.2786865234375, 4.857421875, 5.4361572265625, 6.014892578125, 6.5936279296875, 7.17236328125, 7.7510986328125, 8.329833984375, 8.9085693359375, 9.4873046875, 10.0660400390625, 10.644775390625, 11.2235107421875, 11.80224609375, 12.3809814453125, 12.959716796875, 13.5384521484375, 14.1171875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 17.0, 22.0, 18.0, 23.0, 46.0, 43.0, 60.0, 113.0, 142.0, 207.0, 317.0, 656.0, 3198.0, 500977.0, 2631152.0, 6611.0, 902.0, 381.0, 238.0, 151.0, 103.0, 79.0, 70.0, 48.0, 22.0, 23.0, 24.0, 7.0, 18.0, 12.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.484375, -29.220947265625, -27.95751953125, -26.694091796875, -25.4306640625, -24.167236328125, -22.90380859375, -21.640380859375, -20.376953125, -19.113525390625, -17.85009765625, -16.586669921875, -15.3232421875, -14.059814453125, -12.79638671875, -11.532958984375, -10.26953125, -9.006103515625, -7.74267578125, -6.479248046875, -5.2158203125, -3.952392578125, -2.68896484375, -1.425537109375, -0.162109375, 1.101318359375, 2.36474609375, 3.628173828125, 4.8916015625, 6.155029296875, 7.41845703125, 8.681884765625, 9.9453125, 11.208740234375, 12.47216796875, 13.735595703125, 14.9990234375, 16.262451171875, 17.52587890625, 18.789306640625, 20.052734375, 21.316162109375, 22.57958984375, 23.843017578125, 25.1064453125, 26.369873046875, 27.63330078125, 28.896728515625, 30.16015625, 31.423583984375, 32.68701171875, 33.950439453125, 35.2138671875, 36.477294921875, 37.74072265625, 39.004150390625, 40.267578125, 41.531005859375, 42.79443359375, 44.057861328125, 45.3212890625, 46.584716796875, 47.84814453125, 49.111572265625, 50.375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 81.0, 297.0, 405.0, 171.0, 43.0, 9.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.115962982177734, -55.38356399536133, -52.65116500854492, -49.91876983642578, -47.186370849609375, -44.45397186279297, -41.72157287597656, -38.989173889160156, -36.25677490234375, -33.524375915527344, -30.791976928710938, -28.059579849243164, -25.327180862426758, -22.59478187561035, -19.862384796142578, -17.129985809326172, -14.397586822509766, -11.66518783569336, -8.93278980255127, -6.20039176940918, -3.4679927825927734, -0.7355937957763672, 1.9968032836914062, 4.7292022705078125, 7.461601257324219, 10.194000244140625, 12.926398277282715, 15.658796310424805, 18.39119529724121, 21.123594284057617, 23.85599136352539, 26.588390350341797, 29.320785522460938, 32.053184509277344, 34.78558349609375, 37.517982482910156, 40.25038146972656, 42.98278045654297, 45.71517562866211, 48.447574615478516, 51.17997360229492, 53.91237258911133, 56.644771575927734, 59.377166748046875, 62.10956573486328, 64.84196472167969, 67.5743637084961, 70.3067626953125, 73.0391616821289, 75.77156066894531, 78.50395965576172, 81.23635864257812, 83.96875762939453, 86.70115661621094, 89.43354797363281, 92.16595458984375, 94.89834594726562, 97.63074493408203, 100.36314392089844, 103.09554290771484, 105.82794189453125, 108.56034088134766, 111.29273986816406, 114.02513122558594, 116.75753784179688]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 9.0, 7.0, 10.0, 9.0, 13.0, 15.0, 16.0, 22.0, 28.0, 16.0, 26.0, 10.0, 34.0, 34.0, 33.0, 37.0, 45.0, 39.0, 43.0, 19.0, 42.0, 40.0, 41.0, 38.0, 50.0, 48.0, 28.0, 32.0, 30.0, 20.0, 25.0, 14.0, 23.0, 12.0, 16.0, 12.0, 10.0, 13.0, 10.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-33.09831619262695, -32.14722442626953, -31.196136474609375, -30.245046615600586, -29.293956756591797, -28.342866897583008, -27.39177703857422, -26.440685272216797, -25.48959732055664, -24.53850746154785, -23.587417602539062, -22.636327743530273, -21.685237884521484, -20.734148025512695, -19.783058166503906, -18.831966400146484, -17.880876541137695, -16.929786682128906, -15.978696823120117, -15.027606964111328, -14.076517105102539, -13.12542724609375, -12.174336433410645, -11.223246574401855, -10.272156715393066, -9.321066856384277, -8.369976997375488, -7.418886661529541, -6.467796802520752, -5.516706943511963, -4.565616607666016, -3.6145267486572266, -2.6634349822998047, -1.712345004081726, -0.7612550258636475, 0.1898350715637207, 1.1409249305725098, 2.092014789581299, 3.043105125427246, 3.994194984436035, 4.945284843444824, 5.896374702453613, 6.847464561462402, 7.79855489730835, 8.749645233154297, 9.700735092163086, 10.651824951171875, 11.602914810180664, 12.554004669189453, 13.505094528198242, 14.456184387207031, 15.40727424621582, 16.35836410522461, 17.3094539642334, 18.260543823242188, 19.21163558959961, 20.162723541259766, 21.113813400268555, 22.064903259277344, 23.015993118286133, 23.967082977294922, 24.91817283630371, 25.8692626953125, 26.820354461669922, 27.77144432067871]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 7.0, 13.0, 13.0, 12.0, 21.0, 18.0, 20.0, 24.0, 19.0, 29.0, 23.0, 28.0, 30.0, 28.0, 32.0, 40.0, 44.0, 42.0, 36.0, 40.0, 36.0, 29.0, 43.0, 36.0, 44.0, 31.0, 20.0, 23.0, 26.0, 26.0, 19.0, 16.0, 15.0, 16.0, 17.0, 21.0, 12.0, 5.0, 6.0, 7.0, 3.0, 8.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.546875, -3.4373779296875, -3.327880859375, -3.2183837890625, -3.10888671875, -2.9993896484375, -2.889892578125, -2.7803955078125, -2.6708984375, -2.5614013671875, -2.451904296875, -2.3424072265625, -2.23291015625, -2.1234130859375, -2.013916015625, -1.9044189453125, -1.794921875, -1.6854248046875, -1.575927734375, -1.4664306640625, -1.35693359375, -1.2474365234375, -1.137939453125, -1.0284423828125, -0.9189453125, -0.8094482421875, -0.699951171875, -0.5904541015625, -0.48095703125, -0.3714599609375, -0.261962890625, -0.1524658203125, -0.04296875, 0.0665283203125, 0.176025390625, 0.2855224609375, 0.39501953125, 0.5045166015625, 0.614013671875, 0.7235107421875, 0.8330078125, 0.9425048828125, 1.052001953125, 1.1614990234375, 1.27099609375, 1.3804931640625, 1.489990234375, 1.5994873046875, 1.708984375, 1.8184814453125, 1.927978515625, 2.0374755859375, 2.14697265625, 2.2564697265625, 2.365966796875, 2.4754638671875, 2.5849609375, 2.6944580078125, 2.803955078125, 2.9134521484375, 3.02294921875, 3.1324462890625, 3.241943359375, 3.3514404296875, 3.4609375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 10.0, 13.0, 5.0, 19.0, 11.0, 15.0, 21.0, 17.0, 20.0, 22.0, 22.0, 36.0, 42.0, 75.0, 155.0, 314.0, 938.0, 4448.0, 42489.0, 592229.0, 2635442.0, 845775.0, 63887.0, 6104.0, 1219.0, 406.0, 158.0, 104.0, 50.0, 34.0, 27.0, 35.0, 24.0, 13.0, 20.0, 11.0, 11.0, 7.0, 13.0, 8.0, 4.0, 9.0, 4.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.8203125, -10.4881591796875, -10.156005859375, -9.8238525390625, -9.49169921875, -9.1595458984375, -8.827392578125, -8.4952392578125, -8.1630859375, -7.8309326171875, -7.498779296875, -7.1666259765625, -6.83447265625, -6.5023193359375, -6.170166015625, -5.8380126953125, -5.505859375, -5.1737060546875, -4.841552734375, -4.5093994140625, -4.17724609375, -3.8450927734375, -3.512939453125, -3.1807861328125, -2.8486328125, -2.5164794921875, -2.184326171875, -1.8521728515625, -1.52001953125, -1.1878662109375, -0.855712890625, -0.5235595703125, -0.19140625, 0.1407470703125, 0.472900390625, 0.8050537109375, 1.13720703125, 1.4693603515625, 1.801513671875, 2.1336669921875, 2.4658203125, 2.7979736328125, 3.130126953125, 3.4622802734375, 3.79443359375, 4.1265869140625, 4.458740234375, 4.7908935546875, 5.123046875, 5.4552001953125, 5.787353515625, 6.1195068359375, 6.45166015625, 6.7838134765625, 7.115966796875, 7.4481201171875, 7.7802734375, 8.1124267578125, 8.444580078125, 8.7767333984375, 9.10888671875, 9.4410400390625, 9.773193359375, 10.1053466796875, 10.4375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 9.0, 7.0, 7.0, 21.0, 25.0, 28.0, 22.0, 18.0, 38.0, 37.0, 49.0, 66.0, 69.0, 99.0, 125.0, 167.0, 148.0, 175.0, 232.0, 258.0, 268.0, 279.0, 272.0, 260.0, 226.0, 192.0, 178.0, 153.0, 129.0, 89.0, 76.0, 68.0, 54.0, 37.0, 37.0, 25.0, 26.0, 19.0, 20.0, 9.0, 15.0, 6.0, 10.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-5.6484375, -5.46844482421875, -5.2884521484375, -5.10845947265625, -4.928466796875, -4.74847412109375, -4.5684814453125, -4.38848876953125, -4.20849609375, -4.02850341796875, -3.8485107421875, -3.66851806640625, -3.488525390625, -3.30853271484375, -3.1285400390625, -2.94854736328125, -2.7685546875, -2.58856201171875, -2.4085693359375, -2.22857666015625, -2.048583984375, -1.86859130859375, -1.6885986328125, -1.50860595703125, -1.32861328125, -1.14862060546875, -0.9686279296875, -0.78863525390625, -0.608642578125, -0.42864990234375, -0.2486572265625, -0.06866455078125, 0.111328125, 0.29132080078125, 0.4713134765625, 0.65130615234375, 0.831298828125, 1.01129150390625, 1.1912841796875, 1.37127685546875, 1.55126953125, 1.73126220703125, 1.9112548828125, 2.09124755859375, 2.271240234375, 2.45123291015625, 2.6312255859375, 2.81121826171875, 2.9912109375, 3.17120361328125, 3.3511962890625, 3.53118896484375, 3.711181640625, 3.89117431640625, 4.0711669921875, 4.25115966796875, 4.43115234375, 4.61114501953125, 4.7911376953125, 4.97113037109375, 5.151123046875, 5.33111572265625, 5.5111083984375, 5.69110107421875, 5.87109375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 7.0, 5.0, 10.0, 10.0, 17.0, 10.0, 23.0, 23.0, 22.0, 33.0, 50.0, 54.0, 62.0, 80.0, 116.0, 135.0, 178.0, 266.0, 443.0, 1009.0, 3406.0, 19918.0, 159823.0, 1230331.0, 2267990.0, 446284.0, 52937.0, 7508.0, 1685.0, 615.0, 346.0, 205.0, 164.0, 109.0, 72.0, 70.0, 53.0, 33.0, 35.0, 26.0, 31.0, 31.0, 15.0, 7.0, 9.0, 5.0, 7.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-12.7734375, -12.38916015625, -12.0048828125, -11.62060546875, -11.236328125, -10.85205078125, -10.4677734375, -10.08349609375, -9.69921875, -9.31494140625, -8.9306640625, -8.54638671875, -8.162109375, -7.77783203125, -7.3935546875, -7.00927734375, -6.625, -6.24072265625, -5.8564453125, -5.47216796875, -5.087890625, -4.70361328125, -4.3193359375, -3.93505859375, -3.55078125, -3.16650390625, -2.7822265625, -2.39794921875, -2.013671875, -1.62939453125, -1.2451171875, -0.86083984375, -0.4765625, -0.09228515625, 0.2919921875, 0.67626953125, 1.060546875, 1.44482421875, 1.8291015625, 2.21337890625, 2.59765625, 2.98193359375, 3.3662109375, 3.75048828125, 4.134765625, 4.51904296875, 4.9033203125, 5.28759765625, 5.671875, 6.05615234375, 6.4404296875, 6.82470703125, 7.208984375, 7.59326171875, 7.9775390625, 8.36181640625, 8.74609375, 9.13037109375, 9.5146484375, 9.89892578125, 10.283203125, 10.66748046875, 11.0517578125, 11.43603515625, 11.8203125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 16.0, 50.0, 87.0, 153.0, 200.0, 215.0, 152.0, 74.0, 42.0, 16.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.947265625, -97.4390869140625, -94.93091583251953, -92.42273712158203, -89.91455841064453, -87.40638732910156, -84.89820861816406, -82.39002990722656, -79.88185119628906, -77.37367248535156, -74.8655014038086, -72.3573226928711, -69.8491439819336, -67.34097290039062, -64.83279418945312, -62.324615478515625, -59.816444396972656, -57.30826950073242, -54.80009078979492, -52.29191589355469, -49.78373718261719, -47.27556228637695, -44.76738739013672, -42.25920867919922, -39.751033782958984, -37.24285888671875, -34.73468017578125, -32.226505279541016, -29.71832847595215, -27.21015167236328, -24.701976776123047, -22.19379997253418, -19.685630798339844, -17.177453994750977, -14.669278144836426, -12.161102294921875, -9.652925491333008, -7.144748687744141, -4.63657283782959, -2.128396987915039, 0.3797798156738281, 2.887956142425537, 5.396132469177246, 7.904308795928955, 10.412485122680664, 12.920661926269531, 15.428837776184082, 17.937013626098633, 20.4451904296875, 22.953367233276367, 25.461544036865234, 27.96971893310547, 30.477895736694336, 32.9860725402832, 35.49424743652344, 38.00242614746094, 40.51060104370117, 43.018775939941406, 45.526954650878906, 48.03512954711914, 50.543304443359375, 53.051483154296875, 55.55965805053711, 58.067832946777344, 60.576011657714844]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 10.0, 9.0, 20.0, 19.0, 23.0, 23.0, 27.0, 26.0, 26.0, 39.0, 41.0, 48.0, 44.0, 46.0, 43.0, 42.0, 43.0, 56.0, 44.0, 34.0, 32.0, 35.0, 37.0, 39.0, 30.0, 33.0, 25.0, 19.0, 20.0, 5.0, 6.0, 8.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-34.479705810546875, -33.51327133178711, -32.54683303833008, -31.580398559570312, -30.613964080810547, -29.64752769470215, -28.68109130859375, -27.714656829833984, -26.748220443725586, -25.781784057617188, -24.815349578857422, -23.848913192749023, -22.882476806640625, -21.91604232788086, -20.94960594177246, -19.983169555664062, -19.016735076904297, -18.0502986907959, -17.083864212036133, -16.117427825927734, -15.150992393493652, -14.18455696105957, -13.218120574951172, -12.25168514251709, -11.285249710083008, -10.318814277648926, -9.352378845214844, -8.385942459106445, -7.419507026672363, -6.453071594238281, -5.486635684967041, -4.520199775695801, -3.5537643432617188, -2.5873286724090576, -1.6208930015563965, -0.6544573307037354, 0.3119783401489258, 1.2784137725830078, 2.244849681854248, 3.2112855911254883, 4.17772102355957, 5.144156455993652, 6.110592365264893, 7.077028274536133, 8.043463706970215, 9.009899139404297, 9.976335525512695, 10.942770957946777, 11.90920639038086, 12.875641822814941, 13.842077255249023, 14.808513641357422, 15.774949073791504, 16.741384506225586, 17.707820892333984, 18.67425537109375, 19.64069175720215, 20.607128143310547, 21.573562622070312, 22.53999900817871, 23.50643539428711, 24.472869873046875, 25.439306259155273, 26.405742645263672, 27.372177124023438]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 10.0, 9.0, 12.0, 16.0, 7.0, 15.0, 16.0, 22.0, 23.0, 35.0, 22.0, 35.0, 26.0, 28.0, 26.0, 46.0, 26.0, 41.0, 42.0, 44.0, 39.0, 40.0, 43.0, 38.0, 31.0, 20.0, 22.0, 41.0, 21.0, 26.0, 21.0, 21.0, 21.0, 18.0, 16.0, 12.0, 12.0, 7.0, 12.0, 9.0, 5.0, 6.0, 7.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.376953125, -3.271209716796875, -3.16546630859375, -3.059722900390625, -2.9539794921875, -2.848236083984375, -2.74249267578125, -2.636749267578125, -2.531005859375, -2.425262451171875, -2.31951904296875, -2.213775634765625, -2.1080322265625, -2.002288818359375, -1.89654541015625, -1.790802001953125, -1.68505859375, -1.579315185546875, -1.47357177734375, -1.367828369140625, -1.2620849609375, -1.156341552734375, -1.05059814453125, -0.944854736328125, -0.839111328125, -0.733367919921875, -0.62762451171875, -0.521881103515625, -0.4161376953125, -0.310394287109375, -0.20465087890625, -0.098907470703125, 0.0068359375, 0.112579345703125, 0.21832275390625, 0.324066162109375, 0.4298095703125, 0.535552978515625, 0.64129638671875, 0.747039794921875, 0.852783203125, 0.958526611328125, 1.06427001953125, 1.170013427734375, 1.2757568359375, 1.381500244140625, 1.48724365234375, 1.592987060546875, 1.69873046875, 1.804473876953125, 1.91021728515625, 2.015960693359375, 2.1217041015625, 2.227447509765625, 2.33319091796875, 2.438934326171875, 2.544677734375, 2.650421142578125, 2.75616455078125, 2.861907958984375, 2.9676513671875, 3.073394775390625, 3.17913818359375, 3.284881591796875, 3.390625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 5.0, 10.0, 30.0, 31.0, 41.0, 77.0, 103.0, 180.0, 251.0, 422.0, 631.0, 919.0, 1343.0, 2145.0, 3277.0, 4815.0, 7259.0, 11364.0, 17617.0, 27314.0, 42119.0, 65554.0, 98692.0, 141280.0, 171963.0, 147998.0, 105428.0, 69745.0, 45107.0, 29119.0, 18849.0, 11865.0, 7784.0, 5169.0, 3402.0, 2306.0, 1431.0, 986.0, 680.0, 450.0, 285.0, 168.0, 119.0, 71.0, 63.0, 28.0, 23.0, 14.0, 9.0, 5.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.3662109375, -0.3549690246582031, -0.34372711181640625, -0.3324851989746094, -0.3212432861328125, -0.3100013732910156, -0.29875946044921875, -0.2875175476074219, -0.276275634765625, -0.2650337219238281, -0.25379180908203125, -0.24254989624023438, -0.2313079833984375, -0.22006607055664062, -0.20882415771484375, -0.19758224487304688, -0.18634033203125, -0.17509841918945312, -0.16385650634765625, -0.15261459350585938, -0.1413726806640625, -0.13013076782226562, -0.11888885498046875, -0.10764694213867188, -0.096405029296875, -0.08516311645507812, -0.07392120361328125, -0.06267929077148438, -0.0514373779296875, -0.040195465087890625, -0.02895355224609375, -0.017711639404296875, -0.0064697265625, 0.004772186279296875, 0.01601409912109375, 0.027256011962890625, 0.0384979248046875, 0.049739837646484375, 0.06098175048828125, 0.07222366333007812, 0.083465576171875, 0.09470748901367188, 0.10594940185546875, 0.11719131469726562, 0.1284332275390625, 0.13967514038085938, 0.15091705322265625, 0.16215896606445312, 0.17340087890625, 0.18464279174804688, 0.19588470458984375, 0.20712661743164062, 0.2183685302734375, 0.22961044311523438, 0.24085235595703125, 0.2520942687988281, 0.263336181640625, 0.2745780944824219, 0.28582000732421875, 0.2970619201660156, 0.3083038330078125, 0.3195457458496094, 0.33078765869140625, 0.3420295715332031, 0.353271484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 16.0, 14.0, 13.0, 14.0, 26.0, 14.0, 33.0, 21.0, 26.0, 23.0, 33.0, 31.0, 50.0, 37.0, 42.0, 37.0, 34.0, 1053.0, 45.0, 43.0, 32.0, 34.0, 34.0, 37.0, 28.0, 39.0, 29.0, 18.0, 17.0, 12.0, 16.0, 20.0, 11.0, 15.0, 14.0, 5.0, 17.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.3359375, -2.265380859375, -2.19482421875, -2.124267578125, -2.0537109375, -1.983154296875, -1.91259765625, -1.842041015625, -1.771484375, -1.700927734375, -1.63037109375, -1.559814453125, -1.4892578125, -1.418701171875, -1.34814453125, -1.277587890625, -1.20703125, -1.136474609375, -1.06591796875, -0.995361328125, -0.9248046875, -0.854248046875, -0.78369140625, -0.713134765625, -0.642578125, -0.572021484375, -0.50146484375, -0.430908203125, -0.3603515625, -0.289794921875, -0.21923828125, -0.148681640625, -0.078125, -0.007568359375, 0.06298828125, 0.133544921875, 0.2041015625, 0.274658203125, 0.34521484375, 0.415771484375, 0.486328125, 0.556884765625, 0.62744140625, 0.697998046875, 0.7685546875, 0.839111328125, 0.90966796875, 0.980224609375, 1.05078125, 1.121337890625, 1.19189453125, 1.262451171875, 1.3330078125, 1.403564453125, 1.47412109375, 1.544677734375, 1.615234375, 1.685791015625, 1.75634765625, 1.826904296875, 1.8974609375, 1.968017578125, 2.03857421875, 2.109130859375, 2.1796875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 11.0, 6.0, 14.0, 18.0, 41.0, 39.0, 63.0, 95.0, 154.0, 255.0, 410.0, 658.0, 1033.0, 1905.0, 2970.0, 5019.0, 8814.0, 15213.0, 26286.0, 45429.0, 75048.0, 118595.0, 177557.0, 1218396.0, 149561.0, 100593.0, 61387.0, 36268.0, 21392.0, 12319.0, 7110.0, 4181.0, 2407.0, 1452.0, 882.0, 559.0, 363.0, 216.0, 161.0, 94.0, 60.0, 39.0, 26.0, 13.0, 12.0, 3.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.249267578125, -0.24155044555664062, -0.23383331298828125, -0.22611618041992188, -0.2183990478515625, -0.21068191528320312, -0.20296478271484375, -0.19524765014648438, -0.187530517578125, -0.17981338500976562, -0.17209625244140625, -0.16437911987304688, -0.1566619873046875, -0.14894485473632812, -0.14122772216796875, -0.13351058959960938, -0.12579345703125, -0.11807632446289062, -0.11035919189453125, -0.10264205932617188, -0.0949249267578125, -0.08720779418945312, -0.07949066162109375, -0.07177352905273438, -0.064056396484375, -0.056339263916015625, -0.04862213134765625, -0.040904998779296875, -0.0331878662109375, -0.025470733642578125, -0.01775360107421875, -0.010036468505859375, -0.0023193359375, 0.005397796630859375, 0.01311492919921875, 0.020832061767578125, 0.0285491943359375, 0.036266326904296875, 0.04398345947265625, 0.051700592041015625, 0.059417724609375, 0.06713485717773438, 0.07485198974609375, 0.08256912231445312, 0.0902862548828125, 0.09800338745117188, 0.10572052001953125, 0.11343765258789062, 0.12115478515625, 0.12887191772460938, 0.13658905029296875, 0.14430618286132812, 0.1520233154296875, 0.15974044799804688, 0.16745758056640625, 0.17517471313476562, 0.182891845703125, 0.19060897827148438, 0.19832611083984375, 0.20604324340820312, 0.2137603759765625, 0.22147750854492188, 0.22919464111328125, 0.23691177368164062, 0.24462890625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 6.0, 12.0, 15.0, 15.0, 13.0, 21.0, 29.0, 28.0, 38.0, 48.0, 69.0, 93.0, 171.0, 103.0, 59.0, 52.0, 35.0, 32.0, 26.0, 23.0, 20.0, 13.0, 10.0, 9.0, 5.0, 5.0, 9.0, 5.0, 8.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00934600830078125, -0.009039878845214844, -0.008733749389648438, -0.008427619934082031, -0.008121490478515625, -0.007815361022949219, -0.0075092315673828125, -0.007203102111816406, -0.00689697265625, -0.006590843200683594, -0.0062847137451171875, -0.005978584289550781, -0.005672454833984375, -0.005366325378417969, -0.0050601959228515625, -0.004754066467285156, -0.00444793701171875, -0.004141807556152344, -0.0038356781005859375, -0.0035295486450195312, -0.003223419189453125, -0.0029172897338867188, -0.0026111602783203125, -0.0023050308227539062, -0.0019989013671875, -0.0016927719116210938, -0.0013866424560546875, -0.0010805130004882812, -0.000774383544921875, -0.00046825408935546875, -0.0001621246337890625, 0.00014400482177734375, 0.00045013427734375, 0.0007562637329101562, 0.0010623931884765625, 0.0013685226440429688, 0.001674652099609375, 0.0019807815551757812, 0.0022869110107421875, 0.0025930404663085938, 0.002899169921875, 0.0032052993774414062, 0.0035114288330078125, 0.0038175582885742188, 0.004123687744140625, 0.004429817199707031, 0.0047359466552734375, 0.005042076110839844, 0.00534820556640625, 0.005654335021972656, 0.0059604644775390625, 0.006266593933105469, 0.006572723388671875, 0.006878852844238281, 0.0071849822998046875, 0.007491111755371094, 0.0077972412109375, 0.008103370666503906, 0.008409500122070312, 0.008715629577636719, 0.009021759033203125, 0.009327888488769531, 0.009634017944335938, 0.009940147399902344, 0.01024627685546875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 7.0, 4.0, 8.0, 9.0, 7.0, 12.0, 11.0, 15.0, 16.0, 30.0, 35.0, 59.0, 87.0, 160.0, 678.0, 11216.0, 964486.0, 69470.0, 1597.0, 275.0, 129.0, 63.0, 47.0, 27.0, 26.0, 17.0, 16.0, 9.0, 11.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.249267578125, -0.24187088012695312, -0.23447418212890625, -0.22707748413085938, -0.2196807861328125, -0.21228408813476562, -0.20488739013671875, -0.19749069213867188, -0.190093994140625, -0.18269729614257812, -0.17530059814453125, -0.16790390014648438, -0.1605072021484375, -0.15311050415039062, -0.14571380615234375, -0.13831710815429688, -0.13092041015625, -0.12352371215820312, -0.11612701416015625, -0.10873031616210938, -0.1013336181640625, -0.09393692016601562, -0.08654022216796875, -0.07914352416992188, -0.071746826171875, -0.06435012817382812, -0.05695343017578125, -0.049556732177734375, -0.0421600341796875, -0.034763336181640625, -0.02736663818359375, -0.019969940185546875, -0.0125732421875, -0.005176544189453125, 0.00222015380859375, 0.009616851806640625, 0.0170135498046875, 0.024410247802734375, 0.03180694580078125, 0.039203643798828125, 0.046600341796875, 0.053997039794921875, 0.06139373779296875, 0.06879043579101562, 0.0761871337890625, 0.08358383178710938, 0.09098052978515625, 0.09837722778320312, 0.10577392578125, 0.11317062377929688, 0.12056732177734375, 0.12796401977539062, 0.1353607177734375, 0.14275741577148438, 0.15015411376953125, 0.15755081176757812, 0.164947509765625, 0.17234420776367188, 0.17974090576171875, 0.18713760375976562, 0.1945343017578125, 0.20193099975585938, 0.20932769775390625, 0.21672439575195312, 0.22412109375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 13.0, 46.0, 231.0, 540.0, 125.0, 31.0, 16.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1253189593553543, -0.12267021834850311, -0.12002148479223251, -0.11737275123596191, -0.11472401022911072, -0.11207526922225952, -0.10942653566598892, -0.10677780210971832, -0.10412906110286713, -0.10148032009601593, -0.09883158653974533, -0.09618285298347473, -0.09353411197662354, -0.09088537096977234, -0.08823663741350174, -0.08558790385723114, -0.08293916285037994, -0.08029042184352875, -0.07764168828725815, -0.07499295473098755, -0.07234421372413635, -0.06969547271728516, -0.06704673916101456, -0.06439800560474396, -0.06174926459789276, -0.05910052731633186, -0.056451790034770966, -0.05380305275321007, -0.05115431547164917, -0.04850557819008827, -0.045856840908527374, -0.043208103626966476, -0.04055936262011528, -0.03791062533855438, -0.035261888056993484, -0.03261315077543259, -0.02996441349387169, -0.02731567621231079, -0.024666938930749893, -0.022018201649188995, -0.019369464367628098, -0.0167207270860672, -0.014071989804506302, -0.011423252522945404, -0.008774515241384506, -0.006125777959823608, -0.0034770406782627106, -0.0008283033967018127, 0.001820433884859085, 0.004469171166419983, 0.007117908447980881, 0.009766645729541779, 0.012415383011102676, 0.015064120292663574, 0.017712857574224472, 0.02036159485578537, 0.023010332137346268, 0.025659069418907166, 0.028307806700468063, 0.03095654398202896, 0.03360528126358986, 0.03625401854515076, 0.038902755826711655, 0.04155149310827255, 0.04420023038983345]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 2.0, 5.0, 5.0, 1.0, 6.0, 7.0, 14.0, 6.0, 10.0, 10.0, 13.0, 13.0, 18.0, 14.0, 29.0, 17.0, 20.0, 30.0, 26.0, 32.0, 33.0, 33.0, 32.0, 31.0, 50.0, 39.0, 45.0, 36.0, 36.0, 36.0, 33.0, 24.0, 33.0, 24.0, 32.0, 24.0, 26.0, 16.0, 22.0, 16.0, 23.0, 17.0, 13.0, 15.0, 11.0, 6.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.008710920810699463, -0.008412553928792477, -0.00811418704688549, -0.007815820164978504, -0.007517453283071518, -0.007219086401164532, -0.0069207195192575455, -0.006622352637350559, -0.006323985755443573, -0.006025618873536587, -0.0057272519916296005, -0.005428885109722614, -0.005130518227815628, -0.004832151345908642, -0.004533784464001656, -0.004235417582094669, -0.003937050700187683, -0.003638683818280697, -0.0033403169363737106, -0.0030419500544667244, -0.002743583172559738, -0.002445216290652752, -0.0021468494087457657, -0.0018484825268387794, -0.0015501156449317932, -0.001251748763024807, -0.0009533818811178207, -0.0006550149992108345, -0.00035664811730384827, -5.828123539686203e-05, 0.0002400856465101242, 0.0005384525284171104, 0.0008368194103240967, 0.001135186292231083, 0.0014335531741380692, 0.0017319200560450554, 0.0020302869379520416, 0.002328653819859028, 0.002627020701766014, 0.0029253875836730003, 0.0032237544655799866, 0.003522121347486973, 0.003820488229393959, 0.004118855111300945, 0.0044172219932079315, 0.004715588875114918, 0.005013955757021904, 0.00531232263892889, 0.0056106895208358765, 0.005909056402742863, 0.006207423284649849, 0.006505790166556835, 0.006804157048463821, 0.007102523930370808, 0.007400890812277794, 0.00769925769418478, 0.007997624576091766, 0.008295991457998753, 0.008594358339905739, 0.008892725221812725, 0.009191092103719711, 0.009489458985626698, 0.009787825867533684, 0.01008619274944067, 0.010384559631347656]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 10.0, 9.0, 12.0, 16.0, 6.0, 16.0, 16.0, 22.0, 23.0, 35.0, 21.0, 36.0, 26.0, 28.0, 26.0, 46.0, 26.0, 41.0, 42.0, 44.0, 39.0, 40.0, 43.0, 38.0, 31.0, 20.0, 22.0, 40.0, 22.0, 27.0, 20.0, 21.0, 21.0, 18.0, 16.0, 12.0, 12.0, 7.0, 12.0, 9.0, 5.0, 6.0, 7.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.376953125, -3.271209716796875, -3.16546630859375, -3.059722900390625, -2.9539794921875, -2.848236083984375, -2.74249267578125, -2.636749267578125, -2.531005859375, -2.425262451171875, -2.31951904296875, -2.213775634765625, -2.1080322265625, -2.002288818359375, -1.89654541015625, -1.790802001953125, -1.68505859375, -1.579315185546875, -1.47357177734375, -1.367828369140625, -1.2620849609375, -1.156341552734375, -1.05059814453125, -0.944854736328125, -0.839111328125, -0.733367919921875, -0.62762451171875, -0.521881103515625, -0.4161376953125, -0.310394287109375, -0.20465087890625, -0.098907470703125, 0.0068359375, 0.112579345703125, 0.21832275390625, 0.324066162109375, 0.4298095703125, 0.535552978515625, 0.64129638671875, 0.747039794921875, 0.852783203125, 0.958526611328125, 1.06427001953125, 1.170013427734375, 1.2757568359375, 1.381500244140625, 1.48724365234375, 1.592987060546875, 1.69873046875, 1.804473876953125, 1.91021728515625, 2.015960693359375, 2.1217041015625, 2.227447509765625, 2.33319091796875, 2.438934326171875, 2.544677734375, 2.650421142578125, 2.75616455078125, 2.861907958984375, 2.9676513671875, 3.073394775390625, 3.17913818359375, 3.284881591796875, 3.390625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 12.0, 10.0, 17.0, 25.0, 37.0, 67.0, 104.0, 193.0, 320.0, 745.0, 1554.0, 3298.0, 6957.0, 14573.0, 30199.0, 60095.0, 120589.0, 240368.0, 282330.0, 144856.0, 71974.0, 36281.0, 17643.0, 8617.0, 4010.0, 1814.0, 908.0, 442.0, 214.0, 108.0, 76.0, 37.0, 20.0, 20.0, 7.0, 6.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.0546875, -3.9244384765625, -3.794189453125, -3.6639404296875, -3.53369140625, -3.4034423828125, -3.273193359375, -3.1429443359375, -3.0126953125, -2.8824462890625, -2.752197265625, -2.6219482421875, -2.49169921875, -2.3614501953125, -2.231201171875, -2.1009521484375, -1.970703125, -1.8404541015625, -1.710205078125, -1.5799560546875, -1.44970703125, -1.3194580078125, -1.189208984375, -1.0589599609375, -0.9287109375, -0.7984619140625, -0.668212890625, -0.5379638671875, -0.40771484375, -0.2774658203125, -0.147216796875, -0.0169677734375, 0.11328125, 0.2435302734375, 0.373779296875, 0.5040283203125, 0.63427734375, 0.7645263671875, 0.894775390625, 1.0250244140625, 1.1552734375, 1.2855224609375, 1.415771484375, 1.5460205078125, 1.67626953125, 1.8065185546875, 1.936767578125, 2.0670166015625, 2.197265625, 2.3275146484375, 2.457763671875, 2.5880126953125, 2.71826171875, 2.8485107421875, 2.978759765625, 3.1090087890625, 3.2392578125, 3.3695068359375, 3.499755859375, 3.6300048828125, 3.76025390625, 3.8905029296875, 4.020751953125, 4.1510009765625, 4.28125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 5.0, 7.0, 14.0, 16.0, 14.0, 15.0, 22.0, 23.0, 30.0, 30.0, 39.0, 34.0, 39.0, 53.0, 103.0, 152.0, 276.0, 1400.0, 180.0, 119.0, 76.0, 47.0, 54.0, 31.0, 31.0, 34.0, 34.0, 19.0, 21.0, 18.0, 16.0, 13.0, 15.0, 11.0, 10.0, 7.0, 5.0, 7.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.515625, -12.126953125, -11.73828125, -11.349609375, -10.9609375, -10.572265625, -10.18359375, -9.794921875, -9.40625, -9.017578125, -8.62890625, -8.240234375, -7.8515625, -7.462890625, -7.07421875, -6.685546875, -6.296875, -5.908203125, -5.51953125, -5.130859375, -4.7421875, -4.353515625, -3.96484375, -3.576171875, -3.1875, -2.798828125, -2.41015625, -2.021484375, -1.6328125, -1.244140625, -0.85546875, -0.466796875, -0.078125, 0.310546875, 0.69921875, 1.087890625, 1.4765625, 1.865234375, 2.25390625, 2.642578125, 3.03125, 3.419921875, 3.80859375, 4.197265625, 4.5859375, 4.974609375, 5.36328125, 5.751953125, 6.140625, 6.529296875, 6.91796875, 7.306640625, 7.6953125, 8.083984375, 8.47265625, 8.861328125, 9.25, 9.638671875, 10.02734375, 10.416015625, 10.8046875, 11.193359375, 11.58203125, 11.970703125, 12.359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 11.0, 5.0, 12.0, 25.0, 20.0, 29.0, 47.0, 55.0, 69.0, 108.0, 179.0, 244.0, 427.0, 1236.0, 30311.0, 3074775.0, 35718.0, 1194.0, 461.0, 244.0, 147.0, 115.0, 60.0, 54.0, 34.0, 28.0, 14.0, 13.0, 19.0, 12.0, 8.0, 2.0, 7.0, 4.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.40625, -29.0556640625, -27.705078125, -26.3544921875, -25.00390625, -23.6533203125, -22.302734375, -20.9521484375, -19.6015625, -18.2509765625, -16.900390625, -15.5498046875, -14.19921875, -12.8486328125, -11.498046875, -10.1474609375, -8.796875, -7.4462890625, -6.095703125, -4.7451171875, -3.39453125, -2.0439453125, -0.693359375, 0.6572265625, 2.0078125, 3.3583984375, 4.708984375, 6.0595703125, 7.41015625, 8.7607421875, 10.111328125, 11.4619140625, 12.8125, 14.1630859375, 15.513671875, 16.8642578125, 18.21484375, 19.5654296875, 20.916015625, 22.2666015625, 23.6171875, 24.9677734375, 26.318359375, 27.6689453125, 29.01953125, 30.3701171875, 31.720703125, 33.0712890625, 34.421875, 35.7724609375, 37.123046875, 38.4736328125, 39.82421875, 41.1748046875, 42.525390625, 43.8759765625, 45.2265625, 46.5771484375, 47.927734375, 49.2783203125, 50.62890625, 51.9794921875, 53.330078125, 54.6806640625, 56.03125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 52.0, 870.0, 97.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.582706451416016, -37.38191223144531, -29.181121826171875, -20.980329513549805, -12.779537200927734, -4.578746795654297, 3.6220474243164062, 11.82284164428711, 20.023632049560547, 28.224424362182617, 36.42521667480469, 44.626007080078125, 52.82680130004883, 61.027591705322266, 69.22838592529297, 77.42918395996094, 85.62997436523438, 93.83076477050781, 102.03155517578125, 110.23235321044922, 118.43314361572266, 126.6339340209961, 134.83473205566406, 143.0355224609375, 151.23631286621094, 159.43710327148438, 167.6378936767578, 175.83868408203125, 184.03948974609375, 192.24026489257812, 200.44107055664062, 208.64186096191406, 216.8426513671875, 225.04344177246094, 233.24423217773438, 241.4450225830078, 249.64581298828125, 257.84661865234375, 266.0473937988281, 274.2481994628906, 282.448974609375, 290.6497802734375, 298.8505554199219, 307.0513610839844, 315.25213623046875, 323.45294189453125, 331.6537170410156, 339.8545227050781, 348.0553283691406, 356.2561340332031, 364.4569091796875, 372.65771484375, 380.8584899902344, 389.0592956542969, 397.26007080078125, 405.46087646484375, 413.66168212890625, 421.86248779296875, 430.0632629394531, 438.2640686035156, 446.46484375, 454.6656494140625, 462.8664245605469, 471.0672302246094, 479.26800537109375]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 9.0, 6.0, 8.0, 7.0, 11.0, 5.0, 18.0, 17.0, 16.0, 23.0, 17.0, 28.0, 24.0, 39.0, 33.0, 37.0, 45.0, 44.0, 42.0, 39.0, 49.0, 56.0, 45.0, 35.0, 38.0, 33.0, 42.0, 38.0, 34.0, 25.0, 18.0, 22.0, 17.0, 14.0, 15.0, 14.0, 16.0, 4.0, 4.0, 1.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.8189697265625, -37.6719856262207, -36.52499771118164, -35.378013610839844, -34.23102569580078, -33.084041595458984, -31.937055587768555, -30.790069580078125, -29.643083572387695, -28.496097564697266, -27.349111557006836, -26.202125549316406, -25.05514144897461, -23.908153533935547, -22.76116943359375, -21.61418342590332, -20.46719741821289, -19.32021141052246, -18.17322540283203, -17.0262393951416, -15.879254341125488, -14.732268333435059, -13.585283279418945, -12.438297271728516, -11.291311264038086, -10.144325256347656, -8.997339248657227, -7.850354194641113, -6.703368186950684, -5.556382179260254, -4.409396648406982, -3.262411117553711, -2.1154212951660156, -0.968435525894165, 0.17855024337768555, 1.3255360126495361, 2.4725217819213867, 3.6195077896118164, 4.766493320465088, 5.913478851318359, 7.060464859008789, 8.207450866699219, 9.354436874389648, 10.501421928405762, 11.648407936096191, 12.795393943786621, 13.942378997802734, 15.089365005493164, 16.236351013183594, 17.383337020874023, 18.530323028564453, 19.677309036254883, 20.824295043945312, 21.97127914428711, 23.11826515197754, 24.26525115966797, 25.4122371673584, 26.559223175048828, 27.706209182739258, 28.853195190429688, 30.000179290771484, 31.147167205810547, 32.294151306152344, 33.441139221191406, 34.5881233215332]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 4.0, 3.0, 2.0, 4.0, 7.0, 7.0, 6.0, 15.0, 10.0, 10.0, 19.0, 20.0, 17.0, 20.0, 30.0, 38.0, 36.0, 24.0, 50.0, 25.0, 31.0, 29.0, 30.0, 51.0, 51.0, 46.0, 42.0, 37.0, 30.0, 25.0, 28.0, 24.0, 19.0, 24.0, 34.0, 18.0, 19.0, 22.0, 17.0, 14.0, 9.0, 10.0, 12.0, 7.0, 6.0, 6.0, 7.0, 6.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.7421875, -3.6229248046875, -3.503662109375, -3.3843994140625, -3.26513671875, -3.1458740234375, -3.026611328125, -2.9073486328125, -2.7880859375, -2.6688232421875, -2.549560546875, -2.4302978515625, -2.31103515625, -2.1917724609375, -2.072509765625, -1.9532470703125, -1.833984375, -1.7147216796875, -1.595458984375, -1.4761962890625, -1.35693359375, -1.2376708984375, -1.118408203125, -0.9991455078125, -0.8798828125, -0.7606201171875, -0.641357421875, -0.5220947265625, -0.40283203125, -0.2835693359375, -0.164306640625, -0.0450439453125, 0.07421875, 0.1934814453125, 0.312744140625, 0.4320068359375, 0.55126953125, 0.6705322265625, 0.789794921875, 0.9090576171875, 1.0283203125, 1.1475830078125, 1.266845703125, 1.3861083984375, 1.50537109375, 1.6246337890625, 1.743896484375, 1.8631591796875, 1.982421875, 2.1016845703125, 2.220947265625, 2.3402099609375, 2.45947265625, 2.5787353515625, 2.697998046875, 2.8172607421875, 2.9365234375, 3.0557861328125, 3.175048828125, 3.2943115234375, 3.41357421875, 3.5328369140625, 3.652099609375, 3.7713623046875, 3.890625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 6.0, 3.0, 12.0, 15.0, 19.0, 21.0, 22.0, 18.0, 29.0, 40.0, 41.0, 79.0, 96.0, 186.0, 457.0, 1479.0, 8457.0, 91907.0, 997403.0, 2451751.0, 585548.0, 49206.0, 5227.0, 1190.0, 434.0, 191.0, 102.0, 77.0, 49.0, 38.0, 35.0, 21.0, 20.0, 18.0, 16.0, 8.0, 9.0, 13.0, 12.0, 5.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.078125, -9.746337890625, -9.41455078125, -9.082763671875, -8.7509765625, -8.419189453125, -8.08740234375, -7.755615234375, -7.423828125, -7.092041015625, -6.76025390625, -6.428466796875, -6.0966796875, -5.764892578125, -5.43310546875, -5.101318359375, -4.76953125, -4.437744140625, -4.10595703125, -3.774169921875, -3.4423828125, -3.110595703125, -2.77880859375, -2.447021484375, -2.115234375, -1.783447265625, -1.45166015625, -1.119873046875, -0.7880859375, -0.456298828125, -0.12451171875, 0.207275390625, 0.5390625, 0.870849609375, 1.20263671875, 1.534423828125, 1.8662109375, 2.197998046875, 2.52978515625, 2.861572265625, 3.193359375, 3.525146484375, 3.85693359375, 4.188720703125, 4.5205078125, 4.852294921875, 5.18408203125, 5.515869140625, 5.84765625, 6.179443359375, 6.51123046875, 6.843017578125, 7.1748046875, 7.506591796875, 7.83837890625, 8.170166015625, 8.501953125, 8.833740234375, 9.16552734375, 9.497314453125, 9.8291015625, 10.160888671875, 10.49267578125, 10.824462890625, 11.15625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 13.0, 18.0, 18.0, 31.0, 50.0, 71.0, 87.0, 134.0, 206.0, 271.0, 369.0, 444.0, 476.0, 439.0, 407.0, 310.0, 232.0, 164.0, 116.0, 62.0, 43.0, 41.0, 18.0, 19.0, 10.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.796875, -12.4564208984375, -12.115966796875, -11.7755126953125, -11.43505859375, -11.0946044921875, -10.754150390625, -10.4136962890625, -10.0732421875, -9.7327880859375, -9.392333984375, -9.0518798828125, -8.71142578125, -8.3709716796875, -8.030517578125, -7.6900634765625, -7.349609375, -7.0091552734375, -6.668701171875, -6.3282470703125, -5.98779296875, -5.6473388671875, -5.306884765625, -4.9664306640625, -4.6259765625, -4.2855224609375, -3.945068359375, -3.6046142578125, -3.26416015625, -2.9237060546875, -2.583251953125, -2.2427978515625, -1.90234375, -1.5618896484375, -1.221435546875, -0.8809814453125, -0.54052734375, -0.2000732421875, 0.140380859375, 0.4808349609375, 0.8212890625, 1.1617431640625, 1.502197265625, 1.8426513671875, 2.18310546875, 2.5235595703125, 2.864013671875, 3.2044677734375, 3.544921875, 3.8853759765625, 4.225830078125, 4.5662841796875, 4.90673828125, 5.2471923828125, 5.587646484375, 5.9281005859375, 6.2685546875, 6.6090087890625, 6.949462890625, 7.2899169921875, 7.63037109375, 7.9708251953125, 8.311279296875, 8.6517333984375, 8.9921875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 9.0, 15.0, 21.0, 39.0, 39.0, 72.0, 122.0, 199.0, 330.0, 671.0, 3511.0, 769427.0, 3401456.0, 16445.0, 945.0, 381.0, 215.0, 123.0, 82.0, 58.0, 45.0, 18.0, 20.0, 14.0, 9.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.609375, -30.402099609375, -29.19482421875, -27.987548828125, -26.7802734375, -25.572998046875, -24.36572265625, -23.158447265625, -21.951171875, -20.743896484375, -19.53662109375, -18.329345703125, -17.1220703125, -15.914794921875, -14.70751953125, -13.500244140625, -12.29296875, -11.085693359375, -9.87841796875, -8.671142578125, -7.4638671875, -6.256591796875, -5.04931640625, -3.842041015625, -2.634765625, -1.427490234375, -0.22021484375, 0.987060546875, 2.1943359375, 3.401611328125, 4.60888671875, 5.816162109375, 7.0234375, 8.230712890625, 9.43798828125, 10.645263671875, 11.8525390625, 13.059814453125, 14.26708984375, 15.474365234375, 16.681640625, 17.888916015625, 19.09619140625, 20.303466796875, 21.5107421875, 22.718017578125, 23.92529296875, 25.132568359375, 26.33984375, 27.547119140625, 28.75439453125, 29.961669921875, 31.1689453125, 32.376220703125, 33.58349609375, 34.790771484375, 35.998046875, 37.205322265625, 38.41259765625, 39.619873046875, 40.8271484375, 42.034423828125, 43.24169921875, 44.448974609375, 45.65625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 31.0, 82.0, 172.0, 213.0, 233.0, 173.0, 60.0, 37.0, 8.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.04817199707031, -72.03520965576172, -69.02224731445312, -66.00929260253906, -62.99633026123047, -59.983367919921875, -56.97040939331055, -53.95745086669922, -50.944488525390625, -47.93152618408203, -44.9185676574707, -41.905609130859375, -38.89264678955078, -35.87968444824219, -32.86672592163086, -29.8537654876709, -26.840805053710938, -23.827844619750977, -20.814884185791016, -17.801923751831055, -14.788963317871094, -11.776002883911133, -8.763042449951172, -5.750082015991211, -2.73712158203125, 0.27583885192871094, 3.288799285888672, 6.301759719848633, 9.314720153808594, 12.327680587768555, 15.340641021728516, 18.353601455688477, 21.366561889648438, 24.3795223236084, 27.39248275756836, 30.40544319152832, 33.41840362548828, 36.431365966796875, 39.4443244934082, 42.45728302001953, 45.470245361328125, 48.48320770263672, 51.49616622924805, 54.509124755859375, 57.52208709716797, 60.53504943847656, 63.54800796508789, 66.56096649169922, 69.57392883300781, 72.5868911743164, 75.599853515625, 78.61280822753906, 81.62577056884766, 84.63873291015625, 87.65168762207031, 90.6646499633789, 93.6776123046875, 96.6905746459961, 99.70353698730469, 102.71649169921875, 105.72945404052734, 108.74241638183594, 111.75537109375, 114.7683334350586, 117.78129577636719]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 3.0, 9.0, 3.0, 7.0, 4.0, 16.0, 10.0, 15.0, 22.0, 16.0, 14.0, 32.0, 26.0, 24.0, 37.0, 36.0, 25.0, 47.0, 43.0, 39.0, 39.0, 39.0, 38.0, 46.0, 45.0, 36.0, 44.0, 34.0, 29.0, 34.0, 22.0, 25.0, 19.0, 24.0, 17.0, 13.0, 13.0, 10.0, 9.0, 9.0, 7.0, 7.0, 6.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0], "bins": [-32.24060821533203, -31.361865997314453, -30.483123779296875, -29.604381561279297, -28.72563934326172, -27.84689712524414, -26.968154907226562, -26.089412689208984, -25.210670471191406, -24.331928253173828, -23.45318603515625, -22.574443817138672, -21.695701599121094, -20.816959381103516, -19.938217163085938, -19.05947494506836, -18.18073272705078, -17.301990509033203, -16.423248291015625, -15.544506072998047, -14.665763854980469, -13.78702163696289, -12.908279418945312, -12.029537200927734, -11.150793075561523, -10.272050857543945, -9.393308639526367, -8.514566421508789, -7.635824203491211, -6.757081508636475, -5.8783392906188965, -4.999597072601318, -4.120855331420898, -3.2421131134033203, -2.363370895385742, -1.484628438949585, -0.6058862209320068, 0.2728562355041504, 1.1515984535217285, 2.0303406715393066, 2.9090828895568848, 3.787825107574463, 4.666567325592041, 5.545310020446777, 6.4240522384643555, 7.302794456481934, 8.181536674499512, 9.06027889251709, 9.939021110534668, 10.817763328552246, 11.696505546569824, 12.575247764587402, 13.45398998260498, 14.332733154296875, 15.211475372314453, 16.09021759033203, 16.96895980834961, 17.847702026367188, 18.726444244384766, 19.605186462402344, 20.483928680419922, 21.3626708984375, 22.241413116455078, 23.120155334472656, 23.998897552490234]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 10.0, 10.0, 7.0, 15.0, 14.0, 18.0, 16.0, 24.0, 31.0, 24.0, 44.0, 28.0, 42.0, 44.0, 39.0, 48.0, 43.0, 34.0, 41.0, 35.0, 39.0, 50.0, 34.0, 32.0, 25.0, 31.0, 13.0, 29.0, 24.0, 24.0, 15.0, 29.0, 14.0, 17.0, 13.0, 6.0, 6.0, 7.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.82672119140625, -3.7042236328125, -3.58172607421875, -3.459228515625, -3.33673095703125, -3.2142333984375, -3.09173583984375, -2.96923828125, -2.84674072265625, -2.7242431640625, -2.60174560546875, -2.479248046875, -2.35675048828125, -2.2342529296875, -2.11175537109375, -1.9892578125, -1.86676025390625, -1.7442626953125, -1.62176513671875, -1.499267578125, -1.37677001953125, -1.2542724609375, -1.13177490234375, -1.00927734375, -0.88677978515625, -0.7642822265625, -0.64178466796875, -0.519287109375, -0.39678955078125, -0.2742919921875, -0.15179443359375, -0.029296875, 0.09320068359375, 0.2156982421875, 0.33819580078125, 0.460693359375, 0.58319091796875, 0.7056884765625, 0.82818603515625, 0.95068359375, 1.07318115234375, 1.1956787109375, 1.31817626953125, 1.440673828125, 1.56317138671875, 1.6856689453125, 1.80816650390625, 1.9306640625, 2.05316162109375, 2.1756591796875, 2.29815673828125, 2.420654296875, 2.54315185546875, 2.6656494140625, 2.78814697265625, 2.91064453125, 3.03314208984375, 3.1556396484375, 3.27813720703125, 3.400634765625, 3.52313232421875, 3.6456298828125, 3.76812744140625, 3.890625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 15.0, 24.0, 18.0, 44.0, 54.0, 73.0, 132.0, 176.0, 260.0, 359.0, 535.0, 786.0, 1143.0, 1663.0, 2554.0, 3757.0, 5528.0, 8461.0, 12293.0, 18805.0, 28378.0, 42128.0, 62796.0, 91167.0, 127541.0, 154931.0, 144681.0, 108207.0, 76185.0, 51986.0, 34642.0, 23214.0, 15071.0, 10027.0, 6859.0, 4564.0, 3046.0, 2051.0, 1376.0, 961.0, 663.0, 468.0, 272.0, 194.0, 140.0, 115.0, 69.0, 39.0, 34.0, 18.0, 21.0, 13.0, 3.0, 9.0, 0.0, 6.0], "bins": [-0.360107421875, -0.3494377136230469, -0.33876800537109375, -0.3280982971191406, -0.3174285888671875, -0.3067588806152344, -0.29608917236328125, -0.2854194641113281, -0.274749755859375, -0.2640800476074219, -0.25341033935546875, -0.24274063110351562, -0.2320709228515625, -0.22140121459960938, -0.21073150634765625, -0.20006179809570312, -0.18939208984375, -0.17872238159179688, -0.16805267333984375, -0.15738296508789062, -0.1467132568359375, -0.13604354858398438, -0.12537384033203125, -0.11470413208007812, -0.104034423828125, -0.09336471557617188, -0.08269500732421875, -0.07202529907226562, -0.0613555908203125, -0.050685882568359375, -0.04001617431640625, -0.029346466064453125, -0.0186767578125, -0.008007049560546875, 0.00266265869140625, 0.013332366943359375, 0.0240020751953125, 0.034671783447265625, 0.04534149169921875, 0.056011199951171875, 0.066680908203125, 0.07735061645507812, 0.08802032470703125, 0.09869003295898438, 0.1093597412109375, 0.12002944946289062, 0.13069915771484375, 0.14136886596679688, 0.15203857421875, 0.16270828247070312, 0.17337799072265625, 0.18404769897460938, 0.1947174072265625, 0.20538711547851562, 0.21605682373046875, 0.22672653198242188, 0.237396240234375, 0.24806594848632812, 0.25873565673828125, 0.2694053649902344, 0.2800750732421875, 0.2907447814941406, 0.30141448974609375, 0.3120841979980469, 0.32275390625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 1.0, 8.0, 3.0, 4.0, 8.0, 9.0, 14.0, 18.0, 14.0, 14.0, 16.0, 25.0, 19.0, 17.0, 15.0, 31.0, 27.0, 41.0, 44.0, 38.0, 36.0, 40.0, 42.0, 1060.0, 39.0, 36.0, 40.0, 39.0, 42.0, 33.0, 37.0, 27.0, 24.0, 22.0, 15.0, 21.0, 25.0, 17.0, 15.0, 7.0, 16.0, 7.0, 6.0, 7.0, 0.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.978515625, -1.9027099609375, -1.826904296875, -1.7510986328125, -1.67529296875, -1.5994873046875, -1.523681640625, -1.4478759765625, -1.3720703125, -1.2962646484375, -1.220458984375, -1.1446533203125, -1.06884765625, -0.9930419921875, -0.917236328125, -0.8414306640625, -0.765625, -0.6898193359375, -0.614013671875, -0.5382080078125, -0.46240234375, -0.3865966796875, -0.310791015625, -0.2349853515625, -0.1591796875, -0.0833740234375, -0.007568359375, 0.0682373046875, 0.14404296875, 0.2198486328125, 0.295654296875, 0.3714599609375, 0.447265625, 0.5230712890625, 0.598876953125, 0.6746826171875, 0.75048828125, 0.8262939453125, 0.902099609375, 0.9779052734375, 1.0537109375, 1.1295166015625, 1.205322265625, 1.2811279296875, 1.35693359375, 1.4327392578125, 1.508544921875, 1.5843505859375, 1.66015625, 1.7359619140625, 1.811767578125, 1.8875732421875, 1.96337890625, 2.0391845703125, 2.114990234375, 2.1907958984375, 2.2666015625, 2.3424072265625, 2.418212890625, 2.4940185546875, 2.56982421875, 2.6456298828125, 2.721435546875, 2.7972412109375, 2.873046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 7.0, 14.0, 25.0, 32.0, 35.0, 75.0, 135.0, 183.0, 303.0, 445.0, 697.0, 1065.0, 1776.0, 2855.0, 4743.0, 7954.0, 13001.0, 21668.0, 35199.0, 55958.0, 85331.0, 123698.0, 359274.0, 1006528.0, 129924.0, 90547.0, 59422.0, 37176.0, 23279.0, 13860.0, 8401.0, 5216.0, 3151.0, 1896.0, 1186.0, 740.0, 492.0, 300.0, 175.0, 121.0, 100.0, 47.0, 44.0, 16.0, 12.0, 13.0, 7.0, 6.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.2568645477294922, -0.24932479858398438, -0.24178504943847656, -0.23424530029296875, -0.22670555114746094, -0.21916580200195312, -0.2116260528564453, -0.2040863037109375, -0.1965465545654297, -0.18900680541992188, -0.18146705627441406, -0.17392730712890625, -0.16638755798339844, -0.15884780883789062, -0.1513080596923828, -0.143768310546875, -0.1362285614013672, -0.12868881225585938, -0.12114906311035156, -0.11360931396484375, -0.10606956481933594, -0.09852981567382812, -0.09099006652832031, -0.0834503173828125, -0.07591056823730469, -0.06837081909179688, -0.06083106994628906, -0.05329132080078125, -0.04575157165527344, -0.038211822509765625, -0.030672073364257812, -0.02313232421875, -0.015592575073242188, -0.008052825927734375, -0.0005130767822265625, 0.00702667236328125, 0.014566421508789062, 0.022106170654296875, 0.029645919799804688, 0.0371856689453125, 0.04472541809082031, 0.052265167236328125, 0.05980491638183594, 0.06734466552734375, 0.07488441467285156, 0.08242416381835938, 0.08996391296386719, 0.097503662109375, 0.10504341125488281, 0.11258316040039062, 0.12012290954589844, 0.12766265869140625, 0.13520240783691406, 0.14274215698242188, 0.1502819061279297, 0.1578216552734375, 0.1653614044189453, 0.17290115356445312, 0.18044090270996094, 0.18798065185546875, 0.19552040100097656, 0.20306015014648438, 0.2105998992919922, 0.2181396484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 7.0, 12.0, 16.0, 15.0, 15.0, 32.0, 28.0, 34.0, 38.0, 71.0, 63.0, 70.0, 75.0, 97.0, 84.0, 69.0, 41.0, 48.0, 39.0, 24.0, 29.0, 21.0, 12.0, 8.0, 7.0, 8.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0176849365234375, -0.01710367202758789, -0.01652240753173828, -0.015941143035888672, -0.015359878540039062, -0.014778614044189453, -0.014197349548339844, -0.013616085052490234, -0.013034820556640625, -0.012453556060791016, -0.011872291564941406, -0.011291027069091797, -0.010709762573242188, -0.010128498077392578, -0.009547233581542969, -0.00896596908569336, -0.00838470458984375, -0.007803440093994141, -0.007222175598144531, -0.006640911102294922, -0.0060596466064453125, -0.005478382110595703, -0.004897117614746094, -0.004315853118896484, -0.003734588623046875, -0.0031533241271972656, -0.0025720596313476562, -0.001990795135498047, -0.0014095306396484375, -0.0008282661437988281, -0.00024700164794921875, 0.0003342628479003906, 0.00091552734375, 0.0014967918395996094, 0.0020780563354492188, 0.002659320831298828, 0.0032405853271484375, 0.003821849822998047, 0.004403114318847656, 0.004984378814697266, 0.005565643310546875, 0.006146907806396484, 0.006728172302246094, 0.007309436798095703, 0.007890701293945312, 0.008471965789794922, 0.009053230285644531, 0.00963449478149414, 0.01021575927734375, 0.01079702377319336, 0.011378288269042969, 0.011959552764892578, 0.012540817260742188, 0.013122081756591797, 0.013703346252441406, 0.014284610748291016, 0.014865875244140625, 0.015447139739990234, 0.016028404235839844, 0.016609668731689453, 0.017190933227539062, 0.017772197723388672, 0.01835346221923828, 0.01893472671508789, 0.0195159912109375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 7.0, 7.0, 4.0, 12.0, 9.0, 10.0, 22.0, 21.0, 37.0, 45.0, 58.0, 104.0, 182.0, 417.0, 3580.0, 1008538.0, 33971.0, 790.0, 249.0, 151.0, 83.0, 63.0, 43.0, 40.0, 29.0, 22.0, 16.0, 11.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.417236328125, -0.4052162170410156, -0.39319610595703125, -0.3811759948730469, -0.3691558837890625, -0.3571357727050781, -0.34511566162109375, -0.3330955505371094, -0.321075439453125, -0.3090553283691406, -0.29703521728515625, -0.2850151062011719, -0.2729949951171875, -0.2609748840332031, -0.24895477294921875, -0.23693466186523438, -0.22491455078125, -0.21289443969726562, -0.20087432861328125, -0.18885421752929688, -0.1768341064453125, -0.16481399536132812, -0.15279388427734375, -0.14077377319335938, -0.128753662109375, -0.11673355102539062, -0.10471343994140625, -0.09269332885742188, -0.0806732177734375, -0.06865310668945312, -0.05663299560546875, -0.044612884521484375, -0.0325927734375, -0.020572662353515625, -0.00855255126953125, 0.003467559814453125, 0.0154876708984375, 0.027507781982421875, 0.03952789306640625, 0.051548004150390625, 0.063568115234375, 0.07558822631835938, 0.08760833740234375, 0.09962844848632812, 0.1116485595703125, 0.12366867065429688, 0.13568878173828125, 0.14770889282226562, 0.15972900390625, 0.17174911499023438, 0.18376922607421875, 0.19578933715820312, 0.2078094482421875, 0.21982955932617188, 0.23184967041015625, 0.24386978149414062, 0.255889892578125, 0.2679100036621094, 0.27993011474609375, 0.2919502258300781, 0.3039703369140625, 0.3159904479980469, 0.32801055908203125, 0.3400306701660156, 0.35205078125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 461.0, 519.0, 24.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3614063858985901, -0.3529999256134033, -0.34459346532821655, -0.3361870050430298, -0.327780544757843, -0.31937405467033386, -0.3109675943851471, -0.3025611340999603, -0.29415467381477356, -0.2857482135295868, -0.2773417532444, -0.26893529295921326, -0.2605288028717041, -0.25212234258651733, -0.24371588230133057, -0.2353094220161438, -0.22690296173095703, -0.21849650144577026, -0.2100900411605835, -0.20168356597423553, -0.19327710568904877, -0.184870645403862, -0.17646417021751404, -0.16805770993232727, -0.1596512496471405, -0.15124478936195374, -0.14283832907676697, -0.134431853890419, -0.12602539360523224, -0.11761893332004547, -0.1092124655842781, -0.10080599784851074, -0.09239950776100159, -0.08399304747581482, -0.07558657974004745, -0.06718011200428009, -0.05877365171909332, -0.05036718770861626, -0.04196072369813919, -0.033554259687662125, -0.02514779567718506, -0.016741331666707993, -0.008334867656230927, 7.159635424613953e-05, 0.008478060364723206, 0.01688452437520027, 0.025290988385677338, 0.033697452396154404, 0.04210391640663147, 0.050510380417108536, 0.0589168444275856, 0.06732331216335297, 0.07572977244853973, 0.0841362327337265, 0.09254270046949387, 0.10094916820526123, 0.109355628490448, 0.11776208877563477, 0.12616854906082153, 0.1345750242471695, 0.14298148453235626, 0.15138794481754303, 0.159794420003891, 0.16820088028907776, 0.17660734057426453]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 8.0, 9.0, 10.0, 14.0, 11.0, 11.0, 17.0, 18.0, 26.0, 21.0, 28.0, 28.0, 28.0, 23.0, 25.0, 28.0, 36.0, 36.0, 47.0, 36.0, 29.0, 45.0, 40.0, 44.0, 38.0, 37.0, 29.0, 30.0, 24.0, 18.0, 24.0, 26.0, 24.0, 16.0, 13.0, 19.0, 14.0, 11.0, 13.0, 5.0, 3.0, 7.0, 9.0, 0.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.023770511150360107, -0.023075811564922333, -0.022381113842129707, -0.021686416119337082, -0.020991716533899307, -0.020297016948461533, -0.019602319225668907, -0.018907621502876282, -0.018212921917438507, -0.017518222332000732, -0.016823524609208107, -0.01612882688641548, -0.015434127300977707, -0.014739428646862507, -0.014044729992747307, -0.013350031338632107, -0.012655332684516907, -0.011960634030401707, -0.011265935376286507, -0.010571236722171307, -0.009876538068056107, -0.009181839413940907, -0.008487140759825706, -0.0077924421057105064, -0.007097743451595306, -0.006403044797480106, -0.005708346143364906, -0.005013647489249706, -0.004318948835134506, -0.003624250181019306, -0.002929551526904106, -0.002234852872788906, -0.001540154218673706, -0.000845455564558506, -0.00015075691044330597, 0.0005439417436718941, 0.0012386403977870941, 0.0019333390519022942, 0.002628037706017494, 0.0033227363601326942, 0.004017435014247894, 0.004712133668363094, 0.005406832322478294, 0.006101530976593494, 0.0067962296307086945, 0.0074909282848238945, 0.008185626938939095, 0.008880325593054295, 0.009575024247169495, 0.010269722901284695, 0.010964421555399895, 0.011659120209515095, 0.012353818863630295, 0.013048517517745495, 0.013743216171860695, 0.014437914825975895, 0.015132613480091095, 0.01582731306552887, 0.016522010788321495, 0.01721670851111412, 0.017911408096551895, 0.01860610768198967, 0.019300805404782295, 0.01999550312757492, 0.020690202713012695]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 11.0, 9.0, 7.0, 15.0, 14.0, 18.0, 16.0, 24.0, 31.0, 24.0, 44.0, 28.0, 42.0, 43.0, 40.0, 48.0, 40.0, 37.0, 40.0, 36.0, 39.0, 49.0, 35.0, 32.0, 25.0, 31.0, 13.0, 29.0, 24.0, 24.0, 15.0, 29.0, 14.0, 17.0, 13.0, 6.0, 6.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.951171875, -3.828643798828125, -3.70611572265625, -3.583587646484375, -3.4610595703125, -3.338531494140625, -3.21600341796875, -3.093475341796875, -2.970947265625, -2.848419189453125, -2.72589111328125, -2.603363037109375, -2.4808349609375, -2.358306884765625, -2.23577880859375, -2.113250732421875, -1.99072265625, -1.868194580078125, -1.74566650390625, -1.623138427734375, -1.5006103515625, -1.378082275390625, -1.25555419921875, -1.133026123046875, -1.010498046875, -0.887969970703125, -0.76544189453125, -0.642913818359375, -0.5203857421875, -0.397857666015625, -0.27532958984375, -0.152801513671875, -0.0302734375, 0.092254638671875, 0.21478271484375, 0.337310791015625, 0.4598388671875, 0.582366943359375, 0.70489501953125, 0.827423095703125, 0.949951171875, 1.072479248046875, 1.19500732421875, 1.317535400390625, 1.4400634765625, 1.562591552734375, 1.68511962890625, 1.807647705078125, 1.93017578125, 2.052703857421875, 2.17523193359375, 2.297760009765625, 2.4202880859375, 2.542816162109375, 2.66534423828125, 2.787872314453125, 2.910400390625, 3.032928466796875, 3.15545654296875, 3.277984619140625, 3.4005126953125, 3.523040771484375, 3.64556884765625, 3.768096923828125, 3.890625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 1.0, 6.0, 4.0, 5.0, 9.0, 12.0, 19.0, 14.0, 21.0, 40.0, 50.0, 85.0, 121.0, 160.0, 250.0, 506.0, 882.0, 1649.0, 3173.0, 6326.0, 12526.0, 25750.0, 54542.0, 115293.0, 244502.0, 302771.0, 146730.0, 68705.0, 32236.0, 15839.0, 7691.0, 3978.0, 2060.0, 1084.0, 593.0, 327.0, 202.0, 117.0, 70.0, 41.0, 46.0, 30.0, 18.0, 23.0, 10.0, 12.0, 13.0, 4.0, 1.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.39453125, -4.25787353515625, -4.1212158203125, -3.98455810546875, -3.847900390625, -3.71124267578125, -3.5745849609375, -3.43792724609375, -3.30126953125, -3.16461181640625, -3.0279541015625, -2.89129638671875, -2.754638671875, -2.61798095703125, -2.4813232421875, -2.34466552734375, -2.2080078125, -2.07135009765625, -1.9346923828125, -1.79803466796875, -1.661376953125, -1.52471923828125, -1.3880615234375, -1.25140380859375, -1.11474609375, -0.97808837890625, -0.8414306640625, -0.70477294921875, -0.568115234375, -0.43145751953125, -0.2947998046875, -0.15814208984375, -0.021484375, 0.11517333984375, 0.2518310546875, 0.38848876953125, 0.525146484375, 0.66180419921875, 0.7984619140625, 0.93511962890625, 1.07177734375, 1.20843505859375, 1.3450927734375, 1.48175048828125, 1.618408203125, 1.75506591796875, 1.8917236328125, 2.02838134765625, 2.1650390625, 2.30169677734375, 2.4383544921875, 2.57501220703125, 2.711669921875, 2.84832763671875, 2.9849853515625, 3.12164306640625, 3.25830078125, 3.39495849609375, 3.5316162109375, 3.66827392578125, 3.804931640625, 3.94158935546875, 4.0782470703125, 4.21490478515625, 4.3515625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 8.0, 5.0, 10.0, 15.0, 11.0, 11.0, 20.0, 18.0, 24.0, 21.0, 30.0, 39.0, 50.0, 46.0, 68.0, 58.0, 93.0, 173.0, 837.0, 811.0, 173.0, 81.0, 66.0, 60.0, 48.0, 33.0, 29.0, 33.0, 26.0, 22.0, 28.0, 19.0, 11.0, 8.0, 6.0, 15.0, 7.0, 3.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-13.5078125, -13.085693359375, -12.66357421875, -12.241455078125, -11.8193359375, -11.397216796875, -10.97509765625, -10.552978515625, -10.130859375, -9.708740234375, -9.28662109375, -8.864501953125, -8.4423828125, -8.020263671875, -7.59814453125, -7.176025390625, -6.75390625, -6.331787109375, -5.90966796875, -5.487548828125, -5.0654296875, -4.643310546875, -4.22119140625, -3.799072265625, -3.376953125, -2.954833984375, -2.53271484375, -2.110595703125, -1.6884765625, -1.266357421875, -0.84423828125, -0.422119140625, 0.0, 0.422119140625, 0.84423828125, 1.266357421875, 1.6884765625, 2.110595703125, 2.53271484375, 2.954833984375, 3.376953125, 3.799072265625, 4.22119140625, 4.643310546875, 5.0654296875, 5.487548828125, 5.90966796875, 6.331787109375, 6.75390625, 7.176025390625, 7.59814453125, 8.020263671875, 8.4423828125, 8.864501953125, 9.28662109375, 9.708740234375, 10.130859375, 10.552978515625, 10.97509765625, 11.397216796875, 11.8193359375, 12.241455078125, 12.66357421875, 13.085693359375, 13.5078125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 3.0, 11.0, 25.0, 24.0, 32.0, 60.0, 78.0, 128.0, 222.0, 389.0, 777.0, 16195.0, 3119626.0, 6459.0, 739.0, 364.0, 196.0, 107.0, 90.0, 48.0, 32.0, 21.0, 23.0, 11.0, 5.0, 6.0, 5.0, 6.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.1875, -80.96435546875, -78.7412109375, -76.51806640625, -74.294921875, -72.07177734375, -69.8486328125, -67.62548828125, -65.40234375, -63.17919921875, -60.9560546875, -58.73291015625, -56.509765625, -54.28662109375, -52.0634765625, -49.84033203125, -47.6171875, -45.39404296875, -43.1708984375, -40.94775390625, -38.724609375, -36.50146484375, -34.2783203125, -32.05517578125, -29.83203125, -27.60888671875, -25.3857421875, -23.16259765625, -20.939453125, -18.71630859375, -16.4931640625, -14.27001953125, -12.046875, -9.82373046875, -7.6005859375, -5.37744140625, -3.154296875, -0.93115234375, 1.2919921875, 3.51513671875, 5.73828125, 7.96142578125, 10.1845703125, 12.40771484375, 14.630859375, 16.85400390625, 19.0771484375, 21.30029296875, 23.5234375, 25.74658203125, 27.9697265625, 30.19287109375, 32.416015625, 34.63916015625, 36.8623046875, 39.08544921875, 41.30859375, 43.53173828125, 45.7548828125, 47.97802734375, 50.201171875, 52.42431640625, 54.6474609375, 56.87060546875, 59.09375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 98.0, 576.0, 319.0, 22.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-233.8211669921875, -229.3029327392578, -224.78469848632812, -220.2664794921875, -215.7482452392578, -211.23001098632812, -206.71177673339844, -202.19354248046875, -197.67530822753906, -193.15707397460938, -188.6388397216797, -184.12060546875, -179.60238647460938, -175.0841522216797, -170.56591796875, -166.0476837158203, -161.52944946289062, -157.01121520996094, -152.49298095703125, -147.97476196289062, -143.45652770996094, -138.93829345703125, -134.42005920410156, -129.90182495117188, -125.38360595703125, -120.86537170410156, -116.3471450805664, -111.82891082763672, -107.31067657470703, -102.79244995117188, -98.27421569824219, -93.7559814453125, -89.23773956298828, -84.7195053100586, -80.20127868652344, -75.68304443359375, -71.16481018066406, -66.64657592773438, -62.12834930419922, -57.61011505126953, -53.09188461303711, -48.57365417480469, -44.055419921875, -39.53718948364258, -35.018959045410156, -30.50072479248047, -25.982494354248047, -21.464262008666992, -16.946029663085938, -12.427797317504883, -7.9095659255981445, -3.3913345336914062, 1.1268978118896484, 5.645130157470703, 10.163360595703125, 14.68159294128418, 19.199825286865234, 23.71805763244629, 28.236289978027344, 32.754520416259766, 37.27275085449219, 41.790985107421875, 46.3092155456543, 50.82744598388672, 55.345680236816406]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 10.0, 2.0, 8.0, 7.0, 8.0, 13.0, 14.0, 18.0, 24.0, 19.0, 17.0, 29.0, 23.0, 32.0, 47.0, 31.0, 39.0, 33.0, 53.0, 48.0, 39.0, 43.0, 38.0, 40.0, 44.0, 44.0, 44.0, 38.0, 35.0, 28.0, 27.0, 18.0, 12.0, 21.0, 10.0, 12.0, 7.0, 14.0, 3.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.29620361328125, -32.120670318603516, -30.945138931274414, -29.769607543945312, -28.594074249267578, -27.418542861938477, -26.243011474609375, -25.06747817993164, -23.89194679260254, -22.716415405273438, -21.540882110595703, -20.3653507232666, -19.1898193359375, -18.014286041259766, -16.838754653930664, -15.663222312927246, -14.487689971923828, -13.31215763092041, -12.136625289916992, -10.96109390258789, -9.785561561584473, -8.610029220581055, -7.434497356414795, -6.258965492248535, -5.083433151245117, -3.9079010486602783, -2.7323689460754395, -1.5568368434906006, -0.3813047409057617, 0.7942276000976562, 1.969759464263916, 3.145291328430176, 4.320823669433594, 5.496356010437012, 6.6718878746032715, 7.847419738769531, 9.02295207977295, 10.198484420776367, 11.374015808105469, 12.549548149108887, 13.725080490112305, 14.900612831115723, 16.07614517211914, 17.251676559448242, 18.427207946777344, 19.602741241455078, 20.77827262878418, 21.95380401611328, 23.129337310791016, 24.304868698120117, 25.48040199279785, 26.655933380126953, 27.831466674804688, 29.00699806213379, 30.18252944946289, 31.358062744140625, 32.533592224121094, 33.70912551879883, 34.8846549987793, 36.06018829345703, 37.235721588134766, 38.4112548828125, 39.58678436279297, 40.7623176574707, 41.93785095214844]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 11.0, 2.0, 10.0, 11.0, 9.0, 11.0, 8.0, 20.0, 30.0, 26.0, 24.0, 34.0, 38.0, 33.0, 40.0, 38.0, 41.0, 49.0, 51.0, 46.0, 35.0, 43.0, 42.0, 32.0, 26.0, 33.0, 30.0, 26.0, 29.0, 29.0, 20.0, 22.0, 13.0, 18.0, 16.0, 16.0, 10.0, 7.0, 6.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8046875, -4.661865234375, -4.51904296875, -4.376220703125, -4.2333984375, -4.090576171875, -3.94775390625, -3.804931640625, -3.662109375, -3.519287109375, -3.37646484375, -3.233642578125, -3.0908203125, -2.947998046875, -2.80517578125, -2.662353515625, -2.51953125, -2.376708984375, -2.23388671875, -2.091064453125, -1.9482421875, -1.805419921875, -1.66259765625, -1.519775390625, -1.376953125, -1.234130859375, -1.09130859375, -0.948486328125, -0.8056640625, -0.662841796875, -0.52001953125, -0.377197265625, -0.234375, -0.091552734375, 0.05126953125, 0.194091796875, 0.3369140625, 0.479736328125, 0.62255859375, 0.765380859375, 0.908203125, 1.051025390625, 1.19384765625, 1.336669921875, 1.4794921875, 1.622314453125, 1.76513671875, 1.907958984375, 2.05078125, 2.193603515625, 2.33642578125, 2.479248046875, 2.6220703125, 2.764892578125, 2.90771484375, 3.050537109375, 3.193359375, 3.336181640625, 3.47900390625, 3.621826171875, 3.7646484375, 3.907470703125, 4.05029296875, 4.193115234375, 4.3359375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 7.0, 3.0, 9.0, 14.0, 20.0, 16.0, 35.0, 43.0, 64.0, 109.0, 175.0, 301.0, 739.0, 2781.0, 19060.0, 191538.0, 1447748.0, 2085247.0, 399385.0, 39148.0, 5240.0, 1359.0, 468.0, 280.0, 159.0, 99.0, 67.0, 55.0, 39.0, 30.0, 12.0, 12.0, 9.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.453125, -12.1351318359375, -11.817138671875, -11.4991455078125, -11.18115234375, -10.8631591796875, -10.545166015625, -10.2271728515625, -9.9091796875, -9.5911865234375, -9.273193359375, -8.9552001953125, -8.63720703125, -8.3192138671875, -8.001220703125, -7.6832275390625, -7.365234375, -7.0472412109375, -6.729248046875, -6.4112548828125, -6.09326171875, -5.7752685546875, -5.457275390625, -5.1392822265625, -4.8212890625, -4.5032958984375, -4.185302734375, -3.8673095703125, -3.54931640625, -3.2313232421875, -2.913330078125, -2.5953369140625, -2.27734375, -1.9593505859375, -1.641357421875, -1.3233642578125, -1.00537109375, -0.6873779296875, -0.369384765625, -0.0513916015625, 0.2666015625, 0.5845947265625, 0.902587890625, 1.2205810546875, 1.53857421875, 1.8565673828125, 2.174560546875, 2.4925537109375, 2.810546875, 3.1285400390625, 3.446533203125, 3.7645263671875, 4.08251953125, 4.4005126953125, 4.718505859375, 5.0364990234375, 5.3544921875, 5.6724853515625, 5.990478515625, 6.3084716796875, 6.62646484375, 6.9444580078125, 7.262451171875, 7.5804443359375, 7.8984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 14.0, 21.0, 20.0, 36.0, 36.0, 47.0, 72.0, 90.0, 118.0, 168.0, 239.0, 259.0, 349.0, 343.0, 386.0, 386.0, 358.0, 268.0, 203.0, 136.0, 123.0, 104.0, 74.0, 55.0, 36.0, 26.0, 27.0, 12.0, 17.0, 12.0, 9.0, 5.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3203125, -8.0377197265625, -7.755126953125, -7.4725341796875, -7.18994140625, -6.9073486328125, -6.624755859375, -6.3421630859375, -6.0595703125, -5.7769775390625, -5.494384765625, -5.2117919921875, -4.92919921875, -4.6466064453125, -4.364013671875, -4.0814208984375, -3.798828125, -3.5162353515625, -3.233642578125, -2.9510498046875, -2.66845703125, -2.3858642578125, -2.103271484375, -1.8206787109375, -1.5380859375, -1.2554931640625, -0.972900390625, -0.6903076171875, -0.40771484375, -0.1251220703125, 0.157470703125, 0.4400634765625, 0.72265625, 1.0052490234375, 1.287841796875, 1.5704345703125, 1.85302734375, 2.1356201171875, 2.418212890625, 2.7008056640625, 2.9833984375, 3.2659912109375, 3.548583984375, 3.8311767578125, 4.11376953125, 4.3963623046875, 4.678955078125, 4.9615478515625, 5.244140625, 5.5267333984375, 5.809326171875, 6.0919189453125, 6.37451171875, 6.6571044921875, 6.939697265625, 7.2222900390625, 7.5048828125, 7.7874755859375, 8.070068359375, 8.3526611328125, 8.63525390625, 8.9178466796875, 9.200439453125, 9.4830322265625, 9.765625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 5.0, 5.0, 14.0, 13.0, 18.0, 18.0, 27.0, 33.0, 56.0, 78.0, 114.0, 160.0, 199.0, 345.0, 573.0, 3316.0, 277976.0, 3772297.0, 135372.0, 2200.0, 494.0, 326.0, 177.0, 137.0, 102.0, 60.0, 43.0, 34.0, 26.0, 25.0, 16.0, 7.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.46875, -32.467529296875, -31.46630859375, -30.465087890625, -29.4638671875, -28.462646484375, -27.46142578125, -26.460205078125, -25.458984375, -24.457763671875, -23.45654296875, -22.455322265625, -21.4541015625, -20.452880859375, -19.45166015625, -18.450439453125, -17.44921875, -16.447998046875, -15.44677734375, -14.445556640625, -13.4443359375, -12.443115234375, -11.44189453125, -10.440673828125, -9.439453125, -8.438232421875, -7.43701171875, -6.435791015625, -5.4345703125, -4.433349609375, -3.43212890625, -2.430908203125, -1.4296875, -0.428466796875, 0.57275390625, 1.573974609375, 2.5751953125, 3.576416015625, 4.57763671875, 5.578857421875, 6.580078125, 7.581298828125, 8.58251953125, 9.583740234375, 10.5849609375, 11.586181640625, 12.58740234375, 13.588623046875, 14.58984375, 15.591064453125, 16.59228515625, 17.593505859375, 18.5947265625, 19.595947265625, 20.59716796875, 21.598388671875, 22.599609375, 23.600830078125, 24.60205078125, 25.603271484375, 26.6044921875, 27.605712890625, 28.60693359375, 29.608154296875, 30.609375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 11.0, 10.0, 26.0, 60.0, 92.0, 127.0, 141.0, 161.0, 140.0, 104.0, 70.0, 34.0, 25.0, 4.0, 5.0, 4.0, 2.0], "bins": [-110.89139556884766, -108.84294128417969, -106.79449462890625, -104.74604034423828, -102.69759368896484, -100.64913940429688, -98.60069274902344, -96.55223846435547, -94.5037841796875, -92.45532989501953, -90.4068832397461, -88.35842895507812, -86.30998229980469, -84.26152801513672, -82.21308135986328, -80.16462707519531, -78.11618041992188, -76.0677261352539, -74.01927947998047, -71.9708251953125, -69.92237854003906, -67.8739242553711, -65.82547760009766, -63.77702331542969, -61.728572845458984, -59.68012237548828, -57.63167190551758, -55.583221435546875, -53.534767150878906, -51.48632049560547, -49.4378662109375, -47.3894157409668, -45.34095764160156, -43.29250717163086, -41.244056701660156, -39.19560623168945, -37.14715576171875, -35.09870147705078, -33.05025100708008, -31.001800537109375, -28.953350067138672, -26.90489959716797, -24.856449127197266, -22.80799674987793, -20.759546279907227, -18.711095809936523, -16.662643432617188, -14.614192962646484, -12.565742492675781, -10.517292022705078, -8.468840599060059, -6.420389652252197, -4.371938705444336, -2.323488235473633, -0.2750368118286133, 1.7734146118164062, 3.8218650817871094, 5.870316028594971, 7.918766975402832, 9.967218399047852, 12.015668869018555, 14.064119338989258, 16.112571716308594, 18.161022186279297, 20.20947265625]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 7.0, 7.0, 6.0, 8.0, 19.0, 13.0, 19.0, 31.0, 15.0, 18.0, 10.0, 19.0, 30.0, 39.0, 27.0, 35.0, 43.0, 39.0, 52.0, 50.0, 53.0, 39.0, 37.0, 33.0, 40.0, 38.0, 42.0, 27.0, 20.0, 35.0, 31.0, 18.0, 21.0, 14.0, 13.0, 9.0, 5.0, 10.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-30.64522933959961, -29.68155288696289, -28.717876434326172, -27.754199981689453, -26.790525436401367, -25.82684898376465, -24.86317253112793, -23.89949607849121, -22.935819625854492, -21.972143173217773, -21.008466720581055, -20.04479217529297, -19.08111572265625, -18.11743927001953, -17.153762817382812, -16.190086364746094, -15.226410865783691, -14.262734413146973, -13.29905891418457, -12.335382461547852, -11.371706008911133, -10.408029556274414, -9.444354057312012, -8.480677604675293, -7.517001628875732, -6.553325653076172, -5.589649200439453, -4.625973224639893, -3.662297010421753, -2.6986207962036133, -1.7349448204040527, -0.771268367767334, 0.19240760803222656, 1.1560838222503662, 2.119760036468506, 3.0834360122680664, 4.047112464904785, 5.010788440704346, 5.974464416503906, 6.938140869140625, 7.9018168449401855, 8.865492820739746, 9.829169273376465, 10.792844772338867, 11.756521224975586, 12.720197677612305, 13.683874130249023, 14.647550582885742, 15.611226081848145, 16.574901580810547, 17.538578033447266, 18.502254486083984, 19.465930938720703, 20.429607391357422, 21.39328384399414, 22.35696029663086, 23.320634841918945, 24.284311294555664, 25.247987747192383, 26.21166229248047, 27.175338745117188, 28.139015197753906, 29.102691650390625, 30.066368103027344, 31.030044555664062]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 3.0, 6.0, 11.0, 9.0, 14.0, 20.0, 20.0, 18.0, 25.0, 32.0, 30.0, 48.0, 35.0, 35.0, 34.0, 34.0, 36.0, 41.0, 37.0, 45.0, 31.0, 44.0, 34.0, 42.0, 37.0, 34.0, 25.0, 23.0, 18.0, 28.0, 24.0, 19.0, 12.0, 12.0, 12.0, 13.0, 10.0, 12.0, 6.0, 6.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.27734375, -4.1483154296875, -4.019287109375, -3.8902587890625, -3.76123046875, -3.6322021484375, -3.503173828125, -3.3741455078125, -3.2451171875, -3.1160888671875, -2.987060546875, -2.8580322265625, -2.72900390625, -2.5999755859375, -2.470947265625, -2.3419189453125, -2.212890625, -2.0838623046875, -1.954833984375, -1.8258056640625, -1.69677734375, -1.5677490234375, -1.438720703125, -1.3096923828125, -1.1806640625, -1.0516357421875, -0.922607421875, -0.7935791015625, -0.66455078125, -0.5355224609375, -0.406494140625, -0.2774658203125, -0.1484375, -0.0194091796875, 0.109619140625, 0.2386474609375, 0.36767578125, 0.4967041015625, 0.625732421875, 0.7547607421875, 0.8837890625, 1.0128173828125, 1.141845703125, 1.2708740234375, 1.39990234375, 1.5289306640625, 1.657958984375, 1.7869873046875, 1.916015625, 2.0450439453125, 2.174072265625, 2.3031005859375, 2.43212890625, 2.5611572265625, 2.690185546875, 2.8192138671875, 2.9482421875, 3.0772705078125, 3.206298828125, 3.3353271484375, 3.46435546875, 3.5933837890625, 3.722412109375, 3.8514404296875, 3.98046875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 10.0, 25.0, 27.0, 29.0, 69.0, 81.0, 143.0, 208.0, 303.0, 442.0, 605.0, 881.0, 1247.0, 1860.0, 2701.0, 4018.0, 5545.0, 8368.0, 12369.0, 18147.0, 27198.0, 40173.0, 58645.0, 83028.0, 113279.0, 139424.0, 140288.0, 114685.0, 85366.0, 60304.0, 41954.0, 28176.0, 18863.0, 12852.0, 8744.0, 5838.0, 3872.0, 2715.0, 1889.0, 1269.0, 898.0, 648.0, 438.0, 289.0, 209.0, 150.0, 104.0, 72.0, 42.0, 34.0, 17.0, 8.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.279815673828125, -0.26983642578125, -0.259857177734375, -0.2498779296875, -0.239898681640625, -0.22991943359375, -0.219940185546875, -0.2099609375, -0.199981689453125, -0.19000244140625, -0.180023193359375, -0.1700439453125, -0.160064697265625, -0.15008544921875, -0.140106201171875, -0.130126953125, -0.120147705078125, -0.11016845703125, -0.100189208984375, -0.0902099609375, -0.080230712890625, -0.07025146484375, -0.060272216796875, -0.05029296875, -0.040313720703125, -0.03033447265625, -0.020355224609375, -0.0103759765625, -0.000396728515625, 0.00958251953125, 0.019561767578125, 0.029541015625, 0.039520263671875, 0.04949951171875, 0.059478759765625, 0.0694580078125, 0.079437255859375, 0.08941650390625, 0.099395751953125, 0.109375, 0.119354248046875, 0.12933349609375, 0.139312744140625, 0.1492919921875, 0.159271240234375, 0.16925048828125, 0.179229736328125, 0.189208984375, 0.199188232421875, 0.20916748046875, 0.219146728515625, 0.2291259765625, 0.239105224609375, 0.24908447265625, 0.259063720703125, 0.26904296875, 0.279022216796875, 0.28900146484375, 0.298980712890625, 0.3089599609375, 0.318939208984375, 0.32891845703125, 0.338897705078125, 0.348876953125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 0.0, 4.0, 6.0, 5.0, 3.0, 11.0, 18.0, 12.0, 20.0, 22.0, 21.0, 30.0, 25.0, 24.0, 22.0, 44.0, 42.0, 54.0, 38.0, 42.0, 34.0, 1071.0, 46.0, 43.0, 47.0, 30.0, 26.0, 44.0, 31.0, 29.0, 26.0, 24.0, 25.0, 16.0, 16.0, 10.0, 14.0, 9.0, 7.0, 7.0, 6.0, 4.0, 10.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.021484375, -2.931488037109375, -2.84149169921875, -2.751495361328125, -2.6614990234375, -2.571502685546875, -2.48150634765625, -2.391510009765625, -2.301513671875, -2.211517333984375, -2.12152099609375, -2.031524658203125, -1.9415283203125, -1.851531982421875, -1.76153564453125, -1.671539306640625, -1.58154296875, -1.491546630859375, -1.40155029296875, -1.311553955078125, -1.2215576171875, -1.131561279296875, -1.04156494140625, -0.951568603515625, -0.861572265625, -0.771575927734375, -0.68157958984375, -0.591583251953125, -0.5015869140625, -0.411590576171875, -0.32159423828125, -0.231597900390625, -0.1416015625, -0.051605224609375, 0.03839111328125, 0.128387451171875, 0.2183837890625, 0.308380126953125, 0.39837646484375, 0.488372802734375, 0.578369140625, 0.668365478515625, 0.75836181640625, 0.848358154296875, 0.9383544921875, 1.028350830078125, 1.11834716796875, 1.208343505859375, 1.29833984375, 1.388336181640625, 1.47833251953125, 1.568328857421875, 1.6583251953125, 1.748321533203125, 1.83831787109375, 1.928314208984375, 2.018310546875, 2.108306884765625, 2.19830322265625, 2.288299560546875, 2.3782958984375, 2.468292236328125, 2.55828857421875, 2.648284912109375, 2.73828125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 7.0, 7.0, 8.0, 13.0, 14.0, 25.0, 47.0, 52.0, 85.0, 121.0, 191.0, 276.0, 442.0, 643.0, 1032.0, 1615.0, 2449.0, 3797.0, 5863.0, 9368.0, 14698.0, 22579.0, 34061.0, 50936.0, 74713.0, 104396.0, 139234.0, 1189462.0, 131708.0, 100064.0, 71112.0, 47819.0, 31770.0, 20821.0, 13343.0, 8632.0, 5503.0, 3542.0, 2306.0, 1545.0, 930.0, 617.0, 450.0, 279.0, 190.0, 127.0, 78.0, 56.0, 44.0, 27.0, 15.0, 9.0, 5.0, 9.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2130126953125, -0.20623397827148438, -0.19945526123046875, -0.19267654418945312, -0.1858978271484375, -0.17911911010742188, -0.17234039306640625, -0.16556167602539062, -0.158782958984375, -0.15200424194335938, -0.14522552490234375, -0.13844680786132812, -0.1316680908203125, -0.12488937377929688, -0.11811065673828125, -0.11133193969726562, -0.10455322265625, -0.09777450561523438, -0.09099578857421875, -0.08421707153320312, -0.0774383544921875, -0.07065963745117188, -0.06388092041015625, -0.057102203369140625, -0.050323486328125, -0.043544769287109375, -0.03676605224609375, -0.029987335205078125, -0.0232086181640625, -0.016429901123046875, -0.00965118408203125, -0.002872467041015625, 0.00390625, 0.010684967041015625, 0.01746368408203125, 0.024242401123046875, 0.0310211181640625, 0.037799835205078125, 0.04457855224609375, 0.051357269287109375, 0.058135986328125, 0.06491470336914062, 0.07169342041015625, 0.07847213745117188, 0.0852508544921875, 0.09202957153320312, 0.09880828857421875, 0.10558700561523438, 0.11236572265625, 0.11914443969726562, 0.12592315673828125, 0.13270187377929688, 0.1394805908203125, 0.14625930786132812, 0.15303802490234375, 0.15981674194335938, 0.166595458984375, 0.17337417602539062, 0.18015289306640625, 0.18693161010742188, 0.1937103271484375, 0.20048904418945312, 0.20726776123046875, 0.21404647827148438, 0.2208251953125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 7.0, 6.0, 4.0, 13.0, 8.0, 8.0, 14.0, 15.0, 20.0, 20.0, 39.0, 45.0, 55.0, 50.0, 85.0, 107.0, 90.0, 96.0, 64.0, 48.0, 41.0, 39.0, 19.0, 21.0, 16.0, 12.0, 12.0, 11.0, 6.0, 6.0, 7.0, 5.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01111602783203125, -0.010759234428405762, -0.010402441024780273, -0.010045647621154785, -0.009688854217529297, -0.009332060813903809, -0.00897526741027832, -0.008618474006652832, -0.008261680603027344, -0.007904887199401855, -0.007548093795776367, -0.007191300392150879, -0.006834506988525391, -0.006477713584899902, -0.006120920181274414, -0.005764126777648926, -0.0054073333740234375, -0.005050539970397949, -0.004693746566772461, -0.004336953163146973, -0.003980159759521484, -0.003623366355895996, -0.003266572952270508, -0.0029097795486450195, -0.0025529861450195312, -0.002196192741394043, -0.0018393993377685547, -0.0014826059341430664, -0.0011258125305175781, -0.0007690191268920898, -0.00041222572326660156, -5.543231964111328e-05, 0.000301361083984375, 0.0006581544876098633, 0.0010149478912353516, 0.0013717412948608398, 0.0017285346984863281, 0.0020853281021118164, 0.0024421215057373047, 0.002798914909362793, 0.0031557083129882812, 0.0035125017166137695, 0.003869295120239258, 0.004226088523864746, 0.004582881927490234, 0.004939675331115723, 0.005296468734741211, 0.005653262138366699, 0.0060100555419921875, 0.006366848945617676, 0.006723642349243164, 0.007080435752868652, 0.007437229156494141, 0.007794022560119629, 0.008150815963745117, 0.008507609367370605, 0.008864402770996094, 0.009221196174621582, 0.00957798957824707, 0.009934782981872559, 0.010291576385498047, 0.010648369789123535, 0.011005163192749023, 0.011361956596374512, 0.01171875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 10.0, 5.0, 13.0, 13.0, 16.0, 21.0, 26.0, 32.0, 44.0, 58.0, 105.0, 162.0, 477.0, 7244.0, 959456.0, 78625.0, 1525.0, 262.0, 121.0, 91.0, 71.0, 33.0, 32.0, 18.0, 18.0, 15.0, 6.0, 9.0, 12.0, 7.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.2548828125, -0.24754905700683594, -0.24021530151367188, -0.2328815460205078, -0.22554779052734375, -0.2182140350341797, -0.21088027954101562, -0.20354652404785156, -0.1962127685546875, -0.18887901306152344, -0.18154525756835938, -0.1742115020751953, -0.16687774658203125, -0.1595439910888672, -0.15221023559570312, -0.14487648010253906, -0.137542724609375, -0.13020896911621094, -0.12287521362304688, -0.11554145812988281, -0.10820770263671875, -0.10087394714355469, -0.09354019165039062, -0.08620643615722656, -0.0788726806640625, -0.07153892517089844, -0.06420516967773438, -0.05687141418457031, -0.04953765869140625, -0.04220390319824219, -0.034870147705078125, -0.027536392211914062, -0.02020263671875, -0.012868881225585938, -0.005535125732421875, 0.0017986297607421875, 0.00913238525390625, 0.016466140747070312, 0.023799896240234375, 0.031133651733398438, 0.0384674072265625, 0.04580116271972656, 0.053134918212890625, 0.06046867370605469, 0.06780242919921875, 0.07513618469238281, 0.08246994018554688, 0.08980369567871094, 0.097137451171875, 0.10447120666503906, 0.11180496215820312, 0.11913871765136719, 0.12647247314453125, 0.1338062286376953, 0.14113998413085938, 0.14847373962402344, 0.1558074951171875, 0.16314125061035156, 0.17047500610351562, 0.1778087615966797, 0.18514251708984375, 0.1924762725830078, 0.19981002807617188, 0.20714378356933594, 0.2144775390625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 10.0, 13.0, 29.0, 81.0, 202.0, 343.0, 175.0, 73.0, 39.0, 20.0, 8.0, 8.0, 3.0, 0.0, 0.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016347967088222504, -0.015122907236218452, -0.013897846452891827, -0.0126727856695652, -0.01144772581756115, -0.010222665965557098, -0.008997605182230473, -0.007772544398903847, -0.0065474845468997955, -0.005322424229234457, -0.0040973639115691185, -0.00287230359390378, -0.0016472432762384415, -0.00042218295857310295, 0.0008028773590922356, 0.0020279381424188614, 0.0032529979944229126, 0.004478058312088251, 0.00570311862975359, 0.006928178947418928, 0.008153239265084267, 0.009378299117088318, 0.010603359900414944, 0.01182842068374157, 0.01305348053574562, 0.014278540387749672, 0.015503601171076298, 0.016728661954402924, 0.017953721806406975, 0.019178781658411026, 0.020403843373060226, 0.021628903225064278, 0.02285396307706833, 0.02407902292907238, 0.02530408278107643, 0.02652914449572563, 0.027754204347729683, 0.028979264199733734, 0.030204325914382935, 0.031429387629032135, 0.03265444561839104, 0.03387950733304024, 0.03510456532239914, 0.03632962703704834, 0.03755468875169754, 0.03877974674105644, 0.04000480845570564, 0.041229866445064545, 0.042454928159713745, 0.043679989874362946, 0.04490504786372185, 0.04613010957837105, 0.04735516756772995, 0.04858022928237915, 0.04980529099702835, 0.05103035271167755, 0.05225541070103645, 0.053480472415685654, 0.054705530405044556, 0.055930592119693756, 0.05715565383434296, 0.05838071182370186, 0.05960577353835106, 0.06083083152770996, 0.06205589324235916]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 1.0, 8.0, 8.0, 7.0, 9.0, 6.0, 7.0, 13.0, 11.0, 22.0, 14.0, 19.0, 18.0, 14.0, 22.0, 23.0, 18.0, 33.0, 20.0, 37.0, 35.0, 37.0, 42.0, 33.0, 34.0, 28.0, 33.0, 38.0, 30.0, 36.0, 17.0, 29.0, 27.0, 32.0, 25.0, 24.0, 24.0, 24.0, 20.0, 16.0, 14.0, 14.0, 11.0, 11.0, 8.0, 17.0, 12.0, 1.0, 5.0, 3.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.010185658931732178, -0.009859631769359112, -0.009533604606986046, -0.00920757744461298, -0.008881550282239914, -0.008555523119866848, -0.008229495957493782, -0.007903468795120716, -0.00757744163274765, -0.007251414470374584, -0.006925387308001518, -0.006599360145628452, -0.006273332983255386, -0.00594730582088232, -0.0056212786585092545, -0.0052952514961361885, -0.0049692243337631226, -0.004643197171390057, -0.004317170009016991, -0.003991142846643925, -0.0036651156842708588, -0.003339088521897793, -0.003013061359524727, -0.002687034197151661, -0.002361007034778595, -0.002034979872405529, -0.001708952710032463, -0.0013829255476593971, -0.0010568983852863312, -0.0007308712229132652, -0.0004048440605401993, -7.881689816713333e-05, 0.0002472102642059326, 0.0005732374265789986, 0.0008992645889520645, 0.0012252917513251305, 0.0015513189136981964, 0.0018773460760712624, 0.0022033732384443283, 0.0025294004008173943, 0.00285542756319046, 0.003181454725563526, 0.003507481887936592, 0.003833509050309658, 0.004159536212682724, 0.00448556337505579, 0.004811590537428856, 0.005137617699801922, 0.005463644862174988, 0.005789672024548054, 0.00611569918692112, 0.006441726349294186, 0.006767753511667252, 0.0070937806740403175, 0.0074198078364133835, 0.007745834998786449, 0.008071862161159515, 0.008397889323532581, 0.008723916485905647, 0.009049943648278713, 0.00937597081065178, 0.009701997973024845, 0.010028025135397911, 0.010354052297770977, 0.010680079460144043]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 3.0, 6.0, 11.0, 9.0, 14.0, 20.0, 20.0, 18.0, 25.0, 32.0, 30.0, 48.0, 35.0, 35.0, 34.0, 34.0, 36.0, 41.0, 38.0, 44.0, 31.0, 44.0, 33.0, 43.0, 37.0, 34.0, 25.0, 23.0, 18.0, 28.0, 24.0, 19.0, 12.0, 12.0, 12.0, 13.0, 11.0, 11.0, 6.0, 6.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.27734375, -4.1483154296875, -4.019287109375, -3.8902587890625, -3.76123046875, -3.6322021484375, -3.503173828125, -3.3741455078125, -3.2451171875, -3.1160888671875, -2.987060546875, -2.8580322265625, -2.72900390625, -2.5999755859375, -2.470947265625, -2.3419189453125, -2.212890625, -2.0838623046875, -1.954833984375, -1.8258056640625, -1.69677734375, -1.5677490234375, -1.438720703125, -1.3096923828125, -1.1806640625, -1.0516357421875, -0.922607421875, -0.7935791015625, -0.66455078125, -0.5355224609375, -0.406494140625, -0.2774658203125, -0.1484375, -0.0194091796875, 0.109619140625, 0.2386474609375, 0.36767578125, 0.4967041015625, 0.625732421875, 0.7547607421875, 0.8837890625, 1.0128173828125, 1.141845703125, 1.2708740234375, 1.39990234375, 1.5289306640625, 1.657958984375, 1.7869873046875, 1.916015625, 2.0450439453125, 2.174072265625, 2.3031005859375, 2.43212890625, 2.5611572265625, 2.690185546875, 2.8192138671875, 2.9482421875, 3.0772705078125, 3.206298828125, 3.3353271484375, 3.46435546875, 3.5933837890625, 3.722412109375, 3.8514404296875, 3.98046875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 7.0, 5.0, 14.0, 21.0, 27.0, 43.0, 49.0, 72.0, 132.0, 196.0, 274.0, 496.0, 843.0, 1428.0, 2670.0, 5430.0, 11892.0, 28221.0, 66969.0, 150508.0, 335358.0, 246802.0, 110602.0, 48514.0, 20340.0, 8663.0, 4022.0, 2029.0, 1130.0, 649.0, 404.0, 233.0, 137.0, 105.0, 80.0, 53.0, 41.0, 19.0, 22.0, 17.0, 12.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3515625, -4.20556640625, -4.0595703125, -3.91357421875, -3.767578125, -3.62158203125, -3.4755859375, -3.32958984375, -3.18359375, -3.03759765625, -2.8916015625, -2.74560546875, -2.599609375, -2.45361328125, -2.3076171875, -2.16162109375, -2.015625, -1.86962890625, -1.7236328125, -1.57763671875, -1.431640625, -1.28564453125, -1.1396484375, -0.99365234375, -0.84765625, -0.70166015625, -0.5556640625, -0.40966796875, -0.263671875, -0.11767578125, 0.0283203125, 0.17431640625, 0.3203125, 0.46630859375, 0.6123046875, 0.75830078125, 0.904296875, 1.05029296875, 1.1962890625, 1.34228515625, 1.48828125, 1.63427734375, 1.7802734375, 1.92626953125, 2.072265625, 2.21826171875, 2.3642578125, 2.51025390625, 2.65625, 2.80224609375, 2.9482421875, 3.09423828125, 3.240234375, 3.38623046875, 3.5322265625, 3.67822265625, 3.82421875, 3.97021484375, 4.1162109375, 4.26220703125, 4.408203125, 4.55419921875, 4.7001953125, 4.84619140625, 4.9921875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 9.0, 5.0, 6.0, 11.0, 13.0, 16.0, 20.0, 14.0, 23.0, 28.0, 22.0, 30.0, 41.0, 51.0, 46.0, 67.0, 107.0, 197.0, 1466.0, 294.0, 124.0, 68.0, 63.0, 57.0, 51.0, 35.0, 29.0, 30.0, 29.0, 17.0, 18.0, 17.0, 12.0, 10.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8125, -14.2783203125, -13.744140625, -13.2099609375, -12.67578125, -12.1416015625, -11.607421875, -11.0732421875, -10.5390625, -10.0048828125, -9.470703125, -8.9365234375, -8.40234375, -7.8681640625, -7.333984375, -6.7998046875, -6.265625, -5.7314453125, -5.197265625, -4.6630859375, -4.12890625, -3.5947265625, -3.060546875, -2.5263671875, -1.9921875, -1.4580078125, -0.923828125, -0.3896484375, 0.14453125, 0.6787109375, 1.212890625, 1.7470703125, 2.28125, 2.8154296875, 3.349609375, 3.8837890625, 4.41796875, 4.9521484375, 5.486328125, 6.0205078125, 6.5546875, 7.0888671875, 7.623046875, 8.1572265625, 8.69140625, 9.2255859375, 9.759765625, 10.2939453125, 10.828125, 11.3623046875, 11.896484375, 12.4306640625, 12.96484375, 13.4990234375, 14.033203125, 14.5673828125, 15.1015625, 15.6357421875, 16.169921875, 16.7041015625, 17.23828125, 17.7724609375, 18.306640625, 18.8408203125, 19.375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 11.0, 10.0, 17.0, 17.0, 21.0, 25.0, 58.0, 84.0, 111.0, 205.0, 431.0, 1257.0, 16556.0, 3119202.0, 5844.0, 945.0, 368.0, 178.0, 128.0, 76.0, 49.0, 33.0, 16.0, 15.0, 16.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.1875, -85.82861328125, -83.4697265625, -81.11083984375, -78.751953125, -76.39306640625, -74.0341796875, -71.67529296875, -69.31640625, -66.95751953125, -64.5986328125, -62.23974609375, -59.880859375, -57.52197265625, -55.1630859375, -52.80419921875, -50.4453125, -48.08642578125, -45.7275390625, -43.36865234375, -41.009765625, -38.65087890625, -36.2919921875, -33.93310546875, -31.57421875, -29.21533203125, -26.8564453125, -24.49755859375, -22.138671875, -19.77978515625, -17.4208984375, -15.06201171875, -12.703125, -10.34423828125, -7.9853515625, -5.62646484375, -3.267578125, -0.90869140625, 1.4501953125, 3.80908203125, 6.16796875, 8.52685546875, 10.8857421875, 13.24462890625, 15.603515625, 17.96240234375, 20.3212890625, 22.68017578125, 25.0390625, 27.39794921875, 29.7568359375, 32.11572265625, 34.474609375, 36.83349609375, 39.1923828125, 41.55126953125, 43.91015625, 46.26904296875, 48.6279296875, 50.98681640625, 53.345703125, 55.70458984375, 58.0634765625, 60.42236328125, 62.78125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 11.0, 110.0, 389.0, 395.0, 101.0, 9.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.951934814453125, -11.977840423583984, -9.003745079040527, -6.02964973449707, -3.0555553436279297, -0.08146095275878906, 2.8926353454589844, 5.866729736328125, 8.840824127197266, 11.814918518066406, 14.789013862609863, 17.76310920715332, 20.73720359802246, 23.7112979888916, 26.685394287109375, 29.659488677978516, 32.633583068847656, 35.6076774597168, 38.58177185058594, 41.555870056152344, 44.52996063232422, 47.504058837890625, 50.478153228759766, 53.452247619628906, 56.42634201049805, 59.40043640136719, 62.37453079223633, 65.34862518310547, 68.32272338867188, 71.29681396484375, 74.27091217041016, 77.24501037597656, 80.21910095214844, 83.19319915771484, 86.16728973388672, 89.14138793945312, 92.115478515625, 95.0895767211914, 98.06367492675781, 101.03776550292969, 104.01185607910156, 106.98595428466797, 109.96004486083984, 112.93414306640625, 115.90823364257812, 118.88233184814453, 121.85643005371094, 124.83052062988281, 127.80461883544922, 130.77871704101562, 133.7528076171875, 136.72689819335938, 139.7010040283203, 142.6750946044922, 145.64918518066406, 148.623291015625, 151.59738159179688, 154.57147216796875, 157.5455780029297, 160.51966857910156, 163.49375915527344, 166.4678497314453, 169.44195556640625, 172.41604614257812, 175.39013671875]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 10.0, 11.0, 10.0, 12.0, 20.0, 18.0, 16.0, 22.0, 26.0, 37.0, 38.0, 37.0, 48.0, 29.0, 40.0, 29.0, 60.0, 45.0, 44.0, 41.0, 46.0, 31.0, 33.0, 24.0, 42.0, 36.0, 24.0, 23.0, 22.0, 26.0, 19.0, 14.0, 17.0, 7.0, 7.0, 8.0, 5.0, 3.0, 4.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.861671447753906, -36.64950180053711, -35.43733215332031, -34.22516632080078, -33.012996673583984, -31.800827026367188, -30.58865737915039, -29.376487731933594, -28.164318084716797, -26.9521484375, -25.739980697631836, -24.52781105041504, -23.315641403198242, -22.103473663330078, -20.89130401611328, -19.679134368896484, -18.46696662902832, -17.254796981811523, -16.04262924194336, -14.830459594726562, -13.618289947509766, -12.406121253967285, -11.193952560424805, -9.981782913208008, -8.769614219665527, -7.557445049285889, -6.34527587890625, -5.1331071853637695, -3.920938014984131, -2.708768844604492, -1.4966001510620117, -0.28443050384521484, 0.9277381896972656, 2.1399073600769043, 3.352076292037964, 4.564245223999023, 5.776414394378662, 6.988583564758301, 8.200752258300781, 9.412921905517578, 10.625090599060059, 11.837259292602539, 13.049428939819336, 14.261597633361816, 15.473766326904297, 16.685935974121094, 17.89810562133789, 19.110275268554688, 20.32244300842285, 21.53461265563965, 22.746780395507812, 23.95895004272461, 25.171119689941406, 26.383289337158203, 27.595457077026367, 28.807626724243164, 30.019794464111328, 31.231964111328125, 32.44413375854492, 33.65630340576172, 34.86846923828125, 36.08063888549805, 37.292808532714844, 38.50497817993164, 39.71714782714844]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 9.0, 8.0, 4.0, 10.0, 7.0, 13.0, 13.0, 30.0, 24.0, 30.0, 27.0, 27.0, 34.0, 36.0, 28.0, 42.0, 53.0, 35.0, 45.0, 31.0, 36.0, 32.0, 34.0, 38.0, 40.0, 36.0, 33.0, 23.0, 22.0, 23.0, 25.0, 16.0, 18.0, 17.0, 20.0, 14.0, 13.0, 3.0, 5.0, 8.0, 8.0, 10.0, 3.0, 6.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5546875, -4.41680908203125, -4.2789306640625, -4.14105224609375, -4.003173828125, -3.86529541015625, -3.7274169921875, -3.58953857421875, -3.45166015625, -3.31378173828125, -3.1759033203125, -3.03802490234375, -2.900146484375, -2.76226806640625, -2.6243896484375, -2.48651123046875, -2.3486328125, -2.21075439453125, -2.0728759765625, -1.93499755859375, -1.797119140625, -1.65924072265625, -1.5213623046875, -1.38348388671875, -1.24560546875, -1.10772705078125, -0.9698486328125, -0.83197021484375, -0.694091796875, -0.55621337890625, -0.4183349609375, -0.28045654296875, -0.142578125, -0.00469970703125, 0.1331787109375, 0.27105712890625, 0.408935546875, 0.54681396484375, 0.6846923828125, 0.82257080078125, 0.96044921875, 1.09832763671875, 1.2362060546875, 1.37408447265625, 1.511962890625, 1.64984130859375, 1.7877197265625, 1.92559814453125, 2.0634765625, 2.20135498046875, 2.3392333984375, 2.47711181640625, 2.614990234375, 2.75286865234375, 2.8907470703125, 3.02862548828125, 3.16650390625, 3.30438232421875, 3.4422607421875, 3.58013916015625, 3.718017578125, 3.85589599609375, 3.9937744140625, 4.13165283203125, 4.26953125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 9.0, 15.0, 20.0, 18.0, 24.0, 34.0, 39.0, 45.0, 66.0, 61.0, 101.0, 166.0, 246.0, 463.0, 1235.0, 3965.0, 16964.0, 87073.0, 456102.0, 1490283.0, 1542397.0, 476715.0, 92908.0, 18325.0, 4209.0, 1309.0, 545.0, 297.0, 150.0, 99.0, 77.0, 54.0, 48.0, 32.0, 31.0, 19.0, 23.0, 24.0, 13.0, 8.0, 17.0, 14.0, 5.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0], "bins": [-8.40625, -8.16619873046875, -7.9261474609375, -7.68609619140625, -7.446044921875, -7.20599365234375, -6.9659423828125, -6.72589111328125, -6.48583984375, -6.24578857421875, -6.0057373046875, -5.76568603515625, -5.525634765625, -5.28558349609375, -5.0455322265625, -4.80548095703125, -4.5654296875, -4.32537841796875, -4.0853271484375, -3.84527587890625, -3.605224609375, -3.36517333984375, -3.1251220703125, -2.88507080078125, -2.64501953125, -2.40496826171875, -2.1649169921875, -1.92486572265625, -1.684814453125, -1.44476318359375, -1.2047119140625, -0.96466064453125, -0.724609375, -0.48455810546875, -0.2445068359375, -0.00445556640625, 0.235595703125, 0.47564697265625, 0.7156982421875, 0.95574951171875, 1.19580078125, 1.43585205078125, 1.6759033203125, 1.91595458984375, 2.156005859375, 2.39605712890625, 2.6361083984375, 2.87615966796875, 3.1162109375, 3.35626220703125, 3.5963134765625, 3.83636474609375, 4.076416015625, 4.31646728515625, 4.5565185546875, 4.79656982421875, 5.03662109375, 5.27667236328125, 5.5167236328125, 5.75677490234375, 5.996826171875, 6.23687744140625, 6.4769287109375, 6.71697998046875, 6.95703125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 6.0, 8.0, 7.0, 9.0, 17.0, 42.0, 45.0, 53.0, 82.0, 97.0, 170.0, 204.0, 286.0, 352.0, 430.0, 455.0, 421.0, 354.0, 263.0, 193.0, 141.0, 116.0, 94.0, 61.0, 48.0, 32.0, 25.0, 20.0, 19.0, 9.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.6732177734375, -8.346435546875, -8.0196533203125, -7.69287109375, -7.3660888671875, -7.039306640625, -6.7125244140625, -6.3857421875, -6.0589599609375, -5.732177734375, -5.4053955078125, -5.07861328125, -4.7518310546875, -4.425048828125, -4.0982666015625, -3.771484375, -3.4447021484375, -3.117919921875, -2.7911376953125, -2.46435546875, -2.1375732421875, -1.810791015625, -1.4840087890625, -1.1572265625, -0.8304443359375, -0.503662109375, -0.1768798828125, 0.14990234375, 0.4766845703125, 0.803466796875, 1.1302490234375, 1.45703125, 1.7838134765625, 2.110595703125, 2.4373779296875, 2.76416015625, 3.0909423828125, 3.417724609375, 3.7445068359375, 4.0712890625, 4.3980712890625, 4.724853515625, 5.0516357421875, 5.37841796875, 5.7052001953125, 6.031982421875, 6.3587646484375, 6.685546875, 7.0123291015625, 7.339111328125, 7.6658935546875, 7.99267578125, 8.3194580078125, 8.646240234375, 8.9730224609375, 9.2998046875, 9.6265869140625, 9.953369140625, 10.2801513671875, 10.60693359375, 10.9337158203125, 11.260498046875, 11.5872802734375, 11.9140625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 1.0, 8.0, 11.0, 13.0, 20.0, 25.0, 33.0, 54.0, 67.0, 91.0, 135.0, 155.0, 266.0, 482.0, 2109.0, 728974.0, 3452449.0, 7716.0, 653.0, 323.0, 202.0, 169.0, 88.0, 65.0, 53.0, 39.0, 33.0, 12.0, 14.0, 8.0, 5.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.6875, -54.18896484375, -52.6904296875, -51.19189453125, -49.693359375, -48.19482421875, -46.6962890625, -45.19775390625, -43.69921875, -42.20068359375, -40.7021484375, -39.20361328125, -37.705078125, -36.20654296875, -34.7080078125, -33.20947265625, -31.7109375, -30.21240234375, -28.7138671875, -27.21533203125, -25.716796875, -24.21826171875, -22.7197265625, -21.22119140625, -19.72265625, -18.22412109375, -16.7255859375, -15.22705078125, -13.728515625, -12.22998046875, -10.7314453125, -9.23291015625, -7.734375, -6.23583984375, -4.7373046875, -3.23876953125, -1.740234375, -0.24169921875, 1.2568359375, 2.75537109375, 4.25390625, 5.75244140625, 7.2509765625, 8.74951171875, 10.248046875, 11.74658203125, 13.2451171875, 14.74365234375, 16.2421875, 17.74072265625, 19.2392578125, 20.73779296875, 22.236328125, 23.73486328125, 25.2333984375, 26.73193359375, 28.23046875, 29.72900390625, 31.2275390625, 32.72607421875, 34.224609375, 35.72314453125, 37.2216796875, 38.72021484375, 40.21875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 2.0, 23.0, 68.0, 176.0, 226.0, 272.0, 157.0, 71.0, 15.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.012392044067383, -27.58333969116211, -24.154285430908203, -20.725231170654297, -17.296178817749023, -13.867124557495117, -10.438072204589844, -7.00901985168457, -3.579965591430664, -0.15091228485107422, 3.2781410217285156, 6.7071943283081055, 10.136247634887695, 13.565301895141602, 16.994354248046875, 20.42340660095215, 23.852460861206055, 27.281513214111328, 30.710567474365234, 34.13962173461914, 37.56867218017578, 40.99772644042969, 44.426780700683594, 47.8558349609375, 51.284889221191406, 54.71394348144531, 58.14299774169922, 61.57204818725586, 65.0010986328125, 68.43016052246094, 71.85920715332031, 75.28826141357422, 78.71731567382812, 82.14636993408203, 85.57542419433594, 89.00447845458984, 92.43353271484375, 95.86257934570312, 99.29163360595703, 102.72068786621094, 106.14974212646484, 109.57879638671875, 113.00785064697266, 116.43690490722656, 119.86595153808594, 123.29501342773438, 126.72406005859375, 130.15310668945312, 133.58216857910156, 137.01121520996094, 140.44027709960938, 143.86932373046875, 147.2983856201172, 150.72743225097656, 154.156494140625, 157.58554077148438, 161.01458740234375, 164.44363403320312, 167.87269592285156, 171.30174255371094, 174.73080444335938, 178.15985107421875, 181.5889129638672, 185.01795959472656, 188.447021484375]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 7.0, 7.0, 9.0, 14.0, 20.0, 27.0, 28.0, 24.0, 30.0, 42.0, 34.0, 37.0, 46.0, 35.0, 36.0, 44.0, 38.0, 43.0, 36.0, 44.0, 42.0, 40.0, 43.0, 29.0, 27.0, 31.0, 27.0, 21.0, 22.0, 16.0, 9.0, 14.0, 11.0, 11.0, 10.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-31.871028900146484, -30.838356018066406, -29.805683135986328, -28.773008346557617, -27.74033546447754, -26.70766258239746, -25.67498779296875, -24.642314910888672, -23.609642028808594, -22.576969146728516, -21.544296264648438, -20.511621475219727, -19.47894859313965, -18.44627571105957, -17.41360092163086, -16.38092803955078, -15.348255157470703, -14.315582275390625, -13.28290843963623, -12.250234603881836, -11.217561721801758, -10.18488883972168, -9.152215003967285, -8.11954116821289, -7.0868682861328125, -6.054194927215576, -5.02152156829834, -3.9888482093811035, -2.956174850463867, -1.9235014915466309, -0.8908281326293945, 0.1418452262878418, 1.1745147705078125, 2.207188129425049, 3.239861488342285, 4.2725348472595215, 5.305208206176758, 6.337881565093994, 7.3705549240112305, 8.403228759765625, 9.435901641845703, 10.468574523925781, 11.501248359680176, 12.53392219543457, 13.566595077514648, 14.599267959594727, 15.631941795349121, 16.664615631103516, 17.697288513183594, 18.729961395263672, 19.76263427734375, 20.79530906677246, 21.82798194885254, 22.860654830932617, 23.893329620361328, 24.926002502441406, 25.958675384521484, 26.991348266601562, 28.02402114868164, 29.05669593811035, 30.08936882019043, 31.122041702270508, 32.15471649169922, 33.1873893737793, 34.220062255859375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 14.0, 7.0, 6.0, 13.0, 8.0, 10.0, 18.0, 33.0, 19.0, 33.0, 34.0, 30.0, 36.0, 28.0, 40.0, 37.0, 33.0, 39.0, 46.0, 42.0, 34.0, 36.0, 34.0, 39.0, 35.0, 32.0, 26.0, 26.0, 29.0, 12.0, 22.0, 24.0, 17.0, 18.0, 17.0, 11.0, 5.0, 10.0, 8.0, 6.0, 9.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.1953125, -4.0614013671875, -3.927490234375, -3.7935791015625, -3.65966796875, -3.5257568359375, -3.391845703125, -3.2579345703125, -3.1240234375, -2.9901123046875, -2.856201171875, -2.7222900390625, -2.58837890625, -2.4544677734375, -2.320556640625, -2.1866455078125, -2.052734375, -1.9188232421875, -1.784912109375, -1.6510009765625, -1.51708984375, -1.3831787109375, -1.249267578125, -1.1153564453125, -0.9814453125, -0.8475341796875, -0.713623046875, -0.5797119140625, -0.44580078125, -0.3118896484375, -0.177978515625, -0.0440673828125, 0.08984375, 0.2237548828125, 0.357666015625, 0.4915771484375, 0.62548828125, 0.7593994140625, 0.893310546875, 1.0272216796875, 1.1611328125, 1.2950439453125, 1.428955078125, 1.5628662109375, 1.69677734375, 1.8306884765625, 1.964599609375, 2.0985107421875, 2.232421875, 2.3663330078125, 2.500244140625, 2.6341552734375, 2.76806640625, 2.9019775390625, 3.035888671875, 3.1697998046875, 3.3037109375, 3.4376220703125, 3.571533203125, 3.7054443359375, 3.83935546875, 3.9732666015625, 4.107177734375, 4.2410888671875, 4.375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 8.0, 14.0, 30.0, 39.0, 54.0, 92.0, 145.0, 277.0, 449.0, 785.0, 1285.0, 2350.0, 4147.0, 7665.0, 14107.0, 25844.0, 46984.0, 83674.0, 142252.0, 206321.0, 201103.0, 134555.0, 78822.0, 44074.0, 24191.0, 13046.0, 7267.0, 3863.0, 2166.0, 1223.0, 728.0, 449.0, 224.0, 120.0, 81.0, 51.0, 24.0, 21.0, 15.0, 7.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4079551696777344, -0.39281463623046875, -0.3776741027832031, -0.3625335693359375, -0.3473930358886719, -0.33225250244140625, -0.3171119689941406, -0.301971435546875, -0.2868309020996094, -0.27169036865234375, -0.2565498352050781, -0.2414093017578125, -0.22626876831054688, -0.21112823486328125, -0.19598770141601562, -0.18084716796875, -0.16570663452148438, -0.15056610107421875, -0.13542556762695312, -0.1202850341796875, -0.10514450073242188, -0.09000396728515625, -0.07486343383789062, -0.059722900390625, -0.044582366943359375, -0.02944183349609375, -0.014301300048828125, 0.0008392333984375, 0.015979766845703125, 0.03112030029296875, 0.046260833740234375, 0.0614013671875, 0.07654190063476562, 0.09168243408203125, 0.10682296752929688, 0.1219635009765625, 0.13710403442382812, 0.15224456787109375, 0.16738510131835938, 0.182525634765625, 0.19766616821289062, 0.21280670166015625, 0.22794723510742188, 0.2430877685546875, 0.2582283020019531, 0.27336883544921875, 0.2885093688964844, 0.30364990234375, 0.3187904357910156, 0.33393096923828125, 0.3490715026855469, 0.3642120361328125, 0.3793525695800781, 0.39449310302734375, 0.4096336364746094, 0.424774169921875, 0.4399147033691406, 0.45505523681640625, 0.4701957702636719, 0.4853363037109375, 0.5004768371582031, 0.5156173706054688, 0.5307579040527344, 0.5458984375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 5.0, 12.0, 13.0, 21.0, 16.0, 19.0, 26.0, 28.0, 33.0, 26.0, 26.0, 33.0, 25.0, 38.0, 35.0, 31.0, 45.0, 1067.0, 46.0, 35.0, 47.0, 26.0, 35.0, 28.0, 38.0, 35.0, 36.0, 26.0, 27.0, 14.0, 17.0, 15.0, 12.0, 15.0, 12.0, 7.0, 5.0, 5.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-2.802734375, -2.717987060546875, -2.63323974609375, -2.548492431640625, -2.4637451171875, -2.378997802734375, -2.29425048828125, -2.209503173828125, -2.124755859375, -2.040008544921875, -1.95526123046875, -1.870513916015625, -1.7857666015625, -1.701019287109375, -1.61627197265625, -1.531524658203125, -1.44677734375, -1.362030029296875, -1.27728271484375, -1.192535400390625, -1.1077880859375, -1.023040771484375, -0.93829345703125, -0.853546142578125, -0.768798828125, -0.684051513671875, -0.59930419921875, -0.514556884765625, -0.4298095703125, -0.345062255859375, -0.26031494140625, -0.175567626953125, -0.0908203125, -0.006072998046875, 0.07867431640625, 0.163421630859375, 0.2481689453125, 0.332916259765625, 0.41766357421875, 0.502410888671875, 0.587158203125, 0.671905517578125, 0.75665283203125, 0.841400146484375, 0.9261474609375, 1.010894775390625, 1.09564208984375, 1.180389404296875, 1.26513671875, 1.349884033203125, 1.43463134765625, 1.519378662109375, 1.6041259765625, 1.688873291015625, 1.77362060546875, 1.858367919921875, 1.943115234375, 2.027862548828125, 2.11260986328125, 2.197357177734375, 2.2821044921875, 2.366851806640625, 2.45159912109375, 2.536346435546875, 2.62109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 14.0, 20.0, 24.0, 30.0, 52.0, 81.0, 107.0, 172.0, 261.0, 406.0, 611.0, 924.0, 1556.0, 2582.0, 3837.0, 6195.0, 9693.0, 15166.0, 23795.0, 36420.0, 55390.0, 80799.0, 111520.0, 158696.0, 1166933.0, 128113.0, 96285.0, 68311.0, 45907.0, 29906.0, 19248.0, 12317.0, 7908.0, 5040.0, 3154.0, 1988.0, 1302.0, 857.0, 528.0, 339.0, 246.0, 156.0, 96.0, 61.0, 31.0, 19.0, 14.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2174072265625, -0.21045494079589844, -0.20350265502929688, -0.1965503692626953, -0.18959808349609375, -0.1826457977294922, -0.17569351196289062, -0.16874122619628906, -0.1617889404296875, -0.15483665466308594, -0.14788436889648438, -0.1409320831298828, -0.13397979736328125, -0.1270275115966797, -0.12007522583007812, -0.11312294006347656, -0.106170654296875, -0.09921836853027344, -0.09226608276367188, -0.08531379699707031, -0.07836151123046875, -0.07140922546386719, -0.06445693969726562, -0.05750465393066406, -0.0505523681640625, -0.04360008239746094, -0.036647796630859375, -0.029695510864257812, -0.02274322509765625, -0.015790939331054688, -0.008838653564453125, -0.0018863677978515625, 0.00506591796875, 0.012018203735351562, 0.018970489501953125, 0.025922775268554688, 0.03287506103515625, 0.03982734680175781, 0.046779632568359375, 0.05373191833496094, 0.0606842041015625, 0.06763648986816406, 0.07458877563476562, 0.08154106140136719, 0.08849334716796875, 0.09544563293457031, 0.10239791870117188, 0.10935020446777344, 0.116302490234375, 0.12325477600097656, 0.13020706176757812, 0.1371593475341797, 0.14411163330078125, 0.1510639190673828, 0.15801620483398438, 0.16496849060058594, 0.1719207763671875, 0.17887306213378906, 0.18582534790039062, 0.1927776336669922, 0.19972991943359375, 0.2066822052001953, 0.21363449096679688, 0.22058677673339844, 0.2275390625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 6.0, 10.0, 6.0, 15.0, 29.0, 16.0, 49.0, 80.0, 95.0, 191.0, 147.0, 100.0, 74.0, 46.0, 30.0, 26.0, 20.0, 13.0, 7.0, 5.0, 3.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.02484130859375, -0.024167537689208984, -0.02349376678466797, -0.022819995880126953, -0.022146224975585938, -0.021472454071044922, -0.020798683166503906, -0.02012491226196289, -0.019451141357421875, -0.01877737045288086, -0.018103599548339844, -0.017429828643798828, -0.016756057739257812, -0.016082286834716797, -0.015408515930175781, -0.014734745025634766, -0.01406097412109375, -0.013387203216552734, -0.012713432312011719, -0.012039661407470703, -0.011365890502929688, -0.010692119598388672, -0.010018348693847656, -0.00934457778930664, -0.008670806884765625, -0.00799703598022461, -0.007323265075683594, -0.006649494171142578, -0.0059757232666015625, -0.005301952362060547, -0.004628181457519531, -0.003954410552978516, -0.0032806396484375, -0.0026068687438964844, -0.0019330978393554688, -0.0012593269348144531, -0.0005855560302734375, 8.821487426757812e-05, 0.0007619857788085938, 0.0014357566833496094, 0.002109527587890625, 0.0027832984924316406, 0.0034570693969726562, 0.004130840301513672, 0.0048046112060546875, 0.005478382110595703, 0.006152153015136719, 0.006825923919677734, 0.00749969482421875, 0.008173465728759766, 0.008847236633300781, 0.009521007537841797, 0.010194778442382812, 0.010868549346923828, 0.011542320251464844, 0.01221609115600586, 0.012889862060546875, 0.01356363296508789, 0.014237403869628906, 0.014911174774169922, 0.015584945678710938, 0.016258716583251953, 0.01693248748779297, 0.017606258392333984, 0.018280029296875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 9.0, 7.0, 12.0, 15.0, 33.0, 31.0, 47.0, 94.0, 181.0, 414.0, 16598.0, 1029443.0, 1129.0, 240.0, 105.0, 50.0, 36.0, 35.0, 9.0, 14.0, 8.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385986328125, -0.3718299865722656, -0.35767364501953125, -0.3435173034667969, -0.3293609619140625, -0.3152046203613281, -0.30104827880859375, -0.2868919372558594, -0.272735595703125, -0.2585792541503906, -0.24442291259765625, -0.23026657104492188, -0.2161102294921875, -0.20195388793945312, -0.18779754638671875, -0.17364120483398438, -0.15948486328125, -0.14532852172851562, -0.13117218017578125, -0.11701583862304688, -0.1028594970703125, -0.08870315551757812, -0.07454681396484375, -0.060390472412109375, -0.046234130859375, -0.032077789306640625, -0.01792144775390625, -0.003765106201171875, 0.0103912353515625, 0.024547576904296875, 0.03870391845703125, 0.052860260009765625, 0.0670166015625, 0.08117294311523438, 0.09532928466796875, 0.10948562622070312, 0.1236419677734375, 0.13779830932617188, 0.15195465087890625, 0.16611099243164062, 0.180267333984375, 0.19442367553710938, 0.20858001708984375, 0.22273635864257812, 0.2368927001953125, 0.2510490417480469, 0.26520538330078125, 0.2793617248535156, 0.29351806640625, 0.3076744079589844, 0.32183074951171875, 0.3359870910644531, 0.3501434326171875, 0.3642997741699219, 0.37845611572265625, 0.3926124572753906, 0.406768798828125, 0.4209251403808594, 0.43508148193359375, 0.4492378234863281, 0.4633941650390625, 0.4775505065917969, 0.49170684814453125, 0.5058631896972656, 0.52001953125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 148.0, 767.0, 84.0, 9.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13448819518089294, -0.12989123165607452, -0.1252942681312561, -0.12069730460643768, -0.11610034853219986, -0.11150338500738144, -0.10690642148256302, -0.1023094654083252, -0.09771250188350677, -0.09311553835868835, -0.08851857483386993, -0.08392161130905151, -0.07932465523481369, -0.07472769170999527, -0.07013072818517685, -0.06553377211093903, -0.06093680113554001, -0.05633983761072159, -0.051742877811193466, -0.047145914286375046, -0.042548954486846924, -0.0379519909620285, -0.03335502743721008, -0.02875806763768196, -0.02416110411286354, -0.01956414245069027, -0.014967179857194424, -0.010370217263698578, -0.005773255601525307, -0.0011762939393520355, 0.003420669585466385, 0.008017629384994507, 0.012614592909812927, 0.0172115545719862, 0.02180851623415947, 0.02640547975897789, 0.03100244142115116, 0.03559940308332443, 0.04019636660814285, 0.044793326407670975, 0.049390289932489395, 0.053987253457307816, 0.05858421325683594, 0.06318117678165436, 0.06777814030647278, 0.0723751038312912, 0.07697206735610962, 0.08156902343034744, 0.08616598695516586, 0.09076295047998428, 0.0953599140048027, 0.09995687007904053, 0.10455383360385895, 0.10915079712867737, 0.11374776065349579, 0.11834472417831421, 0.12294168770313263, 0.12753865122795105, 0.13213561475276947, 0.1367325782775879, 0.1413295418024063, 0.14592650532722473, 0.15052345395088196, 0.15512041747570038, 0.1597173810005188]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 7.0, 8.0, 10.0, 13.0, 18.0, 18.0, 18.0, 19.0, 22.0, 36.0, 29.0, 43.0, 41.0, 44.0, 37.0, 33.0, 35.0, 25.0, 46.0, 39.0, 52.0, 27.0, 41.0, 28.0, 37.0, 28.0, 30.0, 23.0, 25.0, 28.0, 21.0, 24.0, 16.0, 11.0, 11.0, 12.0, 10.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.018322348594665527, -0.017755262553691864, -0.0171881765127182, -0.016621090471744537, -0.016054004430770874, -0.01548691838979721, -0.014919832348823547, -0.014352746307849884, -0.01378566026687622, -0.013218574225902557, -0.012651488184928894, -0.01208440214395523, -0.011517316102981567, -0.010950230062007904, -0.01038314402103424, -0.009816057980060577, -0.009248971939086914, -0.00868188589811325, -0.008114799857139587, -0.007547713816165924, -0.006980627775192261, -0.006413541734218597, -0.005846455693244934, -0.005279369652271271, -0.004712283611297607, -0.004145197570323944, -0.0035781115293502808, -0.0030110254883766174, -0.002443939447402954, -0.0018768534064292908, -0.0013097673654556274, -0.0007426813244819641, -0.00017559528350830078, 0.00039149075746536255, 0.0009585767984390259, 0.0015256628394126892, 0.0020927488803863525, 0.002659834921360016, 0.003226920962333679, 0.0037940070033073425, 0.004361093044281006, 0.004928179085254669, 0.0054952651262283325, 0.006062351167201996, 0.006629437208175659, 0.0071965232491493225, 0.007763609290122986, 0.00833069533109665, 0.008897781372070312, 0.009464867413043976, 0.01003195345401764, 0.010599039494991302, 0.011166125535964966, 0.01173321157693863, 0.012300297617912292, 0.012867383658885956, 0.01343446969985962, 0.014001555740833282, 0.014568641781806946, 0.015135727822780609, 0.015702813863754272, 0.016269899904727936, 0.0168369859457016, 0.017404071986675262, 0.017971158027648926]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 14.0, 7.0, 6.0, 13.0, 8.0, 10.0, 18.0, 33.0, 19.0, 33.0, 34.0, 30.0, 36.0, 28.0, 40.0, 37.0, 33.0, 39.0, 46.0, 42.0, 34.0, 36.0, 34.0, 39.0, 34.0, 33.0, 26.0, 26.0, 29.0, 12.0, 22.0, 24.0, 17.0, 19.0, 16.0, 11.0, 5.0, 10.0, 8.0, 6.0, 9.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.1953125, -4.0614013671875, -3.927490234375, -3.7935791015625, -3.65966796875, -3.5257568359375, -3.391845703125, -3.2579345703125, -3.1240234375, -2.9901123046875, -2.856201171875, -2.7222900390625, -2.58837890625, -2.4544677734375, -2.320556640625, -2.1866455078125, -2.052734375, -1.9188232421875, -1.784912109375, -1.6510009765625, -1.51708984375, -1.3831787109375, -1.249267578125, -1.1153564453125, -0.9814453125, -0.8475341796875, -0.713623046875, -0.5797119140625, -0.44580078125, -0.3118896484375, -0.177978515625, -0.0440673828125, 0.08984375, 0.2237548828125, 0.357666015625, 0.4915771484375, 0.62548828125, 0.7593994140625, 0.893310546875, 1.0272216796875, 1.1611328125, 1.2950439453125, 1.428955078125, 1.5628662109375, 1.69677734375, 1.8306884765625, 1.964599609375, 2.0985107421875, 2.232421875, 2.3663330078125, 2.500244140625, 2.6341552734375, 2.76806640625, 2.9019775390625, 3.035888671875, 3.1697998046875, 3.3037109375, 3.4376220703125, 3.571533203125, 3.7054443359375, 3.83935546875, 3.9732666015625, 4.107177734375, 4.2410888671875, 4.375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 1.0, 6.0, 5.0, 3.0, 9.0, 11.0, 4.0, 16.0, 18.0, 25.0, 22.0, 42.0, 56.0, 112.0, 150.0, 276.0, 536.0, 993.0, 1945.0, 3637.0, 6929.0, 13291.0, 26094.0, 54982.0, 129452.0, 321754.0, 280590.0, 111304.0, 48075.0, 22947.0, 11870.0, 6181.0, 3355.0, 1789.0, 856.0, 508.0, 277.0, 152.0, 89.0, 45.0, 43.0, 25.0, 14.0, 14.0, 11.0, 12.0, 9.0, 5.0, 4.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.625, -4.47039794921875, -4.3157958984375, -4.16119384765625, -4.006591796875, -3.85198974609375, -3.6973876953125, -3.54278564453125, -3.38818359375, -3.23358154296875, -3.0789794921875, -2.92437744140625, -2.769775390625, -2.61517333984375, -2.4605712890625, -2.30596923828125, -2.1513671875, -1.99676513671875, -1.8421630859375, -1.68756103515625, -1.532958984375, -1.37835693359375, -1.2237548828125, -1.06915283203125, -0.91455078125, -0.75994873046875, -0.6053466796875, -0.45074462890625, -0.296142578125, -0.14154052734375, 0.0130615234375, 0.16766357421875, 0.322265625, 0.47686767578125, 0.6314697265625, 0.78607177734375, 0.940673828125, 1.09527587890625, 1.2498779296875, 1.40447998046875, 1.55908203125, 1.71368408203125, 1.8682861328125, 2.02288818359375, 2.177490234375, 2.33209228515625, 2.4866943359375, 2.64129638671875, 2.7958984375, 2.95050048828125, 3.1051025390625, 3.25970458984375, 3.414306640625, 3.56890869140625, 3.7235107421875, 3.87811279296875, 4.03271484375, 4.18731689453125, 4.3419189453125, 4.49652099609375, 4.651123046875, 4.80572509765625, 4.9603271484375, 5.11492919921875, 5.26953125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 2.0, 5.0, 5.0, 6.0, 9.0, 12.0, 12.0, 25.0, 21.0, 23.0, 34.0, 22.0, 30.0, 36.0, 34.0, 46.0, 47.0, 70.0, 108.0, 180.0, 1365.0, 328.0, 150.0, 74.0, 57.0, 37.0, 36.0, 40.0, 37.0, 32.0, 22.0, 15.0, 14.0, 23.0, 9.0, 13.0, 14.0, 8.0, 9.0, 9.0, 6.0, 4.0, 4.0, 2.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0], "bins": [-17.78125, -17.257568359375, -16.73388671875, -16.210205078125, -15.6865234375, -15.162841796875, -14.63916015625, -14.115478515625, -13.591796875, -13.068115234375, -12.54443359375, -12.020751953125, -11.4970703125, -10.973388671875, -10.44970703125, -9.926025390625, -9.40234375, -8.878662109375, -8.35498046875, -7.831298828125, -7.3076171875, -6.783935546875, -6.26025390625, -5.736572265625, -5.212890625, -4.689208984375, -4.16552734375, -3.641845703125, -3.1181640625, -2.594482421875, -2.07080078125, -1.547119140625, -1.0234375, -0.499755859375, 0.02392578125, 0.547607421875, 1.0712890625, 1.594970703125, 2.11865234375, 2.642333984375, 3.166015625, 3.689697265625, 4.21337890625, 4.737060546875, 5.2607421875, 5.784423828125, 6.30810546875, 6.831787109375, 7.35546875, 7.879150390625, 8.40283203125, 8.926513671875, 9.4501953125, 9.973876953125, 10.49755859375, 11.021240234375, 11.544921875, 12.068603515625, 12.59228515625, 13.115966796875, 13.6396484375, 14.163330078125, 14.68701171875, 15.210693359375, 15.734375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 11.0, 11.0, 13.0, 9.0, 18.0, 23.0, 25.0, 25.0, 36.0, 53.0, 58.0, 70.0, 104.0, 178.0, 206.0, 285.0, 641.0, 2216.0, 67227.0, 3038876.0, 32137.0, 1681.0, 548.0, 339.0, 217.0, 153.0, 109.0, 99.0, 58.0, 63.0, 40.0, 27.0, 28.0, 23.0, 15.0, 16.0, 9.0, 9.0, 9.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-42.84375, -41.5224609375, -40.201171875, -38.8798828125, -37.55859375, -36.2373046875, -34.916015625, -33.5947265625, -32.2734375, -30.9521484375, -29.630859375, -28.3095703125, -26.98828125, -25.6669921875, -24.345703125, -23.0244140625, -21.703125, -20.3818359375, -19.060546875, -17.7392578125, -16.41796875, -15.0966796875, -13.775390625, -12.4541015625, -11.1328125, -9.8115234375, -8.490234375, -7.1689453125, -5.84765625, -4.5263671875, -3.205078125, -1.8837890625, -0.5625, 0.7587890625, 2.080078125, 3.4013671875, 4.72265625, 6.0439453125, 7.365234375, 8.6865234375, 10.0078125, 11.3291015625, 12.650390625, 13.9716796875, 15.29296875, 16.6142578125, 17.935546875, 19.2568359375, 20.578125, 21.8994140625, 23.220703125, 24.5419921875, 25.86328125, 27.1845703125, 28.505859375, 29.8271484375, 31.1484375, 32.4697265625, 33.791015625, 35.1123046875, 36.43359375, 37.7548828125, 39.076171875, 40.3974609375, 41.71875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 73.0, 237.0, 401.0, 234.0, 53.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-138.49945068359375, -135.95594787597656, -133.4124298095703, -130.86892700195312, -128.32542419433594, -125.78190612792969, -123.2384033203125, -120.69489288330078, -118.15138244628906, -115.60787200927734, -113.06436920166016, -110.52085876464844, -107.97734832763672, -105.433837890625, -102.89033508300781, -100.3468246459961, -97.80331420898438, -95.25980377197266, -92.71630096435547, -90.17279052734375, -87.62928009033203, -85.08576965332031, -82.54226684570312, -79.9987564086914, -77.45525360107422, -74.9117431640625, -72.36824035644531, -69.8247299194336, -67.28121948242188, -64.73770904541016, -62.19420623779297, -59.65069580078125, -57.10718536376953, -54.56367874145508, -52.02016830444336, -49.476661682128906, -46.93315124511719, -44.389644622802734, -41.84613800048828, -39.30262756347656, -36.759117126464844, -34.21561050415039, -31.672100067138672, -29.12859344482422, -26.5850830078125, -24.041576385498047, -21.49806785583496, -18.954559326171875, -16.411052703857422, -13.867544174194336, -11.32403564453125, -8.78052806854248, -6.2370195388793945, -3.6935110092163086, -1.150003433227539, 1.3935050964355469, 3.937013626098633, 6.480522155761719, 9.024030685424805, 11.567538261413574, 14.11104679107666, 16.654556274414062, 19.198062896728516, 21.7415714263916, 24.285079956054688]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 11.0, 8.0, 6.0, 8.0, 12.0, 15.0, 9.0, 17.0, 16.0, 18.0, 20.0, 22.0, 32.0, 21.0, 29.0, 29.0, 35.0, 38.0, 36.0, 38.0, 39.0, 47.0, 42.0, 44.0, 39.0, 49.0, 36.0, 34.0, 28.0, 27.0, 26.0, 25.0, 22.0, 24.0, 19.0, 23.0, 12.0, 8.0, 6.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-42.71039581298828, -41.401756286621094, -40.09312057495117, -38.784481048583984, -37.4758415222168, -36.167205810546875, -34.85856628417969, -33.5499267578125, -32.24128723144531, -30.932649612426758, -29.62401008605957, -28.315372467041016, -27.006732940673828, -25.698095321655273, -24.38945770263672, -23.08081817626953, -21.77218246459961, -20.463544845581055, -19.154905319213867, -17.846267700195312, -16.537628173828125, -15.22899055480957, -13.920352935791016, -12.611714363098145, -11.303075790405273, -9.994437217712402, -8.685798645019531, -7.377161026000977, -6.0685224533081055, -4.759883880615234, -3.4512457847595215, -2.1426076889038086, -0.8339653015136719, 0.4746730327606201, 1.783311367034912, 3.091949701309204, 4.400588035583496, 5.709226608276367, 7.01786470413208, 8.326502799987793, 9.635141372680664, 10.943779945373535, 12.252418518066406, 13.561056137084961, 14.869694709777832, 16.178333282470703, 17.486970901489258, 18.795608520507812, 20.104248046875, 21.412885665893555, 22.721525192260742, 24.030162811279297, 25.338802337646484, 26.64743995666504, 27.956077575683594, 29.26471710205078, 30.573354721069336, 31.88199234008789, 33.19063186645508, 34.499271392822266, 35.80790710449219, 37.116546630859375, 38.42518615722656, 39.733821868896484, 41.04246139526367]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 7.0, 4.0, 4.0, 5.0, 2.0, 7.0, 6.0, 11.0, 9.0, 11.0, 18.0, 18.0, 23.0, 22.0, 24.0, 35.0, 35.0, 28.0, 22.0, 37.0, 37.0, 46.0, 32.0, 49.0, 34.0, 39.0, 40.0, 33.0, 36.0, 35.0, 42.0, 36.0, 23.0, 23.0, 25.0, 23.0, 20.0, 17.0, 5.0, 20.0, 9.0, 10.0, 13.0, 10.0, 8.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.51953125, -4.37078857421875, -4.2220458984375, -4.07330322265625, -3.924560546875, -3.77581787109375, -3.6270751953125, -3.47833251953125, -3.32958984375, -3.18084716796875, -3.0321044921875, -2.88336181640625, -2.734619140625, -2.58587646484375, -2.4371337890625, -2.28839111328125, -2.1396484375, -1.99090576171875, -1.8421630859375, -1.69342041015625, -1.544677734375, -1.39593505859375, -1.2471923828125, -1.09844970703125, -0.94970703125, -0.80096435546875, -0.6522216796875, -0.50347900390625, -0.354736328125, -0.20599365234375, -0.0572509765625, 0.09149169921875, 0.240234375, 0.38897705078125, 0.5377197265625, 0.68646240234375, 0.835205078125, 0.98394775390625, 1.1326904296875, 1.28143310546875, 1.43017578125, 1.57891845703125, 1.7276611328125, 1.87640380859375, 2.025146484375, 2.17388916015625, 2.3226318359375, 2.47137451171875, 2.6201171875, 2.76885986328125, 2.9176025390625, 3.06634521484375, 3.215087890625, 3.36383056640625, 3.5125732421875, 3.66131591796875, 3.81005859375, 3.95880126953125, 4.1075439453125, 4.25628662109375, 4.405029296875, 4.55377197265625, 4.7025146484375, 4.85125732421875, 5.0]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 8.0, 4.0, 2.0, 5.0, 6.0, 9.0, 12.0, 6.0, 18.0, 21.0, 29.0, 35.0, 41.0, 58.0, 71.0, 96.0, 147.0, 213.0, 461.0, 1121.0, 5107.0, 33516.0, 280062.0, 1642308.0, 1834850.0, 345809.0, 41326.0, 6208.0, 1327.0, 548.0, 241.0, 166.0, 111.0, 79.0, 55.0, 44.0, 42.0, 34.0, 27.0, 9.0, 16.0, 8.0, 11.0, 4.0, 7.0, 4.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.54638671875, -9.2177734375, -8.88916015625, -8.560546875, -8.23193359375, -7.9033203125, -7.57470703125, -7.24609375, -6.91748046875, -6.5888671875, -6.26025390625, -5.931640625, -5.60302734375, -5.2744140625, -4.94580078125, -4.6171875, -4.28857421875, -3.9599609375, -3.63134765625, -3.302734375, -2.97412109375, -2.6455078125, -2.31689453125, -1.98828125, -1.65966796875, -1.3310546875, -1.00244140625, -0.673828125, -0.34521484375, -0.0166015625, 0.31201171875, 0.640625, 0.96923828125, 1.2978515625, 1.62646484375, 1.955078125, 2.28369140625, 2.6123046875, 2.94091796875, 3.26953125, 3.59814453125, 3.9267578125, 4.25537109375, 4.583984375, 4.91259765625, 5.2412109375, 5.56982421875, 5.8984375, 6.22705078125, 6.5556640625, 6.88427734375, 7.212890625, 7.54150390625, 7.8701171875, 8.19873046875, 8.52734375, 8.85595703125, 9.1845703125, 9.51318359375, 9.841796875, 10.17041015625, 10.4990234375, 10.82763671875, 11.15625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 11.0, 12.0, 22.0, 27.0, 31.0, 44.0, 55.0, 83.0, 118.0, 152.0, 201.0, 287.0, 359.0, 394.0, 421.0, 415.0, 316.0, 254.0, 220.0, 148.0, 119.0, 86.0, 85.0, 60.0, 42.0, 19.0, 20.0, 18.0, 13.0, 8.0, 4.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.7265625, -8.420654296875, -8.11474609375, -7.808837890625, -7.5029296875, -7.197021484375, -6.89111328125, -6.585205078125, -6.279296875, -5.973388671875, -5.66748046875, -5.361572265625, -5.0556640625, -4.749755859375, -4.44384765625, -4.137939453125, -3.83203125, -3.526123046875, -3.22021484375, -2.914306640625, -2.6083984375, -2.302490234375, -1.99658203125, -1.690673828125, -1.384765625, -1.078857421875, -0.77294921875, -0.467041015625, -0.1611328125, 0.144775390625, 0.45068359375, 0.756591796875, 1.0625, 1.368408203125, 1.67431640625, 1.980224609375, 2.2861328125, 2.592041015625, 2.89794921875, 3.203857421875, 3.509765625, 3.815673828125, 4.12158203125, 4.427490234375, 4.7333984375, 5.039306640625, 5.34521484375, 5.651123046875, 5.95703125, 6.262939453125, 6.56884765625, 6.874755859375, 7.1806640625, 7.486572265625, 7.79248046875, 8.098388671875, 8.404296875, 8.710205078125, 9.01611328125, 9.322021484375, 9.6279296875, 9.933837890625, 10.23974609375, 10.545654296875, 10.8515625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 10.0, 6.0, 9.0, 7.0, 24.0, 18.0, 28.0, 41.0, 61.0, 87.0, 103.0, 124.0, 191.0, 312.0, 427.0, 1999.0, 291717.0, 3863411.0, 33586.0, 894.0, 402.0, 252.0, 173.0, 114.0, 75.0, 54.0, 40.0, 29.0, 27.0, 20.0, 12.0, 5.0, 11.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.03125, -48.65380859375, -47.2763671875, -45.89892578125, -44.521484375, -43.14404296875, -41.7666015625, -40.38916015625, -39.01171875, -37.63427734375, -36.2568359375, -34.87939453125, -33.501953125, -32.12451171875, -30.7470703125, -29.36962890625, -27.9921875, -26.61474609375, -25.2373046875, -23.85986328125, -22.482421875, -21.10498046875, -19.7275390625, -18.35009765625, -16.97265625, -15.59521484375, -14.2177734375, -12.84033203125, -11.462890625, -10.08544921875, -8.7080078125, -7.33056640625, -5.953125, -4.57568359375, -3.1982421875, -1.82080078125, -0.443359375, 0.93408203125, 2.3115234375, 3.68896484375, 5.06640625, 6.44384765625, 7.8212890625, 9.19873046875, 10.576171875, 11.95361328125, 13.3310546875, 14.70849609375, 16.0859375, 17.46337890625, 18.8408203125, 20.21826171875, 21.595703125, 22.97314453125, 24.3505859375, 25.72802734375, 27.10546875, 28.48291015625, 29.8603515625, 31.23779296875, 32.615234375, 33.99267578125, 35.3701171875, 36.74755859375, 38.125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 15.0, 48.0, 219.0, 342.0, 255.0, 109.0, 23.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.34267044067383, -35.22692108154297, -31.11117172241211, -26.99542236328125, -22.87967300415039, -18.76392364501953, -14.648174285888672, -10.532424926757812, -6.416675567626953, -2.3009262084960938, 1.8148231506347656, 5.930572509765625, 10.046321868896484, 14.162071228027344, 18.277820587158203, 22.393569946289062, 26.509319305419922, 30.62506866455078, 34.74081802368164, 38.8565673828125, 42.97231674194336, 47.08806610107422, 51.20381546020508, 55.31956481933594, 59.4353141784668, 63.551063537597656, 67.66680908203125, 71.78256225585938, 75.8983154296875, 80.0140609741211, 84.12980651855469, 88.24555969238281, 92.36129760742188, 96.47705078125, 100.5927963256836, 104.70854187011719, 108.82429504394531, 112.94004821777344, 117.05579376220703, 121.17153930664062, 125.28729248046875, 129.40304565429688, 133.518798828125, 137.63453674316406, 141.7502899169922, 145.8660430908203, 149.98178100585938, 154.0975341796875, 158.21328735351562, 162.32904052734375, 166.44479370117188, 170.56053161621094, 174.67628479003906, 178.7920379638672, 182.90777587890625, 187.02352905273438, 191.1392822265625, 195.25503540039062, 199.37078857421875, 203.4865264892578, 207.60227966308594, 211.71803283691406, 215.83377075195312, 219.94952392578125, 224.06527709960938]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 7.0, 6.0, 8.0, 11.0, 13.0, 6.0, 16.0, 16.0, 28.0, 18.0, 30.0, 34.0, 34.0, 41.0, 45.0, 47.0, 46.0, 44.0, 44.0, 45.0, 36.0, 39.0, 56.0, 34.0, 52.0, 38.0, 29.0, 25.0, 25.0, 22.0, 12.0, 9.0, 17.0, 13.0, 14.0, 8.0, 6.0, 5.0, 3.0, 4.0, 1.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-39.37056350708008, -38.268489837646484, -37.166419982910156, -36.06434631347656, -34.962276458740234, -33.86020278930664, -32.75813293457031, -31.65605926513672, -30.55398941040039, -29.45191764831543, -28.34984588623047, -27.247774124145508, -26.145702362060547, -25.043630599975586, -23.941558837890625, -22.83948516845703, -21.73741340637207, -20.63534164428711, -19.53326988220215, -18.431198120117188, -17.329126358032227, -16.227054595947266, -15.124981880187988, -14.022910118103027, -12.920838356018066, -11.818766593933105, -10.716694831848145, -9.614622116088867, -8.512550354003906, -7.4104790687561035, -6.308406829833984, -5.206335067749023, -4.104265213012695, -3.0021934509277344, -1.9001214504241943, -0.7980494499206543, 0.30402231216430664, 1.4060940742492676, 2.5081663131713867, 3.6102380752563477, 4.712309837341309, 5.8143815994262695, 6.9164533615112305, 8.018526077270508, 9.120597839355469, 10.22266960144043, 11.32474136352539, 12.426813125610352, 13.528884887695312, 14.630956649780273, 15.733028411865234, 16.835100173950195, 17.937171936035156, 19.039243698120117, 20.141315460205078, 21.243389129638672, 22.345458984375, 23.44753074645996, 24.549602508544922, 25.651674270629883, 26.753746032714844, 27.855817794799805, 28.957889556884766, 30.05996322631836, 31.16203498840332]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 11.0, 7.0, 14.0, 9.0, 13.0, 12.0, 21.0, 19.0, 27.0, 30.0, 17.0, 34.0, 31.0, 41.0, 51.0, 35.0, 38.0, 32.0, 38.0, 40.0, 38.0, 34.0, 33.0, 39.0, 35.0, 30.0, 35.0, 18.0, 22.0, 29.0, 16.0, 16.0, 20.0, 17.0, 17.0, 14.0, 14.0, 8.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.5234375, -4.38616943359375, -4.2489013671875, -4.11163330078125, -3.974365234375, -3.83709716796875, -3.6998291015625, -3.56256103515625, -3.42529296875, -3.28802490234375, -3.1507568359375, -3.01348876953125, -2.876220703125, -2.73895263671875, -2.6016845703125, -2.46441650390625, -2.3271484375, -2.18988037109375, -2.0526123046875, -1.91534423828125, -1.778076171875, -1.64080810546875, -1.5035400390625, -1.36627197265625, -1.22900390625, -1.09173583984375, -0.9544677734375, -0.81719970703125, -0.679931640625, -0.54266357421875, -0.4053955078125, -0.26812744140625, -0.130859375, 0.00640869140625, 0.1436767578125, 0.28094482421875, 0.418212890625, 0.55548095703125, 0.6927490234375, 0.83001708984375, 0.96728515625, 1.10455322265625, 1.2418212890625, 1.37908935546875, 1.516357421875, 1.65362548828125, 1.7908935546875, 1.92816162109375, 2.0654296875, 2.20269775390625, 2.3399658203125, 2.47723388671875, 2.614501953125, 2.75177001953125, 2.8890380859375, 3.02630615234375, 3.16357421875, 3.30084228515625, 3.4381103515625, 3.57537841796875, 3.712646484375, 3.84991455078125, 3.9871826171875, 4.12445068359375, 4.26171875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 11.0, 21.0, 36.0, 45.0, 65.0, 99.0, 158.0, 217.0, 351.0, 518.0, 720.0, 1110.0, 1687.0, 2569.0, 3788.0, 5757.0, 8482.0, 13247.0, 19846.0, 29773.0, 43902.0, 64292.0, 90019.0, 118933.0, 141856.0, 136766.0, 110005.0, 81061.0, 56303.0, 39087.0, 26132.0, 17449.0, 11571.0, 7580.0, 5007.0, 3358.0, 2209.0, 1485.0, 979.0, 646.0, 455.0, 340.0, 182.0, 140.0, 94.0, 65.0, 54.0, 31.0, 23.0, 14.0, 11.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.317626953125, -0.3076515197753906, -0.29767608642578125, -0.2877006530761719, -0.2777252197265625, -0.2677497863769531, -0.25777435302734375, -0.24779891967773438, -0.237823486328125, -0.22784805297851562, -0.21787261962890625, -0.20789718627929688, -0.1979217529296875, -0.18794631958007812, -0.17797088623046875, -0.16799545288085938, -0.15802001953125, -0.14804458618164062, -0.13806915283203125, -0.12809371948242188, -0.1181182861328125, -0.10814285278320312, -0.09816741943359375, -0.08819198608398438, -0.078216552734375, -0.06824111938476562, -0.05826568603515625, -0.048290252685546875, -0.0383148193359375, -0.028339385986328125, -0.01836395263671875, -0.008388519287109375, 0.0015869140625, 0.011562347412109375, 0.02153778076171875, 0.031513214111328125, 0.0414886474609375, 0.051464080810546875, 0.06143951416015625, 0.07141494750976562, 0.081390380859375, 0.09136581420898438, 0.10134124755859375, 0.11131668090820312, 0.1212921142578125, 0.13126754760742188, 0.14124298095703125, 0.15121841430664062, 0.16119384765625, 0.17116928100585938, 0.18114471435546875, 0.19112014770507812, 0.2010955810546875, 0.21107101440429688, 0.22104644775390625, 0.23102188110351562, 0.240997314453125, 0.2509727478027344, 0.26094818115234375, 0.2709236145019531, 0.2808990478515625, 0.2908744812011719, 0.30084991455078125, 0.3108253479003906, 0.32080078125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 3.0, 2.0, 5.0, 8.0, 11.0, 10.0, 14.0, 21.0, 21.0, 15.0, 29.0, 25.0, 32.0, 37.0, 27.0, 51.0, 36.0, 30.0, 49.0, 36.0, 1073.0, 36.0, 37.0, 40.0, 52.0, 33.0, 40.0, 34.0, 37.0, 37.0, 20.0, 27.0, 20.0, 12.0, 10.0, 18.0, 10.0, 8.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.375, -3.27471923828125, -3.1744384765625, -3.07415771484375, -2.973876953125, -2.87359619140625, -2.7733154296875, -2.67303466796875, -2.57275390625, -2.47247314453125, -2.3721923828125, -2.27191162109375, -2.171630859375, -2.07135009765625, -1.9710693359375, -1.87078857421875, -1.7705078125, -1.67022705078125, -1.5699462890625, -1.46966552734375, -1.369384765625, -1.26910400390625, -1.1688232421875, -1.06854248046875, -0.96826171875, -0.86798095703125, -0.7677001953125, -0.66741943359375, -0.567138671875, -0.46685791015625, -0.3665771484375, -0.26629638671875, -0.166015625, -0.06573486328125, 0.0345458984375, 0.13482666015625, 0.235107421875, 0.33538818359375, 0.4356689453125, 0.53594970703125, 0.63623046875, 0.73651123046875, 0.8367919921875, 0.93707275390625, 1.037353515625, 1.13763427734375, 1.2379150390625, 1.33819580078125, 1.4384765625, 1.53875732421875, 1.6390380859375, 1.73931884765625, 1.839599609375, 1.93988037109375, 2.0401611328125, 2.14044189453125, 2.24072265625, 2.34100341796875, 2.4412841796875, 2.54156494140625, 2.641845703125, 2.74212646484375, 2.8424072265625, 2.94268798828125, 3.04296875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 13.0, 17.0, 30.0, 44.0, 77.0, 105.0, 147.0, 250.0, 356.0, 557.0, 862.0, 1378.0, 2347.0, 3566.0, 6102.0, 9971.0, 16446.0, 27133.0, 43556.0, 68035.0, 100949.0, 137262.0, 1197059.0, 154237.0, 113740.0, 78207.0, 51573.0, 32146.0, 19779.0, 12027.0, 7403.0, 4446.0, 2697.0, 1691.0, 1080.0, 631.0, 428.0, 268.0, 175.0, 123.0, 65.0, 54.0, 29.0, 22.0, 18.0, 10.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.27392578125, -0.26602745056152344, -0.2581291198730469, -0.2502307891845703, -0.24233245849609375, -0.2344341278076172, -0.22653579711914062, -0.21863746643066406, -0.2107391357421875, -0.20284080505371094, -0.19494247436523438, -0.1870441436767578, -0.17914581298828125, -0.1712474822998047, -0.16334915161132812, -0.15545082092285156, -0.147552490234375, -0.13965415954589844, -0.13175582885742188, -0.12385749816894531, -0.11595916748046875, -0.10806083679199219, -0.10016250610351562, -0.09226417541503906, -0.0843658447265625, -0.07646751403808594, -0.06856918334960938, -0.06067085266113281, -0.05277252197265625, -0.04487419128417969, -0.036975860595703125, -0.029077529907226562, -0.02117919921875, -0.013280868530273438, -0.005382537841796875, 0.0025157928466796875, 0.01041412353515625, 0.018312454223632812, 0.026210784912109375, 0.03410911560058594, 0.0420074462890625, 0.04990577697753906, 0.057804107666015625, 0.06570243835449219, 0.07360076904296875, 0.08149909973144531, 0.08939743041992188, 0.09729576110839844, 0.105194091796875, 0.11309242248535156, 0.12099075317382812, 0.1288890838623047, 0.13678741455078125, 0.1446857452392578, 0.15258407592773438, 0.16048240661621094, 0.1683807373046875, 0.17627906799316406, 0.18417739868164062, 0.1920757293701172, 0.19997406005859375, 0.2078723907470703, 0.21577072143554688, 0.22366905212402344, 0.2315673828125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 3.0, 6.0, 5.0, 8.0, 10.0, 10.0, 14.0, 22.0, 40.0, 58.0, 82.0, 137.0, 204.0, 153.0, 68.0, 46.0, 34.0, 15.0, 16.0, 16.0, 14.0, 11.0, 5.0, 4.0, 2.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.0160980224609375, -0.015568971633911133, -0.015039920806884766, -0.014510869979858398, -0.013981819152832031, -0.013452768325805664, -0.012923717498779297, -0.01239466667175293, -0.011865615844726562, -0.011336565017700195, -0.010807514190673828, -0.010278463363647461, -0.009749412536621094, -0.009220361709594727, -0.00869131088256836, -0.008162260055541992, -0.007633209228515625, -0.007104158401489258, -0.006575107574462891, -0.0060460567474365234, -0.005517005920410156, -0.004987955093383789, -0.004458904266357422, -0.003929853439331055, -0.0034008026123046875, -0.0028717517852783203, -0.002342700958251953, -0.001813650131225586, -0.0012845993041992188, -0.0007555484771728516, -0.00022649765014648438, 0.0003025531768798828, 0.00083160400390625, 0.0013606548309326172, 0.0018897056579589844, 0.0024187564849853516, 0.0029478073120117188, 0.003476858139038086, 0.004005908966064453, 0.00453495979309082, 0.0050640106201171875, 0.005593061447143555, 0.006122112274169922, 0.006651163101196289, 0.007180213928222656, 0.0077092647552490234, 0.00823831558227539, 0.008767366409301758, 0.009296417236328125, 0.009825468063354492, 0.01035451889038086, 0.010883569717407227, 0.011412620544433594, 0.011941671371459961, 0.012470722198486328, 0.012999773025512695, 0.013528823852539062, 0.01405787467956543, 0.014586925506591797, 0.015115976333618164, 0.01564502716064453, 0.0161740779876709, 0.016703128814697266, 0.017232179641723633, 0.01776123046875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 9.0, 3.0, 5.0, 9.0, 12.0, 14.0, 20.0, 33.0, 42.0, 72.0, 126.0, 235.0, 2259.0, 1038911.0, 6124.0, 314.0, 138.0, 81.0, 44.0, 29.0, 13.0, 15.0, 14.0, 7.0, 7.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388916015625, -0.3773345947265625, -0.365753173828125, -0.3541717529296875, -0.34259033203125, -0.3310089111328125, -0.319427490234375, -0.3078460693359375, -0.2962646484375, -0.2846832275390625, -0.273101806640625, -0.2615203857421875, -0.24993896484375, -0.2383575439453125, -0.226776123046875, -0.2151947021484375, -0.20361328125, -0.1920318603515625, -0.180450439453125, -0.1688690185546875, -0.15728759765625, -0.1457061767578125, -0.134124755859375, -0.1225433349609375, -0.1109619140625, -0.0993804931640625, -0.087799072265625, -0.0762176513671875, -0.06463623046875, -0.0530548095703125, -0.041473388671875, -0.0298919677734375, -0.018310546875, -0.0067291259765625, 0.004852294921875, 0.0164337158203125, 0.02801513671875, 0.0395965576171875, 0.051177978515625, 0.0627593994140625, 0.0743408203125, 0.0859222412109375, 0.097503662109375, 0.1090850830078125, 0.12066650390625, 0.1322479248046875, 0.143829345703125, 0.1554107666015625, 0.1669921875, 0.1785736083984375, 0.190155029296875, 0.2017364501953125, 0.21331787109375, 0.2248992919921875, 0.236480712890625, 0.2480621337890625, 0.2596435546875, 0.2712249755859375, 0.282806396484375, 0.2943878173828125, 0.30596923828125, 0.3175506591796875, 0.329132080078125, 0.3407135009765625, 0.352294921875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 23.0, 53.0, 147.0, 287.0, 263.0, 106.0, 58.0, 28.0, 12.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013879046775400639, -0.013049098663032055, -0.012219149619340897, -0.011389201506972313, -0.01055925339460373, -0.009729305282235146, -0.008899357169866562, -0.008069408126175404, -0.00723946001380682, -0.006409511901438236, -0.005579563323408365, -0.004749614745378494, -0.003919666633009911, -0.003089718520641327, -0.002259769942611456, -0.001429821364581585, -0.0005998732522130013, 0.00023007509298622608, 0.0010600234381854534, 0.0018899717833846807, 0.002719920128583908, 0.0035498682409524918, 0.004379816818982363, 0.005209765397012234, 0.006039713509380817, 0.006869661621749401, 0.007699610199779272, 0.008529558777809143, 0.009359506890177727, 0.01018945500254631, 0.011019403114914894, 0.011849352158606052, 0.01267930120229721, 0.013509249314665794, 0.014339197427034378, 0.015169146470725536, 0.015999093651771545, 0.01682904362678528, 0.017658991739153862, 0.018488939851522446, 0.01931888796389103, 0.020148836076259613, 0.020978784188628197, 0.02180873230099678, 0.022638682276010513, 0.023468628525733948, 0.02429857850074768, 0.025128526613116264, 0.025958474725484848, 0.02678842283785343, 0.027618370950222015, 0.0284483190625906, 0.029278267174959183, 0.030108217149972916, 0.0309381652623415, 0.03176811337471008, 0.032598063349723816, 0.03342801332473755, 0.03425795957446098, 0.035087909549474716, 0.03591785579919815, 0.036747805774211884, 0.03757775202393532, 0.03840770199894905, 0.039237648248672485]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 7.0, 12.0, 9.0, 4.0, 12.0, 10.0, 18.0, 21.0, 19.0, 29.0, 25.0, 32.0, 27.0, 41.0, 34.0, 41.0, 40.0, 47.0, 49.0, 38.0, 41.0, 38.0, 50.0, 44.0, 40.0, 32.0, 32.0, 26.0, 31.0, 23.0, 22.0, 15.0, 21.0, 15.0, 15.0, 12.0, 5.0, 5.0, 4.0, 8.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0110853910446167, -0.010772244073450565, -0.010459097102284431, -0.010145950131118298, -0.009832803159952164, -0.00951965618878603, -0.009206509217619896, -0.008893362246453762, -0.008580215275287628, -0.008267068304121494, -0.00795392133295536, -0.0076407743617892265, -0.007327627390623093, -0.007014480419456959, -0.006701333448290825, -0.006388186477124691, -0.006075039505958557, -0.005761892534792423, -0.005448745563626289, -0.0051355985924601555, -0.004822451621294022, -0.004509304650127888, -0.004196157678961754, -0.00388301070779562, -0.003569863736629486, -0.003256716765463352, -0.0029435697942972183, -0.0026304228231310844, -0.0023172758519649506, -0.0020041288807988167, -0.0016909819096326828, -0.001377834938466549, -0.001064687967300415, -0.0007515409961342812, -0.0004383940249681473, -0.0001252470538020134, 0.00018789991736412048, 0.0005010468885302544, 0.0008141938596963882, 0.0011273408308625221, 0.001440487802028656, 0.0017536347731947899, 0.0020667817443609238, 0.0023799287155270576, 0.0026930756866931915, 0.0030062226578593254, 0.0033193696290254593, 0.003632516600191593, 0.003945663571357727, 0.004258810542523861, 0.004571957513689995, 0.004885104484856129, 0.005198251456022263, 0.0055113984271883965, 0.00582454539835453, 0.006137692369520664, 0.006450839340686798, 0.006763986311852932, 0.007077133283019066, 0.0073902802541852, 0.007703427225351334, 0.008016574196517467, 0.008329721167683601, 0.008642868138849735, 0.00895601511001587]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 11.0, 7.0, 14.0, 9.0, 13.0, 12.0, 21.0, 19.0, 27.0, 30.0, 17.0, 34.0, 31.0, 41.0, 51.0, 35.0, 38.0, 32.0, 38.0, 40.0, 38.0, 34.0, 33.0, 39.0, 35.0, 30.0, 35.0, 18.0, 23.0, 28.0, 16.0, 16.0, 20.0, 17.0, 17.0, 14.0, 14.0, 8.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.5234375, -4.38616943359375, -4.2489013671875, -4.11163330078125, -3.974365234375, -3.83709716796875, -3.6998291015625, -3.56256103515625, -3.42529296875, -3.28802490234375, -3.1507568359375, -3.01348876953125, -2.876220703125, -2.73895263671875, -2.6016845703125, -2.46441650390625, -2.3271484375, -2.18988037109375, -2.0526123046875, -1.91534423828125, -1.778076171875, -1.64080810546875, -1.5035400390625, -1.36627197265625, -1.22900390625, -1.09173583984375, -0.9544677734375, -0.81719970703125, -0.679931640625, -0.54266357421875, -0.4053955078125, -0.26812744140625, -0.130859375, 0.00640869140625, 0.1436767578125, 0.28094482421875, 0.418212890625, 0.55548095703125, 0.6927490234375, 0.83001708984375, 0.96728515625, 1.10455322265625, 1.2418212890625, 1.37908935546875, 1.516357421875, 1.65362548828125, 1.7908935546875, 1.92816162109375, 2.0654296875, 2.20269775390625, 2.3399658203125, 2.47723388671875, 2.614501953125, 2.75177001953125, 2.8890380859375, 3.02630615234375, 3.16357421875, 3.30084228515625, 3.4381103515625, 3.57537841796875, 3.712646484375, 3.84991455078125, 3.9871826171875, 4.12445068359375, 4.26171875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 8.0, 13.0, 9.0, 15.0, 20.0, 22.0, 27.0, 37.0, 35.0, 57.0, 96.0, 101.0, 208.0, 356.0, 708.0, 1402.0, 2826.0, 5679.0, 11365.0, 22525.0, 44231.0, 88072.0, 181195.0, 313182.0, 190361.0, 92132.0, 46044.0, 23736.0, 12092.0, 5854.0, 2962.0, 1390.0, 703.0, 364.0, 217.0, 121.0, 94.0, 48.0, 50.0, 35.0, 39.0, 25.0, 19.0, 19.0, 13.0, 9.0, 7.0, 6.0, 3.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.73828125, -4.5880126953125, -4.437744140625, -4.2874755859375, -4.13720703125, -3.9869384765625, -3.836669921875, -3.6864013671875, -3.5361328125, -3.3858642578125, -3.235595703125, -3.0853271484375, -2.93505859375, -2.7847900390625, -2.634521484375, -2.4842529296875, -2.333984375, -2.1837158203125, -2.033447265625, -1.8831787109375, -1.73291015625, -1.5826416015625, -1.432373046875, -1.2821044921875, -1.1318359375, -0.9815673828125, -0.831298828125, -0.6810302734375, -0.53076171875, -0.3804931640625, -0.230224609375, -0.0799560546875, 0.0703125, 0.2205810546875, 0.370849609375, 0.5211181640625, 0.67138671875, 0.8216552734375, 0.971923828125, 1.1221923828125, 1.2724609375, 1.4227294921875, 1.572998046875, 1.7232666015625, 1.87353515625, 2.0238037109375, 2.174072265625, 2.3243408203125, 2.474609375, 2.6248779296875, 2.775146484375, 2.9254150390625, 3.07568359375, 3.2259521484375, 3.376220703125, 3.5264892578125, 3.6767578125, 3.8270263671875, 3.977294921875, 4.1275634765625, 4.27783203125, 4.4281005859375, 4.578369140625, 4.7286376953125, 4.87890625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 9.0, 16.0, 14.0, 13.0, 21.0, 26.0, 35.0, 42.0, 36.0, 43.0, 61.0, 62.0, 59.0, 126.0, 322.0, 1443.0, 221.0, 110.0, 51.0, 43.0, 43.0, 30.0, 27.0, 36.0, 28.0, 20.0, 23.0, 11.0, 17.0, 8.0, 12.0, 11.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.25, -18.688720703125, -18.12744140625, -17.566162109375, -17.0048828125, -16.443603515625, -15.88232421875, -15.321044921875, -14.759765625, -14.198486328125, -13.63720703125, -13.075927734375, -12.5146484375, -11.953369140625, -11.39208984375, -10.830810546875, -10.26953125, -9.708251953125, -9.14697265625, -8.585693359375, -8.0244140625, -7.463134765625, -6.90185546875, -6.340576171875, -5.779296875, -5.218017578125, -4.65673828125, -4.095458984375, -3.5341796875, -2.972900390625, -2.41162109375, -1.850341796875, -1.2890625, -0.727783203125, -0.16650390625, 0.394775390625, 0.9560546875, 1.517333984375, 2.07861328125, 2.639892578125, 3.201171875, 3.762451171875, 4.32373046875, 4.885009765625, 5.4462890625, 6.007568359375, 6.56884765625, 7.130126953125, 7.69140625, 8.252685546875, 8.81396484375, 9.375244140625, 9.9365234375, 10.497802734375, 11.05908203125, 11.620361328125, 12.181640625, 12.742919921875, 13.30419921875, 13.865478515625, 14.4267578125, 14.988037109375, 15.54931640625, 16.110595703125, 16.671875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 6.0, 5.0, 9.0, 7.0, 12.0, 6.0, 9.0, 18.0, 13.0, 20.0, 33.0, 31.0, 46.0, 75.0, 88.0, 127.0, 216.0, 332.0, 660.0, 1555.0, 21384.0, 3084204.0, 33225.0, 1816.0, 706.0, 343.0, 221.0, 125.0, 94.0, 76.0, 53.0, 42.0, 32.0, 23.0, 13.0, 15.0, 11.0, 13.0, 9.0, 9.0, 4.0, 3.0, 6.0, 5.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-53.59375, -51.94677734375, -50.2998046875, -48.65283203125, -47.005859375, -45.35888671875, -43.7119140625, -42.06494140625, -40.41796875, -38.77099609375, -37.1240234375, -35.47705078125, -33.830078125, -32.18310546875, -30.5361328125, -28.88916015625, -27.2421875, -25.59521484375, -23.9482421875, -22.30126953125, -20.654296875, -19.00732421875, -17.3603515625, -15.71337890625, -14.06640625, -12.41943359375, -10.7724609375, -9.12548828125, -7.478515625, -5.83154296875, -4.1845703125, -2.53759765625, -0.890625, 0.75634765625, 2.4033203125, 4.05029296875, 5.697265625, 7.34423828125, 8.9912109375, 10.63818359375, 12.28515625, 13.93212890625, 15.5791015625, 17.22607421875, 18.873046875, 20.52001953125, 22.1669921875, 23.81396484375, 25.4609375, 27.10791015625, 28.7548828125, 30.40185546875, 32.048828125, 33.69580078125, 35.3427734375, 36.98974609375, 38.63671875, 40.28369140625, 41.9306640625, 43.57763671875, 45.224609375, 46.87158203125, 48.5185546875, 50.16552734375, 51.8125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 194.0, 659.0, 156.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.0184631347656, -262.2860107421875, -257.5535888671875, -252.82115173339844, -248.08871459960938, -243.3562774658203, -238.62384033203125, -233.89138793945312, -229.15896606445312, -224.42652893066406, -219.694091796875, -214.96165466308594, -210.22921752929688, -205.4967803955078, -200.76434326171875, -196.03189086914062, -191.29945373535156, -186.5670166015625, -181.83457946777344, -177.10214233398438, -172.3697052001953, -167.63726806640625, -162.9048309326172, -158.17239379882812, -153.43994140625, -148.70750427246094, -143.97506713867188, -139.2426300048828, -134.51019287109375, -129.7777557373047, -125.0453109741211, -120.31287384033203, -115.58045196533203, -110.84801483154297, -106.1155776977539, -101.38314056396484, -96.65069580078125, -91.91825866699219, -87.18582153320312, -82.45338439941406, -77.720947265625, -72.98851013183594, -68.25607299804688, -63.52363204956055, -58.791194915771484, -54.05875778198242, -49.326316833496094, -44.59387969970703, -39.86144256591797, -35.129005432128906, -30.39656639099121, -25.664127349853516, -20.931690216064453, -16.19925308227539, -11.466814041137695, -6.734375, -2.0019378662109375, 2.7305002212524414, 7.46293830871582, 12.1953763961792, 16.927814483642578, 21.66025161743164, 26.392690658569336, 31.12512969970703, 35.857566833496094]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 11.0, 7.0, 7.0, 14.0, 17.0, 17.0, 27.0, 18.0, 14.0, 29.0, 25.0, 26.0, 29.0, 39.0, 36.0, 29.0, 30.0, 47.0, 38.0, 33.0, 45.0, 32.0, 38.0, 38.0, 37.0, 39.0, 38.0, 32.0, 31.0, 26.0, 23.0, 24.0, 17.0, 13.0, 11.0, 13.0, 6.0, 9.0, 9.0, 3.0, 2.0, 5.0, 4.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.434974670410156, -35.29469680786133, -34.154422760009766, -33.01414489746094, -31.873868942260742, -30.733592987060547, -29.59331512451172, -28.453039169311523, -27.312763214111328, -26.172487258911133, -25.032211303710938, -23.89193344116211, -22.751657485961914, -21.61138153076172, -20.47110366821289, -19.330827713012695, -18.1905517578125, -17.050275802612305, -15.909998893737793, -14.769721984863281, -13.629446029663086, -12.48917007446289, -11.348893165588379, -10.208616256713867, -9.068340301513672, -7.928063869476318, -6.787787437438965, -5.647511005401611, -4.507234573364258, -3.3669581413269043, -2.226681709289551, -1.0864052772521973, 0.053867340087890625, 1.1941437721252441, 2.3344202041625977, 3.474696636199951, 4.614973068237305, 5.755249500274658, 6.895525932312012, 8.035802841186523, 9.176078796386719, 10.316354751586914, 11.456631660461426, 12.596908569335938, 13.737184524536133, 14.877460479736328, 16.017738342285156, 17.15801429748535, 18.298290252685547, 19.438566207885742, 20.578842163085938, 21.719120025634766, 22.85939598083496, 23.999671936035156, 25.139949798583984, 26.28022575378418, 27.420501708984375, 28.56077766418457, 29.701053619384766, 30.841331481933594, 31.98160743713379, 33.121883392333984, 34.26216125488281, 35.402435302734375, 36.5427131652832]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 8.0, 7.0, 14.0, 20.0, 14.0, 16.0, 26.0, 18.0, 24.0, 19.0, 22.0, 33.0, 36.0, 39.0, 43.0, 41.0, 38.0, 35.0, 44.0, 38.0, 37.0, 36.0, 30.0, 28.0, 31.0, 32.0, 37.0, 25.0, 16.0, 22.0, 16.0, 21.0, 18.0, 26.0, 14.0, 14.0, 6.0, 8.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.6571044921875, -4.505615234375, -4.3541259765625, -4.20263671875, -4.0511474609375, -3.899658203125, -3.7481689453125, -3.5966796875, -3.4451904296875, -3.293701171875, -3.1422119140625, -2.99072265625, -2.8392333984375, -2.687744140625, -2.5362548828125, -2.384765625, -2.2332763671875, -2.081787109375, -1.9302978515625, -1.77880859375, -1.6273193359375, -1.475830078125, -1.3243408203125, -1.1728515625, -1.0213623046875, -0.869873046875, -0.7183837890625, -0.56689453125, -0.4154052734375, -0.263916015625, -0.1124267578125, 0.0390625, 0.1905517578125, 0.342041015625, 0.4935302734375, 0.64501953125, 0.7965087890625, 0.947998046875, 1.0994873046875, 1.2509765625, 1.4024658203125, 1.553955078125, 1.7054443359375, 1.85693359375, 2.0084228515625, 2.159912109375, 2.3114013671875, 2.462890625, 2.6143798828125, 2.765869140625, 2.9173583984375, 3.06884765625, 3.2203369140625, 3.371826171875, 3.5233154296875, 3.6748046875, 3.8262939453125, 3.977783203125, 4.1292724609375, 4.28076171875, 4.4322509765625, 4.583740234375, 4.7352294921875, 4.88671875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 4.0, 4.0, 2.0, 3.0, 3.0, 5.0, 12.0, 14.0, 13.0, 21.0, 34.0, 26.0, 34.0, 46.0, 56.0, 77.0, 118.0, 223.0, 430.0, 1611.0, 10394.0, 107764.0, 1132988.0, 2448448.0, 446867.0, 38781.0, 4509.0, 880.0, 346.0, 149.0, 94.0, 59.0, 48.0, 46.0, 33.0, 26.0, 23.0, 31.0, 14.0, 11.0, 7.0, 6.0, 4.0, 4.0, 7.0, 1.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.2415771484375, -11.850341796875, -11.4591064453125, -11.06787109375, -10.6766357421875, -10.285400390625, -9.8941650390625, -9.5029296875, -9.1116943359375, -8.720458984375, -8.3292236328125, -7.93798828125, -7.5467529296875, -7.155517578125, -6.7642822265625, -6.373046875, -5.9818115234375, -5.590576171875, -5.1993408203125, -4.80810546875, -4.4168701171875, -4.025634765625, -3.6343994140625, -3.2431640625, -2.8519287109375, -2.460693359375, -2.0694580078125, -1.67822265625, -1.2869873046875, -0.895751953125, -0.5045166015625, -0.11328125, 0.2779541015625, 0.669189453125, 1.0604248046875, 1.45166015625, 1.8428955078125, 2.234130859375, 2.6253662109375, 3.0166015625, 3.4078369140625, 3.799072265625, 4.1903076171875, 4.58154296875, 4.9727783203125, 5.364013671875, 5.7552490234375, 6.146484375, 6.5377197265625, 6.928955078125, 7.3201904296875, 7.71142578125, 8.1026611328125, 8.493896484375, 8.8851318359375, 9.2763671875, 9.6676025390625, 10.058837890625, 10.4500732421875, 10.84130859375, 11.2325439453125, 11.623779296875, 12.0150146484375, 12.40625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 7.0, 8.0, 15.0, 18.0, 32.0, 33.0, 42.0, 51.0, 95.0, 125.0, 191.0, 269.0, 369.0, 453.0, 520.0, 475.0, 408.0, 295.0, 208.0, 150.0, 100.0, 56.0, 41.0, 36.0, 25.0, 9.0, 8.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.703125, -8.3359375, -7.96875, -7.6015625, -7.234375, -6.8671875, -6.5, -6.1328125, -5.765625, -5.3984375, -5.03125, -4.6640625, -4.296875, -3.9296875, -3.5625, -3.1953125, -2.828125, -2.4609375, -2.09375, -1.7265625, -1.359375, -0.9921875, -0.625, -0.2578125, 0.109375, 0.4765625, 0.84375, 1.2109375, 1.578125, 1.9453125, 2.3125, 2.6796875, 3.046875, 3.4140625, 3.78125, 4.1484375, 4.515625, 4.8828125, 5.25, 5.6171875, 5.984375, 6.3515625, 6.71875, 7.0859375, 7.453125, 7.8203125, 8.1875, 8.5546875, 8.921875, 9.2890625, 9.65625, 10.0234375, 10.390625, 10.7578125, 11.125, 11.4921875, 11.859375, 12.2265625, 12.59375, 12.9609375, 13.328125, 13.6953125, 14.0625, 14.4296875, 14.796875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 0.0, 7.0, 9.0, 10.0, 12.0, 17.0, 31.0, 40.0, 53.0, 81.0, 140.0, 207.0, 385.0, 765.0, 16533.0, 4120184.0, 53708.0, 929.0, 440.0, 251.0, 147.0, 108.0, 50.0, 40.0, 49.0, 22.0, 18.0, 18.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-81.8125, -79.8447265625, -77.876953125, -75.9091796875, -73.94140625, -71.9736328125, -70.005859375, -68.0380859375, -66.0703125, -64.1025390625, -62.134765625, -60.1669921875, -58.19921875, -56.2314453125, -54.263671875, -52.2958984375, -50.328125, -48.3603515625, -46.392578125, -44.4248046875, -42.45703125, -40.4892578125, -38.521484375, -36.5537109375, -34.5859375, -32.6181640625, -30.650390625, -28.6826171875, -26.71484375, -24.7470703125, -22.779296875, -20.8115234375, -18.84375, -16.8759765625, -14.908203125, -12.9404296875, -10.97265625, -9.0048828125, -7.037109375, -5.0693359375, -3.1015625, -1.1337890625, 0.833984375, 2.8017578125, 4.76953125, 6.7373046875, 8.705078125, 10.6728515625, 12.640625, 14.6083984375, 16.576171875, 18.5439453125, 20.51171875, 22.4794921875, 24.447265625, 26.4150390625, 28.3828125, 30.3505859375, 32.318359375, 34.2861328125, 36.25390625, 38.2216796875, 40.189453125, 42.1572265625, 44.125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 19.0, 155.0, 367.0, 343.0, 117.0, 12.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.86396026611328, -34.873046875, -29.882137298583984, -24.891225814819336, -19.900314331054688, -14.909402847290039, -9.91849136352539, -4.927581787109375, 0.06333160400390625, 5.054243087768555, 10.045154571533203, 15.036066055297852, 20.0269775390625, 25.01788902282715, 30.008800506591797, 34.99971008300781, 39.990623474121094, 44.981536865234375, 49.97244644165039, 54.963356018066406, 59.95426940917969, 64.94518280029297, 69.93609619140625, 74.927001953125, 79.91791534423828, 84.90882873535156, 89.89973449707031, 94.8906478881836, 99.88156127929688, 104.87247467041016, 109.86338806152344, 114.85429382324219, 119.84521484375, 124.83612823486328, 129.82704162597656, 134.8179473876953, 139.80886840820312, 144.79977416992188, 149.79067993164062, 154.78158569335938, 159.7725067138672, 164.76341247558594, 169.75433349609375, 174.7452392578125, 179.73614501953125, 184.72706604003906, 189.7179718017578, 194.70889282226562, 199.69979858398438, 204.69070434570312, 209.68162536621094, 214.6725311279297, 219.6634521484375, 224.65435791015625, 229.645263671875, 234.63616943359375, 239.62709045410156, 244.6179962158203, 249.60891723632812, 254.59982299804688, 259.5907287597656, 264.5816345214844, 269.57257080078125, 274.5634765625, 279.55438232421875]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 6.0, 7.0, 10.0, 15.0, 19.0, 12.0, 22.0, 17.0, 27.0, 24.0, 32.0, 20.0, 39.0, 35.0, 41.0, 61.0, 35.0, 43.0, 45.0, 38.0, 29.0, 38.0, 43.0, 50.0, 36.0, 33.0, 40.0, 25.0, 25.0, 17.0, 19.0, 19.0, 18.0, 9.0, 10.0, 11.0, 8.0, 4.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.388992309570312, -30.321237564086914, -29.253482818603516, -28.18572998046875, -27.11797523498535, -26.050220489501953, -24.982465744018555, -23.914710998535156, -22.84695816040039, -21.779203414916992, -20.711448669433594, -19.643695831298828, -18.57594108581543, -17.50818634033203, -16.440431594848633, -15.372676849365234, -14.304922103881836, -13.237167358398438, -12.169413566589355, -11.101658821105957, -10.033905029296875, -8.966150283813477, -7.898395538330078, -6.830641269683838, -5.762887001037598, -4.695132732391357, -3.627378225326538, -2.5596237182617188, -1.4918694496154785, -0.4241151809692383, 0.6436395645141602, 1.7113938331604004, 2.7791481018066406, 3.846902370452881, 4.914656639099121, 5.9824113845825195, 7.05016565322876, 8.117919921875, 9.185674667358398, 10.253429412841797, 11.321183204650879, 12.388937950134277, 13.45669174194336, 14.524446487426758, 15.592201232910156, 16.659954071044922, 17.727710723876953, 18.79546356201172, 19.863218307495117, 20.930973052978516, 21.998727798461914, 23.066482543945312, 24.134235382080078, 25.201990127563477, 26.269744873046875, 27.337499618530273, 28.405254364013672, 29.47300910949707, 30.54076385498047, 31.608516693115234, 32.676273345947266, 33.74402618408203, 34.81178283691406, 35.87953567504883, 36.947288513183594]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 6.0, 14.0, 16.0, 11.0, 16.0, 11.0, 13.0, 20.0, 20.0, 22.0, 23.0, 27.0, 28.0, 32.0, 22.0, 32.0, 49.0, 39.0, 38.0, 37.0, 45.0, 40.0, 45.0, 41.0, 47.0, 25.0, 29.0, 24.0, 16.0, 24.0, 29.0, 20.0, 16.0, 22.0, 11.0, 9.0, 15.0, 12.0, 9.0, 7.0, 7.0, 2.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.8359375, -4.68865966796875, -4.5413818359375, -4.39410400390625, -4.246826171875, -4.09954833984375, -3.9522705078125, -3.80499267578125, -3.65771484375, -3.51043701171875, -3.3631591796875, -3.21588134765625, -3.068603515625, -2.92132568359375, -2.7740478515625, -2.62677001953125, -2.4794921875, -2.33221435546875, -2.1849365234375, -2.03765869140625, -1.890380859375, -1.74310302734375, -1.5958251953125, -1.44854736328125, -1.30126953125, -1.15399169921875, -1.0067138671875, -0.85943603515625, -0.712158203125, -0.56488037109375, -0.4176025390625, -0.27032470703125, -0.123046875, 0.02423095703125, 0.1715087890625, 0.31878662109375, 0.466064453125, 0.61334228515625, 0.7606201171875, 0.90789794921875, 1.05517578125, 1.20245361328125, 1.3497314453125, 1.49700927734375, 1.644287109375, 1.79156494140625, 1.9388427734375, 2.08612060546875, 2.2333984375, 2.38067626953125, 2.5279541015625, 2.67523193359375, 2.822509765625, 2.96978759765625, 3.1170654296875, 3.26434326171875, 3.41162109375, 3.55889892578125, 3.7061767578125, 3.85345458984375, 4.000732421875, 4.14801025390625, 4.2952880859375, 4.44256591796875, 4.58984375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 15.0, 22.0, 26.0, 39.0, 51.0, 67.0, 118.0, 185.0, 256.0, 299.0, 497.0, 718.0, 1100.0, 1573.0, 2317.0, 3372.0, 5015.0, 7128.0, 10706.0, 16244.0, 23594.0, 34790.0, 50744.0, 72624.0, 101667.0, 132968.0, 148450.0, 126208.0, 95017.0, 67091.0, 46727.0, 31612.0, 21486.0, 14796.0, 10002.0, 6747.0, 4478.0, 3127.0, 2144.0, 1443.0, 1001.0, 660.0, 417.0, 316.0, 205.0, 159.0, 95.0, 81.0, 50.0, 29.0, 27.0, 19.0, 11.0, 9.0, 6.0, 2.0, 2.0, 2.0], "bins": [-0.347412109375, -0.3366851806640625, -0.325958251953125, -0.3152313232421875, -0.30450439453125, -0.2937774658203125, -0.283050537109375, -0.2723236083984375, -0.2615966796875, -0.2508697509765625, -0.240142822265625, -0.2294158935546875, -0.21868896484375, -0.2079620361328125, -0.197235107421875, -0.1865081787109375, -0.17578125, -0.1650543212890625, -0.154327392578125, -0.1436004638671875, -0.13287353515625, -0.1221466064453125, -0.111419677734375, -0.1006927490234375, -0.0899658203125, -0.0792388916015625, -0.068511962890625, -0.0577850341796875, -0.04705810546875, -0.0363311767578125, -0.025604248046875, -0.0148773193359375, -0.004150390625, 0.0065765380859375, 0.017303466796875, 0.0280303955078125, 0.03875732421875, 0.0494842529296875, 0.060211181640625, 0.0709381103515625, 0.0816650390625, 0.0923919677734375, 0.103118896484375, 0.1138458251953125, 0.12457275390625, 0.1352996826171875, 0.146026611328125, 0.1567535400390625, 0.16748046875, 0.1782073974609375, 0.188934326171875, 0.1996612548828125, 0.21038818359375, 0.2211151123046875, 0.231842041015625, 0.2425689697265625, 0.2532958984375, 0.2640228271484375, 0.274749755859375, 0.2854766845703125, 0.29620361328125, 0.3069305419921875, 0.317657470703125, 0.3283843994140625, 0.339111328125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 3.0, 4.0, 2.0, 9.0, 7.0, 13.0, 10.0, 11.0, 12.0, 12.0, 9.0, 22.0, 15.0, 15.0, 32.0, 24.0, 26.0, 32.0, 33.0, 38.0, 34.0, 30.0, 28.0, 36.0, 42.0, 1055.0, 34.0, 34.0, 35.0, 36.0, 33.0, 35.0, 31.0, 27.0, 26.0, 19.0, 20.0, 22.0, 14.0, 17.0, 15.0, 6.0, 10.0, 10.0, 8.0, 8.0, 9.0, 10.0, 7.0, 3.0, 6.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.453125, -2.36700439453125, -2.2808837890625, -2.19476318359375, -2.108642578125, -2.02252197265625, -1.9364013671875, -1.85028076171875, -1.76416015625, -1.67803955078125, -1.5919189453125, -1.50579833984375, -1.419677734375, -1.33355712890625, -1.2474365234375, -1.16131591796875, -1.0751953125, -0.98907470703125, -0.9029541015625, -0.81683349609375, -0.730712890625, -0.64459228515625, -0.5584716796875, -0.47235107421875, -0.38623046875, -0.30010986328125, -0.2139892578125, -0.12786865234375, -0.041748046875, 0.04437255859375, 0.1304931640625, 0.21661376953125, 0.302734375, 0.38885498046875, 0.4749755859375, 0.56109619140625, 0.647216796875, 0.73333740234375, 0.8194580078125, 0.90557861328125, 0.99169921875, 1.07781982421875, 1.1639404296875, 1.25006103515625, 1.336181640625, 1.42230224609375, 1.5084228515625, 1.59454345703125, 1.6806640625, 1.76678466796875, 1.8529052734375, 1.93902587890625, 2.025146484375, 2.11126708984375, 2.1973876953125, 2.28350830078125, 2.36962890625, 2.45574951171875, 2.5418701171875, 2.62799072265625, 2.714111328125, 2.80023193359375, 2.8863525390625, 2.97247314453125, 3.05859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 13.0, 17.0, 34.0, 38.0, 63.0, 85.0, 142.0, 184.0, 281.0, 415.0, 585.0, 865.0, 1390.0, 2061.0, 3161.0, 4739.0, 7445.0, 11199.0, 16694.0, 25251.0, 37355.0, 53612.0, 75041.0, 100445.0, 131180.0, 1168123.0, 125866.0, 98017.0, 73247.0, 51856.0, 35979.0, 24444.0, 16279.0, 10905.0, 6905.0, 4549.0, 2886.0, 1869.0, 1323.0, 794.0, 559.0, 405.0, 266.0, 162.0, 112.0, 77.0, 75.0, 47.0, 29.0, 17.0, 13.0, 15.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.237060546875, -0.22975540161132812, -0.22245025634765625, -0.21514511108398438, -0.2078399658203125, -0.20053482055664062, -0.19322967529296875, -0.18592453002929688, -0.178619384765625, -0.17131423950195312, -0.16400909423828125, -0.15670394897460938, -0.1493988037109375, -0.14209365844726562, -0.13478851318359375, -0.12748336791992188, -0.12017822265625, -0.11287307739257812, -0.10556793212890625, -0.09826278686523438, -0.0909576416015625, -0.08365249633789062, -0.07634735107421875, -0.06904220581054688, -0.061737060546875, -0.054431915283203125, -0.04712677001953125, -0.039821624755859375, -0.0325164794921875, -0.025211334228515625, -0.01790618896484375, -0.010601043701171875, -0.0032958984375, 0.004009246826171875, 0.01131439208984375, 0.018619537353515625, 0.0259246826171875, 0.033229827880859375, 0.04053497314453125, 0.047840118408203125, 0.055145263671875, 0.062450408935546875, 0.06975555419921875, 0.07706069946289062, 0.0843658447265625, 0.09167098999023438, 0.09897613525390625, 0.10628128051757812, 0.11358642578125, 0.12089157104492188, 0.12819671630859375, 0.13550186157226562, 0.1428070068359375, 0.15011215209960938, 0.15741729736328125, 0.16472244262695312, 0.172027587890625, 0.17933273315429688, 0.18663787841796875, 0.19394302368164062, 0.2012481689453125, 0.20855331420898438, 0.21585845947265625, 0.22316360473632812, 0.23046875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 5.0, 7.0, 6.0, 8.0, 10.0, 13.0, 20.0, 26.0, 30.0, 30.0, 40.0, 40.0, 63.0, 94.0, 96.0, 112.0, 83.0, 53.0, 47.0, 43.0, 32.0, 23.0, 24.0, 21.0, 9.0, 5.0, 7.0, 10.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01488494873046875, -0.01440417766571045, -0.013923406600952148, -0.013442635536193848, -0.012961864471435547, -0.012481093406677246, -0.012000322341918945, -0.011519551277160645, -0.011038780212402344, -0.010558009147644043, -0.010077238082885742, -0.009596467018127441, -0.00911569595336914, -0.00863492488861084, -0.008154153823852539, -0.007673382759094238, -0.0071926116943359375, -0.006711840629577637, -0.006231069564819336, -0.005750298500061035, -0.005269527435302734, -0.004788756370544434, -0.004307985305786133, -0.003827214241027832, -0.0033464431762695312, -0.0028656721115112305, -0.0023849010467529297, -0.001904129981994629, -0.0014233589172363281, -0.0009425878524780273, -0.00046181678771972656, 1.895427703857422e-05, 0.000499725341796875, 0.0009804964065551758, 0.0014612674713134766, 0.0019420385360717773, 0.002422809600830078, 0.002903580665588379, 0.0033843517303466797, 0.0038651227951049805, 0.004345893859863281, 0.004826664924621582, 0.005307435989379883, 0.005788207054138184, 0.006268978118896484, 0.006749749183654785, 0.007230520248413086, 0.007711291313171387, 0.008192062377929688, 0.008672833442687988, 0.009153604507446289, 0.00963437557220459, 0.01011514663696289, 0.010595917701721191, 0.011076688766479492, 0.011557459831237793, 0.012038230895996094, 0.012519001960754395, 0.012999773025512695, 0.013480544090270996, 0.013961315155029297, 0.014442086219787598, 0.014922857284545898, 0.0154036283493042, 0.0158843994140625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 10.0, 11.0, 11.0, 13.0, 32.0, 30.0, 47.0, 60.0, 125.0, 181.0, 385.0, 1997.0, 161849.0, 877894.0, 4736.0, 507.0, 207.0, 115.0, 75.0, 54.0, 42.0, 43.0, 17.0, 17.0, 14.0, 7.0, 8.0, 7.0, 6.0, 6.0, 7.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.329833984375, -0.31987762451171875, -0.3099212646484375, -0.29996490478515625, -0.290008544921875, -0.28005218505859375, -0.2700958251953125, -0.26013946533203125, -0.25018310546875, -0.24022674560546875, -0.2302703857421875, -0.22031402587890625, -0.210357666015625, -0.20040130615234375, -0.1904449462890625, -0.18048858642578125, -0.1705322265625, -0.16057586669921875, -0.1506195068359375, -0.14066314697265625, -0.130706787109375, -0.12075042724609375, -0.1107940673828125, -0.10083770751953125, -0.09088134765625, -0.08092498779296875, -0.0709686279296875, -0.06101226806640625, -0.051055908203125, -0.04109954833984375, -0.0311431884765625, -0.02118682861328125, -0.01123046875, -0.00127410888671875, 0.0086822509765625, 0.01863861083984375, 0.028594970703125, 0.03855133056640625, 0.0485076904296875, 0.05846405029296875, 0.06842041015625, 0.07837677001953125, 0.0883331298828125, 0.09828948974609375, 0.108245849609375, 0.11820220947265625, 0.1281585693359375, 0.13811492919921875, 0.1480712890625, 0.15802764892578125, 0.1679840087890625, 0.17794036865234375, 0.187896728515625, 0.19785308837890625, 0.2078094482421875, 0.21776580810546875, 0.22772216796875, 0.23767852783203125, 0.2476348876953125, 0.25759124755859375, 0.267547607421875, 0.27750396728515625, 0.2874603271484375, 0.29741668701171875, 0.307373046875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 29.0, 260.0, 607.0, 83.0, 26.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19324229657649994, -0.1885472536087036, -0.1838522106409073, -0.17915716767311096, -0.17446212470531464, -0.1697670817375183, -0.16507203876972198, -0.16037699580192566, -0.15568193793296814, -0.15098689496517181, -0.1462918519973755, -0.14159680902957916, -0.13690176606178284, -0.1322067230939865, -0.12751168012619019, -0.12281662970781326, -0.11812159419059753, -0.11342655122280121, -0.10873150825500488, -0.10403646528720856, -0.09934142231941223, -0.0946463793516159, -0.08995132893323898, -0.08525628596544266, -0.08056124299764633, -0.07586620002985, -0.07117115706205368, -0.06647611409425735, -0.06178106740117073, -0.057086024433374405, -0.05239097774028778, -0.047695934772491455, -0.043000876903533936, -0.03830583393573761, -0.033610790967941284, -0.02891574427485466, -0.024220701307058334, -0.01952565833926201, -0.014830613508820534, -0.010135568678379059, -0.005440525710582733, -0.0007454818114638329, 0.0039495620876550674, 0.008644605986773968, 0.013339649885892868, 0.018034692853689194, 0.02272973768413067, 0.027424782514572144, 0.03211982548236847, 0.036814868450164795, 0.04150991141796112, 0.046204958111047745, 0.05090000107884407, 0.055595044046640396, 0.06029009073972702, 0.06498513370752335, 0.06968017667531967, 0.074375219643116, 0.07907026261091232, 0.08376530557870865, 0.08846035599708557, 0.0931553989648819, 0.09785044193267822, 0.10254548490047455, 0.10724052786827087]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 3.0, 3.0, 6.0, 5.0, 2.0, 9.0, 8.0, 14.0, 10.0, 19.0, 12.0, 25.0, 25.0, 31.0, 31.0, 26.0, 30.0, 34.0, 19.0, 39.0, 45.0, 35.0, 34.0, 47.0, 37.0, 44.0, 35.0, 32.0, 36.0, 25.0, 26.0, 27.0, 27.0, 27.0, 22.0, 32.0, 19.0, 12.0, 17.0, 13.0, 12.0, 20.0, 2.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.019198596477508545, -0.018639346584677696, -0.018080096691846848, -0.017520846799016, -0.01696159690618515, -0.0164023470133543, -0.015843097120523453, -0.015283847227692604, -0.014724597334861755, -0.014165347442030907, -0.013606097549200058, -0.01304684765636921, -0.01248759776353836, -0.011928347870707512, -0.011369097977876663, -0.010809848085045815, -0.010250598192214966, -0.009691348299384117, -0.009132098406553268, -0.00857284851372242, -0.008013598620891571, -0.007454348728060722, -0.006895098835229874, -0.006335848942399025, -0.005776599049568176, -0.005217349156737328, -0.004658099263906479, -0.00409884937107563, -0.0035395994782447815, -0.002980349585413933, -0.002421099692583084, -0.0018618497997522354, -0.0013025999069213867, -0.000743350014090538, -0.00018410012125968933, 0.00037514977157115936, 0.0009343996644020081, 0.0014936495572328568, 0.0020528994500637054, 0.002612149342894554, 0.003171399235725403, 0.0037306491285562515, 0.0042898990213871, 0.004849148914217949, 0.005408398807048798, 0.005967648699879646, 0.006526898592710495, 0.007086148485541344, 0.007645398378372192, 0.008204648271203041, 0.00876389816403389, 0.009323148056864738, 0.009882397949695587, 0.010441647842526436, 0.011000897735357285, 0.011560147628188133, 0.012119397521018982, 0.01267864741384983, 0.01323789730668068, 0.013797147199511528, 0.014356397092342377, 0.014915646985173225, 0.015474896878004074, 0.016034146770834923, 0.01659339666366577]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 6.0, 14.0, 15.0, 12.0, 16.0, 11.0, 13.0, 19.0, 21.0, 22.0, 22.0, 26.0, 30.0, 30.0, 24.0, 31.0, 50.0, 38.0, 39.0, 37.0, 45.0, 40.0, 45.0, 41.0, 46.0, 26.0, 28.0, 25.0, 16.0, 24.0, 29.0, 20.0, 16.0, 22.0, 11.0, 9.0, 15.0, 12.0, 9.0, 7.0, 7.0, 2.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.83984375, -4.6925048828125, -4.545166015625, -4.3978271484375, -4.25048828125, -4.1031494140625, -3.955810546875, -3.8084716796875, -3.6611328125, -3.5137939453125, -3.366455078125, -3.2191162109375, -3.07177734375, -2.9244384765625, -2.777099609375, -2.6297607421875, -2.482421875, -2.3350830078125, -2.187744140625, -2.0404052734375, -1.89306640625, -1.7457275390625, -1.598388671875, -1.4510498046875, -1.3037109375, -1.1563720703125, -1.009033203125, -0.8616943359375, -0.71435546875, -0.5670166015625, -0.419677734375, -0.2723388671875, -0.125, 0.0223388671875, 0.169677734375, 0.3170166015625, 0.46435546875, 0.6116943359375, 0.759033203125, 0.9063720703125, 1.0537109375, 1.2010498046875, 1.348388671875, 1.4957275390625, 1.64306640625, 1.7904052734375, 1.937744140625, 2.0850830078125, 2.232421875, 2.3797607421875, 2.527099609375, 2.6744384765625, 2.82177734375, 2.9691162109375, 3.116455078125, 3.2637939453125, 3.4111328125, 3.5584716796875, 3.705810546875, 3.8531494140625, 4.00048828125, 4.1478271484375, 4.295166015625, 4.4425048828125, 4.58984375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 19.0, 21.0, 20.0, 22.0, 34.0, 36.0, 59.0, 64.0, 114.0, 156.0, 340.0, 712.0, 1736.0, 5184.0, 16146.0, 51309.0, 196516.0, 561880.0, 151657.0, 42035.0, 13334.0, 4235.0, 1429.0, 610.0, 292.0, 162.0, 116.0, 67.0, 53.0, 31.0, 21.0, 23.0, 20.0, 20.0, 15.0, 11.0, 6.0, 4.0, 11.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-10.421875, -10.1099853515625, -9.798095703125, -9.4862060546875, -9.17431640625, -8.8624267578125, -8.550537109375, -8.2386474609375, -7.9267578125, -7.6148681640625, -7.302978515625, -6.9910888671875, -6.67919921875, -6.3673095703125, -6.055419921875, -5.7435302734375, -5.431640625, -5.1197509765625, -4.807861328125, -4.4959716796875, -4.18408203125, -3.8721923828125, -3.560302734375, -3.2484130859375, -2.9365234375, -2.6246337890625, -2.312744140625, -2.0008544921875, -1.68896484375, -1.3770751953125, -1.065185546875, -0.7532958984375, -0.44140625, -0.1295166015625, 0.182373046875, 0.4942626953125, 0.80615234375, 1.1180419921875, 1.429931640625, 1.7418212890625, 2.0537109375, 2.3656005859375, 2.677490234375, 2.9893798828125, 3.30126953125, 3.6131591796875, 3.925048828125, 4.2369384765625, 4.548828125, 4.8607177734375, 5.172607421875, 5.4844970703125, 5.79638671875, 6.1082763671875, 6.420166015625, 6.7320556640625, 7.0439453125, 7.3558349609375, 7.667724609375, 7.9796142578125, 8.29150390625, 8.6033935546875, 8.915283203125, 9.2271728515625, 9.5390625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 3.0, 6.0, 10.0, 13.0, 15.0, 16.0, 20.0, 27.0, 37.0, 26.0, 36.0, 38.0, 44.0, 61.0, 107.0, 195.0, 1464.0, 323.0, 141.0, 83.0, 50.0, 55.0, 50.0, 36.0, 32.0, 29.0, 17.0, 17.0, 23.0, 20.0, 8.0, 7.0, 4.0, 7.0, 7.0, 2.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.328857421875, -15.72021484375, -15.111572265625, -14.5029296875, -13.894287109375, -13.28564453125, -12.677001953125, -12.068359375, -11.459716796875, -10.85107421875, -10.242431640625, -9.6337890625, -9.025146484375, -8.41650390625, -7.807861328125, -7.19921875, -6.590576171875, -5.98193359375, -5.373291015625, -4.7646484375, -4.156005859375, -3.54736328125, -2.938720703125, -2.330078125, -1.721435546875, -1.11279296875, -0.504150390625, 0.1044921875, 0.713134765625, 1.32177734375, 1.930419921875, 2.5390625, 3.147705078125, 3.75634765625, 4.364990234375, 4.9736328125, 5.582275390625, 6.19091796875, 6.799560546875, 7.408203125, 8.016845703125, 8.62548828125, 9.234130859375, 9.8427734375, 10.451416015625, 11.06005859375, 11.668701171875, 12.27734375, 12.885986328125, 13.49462890625, 14.103271484375, 14.7119140625, 15.320556640625, 15.92919921875, 16.537841796875, 17.146484375, 17.755126953125, 18.36376953125, 18.972412109375, 19.5810546875, 20.189697265625, 20.79833984375, 21.406982421875, 22.015625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 3.0, 7.0, 5.0, 18.0, 12.0, 21.0, 26.0, 28.0, 30.0, 39.0, 59.0, 69.0, 101.0, 126.0, 228.0, 408.0, 1085.0, 14575.0, 3045523.0, 80184.0, 1743.0, 540.0, 282.0, 149.0, 111.0, 71.0, 51.0, 52.0, 30.0, 28.0, 20.0, 18.0, 11.0, 10.0, 6.0, 11.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.6875, -58.9853515625, -57.283203125, -55.5810546875, -53.87890625, -52.1767578125, -50.474609375, -48.7724609375, -47.0703125, -45.3681640625, -43.666015625, -41.9638671875, -40.26171875, -38.5595703125, -36.857421875, -35.1552734375, -33.453125, -31.7509765625, -30.048828125, -28.3466796875, -26.64453125, -24.9423828125, -23.240234375, -21.5380859375, -19.8359375, -18.1337890625, -16.431640625, -14.7294921875, -13.02734375, -11.3251953125, -9.623046875, -7.9208984375, -6.21875, -4.5166015625, -2.814453125, -1.1123046875, 0.58984375, 2.2919921875, 3.994140625, 5.6962890625, 7.3984375, 9.1005859375, 10.802734375, 12.5048828125, 14.20703125, 15.9091796875, 17.611328125, 19.3134765625, 21.015625, 22.7177734375, 24.419921875, 26.1220703125, 27.82421875, 29.5263671875, 31.228515625, 32.9306640625, 34.6328125, 36.3349609375, 38.037109375, 39.7392578125, 41.44140625, 43.1435546875, 44.845703125, 46.5478515625, 48.25]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 6.0, 12.0, 12.0, 31.0, 41.0, 47.0, 80.0, 84.0, 105.0, 107.0, 98.0, 79.0, 92.0, 52.0, 49.0, 46.0, 25.0, 15.0, 13.0, 2.0, 8.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.501716613769531, -10.852889060974121, -10.204061508178711, -9.555233001708984, -8.906405448913574, -8.257577896118164, -7.608749866485596, -6.959921836853027, -6.311094284057617, -5.662266731262207, -5.013438701629639, -4.36461067199707, -3.71578311920166, -3.066955327987671, -2.4181275367736816, -1.7692995071411133, -1.1204719543457031, -0.47164416313171387, 0.1771836280822754, 0.8260114192962646, 1.474839210510254, 2.123667001724243, 2.7724947929382324, 3.421322822570801, 4.070150375366211, 4.718977928161621, 5.3678059577941895, 6.016633987426758, 6.665461540222168, 7.314289093017578, 7.9631171226501465, 8.611945152282715, 9.260772705078125, 9.909600257873535, 10.558427810668945, 11.207256317138672, 11.856083869934082, 12.504911422729492, 13.153739929199219, 13.802567481994629, 14.451395034790039, 15.10022258758545, 15.74905014038086, 16.397878646850586, 17.046707153320312, 17.695533752441406, 18.344362258911133, 18.99319076538086, 19.642017364501953, 20.29084587097168, 20.939672470092773, 21.5885009765625, 22.237327575683594, 22.88615608215332, 23.534984588623047, 24.18381118774414, 24.832639694213867, 25.481468200683594, 26.130294799804688, 26.779123306274414, 27.42795181274414, 28.076778411865234, 28.72560691833496, 29.374435424804688, 30.02326202392578]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 8.0, 11.0, 13.0, 12.0, 19.0, 12.0, 23.0, 25.0, 28.0, 44.0, 36.0, 40.0, 44.0, 44.0, 48.0, 47.0, 44.0, 55.0, 39.0, 50.0, 45.0, 37.0, 34.0, 31.0, 34.0, 30.0, 25.0, 31.0, 17.0, 20.0, 15.0, 8.0, 8.0, 6.0, 2.0, 10.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-67.97822570800781, -66.26310729980469, -64.54798889160156, -62.83287048339844, -61.11775207519531, -59.40263366699219, -57.68751525878906, -55.97239685058594, -54.25727844238281, -52.54216003417969, -50.82704162597656, -49.11192321777344, -47.39680480957031, -45.68168640136719, -43.96656799316406, -42.25144958496094, -40.53633499145508, -38.82121658325195, -37.10609817504883, -35.3909797668457, -33.67586135864258, -31.960742950439453, -30.24562644958496, -28.530508041381836, -26.81538963317871, -25.100271224975586, -23.38515281677246, -21.67003631591797, -19.954917907714844, -18.23979949951172, -16.524681091308594, -14.809562683105469, -13.09444808959961, -11.379329681396484, -9.66421127319336, -7.949093818664551, -6.233975410461426, -4.518857002258301, -2.803739547729492, -1.0886211395263672, 0.6264972686767578, 2.3416154384613037, 4.05673360824585, 5.771851539611816, 7.486969947814941, 9.202088356018066, 10.917205810546875, 12.63232421875, 14.347442626953125, 16.06256103515625, 17.777679443359375, 19.4927978515625, 21.207916259765625, 22.92303466796875, 24.638151168823242, 26.353269577026367, 28.068387985229492, 29.783506393432617, 31.498624801635742, 33.213741302490234, 34.92885971069336, 36.643978118896484, 38.35909652709961, 40.074214935302734, 41.78933334350586]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 8.0, 6.0, 8.0, 9.0, 13.0, 17.0, 10.0, 25.0, 13.0, 23.0, 25.0, 34.0, 25.0, 26.0, 23.0, 35.0, 42.0, 35.0, 41.0, 35.0, 48.0, 48.0, 41.0, 43.0, 41.0, 30.0, 33.0, 29.0, 29.0, 28.0, 21.0, 22.0, 23.0, 15.0, 9.0, 15.0, 12.0, 19.0, 6.0, 3.0, 4.0, 6.0, 7.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0], "bins": [-6.09765625, -5.92572021484375, -5.7537841796875, -5.58184814453125, -5.409912109375, -5.23797607421875, -5.0660400390625, -4.89410400390625, -4.72216796875, -4.55023193359375, -4.3782958984375, -4.20635986328125, -4.034423828125, -3.86248779296875, -3.6905517578125, -3.51861572265625, -3.3466796875, -3.17474365234375, -3.0028076171875, -2.83087158203125, -2.658935546875, -2.48699951171875, -2.3150634765625, -2.14312744140625, -1.97119140625, -1.79925537109375, -1.6273193359375, -1.45538330078125, -1.283447265625, -1.11151123046875, -0.9395751953125, -0.76763916015625, -0.595703125, -0.42376708984375, -0.2518310546875, -0.07989501953125, 0.092041015625, 0.26397705078125, 0.4359130859375, 0.60784912109375, 0.77978515625, 0.95172119140625, 1.1236572265625, 1.29559326171875, 1.467529296875, 1.63946533203125, 1.8114013671875, 1.98333740234375, 2.1552734375, 2.32720947265625, 2.4991455078125, 2.67108154296875, 2.843017578125, 3.01495361328125, 3.1868896484375, 3.35882568359375, 3.53076171875, 3.70269775390625, 3.8746337890625, 4.04656982421875, 4.218505859375, 4.39044189453125, 4.5623779296875, 4.73431396484375, 4.90625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 1.0, 6.0, 18.0, 17.0, 15.0, 19.0, 27.0, 33.0, 28.0, 57.0, 74.0, 134.0, 226.0, 373.0, 633.0, 1340.0, 3124.0, 8186.0, 21722.0, 64698.0, 184682.0, 472464.0, 942443.0, 1167925.0, 771449.0, 350720.0, 131464.0, 45842.0, 15674.0, 5961.0, 2436.0, 1062.0, 558.0, 304.0, 166.0, 113.0, 78.0, 54.0, 27.0, 22.0, 22.0, 12.0, 14.0, 10.0, 14.0, 5.0, 3.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0], "bins": [-5.89453125, -5.72283935546875, -5.5511474609375, -5.37945556640625, -5.207763671875, -5.03607177734375, -4.8643798828125, -4.69268798828125, -4.52099609375, -4.34930419921875, -4.1776123046875, -4.00592041015625, -3.834228515625, -3.66253662109375, -3.4908447265625, -3.31915283203125, -3.1474609375, -2.97576904296875, -2.8040771484375, -2.63238525390625, -2.460693359375, -2.28900146484375, -2.1173095703125, -1.94561767578125, -1.77392578125, -1.60223388671875, -1.4305419921875, -1.25885009765625, -1.087158203125, -0.91546630859375, -0.7437744140625, -0.57208251953125, -0.400390625, -0.22869873046875, -0.0570068359375, 0.11468505859375, 0.286376953125, 0.45806884765625, 0.6297607421875, 0.80145263671875, 0.97314453125, 1.14483642578125, 1.3165283203125, 1.48822021484375, 1.659912109375, 1.83160400390625, 2.0032958984375, 2.17498779296875, 2.3466796875, 2.51837158203125, 2.6900634765625, 2.86175537109375, 3.033447265625, 3.20513916015625, 3.3768310546875, 3.54852294921875, 3.72021484375, 3.89190673828125, 4.0635986328125, 4.23529052734375, 4.406982421875, 4.57867431640625, 4.7503662109375, 4.92205810546875, 5.09375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 6.0, 4.0, 7.0, 13.0, 11.0, 20.0, 30.0, 26.0, 40.0, 54.0, 63.0, 85.0, 103.0, 145.0, 194.0, 239.0, 308.0, 354.0, 374.0, 383.0, 327.0, 299.0, 243.0, 184.0, 138.0, 98.0, 77.0, 64.0, 40.0, 36.0, 15.0, 19.0, 18.0, 12.0, 11.0, 7.0, 7.0, 8.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0078125, -8.7161865234375, -8.424560546875, -8.1329345703125, -7.84130859375, -7.5496826171875, -7.258056640625, -6.9664306640625, -6.6748046875, -6.3831787109375, -6.091552734375, -5.7999267578125, -5.50830078125, -5.2166748046875, -4.925048828125, -4.6334228515625, -4.341796875, -4.0501708984375, -3.758544921875, -3.4669189453125, -3.17529296875, -2.8836669921875, -2.592041015625, -2.3004150390625, -2.0087890625, -1.7171630859375, -1.425537109375, -1.1339111328125, -0.84228515625, -0.5506591796875, -0.259033203125, 0.0325927734375, 0.32421875, 0.6158447265625, 0.907470703125, 1.1990966796875, 1.49072265625, 1.7823486328125, 2.073974609375, 2.3656005859375, 2.6572265625, 2.9488525390625, 3.240478515625, 3.5321044921875, 3.82373046875, 4.1153564453125, 4.406982421875, 4.6986083984375, 4.990234375, 5.2818603515625, 5.573486328125, 5.8651123046875, 6.15673828125, 6.4483642578125, 6.739990234375, 7.0316162109375, 7.3232421875, 7.6148681640625, 7.906494140625, 8.1981201171875, 8.48974609375, 8.7813720703125, 9.072998046875, 9.3646240234375, 9.65625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 11.0, 10.0, 12.0, 10.0, 16.0, 16.0, 27.0, 39.0, 47.0, 67.0, 116.0, 147.0, 238.0, 427.0, 697.0, 1644.0, 12261.0, 1077884.0, 3056639.0, 39374.0, 2367.0, 879.0, 481.0, 245.0, 177.0, 123.0, 74.0, 65.0, 44.0, 37.0, 24.0, 18.0, 16.0, 13.0, 7.0, 8.0, 7.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.15625, -34.095703125, -33.03515625, -31.974609375, -30.9140625, -29.853515625, -28.79296875, -27.732421875, -26.671875, -25.611328125, -24.55078125, -23.490234375, -22.4296875, -21.369140625, -20.30859375, -19.248046875, -18.1875, -17.126953125, -16.06640625, -15.005859375, -13.9453125, -12.884765625, -11.82421875, -10.763671875, -9.703125, -8.642578125, -7.58203125, -6.521484375, -5.4609375, -4.400390625, -3.33984375, -2.279296875, -1.21875, -0.158203125, 0.90234375, 1.962890625, 3.0234375, 4.083984375, 5.14453125, 6.205078125, 7.265625, 8.326171875, 9.38671875, 10.447265625, 11.5078125, 12.568359375, 13.62890625, 14.689453125, 15.75, 16.810546875, 17.87109375, 18.931640625, 19.9921875, 21.052734375, 22.11328125, 23.173828125, 24.234375, 25.294921875, 26.35546875, 27.416015625, 28.4765625, 29.537109375, 30.59765625, 31.658203125, 32.71875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 34.0, 691.0, 287.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-493.4949035644531, -481.6839904785156, -469.8730773925781, -458.0621337890625, -446.251220703125, -434.4403076171875, -422.62939453125, -410.8184814453125, -399.007568359375, -387.1966552734375, -375.3857421875, -363.5748291015625, -351.7638854980469, -339.9529724121094, -328.1420593261719, -316.3311462402344, -304.52020263671875, -292.70928955078125, -280.89837646484375, -269.08746337890625, -257.2765197753906, -245.46560668945312, -233.65469360351562, -221.84378051757812, -210.03286743164062, -198.22195434570312, -186.41102600097656, -174.60011291503906, -162.78919982910156, -150.978271484375, -139.1673583984375, -127.3564453125, -115.5455322265625, -103.73461151123047, -91.92369842529297, -80.11277770996094, -68.30186462402344, -56.490943908691406, -44.680023193359375, -32.869110107421875, -21.058189392089844, -9.247271537780762, 2.5636463165283203, 14.374565124511719, 26.185482025146484, 37.99639892578125, 49.80731964111328, 61.61823272705078, 73.42915344238281, 85.24007415771484, 97.05098724365234, 108.86190795898438, 120.67282104492188, 132.48373413085938, 144.29466247558594, 156.10557556152344, 167.91650390625, 179.7274169921875, 191.53834533691406, 203.34925842285156, 215.16017150878906, 226.97109985351562, 238.78201293945312, 250.59292602539062, 262.4038391113281]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 3.0, 10.0, 9.0, 10.0, 15.0, 10.0, 25.0, 17.0, 24.0, 28.0, 35.0, 35.0, 38.0, 42.0, 42.0, 36.0, 33.0, 39.0, 37.0, 38.0, 42.0, 44.0, 48.0, 35.0, 44.0, 30.0, 33.0, 26.0, 15.0, 23.0, 19.0, 19.0, 21.0, 8.0, 8.0, 8.0, 7.0, 2.0, 8.0, 6.0, 8.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.747676849365234, -31.709997177124023, -30.672317504882812, -29.6346378326416, -28.59695816040039, -27.55927848815918, -26.52159881591797, -25.483919143676758, -24.446239471435547, -23.408559799194336, -22.370880126953125, -21.333200454711914, -20.295520782470703, -19.257841110229492, -18.22016143798828, -17.18248176574707, -16.14480209350586, -15.107122421264648, -14.069442749023438, -13.031763076782227, -11.994083404541016, -10.956403732299805, -9.918724060058594, -8.881044387817383, -7.843364715576172, -6.805685043334961, -5.76800537109375, -4.730325698852539, -3.692646026611328, -2.654966354370117, -1.6172866821289062, -0.5796070098876953, 0.45807647705078125, 1.4957561492919922, 2.533435821533203, 3.571115493774414, 4.608795166015625, 5.646474838256836, 6.684154510498047, 7.721834182739258, 8.759513854980469, 9.79719352722168, 10.83487319946289, 11.872552871704102, 12.910232543945312, 13.947912216186523, 14.985591888427734, 16.023271560668945, 17.060951232910156, 18.098630905151367, 19.136310577392578, 20.17399024963379, 21.211669921875, 22.24934959411621, 23.287029266357422, 24.324708938598633, 25.362388610839844, 26.400068283081055, 27.437747955322266, 28.475427627563477, 29.513107299804688, 30.5507869720459, 31.58846664428711, 32.62614440917969, 33.66382598876953]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 8.0, 9.0, 6.0, 15.0, 17.0, 21.0, 17.0, 23.0, 25.0, 23.0, 26.0, 27.0, 37.0, 27.0, 40.0, 45.0, 37.0, 38.0, 43.0, 47.0, 44.0, 37.0, 51.0, 35.0, 29.0, 46.0, 25.0, 24.0, 22.0, 33.0, 24.0, 13.0, 15.0, 10.0, 15.0, 12.0, 6.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.63433837890625, -5.4639892578125, -5.29364013671875, -5.123291015625, -4.95294189453125, -4.7825927734375, -4.61224365234375, -4.44189453125, -4.27154541015625, -4.1011962890625, -3.93084716796875, -3.760498046875, -3.59014892578125, -3.4197998046875, -3.24945068359375, -3.0791015625, -2.90875244140625, -2.7384033203125, -2.56805419921875, -2.397705078125, -2.22735595703125, -2.0570068359375, -1.88665771484375, -1.71630859375, -1.54595947265625, -1.3756103515625, -1.20526123046875, -1.034912109375, -0.86456298828125, -0.6942138671875, -0.52386474609375, -0.353515625, -0.18316650390625, -0.0128173828125, 0.15753173828125, 0.327880859375, 0.49822998046875, 0.6685791015625, 0.83892822265625, 1.00927734375, 1.17962646484375, 1.3499755859375, 1.52032470703125, 1.690673828125, 1.86102294921875, 2.0313720703125, 2.20172119140625, 2.3720703125, 2.54241943359375, 2.7127685546875, 2.88311767578125, 3.053466796875, 3.22381591796875, 3.3941650390625, 3.56451416015625, 3.73486328125, 3.90521240234375, 4.0755615234375, 4.24591064453125, 4.416259765625, 4.58660888671875, 4.7569580078125, 4.92730712890625, 5.09765625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 10.0, 8.0, 9.0, 21.0, 23.0, 31.0, 65.0, 100.0, 161.0, 271.0, 407.0, 603.0, 1037.0, 1737.0, 2673.0, 4297.0, 6885.0, 11104.0, 17972.0, 28434.0, 46676.0, 74661.0, 118180.0, 170854.0, 186311.0, 138370.0, 90113.0, 56117.0, 34543.0, 21634.0, 13200.0, 8315.0, 5151.0, 3194.0, 2000.0, 1264.0, 772.0, 498.0, 337.0, 158.0, 133.0, 93.0, 50.0, 33.0, 20.0, 16.0, 3.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.483642578125, -0.46862030029296875, -0.4535980224609375, -0.43857574462890625, -0.423553466796875, -0.40853118896484375, -0.3935089111328125, -0.37848663330078125, -0.36346435546875, -0.34844207763671875, -0.3334197998046875, -0.31839752197265625, -0.303375244140625, -0.28835296630859375, -0.2733306884765625, -0.25830841064453125, -0.2432861328125, -0.22826385498046875, -0.2132415771484375, -0.19821929931640625, -0.183197021484375, -0.16817474365234375, -0.1531524658203125, -0.13813018798828125, -0.12310791015625, -0.10808563232421875, -0.0930633544921875, -0.07804107666015625, -0.063018798828125, -0.04799652099609375, -0.0329742431640625, -0.01795196533203125, -0.0029296875, 0.01209259033203125, 0.0271148681640625, 0.04213714599609375, 0.057159423828125, 0.07218170166015625, 0.0872039794921875, 0.10222625732421875, 0.11724853515625, 0.13227081298828125, 0.1472930908203125, 0.16231536865234375, 0.177337646484375, 0.19235992431640625, 0.2073822021484375, 0.22240447998046875, 0.2374267578125, 0.25244903564453125, 0.2674713134765625, 0.28249359130859375, 0.297515869140625, 0.31253814697265625, 0.3275604248046875, 0.34258270263671875, 0.35760498046875, 0.37262725830078125, 0.3876495361328125, 0.40267181396484375, 0.417694091796875, 0.43271636962890625, 0.4477386474609375, 0.46276092529296875, 0.477783203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 8.0, 4.0, 8.0, 13.0, 16.0, 13.0, 14.0, 19.0, 23.0, 32.0, 16.0, 31.0, 38.0, 27.0, 30.0, 38.0, 33.0, 52.0, 43.0, 1062.0, 37.0, 45.0, 42.0, 38.0, 41.0, 35.0, 32.0, 32.0, 23.0, 30.0, 26.0, 14.0, 29.0, 17.0, 9.0, 9.0, 11.0, 14.0, 3.0, 11.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.873046875, -3.76544189453125, -3.6578369140625, -3.55023193359375, -3.442626953125, -3.33502197265625, -3.2274169921875, -3.11981201171875, -3.01220703125, -2.90460205078125, -2.7969970703125, -2.68939208984375, -2.581787109375, -2.47418212890625, -2.3665771484375, -2.25897216796875, -2.1513671875, -2.04376220703125, -1.9361572265625, -1.82855224609375, -1.720947265625, -1.61334228515625, -1.5057373046875, -1.39813232421875, -1.29052734375, -1.18292236328125, -1.0753173828125, -0.96771240234375, -0.860107421875, -0.75250244140625, -0.6448974609375, -0.53729248046875, -0.4296875, -0.32208251953125, -0.2144775390625, -0.10687255859375, 0.000732421875, 0.10833740234375, 0.2159423828125, 0.32354736328125, 0.43115234375, 0.53875732421875, 0.6463623046875, 0.75396728515625, 0.861572265625, 0.96917724609375, 1.0767822265625, 1.18438720703125, 1.2919921875, 1.39959716796875, 1.5072021484375, 1.61480712890625, 1.722412109375, 1.83001708984375, 1.9376220703125, 2.04522705078125, 2.15283203125, 2.26043701171875, 2.3680419921875, 2.47564697265625, 2.583251953125, 2.69085693359375, 2.7984619140625, 2.90606689453125, 3.013671875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 15.0, 22.0, 27.0, 52.0, 64.0, 91.0, 140.0, 183.0, 276.0, 427.0, 602.0, 908.0, 1383.0, 2013.0, 3098.0, 4907.0, 7527.0, 11958.0, 18395.0, 28077.0, 42936.0, 64047.0, 91550.0, 123007.0, 1125160.0, 209301.0, 113728.0, 82350.0, 56755.0, 37625.0, 24912.0, 16066.0, 10300.0, 6656.0, 4341.0, 2734.0, 1786.0, 1194.0, 812.0, 533.0, 331.0, 263.0, 175.0, 128.0, 90.0, 56.0, 46.0, 27.0, 14.0, 9.0, 7.0, 7.0, 5.0, 4.0, 1.0, 4.0, 2.0], "bins": [-0.267578125, -0.25917816162109375, -0.2507781982421875, -0.24237823486328125, -0.233978271484375, -0.22557830810546875, -0.2171783447265625, -0.20877838134765625, -0.20037841796875, -0.19197845458984375, -0.1835784912109375, -0.17517852783203125, -0.166778564453125, -0.15837860107421875, -0.1499786376953125, -0.14157867431640625, -0.1331787109375, -0.12477874755859375, -0.1163787841796875, -0.10797882080078125, -0.099578857421875, -0.09117889404296875, -0.0827789306640625, -0.07437896728515625, -0.06597900390625, -0.05757904052734375, -0.0491790771484375, -0.04077911376953125, -0.032379150390625, -0.02397918701171875, -0.0155792236328125, -0.00717926025390625, 0.001220703125, 0.00962066650390625, 0.0180206298828125, 0.02642059326171875, 0.034820556640625, 0.04322052001953125, 0.0516204833984375, 0.06002044677734375, 0.06842041015625, 0.07682037353515625, 0.0852203369140625, 0.09362030029296875, 0.102020263671875, 0.11042022705078125, 0.1188201904296875, 0.12722015380859375, 0.1356201171875, 0.14402008056640625, 0.1524200439453125, 0.16082000732421875, 0.169219970703125, 0.17761993408203125, 0.1860198974609375, 0.19441986083984375, 0.20281982421875, 0.21121978759765625, 0.2196197509765625, 0.22801971435546875, 0.236419677734375, 0.24481964111328125, 0.2532196044921875, 0.26161956787109375, 0.27001953125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 16.0, 7.0, 16.0, 18.0, 21.0, 24.0, 24.0, 28.0, 33.0, 60.0, 75.0, 82.0, 94.0, 84.0, 75.0, 50.0, 55.0, 27.0, 26.0, 20.0, 19.0, 20.0, 17.0, 12.0, 5.0, 11.0, 14.0, 8.0, 6.0, 1.0, 5.0, 3.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0101470947265625, -0.009816169738769531, -0.009485244750976562, -0.009154319763183594, -0.008823394775390625, -0.008492469787597656, -0.008161544799804688, -0.007830619812011719, -0.00749969482421875, -0.007168769836425781, -0.0068378448486328125, -0.006506919860839844, -0.006175994873046875, -0.005845069885253906, -0.0055141448974609375, -0.005183219909667969, -0.004852294921875, -0.004521369934082031, -0.0041904449462890625, -0.0038595199584960938, -0.003528594970703125, -0.0031976699829101562, -0.0028667449951171875, -0.0025358200073242188, -0.00220489501953125, -0.0018739700317382812, -0.0015430450439453125, -0.0012121200561523438, -0.000881195068359375, -0.0005502700805664062, -0.0002193450927734375, 0.00011157989501953125, 0.0004425048828125, 0.0007734298706054688, 0.0011043548583984375, 0.0014352798461914062, 0.001766204833984375, 0.0020971298217773438, 0.0024280548095703125, 0.0027589797973632812, 0.00308990478515625, 0.0034208297729492188, 0.0037517547607421875, 0.004082679748535156, 0.004413604736328125, 0.004744529724121094, 0.0050754547119140625, 0.005406379699707031, 0.0057373046875, 0.006068229675292969, 0.0063991546630859375, 0.006730079650878906, 0.007061004638671875, 0.007391929626464844, 0.0077228546142578125, 0.008053779602050781, 0.00838470458984375, 0.008715629577636719, 0.009046554565429688, 0.009377479553222656, 0.009708404541015625, 0.010039329528808594, 0.010370254516601562, 0.010701179504394531, 0.0110321044921875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 7.0, 11.0, 10.0, 15.0, 15.0, 17.0, 24.0, 26.0, 41.0, 45.0, 85.0, 107.0, 188.0, 402.0, 2282.0, 83044.0, 945187.0, 15224.0, 1019.0, 297.0, 135.0, 83.0, 61.0, 52.0, 44.0, 27.0, 25.0, 16.0, 15.0, 6.0, 8.0, 8.0, 8.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.24951171875, -0.2420177459716797, -0.23452377319335938, -0.22702980041503906, -0.21953582763671875, -0.21204185485839844, -0.20454788208007812, -0.1970539093017578, -0.1895599365234375, -0.1820659637451172, -0.17457199096679688, -0.16707801818847656, -0.15958404541015625, -0.15209007263183594, -0.14459609985351562, -0.1371021270751953, -0.129608154296875, -0.12211418151855469, -0.11462020874023438, -0.10712623596191406, -0.09963226318359375, -0.09213829040527344, -0.08464431762695312, -0.07715034484863281, -0.0696563720703125, -0.06216239929199219, -0.054668426513671875, -0.04717445373535156, -0.03968048095703125, -0.03218650817871094, -0.024692535400390625, -0.017198562622070312, -0.00970458984375, -0.0022106170654296875, 0.005283355712890625, 0.012777328491210938, 0.02027130126953125, 0.027765274047851562, 0.035259246826171875, 0.04275321960449219, 0.0502471923828125, 0.05774116516113281, 0.06523513793945312, 0.07272911071777344, 0.08022308349609375, 0.08771705627441406, 0.09521102905273438, 0.10270500183105469, 0.110198974609375, 0.11769294738769531, 0.12518692016601562, 0.13268089294433594, 0.14017486572265625, 0.14766883850097656, 0.15516281127929688, 0.1626567840576172, 0.1701507568359375, 0.1776447296142578, 0.18513870239257812, 0.19263267517089844, 0.20012664794921875, 0.20762062072753906, 0.21511459350585938, 0.2226085662841797, 0.2301025390625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 20.0, 37.0, 45.0, 116.0, 246.0, 197.0, 147.0, 67.0, 47.0, 17.0, 21.0, 14.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03400374948978424, -0.03282804414629936, -0.031652338802814484, -0.030476629734039307, -0.029300924390554428, -0.02812521904706955, -0.026949511840939522, -0.025773804634809494, -0.024598099291324615, -0.023422393947839737, -0.02224668674170971, -0.02107097953557968, -0.019895274192094803, -0.018719568848609924, -0.017543861642479897, -0.01636815443634987, -0.01519244909286499, -0.014016742818057537, -0.012841036543250084, -0.01166533026844263, -0.010489623993635178, -0.009313917718827724, -0.008138211444020271, -0.006962505169212818, -0.005786798894405365, -0.004611092619597912, -0.0034353863447904587, -0.0022596800699830055, -0.0010839737951755524, 9.173247963190079e-05, 0.001267438754439354, 0.002443145029246807, 0.0036188513040542603, 0.004794557578861713, 0.0059702638536691666, 0.00714597012847662, 0.008321676403284073, 0.009497382678091526, 0.01067308895289898, 0.011848795227706432, 0.013024501502513885, 0.014200207777321339, 0.015375914052128792, 0.01655162125825882, 0.017727326601743698, 0.018903031945228577, 0.020078739151358604, 0.021254446357488632, 0.02243015170097351, 0.02360585704445839, 0.024781564250588417, 0.025957271456718445, 0.027132976800203323, 0.028308682143688202, 0.02948438934981823, 0.030660096555948257, 0.031835801899433136, 0.033011507242918015, 0.03418721258640289, 0.03536292165517807, 0.03653862699866295, 0.03771433234214783, 0.038890041410923004, 0.04006574675440788, 0.04124145209789276]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 6.0, 6.0, 9.0, 7.0, 13.0, 15.0, 13.0, 28.0, 14.0, 29.0, 24.0, 29.0, 27.0, 32.0, 33.0, 32.0, 42.0, 34.0, 35.0, 46.0, 42.0, 37.0, 31.0, 43.0, 35.0, 36.0, 42.0, 34.0, 28.0, 23.0, 25.0, 33.0, 19.0, 13.0, 22.0, 8.0, 14.0, 10.0, 8.0, 6.0, 1.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.006516158580780029, -0.0063246507197618484, -0.006133142858743668, -0.005941634997725487, -0.005750127136707306, -0.005558619275689125, -0.005367111414670944, -0.005175603553652763, -0.0049840956926345825, -0.004792587831616402, -0.004601079970598221, -0.00440957210958004, -0.004218064248561859, -0.004026556387543678, -0.0038350485265254974, -0.0036435406655073166, -0.0034520328044891357, -0.003260524943470955, -0.003069017082452774, -0.002877509221434593, -0.0026860013604164124, -0.0024944934993982315, -0.0023029856383800507, -0.00211147777736187, -0.001919969916343689, -0.0017284620553255081, -0.0015369541943073273, -0.0013454463332891464, -0.0011539384722709656, -0.0009624306112527847, -0.0007709227502346039, -0.000579414889216423, -0.0003879070281982422, -0.00019639916718006134, -4.891306161880493e-06, 0.00018661655485630035, 0.0003781244158744812, 0.000569632276892662, 0.0007611401379108429, 0.0009526479989290237, 0.0011441558599472046, 0.0013356637209653854, 0.0015271715819835663, 0.0017186794430017471, 0.001910187304019928, 0.002101695165038109, 0.0022932030260562897, 0.0024847108870744705, 0.0026762187480926514, 0.002867726609110832, 0.003059234470129013, 0.003250742331147194, 0.0034422501921653748, 0.0036337580531835556, 0.0038252659142017365, 0.004016773775219917, 0.004208281636238098, 0.004399789497256279, 0.00459129735827446, 0.004782805219292641, 0.0049743130803108215, 0.005165820941329002, 0.005357328802347183, 0.005548836663365364, 0.005740344524383545]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 8.0, 9.0, 6.0, 15.0, 17.0, 21.0, 17.0, 23.0, 25.0, 23.0, 26.0, 27.0, 37.0, 27.0, 40.0, 45.0, 37.0, 38.0, 43.0, 47.0, 44.0, 37.0, 51.0, 36.0, 28.0, 47.0, 24.0, 24.0, 22.0, 33.0, 24.0, 13.0, 15.0, 10.0, 15.0, 12.0, 6.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.63433837890625, -5.4639892578125, -5.29364013671875, -5.123291015625, -4.95294189453125, -4.7825927734375, -4.61224365234375, -4.44189453125, -4.27154541015625, -4.1011962890625, -3.93084716796875, -3.760498046875, -3.59014892578125, -3.4197998046875, -3.24945068359375, -3.0791015625, -2.90875244140625, -2.7384033203125, -2.56805419921875, -2.397705078125, -2.22735595703125, -2.0570068359375, -1.88665771484375, -1.71630859375, -1.54595947265625, -1.3756103515625, -1.20526123046875, -1.034912109375, -0.86456298828125, -0.6942138671875, -0.52386474609375, -0.353515625, -0.18316650390625, -0.0128173828125, 0.15753173828125, 0.327880859375, 0.49822998046875, 0.6685791015625, 0.83892822265625, 1.00927734375, 1.17962646484375, 1.3499755859375, 1.52032470703125, 1.690673828125, 1.86102294921875, 2.0313720703125, 2.20172119140625, 2.3720703125, 2.54241943359375, 2.7127685546875, 2.88311767578125, 3.053466796875, 3.22381591796875, 3.3941650390625, 3.56451416015625, 3.73486328125, 3.90521240234375, 4.0755615234375, 4.24591064453125, 4.416259765625, 4.58660888671875, 4.7569580078125, 4.92730712890625, 5.09765625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 5.0, 4.0, 6.0, 15.0, 15.0, 22.0, 31.0, 53.0, 75.0, 106.0, 158.0, 287.0, 532.0, 981.0, 1867.0, 3634.0, 6995.0, 13840.0, 26527.0, 52014.0, 111177.0, 256417.0, 300641.0, 142946.0, 63591.0, 32034.0, 16688.0, 8543.0, 4320.0, 2288.0, 1178.0, 621.0, 370.0, 207.0, 126.0, 68.0, 38.0, 39.0, 28.0, 20.0, 8.0, 10.0, 7.0, 7.0, 6.0, 5.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.9190673828125, -5.740478515625, -5.5618896484375, -5.38330078125, -5.2047119140625, -5.026123046875, -4.8475341796875, -4.6689453125, -4.4903564453125, -4.311767578125, -4.1331787109375, -3.95458984375, -3.7760009765625, -3.597412109375, -3.4188232421875, -3.240234375, -3.0616455078125, -2.883056640625, -2.7044677734375, -2.52587890625, -2.3472900390625, -2.168701171875, -1.9901123046875, -1.8115234375, -1.6329345703125, -1.454345703125, -1.2757568359375, -1.09716796875, -0.9185791015625, -0.739990234375, -0.5614013671875, -0.3828125, -0.2042236328125, -0.025634765625, 0.1529541015625, 0.33154296875, 0.5101318359375, 0.688720703125, 0.8673095703125, 1.0458984375, 1.2244873046875, 1.403076171875, 1.5816650390625, 1.76025390625, 1.9388427734375, 2.117431640625, 2.2960205078125, 2.474609375, 2.6531982421875, 2.831787109375, 3.0103759765625, 3.18896484375, 3.3675537109375, 3.546142578125, 3.7247314453125, 3.9033203125, 4.0819091796875, 4.260498046875, 4.4390869140625, 4.61767578125, 4.7962646484375, 4.974853515625, 5.1534423828125, 5.33203125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 3.0, 5.0, 9.0, 7.0, 5.0, 7.0, 13.0, 10.0, 22.0, 24.0, 26.0, 18.0, 24.0, 28.0, 37.0, 45.0, 48.0, 49.0, 69.0, 112.0, 212.0, 1385.0, 285.0, 117.0, 73.0, 67.0, 47.0, 39.0, 38.0, 39.0, 25.0, 20.0, 23.0, 16.0, 17.0, 15.0, 9.0, 9.0, 17.0, 6.0, 10.0, 3.0, 8.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.32666015625, -15.7939453125, -15.26123046875, -14.728515625, -14.19580078125, -13.6630859375, -13.13037109375, -12.59765625, -12.06494140625, -11.5322265625, -10.99951171875, -10.466796875, -9.93408203125, -9.4013671875, -8.86865234375, -8.3359375, -7.80322265625, -7.2705078125, -6.73779296875, -6.205078125, -5.67236328125, -5.1396484375, -4.60693359375, -4.07421875, -3.54150390625, -3.0087890625, -2.47607421875, -1.943359375, -1.41064453125, -0.8779296875, -0.34521484375, 0.1875, 0.72021484375, 1.2529296875, 1.78564453125, 2.318359375, 2.85107421875, 3.3837890625, 3.91650390625, 4.44921875, 4.98193359375, 5.5146484375, 6.04736328125, 6.580078125, 7.11279296875, 7.6455078125, 8.17822265625, 8.7109375, 9.24365234375, 9.7763671875, 10.30908203125, 10.841796875, 11.37451171875, 11.9072265625, 12.43994140625, 12.97265625, 13.50537109375, 14.0380859375, 14.57080078125, 15.103515625, 15.63623046875, 16.1689453125, 16.70166015625, 17.234375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 4.0, 4.0, 8.0, 6.0, 6.0, 14.0, 21.0, 22.0, 32.0, 46.0, 43.0, 71.0, 103.0, 135.0, 238.0, 369.0, 700.0, 2378.0, 72954.0, 3006013.0, 58616.0, 2166.0, 618.0, 370.0, 215.0, 145.0, 99.0, 74.0, 63.0, 41.0, 24.0, 17.0, 21.0, 15.0, 13.0, 7.0, 10.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.65625, -40.37353515625, -39.0908203125, -37.80810546875, -36.525390625, -35.24267578125, -33.9599609375, -32.67724609375, -31.39453125, -30.11181640625, -28.8291015625, -27.54638671875, -26.263671875, -24.98095703125, -23.6982421875, -22.41552734375, -21.1328125, -19.85009765625, -18.5673828125, -17.28466796875, -16.001953125, -14.71923828125, -13.4365234375, -12.15380859375, -10.87109375, -9.58837890625, -8.3056640625, -7.02294921875, -5.740234375, -4.45751953125, -3.1748046875, -1.89208984375, -0.609375, 0.67333984375, 1.9560546875, 3.23876953125, 4.521484375, 5.80419921875, 7.0869140625, 8.36962890625, 9.65234375, 10.93505859375, 12.2177734375, 13.50048828125, 14.783203125, 16.06591796875, 17.3486328125, 18.63134765625, 19.9140625, 21.19677734375, 22.4794921875, 23.76220703125, 25.044921875, 26.32763671875, 27.6103515625, 28.89306640625, 30.17578125, 31.45849609375, 32.7412109375, 34.02392578125, 35.306640625, 36.58935546875, 37.8720703125, 39.15478515625, 40.4375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 40.0, 964.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-681.158935546875, -669.08349609375, -657.008056640625, -644.9326171875, -632.857177734375, -620.78173828125, -608.706298828125, -596.630859375, -584.555419921875, -572.47998046875, -560.404541015625, -548.3291015625, -536.253662109375, -524.17822265625, -512.102783203125, -500.02734375, -487.9518737792969, -475.8764343261719, -463.8009948730469, -451.7255554199219, -439.6501159667969, -427.5746765136719, -415.49920654296875, -403.42376708984375, -391.34832763671875, -379.27288818359375, -367.19744873046875, -355.12200927734375, -343.04656982421875, -330.97113037109375, -318.89569091796875, -306.82025146484375, -294.74481201171875, -282.66937255859375, -270.59393310546875, -258.51849365234375, -246.44305419921875, -234.36761474609375, -222.2921600341797, -210.2167205810547, -198.14129638671875, -186.06585693359375, -173.99041748046875, -161.91497802734375, -149.83953857421875, -137.76409912109375, -125.68864440917969, -113.61320495605469, -101.53776550292969, -89.46232604980469, -77.38688659667969, -65.31143951416016, -53.236000061035156, -41.160560607910156, -29.085113525390625, -17.009674072265625, -4.934234619140625, 7.141206741333008, 19.21664810180664, 31.292091369628906, 43.367530822753906, 55.442970275878906, 67.51841735839844, 79.59385681152344, 91.66929626464844]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 11.0, 9.0, 18.0, 18.0, 23.0, 23.0, 34.0, 37.0, 51.0, 48.0, 53.0, 54.0, 56.0, 56.0, 56.0, 61.0, 65.0, 45.0, 37.0, 42.0, 24.0, 34.0, 17.0, 32.0, 25.0, 16.0, 18.0, 12.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.01895523071289, -61.288143157958984, -59.557334899902344, -57.82652282714844, -56.09571075439453, -54.364898681640625, -52.634090423583984, -50.90327835083008, -49.17247009277344, -47.44165802001953, -45.71084976196289, -43.980037689208984, -42.24922561645508, -40.51841735839844, -38.78760528564453, -37.056793212890625, -35.32598114013672, -33.59516906738281, -31.86435890197754, -30.133548736572266, -28.40273666381836, -26.671926498413086, -24.941116333007812, -23.210304260253906, -21.479494094848633, -19.74868392944336, -18.017871856689453, -16.28706169128418, -14.55625057220459, -12.825439453125, -11.094629287719727, -9.363818168640137, -7.633003234863281, -5.902192115783691, -4.17138147354126, -2.440570831298828, -0.7097597122192383, 1.0210514068603516, 2.751861572265625, 4.482672691345215, 6.213483810424805, 7.9442949295043945, 9.675106048583984, 11.405916213989258, 13.136727333068848, 14.867538452148438, 16.59834861755371, 18.329158782958984, 20.05997085571289, 21.790781021118164, 23.52159309387207, 25.252403259277344, 26.98321533203125, 28.714025497436523, 30.444835662841797, 32.1756477355957, 33.906455993652344, 35.63726806640625, 37.36807632446289, 39.0988883972168, 40.8297004699707, 42.560508728027344, 44.29132080078125, 46.022132873535156, 47.75294494628906]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 3.0, 7.0, 2.0, 6.0, 13.0, 10.0, 15.0, 18.0, 19.0, 20.0, 25.0, 23.0, 20.0, 28.0, 42.0, 34.0, 32.0, 32.0, 39.0, 36.0, 37.0, 44.0, 45.0, 39.0, 37.0, 35.0, 31.0, 29.0, 29.0, 28.0, 26.0, 29.0, 33.0, 20.0, 18.0, 14.0, 15.0, 12.0, 4.0, 12.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0], "bins": [-6.0078125, -5.833251953125, -5.65869140625, -5.484130859375, -5.3095703125, -5.135009765625, -4.96044921875, -4.785888671875, -4.611328125, -4.436767578125, -4.26220703125, -4.087646484375, -3.9130859375, -3.738525390625, -3.56396484375, -3.389404296875, -3.21484375, -3.040283203125, -2.86572265625, -2.691162109375, -2.5166015625, -2.342041015625, -2.16748046875, -1.992919921875, -1.818359375, -1.643798828125, -1.46923828125, -1.294677734375, -1.1201171875, -0.945556640625, -0.77099609375, -0.596435546875, -0.421875, -0.247314453125, -0.07275390625, 0.101806640625, 0.2763671875, 0.450927734375, 0.62548828125, 0.800048828125, 0.974609375, 1.149169921875, 1.32373046875, 1.498291015625, 1.6728515625, 1.847412109375, 2.02197265625, 2.196533203125, 2.37109375, 2.545654296875, 2.72021484375, 2.894775390625, 3.0693359375, 3.243896484375, 3.41845703125, 3.593017578125, 3.767578125, 3.942138671875, 4.11669921875, 4.291259765625, 4.4658203125, 4.640380859375, 4.81494140625, 4.989501953125, 5.1640625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 6.0, 4.0, 5.0, 4.0, 4.0, 16.0, 8.0, 23.0, 10.0, 13.0, 25.0, 33.0, 26.0, 42.0, 46.0, 76.0, 102.0, 182.0, 560.0, 2763.0, 20910.0, 230263.0, 1875420.0, 1816799.0, 222714.0, 20472.0, 2652.0, 502.0, 157.0, 87.0, 64.0, 52.0, 49.0, 34.0, 29.0, 24.0, 16.0, 16.0, 14.0, 14.0, 7.0, 7.0, 1.0, 8.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0], "bins": [-13.5390625, -13.1407470703125, -12.742431640625, -12.3441162109375, -11.94580078125, -11.5474853515625, -11.149169921875, -10.7508544921875, -10.3525390625, -9.9542236328125, -9.555908203125, -9.1575927734375, -8.75927734375, -8.3609619140625, -7.962646484375, -7.5643310546875, -7.166015625, -6.7677001953125, -6.369384765625, -5.9710693359375, -5.57275390625, -5.1744384765625, -4.776123046875, -4.3778076171875, -3.9794921875, -3.5811767578125, -3.182861328125, -2.7845458984375, -2.38623046875, -1.9879150390625, -1.589599609375, -1.1912841796875, -0.79296875, -0.3946533203125, 0.003662109375, 0.4019775390625, 0.80029296875, 1.1986083984375, 1.596923828125, 1.9952392578125, 2.3935546875, 2.7918701171875, 3.190185546875, 3.5885009765625, 3.98681640625, 4.3851318359375, 4.783447265625, 5.1817626953125, 5.580078125, 5.9783935546875, 6.376708984375, 6.7750244140625, 7.17333984375, 7.5716552734375, 7.969970703125, 8.3682861328125, 8.7666015625, 9.1649169921875, 9.563232421875, 9.9615478515625, 10.35986328125, 10.7581787109375, 11.156494140625, 11.5548095703125, 11.953125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 14.0, 21.0, 23.0, 35.0, 45.0, 65.0, 88.0, 151.0, 199.0, 302.0, 432.0, 506.0, 537.0, 494.0, 372.0, 240.0, 156.0, 110.0, 85.0, 58.0, 46.0, 23.0, 18.0, 8.0, 13.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.046875, -15.667236328125, -15.28759765625, -14.907958984375, -14.5283203125, -14.148681640625, -13.76904296875, -13.389404296875, -13.009765625, -12.630126953125, -12.25048828125, -11.870849609375, -11.4912109375, -11.111572265625, -10.73193359375, -10.352294921875, -9.97265625, -9.593017578125, -9.21337890625, -8.833740234375, -8.4541015625, -8.074462890625, -7.69482421875, -7.315185546875, -6.935546875, -6.555908203125, -6.17626953125, -5.796630859375, -5.4169921875, -5.037353515625, -4.65771484375, -4.278076171875, -3.8984375, -3.518798828125, -3.13916015625, -2.759521484375, -2.3798828125, -2.000244140625, -1.62060546875, -1.240966796875, -0.861328125, -0.481689453125, -0.10205078125, 0.277587890625, 0.6572265625, 1.036865234375, 1.41650390625, 1.796142578125, 2.17578125, 2.555419921875, 2.93505859375, 3.314697265625, 3.6943359375, 4.073974609375, 4.45361328125, 4.833251953125, 5.212890625, 5.592529296875, 5.97216796875, 6.351806640625, 6.7314453125, 7.111083984375, 7.49072265625, 7.870361328125, 8.25]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 10.0, 9.0, 15.0, 18.0, 40.0, 47.0, 86.0, 104.0, 133.0, 268.0, 457.0, 951.0, 6485.0, 509116.0, 3615351.0, 57540.0, 1998.0, 674.0, 335.0, 217.0, 137.0, 79.0, 69.0, 44.0, 27.0, 14.0, 20.0, 11.0, 5.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.53125, -26.3486328125, -25.166015625, -23.9833984375, -22.80078125, -21.6181640625, -20.435546875, -19.2529296875, -18.0703125, -16.8876953125, -15.705078125, -14.5224609375, -13.33984375, -12.1572265625, -10.974609375, -9.7919921875, -8.609375, -7.4267578125, -6.244140625, -5.0615234375, -3.87890625, -2.6962890625, -1.513671875, -0.3310546875, 0.8515625, 2.0341796875, 3.216796875, 4.3994140625, 5.58203125, 6.7646484375, 7.947265625, 9.1298828125, 10.3125, 11.4951171875, 12.677734375, 13.8603515625, 15.04296875, 16.2255859375, 17.408203125, 18.5908203125, 19.7734375, 20.9560546875, 22.138671875, 23.3212890625, 24.50390625, 25.6865234375, 26.869140625, 28.0517578125, 29.234375, 30.4169921875, 31.599609375, 32.7822265625, 33.96484375, 35.1474609375, 36.330078125, 37.5126953125, 38.6953125, 39.8779296875, 41.060546875, 42.2431640625, 43.42578125, 44.6083984375, 45.791015625, 46.9736328125, 48.15625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 13.0, 69.0, 311.0, 419.0, 171.0, 32.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.78282165527344, -182.75057983398438, -177.71835327148438, -172.6861114501953, -167.65386962890625, -162.62164306640625, -157.5894012451172, -152.55715942382812, -147.52493286132812, -142.49269104003906, -137.46046447753906, -132.42822265625, -127.39598083496094, -122.3637466430664, -117.33151245117188, -112.29927062988281, -107.26702880859375, -102.23479461669922, -97.20255279541016, -92.17031860351562, -87.13807678222656, -82.10584259033203, -77.0736083984375, -72.04136657714844, -67.0091323852539, -61.97689437866211, -56.94465637207031, -51.91242218017578, -46.880184173583984, -41.84794616699219, -36.815711975097656, -31.78347396850586, -26.751220703125, -21.718982696533203, -16.68674659729004, -11.654509544372559, -6.622272491455078, -1.5900344848632812, 3.442201614379883, 8.474437713623047, 13.506675720214844, 18.53891372680664, 23.571149826049805, 28.60338592529297, 33.635623931884766, 38.66786193847656, 43.700096130371094, 48.73233413696289, 53.76457214355469, 58.796810150146484, 63.82904815673828, 68.86128234863281, 73.89352416992188, 78.9257583618164, 83.95799255371094, 88.990234375, 94.02246856689453, 99.05470275878906, 104.08694458007812, 109.11917877197266, 114.15141296386719, 119.18365478515625, 124.21588897705078, 129.2481231689453, 134.28036499023438]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 2.0, 7.0, 6.0, 7.0, 9.0, 11.0, 10.0, 16.0, 14.0, 15.0, 18.0, 19.0, 22.0, 41.0, 26.0, 25.0, 38.0, 31.0, 37.0, 28.0, 34.0, 39.0, 43.0, 38.0, 29.0, 39.0, 35.0, 42.0, 30.0, 24.0, 33.0, 30.0, 19.0, 28.0, 19.0, 18.0, 18.0, 15.0, 18.0, 17.0, 14.0, 8.0, 11.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.55781555175781, -32.573326110839844, -31.588838577270508, -30.60434913635254, -29.61985969543457, -28.635372161865234, -27.650882720947266, -26.666393280029297, -25.681903839111328, -24.69741439819336, -23.712926864624023, -22.728437423706055, -21.743947982788086, -20.75946044921875, -19.77497100830078, -18.790481567382812, -17.805994033813477, -16.821504592895508, -15.837016105651855, -14.852527618408203, -13.868038177490234, -12.883549690246582, -11.89906120300293, -10.914571762084961, -9.930083274841309, -8.945594787597656, -7.9611053466796875, -6.976616859436035, -5.992127895355225, -5.007638931274414, -4.023150444030762, -3.038661479949951, -2.0541725158691406, -1.0696836709976196, -0.08519482612609863, 0.8992938995361328, 1.8837828636169434, 2.868271827697754, 3.8527603149414062, 4.837249279022217, 5.821738243103027, 6.806227207183838, 7.790716171264648, 8.7752046585083, 9.759693145751953, 10.744182586669922, 11.728671073913574, 12.713159561157227, 13.697649002075195, 14.682137489318848, 15.666626930236816, 16.65111541748047, 17.635604858398438, 18.620094299316406, 19.604581832885742, 20.58907127380371, 21.573558807373047, 22.558048248291016, 23.54253578186035, 24.52702522277832, 25.51151466369629, 26.496002197265625, 27.480491638183594, 28.464981079101562, 29.44947052001953]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 3.0, 4.0, 6.0, 5.0, 12.0, 12.0, 13.0, 9.0, 14.0, 24.0, 33.0, 34.0, 32.0, 35.0, 41.0, 37.0, 40.0, 40.0, 41.0, 53.0, 37.0, 44.0, 38.0, 43.0, 42.0, 38.0, 31.0, 25.0, 34.0, 38.0, 29.0, 17.0, 18.0, 12.0, 20.0, 11.0, 6.0, 10.0, 1.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.556884765625, -6.36376953125, -6.170654296875, -5.9775390625, -5.784423828125, -5.59130859375, -5.398193359375, -5.205078125, -5.011962890625, -4.81884765625, -4.625732421875, -4.4326171875, -4.239501953125, -4.04638671875, -3.853271484375, -3.66015625, -3.467041015625, -3.27392578125, -3.080810546875, -2.8876953125, -2.694580078125, -2.50146484375, -2.308349609375, -2.115234375, -1.922119140625, -1.72900390625, -1.535888671875, -1.3427734375, -1.149658203125, -0.95654296875, -0.763427734375, -0.5703125, -0.377197265625, -0.18408203125, 0.009033203125, 0.2021484375, 0.395263671875, 0.58837890625, 0.781494140625, 0.974609375, 1.167724609375, 1.36083984375, 1.553955078125, 1.7470703125, 1.940185546875, 2.13330078125, 2.326416015625, 2.51953125, 2.712646484375, 2.90576171875, 3.098876953125, 3.2919921875, 3.485107421875, 3.67822265625, 3.871337890625, 4.064453125, 4.257568359375, 4.45068359375, 4.643798828125, 4.8369140625, 5.030029296875, 5.22314453125, 5.416259765625, 5.609375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 6.0, 3.0, 4.0, 16.0, 15.0, 32.0, 38.0, 61.0, 99.0, 129.0, 213.0, 310.0, 412.0, 551.0, 860.0, 1176.0, 1629.0, 2470.0, 3548.0, 5186.0, 7425.0, 10640.0, 15664.0, 22558.0, 33032.0, 47607.0, 68788.0, 94663.0, 121602.0, 138803.0, 127879.0, 101207.0, 74268.0, 52335.0, 36157.0, 24609.0, 16737.0, 11753.0, 8069.0, 5497.0, 3771.0, 2746.0, 1864.0, 1229.0, 899.0, 606.0, 437.0, 322.0, 225.0, 144.0, 88.0, 66.0, 38.0, 26.0, 28.0, 14.0, 10.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.350341796875, -0.3392601013183594, -0.32817840576171875, -0.3170967102050781, -0.3060150146484375, -0.2949333190917969, -0.28385162353515625, -0.2727699279785156, -0.261688232421875, -0.2506065368652344, -0.23952484130859375, -0.22844314575195312, -0.2173614501953125, -0.20627975463867188, -0.19519805908203125, -0.18411636352539062, -0.17303466796875, -0.16195297241210938, -0.15087127685546875, -0.13978958129882812, -0.1287078857421875, -0.11762619018554688, -0.10654449462890625, -0.09546279907226562, -0.084381103515625, -0.07329940795898438, -0.06221771240234375, -0.051136016845703125, -0.0400543212890625, -0.028972625732421875, -0.01789093017578125, -0.006809234619140625, 0.0042724609375, 0.015354156494140625, 0.02643585205078125, 0.037517547607421875, 0.0485992431640625, 0.059680938720703125, 0.07076263427734375, 0.08184432983398438, 0.092926025390625, 0.10400772094726562, 0.11508941650390625, 0.12617111206054688, 0.1372528076171875, 0.14833450317382812, 0.15941619873046875, 0.17049789428710938, 0.18157958984375, 0.19266128540039062, 0.20374298095703125, 0.21482467651367188, 0.2259063720703125, 0.23698806762695312, 0.24806976318359375, 0.2591514587402344, 0.270233154296875, 0.2813148498535156, 0.29239654541015625, 0.3034782409667969, 0.3145599365234375, 0.3256416320800781, 0.33672332763671875, 0.3478050231933594, 0.35888671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 6.0, 12.0, 3.0, 5.0, 12.0, 13.0, 15.0, 13.0, 18.0, 21.0, 23.0, 20.0, 23.0, 25.0, 26.0, 17.0, 34.0, 30.0, 39.0, 31.0, 38.0, 45.0, 1069.0, 30.0, 35.0, 37.0, 28.0, 32.0, 31.0, 33.0, 26.0, 32.0, 26.0, 24.0, 26.0, 23.0, 15.0, 14.0, 12.0, 15.0, 8.0, 7.0, 4.0, 7.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05859375, -2.956634521484375, -2.85467529296875, -2.752716064453125, -2.6507568359375, -2.548797607421875, -2.44683837890625, -2.344879150390625, -2.242919921875, -2.140960693359375, -2.03900146484375, -1.937042236328125, -1.8350830078125, -1.733123779296875, -1.63116455078125, -1.529205322265625, -1.42724609375, -1.325286865234375, -1.22332763671875, -1.121368408203125, -1.0194091796875, -0.917449951171875, -0.81549072265625, -0.713531494140625, -0.611572265625, -0.509613037109375, -0.40765380859375, -0.305694580078125, -0.2037353515625, -0.101776123046875, 0.00018310546875, 0.102142333984375, 0.2041015625, 0.306060791015625, 0.40802001953125, 0.509979248046875, 0.6119384765625, 0.713897705078125, 0.81585693359375, 0.917816162109375, 1.019775390625, 1.121734619140625, 1.22369384765625, 1.325653076171875, 1.4276123046875, 1.529571533203125, 1.63153076171875, 1.733489990234375, 1.83544921875, 1.937408447265625, 2.03936767578125, 2.141326904296875, 2.2432861328125, 2.345245361328125, 2.44720458984375, 2.549163818359375, 2.651123046875, 2.753082275390625, 2.85504150390625, 2.957000732421875, 3.0589599609375, 3.160919189453125, 3.26287841796875, 3.364837646484375, 3.466796875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 10.0, 30.0, 39.0, 62.0, 108.0, 171.0, 209.0, 370.0, 554.0, 914.0, 1514.0, 2469.0, 4297.0, 7191.0, 12087.0, 20107.0, 33980.0, 55968.0, 89235.0, 133033.0, 1019812.0, 364362.0, 129748.0, 86011.0, 54051.0, 32731.0, 19624.0, 11415.0, 6886.0, 4021.0, 2379.0, 1408.0, 892.0, 532.0, 318.0, 213.0, 144.0, 89.0, 51.0, 30.0, 20.0, 10.0, 15.0, 5.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.297607421875, -0.28733062744140625, -0.2770538330078125, -0.26677703857421875, -0.256500244140625, -0.24622344970703125, -0.2359466552734375, -0.22566986083984375, -0.21539306640625, -0.20511627197265625, -0.1948394775390625, -0.18456268310546875, -0.174285888671875, -0.16400909423828125, -0.1537322998046875, -0.14345550537109375, -0.1331787109375, -0.12290191650390625, -0.1126251220703125, -0.10234832763671875, -0.092071533203125, -0.08179473876953125, -0.0715179443359375, -0.06124114990234375, -0.05096435546875, -0.04068756103515625, -0.0304107666015625, -0.02013397216796875, -0.009857177734375, 0.00041961669921875, 0.0106964111328125, 0.02097320556640625, 0.03125, 0.04152679443359375, 0.0518035888671875, 0.06208038330078125, 0.072357177734375, 0.08263397216796875, 0.0929107666015625, 0.10318756103515625, 0.11346435546875, 0.12374114990234375, 0.1340179443359375, 0.14429473876953125, 0.154571533203125, 0.16484832763671875, 0.1751251220703125, 0.18540191650390625, 0.1956787109375, 0.20595550537109375, 0.2162322998046875, 0.22650909423828125, 0.236785888671875, 0.24706268310546875, 0.2573394775390625, 0.26761627197265625, 0.27789306640625, 0.28816986083984375, 0.2984466552734375, 0.30872344970703125, 0.319000244140625, 0.32927703857421875, 0.3395538330078125, 0.34983062744140625, 0.360107421875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 12.0, 15.0, 35.0, 41.0, 54.0, 64.0, 116.0, 226.0, 158.0, 96.0, 61.0, 42.0, 24.0, 13.0, 11.0, 9.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01398468017578125, -0.013581275939941406, -0.013177871704101562, -0.012774467468261719, -0.012371063232421875, -0.011967658996582031, -0.011564254760742188, -0.011160850524902344, -0.0107574462890625, -0.010354042053222656, -0.009950637817382812, -0.009547233581542969, -0.009143829345703125, -0.008740425109863281, -0.008337020874023438, -0.007933616638183594, -0.00753021240234375, -0.007126808166503906, -0.0067234039306640625, -0.006319999694824219, -0.005916595458984375, -0.005513191223144531, -0.0051097869873046875, -0.004706382751464844, -0.004302978515625, -0.0038995742797851562, -0.0034961700439453125, -0.0030927658081054688, -0.002689361572265625, -0.0022859573364257812, -0.0018825531005859375, -0.0014791488647460938, -0.00107574462890625, -0.0006723403930664062, -0.0002689361572265625, 0.00013446807861328125, 0.000537872314453125, 0.0009412765502929688, 0.0013446807861328125, 0.0017480850219726562, 0.0021514892578125, 0.0025548934936523438, 0.0029582977294921875, 0.0033617019653320312, 0.003765106201171875, 0.004168510437011719, 0.0045719146728515625, 0.004975318908691406, 0.00537872314453125, 0.005782127380371094, 0.0061855316162109375, 0.006588935852050781, 0.006992340087890625, 0.007395744323730469, 0.0077991485595703125, 0.008202552795410156, 0.00860595703125, 0.009009361267089844, 0.009412765502929688, 0.009816169738769531, 0.010219573974609375, 0.010622978210449219, 0.011026382446289062, 0.011429786682128906, 0.01183319091796875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 10.0, 16.0, 20.0, 19.0, 46.0, 73.0, 167.0, 601.0, 25136.0, 1015061.0, 6689.0, 366.0, 141.0, 75.0, 45.0, 28.0, 22.0, 11.0, 6.0, 4.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25146484375, -0.2429046630859375, -0.234344482421875, -0.2257843017578125, -0.21722412109375, -0.2086639404296875, -0.200103759765625, -0.1915435791015625, -0.1829833984375, -0.1744232177734375, -0.165863037109375, -0.1573028564453125, -0.14874267578125, -0.1401824951171875, -0.131622314453125, -0.1230621337890625, -0.114501953125, -0.1059417724609375, -0.097381591796875, -0.0888214111328125, -0.08026123046875, -0.0717010498046875, -0.063140869140625, -0.0545806884765625, -0.0460205078125, -0.0374603271484375, -0.028900146484375, -0.0203399658203125, -0.01177978515625, -0.0032196044921875, 0.005340576171875, 0.0139007568359375, 0.0224609375, 0.0310211181640625, 0.039581298828125, 0.0481414794921875, 0.05670166015625, 0.0652618408203125, 0.073822021484375, 0.0823822021484375, 0.0909423828125, 0.0995025634765625, 0.108062744140625, 0.1166229248046875, 0.12518310546875, 0.1337432861328125, 0.142303466796875, 0.1508636474609375, 0.159423828125, 0.1679840087890625, 0.176544189453125, 0.1851043701171875, 0.19366455078125, 0.2022247314453125, 0.210784912109375, 0.2193450927734375, 0.2279052734375, 0.2364654541015625, 0.245025634765625, 0.2535858154296875, 0.26214599609375, 0.2707061767578125, 0.279266357421875, 0.2878265380859375, 0.29638671875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 12.0, 79.0, 468.0, 347.0, 69.0, 26.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.10467356443405151, -0.10253288596868515, -0.10039220750331879, -0.09825153648853302, -0.09611085802316666, -0.09397017955780029, -0.09182950109243393, -0.08968882262706757, -0.0875481441617012, -0.08540746569633484, -0.08326678723096848, -0.08112610876560211, -0.07898543775081635, -0.07684475928544998, -0.07470408082008362, -0.07256340235471725, -0.07042272388935089, -0.06828204542398453, -0.06614136695861816, -0.0640006959438324, -0.061860013753175735, -0.05971933901309967, -0.05757866054773331, -0.05543798208236694, -0.05329731106758118, -0.05115663260221481, -0.04901595786213875, -0.046875279396772385, -0.04473460093140602, -0.042593926191329956, -0.04045324772596359, -0.03831256926059723, -0.036171890795230865, -0.0340312123298645, -0.03189053758978844, -0.029749859124422073, -0.02760918065905571, -0.025468504056334496, -0.02332782745361328, -0.021187148988246918, -0.019046472385525703, -0.01690579578280449, -0.014765117317438126, -0.012624440714716911, -0.010483763180673122, -0.008343085646629333, -0.006202409043908119, -0.00406173150986433, -0.0019210539758205414, 0.00021962332539260387, 0.002360300626605749, 0.004500977694988251, 0.00664165522903204, 0.008782332763075829, 0.010923009365797043, 0.013063686899840832, 0.01520436443388462, 0.017345041036605835, 0.0194857195019722, 0.021626396104693413, 0.023767072707414627, 0.02590775117278099, 0.028048427775502205, 0.03018910437822342, 0.03232978284358978]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 10.0, 11.0, 10.0, 8.0, 10.0, 15.0, 17.0, 26.0, 24.0, 25.0, 29.0, 31.0, 25.0, 38.0, 30.0, 49.0, 45.0, 39.0, 36.0, 51.0, 34.0, 47.0, 44.0, 37.0, 35.0, 29.0, 27.0, 38.0, 27.0, 25.0, 22.0, 19.0, 14.0, 10.0, 10.0, 4.0, 14.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006221175193786621, -0.006025002337992191, -0.0058288294821977615, -0.005632656626403332, -0.005436483770608902, -0.005240310914814472, -0.005044138059020042, -0.004847965203225613, -0.004651792347431183, -0.004455619491636753, -0.004259446635842323, -0.0040632737800478935, -0.0038671009242534637, -0.003670928068459034, -0.003474755212664604, -0.0032785823568701744, -0.0030824095010757446, -0.002886236645281315, -0.002690063789486885, -0.0024938909336924553, -0.0022977180778980255, -0.0021015452221035957, -0.001905372366309166, -0.0017091995105147362, -0.0015130266547203064, -0.0013168537989258766, -0.0011206809431314468, -0.0009245080873370171, -0.0007283352315425873, -0.0005321623757481575, -0.0003359895199537277, -0.00013981666415929794, 5.6356191635131836e-05, 0.0002525290474295616, 0.0004487019032239914, 0.0006448747590184212, 0.000841047614812851, 0.0010372204706072807, 0.0012333933264017105, 0.0014295661821961403, 0.00162573903799057, 0.0018219118937849998, 0.0020180847495794296, 0.0022142576053738594, 0.002410430461168289, 0.002606603316962719, 0.0028027761727571487, 0.0029989490285515785, 0.0031951218843460083, 0.003391294740140438, 0.003587467595934868, 0.0037836404517292976, 0.003979813307523727, 0.004175986163318157, 0.004372159019112587, 0.004568331874907017, 0.0047645047307014465, 0.004960677586495876, 0.005156850442290306, 0.005353023298084736, 0.005549196153879166, 0.005745369009673595, 0.005941541865468025, 0.006137714721262455, 0.006333887577056885]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 7.0, 3.0, 4.0, 6.0, 5.0, 12.0, 12.0, 13.0, 9.0, 14.0, 24.0, 32.0, 35.0, 32.0, 35.0, 40.0, 38.0, 40.0, 39.0, 42.0, 53.0, 37.0, 44.0, 38.0, 42.0, 42.0, 39.0, 28.0, 28.0, 33.0, 38.0, 29.0, 18.0, 17.0, 13.0, 20.0, 11.0, 5.0, 11.0, 1.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.55694580078125, -6.3638916015625, -6.17083740234375, -5.977783203125, -5.78472900390625, -5.5916748046875, -5.39862060546875, -5.20556640625, -5.01251220703125, -4.8194580078125, -4.62640380859375, -4.433349609375, -4.24029541015625, -4.0472412109375, -3.85418701171875, -3.6611328125, -3.46807861328125, -3.2750244140625, -3.08197021484375, -2.888916015625, -2.69586181640625, -2.5028076171875, -2.30975341796875, -2.11669921875, -1.92364501953125, -1.7305908203125, -1.53753662109375, -1.344482421875, -1.15142822265625, -0.9583740234375, -0.76531982421875, -0.572265625, -0.37921142578125, -0.1861572265625, 0.00689697265625, 0.199951171875, 0.39300537109375, 0.5860595703125, 0.77911376953125, 0.97216796875, 1.16522216796875, 1.3582763671875, 1.55133056640625, 1.744384765625, 1.93743896484375, 2.1304931640625, 2.32354736328125, 2.5166015625, 2.70965576171875, 2.9027099609375, 3.09576416015625, 3.288818359375, 3.48187255859375, 3.6749267578125, 3.86798095703125, 4.06103515625, 4.25408935546875, 4.4471435546875, 4.64019775390625, 4.833251953125, 5.02630615234375, 5.2193603515625, 5.41241455078125, 5.60546875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 3.0, 7.0, 2.0, 7.0, 6.0, 12.0, 10.0, 10.0, 15.0, 26.0, 42.0, 43.0, 60.0, 80.0, 132.0, 148.0, 240.0, 471.0, 1131.0, 3507.0, 10924.0, 36700.0, 196149.0, 607123.0, 146590.0, 30787.0, 9304.0, 2824.0, 1009.0, 409.0, 219.0, 153.0, 92.0, 67.0, 53.0, 50.0, 36.0, 42.0, 21.0, 12.0, 11.0, 9.0, 9.0, 6.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.640625, -12.2838134765625, -11.927001953125, -11.5701904296875, -11.21337890625, -10.8565673828125, -10.499755859375, -10.1429443359375, -9.7861328125, -9.4293212890625, -9.072509765625, -8.7156982421875, -8.35888671875, -8.0020751953125, -7.645263671875, -7.2884521484375, -6.931640625, -6.5748291015625, -6.218017578125, -5.8612060546875, -5.50439453125, -5.1475830078125, -4.790771484375, -4.4339599609375, -4.0771484375, -3.7203369140625, -3.363525390625, -3.0067138671875, -2.64990234375, -2.2930908203125, -1.936279296875, -1.5794677734375, -1.22265625, -0.8658447265625, -0.509033203125, -0.1522216796875, 0.20458984375, 0.5614013671875, 0.918212890625, 1.2750244140625, 1.6318359375, 1.9886474609375, 2.345458984375, 2.7022705078125, 3.05908203125, 3.4158935546875, 3.772705078125, 4.1295166015625, 4.486328125, 4.8431396484375, 5.199951171875, 5.5567626953125, 5.91357421875, 6.2703857421875, 6.627197265625, 6.9840087890625, 7.3408203125, 7.6976318359375, 8.054443359375, 8.4112548828125, 8.76806640625, 9.1248779296875, 9.481689453125, 9.8385009765625, 10.1953125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 8.0, 15.0, 7.0, 20.0, 16.0, 19.0, 20.0, 21.0, 23.0, 31.0, 32.0, 35.0, 39.0, 51.0, 63.0, 80.0, 131.0, 1472.0, 402.0, 134.0, 66.0, 43.0, 37.0, 38.0, 33.0, 32.0, 27.0, 31.0, 19.0, 13.0, 18.0, 13.0, 12.0, 12.0, 11.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -19.101806640625, -18.48486328125, -17.867919921875, -17.2509765625, -16.634033203125, -16.01708984375, -15.400146484375, -14.783203125, -14.166259765625, -13.54931640625, -12.932373046875, -12.3154296875, -11.698486328125, -11.08154296875, -10.464599609375, -9.84765625, -9.230712890625, -8.61376953125, -7.996826171875, -7.3798828125, -6.762939453125, -6.14599609375, -5.529052734375, -4.912109375, -4.295166015625, -3.67822265625, -3.061279296875, -2.4443359375, -1.827392578125, -1.21044921875, -0.593505859375, 0.0234375, 0.640380859375, 1.25732421875, 1.874267578125, 2.4912109375, 3.108154296875, 3.72509765625, 4.342041015625, 4.958984375, 5.575927734375, 6.19287109375, 6.809814453125, 7.4267578125, 8.043701171875, 8.66064453125, 9.277587890625, 9.89453125, 10.511474609375, 11.12841796875, 11.745361328125, 12.3623046875, 12.979248046875, 13.59619140625, 14.213134765625, 14.830078125, 15.447021484375, 16.06396484375, 16.680908203125, 17.2978515625, 17.914794921875, 18.53173828125, 19.148681640625, 19.765625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 10.0, 7.0, 7.0, 8.0, 13.0, 13.0, 25.0, 18.0, 37.0, 42.0, 60.0, 81.0, 101.0, 168.0, 334.0, 847.0, 6501.0, 2807089.0, 326142.0, 2727.0, 622.0, 275.0, 171.0, 101.0, 70.0, 53.0, 36.0, 31.0, 32.0, 26.0, 14.0, 11.0, 12.0, 6.0, 3.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.5, -38.87060546875, -37.2412109375, -35.61181640625, -33.982421875, -32.35302734375, -30.7236328125, -29.09423828125, -27.46484375, -25.83544921875, -24.2060546875, -22.57666015625, -20.947265625, -19.31787109375, -17.6884765625, -16.05908203125, -14.4296875, -12.80029296875, -11.1708984375, -9.54150390625, -7.912109375, -6.28271484375, -4.6533203125, -3.02392578125, -1.39453125, 0.23486328125, 1.8642578125, 3.49365234375, 5.123046875, 6.75244140625, 8.3818359375, 10.01123046875, 11.640625, 13.27001953125, 14.8994140625, 16.52880859375, 18.158203125, 19.78759765625, 21.4169921875, 23.04638671875, 24.67578125, 26.30517578125, 27.9345703125, 29.56396484375, 31.193359375, 32.82275390625, 34.4521484375, 36.08154296875, 37.7109375, 39.34033203125, 40.9697265625, 42.59912109375, 44.228515625, 45.85791015625, 47.4873046875, 49.11669921875, 50.74609375, 52.37548828125, 54.0048828125, 55.63427734375, 57.263671875, 58.89306640625, 60.5224609375, 62.15185546875, 63.78125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 15.0, 68.0, 130.0, 226.0, 277.0, 194.0, 63.0, 32.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.018024444580078, -24.410335540771484, -22.80264663696289, -21.194957733154297, -19.587268829345703, -17.97957992553711, -16.371889114379883, -14.764200210571289, -13.156511306762695, -11.548822402954102, -9.941133499145508, -8.333443641662598, -6.725754737854004, -5.11806583404541, -3.5103759765625, -1.9026870727539062, -0.2949981689453125, 1.3126909732818604, 2.920380115509033, 4.528069496154785, 6.135758399963379, 7.743447303771973, 9.351137161254883, 10.958826065063477, 12.56651496887207, 14.174203872680664, 15.781892776489258, 17.389583587646484, 18.997272491455078, 20.604961395263672, 22.212650299072266, 23.82033920288086, 25.428024291992188, 27.03571319580078, 28.643402099609375, 30.25109100341797, 31.858779907226562, 33.466468811035156, 35.07415771484375, 36.681846618652344, 38.28953552246094, 39.89722442626953, 41.504913330078125, 43.11260223388672, 44.72029113769531, 46.327980041503906, 47.9356689453125, 49.543357849121094, 51.15105056762695, 52.75873947143555, 54.36642837524414, 55.974117279052734, 57.58180618286133, 59.18949508666992, 60.79718780517578, 62.404876708984375, 64.01256561279297, 65.62025451660156, 67.22794342041016, 68.83563232421875, 70.44332122802734, 72.05101013183594, 73.65869903564453, 75.26638793945312, 76.87407684326172]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 11.0, 5.0, 11.0, 4.0, 12.0, 13.0, 21.0, 21.0, 22.0, 27.0, 27.0, 29.0, 31.0, 23.0, 43.0, 32.0, 47.0, 44.0, 31.0, 43.0, 41.0, 44.0, 52.0, 45.0, 37.0, 30.0, 24.0, 36.0, 24.0, 31.0, 23.0, 20.0, 19.0, 13.0, 15.0, 8.0, 10.0, 7.0, 8.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.94161605834961, -42.57663345336914, -41.21165084838867, -39.8466682434082, -38.481685638427734, -37.116703033447266, -35.7517204284668, -34.38673782348633, -33.02175521850586, -31.65677261352539, -30.291790008544922, -28.926807403564453, -27.561824798583984, -26.196842193603516, -24.831859588623047, -23.466876983642578, -22.10189437866211, -20.73691177368164, -19.371929168701172, -18.006946563720703, -16.641963958740234, -15.276981353759766, -13.911998748779297, -12.547016143798828, -11.18203353881836, -9.81705093383789, -8.452068328857422, -7.087085723876953, -5.722103118896484, -4.357120513916016, -2.992137908935547, -1.6271553039550781, -0.26216888427734375, 1.102813720703125, 2.4677963256835938, 3.8327789306640625, 5.197761535644531, 6.562744140625, 7.927726745605469, 9.292709350585938, 10.657691955566406, 12.022674560546875, 13.387657165527344, 14.752639770507812, 16.11762237548828, 17.48260498046875, 18.84758758544922, 20.212570190429688, 21.577552795410156, 22.942535400390625, 24.307518005371094, 25.672500610351562, 27.03748321533203, 28.4024658203125, 29.76744842529297, 31.132431030273438, 32.497413635253906, 33.862396240234375, 35.227378845214844, 36.59236145019531, 37.95734405517578, 39.32232666015625, 40.68730926513672, 42.05229187011719, 43.417274475097656]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 8.0, 8.0, 3.0, 6.0, 5.0, 11.0, 16.0, 15.0, 14.0, 28.0, 22.0, 34.0, 30.0, 47.0, 31.0, 37.0, 51.0, 32.0, 45.0, 52.0, 36.0, 47.0, 46.0, 43.0, 32.0, 39.0, 39.0, 37.0, 30.0, 27.0, 20.0, 18.0, 19.0, 13.0, 11.0, 9.0, 12.0, 8.0, 8.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.93359375, -7.7236328125, -7.513671875, -7.3037109375, -7.09375, -6.8837890625, -6.673828125, -6.4638671875, -6.25390625, -6.0439453125, -5.833984375, -5.6240234375, -5.4140625, -5.2041015625, -4.994140625, -4.7841796875, -4.57421875, -4.3642578125, -4.154296875, -3.9443359375, -3.734375, -3.5244140625, -3.314453125, -3.1044921875, -2.89453125, -2.6845703125, -2.474609375, -2.2646484375, -2.0546875, -1.8447265625, -1.634765625, -1.4248046875, -1.21484375, -1.0048828125, -0.794921875, -0.5849609375, -0.375, -0.1650390625, 0.044921875, 0.2548828125, 0.46484375, 0.6748046875, 0.884765625, 1.0947265625, 1.3046875, 1.5146484375, 1.724609375, 1.9345703125, 2.14453125, 2.3544921875, 2.564453125, 2.7744140625, 2.984375, 3.1943359375, 3.404296875, 3.6142578125, 3.82421875, 4.0341796875, 4.244140625, 4.4541015625, 4.6640625, 4.8740234375, 5.083984375, 5.2939453125, 5.50390625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 6.0, 4.0, 10.0, 7.0, 11.0, 16.0, 18.0, 23.0, 35.0, 36.0, 43.0, 60.0, 97.0, 151.0, 312.0, 888.0, 3680.0, 23242.0, 196040.0, 1353378.0, 2081504.0, 467982.0, 56670.0, 7599.0, 1452.0, 410.0, 172.0, 106.0, 67.0, 63.0, 46.0, 30.0, 25.0, 18.0, 14.0, 17.0, 6.0, 9.0, 7.0, 6.0, 4.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-12.8515625, -12.49658203125, -12.1416015625, -11.78662109375, -11.431640625, -11.07666015625, -10.7216796875, -10.36669921875, -10.01171875, -9.65673828125, -9.3017578125, -8.94677734375, -8.591796875, -8.23681640625, -7.8818359375, -7.52685546875, -7.171875, -6.81689453125, -6.4619140625, -6.10693359375, -5.751953125, -5.39697265625, -5.0419921875, -4.68701171875, -4.33203125, -3.97705078125, -3.6220703125, -3.26708984375, -2.912109375, -2.55712890625, -2.2021484375, -1.84716796875, -1.4921875, -1.13720703125, -0.7822265625, -0.42724609375, -0.072265625, 0.28271484375, 0.6376953125, 0.99267578125, 1.34765625, 1.70263671875, 2.0576171875, 2.41259765625, 2.767578125, 3.12255859375, 3.4775390625, 3.83251953125, 4.1875, 4.54248046875, 4.8974609375, 5.25244140625, 5.607421875, 5.96240234375, 6.3173828125, 6.67236328125, 7.02734375, 7.38232421875, 7.7373046875, 8.09228515625, 8.447265625, 8.80224609375, 9.1572265625, 9.51220703125, 9.8671875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 7.0, 5.0, 17.0, 11.0, 20.0, 28.0, 34.0, 44.0, 49.0, 77.0, 76.0, 115.0, 182.0, 191.0, 246.0, 329.0, 374.0, 364.0, 353.0, 315.0, 270.0, 218.0, 187.0, 125.0, 94.0, 76.0, 75.0, 36.0, 28.0, 25.0, 23.0, 18.0, 12.0, 9.0, 7.0, 4.0, 9.0, 1.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.515625, -8.255126953125, -7.99462890625, -7.734130859375, -7.4736328125, -7.213134765625, -6.95263671875, -6.692138671875, -6.431640625, -6.171142578125, -5.91064453125, -5.650146484375, -5.3896484375, -5.129150390625, -4.86865234375, -4.608154296875, -4.34765625, -4.087158203125, -3.82666015625, -3.566162109375, -3.3056640625, -3.045166015625, -2.78466796875, -2.524169921875, -2.263671875, -2.003173828125, -1.74267578125, -1.482177734375, -1.2216796875, -0.961181640625, -0.70068359375, -0.440185546875, -0.1796875, 0.080810546875, 0.34130859375, 0.601806640625, 0.8623046875, 1.122802734375, 1.38330078125, 1.643798828125, 1.904296875, 2.164794921875, 2.42529296875, 2.685791015625, 2.9462890625, 3.206787109375, 3.46728515625, 3.727783203125, 3.98828125, 4.248779296875, 4.50927734375, 4.769775390625, 5.0302734375, 5.290771484375, 5.55126953125, 5.811767578125, 6.072265625, 6.332763671875, 6.59326171875, 6.853759765625, 7.1142578125, 7.374755859375, 7.63525390625, 7.895751953125, 8.15625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 8.0, 9.0, 10.0, 9.0, 21.0, 28.0, 28.0, 39.0, 62.0, 92.0, 117.0, 162.0, 222.0, 320.0, 521.0, 1055.0, 3358.0, 20417.0, 244476.0, 2729965.0, 1108651.0, 72642.0, 8095.0, 1827.0, 736.0, 424.0, 267.0, 180.0, 155.0, 90.0, 69.0, 65.0, 29.0, 35.0, 23.0, 20.0, 15.0, 5.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.75, -18.140625, -17.53125, -16.921875, -16.3125, -15.703125, -15.09375, -14.484375, -13.875, -13.265625, -12.65625, -12.046875, -11.4375, -10.828125, -10.21875, -9.609375, -9.0, -8.390625, -7.78125, -7.171875, -6.5625, -5.953125, -5.34375, -4.734375, -4.125, -3.515625, -2.90625, -2.296875, -1.6875, -1.078125, -0.46875, 0.140625, 0.75, 1.359375, 1.96875, 2.578125, 3.1875, 3.796875, 4.40625, 5.015625, 5.625, 6.234375, 6.84375, 7.453125, 8.0625, 8.671875, 9.28125, 9.890625, 10.5, 11.109375, 11.71875, 12.328125, 12.9375, 13.546875, 14.15625, 14.765625, 15.375, 15.984375, 16.59375, 17.203125, 17.8125, 18.421875, 19.03125, 19.640625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 12.0, 44.0, 80.0, 160.0, 195.0, 200.0, 180.0, 78.0, 41.0, 16.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0794677734375, -30.730344772338867, -28.381221771240234, -26.032100677490234, -23.6829776763916, -21.33385467529297, -18.98473358154297, -16.635610580444336, -14.286487579345703, -11.93736457824707, -9.588242530822754, -7.239120006561279, -4.889997482299805, -2.540874481201172, -0.19175243377685547, 2.157369613647461, 4.506492614746094, 6.855615139007568, 9.204737663269043, 11.55385971069336, 13.902982711791992, 16.252105712890625, 18.601226806640625, 20.950349807739258, 23.29947280883789, 25.648595809936523, 27.997718811035156, 30.346839904785156, 32.695960998535156, 35.04508590698242, 37.39420700073242, 39.74333190917969, 42.09245300292969, 44.44157409667969, 46.79069900512695, 49.13982009887695, 51.48894500732422, 53.83806610107422, 56.18718719482422, 58.53630828857422, 60.885433197021484, 63.234554290771484, 65.58367919921875, 67.93280029296875, 70.28192138671875, 72.63104248046875, 74.98017120361328, 77.32929229736328, 79.67841339111328, 82.02753448486328, 84.37665557861328, 86.72578430175781, 89.07490539550781, 91.42402648925781, 93.77314758300781, 96.12226867675781, 98.47138977050781, 100.82051086425781, 103.16963195800781, 105.51876068115234, 107.86788177490234, 110.21700286865234, 112.56612396240234, 114.91524505615234, 117.26437377929688]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 5.0, 7.0, 10.0, 6.0, 12.0, 14.0, 18.0, 12.0, 21.0, 22.0, 26.0, 17.0, 26.0, 28.0, 26.0, 24.0, 29.0, 32.0, 40.0, 49.0, 28.0, 32.0, 36.0, 34.0, 33.0, 30.0, 42.0, 36.0, 21.0, 23.0, 35.0, 21.0, 24.0, 17.0, 23.0, 22.0, 19.0, 17.0, 20.0, 13.0, 12.0, 8.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-29.119922637939453, -28.207233428955078, -27.29454231262207, -26.381851196289062, -25.469161987304688, -24.556472778320312, -23.643781661987305, -22.731090545654297, -21.818401336669922, -20.905712127685547, -19.99302101135254, -19.08032989501953, -18.167640686035156, -17.25495147705078, -16.342260360717773, -15.429570198059082, -14.51688003540039, -13.6041898727417, -12.691499710083008, -11.778809547424316, -10.866119384765625, -9.953429222106934, -9.040739059448242, -8.12804889678955, -7.215358734130859, -6.302668571472168, -5.389978408813477, -4.477288246154785, -3.5645980834960938, -2.6519079208374023, -1.739217758178711, -0.8265275955200195, 0.08616065979003906, 0.9988508224487305, 1.9115409851074219, 2.8242311477661133, 3.7369213104248047, 4.649611473083496, 5.5623016357421875, 6.474991798400879, 7.38768196105957, 8.300372123718262, 9.213062286376953, 10.125752449035645, 11.038442611694336, 11.951132774353027, 12.863822937011719, 13.77651309967041, 14.689203262329102, 15.601893424987793, 16.514583587646484, 17.42727279663086, 18.339963912963867, 19.252655029296875, 20.16534423828125, 21.078033447265625, 21.990724563598633, 22.90341567993164, 23.816104888916016, 24.72879409790039, 25.6414852142334, 26.554176330566406, 27.46686553955078, 28.379554748535156, 29.292245864868164]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 11.0, 10.0, 9.0, 19.0, 15.0, 11.0, 15.0, 23.0, 24.0, 25.0, 25.0, 32.0, 28.0, 34.0, 43.0, 44.0, 40.0, 38.0, 41.0, 42.0, 49.0, 39.0, 38.0, 29.0, 26.0, 30.0, 24.0, 23.0, 23.0, 32.0, 21.0, 21.0, 18.0, 13.0, 18.0, 8.0, 10.0, 9.0, 9.0, 8.0, 7.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5, -6.313720703125, -6.12744140625, -5.941162109375, -5.7548828125, -5.568603515625, -5.38232421875, -5.196044921875, -5.009765625, -4.823486328125, -4.63720703125, -4.450927734375, -4.2646484375, -4.078369140625, -3.89208984375, -3.705810546875, -3.51953125, -3.333251953125, -3.14697265625, -2.960693359375, -2.7744140625, -2.588134765625, -2.40185546875, -2.215576171875, -2.029296875, -1.843017578125, -1.65673828125, -1.470458984375, -1.2841796875, -1.097900390625, -0.91162109375, -0.725341796875, -0.5390625, -0.352783203125, -0.16650390625, 0.019775390625, 0.2060546875, 0.392333984375, 0.57861328125, 0.764892578125, 0.951171875, 1.137451171875, 1.32373046875, 1.510009765625, 1.6962890625, 1.882568359375, 2.06884765625, 2.255126953125, 2.44140625, 2.627685546875, 2.81396484375, 3.000244140625, 3.1865234375, 3.372802734375, 3.55908203125, 3.745361328125, 3.931640625, 4.117919921875, 4.30419921875, 4.490478515625, 4.6767578125, 4.863037109375, 5.04931640625, 5.235595703125, 5.421875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 8.0, 9.0, 14.0, 16.0, 24.0, 35.0, 54.0, 76.0, 124.0, 184.0, 298.0, 398.0, 692.0, 963.0, 1402.0, 2160.0, 3130.0, 4624.0, 7021.0, 10314.0, 15558.0, 23145.0, 34103.0, 51143.0, 74476.0, 105516.0, 139366.0, 153037.0, 127278.0, 93777.0, 64709.0, 44224.0, 29730.0, 20073.0, 13595.0, 9045.0, 6008.0, 4055.0, 2658.0, 1831.0, 1242.0, 823.0, 556.0, 340.0, 259.0, 161.0, 123.0, 69.0, 45.0, 30.0, 22.0, 9.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.376220703125, -0.3642082214355469, -0.35219573974609375, -0.3401832580566406, -0.3281707763671875, -0.3161582946777344, -0.30414581298828125, -0.2921333312988281, -0.280120849609375, -0.2681083679199219, -0.25609588623046875, -0.24408340454101562, -0.2320709228515625, -0.22005844116210938, -0.20804595947265625, -0.19603347778320312, -0.18402099609375, -0.17200851440429688, -0.15999603271484375, -0.14798355102539062, -0.1359710693359375, -0.12395858764648438, -0.11194610595703125, -0.09993362426757812, -0.087921142578125, -0.07590866088867188, -0.06389617919921875, -0.051883697509765625, -0.0398712158203125, -0.027858734130859375, -0.01584625244140625, -0.003833770751953125, 0.0081787109375, 0.020191192626953125, 0.03220367431640625, 0.044216156005859375, 0.0562286376953125, 0.06824111938476562, 0.08025360107421875, 0.09226608276367188, 0.104278564453125, 0.11629104614257812, 0.12830352783203125, 0.14031600952148438, 0.1523284912109375, 0.16434097290039062, 0.17635345458984375, 0.18836593627929688, 0.20037841796875, 0.21239089965820312, 0.22440338134765625, 0.23641586303710938, 0.2484283447265625, 0.2604408264160156, 0.27245330810546875, 0.2844657897949219, 0.296478271484375, 0.3084907531738281, 0.32050323486328125, 0.3325157165527344, 0.3445281982421875, 0.3565406799316406, 0.36855316162109375, 0.3805656433105469, 0.392578125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 9.0, 4.0, 7.0, 7.0, 12.0, 10.0, 17.0, 19.0, 19.0, 19.0, 31.0, 35.0, 29.0, 31.0, 49.0, 27.0, 50.0, 38.0, 41.0, 1053.0, 40.0, 49.0, 49.0, 48.0, 46.0, 36.0, 41.0, 22.0, 25.0, 29.0, 25.0, 26.0, 18.0, 10.0, 17.0, 14.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.02423095703125, -3.8883056640625, -3.75238037109375, -3.616455078125, -3.48052978515625, -3.3446044921875, -3.20867919921875, -3.07275390625, -2.93682861328125, -2.8009033203125, -2.66497802734375, -2.529052734375, -2.39312744140625, -2.2572021484375, -2.12127685546875, -1.9853515625, -1.84942626953125, -1.7135009765625, -1.57757568359375, -1.441650390625, -1.30572509765625, -1.1697998046875, -1.03387451171875, -0.89794921875, -0.76202392578125, -0.6260986328125, -0.49017333984375, -0.354248046875, -0.21832275390625, -0.0823974609375, 0.05352783203125, 0.189453125, 0.32537841796875, 0.4613037109375, 0.59722900390625, 0.733154296875, 0.86907958984375, 1.0050048828125, 1.14093017578125, 1.27685546875, 1.41278076171875, 1.5487060546875, 1.68463134765625, 1.820556640625, 1.95648193359375, 2.0924072265625, 2.22833251953125, 2.3642578125, 2.50018310546875, 2.6361083984375, 2.77203369140625, 2.907958984375, 3.04388427734375, 3.1798095703125, 3.31573486328125, 3.45166015625, 3.58758544921875, 3.7235107421875, 3.85943603515625, 3.995361328125, 4.13128662109375, 4.2672119140625, 4.40313720703125, 4.5390625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 9.0, 3.0, 12.0, 5.0, 11.0, 17.0, 25.0, 24.0, 51.0, 75.0, 111.0, 155.0, 234.0, 281.0, 447.0, 700.0, 1055.0, 1622.0, 2471.0, 3853.0, 6211.0, 9549.0, 15309.0, 23697.0, 37101.0, 56307.0, 83133.0, 115602.0, 172737.0, 1165837.0, 125188.0, 92908.0, 63975.0, 42371.0, 27482.0, 17498.0, 11131.0, 7116.0, 4496.0, 2853.0, 1844.0, 1244.0, 802.0, 533.0, 332.0, 230.0, 161.0, 96.0, 77.0, 40.0, 29.0, 23.0, 15.0, 13.0, 12.0, 8.0, 12.0, 5.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.28857421875, -0.2793121337890625, -0.270050048828125, -0.2607879638671875, -0.25152587890625, -0.2422637939453125, -0.233001708984375, -0.2237396240234375, -0.2144775390625, -0.2052154541015625, -0.195953369140625, -0.1866912841796875, -0.17742919921875, -0.1681671142578125, -0.158905029296875, -0.1496429443359375, -0.140380859375, -0.1311187744140625, -0.121856689453125, -0.1125946044921875, -0.10333251953125, -0.0940704345703125, -0.084808349609375, -0.0755462646484375, -0.0662841796875, -0.0570220947265625, -0.047760009765625, -0.0384979248046875, -0.02923583984375, -0.0199737548828125, -0.010711669921875, -0.0014495849609375, 0.0078125, 0.0170745849609375, 0.026336669921875, 0.0355987548828125, 0.04486083984375, 0.0541229248046875, 0.063385009765625, 0.0726470947265625, 0.0819091796875, 0.0911712646484375, 0.100433349609375, 0.1096954345703125, 0.11895751953125, 0.1282196044921875, 0.137481689453125, 0.1467437744140625, 0.156005859375, 0.1652679443359375, 0.174530029296875, 0.1837921142578125, 0.19305419921875, 0.2023162841796875, 0.211578369140625, 0.2208404541015625, 0.2301025390625, 0.2393646240234375, 0.248626708984375, 0.2578887939453125, 0.26715087890625, 0.2764129638671875, 0.285675048828125, 0.2949371337890625, 0.30419921875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 2.0, 6.0, 6.0, 5.0, 4.0, 7.0, 9.0, 13.0, 15.0, 17.0, 15.0, 30.0, 43.0, 44.0, 58.0, 89.0, 99.0, 107.0, 97.0, 64.0, 51.0, 39.0, 30.0, 25.0, 24.0, 12.0, 16.0, 10.0, 6.0, 10.0, 6.0, 3.0, 7.0, 6.0, 3.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00766754150390625, -0.007431149482727051, -0.0071947574615478516, -0.006958365440368652, -0.006721973419189453, -0.006485581398010254, -0.006249189376831055, -0.0060127973556518555, -0.005776405334472656, -0.005540013313293457, -0.005303621292114258, -0.005067229270935059, -0.004830837249755859, -0.00459444522857666, -0.004358053207397461, -0.004121661186218262, -0.0038852691650390625, -0.0036488771438598633, -0.003412485122680664, -0.003176093101501465, -0.0029397010803222656, -0.0027033090591430664, -0.002466917037963867, -0.002230525016784668, -0.0019941329956054688, -0.0017577409744262695, -0.0015213489532470703, -0.001284956932067871, -0.0010485649108886719, -0.0008121728897094727, -0.0005757808685302734, -0.0003393888473510742, -0.000102996826171875, 0.00013339519500732422, 0.00036978721618652344, 0.0006061792373657227, 0.0008425712585449219, 0.001078963279724121, 0.0013153553009033203, 0.0015517473220825195, 0.0017881393432617188, 0.002024531364440918, 0.002260923385620117, 0.0024973154067993164, 0.0027337074279785156, 0.002970099449157715, 0.003206491470336914, 0.0034428834915161133, 0.0036792755126953125, 0.003915667533874512, 0.004152059555053711, 0.00438845157623291, 0.004624843597412109, 0.004861235618591309, 0.005097627639770508, 0.005334019660949707, 0.005570411682128906, 0.0058068037033081055, 0.006043195724487305, 0.006279587745666504, 0.006515979766845703, 0.006752371788024902, 0.0069887638092041016, 0.007225155830383301, 0.0074615478515625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 8.0, 6.0, 7.0, 10.0, 9.0, 6.0, 13.0, 15.0, 14.0, 27.0, 26.0, 37.0, 44.0, 85.0, 127.0, 256.0, 718.0, 4646.0, 170367.0, 858652.0, 11389.0, 1217.0, 367.0, 146.0, 99.0, 62.0, 45.0, 31.0, 24.0, 20.0, 19.0, 12.0, 9.0, 5.0, 8.0, 5.0, 5.0, 4.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15478515625, -0.14981842041015625, -0.1448516845703125, -0.13988494873046875, -0.134918212890625, -0.12995147705078125, -0.1249847412109375, -0.12001800537109375, -0.11505126953125, -0.11008453369140625, -0.1051177978515625, -0.10015106201171875, -0.095184326171875, -0.09021759033203125, -0.0852508544921875, -0.08028411865234375, -0.0753173828125, -0.07035064697265625, -0.0653839111328125, -0.06041717529296875, -0.055450439453125, -0.05048370361328125, -0.0455169677734375, -0.04055023193359375, -0.03558349609375, -0.03061676025390625, -0.0256500244140625, -0.02068328857421875, -0.015716552734375, -0.01074981689453125, -0.0057830810546875, -0.00081634521484375, 0.004150390625, 0.00911712646484375, 0.0140838623046875, 0.01905059814453125, 0.024017333984375, 0.02898406982421875, 0.0339508056640625, 0.03891754150390625, 0.04388427734375, 0.04885101318359375, 0.0538177490234375, 0.05878448486328125, 0.063751220703125, 0.06871795654296875, 0.0736846923828125, 0.07865142822265625, 0.0836181640625, 0.08858489990234375, 0.0935516357421875, 0.09851837158203125, 0.103485107421875, 0.10845184326171875, 0.1134185791015625, 0.11838531494140625, 0.12335205078125, 0.12831878662109375, 0.1332855224609375, 0.13825225830078125, 0.143218994140625, 0.14818572998046875, 0.1531524658203125, 0.15811920166015625, 0.1630859375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 7.0, 25.0, 72.0, 235.0, 398.0, 168.0, 66.0, 21.0, 11.0, 10.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00669793039560318, -0.005446131341159344, -0.0041943322867155075, -0.0029425336979329586, -0.0016907346434891224, -0.0004389355890452862, 0.0008128629997372627, 0.002064662054181099, 0.003316461108624935, 0.004568260163068771, 0.005820059217512608, 0.0070718578062951565, 0.008323656395077705, 0.009575456380844116, 0.010827254503965378, 0.012079053558409214, 0.01333085261285305, 0.014582651667296886, 0.015834450721740723, 0.017086248844861984, 0.018338048830628395, 0.019589846953749657, 0.020841646939516068, 0.02209344506263733, 0.02334524318575859, 0.024597041308879852, 0.025848841294646263, 0.027100639417767525, 0.028352439403533936, 0.029604237526655197, 0.03085603564977646, 0.03210783749818802, 0.03335963562130928, 0.03461143374443054, 0.035863231867551804, 0.037115033715963364, 0.038366831839084625, 0.03961862996220589, 0.04087042808532715, 0.04212222993373871, 0.04337402805685997, 0.04462582617998123, 0.04587762430310249, 0.04712942615151405, 0.048381224274635315, 0.04963302239775658, 0.05088482052087784, 0.0521366223692894, 0.05338841676712036, 0.05464021489024162, 0.055892013013362885, 0.057143814861774445, 0.058395612984895706, 0.05964741110801697, 0.06089920923113823, 0.06215100735425949, 0.06340280920267105, 0.06465461105108261, 0.06590640544891357, 0.06715820729732513, 0.0684100016951561, 0.06966180354356766, 0.07091360539197922, 0.07216539978981018, 0.07341720163822174]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 7.0, 9.0, 11.0, 24.0, 31.0, 34.0, 31.0, 42.0, 46.0, 45.0, 67.0, 69.0, 88.0, 60.0, 43.0, 62.0, 56.0, 59.0, 47.0, 33.0, 30.0, 27.0, 19.0, 12.0, 13.0, 7.0, 9.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007668793201446533, -0.007420984096825123, -0.0071731749922037125, -0.006925365887582302, -0.006677556782960892, -0.006429747678339481, -0.006181938573718071, -0.005934129469096661, -0.00568632036447525, -0.00543851125985384, -0.0051907021552324295, -0.004942893050611019, -0.004695083945989609, -0.004447274841368198, -0.004199465736746788, -0.003951656632125378, -0.0037038475275039673, -0.003456038422882557, -0.0032082293182611465, -0.002960420213639736, -0.002712611109018326, -0.0024648020043969154, -0.002216992899775505, -0.0019691837951540947, -0.0017213746905326843, -0.001473565585911274, -0.0012257564812898636, -0.0009779473766684532, -0.0007301382720470428, -0.0004823291674256325, -0.0002345200628042221, 1.3289041817188263e-05, 0.00026109814643859863, 0.000508907251060009, 0.0007567163556814194, 0.0010045254603028297, 0.0012523345649242401, 0.0015001436695456505, 0.0017479527741670609, 0.0019957618787884712, 0.0022435709834098816, 0.002491380088031292, 0.0027391891926527023, 0.0029869982972741127, 0.003234807401895523, 0.0034826165065169334, 0.003730425611138344, 0.003978234715759754, 0.0042260438203811646, 0.004473852925002575, 0.004721662029623985, 0.004969471134245396, 0.005217280238866806, 0.005465089343488216, 0.005712898448109627, 0.005960707552731037, 0.0062085166573524475, 0.006456325761973858, 0.006704134866595268, 0.006951943971216679, 0.007199753075838089, 0.007447562180459499, 0.00769537128508091, 0.00794318038970232, 0.00819098949432373]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 11.0, 10.0, 9.0, 19.0, 15.0, 11.0, 15.0, 23.0, 24.0, 25.0, 25.0, 32.0, 28.0, 34.0, 43.0, 45.0, 39.0, 38.0, 41.0, 42.0, 49.0, 39.0, 38.0, 29.0, 26.0, 30.0, 24.0, 23.0, 23.0, 32.0, 21.0, 21.0, 18.0, 13.0, 17.0, 9.0, 10.0, 9.0, 9.0, 8.0, 7.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5, -6.313720703125, -6.12744140625, -5.941162109375, -5.7548828125, -5.568603515625, -5.38232421875, -5.196044921875, -5.009765625, -4.823486328125, -4.63720703125, -4.450927734375, -4.2646484375, -4.078369140625, -3.89208984375, -3.705810546875, -3.51953125, -3.333251953125, -3.14697265625, -2.960693359375, -2.7744140625, -2.588134765625, -2.40185546875, -2.215576171875, -2.029296875, -1.843017578125, -1.65673828125, -1.470458984375, -1.2841796875, -1.097900390625, -0.91162109375, -0.725341796875, -0.5390625, -0.352783203125, -0.16650390625, 0.019775390625, 0.2060546875, 0.392333984375, 0.57861328125, 0.764892578125, 0.951171875, 1.137451171875, 1.32373046875, 1.510009765625, 1.6962890625, 1.882568359375, 2.06884765625, 2.255126953125, 2.44140625, 2.627685546875, 2.81396484375, 3.000244140625, 3.1865234375, 3.372802734375, 3.55908203125, 3.745361328125, 3.931640625, 4.117919921875, 4.30419921875, 4.490478515625, 4.6767578125, 4.863037109375, 5.04931640625, 5.235595703125, 5.421875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 6.0, 6.0, 8.0, 9.0, 15.0, 23.0, 24.0, 20.0, 47.0, 54.0, 61.0, 84.0, 119.0, 176.0, 210.0, 312.0, 415.0, 676.0, 1206.0, 2967.0, 10404.0, 41301.0, 292434.0, 608940.0, 65514.0, 15233.0, 4260.0, 1537.0, 774.0, 437.0, 302.0, 205.0, 176.0, 148.0, 107.0, 97.0, 71.0, 45.0, 42.0, 23.0, 20.0, 14.0, 11.0, 12.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.359375, -15.8939208984375, -15.428466796875, -14.9630126953125, -14.49755859375, -14.0321044921875, -13.566650390625, -13.1011962890625, -12.6357421875, -12.1702880859375, -11.704833984375, -11.2393798828125, -10.77392578125, -10.3084716796875, -9.843017578125, -9.3775634765625, -8.912109375, -8.4466552734375, -7.981201171875, -7.5157470703125, -7.05029296875, -6.5848388671875, -6.119384765625, -5.6539306640625, -5.1884765625, -4.7230224609375, -4.257568359375, -3.7921142578125, -3.32666015625, -2.8612060546875, -2.395751953125, -1.9302978515625, -1.46484375, -0.9993896484375, -0.533935546875, -0.0684814453125, 0.39697265625, 0.8624267578125, 1.327880859375, 1.7933349609375, 2.2587890625, 2.7242431640625, 3.189697265625, 3.6551513671875, 4.12060546875, 4.5860595703125, 5.051513671875, 5.5169677734375, 5.982421875, 6.4478759765625, 6.913330078125, 7.3787841796875, 7.84423828125, 8.3096923828125, 8.775146484375, 9.2406005859375, 9.7060546875, 10.1715087890625, 10.636962890625, 11.1024169921875, 11.56787109375, 12.0333251953125, 12.498779296875, 12.9642333984375, 13.4296875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 2.0, 7.0, 11.0, 5.0, 14.0, 9.0, 8.0, 17.0, 25.0, 26.0, 27.0, 35.0, 45.0, 36.0, 49.0, 54.0, 67.0, 95.0, 169.0, 1474.0, 327.0, 110.0, 64.0, 54.0, 51.0, 45.0, 27.0, 32.0, 31.0, 24.0, 26.0, 12.0, 13.0, 11.0, 13.0, 7.0, 10.0, 2.0, 4.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-22.859375, -22.219970703125, -21.58056640625, -20.941162109375, -20.3017578125, -19.662353515625, -19.02294921875, -18.383544921875, -17.744140625, -17.104736328125, -16.46533203125, -15.825927734375, -15.1865234375, -14.547119140625, -13.90771484375, -13.268310546875, -12.62890625, -11.989501953125, -11.35009765625, -10.710693359375, -10.0712890625, -9.431884765625, -8.79248046875, -8.153076171875, -7.513671875, -6.874267578125, -6.23486328125, -5.595458984375, -4.9560546875, -4.316650390625, -3.67724609375, -3.037841796875, -2.3984375, -1.759033203125, -1.11962890625, -0.480224609375, 0.1591796875, 0.798583984375, 1.43798828125, 2.077392578125, 2.716796875, 3.356201171875, 3.99560546875, 4.635009765625, 5.2744140625, 5.913818359375, 6.55322265625, 7.192626953125, 7.83203125, 8.471435546875, 9.11083984375, 9.750244140625, 10.3896484375, 11.029052734375, 11.66845703125, 12.307861328125, 12.947265625, 13.586669921875, 14.22607421875, 14.865478515625, 15.5048828125, 16.144287109375, 16.78369140625, 17.423095703125, 18.0625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 9.0, 8.0, 16.0, 12.0, 18.0, 17.0, 22.0, 40.0, 44.0, 37.0, 63.0, 79.0, 121.0, 246.0, 439.0, 1258.0, 9873.0, 2861951.0, 265418.0, 4144.0, 781.0, 358.0, 189.0, 136.0, 89.0, 84.0, 49.0, 33.0, 33.0, 22.0, 19.0, 16.0, 16.0, 15.0, 6.0, 5.0, 8.0, 5.0, 7.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.71875, -47.029296875, -45.33984375, -43.650390625, -41.9609375, -40.271484375, -38.58203125, -36.892578125, -35.203125, -33.513671875, -31.82421875, -30.134765625, -28.4453125, -26.755859375, -25.06640625, -23.376953125, -21.6875, -19.998046875, -18.30859375, -16.619140625, -14.9296875, -13.240234375, -11.55078125, -9.861328125, -8.171875, -6.482421875, -4.79296875, -3.103515625, -1.4140625, 0.275390625, 1.96484375, 3.654296875, 5.34375, 7.033203125, 8.72265625, 10.412109375, 12.1015625, 13.791015625, 15.48046875, 17.169921875, 18.859375, 20.548828125, 22.23828125, 23.927734375, 25.6171875, 27.306640625, 28.99609375, 30.685546875, 32.375, 34.064453125, 35.75390625, 37.443359375, 39.1328125, 40.822265625, 42.51171875, 44.201171875, 45.890625, 47.580078125, 49.26953125, 50.958984375, 52.6484375, 54.337890625, 56.02734375, 57.716796875, 59.40625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 14.0, 286.0, 595.0, 116.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.23345947265625, -217.005859375, -212.77825927734375, -208.5506591796875, -204.3230438232422, -200.09544372558594, -195.8678436279297, -191.64024353027344, -187.4126434326172, -183.18504333496094, -178.9574432373047, -174.72982788085938, -170.50222778320312, -166.27462768554688, -162.04702758789062, -157.81942749023438, -153.59182739257812, -149.36422729492188, -145.13662719726562, -140.90902709960938, -136.68141174316406, -132.4538116455078, -128.22621154785156, -123.99861145019531, -119.77099609375, -115.54339599609375, -111.31578826904297, -107.08818817138672, -102.86058807373047, -98.63298034667969, -94.40538024902344, -90.17778015136719, -85.9501953125, -81.72259521484375, -77.49498748779297, -73.26738739013672, -69.03978729248047, -64.81217956542969, -60.58457946777344, -56.35697937011719, -52.129371643066406, -47.90176773071289, -43.67416763305664, -39.446563720703125, -35.218963623046875, -30.99135971069336, -26.763755798339844, -22.53615379333496, -18.308551788330078, -14.080949783325195, -9.853346824645996, -5.625743865966797, -1.398141860961914, 2.8294601440429688, 7.057064056396484, 11.284666061401367, 15.51226806640625, 19.739870071411133, 23.967472076416016, 28.19507598876953, 32.42267608642578, 36.6502799987793, 40.87788391113281, 45.10548400878906, 49.33308792114258]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 9.0, 11.0, 14.0, 12.0, 11.0, 25.0, 19.0, 35.0, 19.0, 37.0, 43.0, 63.0, 43.0, 41.0, 37.0, 44.0, 55.0, 49.0, 43.0, 44.0, 41.0, 51.0, 46.0, 42.0, 28.0, 30.0, 18.0, 19.0, 18.0, 15.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.21122360229492, -50.403079986572266, -48.594940185546875, -46.78679656982422, -44.97865295410156, -43.17051315307617, -41.362369537353516, -39.554229736328125, -37.74608612060547, -35.93794250488281, -34.12980270385742, -32.321659088134766, -30.513517379760742, -28.70537567138672, -26.897232055664062, -25.08909034729004, -23.280948638916016, -21.472806930541992, -19.66466522216797, -17.856521606445312, -16.04837989807129, -14.240238189697266, -12.432095527648926, -10.623952865600586, -8.815811157226562, -7.007668972015381, -5.199526786804199, -3.3913846015930176, -1.583242416381836, 0.2248992919921875, 2.0330419540405273, 3.841184616088867, 5.649322509765625, 7.457464694976807, 9.265606880187988, 11.073749542236328, 12.881891250610352, 14.690032958984375, 16.49817657470703, 18.306318283081055, 20.114459991455078, 21.9226016998291, 23.730743408203125, 25.53888702392578, 27.347028732299805, 29.155170440673828, 30.963314056396484, 32.771453857421875, 34.57959747314453, 36.38774108886719, 38.19588088989258, 40.004024505615234, 41.812164306640625, 43.62030792236328, 45.42845153808594, 47.236595153808594, 49.044734954833984, 50.85287857055664, 52.66101837158203, 54.46916198730469, 56.277305603027344, 58.085445404052734, 59.89358901977539, 61.70172882080078, 63.50987243652344]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 5.0, 8.0, 6.0, 9.0, 9.0, 10.0, 16.0, 15.0, 18.0, 29.0, 22.0, 16.0, 18.0, 34.0, 21.0, 24.0, 33.0, 38.0, 42.0, 42.0, 47.0, 62.0, 36.0, 47.0, 44.0, 41.0, 29.0, 39.0, 30.0, 17.0, 25.0, 25.0, 21.0, 18.0, 17.0, 23.0, 10.0, 13.0, 11.0, 9.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.58984375, -6.3924560546875, -6.195068359375, -5.9976806640625, -5.80029296875, -5.6029052734375, -5.405517578125, -5.2081298828125, -5.0107421875, -4.8133544921875, -4.615966796875, -4.4185791015625, -4.22119140625, -4.0238037109375, -3.826416015625, -3.6290283203125, -3.431640625, -3.2342529296875, -3.036865234375, -2.8394775390625, -2.64208984375, -2.4447021484375, -2.247314453125, -2.0499267578125, -1.8525390625, -1.6551513671875, -1.457763671875, -1.2603759765625, -1.06298828125, -0.8656005859375, -0.668212890625, -0.4708251953125, -0.2734375, -0.0760498046875, 0.121337890625, 0.3187255859375, 0.51611328125, 0.7135009765625, 0.910888671875, 1.1082763671875, 1.3056640625, 1.5030517578125, 1.700439453125, 1.8978271484375, 2.09521484375, 2.2926025390625, 2.489990234375, 2.6873779296875, 2.884765625, 3.0821533203125, 3.279541015625, 3.4769287109375, 3.67431640625, 3.8717041015625, 4.069091796875, 4.2664794921875, 4.4638671875, 4.6612548828125, 4.858642578125, 5.0560302734375, 5.25341796875, 5.4508056640625, 5.648193359375, 5.8455810546875, 6.04296875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 10.0, 8.0, 12.0, 14.0, 19.0, 18.0, 42.0, 40.0, 48.0, 59.0, 76.0, 93.0, 147.0, 224.0, 409.0, 776.0, 2276.0, 9103.0, 46540.0, 267588.0, 1178495.0, 1839140.0, 682570.0, 135108.0, 23542.0, 4980.0, 1373.0, 587.0, 290.0, 164.0, 134.0, 84.0, 70.0, 44.0, 42.0, 35.0, 31.0, 27.0, 16.0, 11.0, 8.0, 11.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6015625, -8.317626953125, -8.03369140625, -7.749755859375, -7.4658203125, -7.181884765625, -6.89794921875, -6.614013671875, -6.330078125, -6.046142578125, -5.76220703125, -5.478271484375, -5.1943359375, -4.910400390625, -4.62646484375, -4.342529296875, -4.05859375, -3.774658203125, -3.49072265625, -3.206787109375, -2.9228515625, -2.638916015625, -2.35498046875, -2.071044921875, -1.787109375, -1.503173828125, -1.21923828125, -0.935302734375, -0.6513671875, -0.367431640625, -0.08349609375, 0.200439453125, 0.484375, 0.768310546875, 1.05224609375, 1.336181640625, 1.6201171875, 1.904052734375, 2.18798828125, 2.471923828125, 2.755859375, 3.039794921875, 3.32373046875, 3.607666015625, 3.8916015625, 4.175537109375, 4.45947265625, 4.743408203125, 5.02734375, 5.311279296875, 5.59521484375, 5.879150390625, 6.1630859375, 6.447021484375, 6.73095703125, 7.014892578125, 7.298828125, 7.582763671875, 7.86669921875, 8.150634765625, 8.4345703125, 8.718505859375, 9.00244140625, 9.286376953125, 9.5703125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 8.0, 4.0, 5.0, 9.0, 13.0, 12.0, 22.0, 21.0, 32.0, 74.0, 84.0, 126.0, 140.0, 205.0, 257.0, 375.0, 410.0, 459.0, 410.0, 365.0, 290.0, 214.0, 151.0, 112.0, 80.0, 55.0, 34.0, 26.0, 24.0, 17.0, 13.0, 11.0, 5.0, 1.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.3436279296875, -7.031005859375, -6.7183837890625, -6.40576171875, -6.0931396484375, -5.780517578125, -5.4678955078125, -5.1552734375, -4.8426513671875, -4.530029296875, -4.2174072265625, -3.90478515625, -3.5921630859375, -3.279541015625, -2.9669189453125, -2.654296875, -2.3416748046875, -2.029052734375, -1.7164306640625, -1.40380859375, -1.0911865234375, -0.778564453125, -0.4659423828125, -0.1533203125, 0.1593017578125, 0.471923828125, 0.7845458984375, 1.09716796875, 1.4097900390625, 1.722412109375, 2.0350341796875, 2.34765625, 2.6602783203125, 2.972900390625, 3.2855224609375, 3.59814453125, 3.9107666015625, 4.223388671875, 4.5360107421875, 4.8486328125, 5.1612548828125, 5.473876953125, 5.7864990234375, 6.09912109375, 6.4117431640625, 6.724365234375, 7.0369873046875, 7.349609375, 7.6622314453125, 7.974853515625, 8.2874755859375, 8.60009765625, 8.9127197265625, 9.225341796875, 9.5379638671875, 9.8505859375, 10.1632080078125, 10.475830078125, 10.7884521484375, 11.10107421875, 11.4136962890625, 11.726318359375, 12.0389404296875, 12.3515625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 14.0, 10.0, 16.0, 35.0, 46.0, 58.0, 89.0, 139.0, 198.0, 423.0, 770.0, 2319.0, 20513.0, 719004.0, 3310294.0, 130855.0, 6820.0, 1290.0, 550.0, 319.0, 167.0, 125.0, 66.0, 48.0, 39.0, 19.0, 15.0, 13.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-35.0, -34.131103515625, -33.26220703125, -32.393310546875, -31.5244140625, -30.655517578125, -29.78662109375, -28.917724609375, -28.048828125, -27.179931640625, -26.31103515625, -25.442138671875, -24.5732421875, -23.704345703125, -22.83544921875, -21.966552734375, -21.09765625, -20.228759765625, -19.35986328125, -18.490966796875, -17.6220703125, -16.753173828125, -15.88427734375, -15.015380859375, -14.146484375, -13.277587890625, -12.40869140625, -11.539794921875, -10.6708984375, -9.802001953125, -8.93310546875, -8.064208984375, -7.1953125, -6.326416015625, -5.45751953125, -4.588623046875, -3.7197265625, -2.850830078125, -1.98193359375, -1.113037109375, -0.244140625, 0.624755859375, 1.49365234375, 2.362548828125, 3.2314453125, 4.100341796875, 4.96923828125, 5.838134765625, 6.70703125, 7.575927734375, 8.44482421875, 9.313720703125, 10.1826171875, 11.051513671875, 11.92041015625, 12.789306640625, 13.658203125, 14.527099609375, 15.39599609375, 16.264892578125, 17.1337890625, 18.002685546875, 18.87158203125, 19.740478515625, 20.609375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 329.0, 684.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-605.7996826171875, -591.0722045898438, -576.3446655273438, -561.6171875, -546.8897094726562, -532.1622314453125, -517.4346923828125, -502.70721435546875, -487.9797058105469, -473.252197265625, -458.52471923828125, -443.7972106933594, -429.0697021484375, -414.34222412109375, -399.6147155761719, -384.88720703125, -370.15972900390625, -355.4322204589844, -340.7047424316406, -325.97723388671875, -311.249755859375, -296.5222473144531, -281.79473876953125, -267.0672607421875, -252.33975219726562, -237.6122589111328, -222.884765625, -208.15725708007812, -193.4297637939453, -178.7022705078125, -163.97476196289062, -149.2472686767578, -134.519775390625, -119.79228210449219, -105.06478118896484, -90.3372802734375, -75.60978698730469, -60.882293701171875, -46.15479278564453, -31.427291870117188, -16.699798583984375, -1.9723014831542969, 12.755195617675781, 27.48269271850586, 42.21018981933594, 56.93768310546875, 71.6651840209961, 86.39268493652344, 101.12017822265625, 115.84767150878906, 130.57516479492188, 145.30267333984375, 160.03016662597656, 174.75765991210938, 189.48516845703125, 204.21266174316406, 218.94015502929688, 233.6676483154297, 248.3951416015625, 263.1226501464844, 277.85015869140625, 292.57763671875, 307.3051452636719, 322.03265380859375, 336.7601318359375]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 9.0, 12.0, 7.0, 12.0, 14.0, 16.0, 25.0, 22.0, 22.0, 25.0, 29.0, 30.0, 40.0, 34.0, 30.0, 34.0, 34.0, 48.0, 45.0, 37.0, 45.0, 43.0, 35.0, 38.0, 50.0, 32.0, 33.0, 31.0, 16.0, 24.0, 20.0, 17.0, 18.0, 14.0, 11.0, 10.0, 11.0, 10.0, 10.0, 3.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.876346588134766, -27.870195388793945, -26.864046096801758, -25.857894897460938, -24.85174560546875, -23.84559440612793, -22.83944320678711, -21.833293914794922, -20.8271427154541, -19.82099151611328, -18.814842224121094, -17.808691024780273, -16.802539825439453, -15.796390533447266, -14.790239334106445, -13.784089088439941, -12.777938842773438, -11.771788597106934, -10.76563835144043, -9.75948715209961, -8.753336906433105, -7.747186660766602, -6.7410359382629395, -5.734885215759277, -4.728734970092773, -3.7225844860076904, -2.7164340019226074, -1.7102835178375244, -0.7041330337524414, 0.3020172119140625, 1.3081679344177246, 2.3143186569213867, 3.320465087890625, 4.326615333557129, 5.332766056060791, 6.338916778564453, 7.345067024230957, 8.351217269897461, 9.357368469238281, 10.363518714904785, 11.369668960571289, 12.375819206237793, 13.381969451904297, 14.388120651245117, 15.394270896911621, 16.400421142578125, 17.406572341918945, 18.412723541259766, 19.418872833251953, 20.425024032592773, 21.43117332458496, 22.43732452392578, 23.44347381591797, 24.44962501525879, 25.45577621459961, 26.461925506591797, 27.468076705932617, 28.474227905273438, 29.480377197265625, 30.486528396606445, 31.492679595947266, 32.49882888793945, 33.50497817993164, 34.511131286621094, 35.51728057861328]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 11.0, 8.0, 8.0, 18.0, 20.0, 13.0, 26.0, 25.0, 28.0, 42.0, 34.0, 35.0, 40.0, 40.0, 38.0, 55.0, 50.0, 40.0, 53.0, 44.0, 36.0, 45.0, 28.0, 45.0, 29.0, 38.0, 24.0, 29.0, 15.0, 19.0, 7.0, 11.0, 9.0, 6.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.71875, -6.49993896484375, -6.2811279296875, -6.06231689453125, -5.843505859375, -5.62469482421875, -5.4058837890625, -5.18707275390625, -4.96826171875, -4.74945068359375, -4.5306396484375, -4.31182861328125, -4.093017578125, -3.87420654296875, -3.6553955078125, -3.43658447265625, -3.2177734375, -2.99896240234375, -2.7801513671875, -2.56134033203125, -2.342529296875, -2.12371826171875, -1.9049072265625, -1.68609619140625, -1.46728515625, -1.24847412109375, -1.0296630859375, -0.81085205078125, -0.592041015625, -0.37322998046875, -0.1544189453125, 0.06439208984375, 0.283203125, 0.50201416015625, 0.7208251953125, 0.93963623046875, 1.158447265625, 1.37725830078125, 1.5960693359375, 1.81488037109375, 2.03369140625, 2.25250244140625, 2.4713134765625, 2.69012451171875, 2.908935546875, 3.12774658203125, 3.3465576171875, 3.56536865234375, 3.7841796875, 4.00299072265625, 4.2218017578125, 4.44061279296875, 4.659423828125, 4.87823486328125, 5.0970458984375, 5.31585693359375, 5.53466796875, 5.75347900390625, 5.9722900390625, 6.19110107421875, 6.409912109375, 6.62872314453125, 6.8475341796875, 7.06634521484375, 7.28515625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 9.0, 15.0, 22.0, 28.0, 49.0, 68.0, 113.0, 174.0, 286.0, 464.0, 746.0, 1229.0, 1850.0, 2913.0, 4627.0, 7404.0, 11850.0, 19040.0, 29898.0, 46491.0, 71525.0, 106126.0, 146748.0, 167317.0, 141422.0, 101117.0, 67736.0, 44067.0, 27799.0, 17298.0, 11134.0, 7100.0, 4392.0, 2749.0, 1758.0, 1083.0, 685.0, 444.0, 275.0, 171.0, 124.0, 76.0, 47.0, 30.0, 21.0, 11.0, 9.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.473876953125, -0.460113525390625, -0.44635009765625, -0.432586669921875, -0.4188232421875, -0.405059814453125, -0.39129638671875, -0.377532958984375, -0.36376953125, -0.350006103515625, -0.33624267578125, -0.322479248046875, -0.3087158203125, -0.294952392578125, -0.28118896484375, -0.267425537109375, -0.253662109375, -0.239898681640625, -0.22613525390625, -0.212371826171875, -0.1986083984375, -0.184844970703125, -0.17108154296875, -0.157318115234375, -0.1435546875, -0.129791259765625, -0.11602783203125, -0.102264404296875, -0.0885009765625, -0.074737548828125, -0.06097412109375, -0.047210693359375, -0.033447265625, -0.019683837890625, -0.00592041015625, 0.007843017578125, 0.0216064453125, 0.035369873046875, 0.04913330078125, 0.062896728515625, 0.07666015625, 0.090423583984375, 0.10418701171875, 0.117950439453125, 0.1317138671875, 0.145477294921875, 0.15924072265625, 0.173004150390625, 0.186767578125, 0.200531005859375, 0.21429443359375, 0.228057861328125, 0.2418212890625, 0.255584716796875, 0.26934814453125, 0.283111572265625, 0.296875, 0.310638427734375, 0.32440185546875, 0.338165283203125, 0.3519287109375, 0.365692138671875, 0.37945556640625, 0.393218994140625, 0.406982421875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 5.0, 9.0, 3.0, 13.0, 11.0, 8.0, 15.0, 15.0, 16.0, 30.0, 28.0, 27.0, 27.0, 30.0, 31.0, 48.0, 45.0, 39.0, 39.0, 30.0, 1056.0, 38.0, 33.0, 37.0, 33.0, 35.0, 30.0, 38.0, 28.0, 33.0, 31.0, 23.0, 19.0, 25.0, 22.0, 15.0, 13.0, 10.0, 7.0, 6.0, 3.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-4.04296875, -3.921783447265625, -3.80059814453125, -3.679412841796875, -3.5582275390625, -3.437042236328125, -3.31585693359375, -3.194671630859375, -3.073486328125, -2.952301025390625, -2.83111572265625, -2.709930419921875, -2.5887451171875, -2.467559814453125, -2.34637451171875, -2.225189208984375, -2.10400390625, -1.982818603515625, -1.86163330078125, -1.740447998046875, -1.6192626953125, -1.498077392578125, -1.37689208984375, -1.255706787109375, -1.134521484375, -1.013336181640625, -0.89215087890625, -0.770965576171875, -0.6497802734375, -0.528594970703125, -0.40740966796875, -0.286224365234375, -0.1650390625, -0.043853759765625, 0.07733154296875, 0.198516845703125, 0.3197021484375, 0.440887451171875, 0.56207275390625, 0.683258056640625, 0.804443359375, 0.925628662109375, 1.04681396484375, 1.167999267578125, 1.2891845703125, 1.410369873046875, 1.53155517578125, 1.652740478515625, 1.77392578125, 1.895111083984375, 2.01629638671875, 2.137481689453125, 2.2586669921875, 2.379852294921875, 2.50103759765625, 2.622222900390625, 2.743408203125, 2.864593505859375, 2.98577880859375, 3.106964111328125, 3.2281494140625, 3.349334716796875, 3.47052001953125, 3.591705322265625, 3.712890625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 13.0, 18.0, 30.0, 41.0, 51.0, 79.0, 123.0, 196.0, 270.0, 368.0, 559.0, 833.0, 1285.0, 1907.0, 2931.0, 4464.0, 7107.0, 11147.0, 16985.0, 26391.0, 40390.0, 60532.0, 86290.0, 117769.0, 372354.0, 957161.0, 119350.0, 88278.0, 61316.0, 41393.0, 27288.0, 17607.0, 11420.0, 7306.0, 4767.0, 3086.0, 2016.0, 1379.0, 831.0, 564.0, 370.0, 255.0, 189.0, 127.0, 86.0, 58.0, 47.0, 32.0, 22.0, 16.0, 13.0, 14.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.301513671875, -0.2921028137207031, -0.28269195556640625, -0.2732810974121094, -0.2638702392578125, -0.2544593811035156, -0.24504852294921875, -0.23563766479492188, -0.226226806640625, -0.21681594848632812, -0.20740509033203125, -0.19799423217773438, -0.1885833740234375, -0.17917251586914062, -0.16976165771484375, -0.16035079956054688, -0.15093994140625, -0.14152908325195312, -0.13211822509765625, -0.12270736694335938, -0.1132965087890625, -0.10388565063476562, -0.09447479248046875, -0.08506393432617188, -0.075653076171875, -0.06624221801757812, -0.05683135986328125, -0.047420501708984375, -0.0380096435546875, -0.028598785400390625, -0.01918792724609375, -0.009777069091796875, -0.0003662109375, 0.009044647216796875, 0.01845550537109375, 0.027866363525390625, 0.0372772216796875, 0.046688079833984375, 0.05609893798828125, 0.06550979614257812, 0.074920654296875, 0.08433151245117188, 0.09374237060546875, 0.10315322875976562, 0.1125640869140625, 0.12197494506835938, 0.13138580322265625, 0.14079666137695312, 0.15020751953125, 0.15961837768554688, 0.16902923583984375, 0.17844009399414062, 0.1878509521484375, 0.19726181030273438, 0.20667266845703125, 0.21608352661132812, 0.225494384765625, 0.23490524291992188, 0.24431610107421875, 0.2537269592285156, 0.2631378173828125, 0.2725486755371094, 0.28195953369140625, 0.2913703918457031, 0.30078125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 5.0, 7.0, 7.0, 14.0, 10.0, 7.0, 18.0, 32.0, 45.0, 49.0, 66.0, 115.0, 117.0, 136.0, 96.0, 74.0, 51.0, 37.0, 30.0, 26.0, 8.0, 22.0, 10.0, 9.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014404296875, -0.013982295989990234, -0.013560295104980469, -0.013138294219970703, -0.012716293334960938, -0.012294292449951172, -0.011872291564941406, -0.01145029067993164, -0.011028289794921875, -0.01060628890991211, -0.010184288024902344, -0.009762287139892578, -0.009340286254882812, -0.008918285369873047, -0.008496284484863281, -0.008074283599853516, -0.00765228271484375, -0.007230281829833984, -0.006808280944824219, -0.006386280059814453, -0.0059642791748046875, -0.005542278289794922, -0.005120277404785156, -0.004698276519775391, -0.004276275634765625, -0.0038542747497558594, -0.0034322738647460938, -0.003010272979736328, -0.0025882720947265625, -0.002166271209716797, -0.0017442703247070312, -0.0013222694396972656, -0.0009002685546875, -0.0004782676696777344, -5.626678466796875e-05, 0.0003657341003417969, 0.0007877349853515625, 0.0012097358703613281, 0.0016317367553710938, 0.0020537376403808594, 0.002475738525390625, 0.0028977394104003906, 0.0033197402954101562, 0.003741741180419922, 0.0041637420654296875, 0.004585742950439453, 0.005007743835449219, 0.005429744720458984, 0.00585174560546875, 0.006273746490478516, 0.006695747375488281, 0.007117748260498047, 0.0075397491455078125, 0.007961750030517578, 0.008383750915527344, 0.00880575180053711, 0.009227752685546875, 0.00964975357055664, 0.010071754455566406, 0.010493755340576172, 0.010915756225585938, 0.011337757110595703, 0.011759757995605469, 0.012181758880615234, 0.012603759765625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 12.0, 15.0, 14.0, 21.0, 54.0, 57.0, 109.0, 145.0, 367.0, 1920.0, 984249.0, 60214.0, 708.0, 280.0, 141.0, 85.0, 55.0, 25.0, 26.0, 17.0, 14.0, 9.0, 6.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2685546875, -0.25954437255859375, -0.2505340576171875, -0.24152374267578125, -0.232513427734375, -0.22350311279296875, -0.2144927978515625, -0.20548248291015625, -0.19647216796875, -0.18746185302734375, -0.1784515380859375, -0.16944122314453125, -0.160430908203125, -0.15142059326171875, -0.1424102783203125, -0.13339996337890625, -0.1243896484375, -0.11537933349609375, -0.1063690185546875, -0.09735870361328125, -0.088348388671875, -0.07933807373046875, -0.0703277587890625, -0.06131744384765625, -0.05230712890625, -0.04329681396484375, -0.0342864990234375, -0.02527618408203125, -0.016265869140625, -0.00725555419921875, 0.0017547607421875, 0.01076507568359375, 0.019775390625, 0.02878570556640625, 0.0377960205078125, 0.04680633544921875, 0.055816650390625, 0.06482696533203125, 0.0738372802734375, 0.08284759521484375, 0.09185791015625, 0.10086822509765625, 0.1098785400390625, 0.11888885498046875, 0.127899169921875, 0.13690948486328125, 0.1459197998046875, 0.15493011474609375, 0.1639404296875, 0.17295074462890625, 0.1819610595703125, 0.19097137451171875, 0.199981689453125, 0.20899200439453125, 0.2180023193359375, 0.22701263427734375, 0.23602294921875, 0.24503326416015625, 0.2540435791015625, 0.26305389404296875, 0.272064208984375, 0.28107452392578125, 0.2900848388671875, 0.29909515380859375, 0.30810546875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 8.0, 35.0, 115.0, 400.0, 310.0, 104.0, 27.0, 10.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007931796833872795, -0.006773454137146473, -0.0056151109747588634, -0.004456767812371254, -0.003298425115644932, -0.0021400824189186096, -0.0009817392565310001, 0.00017660390585660934, 0.0013349466025829315, 0.0024932895321398973, 0.003651632461696863, 0.004809975624084473, 0.005968318320810795, 0.007126661017537117, 0.008285004645586014, 0.009443347342312336, 0.010601690039038658, 0.01176003273576498, 0.012918375432491302, 0.0140767190605402, 0.015235061757266521, 0.016393404453992844, 0.01755174808204174, 0.018710091710090637, 0.019868433475494385, 0.02102677710354328, 0.02218511886894703, 0.023343462496995926, 0.024501804262399673, 0.02566014789044857, 0.026818491518497467, 0.027976833283901215, 0.029135175049304962, 0.03029351867735386, 0.031451862305402756, 0.0326102040708065, 0.03376854583621025, 0.0349268913269043, 0.036085233092308044, 0.03724357485771179, 0.03840191662311554, 0.03956025838851929, 0.04071860387921333, 0.04187694564461708, 0.04303528741002083, 0.044193632900714874, 0.04535197466611862, 0.04651031643152237, 0.047668661922216415, 0.04882700368762016, 0.04998534917831421, 0.05114369094371796, 0.052302032709121704, 0.05346037447452545, 0.0546187199652195, 0.055777061730623245, 0.05693540722131729, 0.05809374898672104, 0.059252094477415085, 0.06041043624281883, 0.06156877800822258, 0.06272712349891663, 0.06388546526432037, 0.06504380702972412, 0.06620214879512787]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 1.0, 10.0, 15.0, 12.0, 15.0, 22.0, 25.0, 32.0, 48.0, 45.0, 47.0, 54.0, 57.0, 49.0, 62.0, 36.0, 76.0, 50.0, 42.0, 48.0, 39.0, 45.0, 39.0, 19.0, 28.0, 20.0, 16.0, 14.0, 17.0, 4.0, 4.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008097052574157715, -0.007872756570577621, -0.007648460566997528, -0.007424164563417435, -0.007199868559837341, -0.006975572556257248, -0.0067512765526771545, -0.006526980549097061, -0.006302684545516968, -0.006078388541936874, -0.005854092538356781, -0.005629796534776688, -0.005405500531196594, -0.005181204527616501, -0.0049569085240364075, -0.004732612520456314, -0.004508316516876221, -0.004284020513296127, -0.004059724509716034, -0.0038354285061359406, -0.003611132502555847, -0.003386836498975754, -0.0031625404953956604, -0.002938244491815567, -0.0027139484882354736, -0.0024896524846553802, -0.002265356481075287, -0.0020410604774951935, -0.0018167644739151, -0.0015924684703350067, -0.0013681724667549133, -0.00114387646317482, -0.0009195804595947266, -0.0006952844560146332, -0.0004709884524345398, -0.0002466924488544464, -2.2396445274353027e-05, 0.00020189955830574036, 0.00042619556188583374, 0.0006504915654659271, 0.0008747875690460205, 0.001099083572626114, 0.0013233795762062073, 0.0015476755797863007, 0.001771971583366394, 0.0019962675869464874, 0.002220563590526581, 0.002444859594106674, 0.0026691555976867676, 0.002893451601266861, 0.0031177476048469543, 0.0033420436084270477, 0.003566339612007141, 0.0037906356155872345, 0.004014931619167328, 0.004239227622747421, 0.004463523626327515, 0.004687819629907608, 0.004912115633487701, 0.005136411637067795, 0.005360707640647888, 0.005585003644227982, 0.005809299647808075, 0.006033595651388168, 0.006257891654968262]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 11.0, 8.0, 8.0, 18.0, 20.0, 13.0, 26.0, 26.0, 27.0, 42.0, 34.0, 35.0, 40.0, 40.0, 37.0, 56.0, 50.0, 40.0, 53.0, 44.0, 36.0, 45.0, 28.0, 45.0, 29.0, 38.0, 24.0, 29.0, 15.0, 19.0, 7.0, 11.0, 9.0, 6.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.71875, -6.49993896484375, -6.2811279296875, -6.06231689453125, -5.843505859375, -5.62469482421875, -5.4058837890625, -5.18707275390625, -4.96826171875, -4.74945068359375, -4.5306396484375, -4.31182861328125, -4.093017578125, -3.87420654296875, -3.6553955078125, -3.43658447265625, -3.2177734375, -2.99896240234375, -2.7801513671875, -2.56134033203125, -2.342529296875, -2.12371826171875, -1.9049072265625, -1.68609619140625, -1.46728515625, -1.24847412109375, -1.0296630859375, -0.81085205078125, -0.592041015625, -0.37322998046875, -0.1544189453125, 0.06439208984375, 0.283203125, 0.50201416015625, 0.7208251953125, 0.93963623046875, 1.158447265625, 1.37725830078125, 1.5960693359375, 1.81488037109375, 2.03369140625, 2.25250244140625, 2.4713134765625, 2.69012451171875, 2.908935546875, 3.12774658203125, 3.3465576171875, 3.56536865234375, 3.7841796875, 4.00299072265625, 4.2218017578125, 4.44061279296875, 4.659423828125, 4.87823486328125, 5.0970458984375, 5.31585693359375, 5.53466796875, 5.75347900390625, 5.9722900390625, 6.19110107421875, 6.409912109375, 6.62872314453125, 6.8475341796875, 7.06634521484375, 7.28515625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 6.0, 16.0, 9.0, 15.0, 16.0, 22.0, 32.0, 40.0, 64.0, 57.0, 97.0, 135.0, 188.0, 330.0, 521.0, 985.0, 1830.0, 3897.0, 8801.0, 20368.0, 46377.0, 108496.0, 263245.0, 332166.0, 148972.0, 61813.0, 27604.0, 11605.0, 5236.0, 2497.0, 1181.0, 711.0, 416.0, 261.0, 174.0, 105.0, 80.0, 49.0, 39.0, 22.0, 19.0, 18.0, 13.0, 5.0, 8.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1484375, -6.9034423828125, -6.658447265625, -6.4134521484375, -6.16845703125, -5.9234619140625, -5.678466796875, -5.4334716796875, -5.1884765625, -4.9434814453125, -4.698486328125, -4.4534912109375, -4.20849609375, -3.9635009765625, -3.718505859375, -3.4735107421875, -3.228515625, -2.9835205078125, -2.738525390625, -2.4935302734375, -2.24853515625, -2.0035400390625, -1.758544921875, -1.5135498046875, -1.2685546875, -1.0235595703125, -0.778564453125, -0.5335693359375, -0.28857421875, -0.0435791015625, 0.201416015625, 0.4464111328125, 0.69140625, 0.9364013671875, 1.181396484375, 1.4263916015625, 1.67138671875, 1.9163818359375, 2.161376953125, 2.4063720703125, 2.6513671875, 2.8963623046875, 3.141357421875, 3.3863525390625, 3.63134765625, 3.8763427734375, 4.121337890625, 4.3663330078125, 4.611328125, 4.8563232421875, 5.101318359375, 5.3463134765625, 5.59130859375, 5.8363037109375, 6.081298828125, 6.3262939453125, 6.5712890625, 6.8162841796875, 7.061279296875, 7.3062744140625, 7.55126953125, 7.7962646484375, 8.041259765625, 8.2862548828125, 8.53125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 6.0, 12.0, 11.0, 14.0, 13.0, 13.0, 18.0, 18.0, 26.0, 35.0, 31.0, 31.0, 53.0, 48.0, 58.0, 65.0, 141.0, 261.0, 1418.0, 216.0, 112.0, 65.0, 49.0, 41.0, 40.0, 43.0, 35.0, 23.0, 32.0, 22.0, 23.0, 15.0, 9.0, 9.0, 4.0, 9.0, 9.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.21875, -18.62353515625, -18.0283203125, -17.43310546875, -16.837890625, -16.24267578125, -15.6474609375, -15.05224609375, -14.45703125, -13.86181640625, -13.2666015625, -12.67138671875, -12.076171875, -11.48095703125, -10.8857421875, -10.29052734375, -9.6953125, -9.10009765625, -8.5048828125, -7.90966796875, -7.314453125, -6.71923828125, -6.1240234375, -5.52880859375, -4.93359375, -4.33837890625, -3.7431640625, -3.14794921875, -2.552734375, -1.95751953125, -1.3623046875, -0.76708984375, -0.171875, 0.42333984375, 1.0185546875, 1.61376953125, 2.208984375, 2.80419921875, 3.3994140625, 3.99462890625, 4.58984375, 5.18505859375, 5.7802734375, 6.37548828125, 6.970703125, 7.56591796875, 8.1611328125, 8.75634765625, 9.3515625, 9.94677734375, 10.5419921875, 11.13720703125, 11.732421875, 12.32763671875, 12.9228515625, 13.51806640625, 14.11328125, 14.70849609375, 15.3037109375, 15.89892578125, 16.494140625, 17.08935546875, 17.6845703125, 18.27978515625, 18.875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 12.0, 13.0, 20.0, 24.0, 22.0, 42.0, 74.0, 73.0, 120.0, 211.0, 348.0, 499.0, 1018.0, 6615.0, 249525.0, 2828794.0, 53685.0, 2560.0, 777.0, 451.0, 252.0, 157.0, 99.0, 85.0, 51.0, 38.0, 31.0, 22.0, 15.0, 9.0, 6.0, 9.0, 8.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-35.375, -34.2802734375, -33.185546875, -32.0908203125, -30.99609375, -29.9013671875, -28.806640625, -27.7119140625, -26.6171875, -25.5224609375, -24.427734375, -23.3330078125, -22.23828125, -21.1435546875, -20.048828125, -18.9541015625, -17.859375, -16.7646484375, -15.669921875, -14.5751953125, -13.48046875, -12.3857421875, -11.291015625, -10.1962890625, -9.1015625, -8.0068359375, -6.912109375, -5.8173828125, -4.72265625, -3.6279296875, -2.533203125, -1.4384765625, -0.34375, 0.7509765625, 1.845703125, 2.9404296875, 4.03515625, 5.1298828125, 6.224609375, 7.3193359375, 8.4140625, 9.5087890625, 10.603515625, 11.6982421875, 12.79296875, 13.8876953125, 14.982421875, 16.0771484375, 17.171875, 18.2666015625, 19.361328125, 20.4560546875, 21.55078125, 22.6455078125, 23.740234375, 24.8349609375, 25.9296875, 27.0244140625, 28.119140625, 29.2138671875, 30.30859375, 31.4033203125, 32.498046875, 33.5927734375, 34.6875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 89.0, 913.0, 16.0, 1.0], "bins": [-675.0516357421875, -664.0450439453125, -653.0384521484375, -642.0318603515625, -631.0252685546875, -620.0186767578125, -609.0120849609375, -598.0054931640625, -586.9988403320312, -575.9922485351562, -564.9856567382812, -553.9790649414062, -542.9724731445312, -531.9658813476562, -520.959228515625, -509.9526672363281, -498.94610595703125, -487.93951416015625, -476.93292236328125, -465.92633056640625, -454.9197082519531, -443.9131164550781, -432.9065246582031, -421.8999328613281, -410.893310546875, -399.88671875, -388.880126953125, -377.87353515625, -366.8669128417969, -355.8603210449219, -344.8537292480469, -333.8471374511719, -322.8405456542969, -311.8339538574219, -300.8273620605469, -289.82073974609375, -278.81414794921875, -267.80755615234375, -256.80096435546875, -245.79437255859375, -234.78778076171875, -223.78118896484375, -212.7745819091797, -201.7679901123047, -190.7613983154297, -179.75479125976562, -168.74819946289062, -157.74160766601562, -146.73500061035156, -135.72840881347656, -124.72180938720703, -113.7152099609375, -102.7086181640625, -91.70201873779297, -80.69541931152344, -69.68882751464844, -58.682228088378906, -47.67563247680664, -36.669036865234375, -25.662437438964844, -14.655841827392578, -3.6492462158203125, 7.357353210449219, 18.36394500732422, 29.37054443359375]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 8.0, 2.0, 6.0, 10.0, 8.0, 8.0, 8.0, 10.0, 15.0, 15.0, 12.0, 15.0, 23.0, 19.0, 24.0, 30.0, 29.0, 35.0, 36.0, 35.0, 39.0, 36.0, 43.0, 47.0, 37.0, 42.0, 39.0, 44.0, 24.0, 31.0, 21.0, 24.0, 21.0, 32.0, 27.0, 23.0, 25.0, 23.0, 6.0, 11.0, 10.0, 10.0, 11.0, 12.0, 3.0, 5.0, 1.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.55262756347656, -36.398128509521484, -35.243629455566406, -34.089134216308594, -32.934635162353516, -31.780136108398438, -30.62563705444336, -29.47113800048828, -28.316640853881836, -27.162141799926758, -26.007644653320312, -24.853145599365234, -23.698646545410156, -22.54414939880371, -21.389650344848633, -20.235153198242188, -19.08065414428711, -17.92615509033203, -16.771657943725586, -15.617158889770508, -14.462660789489746, -13.308162689208984, -12.153663635253906, -10.999165534973145, -9.844667434692383, -8.690169334411621, -7.535670757293701, -6.381172180175781, -5.2266740798950195, -4.072175979614258, -2.917677402496338, -1.763178825378418, -0.6086807250976562, 0.5458176136016846, 1.7003159523010254, 2.854814291000366, 4.009312629699707, 5.163810729980469, 6.318309307098389, 7.472807884216309, 8.62730598449707, 9.781804084777832, 10.936302185058594, 12.090801239013672, 13.245299339294434, 14.399797439575195, 15.554296493530273, 16.70879364013672, 17.863292694091797, 19.017791748046875, 20.17228889465332, 21.3267879486084, 22.481285095214844, 23.635784149169922, 24.790283203125, 25.944782257080078, 27.099279403686523, 28.2537784576416, 29.408275604248047, 30.562774658203125, 31.717273712158203, 32.87177276611328, 34.026268005371094, 35.18076705932617, 36.33526611328125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0, 3.0, 4.0, 11.0, 12.0, 12.0, 24.0, 17.0, 16.0, 13.0, 33.0, 26.0, 41.0, 42.0, 31.0, 39.0, 57.0, 35.0, 48.0, 45.0, 58.0, 55.0, 40.0, 36.0, 43.0, 34.0, 39.0, 37.0, 24.0, 28.0, 15.0, 16.0, 16.0, 14.0, 10.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.04296875, -6.818359375, -6.59375, -6.369140625, -6.14453125, -5.919921875, -5.6953125, -5.470703125, -5.24609375, -5.021484375, -4.796875, -4.572265625, -4.34765625, -4.123046875, -3.8984375, -3.673828125, -3.44921875, -3.224609375, -3.0, -2.775390625, -2.55078125, -2.326171875, -2.1015625, -1.876953125, -1.65234375, -1.427734375, -1.203125, -0.978515625, -0.75390625, -0.529296875, -0.3046875, -0.080078125, 0.14453125, 0.369140625, 0.59375, 0.818359375, 1.04296875, 1.267578125, 1.4921875, 1.716796875, 1.94140625, 2.166015625, 2.390625, 2.615234375, 2.83984375, 3.064453125, 3.2890625, 3.513671875, 3.73828125, 3.962890625, 4.1875, 4.412109375, 4.63671875, 4.861328125, 5.0859375, 5.310546875, 5.53515625, 5.759765625, 5.984375, 6.208984375, 6.43359375, 6.658203125, 6.8828125, 7.107421875, 7.33203125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 12.0, 17.0, 26.0, 33.0, 46.0, 69.0, 118.0, 179.0, 301.0, 535.0, 924.0, 1949.0, 4692.0, 13532.0, 44970.0, 163864.0, 575764.0, 1429234.0, 1282797.0, 481655.0, 136660.0, 37866.0, 11351.0, 4000.0, 1709.0, 815.0, 420.0, 266.0, 151.0, 120.0, 70.0, 49.0, 27.0, 13.0, 15.0, 13.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.42578125, -6.20361328125, -5.9814453125, -5.75927734375, -5.537109375, -5.31494140625, -5.0927734375, -4.87060546875, -4.6484375, -4.42626953125, -4.2041015625, -3.98193359375, -3.759765625, -3.53759765625, -3.3154296875, -3.09326171875, -2.87109375, -2.64892578125, -2.4267578125, -2.20458984375, -1.982421875, -1.76025390625, -1.5380859375, -1.31591796875, -1.09375, -0.87158203125, -0.6494140625, -0.42724609375, -0.205078125, 0.01708984375, 0.2392578125, 0.46142578125, 0.68359375, 0.90576171875, 1.1279296875, 1.35009765625, 1.572265625, 1.79443359375, 2.0166015625, 2.23876953125, 2.4609375, 2.68310546875, 2.9052734375, 3.12744140625, 3.349609375, 3.57177734375, 3.7939453125, 4.01611328125, 4.23828125, 4.46044921875, 4.6826171875, 4.90478515625, 5.126953125, 5.34912109375, 5.5712890625, 5.79345703125, 6.015625, 6.23779296875, 6.4599609375, 6.68212890625, 6.904296875, 7.12646484375, 7.3486328125, 7.57080078125, 7.79296875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 4.0, 8.0, 14.0, 13.0, 19.0, 24.0, 43.0, 38.0, 50.0, 74.0, 94.0, 122.0, 196.0, 265.0, 298.0, 369.0, 375.0, 375.0, 332.0, 314.0, 237.0, 190.0, 139.0, 99.0, 96.0, 59.0, 41.0, 32.0, 30.0, 23.0, 14.0, 9.0, 11.0, 10.0, 9.0, 7.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0], "bins": [-7.71484375, -7.46588134765625, -7.2169189453125, -6.96795654296875, -6.718994140625, -6.47003173828125, -6.2210693359375, -5.97210693359375, -5.72314453125, -5.47418212890625, -5.2252197265625, -4.97625732421875, -4.727294921875, -4.47833251953125, -4.2293701171875, -3.98040771484375, -3.7314453125, -3.48248291015625, -3.2335205078125, -2.98455810546875, -2.735595703125, -2.48663330078125, -2.2376708984375, -1.98870849609375, -1.73974609375, -1.49078369140625, -1.2418212890625, -0.99285888671875, -0.743896484375, -0.49493408203125, -0.2459716796875, 0.00299072265625, 0.251953125, 0.50091552734375, 0.7498779296875, 0.99884033203125, 1.247802734375, 1.49676513671875, 1.7457275390625, 1.99468994140625, 2.24365234375, 2.49261474609375, 2.7415771484375, 2.99053955078125, 3.239501953125, 3.48846435546875, 3.7374267578125, 3.98638916015625, 4.2353515625, 4.48431396484375, 4.7332763671875, 4.98223876953125, 5.231201171875, 5.48016357421875, 5.7291259765625, 5.97808837890625, 6.22705078125, 6.47601318359375, 6.7249755859375, 6.97393798828125, 7.222900390625, 7.47186279296875, 7.7208251953125, 7.96978759765625, 8.21875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 1.0, 11.0, 11.0, 4.0, 17.0, 16.0, 19.0, 13.0, 27.0, 40.0, 58.0, 68.0, 93.0, 124.0, 229.0, 380.0, 685.0, 1363.0, 3162.0, 8377.0, 25775.0, 100474.0, 505938.0, 2125541.0, 1139479.0, 209888.0, 48563.0, 14597.0, 4994.0, 2020.0, 969.0, 484.0, 281.0, 174.0, 118.0, 80.0, 45.0, 42.0, 36.0, 15.0, 19.0, 6.0, 10.0, 7.0, 4.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.444091796875, -11.08349609375, -10.722900390625, -10.3623046875, -10.001708984375, -9.64111328125, -9.280517578125, -8.919921875, -8.559326171875, -8.19873046875, -7.838134765625, -7.4775390625, -7.116943359375, -6.75634765625, -6.395751953125, -6.03515625, -5.674560546875, -5.31396484375, -4.953369140625, -4.5927734375, -4.232177734375, -3.87158203125, -3.510986328125, -3.150390625, -2.789794921875, -2.42919921875, -2.068603515625, -1.7080078125, -1.347412109375, -0.98681640625, -0.626220703125, -0.265625, 0.094970703125, 0.45556640625, 0.816162109375, 1.1767578125, 1.537353515625, 1.89794921875, 2.258544921875, 2.619140625, 2.979736328125, 3.34033203125, 3.700927734375, 4.0615234375, 4.422119140625, 4.78271484375, 5.143310546875, 5.50390625, 5.864501953125, 6.22509765625, 6.585693359375, 6.9462890625, 7.306884765625, 7.66748046875, 8.028076171875, 8.388671875, 8.749267578125, 9.10986328125, 9.470458984375, 9.8310546875, 10.191650390625, 10.55224609375, 10.912841796875, 11.2734375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 93.0, 452.0, 400.0, 63.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.30988311767578, -67.13794708251953, -60.96601104736328, -54.7940788269043, -48.62214279174805, -42.4502067565918, -36.27827453613281, -30.106338500976562, -23.934402465820312, -17.762466430664062, -11.590532302856445, -5.418598175048828, 0.7533378601074219, 6.925273895263672, 13.097206115722656, 19.269142150878906, 25.441078186035156, 31.613014221191406, 37.784950256347656, 43.95688247680664, 50.12881851196289, 56.30075454711914, 62.472686767578125, 68.64462280273438, 74.81655883789062, 80.98849487304688, 87.16043090820312, 93.33236694335938, 99.50430297851562, 105.67623901367188, 111.8481674194336, 118.02010345458984, 124.19204711914062, 130.36398315429688, 136.53591918945312, 142.70785522460938, 148.87979125976562, 155.05172729492188, 161.22366333007812, 167.39559936523438, 173.56753540039062, 179.73947143554688, 185.91140747070312, 192.08334350585938, 198.25527954101562, 204.42721557617188, 210.59915161132812, 216.77108764648438, 222.94300842285156, 229.1149444580078, 235.28688049316406, 241.4588165283203, 247.63075256347656, 253.8026885986328, 259.974609375, 266.14654541015625, 272.3184814453125, 278.49041748046875, 284.662353515625, 290.83428955078125, 297.0062255859375, 303.17816162109375, 309.35009765625, 315.52203369140625, 321.6939697265625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 4.0, 8.0, 3.0, 12.0, 17.0, 13.0, 15.0, 24.0, 28.0, 31.0, 22.0, 40.0, 35.0, 50.0, 41.0, 47.0, 38.0, 42.0, 37.0, 28.0, 44.0, 48.0, 34.0, 39.0, 35.0, 42.0, 23.0, 32.0, 20.0, 22.0, 17.0, 17.0, 11.0, 17.0, 12.0, 10.0, 6.0, 6.0, 3.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.025562286376953, -30.02846336364746, -29.03136444091797, -28.034263610839844, -27.03716468811035, -26.04006576538086, -25.042966842651367, -24.045867919921875, -23.04876708984375, -22.051668167114258, -21.054569244384766, -20.05746841430664, -19.06036949157715, -18.063270568847656, -17.066171646118164, -16.069072723388672, -15.071972846984863, -14.074873924255371, -13.077774047851562, -12.08067512512207, -11.083575248718262, -10.08647632598877, -9.089376449584961, -8.092277526855469, -7.095178127288818, -6.098078727722168, -5.100979328155518, -4.103879928588867, -3.106780767440796, -2.1096816062927246, -1.1125822067260742, -0.11548280715942383, 0.8816165924072266, 1.878715991973877, 2.8758153915405273, 3.8729145526885986, 4.870014190673828, 5.86711311340332, 6.864212512969971, 7.861311912536621, 8.85841178894043, 9.855510711669922, 10.85261058807373, 11.849709510803223, 12.846809387207031, 13.843908309936523, 14.841007232666016, 15.838107109069824, 16.835205078125, 17.832304000854492, 18.829402923583984, 19.82650375366211, 20.8236026763916, 21.820701599121094, 22.817800521850586, 23.814899444580078, 24.812000274658203, 25.809099197387695, 26.806198120117188, 27.803298950195312, 28.800397872924805, 29.797496795654297, 30.79459571838379, 31.79169464111328, 32.788795471191406]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 8.0, 7.0, 13.0, 7.0, 15.0, 16.0, 24.0, 10.0, 15.0, 27.0, 17.0, 35.0, 27.0, 33.0, 41.0, 44.0, 47.0, 41.0, 31.0, 48.0, 50.0, 38.0, 35.0, 47.0, 47.0, 34.0, 34.0, 22.0, 20.0, 30.0, 22.0, 21.0, 22.0, 17.0, 7.0, 5.0, 9.0, 9.0, 7.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.97265625, -6.7708740234375, -6.569091796875, -6.3673095703125, -6.16552734375, -5.9637451171875, -5.761962890625, -5.5601806640625, -5.3583984375, -5.1566162109375, -4.954833984375, -4.7530517578125, -4.55126953125, -4.3494873046875, -4.147705078125, -3.9459228515625, -3.744140625, -3.5423583984375, -3.340576171875, -3.1387939453125, -2.93701171875, -2.7352294921875, -2.533447265625, -2.3316650390625, -2.1298828125, -1.9281005859375, -1.726318359375, -1.5245361328125, -1.32275390625, -1.1209716796875, -0.919189453125, -0.7174072265625, -0.515625, -0.3138427734375, -0.112060546875, 0.0897216796875, 0.29150390625, 0.4932861328125, 0.695068359375, 0.8968505859375, 1.0986328125, 1.3004150390625, 1.502197265625, 1.7039794921875, 1.90576171875, 2.1075439453125, 2.309326171875, 2.5111083984375, 2.712890625, 2.9146728515625, 3.116455078125, 3.3182373046875, 3.52001953125, 3.7218017578125, 3.923583984375, 4.1253662109375, 4.3271484375, 4.5289306640625, 4.730712890625, 4.9324951171875, 5.13427734375, 5.3360595703125, 5.537841796875, 5.7396240234375, 5.94140625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 13.0, 8.0, 18.0, 30.0, 39.0, 48.0, 83.0, 150.0, 225.0, 276.0, 509.0, 781.0, 1143.0, 1996.0, 3146.0, 5337.0, 8862.0, 15539.0, 26050.0, 45374.0, 78734.0, 132832.0, 197858.0, 200118.0, 136516.0, 80502.0, 46545.0, 26836.0, 15694.0, 9122.0, 5510.0, 3254.0, 1947.0, 1291.0, 750.0, 521.0, 313.0, 197.0, 135.0, 68.0, 64.0, 42.0, 27.0, 20.0, 13.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61181640625, -0.5914382934570312, -0.5710601806640625, -0.5506820678710938, -0.530303955078125, -0.5099258422851562, -0.4895477294921875, -0.46916961669921875, -0.44879150390625, -0.42841339111328125, -0.4080352783203125, -0.38765716552734375, -0.367279052734375, -0.34690093994140625, -0.3265228271484375, -0.30614471435546875, -0.2857666015625, -0.26538848876953125, -0.2450103759765625, -0.22463226318359375, -0.204254150390625, -0.18387603759765625, -0.1634979248046875, -0.14311981201171875, -0.12274169921875, -0.10236358642578125, -0.0819854736328125, -0.06160736083984375, -0.041229248046875, -0.02085113525390625, -0.0004730224609375, 0.01990509033203125, 0.040283203125, 0.06066131591796875, 0.0810394287109375, 0.10141754150390625, 0.121795654296875, 0.14217376708984375, 0.1625518798828125, 0.18292999267578125, 0.20330810546875, 0.22368621826171875, 0.2440643310546875, 0.26444244384765625, 0.284820556640625, 0.30519866943359375, 0.3255767822265625, 0.34595489501953125, 0.3663330078125, 0.38671112060546875, 0.4070892333984375, 0.42746734619140625, 0.447845458984375, 0.46822357177734375, 0.4886016845703125, 0.5089797973632812, 0.52935791015625, 0.5497360229492188, 0.5701141357421875, 0.5904922485351562, 0.610870361328125, 0.6312484741210938, 0.6516265869140625, 0.6720046997070312, 0.6923828125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 5.0, 12.0, 10.0, 9.0, 21.0, 16.0, 29.0, 13.0, 19.0, 14.0, 24.0, 25.0, 23.0, 34.0, 34.0, 41.0, 33.0, 51.0, 32.0, 1063.0, 29.0, 42.0, 48.0, 39.0, 33.0, 37.0, 24.0, 34.0, 22.0, 27.0, 32.0, 20.0, 16.0, 14.0, 24.0, 23.0, 7.0, 12.0, 8.0, 11.0, 6.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.62890625, -3.50250244140625, -3.3760986328125, -3.24969482421875, -3.123291015625, -2.99688720703125, -2.8704833984375, -2.74407958984375, -2.61767578125, -2.49127197265625, -2.3648681640625, -2.23846435546875, -2.112060546875, -1.98565673828125, -1.8592529296875, -1.73284912109375, -1.6064453125, -1.48004150390625, -1.3536376953125, -1.22723388671875, -1.100830078125, -0.97442626953125, -0.8480224609375, -0.72161865234375, -0.59521484375, -0.46881103515625, -0.3424072265625, -0.21600341796875, -0.089599609375, 0.03680419921875, 0.1632080078125, 0.28961181640625, 0.416015625, 0.54241943359375, 0.6688232421875, 0.79522705078125, 0.921630859375, 1.04803466796875, 1.1744384765625, 1.30084228515625, 1.42724609375, 1.55364990234375, 1.6800537109375, 1.80645751953125, 1.932861328125, 2.05926513671875, 2.1856689453125, 2.31207275390625, 2.4384765625, 2.56488037109375, 2.6912841796875, 2.81768798828125, 2.944091796875, 3.07049560546875, 3.1968994140625, 3.32330322265625, 3.44970703125, 3.57611083984375, 3.7025146484375, 3.82891845703125, 3.955322265625, 4.08172607421875, 4.2081298828125, 4.33453369140625, 4.4609375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 10.0, 19.0, 24.0, 39.0, 58.0, 79.0, 141.0, 198.0, 338.0, 581.0, 957.0, 1710.0, 3211.0, 5826.0, 11436.0, 21989.0, 43405.0, 81401.0, 143960.0, 937950.0, 535517.0, 141475.0, 79137.0, 42027.0, 21575.0, 10917.0, 5721.0, 3122.0, 1757.0, 974.0, 626.0, 363.0, 213.0, 132.0, 87.0, 55.0, 27.0, 21.0, 16.0, 11.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.49658203125, -0.48055267333984375, -0.4645233154296875, -0.44849395751953125, -0.432464599609375, -0.41643524169921875, -0.4004058837890625, -0.38437652587890625, -0.36834716796875, -0.35231781005859375, -0.3362884521484375, -0.32025909423828125, -0.304229736328125, -0.28820037841796875, -0.2721710205078125, -0.25614166259765625, -0.2401123046875, -0.22408294677734375, -0.2080535888671875, -0.19202423095703125, -0.175994873046875, -0.15996551513671875, -0.1439361572265625, -0.12790679931640625, -0.11187744140625, -0.09584808349609375, -0.0798187255859375, -0.06378936767578125, -0.047760009765625, -0.03173065185546875, -0.0157012939453125, 0.00032806396484375, 0.016357421875, 0.03238677978515625, 0.0484161376953125, 0.06444549560546875, 0.080474853515625, 0.09650421142578125, 0.1125335693359375, 0.12856292724609375, 0.14459228515625, 0.16062164306640625, 0.1766510009765625, 0.19268035888671875, 0.208709716796875, 0.22473907470703125, 0.2407684326171875, 0.25679779052734375, 0.2728271484375, 0.28885650634765625, 0.3048858642578125, 0.32091522216796875, 0.336944580078125, 0.35297393798828125, 0.3690032958984375, 0.38503265380859375, 0.40106201171875, 0.41709136962890625, 0.4331207275390625, 0.44915008544921875, 0.465179443359375, 0.48120880126953125, 0.4972381591796875, 0.5132675170898438, 0.529296875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 5.0, 7.0, 7.0, 10.0, 11.0, 12.0, 14.0, 21.0, 30.0, 24.0, 24.0, 41.0, 36.0, 61.0, 75.0, 88.0, 101.0, 80.0, 53.0, 41.0, 35.0, 41.0, 21.0, 30.0, 13.0, 13.0, 10.0, 12.0, 6.0, 10.0, 12.0, 12.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0152587890625, -0.014785528182983398, -0.014312267303466797, -0.013839006423950195, -0.013365745544433594, -0.012892484664916992, -0.01241922378540039, -0.011945962905883789, -0.011472702026367188, -0.010999441146850586, -0.010526180267333984, -0.010052919387817383, -0.009579658508300781, -0.00910639762878418, -0.008633136749267578, -0.008159875869750977, -0.007686614990234375, -0.0072133541107177734, -0.006740093231201172, -0.00626683235168457, -0.005793571472167969, -0.005320310592651367, -0.004847049713134766, -0.004373788833618164, -0.0039005279541015625, -0.003427267074584961, -0.0029540061950683594, -0.002480745315551758, -0.0020074844360351562, -0.0015342235565185547, -0.0010609626770019531, -0.0005877017974853516, -0.00011444091796875, 0.00035881996154785156, 0.0008320808410644531, 0.0013053417205810547, 0.0017786026000976562, 0.002251863479614258, 0.0027251243591308594, 0.003198385238647461, 0.0036716461181640625, 0.004144906997680664, 0.004618167877197266, 0.005091428756713867, 0.005564689636230469, 0.00603795051574707, 0.006511211395263672, 0.0069844722747802734, 0.007457733154296875, 0.007930994033813477, 0.008404254913330078, 0.00887751579284668, 0.009350776672363281, 0.009824037551879883, 0.010297298431396484, 0.010770559310913086, 0.011243820190429688, 0.011717081069946289, 0.01219034194946289, 0.012663602828979492, 0.013136863708496094, 0.013610124588012695, 0.014083385467529297, 0.014556646347045898, 0.0150299072265625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 4.0, 7.0, 14.0, 8.0, 9.0, 18.0, 23.0, 17.0, 31.0, 31.0, 44.0, 48.0, 88.0, 111.0, 186.0, 260.0, 421.0, 1189.0, 30338.0, 992850.0, 20453.0, 1070.0, 437.0, 229.0, 166.0, 126.0, 80.0, 70.0, 39.0, 36.0, 23.0, 24.0, 18.0, 14.0, 11.0, 8.0, 10.0, 7.0, 5.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.305419921875, -0.2962913513183594, -0.28716278076171875, -0.2780342102050781, -0.2689056396484375, -0.2597770690917969, -0.25064849853515625, -0.24151992797851562, -0.232391357421875, -0.22326278686523438, -0.21413421630859375, -0.20500564575195312, -0.1958770751953125, -0.18674850463867188, -0.17761993408203125, -0.16849136352539062, -0.15936279296875, -0.15023422241210938, -0.14110565185546875, -0.13197708129882812, -0.1228485107421875, -0.11371994018554688, -0.10459136962890625, -0.09546279907226562, -0.086334228515625, -0.07720565795898438, -0.06807708740234375, -0.058948516845703125, -0.0498199462890625, -0.040691375732421875, -0.03156280517578125, -0.022434234619140625, -0.0133056640625, -0.004177093505859375, 0.00495147705078125, 0.014080047607421875, 0.0232086181640625, 0.032337188720703125, 0.04146575927734375, 0.050594329833984375, 0.059722900390625, 0.06885147094726562, 0.07798004150390625, 0.08710861206054688, 0.0962371826171875, 0.10536575317382812, 0.11449432373046875, 0.12362289428710938, 0.13275146484375, 0.14188003540039062, 0.15100860595703125, 0.16013717651367188, 0.1692657470703125, 0.17839431762695312, 0.18752288818359375, 0.19665145874023438, 0.205780029296875, 0.21490859985351562, 0.22403717041015625, 0.23316574096679688, 0.2422943115234375, 0.2514228820800781, 0.26055145263671875, 0.2696800231933594, 0.27880859375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 317.0, 680.0, 11.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0902738869190216, -0.08281730860471725, -0.0753607302904129, -0.06790414452552795, -0.0604475662112236, -0.05299098789691925, -0.0455344095826149, -0.03807782754302025, -0.030621249228715897, -0.023164669051766396, -0.015708088874816895, -0.008251510560512543, -0.0007949303835630417, 0.006661649793386459, 0.014118228107690811, 0.02157481014728546, 0.029031388461589813, 0.036487966775894165, 0.043944548815488815, 0.05140112712979317, 0.05885770916938782, 0.06631428748369217, 0.07377086579799652, 0.08122745156288147, 0.08868402242660522, 0.09614060074090958, 0.10359717905521393, 0.11105376482009888, 0.11851034313440323, 0.12596692144870758, 0.13342350721359253, 0.14088007807731628, 0.14833666384220123, 0.15579324960708618, 0.16324982047080994, 0.17070640623569489, 0.17816297709941864, 0.1856195628643036, 0.19307613372802734, 0.2005327194929123, 0.20798930525779724, 0.2154458910226822, 0.22290246188640594, 0.2303590476512909, 0.23781561851501465, 0.2452722042798996, 0.25272879004478455, 0.2601853609085083, 0.26764193177223206, 0.2750985026359558, 0.28255510330200195, 0.2900116741657257, 0.29746824502944946, 0.3049248456954956, 0.31238141655921936, 0.3198379874229431, 0.32729458808898926, 0.334751158952713, 0.34220775961875916, 0.3496643304824829, 0.35712090134620667, 0.3645774722099304, 0.37203407287597656, 0.3794906437397003, 0.3869472146034241]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 9.0, 4.0, 7.0, 6.0, 15.0, 21.0, 26.0, 20.0, 35.0, 28.0, 31.0, 33.0, 39.0, 51.0, 54.0, 54.0, 57.0, 57.0, 52.0, 50.0, 43.0, 41.0, 46.0, 39.0, 37.0, 27.0, 28.0, 24.0, 12.0, 9.0, 18.0, 10.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.024103105068206787, -0.023459849879145622, -0.022816594690084457, -0.022173339501023293, -0.021530084311962128, -0.020886829122900963, -0.020243573933839798, -0.019600318744778633, -0.018957063555717468, -0.018313808366656303, -0.01767055317759514, -0.017027297988533974, -0.01638404279947281, -0.015740787610411644, -0.015097532421350479, -0.014454277232289314, -0.01381102204322815, -0.013167766854166985, -0.01252451166510582, -0.011881256476044655, -0.01123800128698349, -0.010594746097922325, -0.00995149090886116, -0.009308235719799995, -0.00866498053073883, -0.008021725341677666, -0.007378470152616501, -0.006735214963555336, -0.006091959774494171, -0.005448704585433006, -0.004805449396371841, -0.004162194207310677, -0.0035189390182495117, -0.002875683829188347, -0.002232428640127182, -0.0015891734510660172, -0.0009459182620048523, -0.00030266307294368744, 0.0003405921161174774, 0.0009838473051786423, 0.0016271024942398071, 0.002270357683300972, 0.002913612872362137, 0.0035568680614233017, 0.0042001232504844666, 0.004843378439545631, 0.005486633628606796, 0.006129888817667961, 0.006773144006729126, 0.007416399195790291, 0.008059654384851456, 0.00870290957391262, 0.009346164762973785, 0.00998941995203495, 0.010632675141096115, 0.01127593033015728, 0.011919185519218445, 0.01256244070827961, 0.013205695897340775, 0.01384895108640194, 0.014492206275463104, 0.015135461464524269, 0.015778716653585434, 0.0164219718426466, 0.017065227031707764]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 8.0, 7.0, 13.0, 7.0, 15.0, 15.0, 25.0, 9.0, 16.0, 27.0, 17.0, 35.0, 26.0, 33.0, 42.0, 43.0, 48.0, 41.0, 30.0, 48.0, 51.0, 37.0, 36.0, 45.0, 48.0, 35.0, 34.0, 22.0, 19.0, 31.0, 21.0, 22.0, 22.0, 17.0, 7.0, 4.0, 10.0, 9.0, 7.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.97265625, -6.77093505859375, -6.5692138671875, -6.36749267578125, -6.165771484375, -5.96405029296875, -5.7623291015625, -5.56060791015625, -5.35888671875, -5.15716552734375, -4.9554443359375, -4.75372314453125, -4.552001953125, -4.35028076171875, -4.1485595703125, -3.94683837890625, -3.7451171875, -3.54339599609375, -3.3416748046875, -3.13995361328125, -2.938232421875, -2.73651123046875, -2.5347900390625, -2.33306884765625, -2.13134765625, -1.92962646484375, -1.7279052734375, -1.52618408203125, -1.324462890625, -1.12274169921875, -0.9210205078125, -0.71929931640625, -0.517578125, -0.31585693359375, -0.1141357421875, 0.08758544921875, 0.289306640625, 0.49102783203125, 0.6927490234375, 0.89447021484375, 1.09619140625, 1.29791259765625, 1.4996337890625, 1.70135498046875, 1.903076171875, 2.10479736328125, 2.3065185546875, 2.50823974609375, 2.7099609375, 2.91168212890625, 3.1134033203125, 3.31512451171875, 3.516845703125, 3.71856689453125, 3.9202880859375, 4.12200927734375, 4.32373046875, 4.52545166015625, 4.7271728515625, 4.92889404296875, 5.130615234375, 5.33233642578125, 5.5340576171875, 5.73577880859375, 5.9375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 2.0, 3.0, 3.0, 7.0, 12.0, 13.0, 18.0, 23.0, 28.0, 29.0, 50.0, 75.0, 117.0, 148.0, 196.0, 274.0, 440.0, 748.0, 1446.0, 2991.0, 6987.0, 18107.0, 49437.0, 131053.0, 328523.0, 310810.0, 121830.0, 45725.0, 16568.0, 6647.0, 2785.0, 1328.0, 736.0, 440.0, 256.0, 185.0, 128.0, 104.0, 72.0, 53.0, 49.0, 24.0, 19.0, 29.0, 13.0, 9.0, 10.0, 2.0, 5.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2265625, -7.9425048828125, -7.658447265625, -7.3743896484375, -7.09033203125, -6.8062744140625, -6.522216796875, -6.2381591796875, -5.9541015625, -5.6700439453125, -5.385986328125, -5.1019287109375, -4.81787109375, -4.5338134765625, -4.249755859375, -3.9656982421875, -3.681640625, -3.3975830078125, -3.113525390625, -2.8294677734375, -2.54541015625, -2.2613525390625, -1.977294921875, -1.6932373046875, -1.4091796875, -1.1251220703125, -0.841064453125, -0.5570068359375, -0.27294921875, 0.0111083984375, 0.295166015625, 0.5792236328125, 0.86328125, 1.1473388671875, 1.431396484375, 1.7154541015625, 1.99951171875, 2.2835693359375, 2.567626953125, 2.8516845703125, 3.1357421875, 3.4197998046875, 3.703857421875, 3.9879150390625, 4.27197265625, 4.5560302734375, 4.840087890625, 5.1241455078125, 5.408203125, 5.6922607421875, 5.976318359375, 6.2603759765625, 6.54443359375, 6.8284912109375, 7.112548828125, 7.3966064453125, 7.6806640625, 7.9647216796875, 8.248779296875, 8.5328369140625, 8.81689453125, 9.1009521484375, 9.385009765625, 9.6690673828125, 9.953125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 12.0, 16.0, 17.0, 16.0, 20.0, 20.0, 28.0, 42.0, 33.0, 40.0, 57.0, 70.0, 103.0, 160.0, 247.0, 1392.0, 204.0, 119.0, 82.0, 49.0, 57.0, 44.0, 37.0, 30.0, 22.0, 26.0, 20.0, 13.0, 9.0, 11.0, 12.0, 4.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.75, -16.176513671875, -15.60302734375, -15.029541015625, -14.4560546875, -13.882568359375, -13.30908203125, -12.735595703125, -12.162109375, -11.588623046875, -11.01513671875, -10.441650390625, -9.8681640625, -9.294677734375, -8.72119140625, -8.147705078125, -7.57421875, -7.000732421875, -6.42724609375, -5.853759765625, -5.2802734375, -4.706787109375, -4.13330078125, -3.559814453125, -2.986328125, -2.412841796875, -1.83935546875, -1.265869140625, -0.6923828125, -0.118896484375, 0.45458984375, 1.028076171875, 1.6015625, 2.175048828125, 2.74853515625, 3.322021484375, 3.8955078125, 4.468994140625, 5.04248046875, 5.615966796875, 6.189453125, 6.762939453125, 7.33642578125, 7.909912109375, 8.4833984375, 9.056884765625, 9.63037109375, 10.203857421875, 10.77734375, 11.350830078125, 11.92431640625, 12.497802734375, 13.0712890625, 13.644775390625, 14.21826171875, 14.791748046875, 15.365234375, 15.938720703125, 16.51220703125, 17.085693359375, 17.6591796875, 18.232666015625, 18.80615234375, 19.379638671875, 19.953125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 3.0, 8.0, 5.0, 9.0, 16.0, 20.0, 26.0, 38.0, 58.0, 71.0, 121.0, 171.0, 276.0, 416.0, 851.0, 2491.0, 66719.0, 2980839.0, 88633.0, 2784.0, 807.0, 480.0, 259.0, 173.0, 137.0, 73.0, 54.0, 45.0, 32.0, 23.0, 15.0, 14.0, 12.0, 6.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-47.40625, -46.14306640625, -44.8798828125, -43.61669921875, -42.353515625, -41.09033203125, -39.8271484375, -38.56396484375, -37.30078125, -36.03759765625, -34.7744140625, -33.51123046875, -32.248046875, -30.98486328125, -29.7216796875, -28.45849609375, -27.1953125, -25.93212890625, -24.6689453125, -23.40576171875, -22.142578125, -20.87939453125, -19.6162109375, -18.35302734375, -17.08984375, -15.82666015625, -14.5634765625, -13.30029296875, -12.037109375, -10.77392578125, -9.5107421875, -8.24755859375, -6.984375, -5.72119140625, -4.4580078125, -3.19482421875, -1.931640625, -0.66845703125, 0.5947265625, 1.85791015625, 3.12109375, 4.38427734375, 5.6474609375, 6.91064453125, 8.173828125, 9.43701171875, 10.7001953125, 11.96337890625, 13.2265625, 14.48974609375, 15.7529296875, 17.01611328125, 18.279296875, 19.54248046875, 20.8056640625, 22.06884765625, 23.33203125, 24.59521484375, 25.8583984375, 27.12158203125, 28.384765625, 29.64794921875, 30.9111328125, 32.17431640625, 33.4375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 10.0, 13.0, 26.0, 90.0, 144.0, 191.0, 195.0, 167.0, 113.0, 38.0, 20.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.012578964233398, -11.406538009643555, -9.800498008728027, -8.194457054138184, -6.588416576385498, -4.9823760986328125, -3.3763351440429688, -1.7702951431274414, -0.16425418853759766, 1.4417864084243774, 3.0478270053863525, 4.653867721557617, 6.259908199310303, 7.865948677062988, 9.471989631652832, 11.07802963256836, 12.684070587158203, 14.290111541748047, 15.896151542663574, 17.502193450927734, 19.108232498168945, 20.71427345275879, 22.320314407348633, 23.926353454589844, 25.532394409179688, 27.13843536376953, 28.744476318359375, 30.35051727294922, 31.95655632019043, 33.562599182128906, 35.16864013671875, 36.77467727661133, 38.38071823120117, 39.986759185791016, 41.59280014038086, 43.1988410949707, 44.80488204956055, 46.410919189453125, 48.01696014404297, 49.62300109863281, 51.229042053222656, 52.8350830078125, 54.441123962402344, 56.04716491699219, 57.65320587158203, 59.259246826171875, 60.86528778076172, 62.4713249206543, 64.0773696899414, 65.68341064453125, 67.2894515991211, 68.89549255371094, 70.50153350830078, 72.10757446289062, 73.71361541748047, 75.31965637207031, 76.92568969726562, 78.53173065185547, 80.13777160644531, 81.74381256103516, 83.349853515625, 84.95589447021484, 86.56193542480469, 88.16797637939453, 89.77401733398438]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 10.0, 4.0, 8.0, 11.0, 10.0, 8.0, 22.0, 28.0, 16.0, 28.0, 33.0, 33.0, 33.0, 29.0, 38.0, 43.0, 41.0, 40.0, 49.0, 60.0, 39.0, 37.0, 41.0, 47.0, 37.0, 40.0, 35.0, 29.0, 26.0, 23.0, 17.0, 20.0, 15.0, 10.0, 7.0, 9.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.79722595214844, -31.507078170776367, -30.21693229675293, -28.92678451538086, -27.63663673400879, -26.34648895263672, -25.05634307861328, -23.76619529724121, -22.47604751586914, -21.18589973449707, -19.895753860473633, -18.605606079101562, -17.315458297729492, -16.025310516357422, -14.735164642333984, -13.445016860961914, -12.154870986938477, -10.864724159240723, -9.574576377868652, -8.284429550170898, -6.994282245635986, -5.704134941101074, -4.41398811340332, -3.12384033203125, -1.833693504333496, -0.5435463190078735, 0.746600866317749, 2.036747932434082, 3.326895236968994, 4.617042541503906, 5.90718936920166, 7.1973371505737305, 8.487483978271484, 9.777630805969238, 11.067778587341309, 12.357925415039062, 13.648073196411133, 14.938220024108887, 16.22836685180664, 17.51851463317871, 18.80866241455078, 20.09881019592285, 21.38895606994629, 22.67910385131836, 23.96925163269043, 25.2593994140625, 26.549545288085938, 27.839693069458008, 29.129838943481445, 30.419986724853516, 31.710132598876953, 33.000282287597656, 34.290428161621094, 35.58057403564453, 36.87071990966797, 38.16086959838867, 39.45101547241211, 40.74116134643555, 42.03131103515625, 43.32145690917969, 44.611602783203125, 45.90175247192383, 47.191898345947266, 48.48204803466797, 49.772193908691406]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 6.0, 9.0, 10.0, 7.0, 15.0, 12.0, 17.0, 30.0, 22.0, 24.0, 20.0, 39.0, 36.0, 31.0, 42.0, 40.0, 52.0, 60.0, 42.0, 48.0, 35.0, 45.0, 39.0, 48.0, 36.0, 43.0, 31.0, 34.0, 23.0, 15.0, 20.0, 15.0, 8.0, 10.0, 7.0, 8.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.97265625, -7.74774169921875, -7.5228271484375, -7.29791259765625, -7.072998046875, -6.84808349609375, -6.6231689453125, -6.39825439453125, -6.17333984375, -5.94842529296875, -5.7235107421875, -5.49859619140625, -5.273681640625, -5.04876708984375, -4.8238525390625, -4.59893798828125, -4.3740234375, -4.14910888671875, -3.9241943359375, -3.69927978515625, -3.474365234375, -3.24945068359375, -3.0245361328125, -2.79962158203125, -2.57470703125, -2.34979248046875, -2.1248779296875, -1.89996337890625, -1.675048828125, -1.45013427734375, -1.2252197265625, -1.00030517578125, -0.775390625, -0.55047607421875, -0.3255615234375, -0.10064697265625, 0.124267578125, 0.34918212890625, 0.5740966796875, 0.79901123046875, 1.02392578125, 1.24884033203125, 1.4737548828125, 1.69866943359375, 1.923583984375, 2.14849853515625, 2.3734130859375, 2.59832763671875, 2.8232421875, 3.04815673828125, 3.2730712890625, 3.49798583984375, 3.722900390625, 3.94781494140625, 4.1727294921875, 4.39764404296875, 4.62255859375, 4.84747314453125, 5.0723876953125, 5.29730224609375, 5.522216796875, 5.74713134765625, 5.9720458984375, 6.19696044921875, 6.421875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 9.0, 8.0, 14.0, 21.0, 27.0, 22.0, 49.0, 50.0, 72.0, 107.0, 161.0, 210.0, 336.0, 509.0, 4607.0, 3932556.0, 253138.0, 1032.0, 412.0, 286.0, 192.0, 127.0, 83.0, 52.0, 61.0, 28.0, 31.0, 20.0, 14.0, 17.0, 7.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.875, -54.96484375, -53.0546875, -51.14453125, -49.234375, -47.32421875, -45.4140625, -43.50390625, -41.59375, -39.68359375, -37.7734375, -35.86328125, -33.953125, -32.04296875, -30.1328125, -28.22265625, -26.3125, -24.40234375, -22.4921875, -20.58203125, -18.671875, -16.76171875, -14.8515625, -12.94140625, -11.03125, -9.12109375, -7.2109375, -5.30078125, -3.390625, -1.48046875, 0.4296875, 2.33984375, 4.25, 6.16015625, 8.0703125, 9.98046875, 11.890625, 13.80078125, 15.7109375, 17.62109375, 19.53125, 21.44140625, 23.3515625, 25.26171875, 27.171875, 29.08203125, 30.9921875, 32.90234375, 34.8125, 36.72265625, 38.6328125, 40.54296875, 42.453125, 44.36328125, 46.2734375, 48.18359375, 50.09375, 52.00390625, 53.9140625, 55.82421875, 57.734375, 59.64453125, 61.5546875, 63.46484375, 65.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 6.0, 4.0, 5.0, 7.0, 10.0, 9.0, 14.0, 17.0, 27.0, 31.0, 42.0, 59.0, 78.0, 96.0, 126.0, 193.0, 254.0, 361.0, 456.0, 516.0, 483.0, 315.0, 238.0, 179.0, 141.0, 94.0, 77.0, 62.0, 41.0, 29.0, 18.0, 19.0, 15.0, 12.0, 13.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-9.0390625, -8.7425537109375, -8.446044921875, -8.1495361328125, -7.85302734375, -7.5565185546875, -7.260009765625, -6.9635009765625, -6.6669921875, -6.3704833984375, -6.073974609375, -5.7774658203125, -5.48095703125, -5.1844482421875, -4.887939453125, -4.5914306640625, -4.294921875, -3.9984130859375, -3.701904296875, -3.4053955078125, -3.10888671875, -2.8123779296875, -2.515869140625, -2.2193603515625, -1.9228515625, -1.6263427734375, -1.329833984375, -1.0333251953125, -0.73681640625, -0.4403076171875, -0.143798828125, 0.1527099609375, 0.44921875, 0.7457275390625, 1.042236328125, 1.3387451171875, 1.63525390625, 1.9317626953125, 2.228271484375, 2.5247802734375, 2.8212890625, 3.1177978515625, 3.414306640625, 3.7108154296875, 4.00732421875, 4.3038330078125, 4.600341796875, 4.8968505859375, 5.193359375, 5.4898681640625, 5.786376953125, 6.0828857421875, 6.37939453125, 6.6759033203125, 6.972412109375, 7.2689208984375, 7.5654296875, 7.8619384765625, 8.158447265625, 8.4549560546875, 8.75146484375, 9.0479736328125, 9.344482421875, 9.6409912109375, 9.9375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 5.0, 6.0, 13.0, 13.0, 25.0, 24.0, 37.0, 47.0, 58.0, 87.0, 172.0, 301.0, 840.0, 6447.0, 173240.0, 3765867.0, 236979.0, 8299.0, 1053.0, 290.0, 172.0, 102.0, 54.0, 36.0, 28.0, 29.0, 15.0, 11.0, 7.0, 4.0, 7.0, 3.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.5625, -39.53662109375, -38.5107421875, -37.48486328125, -36.458984375, -35.43310546875, -34.4072265625, -33.38134765625, -32.35546875, -31.32958984375, -30.3037109375, -29.27783203125, -28.251953125, -27.22607421875, -26.2001953125, -25.17431640625, -24.1484375, -23.12255859375, -22.0966796875, -21.07080078125, -20.044921875, -19.01904296875, -17.9931640625, -16.96728515625, -15.94140625, -14.91552734375, -13.8896484375, -12.86376953125, -11.837890625, -10.81201171875, -9.7861328125, -8.76025390625, -7.734375, -6.70849609375, -5.6826171875, -4.65673828125, -3.630859375, -2.60498046875, -1.5791015625, -0.55322265625, 0.47265625, 1.49853515625, 2.5244140625, 3.55029296875, 4.576171875, 5.60205078125, 6.6279296875, 7.65380859375, 8.6796875, 9.70556640625, 10.7314453125, 11.75732421875, 12.783203125, 13.80908203125, 14.8349609375, 15.86083984375, 16.88671875, 17.91259765625, 18.9384765625, 19.96435546875, 20.990234375, 22.01611328125, 23.0419921875, 24.06787109375, 25.09375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 44.0, 146.0, 347.0, 342.0, 110.0, 20.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.33321380615234, -96.31324768066406, -92.29328155517578, -88.2733154296875, -84.25335693359375, -80.23339080810547, -76.21342468261719, -72.1934585571289, -68.17349243164062, -64.15352630615234, -60.13356399536133, -56.11359786987305, -52.09363555908203, -48.07366943359375, -44.05370330810547, -40.03373718261719, -36.01377868652344, -31.99381446838379, -27.97385025024414, -23.95388412475586, -19.93391990661621, -15.913955688476562, -11.893989562988281, -7.874025344848633, -3.8540611267089844, 0.16590356826782227, 4.185868263244629, 8.205833435058594, 12.225797653198242, 16.24576187133789, 20.265727996826172, 24.28569221496582, 28.305648803710938, 32.32561492919922, 36.345577239990234, 40.365543365478516, 44.38550567626953, 48.40547180175781, 52.425437927246094, 56.445404052734375, 60.46536636352539, 64.4853286743164, 68.50529479980469, 72.52526092529297, 76.54522705078125, 80.565185546875, 84.58515930175781, 88.60511779785156, 92.62508392333984, 96.64505004882812, 100.6650161743164, 104.68498229980469, 108.70494079589844, 112.72490692138672, 116.744873046875, 120.76483917236328, 124.78480529785156, 128.8047637939453, 132.82473754882812, 136.84469604492188, 140.8646697998047, 144.88462829589844, 148.90460205078125, 152.924560546875, 156.94451904296875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 8.0, 3.0, 6.0, 6.0, 6.0, 11.0, 12.0, 13.0, 11.0, 20.0, 17.0, 17.0, 27.0, 23.0, 37.0, 38.0, 34.0, 39.0, 32.0, 40.0, 51.0, 48.0, 40.0, 46.0, 39.0, 30.0, 37.0, 32.0, 38.0, 22.0, 29.0, 31.0, 29.0, 22.0, 19.0, 15.0, 10.0, 10.0, 15.0, 10.0, 7.0, 4.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-35.067378997802734, -34.06101989746094, -33.054656982421875, -32.04829788208008, -31.04193878173828, -30.03557777404785, -29.029216766357422, -28.022857666015625, -27.016498565673828, -26.0101375579834, -25.0037784576416, -23.997417449951172, -22.991058349609375, -21.984697341918945, -20.978336334228516, -19.97197723388672, -18.96561622619629, -17.95925521850586, -16.952896118164062, -15.946535110473633, -14.940176010131836, -13.933815002441406, -12.927454948425293, -11.92109489440918, -10.914734840393066, -9.908374786376953, -8.90201473236084, -7.895654201507568, -6.889294147491455, -5.882934093475342, -4.87657356262207, -3.870213508605957, -2.863851547241211, -1.857491374015808, -0.8511312007904053, 0.1552290916442871, 1.1615891456604004, 2.1679491996765137, 3.174309730529785, 4.180669784545898, 5.187029838562012, 6.193389892578125, 7.199749946594238, 8.206110000610352, 9.212471008300781, 10.218830108642578, 11.225191116333008, 12.231551170349121, 13.237911224365234, 14.244271278381348, 15.250631332397461, 16.25699234008789, 17.263351440429688, 18.269712448120117, 19.276073455810547, 20.282432556152344, 21.28879165649414, 22.29515266418457, 23.301511764526367, 24.307872772216797, 25.314231872558594, 26.320592880249023, 27.326953887939453, 28.33331298828125, 29.33967399597168]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 2.0, 3.0, 4.0, 7.0, 8.0, 4.0, 11.0, 24.0, 22.0, 18.0, 22.0, 20.0, 28.0, 29.0, 34.0, 40.0, 27.0, 39.0, 39.0, 45.0, 39.0, 39.0, 48.0, 51.0, 27.0, 47.0, 21.0, 40.0, 38.0, 25.0, 25.0, 27.0, 13.0, 15.0, 17.0, 22.0, 15.0, 14.0, 4.0, 8.0, 6.0, 7.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.19140625, -6.00732421875, -5.8232421875, -5.63916015625, -5.455078125, -5.27099609375, -5.0869140625, -4.90283203125, -4.71875, -4.53466796875, -4.3505859375, -4.16650390625, -3.982421875, -3.79833984375, -3.6142578125, -3.43017578125, -3.24609375, -3.06201171875, -2.8779296875, -2.69384765625, -2.509765625, -2.32568359375, -2.1416015625, -1.95751953125, -1.7734375, -1.58935546875, -1.4052734375, -1.22119140625, -1.037109375, -0.85302734375, -0.6689453125, -0.48486328125, -0.30078125, -0.11669921875, 0.0673828125, 0.25146484375, 0.435546875, 0.61962890625, 0.8037109375, 0.98779296875, 1.171875, 1.35595703125, 1.5400390625, 1.72412109375, 1.908203125, 2.09228515625, 2.2763671875, 2.46044921875, 2.64453125, 2.82861328125, 3.0126953125, 3.19677734375, 3.380859375, 3.56494140625, 3.7490234375, 3.93310546875, 4.1171875, 4.30126953125, 4.4853515625, 4.66943359375, 4.853515625, 5.03759765625, 5.2216796875, 5.40576171875, 5.58984375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 11.0, 15.0, 18.0, 19.0, 48.0, 59.0, 111.0, 143.0, 227.0, 322.0, 560.0, 918.0, 1390.0, 2382.0, 4100.0, 7542.0, 13533.0, 25790.0, 52634.0, 106989.0, 205060.0, 265150.0, 178736.0, 89301.0, 44297.0, 21947.0, 11680.0, 6388.0, 3564.0, 2089.0, 1350.0, 768.0, 483.0, 298.0, 222.0, 135.0, 101.0, 56.0, 24.0, 37.0, 17.0, 6.0, 15.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.91650390625, -0.8890457153320312, -0.8615875244140625, -0.8341293334960938, -0.806671142578125, -0.7792129516601562, -0.7517547607421875, -0.7242965698242188, -0.69683837890625, -0.6693801879882812, -0.6419219970703125, -0.6144638061523438, -0.587005615234375, -0.5595474243164062, -0.5320892333984375, -0.5046310424804688, -0.4771728515625, -0.44971466064453125, -0.4222564697265625, -0.39479827880859375, -0.367340087890625, -0.33988189697265625, -0.3124237060546875, -0.28496551513671875, -0.25750732421875, -0.23004913330078125, -0.2025909423828125, -0.17513275146484375, -0.147674560546875, -0.12021636962890625, -0.0927581787109375, -0.06529998779296875, -0.037841796875, -0.01038360595703125, 0.0170745849609375, 0.04453277587890625, 0.071990966796875, 0.09944915771484375, 0.1269073486328125, 0.15436553955078125, 0.18182373046875, 0.20928192138671875, 0.2367401123046875, 0.26419830322265625, 0.291656494140625, 0.31911468505859375, 0.3465728759765625, 0.37403106689453125, 0.4014892578125, 0.42894744873046875, 0.4564056396484375, 0.48386383056640625, 0.511322021484375, 0.5387802124023438, 0.5662384033203125, 0.5936965942382812, 0.62115478515625, 0.6486129760742188, 0.6760711669921875, 0.7035293579101562, 0.730987548828125, 0.7584457397460938, 0.7859039306640625, 0.8133621215820312, 0.8408203125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 3.0, 3.0, 9.0, 7.0, 12.0, 10.0, 10.0, 11.0, 19.0, 20.0, 28.0, 30.0, 27.0, 30.0, 39.0, 27.0, 35.0, 27.0, 30.0, 33.0, 34.0, 1066.0, 41.0, 35.0, 46.0, 32.0, 35.0, 31.0, 26.0, 39.0, 31.0, 27.0, 23.0, 18.0, 23.0, 19.0, 17.0, 10.0, 11.0, 6.0, 7.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0], "bins": [-3.80078125, -3.690673828125, -3.58056640625, -3.470458984375, -3.3603515625, -3.250244140625, -3.14013671875, -3.030029296875, -2.919921875, -2.809814453125, -2.69970703125, -2.589599609375, -2.4794921875, -2.369384765625, -2.25927734375, -2.149169921875, -2.0390625, -1.928955078125, -1.81884765625, -1.708740234375, -1.5986328125, -1.488525390625, -1.37841796875, -1.268310546875, -1.158203125, -1.048095703125, -0.93798828125, -0.827880859375, -0.7177734375, -0.607666015625, -0.49755859375, -0.387451171875, -0.27734375, -0.167236328125, -0.05712890625, 0.052978515625, 0.1630859375, 0.273193359375, 0.38330078125, 0.493408203125, 0.603515625, 0.713623046875, 0.82373046875, 0.933837890625, 1.0439453125, 1.154052734375, 1.26416015625, 1.374267578125, 1.484375, 1.594482421875, 1.70458984375, 1.814697265625, 1.9248046875, 2.034912109375, 2.14501953125, 2.255126953125, 2.365234375, 2.475341796875, 2.58544921875, 2.695556640625, 2.8056640625, 2.915771484375, 3.02587890625, 3.135986328125, 3.24609375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 0.0, 3.0, 4.0, 8.0, 10.0, 13.0, 37.0, 60.0, 66.0, 126.0, 198.0, 324.0, 500.0, 880.0, 1513.0, 2740.0, 5205.0, 9897.0, 19824.0, 39371.0, 78889.0, 151035.0, 1174818.0, 336206.0, 134895.0, 69003.0, 34731.0, 17167.0, 8833.0, 4675.0, 2592.0, 1449.0, 852.0, 493.0, 261.0, 161.0, 104.0, 60.0, 42.0, 28.0, 12.0, 18.0, 9.0, 5.0, 8.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5859375, -0.5681304931640625, -0.550323486328125, -0.5325164794921875, -0.51470947265625, -0.4969024658203125, -0.479095458984375, -0.4612884521484375, -0.4434814453125, -0.4256744384765625, -0.407867431640625, -0.3900604248046875, -0.37225341796875, -0.3544464111328125, -0.336639404296875, -0.3188323974609375, -0.301025390625, -0.2832183837890625, -0.265411376953125, -0.2476043701171875, -0.22979736328125, -0.2119903564453125, -0.194183349609375, -0.1763763427734375, -0.1585693359375, -0.1407623291015625, -0.122955322265625, -0.1051483154296875, -0.08734130859375, -0.0695343017578125, -0.051727294921875, -0.0339202880859375, -0.01611328125, 0.0016937255859375, 0.019500732421875, 0.0373077392578125, 0.05511474609375, 0.0729217529296875, 0.090728759765625, 0.1085357666015625, 0.1263427734375, 0.1441497802734375, 0.161956787109375, 0.1797637939453125, 0.19757080078125, 0.2153778076171875, 0.233184814453125, 0.2509918212890625, 0.268798828125, 0.2866058349609375, 0.304412841796875, 0.3222198486328125, 0.34002685546875, 0.3578338623046875, 0.375640869140625, 0.3934478759765625, 0.4112548828125, 0.4290618896484375, 0.446868896484375, 0.4646759033203125, 0.48248291015625, 0.5002899169921875, 0.518096923828125, 0.5359039306640625, 0.5537109375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 0.0, 5.0, 15.0, 8.0, 12.0, 14.0, 15.0, 18.0, 20.0, 16.0, 35.0, 38.0, 51.0, 50.0, 72.0, 99.0, 139.0, 58.0, 51.0, 48.0, 25.0, 35.0, 28.0, 21.0, 25.0, 19.0, 8.0, 14.0, 11.0, 11.0, 4.0, 7.0, 7.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.041351318359375, -0.04021024703979492, -0.039069175720214844, -0.037928104400634766, -0.03678703308105469, -0.03564596176147461, -0.03450489044189453, -0.03336381912231445, -0.032222747802734375, -0.031081676483154297, -0.02994060516357422, -0.02879953384399414, -0.027658462524414062, -0.026517391204833984, -0.025376319885253906, -0.024235248565673828, -0.02309417724609375, -0.021953105926513672, -0.020812034606933594, -0.019670963287353516, -0.018529891967773438, -0.01738882064819336, -0.01624774932861328, -0.015106678009033203, -0.013965606689453125, -0.012824535369873047, -0.011683464050292969, -0.01054239273071289, -0.009401321411132812, -0.008260250091552734, -0.007119178771972656, -0.005978107452392578, -0.0048370361328125, -0.003695964813232422, -0.0025548934936523438, -0.0014138221740722656, -0.0002727508544921875, 0.0008683204650878906, 0.0020093917846679688, 0.003150463104248047, 0.004291534423828125, 0.005432605743408203, 0.006573677062988281, 0.007714748382568359, 0.008855819702148438, 0.009996891021728516, 0.011137962341308594, 0.012279033660888672, 0.01342010498046875, 0.014561176300048828, 0.015702247619628906, 0.016843318939208984, 0.017984390258789062, 0.01912546157836914, 0.02026653289794922, 0.021407604217529297, 0.022548675537109375, 0.023689746856689453, 0.02483081817626953, 0.02597188949584961, 0.027112960815429688, 0.028254032135009766, 0.029395103454589844, 0.030536174774169922, 0.03167724609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 9.0, 2.0, 11.0, 10.0, 19.0, 16.0, 23.0, 35.0, 33.0, 46.0, 71.0, 80.0, 127.0, 155.0, 234.0, 439.0, 840.0, 12797.0, 1026298.0, 5317.0, 710.0, 392.0, 251.0, 181.0, 98.0, 68.0, 61.0, 40.0, 35.0, 30.0, 29.0, 25.0, 13.0, 10.0, 10.0, 13.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5791015625, -0.5587234497070312, -0.5383453369140625, -0.5179672241210938, -0.497589111328125, -0.47721099853515625, -0.4568328857421875, -0.43645477294921875, -0.41607666015625, -0.39569854736328125, -0.3753204345703125, -0.35494232177734375, -0.334564208984375, -0.31418609619140625, -0.2938079833984375, -0.27342987060546875, -0.2530517578125, -0.23267364501953125, -0.2122955322265625, -0.19191741943359375, -0.171539306640625, -0.15116119384765625, -0.1307830810546875, -0.11040496826171875, -0.09002685546875, -0.06964874267578125, -0.0492706298828125, -0.02889251708984375, -0.008514404296875, 0.01186370849609375, 0.0322418212890625, 0.05261993408203125, 0.072998046875, 0.09337615966796875, 0.1137542724609375, 0.13413238525390625, 0.154510498046875, 0.17488861083984375, 0.1952667236328125, 0.21564483642578125, 0.23602294921875, 0.25640106201171875, 0.2767791748046875, 0.29715728759765625, 0.317535400390625, 0.33791351318359375, 0.3582916259765625, 0.37866973876953125, 0.3990478515625, 0.41942596435546875, 0.4398040771484375, 0.46018218994140625, 0.480560302734375, 0.5009384155273438, 0.5213165283203125, 0.5416946411132812, 0.56207275390625, 0.5824508666992188, 0.6028289794921875, 0.6232070922851562, 0.643585205078125, 0.6639633178710938, 0.6843414306640625, 0.7047195434570312, 0.72509765625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 832.0, 175.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14046236872673035, -0.12001092731952667, -0.0995594784617424, -0.07910802960395813, -0.058656588196754456, -0.03820514678955078, -0.01775369793176651, 0.0026977509260177612, 0.023149192333221436, 0.04360063746571541, 0.06405208259820938, 0.08450353145599365, 0.10495497286319733, 0.125406414270401, 0.14585787057876587, 0.16630931198596954, 0.18676075339317322, 0.2072121948003769, 0.22766363620758057, 0.24811509251594543, 0.2685665488243103, 0.2890179753303528, 0.30946943163871765, 0.3299208879470825, 0.350372314453125, 0.37082377076148987, 0.39127519726753235, 0.4117266535758972, 0.4321780800819397, 0.45262953639030457, 0.47308099269866943, 0.4935324192047119, 0.5139838457107544, 0.5344352722167969, 0.5548867583274841, 0.5753381848335266, 0.5957896113395691, 0.6162410974502563, 0.6366925239562988, 0.6571439504623413, 0.6775953769683838, 0.6980468034744263, 0.7184982895851135, 0.738949716091156, 0.7594011425971985, 0.7798526287078857, 0.8003040552139282, 0.8207554817199707, 0.841206967830658, 0.8616583943367004, 0.8821098804473877, 0.9025613069534302, 0.9230127334594727, 0.9434641599655151, 0.9639156460762024, 0.9843670725822449, 1.0048185586929321, 1.0252699851989746, 1.045721411705017, 1.0661728382110596, 1.0866243839263916, 1.107075810432434, 1.1275272369384766, 1.147978663444519, 1.1684300899505615]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 8.0, 7.0, 10.0, 11.0, 27.0, 18.0, 31.0, 27.0, 30.0, 41.0, 34.0, 40.0, 45.0, 57.0, 61.0, 46.0, 57.0, 40.0, 48.0, 40.0, 38.0, 39.0, 39.0, 31.0, 26.0, 19.0, 29.0, 20.0, 17.0, 10.0, 8.0, 11.0, 8.0, 5.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.07264828681945801, -0.07077066600322723, -0.06889304518699646, -0.06701542437076569, -0.06513780355453491, -0.06326018273830414, -0.061382561922073364, -0.05950494110584259, -0.057627320289611816, -0.05574969947338104, -0.05387207865715027, -0.051994457840919495, -0.05011683702468872, -0.04823921620845795, -0.04636159539222717, -0.0444839745759964, -0.042606353759765625, -0.04072873294353485, -0.03885111212730408, -0.0369734913110733, -0.03509587049484253, -0.033218249678611755, -0.03134062886238098, -0.029463008046150208, -0.027585387229919434, -0.02570776641368866, -0.023830145597457886, -0.021952524781227112, -0.020074903964996338, -0.018197283148765564, -0.01631966233253479, -0.014442041516304016, -0.012564420700073242, -0.010686799883842468, -0.008809179067611694, -0.00693155825138092, -0.0050539374351501465, -0.0031763166189193726, -0.0012986958026885986, 0.0005789250135421753, 0.0024565458297729492, 0.004334166646003723, 0.006211787462234497, 0.008089408278465271, 0.009967029094696045, 0.011844649910926819, 0.013722270727157593, 0.015599891543388367, 0.01747751235961914, 0.019355133175849915, 0.02123275399208069, 0.023110374808311462, 0.024987995624542236, 0.02686561644077301, 0.028743237257003784, 0.030620858073234558, 0.03249847888946533, 0.034376099705696106, 0.03625372052192688, 0.038131341338157654, 0.04000896215438843, 0.0418865829706192, 0.043764203786849976, 0.04564182460308075, 0.04751944541931152]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 3.0, 2.0, 4.0, 7.0, 8.0, 5.0, 11.0, 23.0, 22.0, 19.0, 22.0, 20.0, 28.0, 28.0, 34.0, 40.0, 27.0, 40.0, 41.0, 44.0, 39.0, 38.0, 50.0, 49.0, 28.0, 44.0, 24.0, 38.0, 38.0, 25.0, 25.0, 27.0, 13.0, 15.0, 17.0, 22.0, 15.0, 14.0, 4.0, 8.0, 6.0, 7.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.1875, -6.00341796875, -5.8193359375, -5.63525390625, -5.451171875, -5.26708984375, -5.0830078125, -4.89892578125, -4.71484375, -4.53076171875, -4.3466796875, -4.16259765625, -3.978515625, -3.79443359375, -3.6103515625, -3.42626953125, -3.2421875, -3.05810546875, -2.8740234375, -2.68994140625, -2.505859375, -2.32177734375, -2.1376953125, -1.95361328125, -1.76953125, -1.58544921875, -1.4013671875, -1.21728515625, -1.033203125, -0.84912109375, -0.6650390625, -0.48095703125, -0.296875, -0.11279296875, 0.0712890625, 0.25537109375, 0.439453125, 0.62353515625, 0.8076171875, 0.99169921875, 1.17578125, 1.35986328125, 1.5439453125, 1.72802734375, 1.912109375, 2.09619140625, 2.2802734375, 2.46435546875, 2.6484375, 2.83251953125, 3.0166015625, 3.20068359375, 3.384765625, 3.56884765625, 3.7529296875, 3.93701171875, 4.12109375, 4.30517578125, 4.4892578125, 4.67333984375, 4.857421875, 5.04150390625, 5.2255859375, 5.40966796875, 5.59375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 6.0, 10.0, 14.0, 21.0, 24.0, 20.0, 45.0, 35.0, 55.0, 99.0, 102.0, 152.0, 173.0, 240.0, 327.0, 446.0, 560.0, 808.0, 1095.0, 2009.0, 5726.0, 25448.0, 118999.0, 419681.0, 352773.0, 90406.0, 19044.0, 4507.0, 1722.0, 1059.0, 763.0, 531.0, 411.0, 303.0, 224.0, 156.0, 122.0, 128.0, 81.0, 58.0, 36.0, 28.0, 20.0, 29.0, 16.0, 15.0, 12.0, 7.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-12.4609375, -12.082275390625, -11.70361328125, -11.324951171875, -10.9462890625, -10.567626953125, -10.18896484375, -9.810302734375, -9.431640625, -9.052978515625, -8.67431640625, -8.295654296875, -7.9169921875, -7.538330078125, -7.15966796875, -6.781005859375, -6.40234375, -6.023681640625, -5.64501953125, -5.266357421875, -4.8876953125, -4.509033203125, -4.13037109375, -3.751708984375, -3.373046875, -2.994384765625, -2.61572265625, -2.237060546875, -1.8583984375, -1.479736328125, -1.10107421875, -0.722412109375, -0.34375, 0.034912109375, 0.41357421875, 0.792236328125, 1.1708984375, 1.549560546875, 1.92822265625, 2.306884765625, 2.685546875, 3.064208984375, 3.44287109375, 3.821533203125, 4.2001953125, 4.578857421875, 4.95751953125, 5.336181640625, 5.71484375, 6.093505859375, 6.47216796875, 6.850830078125, 7.2294921875, 7.608154296875, 7.98681640625, 8.365478515625, 8.744140625, 9.122802734375, 9.50146484375, 9.880126953125, 10.2587890625, 10.637451171875, 11.01611328125, 11.394775390625, 11.7734375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 3.0, 8.0, 7.0, 7.0, 11.0, 12.0, 19.0, 21.0, 19.0, 37.0, 29.0, 46.0, 44.0, 51.0, 65.0, 105.0, 216.0, 1420.0, 304.0, 149.0, 72.0, 62.0, 54.0, 36.0, 36.0, 28.0, 24.0, 26.0, 20.0, 21.0, 20.0, 24.0, 9.0, 14.0, 6.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.09375, -17.58740234375, -17.0810546875, -16.57470703125, -16.068359375, -15.56201171875, -15.0556640625, -14.54931640625, -14.04296875, -13.53662109375, -13.0302734375, -12.52392578125, -12.017578125, -11.51123046875, -11.0048828125, -10.49853515625, -9.9921875, -9.48583984375, -8.9794921875, -8.47314453125, -7.966796875, -7.46044921875, -6.9541015625, -6.44775390625, -5.94140625, -5.43505859375, -4.9287109375, -4.42236328125, -3.916015625, -3.40966796875, -2.9033203125, -2.39697265625, -1.890625, -1.38427734375, -0.8779296875, -0.37158203125, 0.134765625, 0.64111328125, 1.1474609375, 1.65380859375, 2.16015625, 2.66650390625, 3.1728515625, 3.67919921875, 4.185546875, 4.69189453125, 5.1982421875, 5.70458984375, 6.2109375, 6.71728515625, 7.2236328125, 7.72998046875, 8.236328125, 8.74267578125, 9.2490234375, 9.75537109375, 10.26171875, 10.76806640625, 11.2744140625, 11.78076171875, 12.287109375, 12.79345703125, 13.2998046875, 13.80615234375, 14.3125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 7.0, 10.0, 12.0, 12.0, 15.0, 20.0, 19.0, 32.0, 47.0, 51.0, 96.0, 150.0, 243.0, 367.0, 708.0, 1602.0, 129147.0, 3009011.0, 2176.0, 785.0, 428.0, 257.0, 162.0, 97.0, 68.0, 53.0, 38.0, 18.0, 15.0, 11.0, 18.0, 9.0, 5.0, 5.0, 5.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.0625, -66.419921875, -63.77734375, -61.134765625, -58.4921875, -55.849609375, -53.20703125, -50.564453125, -47.921875, -45.279296875, -42.63671875, -39.994140625, -37.3515625, -34.708984375, -32.06640625, -29.423828125, -26.78125, -24.138671875, -21.49609375, -18.853515625, -16.2109375, -13.568359375, -10.92578125, -8.283203125, -5.640625, -2.998046875, -0.35546875, 2.287109375, 4.9296875, 7.572265625, 10.21484375, 12.857421875, 15.5, 18.142578125, 20.78515625, 23.427734375, 26.0703125, 28.712890625, 31.35546875, 33.998046875, 36.640625, 39.283203125, 41.92578125, 44.568359375, 47.2109375, 49.853515625, 52.49609375, 55.138671875, 57.78125, 60.423828125, 63.06640625, 65.708984375, 68.3515625, 70.994140625, 73.63671875, 76.279296875, 78.921875, 81.564453125, 84.20703125, 86.849609375, 89.4921875, 92.134765625, 94.77734375, 97.419921875, 100.0625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 7.0, 11.0, 60.0, 195.0, 272.0, 268.0, 143.0, 44.0, 10.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.63715362548828, -94.26972198486328, -91.90229034423828, -89.53485107421875, -87.16741943359375, -84.79998779296875, -82.43255615234375, -80.06512451171875, -77.69768524169922, -75.33025360107422, -72.96282196044922, -70.59538269042969, -68.22795104980469, -65.86051940917969, -63.49308776855469, -61.12565231323242, -58.75822067260742, -56.39078903198242, -54.023353576660156, -51.655921936035156, -49.28848648071289, -46.92105484008789, -44.553619384765625, -42.186187744140625, -39.818756103515625, -37.451324462890625, -35.08388900756836, -32.71645736694336, -30.349021911621094, -27.981590270996094, -25.61415672302246, -23.246723175048828, -20.879287719726562, -18.51185417175293, -16.144420623779297, -13.77698802947998, -11.409554481506348, -9.042120933532715, -6.674688339233398, -4.307254791259766, -1.9398212432861328, 0.4276120662689209, 2.7950453758239746, 5.162478446960449, 7.529911994934082, 9.897345542907715, 12.264778137207031, 14.632211685180664, 16.999645233154297, 19.36707878112793, 21.734512329101562, 24.101943969726562, 26.469379425048828, 28.836811065673828, 31.20424461364746, 33.571678161621094, 35.939109802246094, 38.306541442871094, 40.67397689819336, 43.04140853881836, 45.408843994140625, 47.776275634765625, 50.143707275390625, 52.51114273071289, 54.878578186035156]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 9.0, 6.0, 14.0, 7.0, 14.0, 16.0, 20.0, 21.0, 15.0, 17.0, 34.0, 29.0, 36.0, 35.0, 44.0, 48.0, 31.0, 47.0, 53.0, 39.0, 48.0, 36.0, 33.0, 28.0, 33.0, 29.0, 33.0, 33.0, 26.0, 25.0, 25.0, 22.0, 12.0, 12.0, 17.0, 19.0, 5.0, 8.0, 10.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.62610626220703, -37.34136962890625, -36.056636810302734, -34.77190017700195, -33.48716735839844, -32.202430725097656, -30.917694091796875, -29.632959365844727, -28.348224639892578, -27.06348991394043, -25.77875518798828, -24.4940185546875, -23.20928382873535, -21.924549102783203, -20.639812469482422, -19.355077743530273, -18.070343017578125, -16.785608291625977, -15.500872611999512, -14.216136932373047, -12.931402206420898, -11.64666748046875, -10.361931800842285, -9.07719612121582, -7.792461395263672, -6.507726192474365, -5.222990989685059, -3.938255786895752, -2.6535205841064453, -1.3687853813171387, -0.08405017852783203, 1.2006855010986328, 2.4854202270507812, 3.770155429840088, 5.0548906326293945, 6.339625835418701, 7.624361038208008, 8.909095764160156, 10.193831443786621, 11.478567123413086, 12.763301849365234, 14.048036575317383, 15.332772254943848, 16.617507934570312, 17.90224266052246, 19.18697738647461, 20.47171401977539, 21.75644874572754, 23.041183471679688, 24.325918197631836, 25.610652923583984, 26.895389556884766, 28.180124282836914, 29.464859008789062, 30.749595642089844, 32.034332275390625, 33.31906509399414, 34.60380172729492, 35.88853454589844, 37.17327117919922, 38.4580078125, 39.742740631103516, 41.0274772644043, 42.31221008300781, 43.596946716308594]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 3.0, 4.0, 11.0, 8.0, 6.0, 12.0, 9.0, 12.0, 15.0, 15.0, 25.0, 21.0, 22.0, 27.0, 29.0, 38.0, 37.0, 34.0, 30.0, 41.0, 30.0, 51.0, 36.0, 42.0, 31.0, 32.0, 40.0, 35.0, 37.0, 34.0, 27.0, 30.0, 22.0, 24.0, 24.0, 14.0, 17.0, 11.0, 8.0, 5.0, 7.0, 12.0, 4.0, 5.0, 1.0, 6.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-5.7109375, -5.53570556640625, -5.3604736328125, -5.18524169921875, -5.010009765625, -4.83477783203125, -4.6595458984375, -4.48431396484375, -4.30908203125, -4.13385009765625, -3.9586181640625, -3.78338623046875, -3.608154296875, -3.43292236328125, -3.2576904296875, -3.08245849609375, -2.9072265625, -2.73199462890625, -2.5567626953125, -2.38153076171875, -2.206298828125, -2.03106689453125, -1.8558349609375, -1.68060302734375, -1.50537109375, -1.33013916015625, -1.1549072265625, -0.97967529296875, -0.804443359375, -0.62921142578125, -0.4539794921875, -0.27874755859375, -0.103515625, 0.07171630859375, 0.2469482421875, 0.42218017578125, 0.597412109375, 0.77264404296875, 0.9478759765625, 1.12310791015625, 1.29833984375, 1.47357177734375, 1.6488037109375, 1.82403564453125, 1.999267578125, 2.17449951171875, 2.3497314453125, 2.52496337890625, 2.7001953125, 2.87542724609375, 3.0506591796875, 3.22589111328125, 3.401123046875, 3.57635498046875, 3.7515869140625, 3.92681884765625, 4.10205078125, 4.27728271484375, 4.4525146484375, 4.62774658203125, 4.802978515625, 4.97821044921875, 5.1534423828125, 5.32867431640625, 5.50390625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 5.0, 1.0, 11.0, 15.0, 31.0, 28.0, 69.0, 87.0, 110.0, 148.0, 294.0, 392.0, 702.0, 1252.0, 2370.0, 5380.0, 14083.0, 49288.0, 206141.0, 785142.0, 1802250.0, 969752.0, 264973.0, 61841.0, 17543.0, 6254.0, 2800.0, 1354.0, 755.0, 452.0, 265.0, 167.0, 106.0, 76.0, 41.0, 27.0, 22.0, 14.0, 8.0, 10.0, 8.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8671875, -8.5950927734375, -8.322998046875, -8.0509033203125, -7.77880859375, -7.5067138671875, -7.234619140625, -6.9625244140625, -6.6904296875, -6.4183349609375, -6.146240234375, -5.8741455078125, -5.60205078125, -5.3299560546875, -5.057861328125, -4.7857666015625, -4.513671875, -4.2415771484375, -3.969482421875, -3.6973876953125, -3.42529296875, -3.1531982421875, -2.881103515625, -2.6090087890625, -2.3369140625, -2.0648193359375, -1.792724609375, -1.5206298828125, -1.24853515625, -0.9764404296875, -0.704345703125, -0.4322509765625, -0.16015625, 0.1119384765625, 0.384033203125, 0.6561279296875, 0.92822265625, 1.2003173828125, 1.472412109375, 1.7445068359375, 2.0166015625, 2.2886962890625, 2.560791015625, 2.8328857421875, 3.10498046875, 3.3770751953125, 3.649169921875, 3.9212646484375, 4.193359375, 4.4654541015625, 4.737548828125, 5.0096435546875, 5.28173828125, 5.5538330078125, 5.825927734375, 6.0980224609375, 6.3701171875, 6.6422119140625, 6.914306640625, 7.1864013671875, 7.45849609375, 7.7305908203125, 8.002685546875, 8.2747802734375, 8.546875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 8.0, 3.0, 11.0, 9.0, 12.0, 17.0, 25.0, 29.0, 31.0, 52.0, 53.0, 78.0, 80.0, 129.0, 149.0, 203.0, 319.0, 417.0, 455.0, 446.0, 354.0, 290.0, 186.0, 163.0, 110.0, 90.0, 90.0, 57.0, 61.0, 32.0, 27.0, 21.0, 17.0, 10.0, 9.0, 8.0, 8.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6875, -9.3734130859375, -9.059326171875, -8.7452392578125, -8.43115234375, -8.1170654296875, -7.802978515625, -7.4888916015625, -7.1748046875, -6.8607177734375, -6.546630859375, -6.2325439453125, -5.91845703125, -5.6043701171875, -5.290283203125, -4.9761962890625, -4.662109375, -4.3480224609375, -4.033935546875, -3.7198486328125, -3.40576171875, -3.0916748046875, -2.777587890625, -2.4635009765625, -2.1494140625, -1.8353271484375, -1.521240234375, -1.2071533203125, -0.89306640625, -0.5789794921875, -0.264892578125, 0.0491943359375, 0.36328125, 0.6773681640625, 0.991455078125, 1.3055419921875, 1.61962890625, 1.9337158203125, 2.247802734375, 2.5618896484375, 2.8759765625, 3.1900634765625, 3.504150390625, 3.8182373046875, 4.13232421875, 4.4464111328125, 4.760498046875, 5.0745849609375, 5.388671875, 5.7027587890625, 6.016845703125, 6.3309326171875, 6.64501953125, 6.9591064453125, 7.273193359375, 7.5872802734375, 7.9013671875, 8.2154541015625, 8.529541015625, 8.8436279296875, 9.15771484375, 9.4718017578125, 9.785888671875, 10.0999755859375, 10.4140625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 6.0, 3.0, 8.0, 9.0, 12.0, 12.0, 13.0, 19.0, 27.0, 32.0, 62.0, 67.0, 85.0, 138.0, 204.0, 263.0, 395.0, 725.0, 1312.0, 3029.0, 11084.0, 71258.0, 547662.0, 2825699.0, 631630.0, 81861.0, 12195.0, 3093.0, 1278.0, 708.0, 438.0, 293.0, 171.0, 128.0, 97.0, 67.0, 59.0, 34.0, 30.0, 18.0, 16.0, 8.0, 11.0, 13.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-17.0, -16.53466796875, -16.0693359375, -15.60400390625, -15.138671875, -14.67333984375, -14.2080078125, -13.74267578125, -13.27734375, -12.81201171875, -12.3466796875, -11.88134765625, -11.416015625, -10.95068359375, -10.4853515625, -10.02001953125, -9.5546875, -9.08935546875, -8.6240234375, -8.15869140625, -7.693359375, -7.22802734375, -6.7626953125, -6.29736328125, -5.83203125, -5.36669921875, -4.9013671875, -4.43603515625, -3.970703125, -3.50537109375, -3.0400390625, -2.57470703125, -2.109375, -1.64404296875, -1.1787109375, -0.71337890625, -0.248046875, 0.21728515625, 0.6826171875, 1.14794921875, 1.61328125, 2.07861328125, 2.5439453125, 3.00927734375, 3.474609375, 3.93994140625, 4.4052734375, 4.87060546875, 5.3359375, 5.80126953125, 6.2666015625, 6.73193359375, 7.197265625, 7.66259765625, 8.1279296875, 8.59326171875, 9.05859375, 9.52392578125, 9.9892578125, 10.45458984375, 10.919921875, 11.38525390625, 11.8505859375, 12.31591796875, 12.78125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 27.0, 480.0, 473.0, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-491.4495849609375, -481.9941101074219, -472.53863525390625, -463.0831298828125, -453.6276550292969, -444.17218017578125, -434.7166748046875, -425.2611999511719, -415.80572509765625, -406.3502502441406, -396.894775390625, -387.43927001953125, -377.9837951660156, -368.5283203125, -359.07281494140625, -349.6173400878906, -340.161865234375, -330.7063903808594, -321.25091552734375, -311.79541015625, -302.3399353027344, -292.88446044921875, -283.428955078125, -273.9734802246094, -264.51800537109375, -255.06253051757812, -245.60704040527344, -236.15155029296875, -226.69607543945312, -217.2406005859375, -207.7851104736328, -198.32962036132812, -188.87417602539062, -179.418701171875, -169.9632110595703, -160.50772094726562, -151.05224609375, -141.59677124023438, -132.1412811279297, -122.68579864501953, -113.23031616210938, -103.77483367919922, -94.31935119628906, -84.8638687133789, -75.40838623046875, -65.9529037475586, -56.49742126464844, -47.04193878173828, -37.586456298828125, -28.13097381591797, -18.675491333007812, -9.220008850097656, 0.2354736328125, 9.690956115722656, 19.146438598632812, 28.60192108154297, 38.057403564453125, 47.51288604736328, 56.96836853027344, 66.4238510131836, 75.87933349609375, 85.3348159790039, 94.79029846191406, 104.24578094482422, 113.70126342773438]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 11.0, 9.0, 8.0, 9.0, 14.0, 16.0, 20.0, 24.0, 20.0, 25.0, 26.0, 24.0, 30.0, 38.0, 30.0, 29.0, 35.0, 24.0, 41.0, 43.0, 52.0, 44.0, 38.0, 47.0, 36.0, 30.0, 41.0, 34.0, 19.0, 24.0, 19.0, 17.0, 20.0, 19.0, 15.0, 13.0, 16.0, 7.0, 10.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.23923110961914, -37.9691162109375, -36.699005126953125, -35.428890228271484, -34.158775329589844, -32.8886604309082, -31.618547439575195, -30.348434448242188, -29.078319549560547, -27.808204650878906, -26.5380916595459, -25.26797866821289, -23.99786376953125, -22.72774887084961, -21.4576358795166, -20.187522888183594, -18.917407989501953, -17.647293090820312, -16.377180099487305, -15.10706615447998, -13.836952209472656, -12.566838264465332, -11.296724319458008, -10.026610374450684, -8.75649642944336, -7.486382484436035, -6.216268539428711, -4.946154594421387, -3.6760406494140625, -2.4059267044067383, -1.135812759399414, 0.13430118560791016, 1.4044151306152344, 2.6745290756225586, 3.944643020629883, 5.214756965637207, 6.484870910644531, 7.7549848556518555, 9.02509880065918, 10.295212745666504, 11.565326690673828, 12.835440635681152, 14.105554580688477, 15.3756685256958, 16.645782470703125, 17.915897369384766, 19.186010360717773, 20.45612335205078, 21.726238250732422, 22.996353149414062, 24.26646614074707, 25.536579132080078, 26.80669403076172, 28.07680892944336, 29.346921920776367, 30.617034912109375, 31.887149810791016, 33.157264709472656, 34.42737579345703, 35.69749069213867, 36.96760559082031, 38.23772048950195, 39.507835388183594, 40.77794647216797, 42.04806137084961]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 13.0, 11.0, 10.0, 16.0, 26.0, 22.0, 23.0, 18.0, 26.0, 29.0, 32.0, 33.0, 46.0, 37.0, 38.0, 44.0, 36.0, 40.0, 48.0, 49.0, 42.0, 41.0, 38.0, 37.0, 32.0, 28.0, 24.0, 26.0, 34.0, 15.0, 12.0, 10.0, 9.0, 12.0, 9.0, 9.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.08831787109375, -4.9266357421875, -4.76495361328125, -4.603271484375, -4.44158935546875, -4.2799072265625, -4.11822509765625, -3.95654296875, -3.79486083984375, -3.6331787109375, -3.47149658203125, -3.309814453125, -3.14813232421875, -2.9864501953125, -2.82476806640625, -2.6630859375, -2.50140380859375, -2.3397216796875, -2.17803955078125, -2.016357421875, -1.85467529296875, -1.6929931640625, -1.53131103515625, -1.36962890625, -1.20794677734375, -1.0462646484375, -0.88458251953125, -0.722900390625, -0.56121826171875, -0.3995361328125, -0.23785400390625, -0.076171875, 0.08551025390625, 0.2471923828125, 0.40887451171875, 0.570556640625, 0.73223876953125, 0.8939208984375, 1.05560302734375, 1.21728515625, 1.37896728515625, 1.5406494140625, 1.70233154296875, 1.864013671875, 2.02569580078125, 2.1873779296875, 2.34906005859375, 2.5107421875, 2.67242431640625, 2.8341064453125, 2.99578857421875, 3.157470703125, 3.31915283203125, 3.4808349609375, 3.64251708984375, 3.80419921875, 3.96588134765625, 4.1275634765625, 4.28924560546875, 4.450927734375, 4.61260986328125, 4.7742919921875, 4.93597412109375, 5.09765625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 8.0, 5.0, 15.0, 18.0, 34.0, 45.0, 50.0, 79.0, 135.0, 210.0, 290.0, 446.0, 636.0, 928.0, 1390.0, 2281.0, 3474.0, 5288.0, 8338.0, 13675.0, 22733.0, 38653.0, 65661.0, 109997.0, 171540.0, 202472.0, 156376.0, 97651.0, 57912.0, 34348.0, 20085.0, 12377.0, 7749.0, 4750.0, 2963.0, 1941.0, 1301.0, 870.0, 539.0, 406.0, 264.0, 195.0, 142.0, 90.0, 65.0, 49.0, 37.0, 19.0, 13.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.461181640625, -0.4460029602050781, -0.43082427978515625, -0.4156455993652344, -0.4004669189453125, -0.3852882385253906, -0.37010955810546875, -0.3549308776855469, -0.339752197265625, -0.3245735168457031, -0.30939483642578125, -0.2942161560058594, -0.2790374755859375, -0.2638587951660156, -0.24868011474609375, -0.23350143432617188, -0.21832275390625, -0.20314407348632812, -0.18796539306640625, -0.17278671264648438, -0.1576080322265625, -0.14242935180664062, -0.12725067138671875, -0.11207199096679688, -0.096893310546875, -0.08171463012695312, -0.06653594970703125, -0.051357269287109375, -0.0361785888671875, -0.020999908447265625, -0.00582122802734375, 0.009357452392578125, 0.0245361328125, 0.039714813232421875, 0.05489349365234375, 0.07007217407226562, 0.0852508544921875, 0.10042953491210938, 0.11560821533203125, 0.13078689575195312, 0.145965576171875, 0.16114425659179688, 0.17632293701171875, 0.19150161743164062, 0.2066802978515625, 0.22185897827148438, 0.23703765869140625, 0.2522163391113281, 0.26739501953125, 0.2825736999511719, 0.29775238037109375, 0.3129310607910156, 0.3281097412109375, 0.3432884216308594, 0.35846710205078125, 0.3736457824707031, 0.388824462890625, 0.4040031433105469, 0.41918182373046875, 0.4343605041503906, 0.4495391845703125, 0.4647178649902344, 0.47989654541015625, 0.4950752258300781, 0.51025390625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 10.0, 12.0, 11.0, 8.0, 13.0, 17.0, 18.0, 27.0, 25.0, 31.0, 34.0, 27.0, 45.0, 37.0, 48.0, 34.0, 49.0, 48.0, 1059.0, 36.0, 38.0, 46.0, 32.0, 31.0, 27.0, 30.0, 23.0, 31.0, 32.0, 27.0, 15.0, 13.0, 13.0, 18.0, 14.0, 14.0, 8.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.00390625, -2.903411865234375, -2.80291748046875, -2.702423095703125, -2.6019287109375, -2.501434326171875, -2.40093994140625, -2.300445556640625, -2.199951171875, -2.099456787109375, -1.99896240234375, -1.898468017578125, -1.7979736328125, -1.697479248046875, -1.59698486328125, -1.496490478515625, -1.39599609375, -1.295501708984375, -1.19500732421875, -1.094512939453125, -0.9940185546875, -0.893524169921875, -0.79302978515625, -0.692535400390625, -0.592041015625, -0.491546630859375, -0.39105224609375, -0.290557861328125, -0.1900634765625, -0.089569091796875, 0.01092529296875, 0.111419677734375, 0.2119140625, 0.312408447265625, 0.41290283203125, 0.513397216796875, 0.6138916015625, 0.714385986328125, 0.81488037109375, 0.915374755859375, 1.015869140625, 1.116363525390625, 1.21685791015625, 1.317352294921875, 1.4178466796875, 1.518341064453125, 1.61883544921875, 1.719329833984375, 1.81982421875, 1.920318603515625, 2.02081298828125, 2.121307373046875, 2.2218017578125, 2.322296142578125, 2.42279052734375, 2.523284912109375, 2.623779296875, 2.724273681640625, 2.82476806640625, 2.925262451171875, 3.0257568359375, 3.126251220703125, 3.22674560546875, 3.327239990234375, 3.427734375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 6.0, 2.0, 25.0, 24.0, 40.0, 63.0, 94.0, 159.0, 272.0, 540.0, 909.0, 1732.0, 3338.0, 6548.0, 13141.0, 26992.0, 54316.0, 105844.0, 187859.0, 1288564.0, 189407.0, 106903.0, 55536.0, 27429.0, 13442.0, 6525.0, 3478.0, 1654.0, 988.0, 557.0, 301.0, 180.0, 93.0, 51.0, 47.0, 26.0, 10.0, 13.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.44921875, -0.43581390380859375, -0.4224090576171875, -0.40900421142578125, -0.395599365234375, -0.38219451904296875, -0.3687896728515625, -0.35538482666015625, -0.34197998046875, -0.32857513427734375, -0.3151702880859375, -0.30176544189453125, -0.288360595703125, -0.27495574951171875, -0.2615509033203125, -0.24814605712890625, -0.2347412109375, -0.22133636474609375, -0.2079315185546875, -0.19452667236328125, -0.181121826171875, -0.16771697998046875, -0.1543121337890625, -0.14090728759765625, -0.12750244140625, -0.11409759521484375, -0.1006927490234375, -0.08728790283203125, -0.073883056640625, -0.06047821044921875, -0.0470733642578125, -0.03366851806640625, -0.020263671875, -0.00685882568359375, 0.0065460205078125, 0.01995086669921875, 0.033355712890625, 0.04676055908203125, 0.0601654052734375, 0.07357025146484375, 0.08697509765625, 0.10037994384765625, 0.1137847900390625, 0.12718963623046875, 0.140594482421875, 0.15399932861328125, 0.1674041748046875, 0.18080902099609375, 0.1942138671875, 0.20761871337890625, 0.2210235595703125, 0.23442840576171875, 0.247833251953125, 0.26123809814453125, 0.2746429443359375, 0.28804779052734375, 0.30145263671875, 0.31485748291015625, 0.3282623291015625, 0.34166717529296875, 0.355072021484375, 0.36847686767578125, 0.3818817138671875, 0.39528656005859375, 0.40869140625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 10.0, 6.0, 11.0, 14.0, 25.0, 31.0, 27.0, 30.0, 43.0, 54.0, 79.0, 96.0, 87.0, 98.0, 79.0, 66.0, 35.0, 31.0, 36.0, 25.0, 20.0, 18.0, 12.0, 8.0, 9.0, 8.0, 12.0, 6.0, 5.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0146026611328125, -0.01419520378112793, -0.01378774642944336, -0.013380289077758789, -0.012972831726074219, -0.012565374374389648, -0.012157917022705078, -0.011750459671020508, -0.011343002319335938, -0.010935544967651367, -0.010528087615966797, -0.010120630264282227, -0.009713172912597656, -0.009305715560913086, -0.008898258209228516, -0.008490800857543945, -0.008083343505859375, -0.007675886154174805, -0.007268428802490234, -0.006860971450805664, -0.006453514099121094, -0.0060460567474365234, -0.005638599395751953, -0.005231142044067383, -0.0048236846923828125, -0.004416227340698242, -0.004008769989013672, -0.0036013126373291016, -0.0031938552856445312, -0.002786397933959961, -0.0023789405822753906, -0.0019714832305908203, -0.00156402587890625, -0.0011565685272216797, -0.0007491111755371094, -0.00034165382385253906, 6.580352783203125e-05, 0.00047326087951660156, 0.0008807182312011719, 0.0012881755828857422, 0.0016956329345703125, 0.002103090286254883, 0.002510547637939453, 0.0029180049896240234, 0.0033254623413085938, 0.003732919692993164, 0.004140377044677734, 0.004547834396362305, 0.004955291748046875, 0.005362749099731445, 0.005770206451416016, 0.006177663803100586, 0.006585121154785156, 0.0069925785064697266, 0.007400035858154297, 0.007807493209838867, 0.008214950561523438, 0.008622407913208008, 0.009029865264892578, 0.009437322616577148, 0.009844779968261719, 0.010252237319946289, 0.01065969467163086, 0.01106715202331543, 0.011474609375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 5.0, 4.0, 9.0, 9.0, 9.0, 9.0, 17.0, 10.0, 27.0, 20.0, 28.0, 34.0, 46.0, 79.0, 101.0, 154.0, 229.0, 440.0, 1386.0, 63451.0, 972325.0, 8453.0, 746.0, 321.0, 185.0, 112.0, 81.0, 79.0, 57.0, 35.0, 26.0, 17.0, 15.0, 16.0, 9.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19873046875, -0.19170379638671875, -0.1846771240234375, -0.17765045166015625, -0.170623779296875, -0.16359710693359375, -0.1565704345703125, -0.14954376220703125, -0.14251708984375, -0.13549041748046875, -0.1284637451171875, -0.12143707275390625, -0.114410400390625, -0.10738372802734375, -0.1003570556640625, -0.09333038330078125, -0.0863037109375, -0.07927703857421875, -0.0722503662109375, -0.06522369384765625, -0.058197021484375, -0.05117034912109375, -0.0441436767578125, -0.03711700439453125, -0.03009033203125, -0.02306365966796875, -0.0160369873046875, -0.00901031494140625, -0.001983642578125, 0.00504302978515625, 0.0120697021484375, 0.01909637451171875, 0.026123046875, 0.03314971923828125, 0.0401763916015625, 0.04720306396484375, 0.054229736328125, 0.06125640869140625, 0.0682830810546875, 0.07530975341796875, 0.08233642578125, 0.08936309814453125, 0.0963897705078125, 0.10341644287109375, 0.110443115234375, 0.11746978759765625, 0.1244964599609375, 0.13152313232421875, 0.1385498046875, 0.14557647705078125, 0.1526031494140625, 0.15962982177734375, 0.166656494140625, 0.17368316650390625, 0.1807098388671875, 0.18773651123046875, 0.19476318359375, 0.20178985595703125, 0.2088165283203125, 0.21584320068359375, 0.222869873046875, 0.22989654541015625, 0.2369232177734375, 0.24394989013671875, 0.2509765625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 15.0, 466.0, 530.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049009084701538086, -0.04289869964122772, -0.03678831085562706, -0.030677923932671547, -0.024567537009716034, -0.01845715008676052, -0.012346763163805008, -0.006236374378204346, -0.00012598931789398193, 0.005984397605061531, 0.012094784528017044, 0.018205171450972557, 0.02431555837392807, 0.030425945296883583, 0.036536332219839096, 0.04264672100543976, 0.04875710606575012, 0.054867491126060486, 0.06097787991166115, 0.06708826869726181, 0.07319865375757217, 0.07930903881788254, 0.0854194313287735, 0.09152981638908386, 0.09764020144939423, 0.10375058650970459, 0.10986097157001495, 0.11597136408090591, 0.12208174914121628, 0.12819214165210724, 0.1343025267124176, 0.14041291177272797, 0.14652329683303833, 0.1526336818933487, 0.15874406695365906, 0.16485445201396942, 0.17096483707427979, 0.17707523703575134, 0.1831856220960617, 0.18929600715637207, 0.19540639221668243, 0.2015167772769928, 0.20762716233730316, 0.21373754739761353, 0.21984794735908508, 0.22595833241939545, 0.2320687174797058, 0.23817910254001617, 0.24428948760032654, 0.2503998875617981, 0.25651025772094727, 0.2626206576824188, 0.268731027841568, 0.27484142780303955, 0.2809517979621887, 0.2870621979236603, 0.29317259788513184, 0.2992829978466034, 0.30539336800575256, 0.3115037679672241, 0.3176141381263733, 0.32372453808784485, 0.329834908246994, 0.3359453082084656, 0.34205567836761475]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 9.0, 13.0, 20.0, 14.0, 18.0, 22.0, 33.0, 40.0, 34.0, 42.0, 47.0, 55.0, 67.0, 64.0, 71.0, 45.0, 56.0, 63.0, 38.0, 44.0, 48.0, 38.0, 27.0, 19.0, 24.0, 16.0, 8.0, 6.0, 9.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01946234703063965, -0.01892559789121151, -0.01838884875178337, -0.017852099612355232, -0.017315350472927094, -0.016778601333498955, -0.016241852194070816, -0.015705103054642677, -0.015168353915214539, -0.0146316047757864, -0.014094855636358261, -0.013558106496930122, -0.013021357357501984, -0.012484608218073845, -0.011947859078645706, -0.011411109939217567, -0.010874360799789429, -0.01033761166036129, -0.009800862520933151, -0.009264113381505013, -0.008727364242076874, -0.008190615102648735, -0.007653865963220596, -0.007117116823792458, -0.006580367684364319, -0.00604361854493618, -0.005506869405508041, -0.004970120266079903, -0.004433371126651764, -0.003896621987223625, -0.0033598728477954865, -0.0028231237083673477, -0.002286374568939209, -0.0017496254295110703, -0.0012128762900829315, -0.0006761271506547928, -0.00013937801122665405, 0.0003973711282014847, 0.0009341202676296234, 0.0014708694070577621, 0.002007618546485901, 0.0025443676859140396, 0.0030811168253421783, 0.003617865964770317, 0.004154615104198456, 0.0046913642436265945, 0.005228113383054733, 0.005764862522482872, 0.006301611661911011, 0.0068383608013391495, 0.007375109940767288, 0.007911859080195427, 0.008448608219623566, 0.008985357359051704, 0.009522106498479843, 0.010058855637907982, 0.01059560477733612, 0.01113235391676426, 0.011669103056192398, 0.012205852195620537, 0.012742601335048676, 0.013279350474476814, 0.013816099613904953, 0.014352848753333092, 0.01488959789276123]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 14.0, 11.0, 10.0, 16.0, 26.0, 22.0, 23.0, 18.0, 26.0, 29.0, 32.0, 33.0, 46.0, 38.0, 36.0, 45.0, 36.0, 40.0, 48.0, 49.0, 43.0, 40.0, 38.0, 37.0, 32.0, 28.0, 24.0, 26.0, 34.0, 15.0, 12.0, 10.0, 9.0, 12.0, 9.0, 9.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.08831787109375, -4.9266357421875, -4.76495361328125, -4.603271484375, -4.44158935546875, -4.2799072265625, -4.11822509765625, -3.95654296875, -3.79486083984375, -3.6331787109375, -3.47149658203125, -3.309814453125, -3.14813232421875, -2.9864501953125, -2.82476806640625, -2.6630859375, -2.50140380859375, -2.3397216796875, -2.17803955078125, -2.016357421875, -1.85467529296875, -1.6929931640625, -1.53131103515625, -1.36962890625, -1.20794677734375, -1.0462646484375, -0.88458251953125, -0.722900390625, -0.56121826171875, -0.3995361328125, -0.23785400390625, -0.076171875, 0.08551025390625, 0.2471923828125, 0.40887451171875, 0.570556640625, 0.73223876953125, 0.8939208984375, 1.05560302734375, 1.21728515625, 1.37896728515625, 1.5406494140625, 1.70233154296875, 1.864013671875, 2.02569580078125, 2.1873779296875, 2.34906005859375, 2.5107421875, 2.67242431640625, 2.8341064453125, 2.99578857421875, 3.157470703125, 3.31915283203125, 3.4808349609375, 3.64251708984375, 3.80419921875, 3.96588134765625, 4.1275634765625, 4.28924560546875, 4.450927734375, 4.61260986328125, 4.7742919921875, 4.93597412109375, 5.09765625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 12.0, 20.0, 21.0, 37.0, 48.0, 52.0, 76.0, 113.0, 131.0, 194.0, 275.0, 351.0, 529.0, 733.0, 1010.0, 1293.0, 1890.0, 3065.0, 6329.0, 25631.0, 190152.0, 648428.0, 134569.0, 18902.0, 5398.0, 2842.0, 1830.0, 1242.0, 858.0, 657.0, 485.0, 359.0, 287.0, 213.0, 150.0, 112.0, 86.0, 52.0, 38.0, 26.0, 15.0, 12.0, 11.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.15625, -11.769287109375, -11.38232421875, -10.995361328125, -10.6083984375, -10.221435546875, -9.83447265625, -9.447509765625, -9.060546875, -8.673583984375, -8.28662109375, -7.899658203125, -7.5126953125, -7.125732421875, -6.73876953125, -6.351806640625, -5.96484375, -5.577880859375, -5.19091796875, -4.803955078125, -4.4169921875, -4.030029296875, -3.64306640625, -3.256103515625, -2.869140625, -2.482177734375, -2.09521484375, -1.708251953125, -1.3212890625, -0.934326171875, -0.54736328125, -0.160400390625, 0.2265625, 0.613525390625, 1.00048828125, 1.387451171875, 1.7744140625, 2.161376953125, 2.54833984375, 2.935302734375, 3.322265625, 3.709228515625, 4.09619140625, 4.483154296875, 4.8701171875, 5.257080078125, 5.64404296875, 6.031005859375, 6.41796875, 6.804931640625, 7.19189453125, 7.578857421875, 7.9658203125, 8.352783203125, 8.73974609375, 9.126708984375, 9.513671875, 9.900634765625, 10.28759765625, 10.674560546875, 11.0615234375, 11.448486328125, 11.83544921875, 12.222412109375, 12.609375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 6.0, 7.0, 11.0, 15.0, 13.0, 24.0, 22.0, 22.0, 31.0, 35.0, 41.0, 44.0, 56.0, 51.0, 131.0, 290.0, 1466.0, 257.0, 106.0, 50.0, 58.0, 43.0, 35.0, 30.0, 29.0, 22.0, 26.0, 12.0, 18.0, 18.0, 12.0, 8.0, 18.0, 3.0, 5.0, 4.0, 1.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.65625, -13.25927734375, -12.8623046875, -12.46533203125, -12.068359375, -11.67138671875, -11.2744140625, -10.87744140625, -10.48046875, -10.08349609375, -9.6865234375, -9.28955078125, -8.892578125, -8.49560546875, -8.0986328125, -7.70166015625, -7.3046875, -6.90771484375, -6.5107421875, -6.11376953125, -5.716796875, -5.31982421875, -4.9228515625, -4.52587890625, -4.12890625, -3.73193359375, -3.3349609375, -2.93798828125, -2.541015625, -2.14404296875, -1.7470703125, -1.35009765625, -0.953125, -0.55615234375, -0.1591796875, 0.23779296875, 0.634765625, 1.03173828125, 1.4287109375, 1.82568359375, 2.22265625, 2.61962890625, 3.0166015625, 3.41357421875, 3.810546875, 4.20751953125, 4.6044921875, 5.00146484375, 5.3984375, 5.79541015625, 6.1923828125, 6.58935546875, 6.986328125, 7.38330078125, 7.7802734375, 8.17724609375, 8.57421875, 8.97119140625, 9.3681640625, 9.76513671875, 10.162109375, 10.55908203125, 10.9560546875, 11.35302734375, 11.75]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 9.0, 15.0, 17.0, 22.0, 28.0, 34.0, 45.0, 67.0, 105.0, 166.0, 328.0, 639.0, 1564.0, 11239.0, 3124802.0, 4263.0, 1099.0, 511.0, 271.0, 147.0, 82.0, 79.0, 43.0, 45.0, 18.0, 13.0, 10.0, 5.0, 4.0, 10.0, 5.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.3818359375, -60.326171875, -58.2705078125, -56.21484375, -54.1591796875, -52.103515625, -50.0478515625, -47.9921875, -45.9365234375, -43.880859375, -41.8251953125, -39.76953125, -37.7138671875, -35.658203125, -33.6025390625, -31.546875, -29.4912109375, -27.435546875, -25.3798828125, -23.32421875, -21.2685546875, -19.212890625, -17.1572265625, -15.1015625, -13.0458984375, -10.990234375, -8.9345703125, -6.87890625, -4.8232421875, -2.767578125, -0.7119140625, 1.34375, 3.3994140625, 5.455078125, 7.5107421875, 9.56640625, 11.6220703125, 13.677734375, 15.7333984375, 17.7890625, 19.8447265625, 21.900390625, 23.9560546875, 26.01171875, 28.0673828125, 30.123046875, 32.1787109375, 34.234375, 36.2900390625, 38.345703125, 40.4013671875, 42.45703125, 44.5126953125, 46.568359375, 48.6240234375, 50.6796875, 52.7353515625, 54.791015625, 56.8466796875, 58.90234375, 60.9580078125, 63.013671875, 65.0693359375, 67.125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 28.0, 242.0, 483.0, 218.0, 34.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-213.78399658203125, -209.54949951171875, -205.31500244140625, -201.08050537109375, -196.84600830078125, -192.61151123046875, -188.37701416015625, -184.14251708984375, -179.90802001953125, -175.67352294921875, -171.43902587890625, -167.20452880859375, -162.97003173828125, -158.73553466796875, -154.50103759765625, -150.26654052734375, -146.03204345703125, -141.79754638671875, -137.56304931640625, -133.32855224609375, -129.09405517578125, -124.85955810546875, -120.62506103515625, -116.39056396484375, -112.15606689453125, -107.92156982421875, -103.68707275390625, -99.45257568359375, -95.21807861328125, -90.98358154296875, -86.74908447265625, -82.51458740234375, -78.28010559082031, -74.04560852050781, -69.81111145019531, -65.57661437988281, -61.34211730957031, -57.10762023925781, -52.87312316894531, -48.63862609863281, -44.40412902832031, -40.16963195800781, -35.93513488769531, -31.700637817382812, -27.466140747070312, -23.231643676757812, -18.997146606445312, -14.762649536132812, -10.528152465820312, -6.2936553955078125, -2.0591583251953125, 2.1753387451171875, 6.4098358154296875, 10.644332885742188, 14.878829956054688, 19.113327026367188, 23.347824096679688, 27.582321166992188, 31.816818237304688, 36.05131530761719, 40.28581237792969, 44.52030944824219, 48.75480651855469, 52.98930358886719, 57.22380065917969]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 5.0, 11.0, 12.0, 17.0, 14.0, 12.0, 16.0, 17.0, 27.0, 24.0, 31.0, 31.0, 33.0, 24.0, 39.0, 41.0, 39.0, 39.0, 45.0, 40.0, 57.0, 42.0, 45.0, 36.0, 35.0, 40.0, 28.0, 32.0, 14.0, 31.0, 14.0, 15.0, 18.0, 18.0, 16.0, 13.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-44.88050079345703, -43.524410247802734, -42.16831970214844, -40.812225341796875, -39.45613479614258, -38.10004425048828, -36.74394989013672, -35.38785934448242, -34.031768798828125, -32.67567825317383, -31.3195858001709, -29.96349334716797, -28.607402801513672, -27.251312255859375, -25.895219802856445, -24.539127349853516, -23.18303680419922, -21.826946258544922, -20.470853805541992, -19.114761352539062, -17.758670806884766, -16.40258026123047, -15.046487808227539, -13.690396308898926, -12.334304809570312, -10.9782133102417, -9.622121810913086, -8.266030311584473, -6.909938812255859, -5.553847312927246, -4.197755813598633, -2.8416643142700195, -1.4855690002441406, -0.12947750091552734, 1.226613998413086, 2.582705497741699, 3.9387969970703125, 5.294888496398926, 6.650979995727539, 8.007071495056152, 9.363162994384766, 10.719254493713379, 12.075345993041992, 13.431437492370605, 14.787528991699219, 16.143619537353516, 17.499711990356445, 18.855804443359375, 20.211894989013672, 21.56798553466797, 22.9240779876709, 24.280170440673828, 25.636260986328125, 26.992351531982422, 28.34844398498535, 29.70453643798828, 31.060626983642578, 32.416717529296875, 33.77281188964844, 35.128902435302734, 36.48499298095703, 37.84108352661133, 39.197174072265625, 40.55326843261719, 41.909358978271484]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 8.0, 3.0, 4.0, 7.0, 10.0, 12.0, 16.0, 19.0, 24.0, 20.0, 21.0, 27.0, 26.0, 25.0, 31.0, 37.0, 37.0, 35.0, 39.0, 36.0, 51.0, 38.0, 41.0, 29.0, 34.0, 39.0, 37.0, 30.0, 39.0, 37.0, 28.0, 44.0, 24.0, 13.0, 17.0, 10.0, 16.0, 17.0, 4.0, 5.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.1680908203125, -4.004150390625, -3.8402099609375, -3.67626953125, -3.5123291015625, -3.348388671875, -3.1844482421875, -3.0205078125, -2.8565673828125, -2.692626953125, -2.5286865234375, -2.36474609375, -2.2008056640625, -2.036865234375, -1.8729248046875, -1.708984375, -1.5450439453125, -1.381103515625, -1.2171630859375, -1.05322265625, -0.8892822265625, -0.725341796875, -0.5614013671875, -0.3974609375, -0.2335205078125, -0.069580078125, 0.0943603515625, 0.25830078125, 0.4222412109375, 0.586181640625, 0.7501220703125, 0.9140625, 1.0780029296875, 1.241943359375, 1.4058837890625, 1.56982421875, 1.7337646484375, 1.897705078125, 2.0616455078125, 2.2255859375, 2.3895263671875, 2.553466796875, 2.7174072265625, 2.88134765625, 3.0452880859375, 3.209228515625, 3.3731689453125, 3.537109375, 3.7010498046875, 3.864990234375, 4.0289306640625, 4.19287109375, 4.3568115234375, 4.520751953125, 4.6846923828125, 4.8486328125, 5.0125732421875, 5.176513671875, 5.3404541015625, 5.50439453125, 5.6683349609375, 5.832275390625, 5.9962158203125, 6.16015625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 8.0, 3.0, 4.0, 5.0, 7.0, 12.0, 23.0, 30.0, 31.0, 32.0, 40.0, 60.0, 116.0, 169.0, 269.0, 422.0, 706.0, 1108.0, 1890.0, 3581.0, 7338.0, 18342.0, 62491.0, 315747.0, 1309386.0, 1780655.0, 542821.0, 103068.0, 26003.0, 9719.0, 4454.0, 2333.0, 1289.0, 760.0, 476.0, 264.0, 186.0, 125.0, 75.0, 66.0, 47.0, 36.0, 16.0, 23.0, 8.0, 15.0, 10.0, 11.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-7.66015625, -7.41436767578125, -7.1685791015625, -6.92279052734375, -6.677001953125, -6.43121337890625, -6.1854248046875, -5.93963623046875, -5.69384765625, -5.44805908203125, -5.2022705078125, -4.95648193359375, -4.710693359375, -4.46490478515625, -4.2191162109375, -3.97332763671875, -3.7275390625, -3.48175048828125, -3.2359619140625, -2.99017333984375, -2.744384765625, -2.49859619140625, -2.2528076171875, -2.00701904296875, -1.76123046875, -1.51544189453125, -1.2696533203125, -1.02386474609375, -0.778076171875, -0.53228759765625, -0.2864990234375, -0.04071044921875, 0.205078125, 0.45086669921875, 0.6966552734375, 0.94244384765625, 1.188232421875, 1.43402099609375, 1.6798095703125, 1.92559814453125, 2.17138671875, 2.41717529296875, 2.6629638671875, 2.90875244140625, 3.154541015625, 3.40032958984375, 3.6461181640625, 3.89190673828125, 4.1376953125, 4.38348388671875, 4.6292724609375, 4.87506103515625, 5.120849609375, 5.36663818359375, 5.6124267578125, 5.85821533203125, 6.10400390625, 6.34979248046875, 6.5955810546875, 6.84136962890625, 7.087158203125, 7.33294677734375, 7.5787353515625, 7.82452392578125, 8.0703125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 6.0, 16.0, 26.0, 34.0, 40.0, 94.0, 185.0, 318.0, 506.0, 791.0, 818.0, 530.0, 304.0, 182.0, 95.0, 58.0, 27.0, 17.0, 15.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -16.045654296875, -15.52880859375, -15.011962890625, -14.4951171875, -13.978271484375, -13.46142578125, -12.944580078125, -12.427734375, -11.910888671875, -11.39404296875, -10.877197265625, -10.3603515625, -9.843505859375, -9.32666015625, -8.809814453125, -8.29296875, -7.776123046875, -7.25927734375, -6.742431640625, -6.2255859375, -5.708740234375, -5.19189453125, -4.675048828125, -4.158203125, -3.641357421875, -3.12451171875, -2.607666015625, -2.0908203125, -1.573974609375, -1.05712890625, -0.540283203125, -0.0234375, 0.493408203125, 1.01025390625, 1.527099609375, 2.0439453125, 2.560791015625, 3.07763671875, 3.594482421875, 4.111328125, 4.628173828125, 5.14501953125, 5.661865234375, 6.1787109375, 6.695556640625, 7.21240234375, 7.729248046875, 8.24609375, 8.762939453125, 9.27978515625, 9.796630859375, 10.3134765625, 10.830322265625, 11.34716796875, 11.864013671875, 12.380859375, 12.897705078125, 13.41455078125, 13.931396484375, 14.4482421875, 14.965087890625, 15.48193359375, 15.998779296875, 16.515625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 16.0, 18.0, 44.0, 67.0, 182.0, 390.0, 1045.0, 4238.0, 471465.0, 3702201.0, 11801.0, 1739.0, 565.0, 258.0, 82.0, 51.0, 51.0, 17.0, 16.0, 4.0, 9.0, 6.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.21875, -35.0576171875, -33.896484375, -32.7353515625, -31.57421875, -30.4130859375, -29.251953125, -28.0908203125, -26.9296875, -25.7685546875, -24.607421875, -23.4462890625, -22.28515625, -21.1240234375, -19.962890625, -18.8017578125, -17.640625, -16.4794921875, -15.318359375, -14.1572265625, -12.99609375, -11.8349609375, -10.673828125, -9.5126953125, -8.3515625, -7.1904296875, -6.029296875, -4.8681640625, -3.70703125, -2.5458984375, -1.384765625, -0.2236328125, 0.9375, 2.0986328125, 3.259765625, 4.4208984375, 5.58203125, 6.7431640625, 7.904296875, 9.0654296875, 10.2265625, 11.3876953125, 12.548828125, 13.7099609375, 14.87109375, 16.0322265625, 17.193359375, 18.3544921875, 19.515625, 20.6767578125, 21.837890625, 22.9990234375, 24.16015625, 25.3212890625, 26.482421875, 27.6435546875, 28.8046875, 29.9658203125, 31.126953125, 32.2880859375, 33.44921875, 34.6103515625, 35.771484375, 36.9326171875, 38.09375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 222.0, 592.0, 182.0, 10.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.44705200195312, -153.61192321777344, -146.77679443359375, -139.94166564941406, -133.10653686523438, -126.27140808105469, -119.436279296875, -112.60115051269531, -105.76602172851562, -98.93089294433594, -92.09576416015625, -85.26063537597656, -78.42550659179688, -71.59037780761719, -64.7552490234375, -57.92012405395508, -51.084999084472656, -44.24987030029297, -37.41474151611328, -30.579614639282227, -23.74448585510254, -16.909358978271484, -10.074230194091797, -3.2391014099121094, 3.596027374267578, 10.431156158447266, 17.266284942626953, 24.101411819458008, 30.936540603637695, 37.77166748046875, 44.60679626464844, 51.441925048828125, 58.27705383300781, 65.1121826171875, 71.94731140136719, 78.78244018554688, 85.61756896972656, 92.45269775390625, 99.28782653808594, 106.12295532226562, 112.95808410644531, 119.793212890625, 126.62834167480469, 133.46347045898438, 140.29859924316406, 147.13372802734375, 153.96885681152344, 160.80398559570312, 167.63909912109375, 174.47422790527344, 181.30935668945312, 188.1444854736328, 194.9796142578125, 201.8147430419922, 208.64987182617188, 215.48500061035156, 222.32012939453125, 229.15525817871094, 235.99038696289062, 242.8255157470703, 249.66064453125, 256.4957580566406, 263.3309020996094, 270.166015625, 277.00115966796875]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 6.0, 5.0, 11.0, 19.0, 21.0, 21.0, 25.0, 25.0, 38.0, 45.0, 29.0, 34.0, 40.0, 39.0, 44.0, 51.0, 48.0, 50.0, 49.0, 50.0, 41.0, 40.0, 38.0, 37.0, 35.0, 26.0, 30.0, 22.0, 14.0, 14.0, 11.0, 6.0, 4.0, 9.0, 6.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.47022247314453, -35.155433654785156, -33.84064483642578, -32.52585983276367, -31.211071014404297, -29.896282196044922, -28.581493377685547, -27.266706466674805, -25.951919555664062, -24.637130737304688, -23.322343826293945, -22.00755500793457, -20.692768096923828, -19.377979278564453, -18.063190460205078, -16.748403549194336, -15.433614730834961, -14.118826866149902, -12.804039001464844, -11.489250183105469, -10.174463272094727, -8.859674453735352, -7.544886589050293, -6.230098724365234, -4.915310859680176, -3.600522994995117, -2.2857348918914795, -0.9709467887878418, 0.3438410758972168, 1.6586289405822754, 2.973417282104492, 4.288205146789551, 5.602993011474609, 6.917780876159668, 8.232568740844727, 9.547357559204102, 10.862144470214844, 12.176933288574219, 13.491721153259277, 14.806509017944336, 16.121295928955078, 17.436084747314453, 18.750871658325195, 20.06566047668457, 21.380447387695312, 22.695236206054688, 24.010025024414062, 25.324811935424805, 26.63960075378418, 27.954389572143555, 29.269176483154297, 30.583965301513672, 31.898752212524414, 33.213539123535156, 34.52832794189453, 35.843116760253906, 37.15790557861328, 38.472694396972656, 39.78748321533203, 41.10226821899414, 42.417057037353516, 43.73184585571289, 45.046634674072266, 46.361419677734375, 47.67620849609375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 7.0, 1.0, 3.0, 2.0, 3.0, 10.0, 6.0, 14.0, 9.0, 11.0, 12.0, 21.0, 11.0, 27.0, 21.0, 31.0, 29.0, 38.0, 26.0, 41.0, 48.0, 35.0, 41.0, 57.0, 40.0, 39.0, 43.0, 37.0, 36.0, 24.0, 28.0, 32.0, 30.0, 35.0, 32.0, 16.0, 21.0, 19.0, 18.0, 17.0, 9.0, 12.0, 6.0, 3.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69140625, -3.56146240234375, -3.4315185546875, -3.30157470703125, -3.171630859375, -3.04168701171875, -2.9117431640625, -2.78179931640625, -2.65185546875, -2.52191162109375, -2.3919677734375, -2.26202392578125, -2.132080078125, -2.00213623046875, -1.8721923828125, -1.74224853515625, -1.6123046875, -1.48236083984375, -1.3524169921875, -1.22247314453125, -1.092529296875, -0.96258544921875, -0.8326416015625, -0.70269775390625, -0.57275390625, -0.44281005859375, -0.3128662109375, -0.18292236328125, -0.052978515625, 0.07696533203125, 0.2069091796875, 0.33685302734375, 0.466796875, 0.59674072265625, 0.7266845703125, 0.85662841796875, 0.986572265625, 1.11651611328125, 1.2464599609375, 1.37640380859375, 1.50634765625, 1.63629150390625, 1.7662353515625, 1.89617919921875, 2.026123046875, 2.15606689453125, 2.2860107421875, 2.41595458984375, 2.5458984375, 2.67584228515625, 2.8057861328125, 2.93572998046875, 3.065673828125, 3.19561767578125, 3.3255615234375, 3.45550537109375, 3.58544921875, 3.71539306640625, 3.8453369140625, 3.97528076171875, 4.105224609375, 4.23516845703125, 4.3651123046875, 4.49505615234375, 4.625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 13.0, 12.0, 23.0, 30.0, 32.0, 61.0, 76.0, 131.0, 169.0, 344.0, 526.0, 864.0, 1484.0, 2523.0, 4145.0, 7120.0, 12542.0, 21545.0, 37100.0, 64034.0, 108306.0, 170550.0, 208818.0, 162724.0, 102207.0, 60141.0, 34770.0, 20097.0, 11676.0, 6736.0, 3912.0, 2308.0, 1323.0, 862.0, 484.0, 294.0, 203.0, 105.0, 78.0, 51.0, 43.0, 27.0, 23.0, 14.0, 5.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3359375, -0.3252525329589844, -0.31456756591796875, -0.3038825988769531, -0.2931976318359375, -0.2825126647949219, -0.27182769775390625, -0.2611427307128906, -0.250457763671875, -0.23977279663085938, -0.22908782958984375, -0.21840286254882812, -0.2077178955078125, -0.19703292846679688, -0.18634796142578125, -0.17566299438476562, -0.16497802734375, -0.15429306030273438, -0.14360809326171875, -0.13292312622070312, -0.1222381591796875, -0.11155319213867188, -0.10086822509765625, -0.09018325805664062, -0.079498291015625, -0.06881332397460938, -0.05812835693359375, -0.047443389892578125, -0.0367584228515625, -0.026073455810546875, -0.01538848876953125, -0.004703521728515625, 0.0059814453125, 0.016666412353515625, 0.02735137939453125, 0.038036346435546875, 0.0487213134765625, 0.059406280517578125, 0.07009124755859375, 0.08077621459960938, 0.091461181640625, 0.10214614868164062, 0.11283111572265625, 0.12351608276367188, 0.1342010498046875, 0.14488601684570312, 0.15557098388671875, 0.16625595092773438, 0.17694091796875, 0.18762588500976562, 0.19831085205078125, 0.20899581909179688, 0.2196807861328125, 0.23036575317382812, 0.24105072021484375, 0.2517356872558594, 0.262420654296875, 0.2731056213378906, 0.28379058837890625, 0.2944755554199219, 0.3051605224609375, 0.3158454895019531, 0.32653045654296875, 0.3372154235839844, 0.347900390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 2.0, 10.0, 11.0, 10.0, 18.0, 16.0, 13.0, 14.0, 16.0, 17.0, 30.0, 21.0, 26.0, 29.0, 42.0, 38.0, 33.0, 34.0, 40.0, 36.0, 34.0, 1055.0, 58.0, 37.0, 42.0, 34.0, 31.0, 27.0, 31.0, 25.0, 28.0, 20.0, 22.0, 20.0, 15.0, 14.0, 9.0, 11.0, 7.0, 7.0, 10.0, 5.0, 12.0, 1.0, 5.0, 1.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.478515625, -2.401397705078125, -2.32427978515625, -2.247161865234375, -2.1700439453125, -2.092926025390625, -2.01580810546875, -1.938690185546875, -1.861572265625, -1.784454345703125, -1.70733642578125, -1.630218505859375, -1.5531005859375, -1.475982666015625, -1.39886474609375, -1.321746826171875, -1.24462890625, -1.167510986328125, -1.09039306640625, -1.013275146484375, -0.9361572265625, -0.859039306640625, -0.78192138671875, -0.704803466796875, -0.627685546875, -0.550567626953125, -0.47344970703125, -0.396331787109375, -0.3192138671875, -0.242095947265625, -0.16497802734375, -0.087860107421875, -0.0107421875, 0.066375732421875, 0.14349365234375, 0.220611572265625, 0.2977294921875, 0.374847412109375, 0.45196533203125, 0.529083251953125, 0.606201171875, 0.683319091796875, 0.76043701171875, 0.837554931640625, 0.9146728515625, 0.991790771484375, 1.06890869140625, 1.146026611328125, 1.22314453125, 1.300262451171875, 1.37738037109375, 1.454498291015625, 1.5316162109375, 1.608734130859375, 1.68585205078125, 1.762969970703125, 1.840087890625, 1.917205810546875, 1.99432373046875, 2.071441650390625, 2.1485595703125, 2.225677490234375, 2.30279541015625, 2.379913330078125, 2.45703125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 9.0, 13.0, 13.0, 29.0, 38.0, 51.0, 76.0, 117.0, 176.0, 262.0, 346.0, 499.0, 770.0, 1115.0, 1756.0, 2686.0, 3919.0, 6103.0, 9100.0, 13717.0, 20464.0, 30231.0, 43933.0, 62985.0, 86739.0, 112985.0, 970444.0, 341673.0, 110859.0, 84500.0, 61108.0, 42674.0, 29265.0, 19536.0, 12996.0, 8801.0, 5741.0, 3853.0, 2558.0, 1659.0, 1034.0, 728.0, 508.0, 364.0, 229.0, 162.0, 109.0, 66.0, 37.0, 39.0, 24.0, 15.0, 6.0, 8.0, 1.0, 3.0, 5.0, 2.0, 3.0, 1.0], "bins": [-0.17138671875, -0.1658496856689453, -0.16031265258789062, -0.15477561950683594, -0.14923858642578125, -0.14370155334472656, -0.13816452026367188, -0.1326274871826172, -0.1270904541015625, -0.12155342102050781, -0.11601638793945312, -0.11047935485839844, -0.10494232177734375, -0.09940528869628906, -0.09386825561523438, -0.08833122253417969, -0.082794189453125, -0.07725715637207031, -0.07172012329101562, -0.06618309020996094, -0.06064605712890625, -0.05510902404785156, -0.049571990966796875, -0.04403495788574219, -0.0384979248046875, -0.03296089172363281, -0.027423858642578125, -0.021886825561523438, -0.01634979248046875, -0.010812759399414062, -0.005275726318359375, 0.0002613067626953125, 0.00579833984375, 0.011335372924804688, 0.016872406005859375, 0.022409439086914062, 0.02794647216796875, 0.03348350524902344, 0.039020538330078125, 0.04455757141113281, 0.0500946044921875, 0.05563163757324219, 0.061168670654296875, 0.06670570373535156, 0.07224273681640625, 0.07777976989746094, 0.08331680297851562, 0.08885383605957031, 0.094390869140625, 0.09992790222167969, 0.10546493530273438, 0.11100196838378906, 0.11653900146484375, 0.12207603454589844, 0.12761306762695312, 0.1331501007080078, 0.1386871337890625, 0.1442241668701172, 0.14976119995117188, 0.15529823303222656, 0.16083526611328125, 0.16637229919433594, 0.17190933227539062, 0.1774463653564453, 0.1829833984375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 6.0, 7.0, 9.0, 16.0, 13.0, 25.0, 19.0, 44.0, 41.0, 49.0, 76.0, 83.0, 108.0, 101.0, 89.0, 66.0, 56.0, 48.0, 30.0, 26.0, 15.0, 17.0, 14.0, 10.0, 9.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00672149658203125, -0.006494998931884766, -0.006268501281738281, -0.006042003631591797, -0.0058155059814453125, -0.005589008331298828, -0.005362510681152344, -0.005136013031005859, -0.004909515380859375, -0.004683017730712891, -0.004456520080566406, -0.004230022430419922, -0.0040035247802734375, -0.003777027130126953, -0.0035505294799804688, -0.0033240318298339844, -0.0030975341796875, -0.0028710365295410156, -0.0026445388793945312, -0.002418041229248047, -0.0021915435791015625, -0.001965045928955078, -0.0017385482788085938, -0.0015120506286621094, -0.001285552978515625, -0.0010590553283691406, -0.0008325576782226562, -0.0006060600280761719, -0.0003795623779296875, -0.00015306472778320312, 7.343292236328125e-05, 0.0002999305725097656, 0.00052642822265625, 0.0007529258728027344, 0.0009794235229492188, 0.0012059211730957031, 0.0014324188232421875, 0.0016589164733886719, 0.0018854141235351562, 0.0021119117736816406, 0.002338409423828125, 0.0025649070739746094, 0.0027914047241210938, 0.003017902374267578, 0.0032444000244140625, 0.003470897674560547, 0.0036973953247070312, 0.003923892974853516, 0.004150390625, 0.004376888275146484, 0.004603385925292969, 0.004829883575439453, 0.0050563812255859375, 0.005282878875732422, 0.005509376525878906, 0.005735874176025391, 0.005962371826171875, 0.006188869476318359, 0.006415367126464844, 0.006641864776611328, 0.0068683624267578125, 0.007094860076904297, 0.007321357727050781, 0.007547855377197266, 0.00777435302734375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 4.0, 12.0, 12.0, 17.0, 22.0, 23.0, 33.0, 30.0, 55.0, 71.0, 118.0, 171.0, 264.0, 458.0, 1132.0, 36174.0, 999684.0, 8465.0, 745.0, 345.0, 228.0, 134.0, 100.0, 67.0, 38.0, 44.0, 19.0, 17.0, 15.0, 12.0, 9.0, 8.0, 5.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1328125, -0.12894725799560547, -0.12508201599121094, -0.1212167739868164, -0.11735153198242188, -0.11348628997802734, -0.10962104797363281, -0.10575580596923828, -0.10189056396484375, -0.09802532196044922, -0.09416007995605469, -0.09029483795166016, -0.08642959594726562, -0.0825643539428711, -0.07869911193847656, -0.07483386993408203, -0.0709686279296875, -0.06710338592529297, -0.06323814392089844, -0.059372901916503906, -0.055507659912109375, -0.051642417907714844, -0.04777717590332031, -0.04391193389892578, -0.04004669189453125, -0.03618144989013672, -0.03231620788574219, -0.028450965881347656, -0.024585723876953125, -0.020720481872558594, -0.016855239868164062, -0.012989997863769531, -0.009124755859375, -0.005259513854980469, -0.0013942718505859375, 0.0024709701538085938, 0.006336212158203125, 0.010201454162597656, 0.014066696166992188, 0.01793193817138672, 0.02179718017578125, 0.02566242218017578, 0.029527664184570312, 0.033392906188964844, 0.037258148193359375, 0.041123390197753906, 0.04498863220214844, 0.04885387420654297, 0.0527191162109375, 0.05658435821533203, 0.06044960021972656, 0.0643148422241211, 0.06818008422851562, 0.07204532623291016, 0.07591056823730469, 0.07977581024169922, 0.08364105224609375, 0.08750629425048828, 0.09137153625488281, 0.09523677825927734, 0.09910202026367188, 0.1029672622680664, 0.10683250427246094, 0.11069774627685547, 0.11456298828125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 450.0, 552.0, 9.0], "bins": [-0.14696530997753143, -0.1445966511964798, -0.14222797751426697, -0.13985931873321533, -0.1374906450510025, -0.13512198626995087, -0.13275332748889923, -0.1303846538066864, -0.12801599502563477, -0.12564733624458313, -0.1232786625623703, -0.12091000378131866, -0.11854133754968643, -0.1161726713180542, -0.11380400508642197, -0.11143533885478973, -0.1090666726231575, -0.10669800639152527, -0.10432934015989304, -0.1019606813788414, -0.09959201514720917, -0.09722334891557693, -0.0948546826839447, -0.09248601645231247, -0.09011735022068024, -0.087748683989048, -0.08538001775741577, -0.08301135897636414, -0.0806426927447319, -0.07827402651309967, -0.07590536028146744, -0.0735366940498352, -0.07116802781820297, -0.06879936158657074, -0.06643069535493851, -0.06406203657388687, -0.06169337034225464, -0.059324704110622406, -0.05695603787899017, -0.05458737164735794, -0.052218709141016006, -0.049850042909383774, -0.04748138040304184, -0.04511271417140961, -0.042744047939777374, -0.04037538543343544, -0.03800671920180321, -0.03563805669546127, -0.03326939046382904, -0.030900726094841957, -0.028532061725854874, -0.02616339549422264, -0.023794731125235558, -0.021426066756248474, -0.01905740052461624, -0.016688736155629158, -0.014320071786642075, -0.011951407417654991, -0.009582742117345333, -0.007214077282696962, -0.004845412448048592, -0.002476748079061508, -0.00010808277875185013, 0.002260582521557808, 0.004629246890544891]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 15.0, 17.0, 26.0, 41.0, 39.0, 61.0, 77.0, 86.0, 86.0, 91.0, 107.0, 77.0, 68.0, 56.0, 47.0, 38.0, 34.0, 21.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012537539005279541, -0.012221626937389374, -0.011905714869499207, -0.01158980280160904, -0.011273890733718872, -0.010957978665828705, -0.010642066597938538, -0.01032615453004837, -0.010010242462158203, -0.009694330394268036, -0.009378418326377869, -0.009062506258487701, -0.008746594190597534, -0.008430682122707367, -0.0081147700548172, -0.0077988579869270325, -0.007482945919036865, -0.007167033851146698, -0.006851121783256531, -0.0065352097153663635, -0.006219297647476196, -0.005903385579586029, -0.005587473511695862, -0.005271561443805695, -0.004955649375915527, -0.00463973730802536, -0.004323825240135193, -0.004007913172245026, -0.0036920011043548584, -0.003376089036464691, -0.003060176968574524, -0.0027442649006843567, -0.0024283528327941895, -0.002112440764904022, -0.001796528697013855, -0.0014806166291236877, -0.0011647045612335205, -0.0008487924933433533, -0.000532880425453186, -0.0002169683575630188, 9.894371032714844e-05, 0.0004148557782173157, 0.0007307678461074829, 0.0010466799139976501, 0.0013625919818878174, 0.0016785040497779846, 0.001994416117668152, 0.002310328185558319, 0.0026262402534484863, 0.0029421523213386536, 0.003258064389228821, 0.003573976457118988, 0.0038898885250091553, 0.0042058005928993225, 0.00452171266078949, 0.004837624728679657, 0.005153536796569824, 0.0054694488644599915, 0.005785360932350159, 0.006101273000240326, 0.006417185068130493, 0.00673309713602066, 0.007049009203910828, 0.007364921271800995, 0.007680833339691162]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 7.0, 1.0, 3.0, 2.0, 3.0, 10.0, 6.0, 14.0, 9.0, 11.0, 12.0, 21.0, 11.0, 27.0, 20.0, 32.0, 29.0, 38.0, 26.0, 41.0, 48.0, 35.0, 41.0, 56.0, 41.0, 39.0, 43.0, 37.0, 36.0, 24.0, 28.0, 32.0, 30.0, 35.0, 32.0, 16.0, 21.0, 19.0, 18.0, 17.0, 9.0, 12.0, 6.0, 3.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69140625, -3.56146240234375, -3.4315185546875, -3.30157470703125, -3.171630859375, -3.04168701171875, -2.9117431640625, -2.78179931640625, -2.65185546875, -2.52191162109375, -2.3919677734375, -2.26202392578125, -2.132080078125, -2.00213623046875, -1.8721923828125, -1.74224853515625, -1.6123046875, -1.48236083984375, -1.3524169921875, -1.22247314453125, -1.092529296875, -0.96258544921875, -0.8326416015625, -0.70269775390625, -0.57275390625, -0.44281005859375, -0.3128662109375, -0.18292236328125, -0.052978515625, 0.07696533203125, 0.2069091796875, 0.33685302734375, 0.466796875, 0.59674072265625, 0.7266845703125, 0.85662841796875, 0.986572265625, 1.11651611328125, 1.2464599609375, 1.37640380859375, 1.50634765625, 1.63629150390625, 1.7662353515625, 1.89617919921875, 2.026123046875, 2.15606689453125, 2.2860107421875, 2.41595458984375, 2.5458984375, 2.67584228515625, 2.8057861328125, 2.93572998046875, 3.065673828125, 3.19561767578125, 3.3255615234375, 3.45550537109375, 3.58544921875, 3.71539306640625, 3.8453369140625, 3.97528076171875, 4.105224609375, 4.23516845703125, 4.3651123046875, 4.49505615234375, 4.625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 5.0, 14.0, 17.0, 9.0, 12.0, 16.0, 25.0, 35.0, 41.0, 58.0, 70.0, 93.0, 109.0, 150.0, 215.0, 281.0, 397.0, 528.0, 864.0, 1283.0, 2306.0, 4886.0, 12003.0, 40957.0, 208818.0, 559782.0, 161393.0, 33528.0, 10302.0, 4286.0, 2081.0, 1202.0, 782.0, 486.0, 369.0, 267.0, 212.0, 156.0, 142.0, 88.0, 74.0, 56.0, 41.0, 23.0, 25.0, 13.0, 21.0, 15.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0078125, -5.80364990234375, -5.5994873046875, -5.39532470703125, -5.191162109375, -4.98699951171875, -4.7828369140625, -4.57867431640625, -4.37451171875, -4.17034912109375, -3.9661865234375, -3.76202392578125, -3.557861328125, -3.35369873046875, -3.1495361328125, -2.94537353515625, -2.7412109375, -2.53704833984375, -2.3328857421875, -2.12872314453125, -1.924560546875, -1.72039794921875, -1.5162353515625, -1.31207275390625, -1.10791015625, -0.90374755859375, -0.6995849609375, -0.49542236328125, -0.291259765625, -0.08709716796875, 0.1170654296875, 0.32122802734375, 0.525390625, 0.72955322265625, 0.9337158203125, 1.13787841796875, 1.342041015625, 1.54620361328125, 1.7503662109375, 1.95452880859375, 2.15869140625, 2.36285400390625, 2.5670166015625, 2.77117919921875, 2.975341796875, 3.17950439453125, 3.3836669921875, 3.58782958984375, 3.7919921875, 3.99615478515625, 4.2003173828125, 4.40447998046875, 4.608642578125, 4.81280517578125, 5.0169677734375, 5.22113037109375, 5.42529296875, 5.62945556640625, 5.8336181640625, 6.03778076171875, 6.241943359375, 6.44610595703125, 6.6502685546875, 6.85443115234375, 7.05859375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 5.0, 6.0, 9.0, 9.0, 7.0, 5.0, 16.0, 15.0, 15.0, 24.0, 36.0, 31.0, 45.0, 48.0, 52.0, 73.0, 114.0, 297.0, 1487.0, 251.0, 122.0, 65.0, 58.0, 57.0, 36.0, 41.0, 26.0, 24.0, 12.0, 8.0, 8.0, 7.0, 8.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-15.0703125, -14.6456298828125, -14.220947265625, -13.7962646484375, -13.37158203125, -12.9468994140625, -12.522216796875, -12.0975341796875, -11.6728515625, -11.2481689453125, -10.823486328125, -10.3988037109375, -9.97412109375, -9.5494384765625, -9.124755859375, -8.7000732421875, -8.275390625, -7.8507080078125, -7.426025390625, -7.0013427734375, -6.57666015625, -6.1519775390625, -5.727294921875, -5.3026123046875, -4.8779296875, -4.4532470703125, -4.028564453125, -3.6038818359375, -3.17919921875, -2.7545166015625, -2.329833984375, -1.9051513671875, -1.48046875, -1.0557861328125, -0.631103515625, -0.2064208984375, 0.21826171875, 0.6429443359375, 1.067626953125, 1.4923095703125, 1.9169921875, 2.3416748046875, 2.766357421875, 3.1910400390625, 3.61572265625, 4.0404052734375, 4.465087890625, 4.8897705078125, 5.314453125, 5.7391357421875, 6.163818359375, 6.5885009765625, 7.01318359375, 7.4378662109375, 7.862548828125, 8.2872314453125, 8.7119140625, 9.1365966796875, 9.561279296875, 9.9859619140625, 10.41064453125, 10.8353271484375, 11.260009765625, 11.6846923828125, 12.109375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 7.0, 5.0, 12.0, 10.0, 16.0, 15.0, 37.0, 41.0, 76.0, 92.0, 142.0, 224.0, 398.0, 1025.0, 5680.0, 3076984.0, 57437.0, 1921.0, 631.0, 320.0, 152.0, 121.0, 101.0, 58.0, 44.0, 40.0, 32.0, 12.0, 20.0, 12.0, 14.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.671875, -26.674072265625, -25.67626953125, -24.678466796875, -23.6806640625, -22.682861328125, -21.68505859375, -20.687255859375, -19.689453125, -18.691650390625, -17.69384765625, -16.696044921875, -15.6982421875, -14.700439453125, -13.70263671875, -12.704833984375, -11.70703125, -10.709228515625, -9.71142578125, -8.713623046875, -7.7158203125, -6.718017578125, -5.72021484375, -4.722412109375, -3.724609375, -2.726806640625, -1.72900390625, -0.731201171875, 0.2666015625, 1.264404296875, 2.26220703125, 3.260009765625, 4.2578125, 5.255615234375, 6.25341796875, 7.251220703125, 8.2490234375, 9.246826171875, 10.24462890625, 11.242431640625, 12.240234375, 13.238037109375, 14.23583984375, 15.233642578125, 16.2314453125, 17.229248046875, 18.22705078125, 19.224853515625, 20.22265625, 21.220458984375, 22.21826171875, 23.216064453125, 24.2138671875, 25.211669921875, 26.20947265625, 27.207275390625, 28.205078125, 29.202880859375, 30.20068359375, 31.198486328125, 32.1962890625, 33.194091796875, 34.19189453125, 35.189697265625, 36.1875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 172.0, 827.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-382.6285400390625, -375.70989990234375, -368.7912292480469, -361.8725891113281, -354.95391845703125, -348.0352783203125, -341.1166076660156, -334.1979675292969, -327.279296875, -320.36065673828125, -313.4419860839844, -306.5233459472656, -299.60467529296875, -292.68603515625, -285.7673645019531, -278.8487243652344, -271.9300537109375, -265.01141357421875, -258.0927429199219, -251.17408752441406, -244.25543212890625, -237.33677673339844, -230.41812133789062, -223.4994659423828, -216.58082580566406, -209.66217041015625, -202.74351501464844, -195.82485961914062, -188.9062042236328, -181.987548828125, -175.0688934326172, -168.15023803710938, -161.23159790039062, -154.3129425048828, -147.394287109375, -140.4756317138672, -133.55697631835938, -126.63832092285156, -119.71966552734375, -112.80101013183594, -105.88235473632812, -98.96369934082031, -92.0450439453125, -85.12638854980469, -78.20773315429688, -71.28907775878906, -64.37042236328125, -57.4517707824707, -50.533111572265625, -43.61445617675781, -36.69580078125, -29.77714729309082, -22.858491897583008, -15.939838409423828, -9.021183013916016, -2.102527618408203, 4.816127777099609, 11.734783172607422, 18.653438568115234, 25.572092056274414, 32.490745544433594, 39.409400939941406, 46.32805633544922, 53.24671173095703, 60.165367126464844]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 5.0, 9.0, 7.0, 7.0, 9.0, 9.0, 14.0, 9.0, 19.0, 19.0, 18.0, 27.0, 36.0, 30.0, 27.0, 34.0, 36.0, 48.0, 38.0, 40.0, 38.0, 40.0, 38.0, 49.0, 41.0, 29.0, 31.0, 26.0, 30.0, 34.0, 32.0, 25.0, 25.0, 17.0, 19.0, 15.0, 18.0, 10.0, 11.0, 7.0, 4.0, 11.0, 6.0, 1.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.71405029296875, -25.867168426513672, -25.020286560058594, -24.173404693603516, -23.326522827148438, -22.47964096069336, -21.63275909423828, -20.785877227783203, -19.938995361328125, -19.092113494873047, -18.24523162841797, -17.39834976196289, -16.551467895507812, -15.704586029052734, -14.857704162597656, -14.010822296142578, -13.163941383361816, -12.317059516906738, -11.47017765045166, -10.623295783996582, -9.776413917541504, -8.929533004760742, -8.082651138305664, -7.235768795013428, -6.38888692855835, -5.5420050621032715, -4.695123195648193, -3.8482415676116943, -3.001359701156616, -2.154478073120117, -1.307596206665039, -0.46071434020996094, 0.3861675262451172, 1.2330493927001953, 2.0799312591552734, 2.9268128871917725, 3.7736947536468506, 4.62057638168335, 5.467458248138428, 6.314340114593506, 7.161221981048584, 8.008103370666504, 8.854985237121582, 9.70186710357666, 10.548748970031738, 11.395630836486816, 12.242512702941895, 13.089394569396973, 13.93627643585205, 14.783158302307129, 15.630040168762207, 16.47692108154297, 17.323802947998047, 18.170684814453125, 19.017566680908203, 19.86444854736328, 20.71133041381836, 21.558212280273438, 22.405094146728516, 23.251976013183594, 24.098857879638672, 24.94573974609375, 25.792621612548828, 26.639503479003906, 27.486385345458984]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 5.0, 5.0, 14.0, 13.0, 14.0, 19.0, 19.0, 21.0, 27.0, 33.0, 38.0, 36.0, 49.0, 31.0, 40.0, 28.0, 41.0, 40.0, 51.0, 53.0, 42.0, 42.0, 34.0, 43.0, 25.0, 32.0, 30.0, 24.0, 32.0, 26.0, 20.0, 11.0, 14.0, 11.0, 12.0, 4.0, 9.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0234375, -4.8665771484375, -4.709716796875, -4.5528564453125, -4.39599609375, -4.2391357421875, -4.082275390625, -3.9254150390625, -3.7685546875, -3.6116943359375, -3.454833984375, -3.2979736328125, -3.14111328125, -2.9842529296875, -2.827392578125, -2.6705322265625, -2.513671875, -2.3568115234375, -2.199951171875, -2.0430908203125, -1.88623046875, -1.7293701171875, -1.572509765625, -1.4156494140625, -1.2587890625, -1.1019287109375, -0.945068359375, -0.7882080078125, -0.63134765625, -0.4744873046875, -0.317626953125, -0.1607666015625, -0.00390625, 0.1529541015625, 0.309814453125, 0.4666748046875, 0.62353515625, 0.7803955078125, 0.937255859375, 1.0941162109375, 1.2509765625, 1.4078369140625, 1.564697265625, 1.7215576171875, 1.87841796875, 2.0352783203125, 2.192138671875, 2.3489990234375, 2.505859375, 2.6627197265625, 2.819580078125, 2.9764404296875, 3.13330078125, 3.2901611328125, 3.447021484375, 3.6038818359375, 3.7607421875, 3.9176025390625, 4.074462890625, 4.2313232421875, 4.38818359375, 4.5450439453125, 4.701904296875, 4.8587646484375, 5.015625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 8.0, 21.0, 17.0, 24.0, 36.0, 43.0, 65.0, 105.0, 137.0, 165.0, 239.0, 395.0, 517.0, 902.0, 1908.0, 6513.0, 106965.0, 3402130.0, 653414.0, 14672.0, 2746.0, 1093.0, 669.0, 428.0, 306.0, 205.0, 158.0, 113.0, 79.0, 50.0, 27.0, 27.0, 14.0, 18.0, 14.0, 9.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.953125, -23.1728515625, -22.392578125, -21.6123046875, -20.83203125, -20.0517578125, -19.271484375, -18.4912109375, -17.7109375, -16.9306640625, -16.150390625, -15.3701171875, -14.58984375, -13.8095703125, -13.029296875, -12.2490234375, -11.46875, -10.6884765625, -9.908203125, -9.1279296875, -8.34765625, -7.5673828125, -6.787109375, -6.0068359375, -5.2265625, -4.4462890625, -3.666015625, -2.8857421875, -2.10546875, -1.3251953125, -0.544921875, 0.2353515625, 1.015625, 1.7958984375, 2.576171875, 3.3564453125, 4.13671875, 4.9169921875, 5.697265625, 6.4775390625, 7.2578125, 8.0380859375, 8.818359375, 9.5986328125, 10.37890625, 11.1591796875, 11.939453125, 12.7197265625, 13.5, 14.2802734375, 15.060546875, 15.8408203125, 16.62109375, 17.4013671875, 18.181640625, 18.9619140625, 19.7421875, 20.5224609375, 21.302734375, 22.0830078125, 22.86328125, 23.6435546875, 24.423828125, 25.2041015625, 25.984375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 9.0, 9.0, 9.0, 13.0, 28.0, 36.0, 45.0, 90.0, 151.0, 239.0, 362.0, 512.0, 569.0, 577.0, 470.0, 313.0, 242.0, 156.0, 80.0, 60.0, 30.0, 27.0, 10.0, 10.0, 4.0, 3.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.421875, -10.0753173828125, -9.728759765625, -9.3822021484375, -9.03564453125, -8.6890869140625, -8.342529296875, -7.9959716796875, -7.6494140625, -7.3028564453125, -6.956298828125, -6.6097412109375, -6.26318359375, -5.9166259765625, -5.570068359375, -5.2235107421875, -4.876953125, -4.5303955078125, -4.183837890625, -3.8372802734375, -3.49072265625, -3.1441650390625, -2.797607421875, -2.4510498046875, -2.1044921875, -1.7579345703125, -1.411376953125, -1.0648193359375, -0.71826171875, -0.3717041015625, -0.025146484375, 0.3214111328125, 0.66796875, 1.0145263671875, 1.361083984375, 1.7076416015625, 2.05419921875, 2.4007568359375, 2.747314453125, 3.0938720703125, 3.4404296875, 3.7869873046875, 4.133544921875, 4.4801025390625, 4.82666015625, 5.1732177734375, 5.519775390625, 5.8663330078125, 6.212890625, 6.5594482421875, 6.906005859375, 7.2525634765625, 7.59912109375, 7.9456787109375, 8.292236328125, 8.6387939453125, 8.9853515625, 9.3319091796875, 9.678466796875, 10.0250244140625, 10.37158203125, 10.7181396484375, 11.064697265625, 11.4112548828125, 11.7578125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 1.0, 10.0, 8.0, 14.0, 12.0, 20.0, 40.0, 73.0, 160.0, 271.0, 610.0, 1419.0, 4572.0, 18353.0, 137790.0, 1471751.0, 2262970.0, 257803.0, 28990.0, 5994.0, 1920.0, 791.0, 337.0, 150.0, 85.0, 47.0, 26.0, 24.0, 16.0, 13.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.9921875, -11.6602783203125, -11.328369140625, -10.9964599609375, -10.66455078125, -10.3326416015625, -10.000732421875, -9.6688232421875, -9.3369140625, -9.0050048828125, -8.673095703125, -8.3411865234375, -8.00927734375, -7.6773681640625, -7.345458984375, -7.0135498046875, -6.681640625, -6.3497314453125, -6.017822265625, -5.6859130859375, -5.35400390625, -5.0220947265625, -4.690185546875, -4.3582763671875, -4.0263671875, -3.6944580078125, -3.362548828125, -3.0306396484375, -2.69873046875, -2.3668212890625, -2.034912109375, -1.7030029296875, -1.37109375, -1.0391845703125, -0.707275390625, -0.3753662109375, -0.04345703125, 0.2884521484375, 0.620361328125, 0.9522705078125, 1.2841796875, 1.6160888671875, 1.947998046875, 2.2799072265625, 2.61181640625, 2.9437255859375, 3.275634765625, 3.6075439453125, 3.939453125, 4.2713623046875, 4.603271484375, 4.9351806640625, 5.26708984375, 5.5989990234375, 5.930908203125, 6.2628173828125, 6.5947265625, 6.9266357421875, 7.258544921875, 7.5904541015625, 7.92236328125, 8.2542724609375, 8.586181640625, 8.9180908203125, 9.25]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 11.0, 9.0, 20.0, 29.0, 45.0, 53.0, 72.0, 86.0, 115.0, 107.0, 99.0, 100.0, 68.0, 60.0, 44.0, 25.0, 16.0, 9.0, 14.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.067909240722656, -37.87989807128906, -35.69188690185547, -33.503875732421875, -31.315866470336914, -29.12785530090332, -26.93984603881836, -24.751834869384766, -22.563823699951172, -20.375812530517578, -18.187801361083984, -15.999792098999023, -13.81178092956543, -11.623769760131836, -9.435759544372559, -7.247749328613281, -5.0597381591796875, -2.871727466583252, -0.6837167739868164, 1.5042939186096191, 3.6923046112060547, 5.880315780639648, 8.068325996398926, 10.256336212158203, 12.444347381591797, 14.63235855102539, 16.820369720458984, 19.008378982543945, 21.19639015197754, 23.384401321411133, 25.572410583496094, 27.760421752929688, 29.94842529296875, 32.136436462402344, 34.32444763183594, 36.51245880126953, 38.700469970703125, 40.88848114013672, 43.07648849487305, 45.26449966430664, 47.452510833740234, 49.64052200317383, 51.82853317260742, 54.016544342041016, 56.204551696777344, 58.39256286621094, 60.58057403564453, 62.768585205078125, 64.95659637451172, 67.14460754394531, 69.3326187133789, 71.5206298828125, 73.7086410522461, 75.89665222167969, 78.08466339111328, 80.27267456054688, 82.46067810058594, 84.64868927001953, 86.83670043945312, 89.02471160888672, 91.21272277832031, 93.4007339477539, 95.5887451171875, 97.77674865722656, 99.96476745605469]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 7.0, 3.0, 3.0, 2.0, 5.0, 12.0, 8.0, 8.0, 19.0, 18.0, 19.0, 29.0, 22.0, 25.0, 26.0, 27.0, 45.0, 33.0, 32.0, 31.0, 40.0, 33.0, 42.0, 37.0, 41.0, 39.0, 41.0, 40.0, 34.0, 29.0, 32.0, 24.0, 23.0, 25.0, 22.0, 22.0, 24.0, 16.0, 20.0, 17.0, 9.0, 8.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-37.983272552490234, -36.90467071533203, -35.82606887817383, -34.747467041015625, -33.66886520385742, -32.59026336669922, -31.51166343688965, -30.433061599731445, -29.354459762573242, -28.27585792541504, -27.197256088256836, -26.118654251098633, -25.040054321289062, -23.96145248413086, -22.882850646972656, -21.804248809814453, -20.72564697265625, -19.647045135498047, -18.568443298339844, -17.48984146118164, -16.411239624023438, -15.33263874053955, -14.254037857055664, -13.175436019897461, -12.096834182739258, -11.018232345581055, -9.939630508422852, -8.861029624938965, -7.782427787780762, -6.703825950622559, -5.625224590301514, -4.546623229980469, -3.4680233001708984, -2.3894217014312744, -1.3108201026916504, -0.23221850395202637, 0.8463830947875977, 1.9249849319458008, 3.0035862922668457, 4.082187652587891, 5.160789489746094, 6.239391326904297, 7.317992687225342, 8.396594047546387, 9.47519588470459, 10.553797721862793, 11.63239860534668, 12.711000442504883, 13.789602279663086, 14.868204116821289, 15.946805953979492, 17.025407791137695, 18.104007720947266, 19.18260955810547, 20.261211395263672, 21.339813232421875, 22.418415069580078, 23.49701690673828, 24.575618743896484, 25.654220581054688, 26.73282241821289, 27.811424255371094, 28.890024185180664, 29.968626022338867, 31.04722785949707]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 7.0, 13.0, 10.0, 20.0, 26.0, 24.0, 36.0, 28.0, 28.0, 33.0, 49.0, 41.0, 51.0, 48.0, 47.0, 45.0, 50.0, 46.0, 48.0, 49.0, 42.0, 35.0, 38.0, 28.0, 33.0, 19.0, 24.0, 20.0, 22.0, 10.0, 12.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.3125, -70.7421875, -68.171875, -65.6015625, -63.03125, -60.4609375, -57.890625, -55.3203125, -52.75, -50.1796875, -47.609375, -45.0390625, -42.46875, -39.8984375, -37.328125, -34.7578125, -32.1875, -29.6171875, -27.046875, -24.4765625, -21.90625, -19.3359375, -16.765625, -14.1953125, -11.625, -9.0546875, -6.484375, -3.9140625, -1.34375, 1.2265625, 3.796875, 6.3671875, 8.9375, 11.5078125, 14.078125, 16.6484375, 19.21875, 21.7890625, 24.359375, 26.9296875, 29.5, 32.0703125, 34.640625, 37.2109375, 39.78125, 42.3515625, 44.921875, 47.4921875, 50.0625, 52.6328125, 55.203125, 57.7734375, 60.34375, 62.9140625, 65.484375, 68.0546875, 70.625, 73.1953125, 75.765625, 78.3359375, 80.90625, 83.4765625, 86.046875, 88.6171875, 91.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 12.0, 12.0, 24.0, 27.0, 38.0, 64.0, 118.0, 160.0, 230.0, 392.0, 633.0, 981.0, 1513.0, 2399.0, 3929.0, 6318.0, 10210.0, 16272.0, 26228.0, 42466.0, 68061.0, 105964.0, 149582.0, 173010.0, 151183.0, 106881.0, 69164.0, 42496.0, 26534.0, 16324.0, 10168.0, 6352.0, 3999.0, 2503.0, 1537.0, 1045.0, 603.0, 402.0, 243.0, 170.0, 94.0, 79.0, 46.0, 27.0, 22.0, 11.0, 11.0, 8.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.62109375, -3.502410888671875, -3.38372802734375, -3.265045166015625, -3.1463623046875, -3.027679443359375, -2.90899658203125, -2.790313720703125, -2.671630859375, -2.552947998046875, -2.43426513671875, -2.315582275390625, -2.1968994140625, -2.078216552734375, -1.95953369140625, -1.840850830078125, -1.72216796875, -1.603485107421875, -1.48480224609375, -1.366119384765625, -1.2474365234375, -1.128753662109375, -1.01007080078125, -0.891387939453125, -0.772705078125, -0.654022216796875, -0.53533935546875, -0.416656494140625, -0.2979736328125, -0.179290771484375, -0.06060791015625, 0.058074951171875, 0.1767578125, 0.295440673828125, 0.41412353515625, 0.532806396484375, 0.6514892578125, 0.770172119140625, 0.88885498046875, 1.007537841796875, 1.126220703125, 1.244903564453125, 1.36358642578125, 1.482269287109375, 1.6009521484375, 1.719635009765625, 1.83831787109375, 1.957000732421875, 2.07568359375, 2.194366455078125, 2.31304931640625, 2.431732177734375, 2.5504150390625, 2.669097900390625, 2.78778076171875, 2.906463623046875, 3.025146484375, 3.143829345703125, 3.26251220703125, 3.381195068359375, 3.4998779296875, 3.618560791015625, 3.73724365234375, 3.855926513671875, 3.974609375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 6.0, 8.0, 10.0, 11.0, 16.0, 21.0, 21.0, 30.0, 25.0, 27.0, 34.0, 37.0, 37.0, 41.0, 50.0, 41.0, 52.0, 1073.0, 53.0, 49.0, 32.0, 37.0, 37.0, 31.0, 29.0, 37.0, 35.0, 21.0, 14.0, 16.0, 16.0, 14.0, 13.0, 7.0, 9.0, 8.0, 5.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.5, -40.0810546875, -38.662109375, -37.2431640625, -35.82421875, -34.4052734375, -32.986328125, -31.5673828125, -30.1484375, -28.7294921875, -27.310546875, -25.8916015625, -24.47265625, -23.0537109375, -21.634765625, -20.2158203125, -18.796875, -17.3779296875, -15.958984375, -14.5400390625, -13.12109375, -11.7021484375, -10.283203125, -8.8642578125, -7.4453125, -6.0263671875, -4.607421875, -3.1884765625, -1.76953125, -0.3505859375, 1.068359375, 2.4873046875, 3.90625, 5.3251953125, 6.744140625, 8.1630859375, 9.58203125, 11.0009765625, 12.419921875, 13.8388671875, 15.2578125, 16.6767578125, 18.095703125, 19.5146484375, 20.93359375, 22.3525390625, 23.771484375, 25.1904296875, 26.609375, 28.0283203125, 29.447265625, 30.8662109375, 32.28515625, 33.7041015625, 35.123046875, 36.5419921875, 37.9609375, 39.3798828125, 40.798828125, 42.2177734375, 43.63671875, 45.0556640625, 46.474609375, 47.8935546875, 49.3125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 16.0, 17.0, 27.0, 28.0, 52.0, 69.0, 107.0, 166.0, 287.0, 447.0, 646.0, 1021.0, 1643.0, 2606.0, 4094.0, 6468.0, 9820.0, 15428.0, 24587.0, 37857.0, 57877.0, 86268.0, 121275.0, 401902.0, 945763.0, 122721.0, 88371.0, 59516.0, 38924.0, 25076.0, 15838.0, 10165.0, 6360.0, 4177.0, 2664.0, 1670.0, 1124.0, 689.0, 492.0, 309.0, 203.0, 113.0, 85.0, 61.0, 40.0, 20.0, 13.0, 12.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.96484375, -2.872283935546875, -2.77972412109375, -2.687164306640625, -2.5946044921875, -2.502044677734375, -2.40948486328125, -2.316925048828125, -2.224365234375, -2.131805419921875, -2.03924560546875, -1.946685791015625, -1.8541259765625, -1.761566162109375, -1.66900634765625, -1.576446533203125, -1.48388671875, -1.391326904296875, -1.29876708984375, -1.206207275390625, -1.1136474609375, -1.021087646484375, -0.92852783203125, -0.835968017578125, -0.743408203125, -0.650848388671875, -0.55828857421875, -0.465728759765625, -0.3731689453125, -0.280609130859375, -0.18804931640625, -0.095489501953125, -0.0029296875, 0.089630126953125, 0.18218994140625, 0.274749755859375, 0.3673095703125, 0.459869384765625, 0.55242919921875, 0.644989013671875, 0.737548828125, 0.830108642578125, 0.92266845703125, 1.015228271484375, 1.1077880859375, 1.200347900390625, 1.29290771484375, 1.385467529296875, 1.47802734375, 1.570587158203125, 1.66314697265625, 1.755706787109375, 1.8482666015625, 1.940826416015625, 2.03338623046875, 2.125946044921875, 2.218505859375, 2.311065673828125, 2.40362548828125, 2.496185302734375, 2.5887451171875, 2.681304931640625, 2.77386474609375, 2.866424560546875, 2.958984375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 7.0, 3.0, 9.0, 4.0, 9.0, 14.0, 17.0, 25.0, 26.0, 25.0, 26.0, 23.0, 36.0, 38.0, 56.0, 51.0, 47.0, 59.0, 48.0, 61.0, 50.0, 45.0, 48.0, 51.0, 39.0, 33.0, 33.0, 29.0, 18.0, 13.0, 14.0, 9.0, 6.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.033233642578125, -0.03231477737426758, -0.031395912170410156, -0.030477046966552734, -0.029558181762695312, -0.02863931655883789, -0.02772045135498047, -0.026801586151123047, -0.025882720947265625, -0.024963855743408203, -0.02404499053955078, -0.02312612533569336, -0.022207260131835938, -0.021288394927978516, -0.020369529724121094, -0.019450664520263672, -0.01853179931640625, -0.017612934112548828, -0.016694068908691406, -0.015775203704833984, -0.014856338500976562, -0.01393747329711914, -0.013018608093261719, -0.012099742889404297, -0.011180877685546875, -0.010262012481689453, -0.009343147277832031, -0.00842428207397461, -0.0075054168701171875, -0.006586551666259766, -0.005667686462402344, -0.004748821258544922, -0.0038299560546875, -0.002911090850830078, -0.0019922256469726562, -0.0010733604431152344, -0.0001544952392578125, 0.0007643699645996094, 0.0016832351684570312, 0.002602100372314453, 0.003520965576171875, 0.004439830780029297, 0.005358695983886719, 0.006277561187744141, 0.0071964263916015625, 0.008115291595458984, 0.009034156799316406, 0.009953022003173828, 0.01087188720703125, 0.011790752410888672, 0.012709617614746094, 0.013628482818603516, 0.014547348022460938, 0.01546621322631836, 0.01638507843017578, 0.017303943634033203, 0.018222808837890625, 0.019141674041748047, 0.02006053924560547, 0.02097940444946289, 0.021898269653320312, 0.022817134857177734, 0.023736000061035156, 0.024654865264892578, 0.02557373046875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 14.0, 14.0, 10.0, 13.0, 38.0, 21.0, 35.0, 61.0, 85.0, 131.0, 203.0, 308.0, 603.0, 1085.0, 2011.0, 3816.0, 8029.0, 17812.0, 45088.0, 121683.0, 330365.0, 322748.0, 117817.0, 42983.0, 17442.0, 7820.0, 3734.0, 1995.0, 1068.0, 553.0, 317.0, 193.0, 154.0, 85.0, 50.0, 42.0, 38.0, 30.0, 16.0, 13.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.1579303741455078, -0.15228652954101562, -0.14664268493652344, -0.14099884033203125, -0.13535499572753906, -0.12971115112304688, -0.12406730651855469, -0.1184234619140625, -0.11277961730957031, -0.10713577270507812, -0.10149192810058594, -0.09584808349609375, -0.09020423889160156, -0.08456039428710938, -0.07891654968261719, -0.073272705078125, -0.06762886047363281, -0.061985015869140625, -0.05634117126464844, -0.05069732666015625, -0.04505348205566406, -0.039409637451171875, -0.03376579284667969, -0.0281219482421875, -0.022478103637695312, -0.016834259033203125, -0.011190414428710938, -0.00554656982421875, 9.72747802734375e-05, 0.005741119384765625, 0.011384963989257812, 0.01702880859375, 0.022672653198242188, 0.028316497802734375, 0.03396034240722656, 0.03960418701171875, 0.04524803161621094, 0.050891876220703125, 0.05653572082519531, 0.0621795654296875, 0.06782341003417969, 0.07346725463867188, 0.07911109924316406, 0.08475494384765625, 0.09039878845214844, 0.09604263305664062, 0.10168647766113281, 0.107330322265625, 0.11297416687011719, 0.11861801147460938, 0.12426185607910156, 0.12990570068359375, 0.13554954528808594, 0.14119338989257812, 0.1468372344970703, 0.1524810791015625, 0.1581249237060547, 0.16376876831054688, 0.16941261291503906, 0.17505645751953125, 0.18070030212402344, 0.18634414672851562, 0.1919879913330078, 0.1976318359375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 13.0, 7.0, 11.0, 22.0, 53.0, 63.0, 64.0, 86.0, 113.0, 122.0, 115.0, 90.0, 76.0, 55.0, 32.0, 25.0, 10.0, 9.0, 16.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.08668020367622375, -0.08447448909282684, -0.08226878196001053, -0.08006306737661362, -0.0778573527932167, -0.07565164566040039, -0.07344593107700348, -0.07124021649360657, -0.06903450936079025, -0.06682879477739334, -0.06462308764457703, -0.062417373061180115, -0.0602116622030735, -0.05800595134496689, -0.05580023676156998, -0.053594525903463364, -0.05138881132006645, -0.04918310046195984, -0.04697738587856293, -0.044771675020456314, -0.0425659641623497, -0.04036024957895279, -0.038154538720846176, -0.03594882786273956, -0.03374311327934265, -0.03153740242123604, -0.029331689700484276, -0.027125976979732513, -0.0249202661216259, -0.022714553400874138, -0.020508840680122375, -0.018303129822015762, -0.016097422689199448, -0.01389171089977026, -0.011685999110341072, -0.00948028638958931, -0.007274574600160122, -0.005068862810730934, -0.0028631500899791718, -0.000657438300549984, 0.0015482734888792038, 0.0037539855111390352, 0.005959697533398867, 0.008165409788489342, 0.01037112157791853, 0.012576833367347717, 0.01478254608809948, 0.016988258808851242, 0.019193969666957855, 0.021399682387709618, 0.02360539324581623, 0.025811105966567993, 0.028016816824674606, 0.03022252954542637, 0.03242824226617813, 0.034633953124284744, 0.03683966398239136, 0.03904537484049797, 0.04125108942389488, 0.043456800282001495, 0.04566251114010811, 0.04786822199821472, 0.05007393658161163, 0.052279647439718246, 0.05448536202311516]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 10.0, 12.0, 14.0, 10.0, 16.0, 19.0, 16.0, 20.0, 25.0, 28.0, 29.0, 27.0, 36.0, 46.0, 41.0, 33.0, 30.0, 47.0, 39.0, 59.0, 57.0, 37.0, 34.0, 36.0, 43.0, 32.0, 28.0, 20.0, 22.0, 15.0, 21.0, 18.0, 13.0, 11.0, 10.0, 8.0, 7.0, 9.0, 6.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.02265644073486328, -0.02202192321419716, -0.021387403830885887, -0.020752884447574615, -0.020118366926908493, -0.01948384940624237, -0.0188493300229311, -0.018214810639619827, -0.017580293118953705, -0.016945775598287582, -0.01631125621497631, -0.01567673683166504, -0.015042219310998917, -0.01440770085901022, -0.013773182407021523, -0.013138663955032825, -0.012504145503044128, -0.011869627051055431, -0.011235108599066734, -0.010600590147078037, -0.00996607169508934, -0.009331553243100643, -0.008697034791111946, -0.008062516339123249, -0.007427997887134552, -0.006793479435145855, -0.006158960983157158, -0.005524442531168461, -0.004889924079179764, -0.004255405627191067, -0.0036208871752023697, -0.0029863687232136726, -0.0023518502712249756, -0.0017173318192362785, -0.0010828133672475815, -0.00044829491525888443, 0.00018622353672981262, 0.0008207419887185097, 0.0014552604407072067, 0.0020897788926959038, 0.002724297344684601, 0.003358815796673298, 0.003993334248661995, 0.004627852700650692, 0.005262371152639389, 0.005896889604628086, 0.006531408056616783, 0.00716592650860548, 0.007800444960594177, 0.008434963412582874, 0.009069481864571571, 0.009704000316560268, 0.010338518768548965, 0.010973037220537663, 0.01160755567252636, 0.012242074124515057, 0.012876592576503754, 0.01351111102849245, 0.014145629480481148, 0.014780147932469845, 0.015414666384458542, 0.016049183905124664, 0.016683703288435936, 0.017318222671747208, 0.01795274019241333]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 13.0, 10.0, 20.0, 24.0, 28.0, 33.0, 29.0, 28.0, 33.0, 49.0, 41.0, 51.0, 48.0, 48.0, 45.0, 48.0, 46.0, 50.0, 48.0, 40.0, 38.0, 37.0, 28.0, 34.0, 19.0, 23.0, 20.0, 21.0, 10.0, 13.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.3125, -70.7421875, -68.171875, -65.6015625, -63.03125, -60.4609375, -57.890625, -55.3203125, -52.75, -50.1796875, -47.609375, -45.0390625, -42.46875, -39.8984375, -37.328125, -34.7578125, -32.1875, -29.6171875, -27.046875, -24.4765625, -21.90625, -19.3359375, -16.765625, -14.1953125, -11.625, -9.0546875, -6.484375, -3.9140625, -1.34375, 1.2265625, 3.796875, 6.3671875, 8.9375, 11.5078125, 14.078125, 16.6484375, 19.21875, 21.7890625, 24.359375, 26.9296875, 29.5, 32.0703125, 34.640625, 37.2109375, 39.78125, 42.3515625, 44.921875, 47.4921875, 50.0625, 52.6328125, 55.203125, 57.7734375, 60.34375, 62.9140625, 65.484375, 68.0546875, 70.625, 73.1953125, 75.765625, 78.3359375, 80.90625, 83.4765625, 86.046875, 88.6171875, 91.1875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 19.0, 13.0, 26.0, 37.0, 67.0, 77.0, 142.0, 230.0, 391.0, 680.0, 1378.0, 3771.0, 15009.0, 104295.0, 587060.0, 287742.0, 36329.0, 6846.0, 2161.0, 981.0, 525.0, 286.0, 176.0, 88.0, 86.0, 44.0, 33.0, 16.0, 12.0, 11.0, 6.0, 4.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -11.97412109375, -11.5263671875, -11.07861328125, -10.630859375, -10.18310546875, -9.7353515625, -9.28759765625, -8.83984375, -8.39208984375, -7.9443359375, -7.49658203125, -7.048828125, -6.60107421875, -6.1533203125, -5.70556640625, -5.2578125, -4.81005859375, -4.3623046875, -3.91455078125, -3.466796875, -3.01904296875, -2.5712890625, -2.12353515625, -1.67578125, -1.22802734375, -0.7802734375, -0.33251953125, 0.115234375, 0.56298828125, 1.0107421875, 1.45849609375, 1.90625, 2.35400390625, 2.8017578125, 3.24951171875, 3.697265625, 4.14501953125, 4.5927734375, 5.04052734375, 5.48828125, 5.93603515625, 6.3837890625, 6.83154296875, 7.279296875, 7.72705078125, 8.1748046875, 8.62255859375, 9.0703125, 9.51806640625, 9.9658203125, 10.41357421875, 10.861328125, 11.30908203125, 11.7568359375, 12.20458984375, 12.65234375, 13.10009765625, 13.5478515625, 13.99560546875, 14.443359375, 14.89111328125, 15.3388671875, 15.78662109375, 16.234375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 11.0, 20.0, 42.0, 70.0, 125.0, 138.0, 2205.0, 160.0, 113.0, 75.0, 42.0, 20.0, 12.0, 4.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-337.75, -327.69921875, -317.6484375, -307.59765625, -297.546875, -287.49609375, -277.4453125, -267.39453125, -257.34375, -247.29296875, -237.2421875, -227.19140625, -217.140625, -207.08984375, -197.0390625, -186.98828125, -176.9375, -166.88671875, -156.8359375, -146.78515625, -136.734375, -126.68359375, -116.6328125, -106.58203125, -96.53125, -86.48046875, -76.4296875, -66.37890625, -56.328125, -46.27734375, -36.2265625, -26.17578125, -16.125, -6.07421875, 3.9765625, 14.02734375, 24.078125, 34.12890625, 44.1796875, 54.23046875, 64.28125, 74.33203125, 84.3828125, 94.43359375, 104.484375, 114.53515625, 124.5859375, 134.63671875, 144.6875, 154.73828125, 164.7890625, 174.83984375, 184.890625, 194.94140625, 204.9921875, 215.04296875, 225.09375, 235.14453125, 245.1953125, 255.24609375, 265.296875, 275.34765625, 285.3984375, 295.44921875, 305.5]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 7.0, 7.0, 9.0, 12.0, 19.0, 23.0, 40.0, 49.0, 100.0, 261.0, 648.0, 1910.0, 16043.0, 3075301.0, 47064.0, 2768.0, 800.0, 323.0, 123.0, 78.0, 46.0, 20.0, 17.0, 10.0, 5.0, 8.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.625, -39.2978515625, -37.970703125, -36.6435546875, -35.31640625, -33.9892578125, -32.662109375, -31.3349609375, -30.0078125, -28.6806640625, -27.353515625, -26.0263671875, -24.69921875, -23.3720703125, -22.044921875, -20.7177734375, -19.390625, -18.0634765625, -16.736328125, -15.4091796875, -14.08203125, -12.7548828125, -11.427734375, -10.1005859375, -8.7734375, -7.4462890625, -6.119140625, -4.7919921875, -3.46484375, -2.1376953125, -0.810546875, 0.5166015625, 1.84375, 3.1708984375, 4.498046875, 5.8251953125, 7.15234375, 8.4794921875, 9.806640625, 11.1337890625, 12.4609375, 13.7880859375, 15.115234375, 16.4423828125, 17.76953125, 19.0966796875, 20.423828125, 21.7509765625, 23.078125, 24.4052734375, 25.732421875, 27.0595703125, 28.38671875, 29.7138671875, 31.041015625, 32.3681640625, 33.6953125, 35.0224609375, 36.349609375, 37.6767578125, 39.00390625, 40.3310546875, 41.658203125, 42.9853515625, 44.3125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 13.0, 26.0, 85.0, 212.0, 356.0, 202.0, 58.0, 19.0, 13.0, 5.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-240.0777587890625, -229.2676544189453, -218.4575653076172, -207.6474609375, -196.83737182617188, -186.0272674560547, -175.2171630859375, -164.40707397460938, -153.59698486328125, -142.78688049316406, -131.97679138183594, -121.16668701171875, -110.35659790039062, -99.54649353027344, -88.73639678955078, -77.92630004882812, -67.11619567871094, -56.30609893798828, -45.496002197265625, -34.6859016418457, -23.875804901123047, -13.06570816040039, -2.2556076049804688, 8.554489135742188, 19.364585876464844, 30.1746826171875, 40.984779357910156, 51.79487991333008, 62.604976654052734, 73.41506958007812, 84.22517395019531, 95.03527069091797, 105.84536743164062, 116.65546417236328, 127.46556091308594, 138.27566528320312, 149.08575439453125, 159.89585876464844, 170.70596313476562, 181.51605224609375, 192.32614135742188, 203.13624572753906, 213.9463348388672, 224.75643920898438, 235.5665283203125, 246.3766326904297, 257.1867370605469, 267.996826171875, 278.80694580078125, 289.6170349121094, 300.4271545410156, 311.23724365234375, 322.0473327636719, 332.857421875, 343.66754150390625, 354.4776306152344, 365.2877197265625, 376.0978088378906, 386.9079284667969, 397.718017578125, 408.5281066894531, 419.33819580078125, 430.1483154296875, 440.9584045410156, 451.76849365234375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 5.0, 4.0, 5.0, 7.0, 9.0, 10.0, 18.0, 22.0, 25.0, 17.0, 28.0, 31.0, 34.0, 31.0, 34.0, 41.0, 41.0, 41.0, 52.0, 40.0, 30.0, 35.0, 43.0, 39.0, 41.0, 37.0, 36.0, 30.0, 46.0, 26.0, 21.0, 21.0, 18.0, 14.0, 14.0, 13.0, 13.0, 5.0, 2.0, 8.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-129.8126983642578, -125.88247680664062, -121.95225524902344, -118.02203369140625, -114.09181213378906, -110.16159057617188, -106.23136901855469, -102.3011474609375, -98.37092590332031, -94.44070434570312, -90.51048278808594, -86.58026123046875, -82.65003967285156, -78.71981811523438, -74.78959655761719, -70.859375, -66.92914581298828, -62.998924255371094, -59.068702697753906, -55.13848114013672, -51.20825958251953, -47.278038024902344, -43.34781265258789, -39.4175910949707, -35.487369537353516, -31.557147979736328, -27.62692642211914, -23.69670295715332, -19.766481399536133, -15.836259841918945, -11.906036376953125, -7.9758148193359375, -4.04559326171875, -0.1153712272644043, 3.8148508071899414, 7.745073318481445, 11.675294876098633, 15.60551643371582, 19.53573989868164, 23.465961456298828, 27.396183013916016, 31.326404571533203, 35.25662612915039, 39.186851501464844, 43.11707305908203, 47.04729461669922, 50.977516174316406, 54.907737731933594, 58.83795928955078, 62.76818084716797, 66.69840240478516, 70.62862396240234, 74.55884552001953, 78.48906707763672, 82.41929626464844, 86.34951782226562, 90.27973937988281, 94.2099609375, 98.14018249511719, 102.07040405273438, 106.00062561035156, 109.93084716796875, 113.86106872558594, 117.79129028320312, 121.72151184082031]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 8.0, 9.0, 13.0, 14.0, 21.0, 21.0, 41.0, 55.0, 62.0, 115.0, 148.0, 192.0, 261.0, 436.0, 578.0, 826.0, 1336.0, 1927.0, 2842.0, 4064.0, 5575.0, 1007423.0, 6900.0, 4650.0, 3526.0, 2424.0, 1637.0, 1094.0, 695.0, 462.0, 345.0, 233.0, 179.0, 119.0, 77.0, 66.0, 42.0, 37.0, 21.0, 25.0, 11.0, 9.0, 7.0, 5.0, 10.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.909204483032227, -18.228309631347656, -17.54741668701172, -16.86652183532715, -16.185626983642578, -15.504732131958008, -14.823838233947754, -14.1429443359375, -13.46204948425293, -12.78115463256836, -12.100260734558105, -11.419366836547852, -10.738471984863281, -10.057577133178711, -9.376683235168457, -8.695789337158203, -8.014894485473633, -7.334000110626221, -6.653105735778809, -5.9722113609313965, -5.291316986083984, -4.610422611236572, -3.92952823638916, -3.248633861541748, -2.567739486694336, -1.8868451118469238, -1.2059507369995117, -0.5250563621520996, 0.1558380126953125, 0.8367323875427246, 1.5176267623901367, 2.198521137237549, 2.879413604736328, 3.5603079795837402, 4.241202354431152, 4.9220967292785645, 5.602991104125977, 6.283885478973389, 6.964779853820801, 7.645674228668213, 8.326568603515625, 9.007463455200195, 9.68835735321045, 10.369251251220703, 11.050146102905273, 11.731040954589844, 12.411934852600098, 13.092828750610352, 13.773723602294922, 14.454618453979492, 15.135512351989746, 15.81640625, 16.49730110168457, 17.17819595336914, 17.859088897705078, 18.53998374938965, 19.22087860107422, 19.90177345275879, 20.58266830444336, 21.263561248779297, 21.944456100463867, 22.625350952148438, 23.306243896484375, 23.987138748168945, 24.668033599853516]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 8.0, 5.0, 6.0, 8.0, 16.0, 16.0, 39.0, 63.0, 68.0, 119.0, 157.0, 1346.0, 51460764.0, 322.0, 84.0, 38.0, 27.0, 20.0, 13.0, 11.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2445.1943359375, -2361.688720703125, -2278.18310546875, -2194.677734375, -2111.172119140625, -2027.66650390625, -1944.160888671875, -1860.6552734375, -1777.149658203125, -1693.64404296875, -1610.1385498046875, -1526.6329345703125, -1443.1273193359375, -1359.621826171875, -1276.1162109375, -1192.610595703125, -1109.1051025390625, -1025.5994873046875, -942.0939331054688, -858.58837890625, -775.082763671875, -691.5772094726562, -608.0716552734375, -524.5660400390625, -441.06048583984375, -357.5549011230469, -274.04931640625, -190.54376220703125, -107.03817749023438, -23.5325927734375, 59.97296142578125, 143.47857666015625, 226.984130859375, 310.4897155761719, 393.99530029296875, 477.5008544921875, 561.0064697265625, 644.5120239257812, 728.017578125, 811.523193359375, 895.0287475585938, 978.5343017578125, 1062.0399169921875, 1145.54541015625, 1229.051025390625, 1312.556640625, 1396.062255859375, 1479.56787109375, 1563.0733642578125, 1646.5789794921875, 1730.08447265625, 1813.590087890625, 1897.095703125, 1980.601318359375, 2064.10693359375, 2147.6123046875, 2231.117919921875, 2314.62353515625, 2398.129150390625, 2481.634765625, 2565.14013671875, 2648.645751953125, 2732.1513671875, 2815.656982421875, 2899.16259765625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 9.0, 15.0, 18.0, 29.0, 27.0, 60.0, 91.0, 128.0, 163.0, 287.0, 425.0, 654.0, 920.0, 1339.0, 2146.0, 3209.0, 4882.0, 7397.0, 11532.0, 17614.0, 27573.0, 43233.0, 67334.0, 102979.0, 157755.0, 232117.0, 322172.0, 453428.0, 3509510.0, 400240.0, 301687.0, 213038.0, 144275.0, 94264.0, 59960.0, 39072.0, 25499.0, 16031.0, 10647.0, 6665.0, 4365.0, 2895.0, 1860.0, 1389.0, 842.0, 528.0, 376.0, 241.0, 159.0, 113.0, 79.0, 54.0, 47.0, 20.0, 15.0, 15.0, 7.0, 8.0, 4.0, 3.0, 4.0], "bins": [-0.89208984375, -0.8636703491210938, -0.8352508544921875, -0.8068313598632812, -0.778411865234375, -0.7499923706054688, -0.7215728759765625, -0.6931533813476562, -0.66473388671875, -0.6363143920898438, -0.6078948974609375, -0.5794754028320312, -0.551055908203125, -0.5226364135742188, -0.4942169189453125, -0.46579742431640625, -0.4373779296875, -0.40895843505859375, -0.3805389404296875, -0.35211944580078125, -0.323699951171875, -0.29528045654296875, -0.2668609619140625, -0.23844146728515625, -0.21002197265625, -0.18160247802734375, -0.1531829833984375, -0.12476348876953125, -0.096343994140625, -0.06792449951171875, -0.0395050048828125, -0.01108551025390625, 0.017333984375, 0.04575347900390625, 0.0741729736328125, 0.10259246826171875, 0.131011962890625, 0.15943145751953125, 0.1878509521484375, 0.21627044677734375, 0.24468994140625, 0.27310943603515625, 0.3015289306640625, 0.32994842529296875, 0.358367919921875, 0.38678741455078125, 0.4152069091796875, 0.44362640380859375, 0.4720458984375, 0.5004653930664062, 0.5288848876953125, 0.5573043823242188, 0.585723876953125, 0.6141433715820312, 0.6425628662109375, 0.6709823608398438, 0.69940185546875, 0.7278213500976562, 0.7562408447265625, 0.7846603393554688, 0.813079833984375, 0.8414993286132812, 0.8699188232421875, 0.8983383178710938, 0.9267578125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 13.0, 15.0, 12.0, 9.0, 10.0, 24.0, 23.0, 37.0, 29.0, 33.0, 37.0, 33.0, 39.0, 35.0, 32.0, 39.0, 46.0, 944.0, 149.0, 51.0, 32.0, 35.0, 28.0, 36.0, 24.0, 35.0, 29.0, 34.0, 21.0, 27.0, 16.0, 13.0, 12.0, 6.0, 9.0, 6.0, 5.0, 5.0, 7.0, 2.0, 0.0, 8.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.6484375, -13.2047119140625, -12.760986328125, -12.3172607421875, -11.87353515625, -11.4298095703125, -10.986083984375, -10.5423583984375, -10.0986328125, -9.6549072265625, -9.211181640625, -8.7674560546875, -8.32373046875, -7.8800048828125, -7.436279296875, -6.9925537109375, -6.548828125, -6.1051025390625, -5.661376953125, -5.2176513671875, -4.77392578125, -4.3302001953125, -3.886474609375, -3.4427490234375, -2.9990234375, -2.5552978515625, -2.111572265625, -1.6678466796875, -1.22412109375, -0.7803955078125, -0.336669921875, 0.1070556640625, 0.55078125, 0.9945068359375, 1.438232421875, 1.8819580078125, 2.32568359375, 2.7694091796875, 3.213134765625, 3.6568603515625, 4.1005859375, 4.5443115234375, 4.988037109375, 5.4317626953125, 5.87548828125, 6.3192138671875, 6.762939453125, 7.2066650390625, 7.650390625, 8.0941162109375, 8.537841796875, 8.9815673828125, 9.42529296875, 9.8690185546875, 10.312744140625, 10.7564697265625, 11.2001953125, 11.6439208984375, 12.087646484375, 12.5313720703125, 12.97509765625, 13.4188232421875, 13.862548828125, 14.3062744140625, 14.75]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 13.0, 13.0, 16.0, 29.0, 40.0, 46.0, 88.0, 156.0, 237.0, 436.0, 795.0, 1443.0, 2307.0, 4162.0, 7675.0, 14216.0, 26195.0, 48603.0, 88423.0, 158364.0, 272585.0, 426275.0, 2694252.0, 1541920.0, 411326.0, 258635.0, 150296.0, 83383.0, 45196.0, 24190.0, 13157.0, 7306.0, 4000.0, 2309.0, 1400.0, 765.0, 445.0, 247.0, 178.0, 109.0, 70.0, 43.0, 38.0, 18.0, 15.0, 9.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.1572265625, -1.124114990234375, -1.09100341796875, -1.057891845703125, -1.0247802734375, -0.991668701171875, -0.95855712890625, -0.925445556640625, -0.892333984375, -0.859222412109375, -0.82611083984375, -0.792999267578125, -0.7598876953125, -0.726776123046875, -0.69366455078125, -0.660552978515625, -0.62744140625, -0.594329833984375, -0.56121826171875, -0.528106689453125, -0.4949951171875, -0.461883544921875, -0.42877197265625, -0.395660400390625, -0.362548828125, -0.329437255859375, -0.29632568359375, -0.263214111328125, -0.2301025390625, -0.196990966796875, -0.16387939453125, -0.130767822265625, -0.09765625, -0.064544677734375, -0.03143310546875, 0.001678466796875, 0.0347900390625, 0.067901611328125, 0.10101318359375, 0.134124755859375, 0.167236328125, 0.200347900390625, 0.23345947265625, 0.266571044921875, 0.2996826171875, 0.332794189453125, 0.36590576171875, 0.399017333984375, 0.43212890625, 0.465240478515625, 0.49835205078125, 0.531463623046875, 0.5645751953125, 0.597686767578125, 0.63079833984375, 0.663909912109375, 0.697021484375, 0.730133056640625, 0.76324462890625, 0.796356201171875, 0.8294677734375, 0.862579345703125, 0.89569091796875, 0.928802490234375, 0.9619140625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 6.0, 7.0, 10.0, 11.0, 15.0, 16.0, 18.0, 11.0, 11.0, 18.0, 43.0, 39.0, 35.0, 40.0, 52.0, 34.0, 39.0, 50.0, 996.0, 113.0, 55.0, 42.0, 36.0, 43.0, 31.0, 42.0, 30.0, 29.0, 24.0, 27.0, 16.0, 15.0, 13.0, 9.0, 8.0, 6.0, 4.0, 4.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.078125, -10.705810546875, -10.33349609375, -9.961181640625, -9.5888671875, -9.216552734375, -8.84423828125, -8.471923828125, -8.099609375, -7.727294921875, -7.35498046875, -6.982666015625, -6.6103515625, -6.238037109375, -5.86572265625, -5.493408203125, -5.12109375, -4.748779296875, -4.37646484375, -4.004150390625, -3.6318359375, -3.259521484375, -2.88720703125, -2.514892578125, -2.142578125, -1.770263671875, -1.39794921875, -1.025634765625, -0.6533203125, -0.281005859375, 0.09130859375, 0.463623046875, 0.8359375, 1.208251953125, 1.58056640625, 1.952880859375, 2.3251953125, 2.697509765625, 3.06982421875, 3.442138671875, 3.814453125, 4.186767578125, 4.55908203125, 4.931396484375, 5.3037109375, 5.676025390625, 6.04833984375, 6.420654296875, 6.79296875, 7.165283203125, 7.53759765625, 7.909912109375, 8.2822265625, 8.654541015625, 9.02685546875, 9.399169921875, 9.771484375, 10.143798828125, 10.51611328125, 10.888427734375, 11.2607421875, 11.633056640625, 12.00537109375, 12.377685546875, 12.75]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 9.0, 5.0, 9.0, 10.0, 22.0, 20.0, 40.0, 42.0, 76.0, 101.0, 134.0, 157.0, 223.0, 322.0, 510.0, 692.0, 949.0, 1587.0, 2343.0, 4126.0, 7290.0, 13407.0, 25790.0, 52794.0, 114885.0, 5653950.0, 240882.0, 84559.0, 40380.0, 19985.0, 10314.0, 5898.0, 3446.0, 2159.0, 1342.0, 872.0, 583.0, 407.0, 315.0, 233.0, 171.0, 94.0, 74.0, 67.0, 50.0, 40.0, 17.0, 17.0, 16.0, 2.0, 2.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.060546875, -2.96435546875, -2.8681640625, -2.77197265625, -2.67578125, -2.57958984375, -2.4833984375, -2.38720703125, -2.291015625, -2.19482421875, -2.0986328125, -2.00244140625, -1.90625, -1.81005859375, -1.7138671875, -1.61767578125, -1.521484375, -1.42529296875, -1.3291015625, -1.23291015625, -1.13671875, -1.04052734375, -0.9443359375, -0.84814453125, -0.751953125, -0.65576171875, -0.5595703125, -0.46337890625, -0.3671875, -0.27099609375, -0.1748046875, -0.07861328125, 0.017578125, 0.11376953125, 0.2099609375, 0.30615234375, 0.40234375, 0.49853515625, 0.5947265625, 0.69091796875, 0.787109375, 0.88330078125, 0.9794921875, 1.07568359375, 1.171875, 1.26806640625, 1.3642578125, 1.46044921875, 1.556640625, 1.65283203125, 1.7490234375, 1.84521484375, 1.94140625, 2.03759765625, 2.1337890625, 2.22998046875, 2.326171875, 2.42236328125, 2.5185546875, 2.61474609375, 2.7109375, 2.80712890625, 2.9033203125, 2.99951171875, 3.095703125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 8.0, 7.0, 4.0, 6.0, 8.0, 7.0, 16.0, 11.0, 13.0, 16.0, 25.0, 19.0, 21.0, 26.0, 30.0, 31.0, 27.0, 46.0, 34.0, 38.0, 36.0, 62.0, 883.0, 190.0, 42.0, 37.0, 39.0, 27.0, 38.0, 34.0, 32.0, 28.0, 22.0, 27.0, 27.0, 20.0, 16.0, 13.0, 14.0, 11.0, 10.0, 5.0, 6.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.2177734375, -7.951171875, -7.6845703125, -7.41796875, -7.1513671875, -6.884765625, -6.6181640625, -6.3515625, -6.0849609375, -5.818359375, -5.5517578125, -5.28515625, -5.0185546875, -4.751953125, -4.4853515625, -4.21875, -3.9521484375, -3.685546875, -3.4189453125, -3.15234375, -2.8857421875, -2.619140625, -2.3525390625, -2.0859375, -1.8193359375, -1.552734375, -1.2861328125, -1.01953125, -0.7529296875, -0.486328125, -0.2197265625, 0.046875, 0.3134765625, 0.580078125, 0.8466796875, 1.11328125, 1.3798828125, 1.646484375, 1.9130859375, 2.1796875, 2.4462890625, 2.712890625, 2.9794921875, 3.24609375, 3.5126953125, 3.779296875, 4.0458984375, 4.3125, 4.5791015625, 4.845703125, 5.1123046875, 5.37890625, 5.6455078125, 5.912109375, 6.1787109375, 6.4453125, 6.7119140625, 6.978515625, 7.2451171875, 7.51171875, 7.7783203125, 8.044921875, 8.3115234375, 8.578125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 8.0, 10.0, 15.0, 28.0, 41.0, 67.0, 133.0, 182.0, 178.0, 133.0, 64.0, 49.0, 35.0, 18.0, 18.0, 7.0, 6.0, 4.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.14434051513672, -17.088048934936523, -16.031755447387695, -14.9754638671875, -13.919170379638672, -12.862878799438477, -11.806586265563965, -10.750293731689453, -9.694001197814941, -8.63770866394043, -7.581416130065918, -6.5251240730285645, -5.468831539154053, -4.412539005279541, -3.3562469482421875, -2.299954414367676, -1.243661880493164, -0.1873694658279419, 0.8689229488372803, 1.925215244293213, 2.9815077781677246, 4.037800312042236, 5.09409236907959, 6.150384902954102, 7.206677436828613, 8.262969970703125, 9.319262504577637, 10.375555038452148, 11.431846618652344, 12.488140106201172, 13.544431686401367, 14.600724220275879, 15.65701675415039, 16.713308334350586, 17.769601821899414, 18.82589340209961, 19.882186889648438, 20.938478469848633, 21.994770050048828, 23.051063537597656, 24.107357025146484, 25.16364860534668, 26.219942092895508, 27.276233673095703, 28.33252716064453, 29.388818740844727, 30.445110321044922, 31.50140380859375, 32.55769348144531, 33.61398696899414, 34.6702766418457, 35.72657012939453, 36.78286361694336, 37.83915710449219, 38.89544677734375, 39.95174026489258, 41.008033752441406, 42.064327239990234, 43.1206169128418, 44.176910400390625, 45.23320388793945, 46.28949737548828, 47.345787048339844, 48.40208053588867, 49.4583740234375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 7.0, 5.0, 9.0, 4.0, 20.0, 21.0, 24.0, 32.0, 40.0, 42.0, 35.0, 53.0, 61.0, 55.0, 43.0, 59.0, 48.0, 47.0, 61.0, 47.0, 50.0, 49.0, 42.0, 32.0, 39.0, 29.0, 25.0, 11.0, 7.0, 6.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.16651153564453, -36.938209533691406, -35.70990753173828, -34.48160934448242, -33.2533073425293, -32.02500534057617, -30.796703338623047, -29.568403244018555, -28.340103149414062, -27.111801147460938, -25.883501052856445, -24.65519905090332, -23.426898956298828, -22.198596954345703, -20.970294952392578, -19.741994857788086, -18.51369285583496, -17.285390853881836, -16.057090759277344, -14.828788757324219, -13.600488662719727, -12.372186660766602, -11.143885612487793, -9.915584564208984, -8.687283515930176, -7.458982467651367, -6.230681419372559, -5.002379894256592, -3.774078845977783, -2.5457777976989746, -1.3174762725830078, -0.08917522430419922, 1.1391258239746094, 2.367426872253418, 3.5957281589508057, 4.824029445648193, 6.052330493927002, 7.2806315422058105, 8.508933067321777, 9.737234115600586, 10.965535163879395, 12.193836212158203, 13.422137260437012, 14.65043830871582, 15.878740310668945, 17.107040405273438, 18.335342407226562, 19.563644409179688, 20.79194450378418, 22.020246505737305, 23.248546600341797, 24.476848602294922, 25.705148696899414, 26.93345069885254, 28.16175079345703, 29.390052795410156, 30.61835479736328, 31.846656799316406, 33.07495880126953, 34.30325698852539, 35.531558990478516, 36.75986099243164, 37.988162994384766, 39.216461181640625, 40.44476318359375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 5.0, 5.0, 12.0, 16.0, 20.0, 29.0, 56.0, 62.0, 95.0, 139.0, 221.0, 293.0, 484.0, 765.0, 1215.0, 1957.0, 3767.0, 8885.0, 35454.0, 3987410.0, 128058.0, 14656.0, 4919.0, 2406.0, 1353.0, 758.0, 461.0, 278.0, 154.0, 118.0, 70.0, 57.0, 28.0, 19.0, 15.0, 13.0, 2.0, 9.0, 5.0, 4.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.252685546875, -0.24358749389648438, -0.23448944091796875, -0.22539138793945312, -0.2162933349609375, -0.20719528198242188, -0.19809722900390625, -0.18899917602539062, -0.179901123046875, -0.17080307006835938, -0.16170501708984375, -0.15260696411132812, -0.1435089111328125, -0.13441085815429688, -0.12531280517578125, -0.11621475219726562, -0.10711669921875, -0.09801864624023438, -0.08892059326171875, -0.07982254028320312, -0.0707244873046875, -0.061626434326171875, -0.05252838134765625, -0.043430328369140625, -0.034332275390625, -0.025234222412109375, -0.01613616943359375, -0.007038116455078125, 0.0020599365234375, 0.011157989501953125, 0.02025604248046875, 0.029354095458984375, 0.0384521484375, 0.047550201416015625, 0.05664825439453125, 0.06574630737304688, 0.0748443603515625, 0.08394241333007812, 0.09304046630859375, 0.10213851928710938, 0.111236572265625, 0.12033462524414062, 0.12943267822265625, 0.13853073120117188, 0.1476287841796875, 0.15672683715820312, 0.16582489013671875, 0.17492294311523438, 0.18402099609375, 0.19311904907226562, 0.20221710205078125, 0.21131515502929688, 0.2204132080078125, 0.22951126098632812, 0.23860931396484375, 0.24770736694335938, 0.256805419921875, 0.2659034729003906, 0.27500152587890625, 0.2840995788574219, 0.2931976318359375, 0.3022956848144531, 0.31139373779296875, 0.3204917907714844, 0.32958984375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 5.0, 0.0, 7.0, 2.0, 5.0, 6.0, 8.0, 8.0, 9.0, 9.0, 10.0, 12.0, 18.0, 20.0, 767.0, 16.0, 17.0, 8.0, 9.0, 12.0, 9.0, 6.0, 5.0, 9.0, 2.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1102294921875, -0.10700511932373047, -0.10378074645996094, -0.1005563735961914, -0.09733200073242188, -0.09410762786865234, -0.09088325500488281, -0.08765888214111328, -0.08443450927734375, -0.08121013641357422, -0.07798576354980469, -0.07476139068603516, -0.07153701782226562, -0.0683126449584961, -0.06508827209472656, -0.06186389923095703, -0.0586395263671875, -0.05541515350341797, -0.05219078063964844, -0.048966407775878906, -0.045742034912109375, -0.042517662048339844, -0.03929328918457031, -0.03606891632080078, -0.03284454345703125, -0.02962017059326172, -0.026395797729492188, -0.023171424865722656, -0.019947052001953125, -0.016722679138183594, -0.013498306274414062, -0.010273933410644531, -0.007049560546875, -0.0038251876831054688, -0.0006008148193359375, 0.0026235580444335938, 0.005847930908203125, 0.009072303771972656, 0.012296676635742188, 0.015521049499511719, 0.01874542236328125, 0.02196979522705078, 0.025194168090820312, 0.028418540954589844, 0.031642913818359375, 0.034867286682128906, 0.03809165954589844, 0.04131603240966797, 0.0445404052734375, 0.04776477813720703, 0.05098915100097656, 0.054213523864746094, 0.057437896728515625, 0.060662269592285156, 0.06388664245605469, 0.06711101531982422, 0.07033538818359375, 0.07355976104736328, 0.07678413391113281, 0.08000850677490234, 0.08323287963867188, 0.0864572525024414, 0.08968162536621094, 0.09290599822998047, 0.09613037109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 13.0, 15.0, 21.0, 26.0, 44.0, 60.0, 88.0, 141.0, 199.0, 364.0, 627.0, 1117.0, 2317.0, 5158.0, 14209.0, 63027.0, 3532288.0, 518471.0, 36049.0, 10663.0, 4390.0, 2119.0, 1060.0, 697.0, 389.0, 238.0, 150.0, 87.0, 66.0, 44.0, 40.0, 19.0, 23.0, 8.0, 5.0, 12.0, 6.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.248291015625, -0.24048614501953125, -0.2326812744140625, -0.22487640380859375, -0.217071533203125, -0.20926666259765625, -0.2014617919921875, -0.19365692138671875, -0.18585205078125, -0.17804718017578125, -0.1702423095703125, -0.16243743896484375, -0.154632568359375, -0.14682769775390625, -0.1390228271484375, -0.13121795654296875, -0.1234130859375, -0.11560821533203125, -0.1078033447265625, -0.09999847412109375, -0.092193603515625, -0.08438873291015625, -0.0765838623046875, -0.06877899169921875, -0.06097412109375, -0.05316925048828125, -0.0453643798828125, -0.03755950927734375, -0.029754638671875, -0.02194976806640625, -0.0141448974609375, -0.00634002685546875, 0.00146484375, 0.00926971435546875, 0.0170745849609375, 0.02487945556640625, 0.032684326171875, 0.04048919677734375, 0.0482940673828125, 0.05609893798828125, 0.06390380859375, 0.07170867919921875, 0.0795135498046875, 0.08731842041015625, 0.095123291015625, 0.10292816162109375, 0.1107330322265625, 0.11853790283203125, 0.1263427734375, 0.13414764404296875, 0.1419525146484375, 0.14975738525390625, 0.157562255859375, 0.16536712646484375, 0.1731719970703125, 0.18097686767578125, 0.18878173828125, 0.19658660888671875, 0.2043914794921875, 0.21219635009765625, 0.220001220703125, 0.22780609130859375, 0.2356109619140625, 0.24341583251953125, 0.251220703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 8.0, 15.0, 10.0, 17.0, 42.0, 79.0, 292.0, 1713.0, 1318.0, 299.0, 104.0, 48.0, 28.0, 18.0, 9.0, 12.0, 13.0, 8.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.161376953125, -0.15662193298339844, -0.15186691284179688, -0.1471118927001953, -0.14235687255859375, -0.1376018524169922, -0.13284683227539062, -0.12809181213378906, -0.1233367919921875, -0.11858177185058594, -0.11382675170898438, -0.10907173156738281, -0.10431671142578125, -0.09956169128417969, -0.09480667114257812, -0.09005165100097656, -0.085296630859375, -0.08054161071777344, -0.07578659057617188, -0.07103157043457031, -0.06627655029296875, -0.06152153015136719, -0.056766510009765625, -0.05201148986816406, -0.0472564697265625, -0.04250144958496094, -0.037746429443359375, -0.03299140930175781, -0.02823638916015625, -0.023481369018554688, -0.018726348876953125, -0.013971328735351562, -0.00921630859375, -0.0044612884521484375, 0.000293731689453125, 0.0050487518310546875, 0.00980377197265625, 0.014558792114257812, 0.019313812255859375, 0.024068832397460938, 0.0288238525390625, 0.03357887268066406, 0.038333892822265625, 0.04308891296386719, 0.04784393310546875, 0.05259895324707031, 0.057353973388671875, 0.06210899353027344, 0.066864013671875, 0.07161903381347656, 0.07637405395507812, 0.08112907409667969, 0.08588409423828125, 0.09063911437988281, 0.09539413452148438, 0.10014915466308594, 0.1049041748046875, 0.10965919494628906, 0.11441421508789062, 0.11916923522949219, 0.12392425537109375, 0.1286792755126953, 0.13343429565429688, 0.13818931579589844, 0.1429443359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 59.0, 462.0, 385.0, 61.0, 16.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.095311164855957, -2.0515289306640625, -2.007746934890747, -1.963964819908142, -1.920182704925537, -1.8764004707336426, -1.8326184749603271, -1.7888362407684326, -1.7450541257858276, -1.7012720108032227, -1.6574898958206177, -1.6137077808380127, -1.5699256658554077, -1.5261435508728027, -1.4823613166809082, -1.4385792016983032, -1.3947970867156982, -1.3510149717330933, -1.3072328567504883, -1.2634507417678833, -1.2196686267852783, -1.1758863925933838, -1.1321043968200684, -1.0883221626281738, -1.0445401668548584, -1.0007580518722534, -0.9569759368896484, -0.9131938219070435, -0.8694116473197937, -0.8256295323371887, -0.7818474173545837, -0.738065242767334, -0.6942831873893738, -0.6505010724067688, -0.6067189574241638, -0.5629367828369141, -0.5191546678543091, -0.4753725528717041, -0.4315904378890991, -0.38780829310417175, -0.3440261781215668, -0.3002440631389618, -0.2564619183540344, -0.21267980337142944, -0.16889767348766327, -0.1251155436038971, -0.08133342862129211, -0.037551283836364746, 0.006230831146240234, 0.05001295730471611, 0.09379508346319199, 0.13757720589637756, 0.18135933578014374, 0.2251414656639099, 0.2689235806465149, 0.31270572543144226, 0.35648784041404724, 0.4002699553966522, 0.4440521001815796, 0.48783421516418457, 0.5316163301467896, 0.5753984451293945, 0.6191805601119995, 0.6629627346992493, 0.7067448496818542]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 13.0, 6.0, 13.0, 25.0, 35.0, 53.0, 88.0, 114.0, 127.0, 136.0, 121.0, 82.0, 60.0, 50.0, 30.0, 16.0, 10.0, 7.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7515149712562561, -0.7248200178146362, -0.6981250047683716, -0.6714300513267517, -0.6447350978851318, -0.618040144443512, -0.5913451910018921, -0.5646501779556274, -0.5379552245140076, -0.5112602710723877, -0.48456528782844543, -0.4578703045845032, -0.4311753511428833, -0.4044803977012634, -0.37778541445732117, -0.3510904312133789, -0.32439547777175903, -0.29770052433013916, -0.2710055410861969, -0.24431057274341583, -0.21761560440063477, -0.1909206360578537, -0.16422566771507263, -0.13753069937229156, -0.1108357310295105, -0.08414076268672943, -0.057445794343948364, -0.030750826001167297, -0.0040558576583862305, 0.022639110684394836, 0.0493340790271759, 0.07602904736995697, 0.10272401571273804, 0.1294189840555191, 0.15611395239830017, 0.18280892074108124, 0.2095038890838623, 0.23619885742664337, 0.26289382576942444, 0.2895888090133667, 0.3162837624549866, 0.34297871589660645, 0.3696736991405487, 0.39636868238449097, 0.42306363582611084, 0.4497585892677307, 0.476453572511673, 0.5031485557556152, 0.5298435091972351, 0.556538462638855, 0.5832334756851196, 0.6099284291267395, 0.6366233825683594, 0.6633183360099792, 0.6900132894515991, 0.7167083024978638, 0.7434032559394836, 0.7700982093811035, 0.7967932224273682, 0.823488175868988, 0.8501831293106079, 0.8768780827522278, 0.9035730361938477, 0.9302680492401123, 0.9569630026817322]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 9.0, 14.0, 15.0, 14.0, 26.0, 47.0, 46.0, 75.0, 89.0, 150.0, 235.0, 350.0, 505.0, 658.0, 1084.0, 1690.0, 2796.0, 4498.0, 8145.0, 14985.0, 31235.0, 730555.0, 191293.0, 27791.0, 13472.0, 7391.0, 4172.0, 2558.0, 1559.0, 1002.0, 664.0, 443.0, 292.0, 187.0, 131.0, 110.0, 71.0, 59.0, 40.0, 23.0, 23.0, 18.0, 9.0, 9.0, 7.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.410400390625, -0.3971290588378906, -0.38385772705078125, -0.3705863952636719, -0.3573150634765625, -0.3440437316894531, -0.33077239990234375, -0.3175010681152344, -0.304229736328125, -0.2909584045410156, -0.27768707275390625, -0.2644157409667969, -0.2511444091796875, -0.23787307739257812, -0.22460174560546875, -0.21133041381835938, -0.19805908203125, -0.18478775024414062, -0.17151641845703125, -0.15824508666992188, -0.1449737548828125, -0.13170242309570312, -0.11843109130859375, -0.10515975952148438, -0.091888427734375, -0.07861709594726562, -0.06534576416015625, -0.052074432373046875, -0.0388031005859375, -0.025531768798828125, -0.01226043701171875, 0.001010894775390625, 0.0142822265625, 0.027553558349609375, 0.04082489013671875, 0.054096221923828125, 0.0673675537109375, 0.08063888549804688, 0.09391021728515625, 0.10718154907226562, 0.120452880859375, 0.13372421264648438, 0.14699554443359375, 0.16026687622070312, 0.1735382080078125, 0.18680953979492188, 0.20008087158203125, 0.21335220336914062, 0.22662353515625, 0.23989486694335938, 0.25316619873046875, 0.2664375305175781, 0.2797088623046875, 0.2929801940917969, 0.30625152587890625, 0.3195228576660156, 0.332794189453125, 0.3460655212402344, 0.35933685302734375, 0.3726081848144531, 0.3858795166015625, 0.3991508483886719, 0.41242218017578125, 0.4256935119628906, 0.43896484375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 4.0, 2.0, 4.0, 10.0, 10.0, 8.0, 9.0, 8.0, 12.0, 12.0, 32.0, 611.0, 157.0, 16.0, 11.0, 8.0, 9.0, 13.0, 7.0, 9.0, 2.0, 9.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097900390625, -0.09497642517089844, -0.09205245971679688, -0.08912849426269531, -0.08620452880859375, -0.08328056335449219, -0.08035659790039062, -0.07743263244628906, -0.0745086669921875, -0.07158470153808594, -0.06866073608398438, -0.06573677062988281, -0.06281280517578125, -0.05988883972167969, -0.056964874267578125, -0.05404090881347656, -0.051116943359375, -0.04819297790527344, -0.045269012451171875, -0.04234504699707031, -0.03942108154296875, -0.03649711608886719, -0.033573150634765625, -0.030649185180664062, -0.0277252197265625, -0.024801254272460938, -0.021877288818359375, -0.018953323364257812, -0.01602935791015625, -0.013105392456054688, -0.010181427001953125, -0.0072574615478515625, -0.00433349609375, -0.0014095306396484375, 0.001514434814453125, 0.0044384002685546875, 0.00736236572265625, 0.010286331176757812, 0.013210296630859375, 0.016134262084960938, 0.0190582275390625, 0.021982192993164062, 0.024906158447265625, 0.027830123901367188, 0.03075408935546875, 0.03367805480957031, 0.036602020263671875, 0.03952598571777344, 0.042449951171875, 0.04537391662597656, 0.048297882080078125, 0.05122184753417969, 0.05414581298828125, 0.05706977844238281, 0.059993743896484375, 0.06291770935058594, 0.0658416748046875, 0.06876564025878906, 0.07168960571289062, 0.07461357116699219, 0.07753753662109375, 0.08046150207519531, 0.08338546752929688, 0.08630943298339844, 0.0892333984375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 14.0, 22.0, 27.0, 28.0, 46.0, 58.0, 76.0, 126.0, 149.0, 242.0, 395.0, 751.0, 1473.0, 3334.0, 8874.0, 27633.0, 98914.0, 355719.0, 392259.0, 111056.0, 30454.0, 9710.0, 3623.0, 1489.0, 755.0, 421.0, 268.0, 160.0, 148.0, 89.0, 66.0, 46.0, 33.0, 19.0, 12.0, 15.0, 11.0, 7.0, 5.0, 3.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.27099609375, -0.2625389099121094, -0.25408172607421875, -0.24562454223632812, -0.2371673583984375, -0.22871017456054688, -0.22025299072265625, -0.21179580688476562, -0.203338623046875, -0.19488143920898438, -0.18642425537109375, -0.17796707153320312, -0.1695098876953125, -0.16105270385742188, -0.15259552001953125, -0.14413833618164062, -0.13568115234375, -0.12722396850585938, -0.11876678466796875, -0.11030960083007812, -0.1018524169921875, -0.09339523315429688, -0.08493804931640625, -0.07648086547851562, -0.068023681640625, -0.059566497802734375, -0.05110931396484375, -0.042652130126953125, -0.0341949462890625, -0.025737762451171875, -0.01728057861328125, -0.008823394775390625, -0.0003662109375, 0.008090972900390625, 0.01654815673828125, 0.025005340576171875, 0.0334625244140625, 0.041919708251953125, 0.05037689208984375, 0.058834075927734375, 0.067291259765625, 0.07574844360351562, 0.08420562744140625, 0.09266281127929688, 0.1011199951171875, 0.10957717895507812, 0.11803436279296875, 0.12649154663085938, 0.13494873046875, 0.14340591430664062, 0.15186309814453125, 0.16032028198242188, 0.1687774658203125, 0.17723464965820312, 0.18569183349609375, 0.19414901733398438, 0.202606201171875, 0.21106338500976562, 0.21952056884765625, 0.22797775268554688, 0.2364349365234375, 0.24489212036132812, 0.25334930419921875, 0.2618064880371094, 0.270263671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 4.0, 9.0, 11.0, 10.0, 8.0, 17.0, 24.0, 29.0, 18.0, 25.0, 34.0, 30.0, 31.0, 38.0, 30.0, 33.0, 30.0, 40.0, 39.0, 51.0, 44.0, 43.0, 44.0, 37.0, 36.0, 35.0, 43.0, 33.0, 29.0, 17.0, 19.0, 20.0, 15.0, 7.0, 16.0, 9.0, 8.0, 6.0, 5.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.37060546875, -0.36048126220703125, -0.3503570556640625, -0.34023284912109375, -0.330108642578125, -0.31998443603515625, -0.3098602294921875, -0.29973602294921875, -0.28961181640625, -0.27948760986328125, -0.2693634033203125, -0.25923919677734375, -0.249114990234375, -0.23899078369140625, -0.2288665771484375, -0.21874237060546875, -0.2086181640625, -0.19849395751953125, -0.1883697509765625, -0.17824554443359375, -0.168121337890625, -0.15799713134765625, -0.1478729248046875, -0.13774871826171875, -0.12762451171875, -0.11750030517578125, -0.1073760986328125, -0.09725189208984375, -0.087127685546875, -0.07700347900390625, -0.0668792724609375, -0.05675506591796875, -0.046630859375, -0.03650665283203125, -0.0263824462890625, -0.01625823974609375, -0.006134033203125, 0.00399017333984375, 0.0141143798828125, 0.02423858642578125, 0.03436279296875, 0.04448699951171875, 0.0546112060546875, 0.06473541259765625, 0.074859619140625, 0.08498382568359375, 0.0951080322265625, 0.10523223876953125, 0.1153564453125, 0.12548065185546875, 0.1356048583984375, 0.14572906494140625, 0.155853271484375, 0.16597747802734375, 0.1761016845703125, 0.18622589111328125, 0.19635009765625, 0.20647430419921875, 0.2165985107421875, 0.22672271728515625, 0.236846923828125, 0.24697113037109375, 0.2570953369140625, 0.26721954345703125, 0.27734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 9.0, 18.0, 29.0, 37.0, 106.0, 142.0, 264.0, 667.0, 1627.0, 5996.0, 54541.0, 944710.0, 33253.0, 4673.0, 1350.0, 504.0, 264.0, 127.0, 80.0, 43.0, 31.0, 21.0, 10.0, 10.0, 10.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34521484375, -0.331634521484375, -0.31805419921875, -0.304473876953125, -0.2908935546875, -0.277313232421875, -0.26373291015625, -0.250152587890625, -0.236572265625, -0.222991943359375, -0.20941162109375, -0.195831298828125, -0.1822509765625, -0.168670654296875, -0.15509033203125, -0.141510009765625, -0.1279296875, -0.114349365234375, -0.10076904296875, -0.087188720703125, -0.0736083984375, -0.060028076171875, -0.04644775390625, -0.032867431640625, -0.019287109375, -0.005706787109375, 0.00787353515625, 0.021453857421875, 0.0350341796875, 0.048614501953125, 0.06219482421875, 0.075775146484375, 0.08935546875, 0.102935791015625, 0.11651611328125, 0.130096435546875, 0.1436767578125, 0.157257080078125, 0.17083740234375, 0.184417724609375, 0.197998046875, 0.211578369140625, 0.22515869140625, 0.238739013671875, 0.2523193359375, 0.265899658203125, 0.27947998046875, 0.293060302734375, 0.306640625, 0.320220947265625, 0.33380126953125, 0.347381591796875, 0.3609619140625, 0.374542236328125, 0.38812255859375, 0.401702880859375, 0.415283203125, 0.428863525390625, 0.44244384765625, 0.456024169921875, 0.4696044921875, 0.483184814453125, 0.49676513671875, 0.510345458984375, 0.52392578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 8.0, 7.0, 8.0, 9.0, 11.0, 8.0, 15.0, 23.0, 20.0, 14.0, 25.0, 29.0, 46.0, 66.0, 131.0, 145.0, 146.0, 57.0, 44.0, 36.0, 25.0, 22.0, 9.0, 18.0, 15.0, 13.0, 9.0, 8.0, 3.0, 6.0, 6.0, 7.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023126602172851562, -0.00022310763597488403, -0.00021494925022125244, -0.00020679086446762085, -0.00019863247871398926, -0.00019047409296035767, -0.00018231570720672607, -0.00017415732145309448, -0.0001659989356994629, -0.0001578405499458313, -0.0001496821641921997, -0.00014152377843856812, -0.00013336539268493652, -0.00012520700693130493, -0.00011704862117767334, -0.00010889023542404175, -0.00010073184967041016, -9.257346391677856e-05, -8.441507816314697e-05, -7.625669240951538e-05, -6.809830665588379e-05, -5.99399209022522e-05, -5.1781535148620605e-05, -4.3623149394989014e-05, -3.546476364135742e-05, -2.730637788772583e-05, -1.9147992134094238e-05, -1.0989606380462646e-05, -2.8312206268310547e-06, 5.327165126800537e-06, 1.3485550880432129e-05, 2.164393663406372e-05, 2.9802322387695312e-05, 3.7960708141326904e-05, 4.6119093894958496e-05, 5.427747964859009e-05, 6.243586540222168e-05, 7.059425115585327e-05, 7.875263690948486e-05, 8.691102266311646e-05, 9.506940841674805e-05, 0.00010322779417037964, 0.00011138617992401123, 0.00011954456567764282, 0.00012770295143127441, 0.000135861337184906, 0.0001440197229385376, 0.0001521781086921692, 0.00016033649444580078, 0.00016849488019943237, 0.00017665326595306396, 0.00018481165170669556, 0.00019297003746032715, 0.00020112842321395874, 0.00020928680896759033, 0.00021744519472122192, 0.00022560358047485352, 0.0002337619662284851, 0.0002419203519821167, 0.0002500787377357483, 0.0002582371234893799, 0.0002663955092430115, 0.00027455389499664307, 0.00028271228075027466, 0.00029087066650390625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 10.0, 10.0, 14.0, 27.0, 67.0, 121.0, 225.0, 462.0, 1262.0, 4658.0, 30398.0, 715647.0, 274897.0, 15965.0, 3107.0, 960.0, 342.0, 161.0, 75.0, 48.0, 31.0, 23.0, 16.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331298828125, -0.3202018737792969, -0.30910491943359375, -0.2980079650878906, -0.2869110107421875, -0.2758140563964844, -0.26471710205078125, -0.2536201477050781, -0.242523193359375, -0.23142623901367188, -0.22032928466796875, -0.20923233032226562, -0.1981353759765625, -0.18703842163085938, -0.17594146728515625, -0.16484451293945312, -0.15374755859375, -0.14265060424804688, -0.13155364990234375, -0.12045669555664062, -0.1093597412109375, -0.09826278686523438, -0.08716583251953125, -0.07606887817382812, -0.064971923828125, -0.053874969482421875, -0.04277801513671875, -0.031681060791015625, -0.0205841064453125, -0.009487152099609375, 0.00160980224609375, 0.012706756591796875, 0.0238037109375, 0.034900665283203125, 0.04599761962890625, 0.057094573974609375, 0.0681915283203125, 0.07928848266601562, 0.09038543701171875, 0.10148239135742188, 0.112579345703125, 0.12367630004882812, 0.13477325439453125, 0.14587020874023438, 0.1569671630859375, 0.16806411743164062, 0.17916107177734375, 0.19025802612304688, 0.20135498046875, 0.21245193481445312, 0.22354888916015625, 0.23464584350585938, 0.2457427978515625, 0.2568397521972656, 0.26793670654296875, 0.2790336608886719, 0.290130615234375, 0.3012275695800781, 0.31232452392578125, 0.3234214782714844, 0.3345184326171875, 0.3456153869628906, 0.35671234130859375, 0.3678092956542969, 0.37890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 8.0, 7.0, 9.0, 18.0, 23.0, 33.0, 60.0, 78.0, 131.0, 162.0, 181.0, 100.0, 82.0, 49.0, 33.0, 13.0, 10.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5164108276367188, -0.5015716552734375, -0.48673248291015625, -0.471893310546875, -0.45705413818359375, -0.4422149658203125, -0.42737579345703125, -0.41253662109375, -0.39769744873046875, -0.3828582763671875, -0.36801910400390625, -0.353179931640625, -0.33834075927734375, -0.3235015869140625, -0.30866241455078125, -0.2938232421875, -0.27898406982421875, -0.2641448974609375, -0.24930572509765625, -0.234466552734375, -0.21962738037109375, -0.2047882080078125, -0.18994903564453125, -0.17510986328125, -0.16027069091796875, -0.1454315185546875, -0.13059234619140625, -0.115753173828125, -0.10091400146484375, -0.0860748291015625, -0.07123565673828125, -0.056396484375, -0.04155731201171875, -0.0267181396484375, -0.01187896728515625, 0.002960205078125, 0.01779937744140625, 0.0326385498046875, 0.04747772216796875, 0.06231689453125, 0.07715606689453125, 0.0919952392578125, 0.10683441162109375, 0.121673583984375, 0.13651275634765625, 0.1513519287109375, 0.16619110107421875, 0.1810302734375, 0.19586944580078125, 0.2107086181640625, 0.22554779052734375, 0.240386962890625, 0.25522613525390625, 0.2700653076171875, 0.28490447998046875, 0.29974365234375, 0.31458282470703125, 0.3294219970703125, 0.34426116943359375, 0.359100341796875, 0.37393951416015625, 0.3887786865234375, 0.40361785888671875, 0.41845703125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 19.0, 58.0, 257.0, 496.0, 117.0, 23.0, 15.0, 5.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.924313545227051, -6.680110454559326, -6.43590784072876, -6.191704750061035, -5.947502136230469, -5.703299045562744, -5.459096431732178, -5.214893341064453, -4.970690727233887, -4.726487636566162, -4.482285022735596, -4.238081932067871, -3.9938793182373047, -3.74967622756958, -3.5054736137390137, -3.261270523071289, -3.0170676708221436, -2.772864818572998, -2.5286619663238525, -2.284459114074707, -2.0402562618255615, -1.7960532903671265, -1.551850438117981, -1.3076475858688354, -1.06344473361969, -0.8192418813705444, -0.5750390291213989, -0.33083611726760864, -0.08663326501846313, 0.15756964683532715, 0.40177249908447266, 0.6459753513336182, 0.8901782035827637, 1.1343810558319092, 1.3785839080810547, 1.6227867603302002, 1.8669896125793457, 2.1111927032470703, 2.3553953170776367, 2.5995984077453613, 2.8438010215759277, 3.0880038738250732, 3.3322067260742188, 3.5764095783233643, 3.8206124305725098, 4.064815521240234, 4.309018135070801, 4.553221225738525, 4.79742431640625, 5.041627407073975, 5.285830020904541, 5.530033111572266, 5.774235725402832, 6.018438816070557, 6.262641429901123, 6.506844520568848, 6.751047134399414, 6.995250225067139, 7.239452838897705, 7.48365592956543, 7.727858543395996, 7.972061634063721, 8.216264724731445, 8.460467338562012, 8.704669952392578]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 6.0, 6.0, 2.0, 7.0, 14.0, 17.0, 16.0, 29.0, 53.0, 79.0, 112.0, 123.0, 121.0, 109.0, 89.0, 63.0, 35.0, 27.0, 12.0, 8.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.305180072784424, -5.129615783691406, -4.9540510177612305, -4.778486251831055, -4.602921962738037, -4.4273576736450195, -4.251792907714844, -4.076228141784668, -3.9006638526916504, -3.7250993251800537, -3.549534797668457, -3.3739702701568604, -3.1984057426452637, -3.022841215133667, -2.8472766876220703, -2.6717121601104736, -2.496147632598877, -2.3205831050872803, -2.1450185775756836, -1.969454050064087, -1.7938895225524902, -1.6183249950408936, -1.4427604675292969, -1.2671959400177002, -1.0916314125061035, -0.9160668849945068, -0.7405023574829102, -0.5649378299713135, -0.3893733024597168, -0.21380877494812012, -0.03824424743652344, 0.13732028007507324, 0.3128852844238281, 0.4884498119354248, 0.6640143394470215, 0.8395788669586182, 1.0151433944702148, 1.1907079219818115, 1.3662724494934082, 1.5418369770050049, 1.7174015045166016, 1.8929660320281982, 2.068530559539795, 2.2440950870513916, 2.4196596145629883, 2.595224142074585, 2.7707886695861816, 2.9463531970977783, 3.121917724609375, 3.2974822521209717, 3.4730467796325684, 3.648611307144165, 3.8241758346557617, 3.9997403621673584, 4.175304889678955, 4.350869178771973, 4.526433944702148, 4.701998710632324, 4.877562999725342, 5.053127288818359, 5.228692054748535, 5.404256820678711, 5.5798211097717285, 5.755385398864746, 5.930950164794922]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 5.0, 6.0, 9.0, 18.0, 12.0, 18.0, 24.0, 48.0, 66.0, 95.0, 156.0, 284.0, 417.0, 790.0, 1428.0, 2890.0, 6111.0, 16141.0, 69851.0, 3955251.0, 113323.0, 17230.0, 5809.0, 2142.0, 994.0, 537.0, 256.0, 151.0, 78.0, 53.0, 40.0, 18.0, 18.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2490234375, -1.2174835205078125, -1.185943603515625, -1.1544036865234375, -1.12286376953125, -1.0913238525390625, -1.059783935546875, -1.0282440185546875, -0.9967041015625, -0.9651641845703125, -0.933624267578125, -0.9020843505859375, -0.87054443359375, -0.8390045166015625, -0.807464599609375, -0.7759246826171875, -0.744384765625, -0.7128448486328125, -0.681304931640625, -0.6497650146484375, -0.61822509765625, -0.5866851806640625, -0.555145263671875, -0.5236053466796875, -0.4920654296875, -0.4605255126953125, -0.428985595703125, -0.3974456787109375, -0.36590576171875, -0.3343658447265625, -0.302825927734375, -0.2712860107421875, -0.23974609375, -0.2082061767578125, -0.176666259765625, -0.1451263427734375, -0.11358642578125, -0.0820465087890625, -0.050506591796875, -0.0189666748046875, 0.0125732421875, 0.0441131591796875, 0.075653076171875, 0.1071929931640625, 0.13873291015625, 0.1702728271484375, 0.201812744140625, 0.2333526611328125, 0.264892578125, 0.2964324951171875, 0.327972412109375, 0.3595123291015625, 0.39105224609375, 0.4225921630859375, 0.454132080078125, 0.4856719970703125, 0.5172119140625, 0.5487518310546875, 0.580291748046875, 0.6118316650390625, 0.64337158203125, 0.6749114990234375, 0.706451416015625, 0.7379913330078125, 0.76953125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 2.0, 7.0, 6.0, 10.0, 11.0, 7.0, 10.0, 17.0, 45.0, 213.0, 386.0, 151.0, 40.0, 8.0, 15.0, 9.0, 18.0, 8.0, 5.0, 2.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10772705078125, -0.10497760772705078, -0.10222816467285156, -0.09947872161865234, -0.09672927856445312, -0.0939798355102539, -0.09123039245605469, -0.08848094940185547, -0.08573150634765625, -0.08298206329345703, -0.08023262023925781, -0.0774831771850586, -0.07473373413085938, -0.07198429107666016, -0.06923484802246094, -0.06648540496826172, -0.0637359619140625, -0.06098651885986328, -0.05823707580566406, -0.055487632751464844, -0.052738189697265625, -0.049988746643066406, -0.04723930358886719, -0.04448986053466797, -0.04174041748046875, -0.03899097442626953, -0.03624153137207031, -0.033492088317871094, -0.030742645263671875, -0.027993202209472656, -0.025243759155273438, -0.02249431610107422, -0.019744873046875, -0.01699542999267578, -0.014245986938476562, -0.011496543884277344, -0.008747100830078125, -0.005997657775878906, -0.0032482147216796875, -0.0004987716674804688, 0.00225067138671875, 0.005000114440917969, 0.0077495574951171875, 0.010499000549316406, 0.013248443603515625, 0.015997886657714844, 0.018747329711914062, 0.02149677276611328, 0.0242462158203125, 0.02699565887451172, 0.029745101928710938, 0.032494544982910156, 0.035243988037109375, 0.037993431091308594, 0.04074287414550781, 0.04349231719970703, 0.04624176025390625, 0.04899120330810547, 0.05174064636230469, 0.054490089416503906, 0.057239532470703125, 0.059988975524902344, 0.06273841857910156, 0.06548786163330078, 0.0682373046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 17.0, 24.0, 25.0, 59.0, 124.0, 245.0, 700.0, 2297.0, 13572.0, 312436.0, 3822608.0, 35759.0, 4472.0, 1093.0, 388.0, 205.0, 105.0, 51.0, 39.0, 18.0, 12.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6576766967773438, -0.6293182373046875, -0.6009597778320312, -0.572601318359375, -0.5442428588867188, -0.5158843994140625, -0.48752593994140625, -0.45916748046875, -0.43080902099609375, -0.4024505615234375, -0.37409210205078125, -0.345733642578125, -0.31737518310546875, -0.2890167236328125, -0.26065826416015625, -0.2322998046875, -0.20394134521484375, -0.1755828857421875, -0.14722442626953125, -0.118865966796875, -0.09050750732421875, -0.0621490478515625, -0.03379058837890625, -0.00543212890625, 0.02292633056640625, 0.0512847900390625, 0.07964324951171875, 0.108001708984375, 0.13636016845703125, 0.1647186279296875, 0.19307708740234375, 0.221435546875, 0.24979400634765625, 0.2781524658203125, 0.30651092529296875, 0.334869384765625, 0.36322784423828125, 0.3915863037109375, 0.41994476318359375, 0.44830322265625, 0.47666168212890625, 0.5050201416015625, 0.5333786010742188, 0.561737060546875, 0.5900955200195312, 0.6184539794921875, 0.6468124389648438, 0.6751708984375, 0.7035293579101562, 0.7318878173828125, 0.7602462768554688, 0.788604736328125, 0.8169631958007812, 0.8453216552734375, 0.8736801147460938, 0.90203857421875, 0.9303970336914062, 0.9587554931640625, 0.9871139526367188, 1.015472412109375, 1.0438308715820312, 1.0721893310546875, 1.1005477905273438, 1.12890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 3.0, 13.0, 7.0, 16.0, 21.0, 42.0, 79.0, 135.0, 532.0, 2212.0, 578.0, 194.0, 93.0, 45.0, 27.0, 23.0, 12.0, 16.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0718994140625, -0.067535400390625, -0.06317138671875, -0.058807373046875, -0.054443359375, -0.050079345703125, -0.04571533203125, -0.041351318359375, -0.0369873046875, -0.032623291015625, -0.02825927734375, -0.023895263671875, -0.01953125, -0.015167236328125, -0.01080322265625, -0.006439208984375, -0.0020751953125, 0.002288818359375, 0.00665283203125, 0.011016845703125, 0.015380859375, 0.019744873046875, 0.02410888671875, 0.028472900390625, 0.0328369140625, 0.037200927734375, 0.04156494140625, 0.045928955078125, 0.05029296875, 0.054656982421875, 0.05902099609375, 0.063385009765625, 0.0677490234375, 0.072113037109375, 0.07647705078125, 0.080841064453125, 0.085205078125, 0.089569091796875, 0.09393310546875, 0.098297119140625, 0.1026611328125, 0.107025146484375, 0.11138916015625, 0.115753173828125, 0.1201171875, 0.124481201171875, 0.12884521484375, 0.133209228515625, 0.1375732421875, 0.141937255859375, 0.14630126953125, 0.150665283203125, 0.155029296875, 0.159393310546875, 0.16375732421875, 0.168121337890625, 0.1724853515625, 0.176849365234375, 0.18121337890625, 0.185577392578125, 0.18994140625, 0.194305419921875, 0.19866943359375, 0.203033447265625, 0.2073974609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 16.0, 207.0, 628.0, 105.0, 17.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7564871311187744, -1.6835155487060547, -1.610543966293335, -1.5375723838806152, -1.4646008014678955, -1.3916292190551758, -1.318657636642456, -1.2456860542297363, -1.1727144718170166, -1.0997428894042969, -1.0267713069915771, -0.9537997245788574, -0.8808281421661377, -0.807856559753418, -0.7348849773406982, -0.6619133949279785, -0.5889418125152588, -0.5159702301025391, -0.44299864768981934, -0.3700270652770996, -0.2970554828643799, -0.22408390045166016, -0.15111231803894043, -0.0781407356262207, -0.0051691532135009766, 0.06780242919921875, 0.14077401161193848, 0.2137455940246582, 0.28671717643737793, 0.35968875885009766, 0.4326603412628174, 0.5056319236755371, 0.5786037445068359, 0.6515753269195557, 0.7245469093322754, 0.7975184917449951, 0.8704900741577148, 0.9434616565704346, 1.0164332389831543, 1.089404821395874, 1.1623764038085938, 1.2353479862213135, 1.3083195686340332, 1.381291151046753, 1.4542627334594727, 1.5272343158721924, 1.600205898284912, 1.6731774806976318, 1.7461490631103516, 1.8191206455230713, 1.892092227935791, 1.9650638103485107, 2.0380353927612305, 2.11100697517395, 2.18397855758667, 2.2569501399993896, 2.3299217224121094, 2.402893304824829, 2.475864887237549, 2.5488364696502686, 2.6218080520629883, 2.694779634475708, 2.7677512168884277, 2.8407227993011475, 2.913694381713867]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 9.0, 12.0, 12.0, 22.0, 31.0, 33.0, 39.0, 54.0, 69.0, 68.0, 84.0, 91.0, 62.0, 63.0, 53.0, 57.0, 58.0, 41.0, 37.0, 22.0, 17.0, 7.0, 14.0, 8.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.8213629722595215, -0.8008663654327393, -0.7803698182106018, -0.7598732709884644, -0.7393766641616821, -0.7188800573348999, -0.6983835101127625, -0.677886962890625, -0.6573903560638428, -0.6368937492370605, -0.6163972020149231, -0.5959006547927856, -0.5754040479660034, -0.5549074411392212, -0.5344108939170837, -0.5139143466949463, -0.49341773986816406, -0.4729211628437042, -0.4524245858192444, -0.43192800879478455, -0.4114314317703247, -0.39093485474586487, -0.37043827772140503, -0.3499417006969452, -0.32944512367248535, -0.3089485466480255, -0.2884519696235657, -0.26795539259910583, -0.247458815574646, -0.22696223855018616, -0.20646566152572632, -0.18596908450126648, -0.16547244787216187, -0.14497587084770203, -0.12447929382324219, -0.10398271679878235, -0.08348613977432251, -0.06298956274986267, -0.04249298572540283, -0.021996408700942993, -0.0014998316764831543, 0.018996745347976685, 0.03949332237243652, 0.05998989939689636, 0.0804864764213562, 0.10098305344581604, 0.12147963047027588, 0.14197620749473572, 0.16247278451919556, 0.1829693615436554, 0.20346593856811523, 0.22396251559257507, 0.2444590926170349, 0.26495566964149475, 0.2854522466659546, 0.30594882369041443, 0.32644540071487427, 0.3469419777393341, 0.36743855476379395, 0.3879351317882538, 0.4084317088127136, 0.42892828583717346, 0.4494248628616333, 0.46992143988609314, 0.490418016910553]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 7.0, 3.0, 7.0, 14.0, 12.0, 19.0, 27.0, 37.0, 59.0, 72.0, 135.0, 214.0, 300.0, 493.0, 935.0, 1651.0, 3170.0, 6848.0, 16051.0, 50493.0, 658021.0, 253937.0, 32672.0, 12101.0, 5301.0, 2567.0, 1457.0, 699.0, 468.0, 249.0, 150.0, 129.0, 88.0, 55.0, 29.0, 23.0, 22.0, 12.0, 9.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.470458984375, -0.4546928405761719, -0.43892669677734375, -0.4231605529785156, -0.4073944091796875, -0.3916282653808594, -0.37586212158203125, -0.3600959777832031, -0.344329833984375, -0.3285636901855469, -0.31279754638671875, -0.2970314025878906, -0.2812652587890625, -0.2654991149902344, -0.24973297119140625, -0.23396682739257812, -0.21820068359375, -0.20243453979492188, -0.18666839599609375, -0.17090225219726562, -0.1551361083984375, -0.13936996459960938, -0.12360382080078125, -0.10783767700195312, -0.092071533203125, -0.07630538940429688, -0.06053924560546875, -0.044773101806640625, -0.0290069580078125, -0.013240814208984375, 0.00252532958984375, 0.018291473388671875, 0.0340576171875, 0.049823760986328125, 0.06558990478515625, 0.08135604858398438, 0.0971221923828125, 0.11288833618164062, 0.12865447998046875, 0.14442062377929688, 0.160186767578125, 0.17595291137695312, 0.19171905517578125, 0.20748519897460938, 0.2232513427734375, 0.23901748657226562, 0.25478363037109375, 0.2705497741699219, 0.28631591796875, 0.3020820617675781, 0.31784820556640625, 0.3336143493652344, 0.3493804931640625, 0.3651466369628906, 0.38091278076171875, 0.3966789245605469, 0.412445068359375, 0.4282112121582031, 0.44397735595703125, 0.4597434997558594, 0.4755096435546875, 0.4912757873535156, 0.5070419311523438, 0.5228080749511719, 0.53857421875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 7.0, 9.0, 6.0, 12.0, 6.0, 25.0, 27.0, 79.0, 169.0, 255.0, 173.0, 92.0, 46.0, 20.0, 19.0, 5.0, 6.0, 13.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.10113525390625, -0.09857177734375, -0.09600830078125, -0.09344482421875, -0.09088134765625, -0.08831787109375, -0.08575439453125, -0.08319091796875, -0.08062744140625, -0.07806396484375, -0.07550048828125, -0.07293701171875, -0.07037353515625, -0.06781005859375, -0.06524658203125, -0.06268310546875, -0.06011962890625, -0.05755615234375, -0.05499267578125, -0.05242919921875, -0.04986572265625, -0.04730224609375, -0.04473876953125, -0.04217529296875, -0.03961181640625, -0.03704833984375, -0.03448486328125, -0.03192138671875, -0.02935791015625, -0.02679443359375, -0.02423095703125, -0.02166748046875, -0.01910400390625, -0.01654052734375, -0.01397705078125, -0.01141357421875, -0.00885009765625, -0.00628662109375, -0.00372314453125, -0.00115966796875, 0.00140380859375, 0.00396728515625, 0.00653076171875, 0.00909423828125, 0.01165771484375, 0.01422119140625, 0.01678466796875, 0.01934814453125, 0.02191162109375, 0.02447509765625, 0.02703857421875, 0.02960205078125, 0.03216552734375, 0.03472900390625, 0.03729248046875, 0.03985595703125, 0.04241943359375, 0.04498291015625, 0.04754638671875, 0.05010986328125, 0.05267333984375, 0.05523681640625, 0.05780029296875, 0.06036376953125, 0.06292724609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 1.0, 6.0, 1.0, 4.0, 2.0, 5.0, 4.0, 15.0, 65.0, 408.0, 4208.0, 887245.0, 154844.0, 1467.0, 190.0, 32.0, 8.0, 10.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.732421875, -1.679656982421875, -1.62689208984375, -1.574127197265625, -1.5213623046875, -1.468597412109375, -1.41583251953125, -1.363067626953125, -1.310302734375, -1.257537841796875, -1.20477294921875, -1.152008056640625, -1.0992431640625, -1.046478271484375, -0.99371337890625, -0.940948486328125, -0.88818359375, -0.835418701171875, -0.78265380859375, -0.729888916015625, -0.6771240234375, -0.624359130859375, -0.57159423828125, -0.518829345703125, -0.466064453125, -0.413299560546875, -0.36053466796875, -0.307769775390625, -0.2550048828125, -0.202239990234375, -0.14947509765625, -0.096710205078125, -0.0439453125, 0.008819580078125, 0.06158447265625, 0.114349365234375, 0.1671142578125, 0.219879150390625, 0.27264404296875, 0.325408935546875, 0.378173828125, 0.430938720703125, 0.48370361328125, 0.536468505859375, 0.5892333984375, 0.641998291015625, 0.69476318359375, 0.747528076171875, 0.80029296875, 0.853057861328125, 0.90582275390625, 0.958587646484375, 1.0113525390625, 1.064117431640625, 1.11688232421875, 1.169647216796875, 1.222412109375, 1.275177001953125, 1.32794189453125, 1.380706787109375, 1.4334716796875, 1.486236572265625, 1.53900146484375, 1.591766357421875, 1.64453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 3.0, 1.0, 1.0, 2.0, 5.0, 12.0, 5.0, 9.0, 11.0, 9.0, 6.0, 7.0, 16.0, 16.0, 18.0, 13.0, 24.0, 21.0, 25.0, 31.0, 26.0, 28.0, 28.0, 33.0, 28.0, 36.0, 33.0, 39.0, 37.0, 30.0, 35.0, 32.0, 35.0, 27.0, 30.0, 30.0, 33.0, 25.0, 16.0, 30.0, 22.0, 30.0, 12.0, 17.0, 18.0, 17.0, 10.0, 7.0, 5.0, 4.0, 3.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.1727294921875, -0.16731834411621094, -0.16190719604492188, -0.1564960479736328, -0.15108489990234375, -0.1456737518310547, -0.14026260375976562, -0.13485145568847656, -0.1294403076171875, -0.12402915954589844, -0.11861801147460938, -0.11320686340332031, -0.10779571533203125, -0.10238456726074219, -0.09697341918945312, -0.09156227111816406, -0.086151123046875, -0.08073997497558594, -0.07532882690429688, -0.06991767883300781, -0.06450653076171875, -0.05909538269042969, -0.053684234619140625, -0.04827308654785156, -0.0428619384765625, -0.03745079040527344, -0.032039642333984375, -0.026628494262695312, -0.02121734619140625, -0.015806198120117188, -0.010395050048828125, -0.0049839019775390625, 0.00042724609375, 0.0058383941650390625, 0.011249542236328125, 0.016660690307617188, 0.02207183837890625, 0.027482986450195312, 0.032894134521484375, 0.03830528259277344, 0.0437164306640625, 0.04912757873535156, 0.054538726806640625, 0.05994987487792969, 0.06536102294921875, 0.07077217102050781, 0.07618331909179688, 0.08159446716308594, 0.087005615234375, 0.09241676330566406, 0.09782791137695312, 0.10323905944824219, 0.10865020751953125, 0.11406135559082031, 0.11947250366210938, 0.12488365173339844, 0.1302947998046875, 0.13570594787597656, 0.14111709594726562, 0.1465282440185547, 0.15193939208984375, 0.1573505401611328, 0.16276168823242188, 0.16817283630371094, 0.173583984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 6.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 18.0, 34.0, 72.0, 272.0, 1666.0, 85343.0, 957020.0, 3473.0, 400.0, 106.0, 35.0, 19.0, 17.0, 12.0, 7.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.48828125, -1.4389190673828125, -1.389556884765625, -1.3401947021484375, -1.29083251953125, -1.2414703369140625, -1.192108154296875, -1.1427459716796875, -1.0933837890625, -1.0440216064453125, -0.994659423828125, -0.9452972412109375, -0.89593505859375, -0.8465728759765625, -0.797210693359375, -0.7478485107421875, -0.698486328125, -0.6491241455078125, -0.599761962890625, -0.5503997802734375, -0.50103759765625, -0.4516754150390625, -0.402313232421875, -0.3529510498046875, -0.3035888671875, -0.2542266845703125, -0.204864501953125, -0.1555023193359375, -0.10614013671875, -0.0567779541015625, -0.007415771484375, 0.0419464111328125, 0.09130859375, 0.1406707763671875, 0.190032958984375, 0.2393951416015625, 0.28875732421875, 0.3381195068359375, 0.387481689453125, 0.4368438720703125, 0.4862060546875, 0.5355682373046875, 0.584930419921875, 0.6342926025390625, 0.68365478515625, 0.7330169677734375, 0.782379150390625, 0.8317413330078125, 0.881103515625, 0.9304656982421875, 0.979827880859375, 1.0291900634765625, 1.07855224609375, 1.1279144287109375, 1.177276611328125, 1.2266387939453125, 1.2760009765625, 1.3253631591796875, 1.374725341796875, 1.4240875244140625, 1.47344970703125, 1.5228118896484375, 1.572174072265625, 1.6215362548828125, 1.6708984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 8.0, 5.0, 12.0, 6.0, 10.0, 18.0, 23.0, 29.0, 33.0, 67.0, 101.0, 133.0, 177.0, 88.0, 63.0, 64.0, 32.0, 21.0, 18.0, 17.0, 13.0, 11.0, 9.0, 5.0, 1.0, 6.0, 7.0, 4.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0003590583801269531, -0.0003485754132270813, -0.00033809244632720947, -0.00032760947942733765, -0.0003171265125274658, -0.000306643545627594, -0.00029616057872772217, -0.00028567761182785034, -0.0002751946449279785, -0.0002647116780281067, -0.00025422871112823486, -0.00024374574422836304, -0.0002332627773284912, -0.00022277981042861938, -0.00021229684352874756, -0.00020181387662887573, -0.0001913309097290039, -0.00018084794282913208, -0.00017036497592926025, -0.00015988200902938843, -0.0001493990421295166, -0.00013891607522964478, -0.00012843310832977295, -0.00011795014142990112, -0.0001074671745300293, -9.698420763015747e-05, -8.650124073028564e-05, -7.601827383041382e-05, -6.553530693054199e-05, -5.5052340030670166e-05, -4.456937313079834e-05, -3.4086406230926514e-05, -2.3603439331054688e-05, -1.3120472431182861e-05, -2.637505531311035e-06, 7.845461368560791e-06, 1.8328428268432617e-05, 2.8811395168304443e-05, 3.929436206817627e-05, 4.9777328968048096e-05, 6.026029586791992e-05, 7.074326276779175e-05, 8.122622966766357e-05, 9.17091965675354e-05, 0.00010219216346740723, 0.00011267513036727905, 0.00012315809726715088, 0.0001336410641670227, 0.00014412403106689453, 0.00015460699796676636, 0.00016508996486663818, 0.00017557293176651, 0.00018605589866638184, 0.00019653886556625366, 0.0002070218324661255, 0.00021750479936599731, 0.00022798776626586914, 0.00023847073316574097, 0.0002489537000656128, 0.0002594366669654846, 0.00026991963386535645, 0.00028040260076522827, 0.0002908855676651001, 0.0003013685345649719, 0.00031185150146484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 13.0, 15.0, 30.0, 37.0, 74.0, 132.0, 202.0, 472.0, 1236.0, 4872.0, 45387.0, 864864.0, 119671.0, 8466.0, 1827.0, 652.0, 278.0, 133.0, 80.0, 39.0, 22.0, 13.0, 10.0, 7.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54345703125, -0.52777099609375, -0.5120849609375, -0.49639892578125, -0.480712890625, -0.46502685546875, -0.4493408203125, -0.43365478515625, -0.41796875, -0.40228271484375, -0.3865966796875, -0.37091064453125, -0.355224609375, -0.33953857421875, -0.3238525390625, -0.30816650390625, -0.29248046875, -0.27679443359375, -0.2611083984375, -0.24542236328125, -0.229736328125, -0.21405029296875, -0.1983642578125, -0.18267822265625, -0.1669921875, -0.15130615234375, -0.1356201171875, -0.11993408203125, -0.104248046875, -0.08856201171875, -0.0728759765625, -0.05718994140625, -0.04150390625, -0.02581787109375, -0.0101318359375, 0.00555419921875, 0.021240234375, 0.03692626953125, 0.0526123046875, 0.06829833984375, 0.083984375, 0.09967041015625, 0.1153564453125, 0.13104248046875, 0.146728515625, 0.16241455078125, 0.1781005859375, 0.19378662109375, 0.20947265625, 0.22515869140625, 0.2408447265625, 0.25653076171875, 0.272216796875, 0.28790283203125, 0.3035888671875, 0.31927490234375, 0.3349609375, 0.35064697265625, 0.3663330078125, 0.38201904296875, 0.397705078125, 0.41339111328125, 0.4290771484375, 0.44476318359375, 0.46044921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 11.0, 17.0, 29.0, 34.0, 77.0, 145.0, 161.0, 177.0, 149.0, 94.0, 42.0, 28.0, 18.0, 9.0, 10.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50537109375, -0.4921226501464844, -0.47887420654296875, -0.4656257629394531, -0.4523773193359375, -0.4391288757324219, -0.42588043212890625, -0.4126319885253906, -0.399383544921875, -0.3861351013183594, -0.37288665771484375, -0.3596382141113281, -0.3463897705078125, -0.3331413269042969, -0.31989288330078125, -0.3066444396972656, -0.29339599609375, -0.2801475524902344, -0.26689910888671875, -0.2536506652832031, -0.2404022216796875, -0.22715377807617188, -0.21390533447265625, -0.20065689086914062, -0.187408447265625, -0.17416000366210938, -0.16091156005859375, -0.14766311645507812, -0.1344146728515625, -0.12116622924804688, -0.10791778564453125, -0.09466934204101562, -0.0814208984375, -0.06817245483398438, -0.05492401123046875, -0.041675567626953125, -0.0284271240234375, -0.015178680419921875, -0.00193023681640625, 0.011318206787109375, 0.024566650390625, 0.037815093994140625, 0.05106353759765625, 0.06431198120117188, 0.0775604248046875, 0.09080886840820312, 0.10405731201171875, 0.11730575561523438, 0.13055419921875, 0.14380264282226562, 0.15705108642578125, 0.17029953002929688, 0.1835479736328125, 0.19679641723632812, 0.21004486083984375, 0.22329330444335938, 0.236541748046875, 0.24979019165039062, 0.26303863525390625, 0.2762870788574219, 0.2895355224609375, 0.3027839660644531, 0.31603240966796875, 0.3292808532714844, 0.342529296875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 24.0, 63.0, 167.0, 323.0, 232.0, 102.0, 36.0, 18.0, 3.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.8879098892211914, -3.7847743034362793, -3.681638717651367, -3.578502893447876, -3.475367307662964, -3.3722317218780518, -3.2690958976745605, -3.1659603118896484, -3.0628247261047363, -2.959689140319824, -2.856553554534912, -2.753417730331421, -2.650282144546509, -2.5471465587615967, -2.4440107345581055, -2.3408751487731934, -2.2377395629882812, -2.134603977203369, -2.031468391418457, -1.9283325672149658, -1.8251969814300537, -1.7220613956451416, -1.61892569065094, -1.5157899856567383, -1.4126543998718262, -1.309518814086914, -1.2063831090927124, -1.1032474040985107, -1.0001118183135986, -0.8969761729240417, -0.7938405275344849, -0.690704882144928, -0.5875692367553711, -0.4844335913658142, -0.3812979459762573, -0.27816230058670044, -0.17502665519714355, -0.07189100980758667, 0.031244635581970215, 0.1343802809715271, 0.23751592636108398, 0.34065157175064087, 0.44378721714019775, 0.5469228625297546, 0.6500585079193115, 0.7531941533088684, 0.8563297986984253, 0.9594654440879822, 1.062601089477539, 1.1657366752624512, 1.2688723802566528, 1.3720080852508545, 1.4751436710357666, 1.5782792568206787, 1.6814149618148804, 1.784550666809082, 1.8876862525939941, 1.9908218383789062, 2.0939574241638184, 2.1970932483673096, 2.3002288341522217, 2.403364419937134, 2.506500244140625, 2.609635829925537, 2.712771415710449]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 10.0, 16.0, 19.0, 33.0, 54.0, 70.0, 92.0, 118.0, 141.0, 115.0, 111.0, 70.0, 42.0, 36.0, 24.0, 11.0, 6.0, 4.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6824002265930176, -2.5637271404266357, -2.445053815841675, -2.326380729675293, -2.207707643508911, -2.0890345573425293, -1.9703612327575684, -1.8516881465911865, -1.7330150604248047, -1.6143418550491333, -1.4956687688827515, -1.37699556350708, -1.2583224773406982, -1.1396492719650269, -1.0209760665893555, -0.9023029804229736, -0.7836297750473022, -0.6649566292762756, -0.546283483505249, -0.4276103079319, -0.3089371621608734, -0.19026398658752441, -0.0715908408164978, 0.04708230495452881, 0.16575545072555542, 0.28442859649658203, 0.40310174226760864, 0.5217748880386353, 0.6404480934143066, 0.7591212391853333, 0.8777943849563599, 0.9964675307273865, 1.115140676498413, 1.2338138818740845, 1.3524869680404663, 1.4711601734161377, 1.5898332595825195, 1.708506464958191, 1.8271796703338623, 1.9458527565002441, 2.064525842666626, 2.183198928833008, 2.3018722534179688, 2.4205453395843506, 2.5392184257507324, 2.6578917503356934, 2.776564836502075, 2.895237922668457, 3.013911247253418, 3.1325843334198, 3.2512576580047607, 3.3699307441711426, 3.4886038303375244, 3.6072769165039062, 3.725950241088867, 3.844623327255249, 3.963296413421631, 4.081969738006592, 4.2006425857543945, 4.3193159103393555, 4.437989234924316, 4.556662082672119, 4.67533540725708, 4.794008255004883, 4.912681579589844]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 3.0, 11.0, 8.0, 12.0, 12.0, 22.0, 22.0, 38.0, 56.0, 96.0, 155.0, 201.0, 317.0, 515.0, 1002.0, 2458.0, 8704.0, 218655.0, 3944652.0, 12499.0, 2696.0, 1111.0, 491.0, 231.0, 113.0, 63.0, 39.0, 25.0, 15.0, 13.0, 11.0, 9.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849609375, -2.7785491943359375, -2.707489013671875, -2.6364288330078125, -2.56536865234375, -2.4943084716796875, -2.423248291015625, -2.3521881103515625, -2.2811279296875, -2.2100677490234375, -2.139007568359375, -2.0679473876953125, -1.99688720703125, -1.9258270263671875, -1.854766845703125, -1.7837066650390625, -1.712646484375, -1.6415863037109375, -1.570526123046875, -1.4994659423828125, -1.42840576171875, -1.3573455810546875, -1.286285400390625, -1.2152252197265625, -1.1441650390625, -1.0731048583984375, -1.002044677734375, -0.9309844970703125, -0.85992431640625, -0.7888641357421875, -0.717803955078125, -0.6467437744140625, -0.57568359375, -0.5046234130859375, -0.433563232421875, -0.3625030517578125, -0.29144287109375, -0.2203826904296875, -0.149322509765625, -0.0782623291015625, -0.0072021484375, 0.0638580322265625, 0.134918212890625, 0.2059783935546875, 0.27703857421875, 0.3480987548828125, 0.419158935546875, 0.4902191162109375, 0.561279296875, 0.6323394775390625, 0.703399658203125, 0.7744598388671875, 0.84552001953125, 0.9165802001953125, 0.987640380859375, 1.0587005615234375, 1.1297607421875, 1.2008209228515625, 1.271881103515625, 1.3429412841796875, 1.41400146484375, 1.4850616455078125, 1.556121826171875, 1.6271820068359375, 1.6982421875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 11.0, 21.0, 22.0, 29.0, 100.0, 212.0, 243.0, 174.0, 83.0, 37.0, 12.0, 18.0, 14.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11944580078125, -0.11647891998291016, -0.11351203918457031, -0.11054515838623047, -0.10757827758789062, -0.10461139678955078, -0.10164451599121094, -0.0986776351928711, -0.09571075439453125, -0.0927438735961914, -0.08977699279785156, -0.08681011199951172, -0.08384323120117188, -0.08087635040283203, -0.07790946960449219, -0.07494258880615234, -0.0719757080078125, -0.06900882720947266, -0.06604194641113281, -0.06307506561279297, -0.060108184814453125, -0.05714130401611328, -0.05417442321777344, -0.051207542419433594, -0.04824066162109375, -0.045273780822753906, -0.04230690002441406, -0.03934001922607422, -0.036373138427734375, -0.03340625762939453, -0.030439376831054688, -0.027472496032714844, -0.024505615234375, -0.021538734436035156, -0.018571853637695312, -0.015604972839355469, -0.012638092041015625, -0.009671211242675781, -0.0067043304443359375, -0.0037374496459960938, -0.00077056884765625, 0.0021963119506835938, 0.0051631927490234375, 0.008130073547363281, 0.011096954345703125, 0.014063835144042969, 0.017030715942382812, 0.019997596740722656, 0.0229644775390625, 0.025931358337402344, 0.028898239135742188, 0.03186511993408203, 0.034832000732421875, 0.03779888153076172, 0.04076576232910156, 0.043732643127441406, 0.04669952392578125, 0.049666404724121094, 0.05263328552246094, 0.05560016632080078, 0.058567047119140625, 0.06153392791748047, 0.06450080871582031, 0.06746768951416016, 0.0704345703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 9.0, 16.0, 13.0, 28.0, 36.0, 75.0, 170.0, 1212.0, 786609.0, 3404436.0, 1330.0, 172.0, 62.0, 30.0, 24.0, 13.0, 12.0, 9.0, 4.0, 6.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.720703125, -2.61614990234375, -2.5115966796875, -2.40704345703125, -2.302490234375, -2.19793701171875, -2.0933837890625, -1.98883056640625, -1.88427734375, -1.77972412109375, -1.6751708984375, -1.57061767578125, -1.466064453125, -1.36151123046875, -1.2569580078125, -1.15240478515625, -1.0478515625, -0.94329833984375, -0.8387451171875, -0.73419189453125, -0.629638671875, -0.52508544921875, -0.4205322265625, -0.31597900390625, -0.21142578125, -0.10687255859375, -0.0023193359375, 0.10223388671875, 0.206787109375, 0.31134033203125, 0.4158935546875, 0.52044677734375, 0.625, 0.72955322265625, 0.8341064453125, 0.93865966796875, 1.043212890625, 1.14776611328125, 1.2523193359375, 1.35687255859375, 1.46142578125, 1.56597900390625, 1.6705322265625, 1.77508544921875, 1.879638671875, 1.98419189453125, 2.0887451171875, 2.19329833984375, 2.2978515625, 2.40240478515625, 2.5069580078125, 2.61151123046875, 2.716064453125, 2.82061767578125, 2.9251708984375, 3.02972412109375, 3.13427734375, 3.23883056640625, 3.3433837890625, 3.44793701171875, 3.552490234375, 3.65704345703125, 3.7615966796875, 3.86614990234375, 3.970703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 1.0, 4.0, 7.0, 12.0, 9.0, 11.0, 30.0, 43.0, 75.0, 137.0, 363.0, 1864.0, 976.0, 259.0, 112.0, 55.0, 29.0, 38.0, 19.0, 11.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.14306640625, -0.1391744613647461, -0.1352825164794922, -0.13139057159423828, -0.12749862670898438, -0.12360668182373047, -0.11971473693847656, -0.11582279205322266, -0.11193084716796875, -0.10803890228271484, -0.10414695739746094, -0.10025501251220703, -0.09636306762695312, -0.09247112274169922, -0.08857917785644531, -0.0846872329711914, -0.0807952880859375, -0.0769033432006836, -0.07301139831542969, -0.06911945343017578, -0.06522750854492188, -0.06133556365966797, -0.05744361877441406, -0.053551673889160156, -0.04965972900390625, -0.045767784118652344, -0.04187583923339844, -0.03798389434814453, -0.034091949462890625, -0.03020000457763672, -0.026308059692382812, -0.022416114807128906, -0.018524169921875, -0.014632225036621094, -0.010740280151367188, -0.006848335266113281, -0.002956390380859375, 0.0009355545043945312, 0.0048274993896484375, 0.008719444274902344, 0.01261138916015625, 0.016503334045410156, 0.020395278930664062, 0.02428722381591797, 0.028179168701171875, 0.03207111358642578, 0.03596305847167969, 0.039855003356933594, 0.0437469482421875, 0.047638893127441406, 0.05153083801269531, 0.05542278289794922, 0.059314727783203125, 0.06320667266845703, 0.06709861755371094, 0.07099056243896484, 0.07488250732421875, 0.07877445220947266, 0.08266639709472656, 0.08655834197998047, 0.09045028686523438, 0.09434223175048828, 0.09823417663574219, 0.1021261215209961, 0.10601806640625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 16.0, 23.0, 75.0, 347.0, 417.0, 95.0, 16.0, 9.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.921736240386963, -1.8760442733764648, -1.8303521871566772, -1.7846602201461792, -1.7389682531356812, -1.693276286125183, -1.6475841999053955, -1.6018922328948975, -1.5562002658843994, -1.5105082988739014, -1.4648162126541138, -1.4191242456436157, -1.3734322786331177, -1.3277403116226196, -1.282048225402832, -1.236356258392334, -1.190664291381836, -1.144972324371338, -1.0992802381515503, -1.0535882711410522, -1.0078963041305542, -0.9622042775154114, -0.9165122509002686, -0.8708202838897705, -0.8251281976699829, -0.7794361710548401, -0.733744204044342, -0.6880521774291992, -0.6423602104187012, -0.5966681838035583, -0.5509761571884155, -0.5052841901779175, -0.45959222316741943, -0.413900226354599, -0.36820822954177856, -0.32251620292663574, -0.2768242359161377, -0.23113222420215607, -0.18544021248817444, -0.139748215675354, -0.09405621886253357, -0.048364218324422836, -0.0026722177863121033, 0.04301978647708893, 0.08871178328990936, 0.1344037801027298, 0.18009579181671143, 0.22578778862953186, 0.2714797854423523, 0.31717178225517273, 0.36286377906799316, 0.408555805683136, 0.45424777269363403, 0.49993979930877686, 0.5456317663192749, 0.5913237929344177, 0.6370158195495605, 0.6827078461647034, 0.7283998131752014, 0.7740918397903442, 0.8197838068008423, 0.8654758334159851, 0.9111678600311279, 0.956859827041626, 1.002551794052124]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 3.0, 6.0, 6.0, 9.0, 6.0, 8.0, 18.0, 13.0, 20.0, 34.0, 37.0, 45.0, 49.0, 40.0, 77.0, 62.0, 61.0, 67.0, 66.0, 63.0, 48.0, 49.0, 35.0, 37.0, 24.0, 24.0, 18.0, 12.0, 11.0, 9.0, 7.0, 9.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3199346661567688, -0.3076961636543274, -0.295457661151886, -0.2832191586494446, -0.2709806561470032, -0.25874215364456177, -0.24650365114212036, -0.23426514863967896, -0.22202664613723755, -0.20978814363479614, -0.19754964113235474, -0.18531113862991333, -0.17307263612747192, -0.16083413362503052, -0.1485956311225891, -0.1363571286201477, -0.12411864101886749, -0.11188013851642609, -0.09964163601398468, -0.08740313351154327, -0.07516463100910187, -0.06292612850666046, -0.05068763345479965, -0.038449130952358246, -0.02621062844991684, -0.013972126878798008, -0.0017336253076791763, 0.01050487533211708, 0.022743377834558487, 0.03498188033699989, 0.047220379114151, 0.05945888161659241, 0.07169738411903381, 0.08393588662147522, 0.09617438912391663, 0.10841289162635803, 0.12065139412879944, 0.13288989663124084, 0.14512839913368225, 0.15736690163612366, 0.16960540413856506, 0.18184390664100647, 0.19408240914344788, 0.20632091164588928, 0.2185594141483307, 0.2307979166507721, 0.2430364191532135, 0.2552749216556549, 0.2675133943557739, 0.27975189685821533, 0.29199039936065674, 0.30422890186309814, 0.31646740436553955, 0.32870590686798096, 0.34094440937042236, 0.35318291187286377, 0.3654214143753052, 0.3776599168777466, 0.389898419380188, 0.4021369218826294, 0.4143754243850708, 0.4266139268875122, 0.4388524293899536, 0.451090931892395, 0.4633294343948364]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 9.0, 9.0, 18.0, 16.0, 35.0, 58.0, 82.0, 167.0, 271.0, 625.0, 1582.0, 5221.0, 42771.0, 909943.0, 77441.0, 6921.0, 1901.0, 726.0, 336.0, 174.0, 93.0, 42.0, 37.0, 21.0, 14.0, 14.0, 7.0, 4.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80712890625, -0.7767715454101562, -0.7464141845703125, -0.7160568237304688, -0.685699462890625, -0.6553421020507812, -0.6249847412109375, -0.5946273803710938, -0.56427001953125, -0.5339126586914062, -0.5035552978515625, -0.47319793701171875, -0.442840576171875, -0.41248321533203125, -0.3821258544921875, -0.35176849365234375, -0.3214111328125, -0.29105377197265625, -0.2606964111328125, -0.23033905029296875, -0.199981689453125, -0.16962432861328125, -0.1392669677734375, -0.10890960693359375, -0.07855224609375, -0.04819488525390625, -0.0178375244140625, 0.01251983642578125, 0.042877197265625, 0.07323455810546875, 0.1035919189453125, 0.13394927978515625, 0.164306640625, 0.19466400146484375, 0.2250213623046875, 0.25537872314453125, 0.285736083984375, 0.31609344482421875, 0.3464508056640625, 0.37680816650390625, 0.40716552734375, 0.43752288818359375, 0.4678802490234375, 0.49823760986328125, 0.528594970703125, 0.5589523315429688, 0.5893096923828125, 0.6196670532226562, 0.6500244140625, 0.6803817749023438, 0.7107391357421875, 0.7410964965820312, 0.771453857421875, 0.8018112182617188, 0.8321685791015625, 0.8625259399414062, 0.89288330078125, 0.9232406616210938, 0.9535980224609375, 0.9839553833007812, 1.014312744140625, 1.0446701049804688, 1.0750274658203125, 1.1053848266601562, 1.1357421875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 11.0, 13.0, 28.0, 77.0, 155.0, 225.0, 220.0, 150.0, 56.0, 26.0, 12.0, 12.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11663818359375, -0.11363029479980469, -0.11062240600585938, -0.10761451721191406, -0.10460662841796875, -0.10159873962402344, -0.09859085083007812, -0.09558296203613281, -0.0925750732421875, -0.08956718444824219, -0.08655929565429688, -0.08355140686035156, -0.08054351806640625, -0.07753562927246094, -0.07452774047851562, -0.07151985168457031, -0.068511962890625, -0.06550407409667969, -0.062496185302734375, -0.05948829650878906, -0.05648040771484375, -0.05347251892089844, -0.050464630126953125, -0.04745674133300781, -0.0444488525390625, -0.04144096374511719, -0.038433074951171875, -0.03542518615722656, -0.03241729736328125, -0.029409408569335938, -0.026401519775390625, -0.023393630981445312, -0.0203857421875, -0.017377853393554688, -0.014369964599609375, -0.011362075805664062, -0.00835418701171875, -0.0053462982177734375, -0.002338409423828125, 0.0006694793701171875, 0.0036773681640625, 0.0066852569580078125, 0.009693145751953125, 0.012701034545898438, 0.01570892333984375, 0.018716812133789062, 0.021724700927734375, 0.024732589721679688, 0.027740478515625, 0.030748367309570312, 0.033756256103515625, 0.03676414489746094, 0.03977203369140625, 0.04277992248535156, 0.045787811279296875, 0.04879570007324219, 0.0518035888671875, 0.05481147766113281, 0.057819366455078125, 0.06082725524902344, 0.06383514404296875, 0.06684303283691406, 0.06985092163085938, 0.07285881042480469, 0.07586669921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 6.0, 6.0, 13.0, 10.0, 12.0, 41.0, 57.0, 102.0, 221.0, 449.0, 1106.0, 3514.0, 14365.0, 85960.0, 520110.0, 356825.0, 51931.0, 9638.0, 2476.0, 899.0, 353.0, 184.0, 97.0, 57.0, 43.0, 18.0, 19.0, 12.0, 9.0, 4.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.481689453125, -0.4660835266113281, -0.45047760009765625, -0.4348716735839844, -0.4192657470703125, -0.4036598205566406, -0.38805389404296875, -0.3724479675292969, -0.356842041015625, -0.3412361145019531, -0.32563018798828125, -0.3100242614746094, -0.2944183349609375, -0.2788124084472656, -0.26320648193359375, -0.24760055541992188, -0.23199462890625, -0.21638870239257812, -0.20078277587890625, -0.18517684936523438, -0.1695709228515625, -0.15396499633789062, -0.13835906982421875, -0.12275314331054688, -0.107147216796875, -0.09154129028320312, -0.07593536376953125, -0.060329437255859375, -0.0447235107421875, -0.029117584228515625, -0.01351165771484375, 0.002094268798828125, 0.0177001953125, 0.033306121826171875, 0.04891204833984375, 0.06451797485351562, 0.0801239013671875, 0.09572982788085938, 0.11133575439453125, 0.12694168090820312, 0.142547607421875, 0.15815353393554688, 0.17375946044921875, 0.18936538696289062, 0.2049713134765625, 0.22057723999023438, 0.23618316650390625, 0.2517890930175781, 0.26739501953125, 0.2830009460449219, 0.29860687255859375, 0.3142127990722656, 0.3298187255859375, 0.3454246520996094, 0.36103057861328125, 0.3766365051269531, 0.392242431640625, 0.4078483581542969, 0.42345428466796875, 0.4390602111816406, 0.4546661376953125, 0.4702720642089844, 0.48587799072265625, 0.5014839172363281, 0.51708984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 6.0, 7.0, 4.0, 15.0, 13.0, 15.0, 15.0, 19.0, 30.0, 29.0, 35.0, 42.0, 51.0, 38.0, 36.0, 50.0, 57.0, 58.0, 45.0, 42.0, 60.0, 55.0, 45.0, 39.0, 33.0, 26.0, 28.0, 23.0, 14.0, 18.0, 13.0, 9.0, 6.0, 6.0, 5.0, 7.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19287109375, -0.18605804443359375, -0.1792449951171875, -0.17243194580078125, -0.165618896484375, -0.15880584716796875, -0.1519927978515625, -0.14517974853515625, -0.13836669921875, -0.13155364990234375, -0.1247406005859375, -0.11792755126953125, -0.111114501953125, -0.10430145263671875, -0.0974884033203125, -0.09067535400390625, -0.0838623046875, -0.07704925537109375, -0.0702362060546875, -0.06342315673828125, -0.056610107421875, -0.04979705810546875, -0.0429840087890625, -0.03617095947265625, -0.02935791015625, -0.02254486083984375, -0.0157318115234375, -0.00891876220703125, -0.002105712890625, 0.00470733642578125, 0.0115203857421875, 0.01833343505859375, 0.025146484375, 0.03195953369140625, 0.0387725830078125, 0.04558563232421875, 0.052398681640625, 0.05921173095703125, 0.0660247802734375, 0.07283782958984375, 0.07965087890625, 0.08646392822265625, 0.0932769775390625, 0.10009002685546875, 0.106903076171875, 0.11371612548828125, 0.1205291748046875, 0.12734222412109375, 0.1341552734375, 0.14096832275390625, 0.1477813720703125, 0.15459442138671875, 0.161407470703125, 0.16822052001953125, 0.1750335693359375, 0.18184661865234375, 0.18865966796875, 0.19547271728515625, 0.2022857666015625, 0.20909881591796875, 0.215911865234375, 0.22272491455078125, 0.2295379638671875, 0.23635101318359375, 0.2431640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 13.0, 8.0, 11.0, 27.0, 35.0, 68.0, 140.0, 382.0, 1229.0, 7044.0, 530104.0, 500548.0, 7025.0, 1240.0, 359.0, 154.0, 68.0, 48.0, 20.0, 11.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.923828125, -0.8995132446289062, -0.8751983642578125, -0.8508834838867188, -0.826568603515625, -0.8022537231445312, -0.7779388427734375, -0.7536239624023438, -0.72930908203125, -0.7049942016601562, -0.6806793212890625, -0.6563644409179688, -0.632049560546875, -0.6077346801757812, -0.5834197998046875, -0.5591049194335938, -0.5347900390625, -0.5104751586914062, -0.4861602783203125, -0.46184539794921875, -0.437530517578125, -0.41321563720703125, -0.3889007568359375, -0.36458587646484375, -0.34027099609375, -0.31595611572265625, -0.2916412353515625, -0.26732635498046875, -0.243011474609375, -0.21869659423828125, -0.1943817138671875, -0.17006683349609375, -0.145751953125, -0.12143707275390625, -0.0971221923828125, -0.07280731201171875, -0.048492431640625, -0.02417755126953125, 0.0001373291015625, 0.02445220947265625, 0.04876708984375, 0.07308197021484375, 0.0973968505859375, 0.12171173095703125, 0.146026611328125, 0.17034149169921875, 0.1946563720703125, 0.21897125244140625, 0.2432861328125, 0.26760101318359375, 0.2919158935546875, 0.31623077392578125, 0.340545654296875, 0.36486053466796875, 0.3891754150390625, 0.41349029541015625, 0.43780517578125, 0.46212005615234375, 0.4864349365234375, 0.5107498168945312, 0.535064697265625, 0.5593795776367188, 0.5836944580078125, 0.6080093383789062, 0.63232421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 5.0, 11.0, 17.0, 25.0, 20.0, 25.0, 26.0, 41.0, 44.0, 62.0, 66.0, 98.0, 115.0, 92.0, 69.0, 55.0, 50.0, 35.0, 35.0, 25.0, 22.0, 13.0, 13.0, 6.0, 6.0, 10.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024020671844482422, -0.00023213960230350494, -0.00022407248616218567, -0.0002160053700208664, -0.00020793825387954712, -0.00019987113773822784, -0.00019180402159690857, -0.0001837369054555893, -0.00017566978931427002, -0.00016760267317295074, -0.00015953555703163147, -0.0001514684408903122, -0.00014340132474899292, -0.00013533420860767365, -0.00012726709246635437, -0.0001191999763250351, -0.00011113286018371582, -0.00010306574404239655, -9.499862790107727e-05, -8.6931511759758e-05, -7.886439561843872e-05, -7.079727947711945e-05, -6.273016333580017e-05, -5.4663047194480896e-05, -4.659593105316162e-05, -3.8528814911842346e-05, -3.046169877052307e-05, -2.2394582629203796e-05, -1.4327466487884521e-05, -6.260350346565247e-06, 1.8067657947540283e-06, 9.873881936073303e-06, 1.7940998077392578e-05, 2.6008114218711853e-05, 3.407523036003113e-05, 4.21423465013504e-05, 5.020946264266968e-05, 5.827657878398895e-05, 6.634369492530823e-05, 7.44108110666275e-05, 8.247792720794678e-05, 9.054504334926605e-05, 9.861215949058533e-05, 0.0001066792756319046, 0.00011474639177322388, 0.00012281350791454315, 0.00013088062405586243, 0.0001389477401971817, 0.00014701485633850098, 0.00015508197247982025, 0.00016314908862113953, 0.0001712162047624588, 0.00017928332090377808, 0.00018735043704509735, 0.00019541755318641663, 0.0002034846693277359, 0.00021155178546905518, 0.00021961890161037445, 0.00022768601775169373, 0.000235753133893013, 0.00024382025003433228, 0.00025188736617565155, 0.0002599544823169708, 0.0002680215984582901, 0.0002760887145996094]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 5.0, 6.0, 7.0, 25.0, 30.0, 30.0, 68.0, 97.0, 160.0, 234.0, 466.0, 920.0, 2233.0, 9873.0, 158751.0, 837850.0, 30352.0, 4369.0, 1460.0, 651.0, 372.0, 229.0, 133.0, 86.0, 42.0, 40.0, 18.0, 12.0, 13.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.421875, -0.40517425537109375, -0.3884735107421875, -0.37177276611328125, -0.355072021484375, -0.33837127685546875, -0.3216705322265625, -0.30496978759765625, -0.28826904296875, -0.27156829833984375, -0.2548675537109375, -0.23816680908203125, -0.221466064453125, -0.20476531982421875, -0.1880645751953125, -0.17136383056640625, -0.1546630859375, -0.13796234130859375, -0.1212615966796875, -0.10456085205078125, -0.087860107421875, -0.07115936279296875, -0.0544586181640625, -0.03775787353515625, -0.02105712890625, -0.00435638427734375, 0.0123443603515625, 0.02904510498046875, 0.045745849609375, 0.06244659423828125, 0.0791473388671875, 0.09584808349609375, 0.112548828125, 0.12924957275390625, 0.1459503173828125, 0.16265106201171875, 0.179351806640625, 0.19605255126953125, 0.2127532958984375, 0.22945404052734375, 0.24615478515625, 0.26285552978515625, 0.2795562744140625, 0.29625701904296875, 0.312957763671875, 0.32965850830078125, 0.3463592529296875, 0.36305999755859375, 0.3797607421875, 0.39646148681640625, 0.4131622314453125, 0.42986297607421875, 0.446563720703125, 0.46326446533203125, 0.4799652099609375, 0.49666595458984375, 0.51336669921875, 0.5300674438476562, 0.5467681884765625, 0.5634689331054688, 0.580169677734375, 0.5968704223632812, 0.6135711669921875, 0.6302719116210938, 0.64697265625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 7.0, 12.0, 27.0, 32.0, 59.0, 124.0, 186.0, 211.0, 146.0, 88.0, 43.0, 26.0, 22.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2489013671875, -0.2403888702392578, -0.23187637329101562, -0.22336387634277344, -0.21485137939453125, -0.20633888244628906, -0.19782638549804688, -0.1893138885498047, -0.1808013916015625, -0.1722888946533203, -0.16377639770507812, -0.15526390075683594, -0.14675140380859375, -0.13823890686035156, -0.12972640991210938, -0.12121391296386719, -0.112701416015625, -0.10418891906738281, -0.09567642211914062, -0.08716392517089844, -0.07865142822265625, -0.07013893127441406, -0.061626434326171875, -0.05311393737792969, -0.0446014404296875, -0.03608894348144531, -0.027576446533203125, -0.019063949584960938, -0.01055145263671875, -0.0020389556884765625, 0.006473541259765625, 0.014986038208007812, 0.02349853515625, 0.03201103210449219, 0.040523529052734375, 0.04903602600097656, 0.05754852294921875, 0.06606101989746094, 0.07457351684570312, 0.08308601379394531, 0.0915985107421875, 0.10011100769042969, 0.10862350463867188, 0.11713600158691406, 0.12564849853515625, 0.13416099548339844, 0.14267349243164062, 0.1511859893798828, 0.159698486328125, 0.1682109832763672, 0.17672348022460938, 0.18523597717285156, 0.19374847412109375, 0.20226097106933594, 0.21077346801757812, 0.2192859649658203, 0.2277984619140625, 0.2363109588623047, 0.24482345581054688, 0.25333595275878906, 0.26184844970703125, 0.27036094665527344, 0.2788734436035156, 0.2873859405517578, 0.2958984375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 9.0, 14.0, 37.0, 103.0, 270.0, 307.0, 156.0, 63.0, 28.0, 10.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.9216318130493164, -3.7715790271759033, -3.6215262413024902, -3.471473455429077, -3.321420669555664, -3.171367883682251, -3.021315097808838, -2.871262550354004, -2.7212095260620117, -2.5711567401885986, -2.4211039543151855, -2.2710511684417725, -2.1209983825683594, -1.9709455966949463, -1.8208929300308228, -1.6708401441574097, -1.5207874774932861, -1.370734691619873, -1.22068190574646, -1.0706291198730469, -0.9205763936042786, -0.7705236077308655, -0.6204708814620972, -0.4704180955886841, -0.320365309715271, -0.1703125387430191, -0.020259767770767212, 0.1297929883003235, 0.2798457741737366, 0.42989856004714966, 0.579951286315918, 0.730004072189331, 0.8800568580627441, 1.0301096439361572, 1.1801624298095703, 1.3302152156829834, 1.4802680015563965, 1.6303207874298096, 1.780373454093933, 1.9304262399673462, 2.080479145050049, 2.230531930923462, 2.380584716796875, 2.530637502670288, 2.680690288543701, 2.8307430744171143, 2.9807958602905273, 3.1308484077453613, 3.2809011936187744, 3.4309539794921875, 3.5810067653656006, 3.7310595512390137, 3.8811123371124268, 4.03116512298584, 4.181217670440674, 4.331270694732666, 4.4813232421875, 4.631375789642334, 4.781428813934326, 4.93148136138916, 5.081534385681152, 5.231586933135986, 5.3816399574279785, 5.5316925048828125, 5.681745529174805]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 7.0, 10.0, 12.0, 14.0, 13.0, 26.0, 18.0, 27.0, 43.0, 52.0, 55.0, 52.0, 60.0, 60.0, 62.0, 72.0, 62.0, 66.0, 50.0, 49.0, 40.0, 29.0, 24.0, 21.0, 23.0, 12.0, 12.0, 12.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.242246389389038, -2.1774702072143555, -2.112694025039673, -2.0479178428649902, -1.9831416606903076, -1.918365478515625, -1.8535891771316528, -1.7888129949569702, -1.7240368127822876, -1.659260630607605, -1.5944844484329224, -1.5297082662582397, -1.4649319648742676, -1.400155782699585, -1.3353796005249023, -1.2706034183502197, -1.205827236175537, -1.1410510540008545, -1.0762748718261719, -1.0114986896514893, -0.9467224478721619, -0.8819462656974792, -0.8171700239181519, -0.7523938417434692, -0.6876176595687866, -0.622841477394104, -0.5580652952194214, -0.493289053440094, -0.4285128712654114, -0.36373668909072876, -0.29896047711372375, -0.23418426513671875, -0.16940808296203613, -0.10463188588619232, -0.03985568881034851, 0.0249205082654953, 0.08969670534133911, 0.15447288751602173, 0.21924909949302673, 0.28402531147003174, 0.34880149364471436, 0.413577675819397, 0.478353887796402, 0.543130099773407, 0.6079062819480896, 0.6726824641227722, 0.7374587059020996, 0.8022348880767822, 0.8670110702514648, 0.9317872524261475, 0.9965634346008301, 1.0613396167755127, 1.1261157989501953, 1.190891981124878, 1.25566828250885, 1.3204444646835327, 1.3852206468582153, 1.449996829032898, 1.5147730112075806, 1.5795491933822632, 1.6443254947662354, 1.709101676940918, 1.7738778591156006, 1.8386540412902832, 1.9034302234649658]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 10.0, 22.0, 33.0, 71.0, 213.0, 645.0, 6960.0, 4178475.0, 7195.0, 441.0, 116.0, 46.0, 25.0, 13.0, 4.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.234375, -7.06011962890625, -6.8858642578125, -6.71160888671875, -6.537353515625, -6.36309814453125, -6.1888427734375, -6.01458740234375, -5.84033203125, -5.66607666015625, -5.4918212890625, -5.31756591796875, -5.143310546875, -4.96905517578125, -4.7947998046875, -4.62054443359375, -4.4462890625, -4.27203369140625, -4.0977783203125, -3.92352294921875, -3.749267578125, -3.57501220703125, -3.4007568359375, -3.22650146484375, -3.05224609375, -2.87799072265625, -2.7037353515625, -2.52947998046875, -2.355224609375, -2.18096923828125, -2.0067138671875, -1.83245849609375, -1.658203125, -1.48394775390625, -1.3096923828125, -1.13543701171875, -0.961181640625, -0.78692626953125, -0.6126708984375, -0.43841552734375, -0.26416015625, -0.08990478515625, 0.0843505859375, 0.25860595703125, 0.432861328125, 0.60711669921875, 0.7813720703125, 0.95562744140625, 1.1298828125, 1.30413818359375, 1.4783935546875, 1.65264892578125, 1.826904296875, 2.00115966796875, 2.1754150390625, 2.34967041015625, 2.52392578125, 2.69818115234375, 2.8724365234375, 3.04669189453125, 3.220947265625, 3.39520263671875, 3.5694580078125, 3.74371337890625, 3.91796875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 10.0, 16.0, 37.0, 69.0, 102.0, 163.0, 204.0, 147.0, 117.0, 61.0, 33.0, 19.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.15781211853027344, -0.15400314331054688, -0.1501941680908203, -0.14638519287109375, -0.1425762176513672, -0.13876724243164062, -0.13495826721191406, -0.1311492919921875, -0.12734031677246094, -0.12353134155273438, -0.11972236633300781, -0.11591339111328125, -0.11210441589355469, -0.10829544067382812, -0.10448646545410156, -0.100677490234375, -0.09686851501464844, -0.09305953979492188, -0.08925056457519531, -0.08544158935546875, -0.08163261413574219, -0.07782363891601562, -0.07401466369628906, -0.0702056884765625, -0.06639671325683594, -0.06258773803710938, -0.05877876281738281, -0.05496978759765625, -0.05116081237792969, -0.047351837158203125, -0.04354286193847656, -0.03973388671875, -0.03592491149902344, -0.032115936279296875, -0.028306961059570312, -0.02449798583984375, -0.020689010620117188, -0.016880035400390625, -0.013071060180664062, -0.0092620849609375, -0.0054531097412109375, -0.001644134521484375, 0.0021648406982421875, 0.00597381591796875, 0.009782791137695312, 0.013591766357421875, 0.017400741577148438, 0.021209716796875, 0.025018692016601562, 0.028827667236328125, 0.03263664245605469, 0.03644561767578125, 0.04025459289550781, 0.044063568115234375, 0.04787254333496094, 0.0516815185546875, 0.05549049377441406, 0.059299468994140625, 0.06310844421386719, 0.06691741943359375, 0.07072639465332031, 0.07453536987304688, 0.07834434509277344, 0.0821533203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 13.0, 20.0, 29.0, 49.0, 49.0, 71.0, 91.0, 148.0, 219.0, 425.0, 1144.0, 7715.0, 267395.0, 3894496.0, 19239.0, 1996.0, 539.0, 235.0, 128.0, 84.0, 58.0, 37.0, 34.0, 20.0, 14.0, 10.0, 4.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9033203125, -1.85595703125, -1.80859375, -1.76123046875, -1.7138671875, -1.66650390625, -1.619140625, -1.57177734375, -1.5244140625, -1.47705078125, -1.4296875, -1.38232421875, -1.3349609375, -1.28759765625, -1.240234375, -1.19287109375, -1.1455078125, -1.09814453125, -1.05078125, -1.00341796875, -0.9560546875, -0.90869140625, -0.861328125, -0.81396484375, -0.7666015625, -0.71923828125, -0.671875, -0.62451171875, -0.5771484375, -0.52978515625, -0.482421875, -0.43505859375, -0.3876953125, -0.34033203125, -0.29296875, -0.24560546875, -0.1982421875, -0.15087890625, -0.103515625, -0.05615234375, -0.0087890625, 0.03857421875, 0.0859375, 0.13330078125, 0.1806640625, 0.22802734375, 0.275390625, 0.32275390625, 0.3701171875, 0.41748046875, 0.46484375, 0.51220703125, 0.5595703125, 0.60693359375, 0.654296875, 0.70166015625, 0.7490234375, 0.79638671875, 0.84375, 0.89111328125, 0.9384765625, 0.98583984375, 1.033203125, 1.08056640625, 1.1279296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 4.0, 8.0, 17.0, 24.0, 23.0, 50.0, 104.0, 292.0, 1225.0, 1799.0, 306.0, 105.0, 54.0, 24.0, 10.0, 8.0, 7.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.291259765625, -0.284942626953125, -0.27862548828125, -0.272308349609375, -0.2659912109375, -0.259674072265625, -0.25335693359375, -0.247039794921875, -0.24072265625, -0.234405517578125, -0.22808837890625, -0.221771240234375, -0.2154541015625, -0.209136962890625, -0.20281982421875, -0.196502685546875, -0.190185546875, -0.183868408203125, -0.17755126953125, -0.171234130859375, -0.1649169921875, -0.158599853515625, -0.15228271484375, -0.145965576171875, -0.1396484375, -0.133331298828125, -0.12701416015625, -0.120697021484375, -0.1143798828125, -0.108062744140625, -0.10174560546875, -0.095428466796875, -0.089111328125, -0.082794189453125, -0.07647705078125, -0.070159912109375, -0.0638427734375, -0.057525634765625, -0.05120849609375, -0.044891357421875, -0.03857421875, -0.032257080078125, -0.02593994140625, -0.019622802734375, -0.0133056640625, -0.006988525390625, -0.00067138671875, 0.005645751953125, 0.011962890625, 0.018280029296875, 0.02459716796875, 0.030914306640625, 0.0372314453125, 0.043548583984375, 0.04986572265625, 0.056182861328125, 0.0625, 0.068817138671875, 0.07513427734375, 0.081451416015625, 0.0877685546875, 0.094085693359375, 0.10040283203125, 0.106719970703125, 0.113037109375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 9.0, 15.0, 71.0, 220.0, 421.0, 184.0, 60.0, 16.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5949995517730713, -2.527709722518921, -2.4604198932647705, -2.39313006401062, -2.3258402347564697, -2.2585504055023193, -2.191260576248169, -2.1239709854125977, -2.0566811561584473, -1.9893913269042969, -1.9221014976501465, -1.854811668395996, -1.7875218391418457, -1.7202320098876953, -1.6529422998428345, -1.585652470588684, -1.5183625221252441, -1.4510726928710938, -1.3837828636169434, -1.316493034362793, -1.2492032051086426, -1.1819133758544922, -1.1146236658096313, -1.047333836555481, -0.9800440073013306, -0.9127541780471802, -0.8454643487930298, -0.7781745791435242, -0.7108847498893738, -0.6435949206352234, -0.5763051509857178, -0.5090153217315674, -0.4417257308959961, -0.3744359016418457, -0.3071461021900177, -0.2398562878370285, -0.1725664734840393, -0.10527664422988892, -0.03798684477806091, 0.02930295467376709, 0.09659278392791748, 0.16388259828090668, 0.23117241263389587, 0.2984622120857239, 0.36575204133987427, 0.43304187059402466, 0.5003316402435303, 0.5676214694976807, 0.634911298751831, 0.7022011280059814, 0.7694909572601318, 0.8367807269096375, 0.9040705561637878, 0.9713603854179382, 1.0386501550674438, 1.1059399843215942, 1.1732298135757446, 1.240519642829895, 1.3078094720840454, 1.3750993013381958, 1.4423890113830566, 1.509678840637207, 1.5769686698913574, 1.6442584991455078, 1.7115483283996582]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 7.0, 13.0, 12.0, 20.0, 36.0, 42.0, 45.0, 70.0, 78.0, 88.0, 88.0, 101.0, 77.0, 77.0, 69.0, 49.0, 49.0, 27.0, 19.0, 15.0, 10.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7502862811088562, -0.7251657247543335, -0.7000452280044556, -0.6749246716499329, -0.6498041152954102, -0.6246835589408875, -0.5995630025863647, -0.5744425058364868, -0.5493219494819641, -0.5242013931274414, -0.4990808665752411, -0.47396034002304077, -0.44883978366851807, -0.42371922731399536, -0.39859870076179504, -0.3734781742095947, -0.348357617855072, -0.3232370615005493, -0.298116534948349, -0.2729960083961487, -0.24787545204162598, -0.22275491058826447, -0.19763436913490295, -0.17251382768154144, -0.14739328622817993, -0.12227274477481842, -0.09715220332145691, -0.0720316618680954, -0.04691112041473389, -0.021790578961372375, 0.0033299624919891357, 0.028450503945350647, 0.05357104539871216, 0.07869158685207367, 0.10381212830543518, 0.1289326697587967, 0.1540532112121582, 0.17917375266551971, 0.20429429411888123, 0.22941483557224274, 0.25453537702560425, 0.27965593338012695, 0.30477645993232727, 0.3298969864845276, 0.3550175428390503, 0.380138099193573, 0.4052586257457733, 0.43037915229797363, 0.45549970865249634, 0.48062026500701904, 0.505740761756897, 0.5308613181114197, 0.5559818744659424, 0.5811024308204651, 0.6062229871749878, 0.6313434839248657, 0.6564640402793884, 0.6815845966339111, 0.7067050933837891, 0.7318256497383118, 0.7569462060928345, 0.7820667624473572, 0.8071873188018799, 0.8323078155517578, 0.8574283719062805]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 4.0, 7.0, 11.0, 21.0, 37.0, 66.0, 94.0, 201.0, 379.0, 888.0, 2319.0, 9522.0, 161796.0, 815130.0, 49562.0, 5516.0, 1660.0, 647.0, 296.0, 181.0, 96.0, 44.0, 26.0, 21.0, 8.0, 9.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88330078125, -0.8541793823242188, -0.8250579833984375, -0.7959365844726562, -0.766815185546875, -0.7376937866210938, -0.7085723876953125, -0.6794509887695312, -0.65032958984375, -0.6212081909179688, -0.5920867919921875, -0.5629653930664062, -0.533843994140625, -0.5047225952148438, -0.4756011962890625, -0.44647979736328125, -0.4173583984375, -0.38823699951171875, -0.3591156005859375, -0.32999420166015625, -0.300872802734375, -0.27175140380859375, -0.2426300048828125, -0.21350860595703125, -0.18438720703125, -0.15526580810546875, -0.1261444091796875, -0.09702301025390625, -0.067901611328125, -0.03878021240234375, -0.0096588134765625, 0.01946258544921875, 0.048583984375, 0.07770538330078125, 0.1068267822265625, 0.13594818115234375, 0.165069580078125, 0.19419097900390625, 0.2233123779296875, 0.25243377685546875, 0.28155517578125, 0.31067657470703125, 0.3397979736328125, 0.36891937255859375, 0.398040771484375, 0.42716217041015625, 0.4562835693359375, 0.48540496826171875, 0.5145263671875, 0.5436477661132812, 0.5727691650390625, 0.6018905639648438, 0.631011962890625, 0.6601333618164062, 0.6892547607421875, 0.7183761596679688, 0.74749755859375, 0.7766189575195312, 0.8057403564453125, 0.8348617553710938, 0.863983154296875, 0.8931045532226562, 0.9222259521484375, 0.9513473510742188, 0.98046875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 15.0, 33.0, 59.0, 86.0, 135.0, 170.0, 168.0, 123.0, 94.0, 50.0, 29.0, 17.0, 4.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1514892578125, -0.14795207977294922, -0.14441490173339844, -0.14087772369384766, -0.13734054565429688, -0.1338033676147461, -0.1302661895751953, -0.12672901153564453, -0.12319183349609375, -0.11965465545654297, -0.11611747741699219, -0.1125802993774414, -0.10904312133789062, -0.10550594329833984, -0.10196876525878906, -0.09843158721923828, -0.0948944091796875, -0.09135723114013672, -0.08782005310058594, -0.08428287506103516, -0.08074569702148438, -0.0772085189819336, -0.07367134094238281, -0.07013416290283203, -0.06659698486328125, -0.06305980682373047, -0.05952262878417969, -0.055985450744628906, -0.052448272705078125, -0.048911094665527344, -0.04537391662597656, -0.04183673858642578, -0.038299560546875, -0.03476238250732422, -0.031225204467773438, -0.027688026428222656, -0.024150848388671875, -0.020613670349121094, -0.017076492309570312, -0.013539314270019531, -0.01000213623046875, -0.006464958190917969, -0.0029277801513671875, 0.0006093978881835938, 0.004146575927734375, 0.007683753967285156, 0.011220932006835938, 0.014758110046386719, 0.0182952880859375, 0.02183246612548828, 0.025369644165039062, 0.028906822204589844, 0.032444000244140625, 0.035981178283691406, 0.03951835632324219, 0.04305553436279297, 0.04659271240234375, 0.05012989044189453, 0.05366706848144531, 0.057204246520996094, 0.060741424560546875, 0.06427860260009766, 0.06781578063964844, 0.07135295867919922, 0.07489013671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 8.0, 9.0, 6.0, 17.0, 24.0, 26.0, 47.0, 104.0, 133.0, 298.0, 565.0, 1241.0, 2956.0, 8764.0, 32968.0, 167339.0, 540429.0, 232255.0, 44288.0, 10920.0, 3502.0, 1314.0, 649.0, 282.0, 145.0, 105.0, 52.0, 42.0, 24.0, 17.0, 9.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.383544921875, -0.3696479797363281, -0.35575103759765625, -0.3418540954589844, -0.3279571533203125, -0.3140602111816406, -0.30016326904296875, -0.2862663269042969, -0.272369384765625, -0.2584724426269531, -0.24457550048828125, -0.23067855834960938, -0.2167816162109375, -0.20288467407226562, -0.18898773193359375, -0.17509078979492188, -0.16119384765625, -0.14729690551757812, -0.13339996337890625, -0.11950302124023438, -0.1056060791015625, -0.09170913696289062, -0.07781219482421875, -0.06391525268554688, -0.050018310546875, -0.036121368408203125, -0.02222442626953125, -0.008327484130859375, 0.0055694580078125, 0.019466400146484375, 0.03336334228515625, 0.047260284423828125, 0.0611572265625, 0.07505416870117188, 0.08895111083984375, 0.10284805297851562, 0.1167449951171875, 0.13064193725585938, 0.14453887939453125, 0.15843582153320312, 0.172332763671875, 0.18622970581054688, 0.20012664794921875, 0.21402359008789062, 0.2279205322265625, 0.24181747436523438, 0.25571441650390625, 0.2696113586425781, 0.28350830078125, 0.2974052429199219, 0.31130218505859375, 0.3251991271972656, 0.3390960693359375, 0.3529930114746094, 0.36688995361328125, 0.3807868957519531, 0.394683837890625, 0.4085807800292969, 0.42247772216796875, 0.4363746643066406, 0.4502716064453125, 0.4641685485839844, 0.47806549072265625, 0.4919624328613281, 0.505859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 1.0, 13.0, 9.0, 15.0, 15.0, 13.0, 18.0, 22.0, 26.0, 41.0, 35.0, 33.0, 62.0, 53.0, 59.0, 56.0, 70.0, 55.0, 59.0, 50.0, 43.0, 41.0, 42.0, 30.0, 22.0, 24.0, 16.0, 11.0, 16.0, 8.0, 7.0, 6.0, 7.0, 5.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.28955078125, -0.2805938720703125, -0.271636962890625, -0.2626800537109375, -0.25372314453125, -0.2447662353515625, -0.235809326171875, -0.2268524169921875, -0.2178955078125, -0.2089385986328125, -0.199981689453125, -0.1910247802734375, -0.18206787109375, -0.1731109619140625, -0.164154052734375, -0.1551971435546875, -0.146240234375, -0.1372833251953125, -0.128326416015625, -0.1193695068359375, -0.11041259765625, -0.1014556884765625, -0.092498779296875, -0.0835418701171875, -0.0745849609375, -0.0656280517578125, -0.056671142578125, -0.0477142333984375, -0.03875732421875, -0.0298004150390625, -0.020843505859375, -0.0118865966796875, -0.0029296875, 0.0060272216796875, 0.014984130859375, 0.0239410400390625, 0.03289794921875, 0.0418548583984375, 0.050811767578125, 0.0597686767578125, 0.0687255859375, 0.0776824951171875, 0.086639404296875, 0.0955963134765625, 0.10455322265625, 0.1135101318359375, 0.122467041015625, 0.1314239501953125, 0.140380859375, 0.1493377685546875, 0.158294677734375, 0.1672515869140625, 0.17620849609375, 0.1851654052734375, 0.194122314453125, 0.2030792236328125, 0.2120361328125, 0.2209930419921875, 0.229949951171875, 0.2389068603515625, 0.24786376953125, 0.2568206787109375, 0.265777587890625, 0.2747344970703125, 0.28369140625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 7.0, 10.0, 25.0, 37.0, 85.0, 236.0, 831.0, 9831.0, 1014510.0, 21395.0, 1127.0, 287.0, 98.0, 37.0, 15.0, 15.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.806640625, -1.7686767578125, -1.730712890625, -1.6927490234375, -1.65478515625, -1.6168212890625, -1.578857421875, -1.5408935546875, -1.5029296875, -1.4649658203125, -1.427001953125, -1.3890380859375, -1.35107421875, -1.3131103515625, -1.275146484375, -1.2371826171875, -1.19921875, -1.1612548828125, -1.123291015625, -1.0853271484375, -1.04736328125, -1.0093994140625, -0.971435546875, -0.9334716796875, -0.8955078125, -0.8575439453125, -0.819580078125, -0.7816162109375, -0.74365234375, -0.7056884765625, -0.667724609375, -0.6297607421875, -0.591796875, -0.5538330078125, -0.515869140625, -0.4779052734375, -0.43994140625, -0.4019775390625, -0.364013671875, -0.3260498046875, -0.2880859375, -0.2501220703125, -0.212158203125, -0.1741943359375, -0.13623046875, -0.0982666015625, -0.060302734375, -0.0223388671875, 0.015625, 0.0535888671875, 0.091552734375, 0.1295166015625, 0.16748046875, 0.2054443359375, 0.243408203125, 0.2813720703125, 0.3193359375, 0.3572998046875, 0.395263671875, 0.4332275390625, 0.47119140625, 0.5091552734375, 0.547119140625, 0.5850830078125, 0.623046875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 12.0, 11.0, 16.0, 21.0, 19.0, 34.0, 36.0, 52.0, 49.0, 54.0, 111.0, 106.0, 95.0, 78.0, 50.0, 36.0, 39.0, 30.0, 23.0, 21.0, 15.0, 15.0, 8.0, 7.0, 9.0, 6.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0001590251922607422, -0.00015250593423843384, -0.0001459866762161255, -0.00013946741819381714, -0.0001329481601715088, -0.00012642890214920044, -0.00011990964412689209, -0.00011339038610458374, -0.00010687112808227539, -0.00010035187005996704, -9.383261203765869e-05, -8.731335401535034e-05, -8.079409599304199e-05, -7.427483797073364e-05, -6.775557994842529e-05, -6.123632192611694e-05, -5.4717063903808594e-05, -4.8197805881500244e-05, -4.1678547859191895e-05, -3.5159289836883545e-05, -2.8640031814575195e-05, -2.2120773792266846e-05, -1.5601515769958496e-05, -9.082257747650146e-06, -2.562999725341797e-06, 3.956258296966553e-06, 1.0475516319274902e-05, 1.6994774341583252e-05, 2.35140323638916e-05, 3.003329038619995e-05, 3.65525484085083e-05, 4.307180643081665e-05, 4.9591064453125e-05, 5.611032247543335e-05, 6.26295804977417e-05, 6.914883852005005e-05, 7.56680965423584e-05, 8.218735456466675e-05, 8.87066125869751e-05, 9.522587060928345e-05, 0.0001017451286315918, 0.00010826438665390015, 0.0001147836446762085, 0.00012130290269851685, 0.0001278221607208252, 0.00013434141874313354, 0.0001408606767654419, 0.00014737993478775024, 0.0001538991928100586, 0.00016041845083236694, 0.0001669377088546753, 0.00017345696687698364, 0.000179976224899292, 0.00018649548292160034, 0.0001930147409439087, 0.00019953399896621704, 0.0002060532569885254, 0.00021257251501083374, 0.0002190917730331421, 0.00022561103105545044, 0.0002321302890777588, 0.00023864954710006714, 0.0002451688051223755, 0.00025168806314468384, 0.0002582073211669922]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 1.0, 4.0, 7.0, 7.0, 8.0, 14.0, 20.0, 32.0, 41.0, 83.0, 144.0, 291.0, 483.0, 1059.0, 2661.0, 8984.0, 58934.0, 811759.0, 143278.0, 14271.0, 3712.0, 1399.0, 588.0, 329.0, 171.0, 91.0, 58.0, 37.0, 33.0, 16.0, 8.0, 9.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.396728515625, -0.38457489013671875, -0.3724212646484375, -0.36026763916015625, -0.348114013671875, -0.33596038818359375, -0.3238067626953125, -0.31165313720703125, -0.29949951171875, -0.28734588623046875, -0.2751922607421875, -0.26303863525390625, -0.250885009765625, -0.23873138427734375, -0.2265777587890625, -0.21442413330078125, -0.2022705078125, -0.19011688232421875, -0.1779632568359375, -0.16580963134765625, -0.153656005859375, -0.14150238037109375, -0.1293487548828125, -0.11719512939453125, -0.10504150390625, -0.09288787841796875, -0.0807342529296875, -0.06858062744140625, -0.056427001953125, -0.04427337646484375, -0.0321197509765625, -0.01996612548828125, -0.0078125, 0.00434112548828125, 0.0164947509765625, 0.02864837646484375, 0.040802001953125, 0.05295562744140625, 0.0651092529296875, 0.07726287841796875, 0.08941650390625, 0.10157012939453125, 0.1137237548828125, 0.12587738037109375, 0.138031005859375, 0.15018463134765625, 0.1623382568359375, 0.17449188232421875, 0.1866455078125, 0.19879913330078125, 0.2109527587890625, 0.22310638427734375, 0.235260009765625, 0.24741363525390625, 0.2595672607421875, 0.27172088623046875, 0.28387451171875, 0.29602813720703125, 0.3081817626953125, 0.32033538818359375, 0.332489013671875, 0.34464263916015625, 0.3567962646484375, 0.36894989013671875, 0.381103515625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 13.0, 17.0, 45.0, 65.0, 95.0, 133.0, 166.0, 159.0, 118.0, 60.0, 60.0, 16.0, 11.0, 12.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2080078125, -0.20122528076171875, -0.1944427490234375, -0.18766021728515625, -0.180877685546875, -0.17409515380859375, -0.1673126220703125, -0.16053009033203125, -0.15374755859375, -0.14696502685546875, -0.1401824951171875, -0.13339996337890625, -0.126617431640625, -0.11983489990234375, -0.1130523681640625, -0.10626983642578125, -0.0994873046875, -0.09270477294921875, -0.0859222412109375, -0.07913970947265625, -0.072357177734375, -0.06557464599609375, -0.0587921142578125, -0.05200958251953125, -0.04522705078125, -0.03844451904296875, -0.0316619873046875, -0.02487945556640625, -0.018096923828125, -0.01131439208984375, -0.0045318603515625, 0.00225067138671875, 0.009033203125, 0.01581573486328125, 0.0225982666015625, 0.02938079833984375, 0.036163330078125, 0.04294586181640625, 0.0497283935546875, 0.05651092529296875, 0.06329345703125, 0.07007598876953125, 0.0768585205078125, 0.08364105224609375, 0.090423583984375, 0.09720611572265625, 0.1039886474609375, 0.11077117919921875, 0.1175537109375, 0.12433624267578125, 0.1311187744140625, 0.13790130615234375, 0.144683837890625, 0.15146636962890625, 0.1582489013671875, 0.16503143310546875, 0.17181396484375, 0.17859649658203125, 0.1853790283203125, 0.19216156005859375, 0.198944091796875, 0.20572662353515625, 0.2125091552734375, 0.21929168701171875, 0.22607421875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 10.0, 25.0, 118.0, 405.0, 347.0, 80.0, 20.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.435122489929199, -7.201960563659668, -6.968798637390137, -6.7356367111206055, -6.502474784851074, -6.269312858581543, -6.03615140914917, -5.802989482879639, -5.569827556610107, -5.336665630340576, -5.103503704071045, -4.870341777801514, -4.637180328369141, -4.404018402099609, -4.170856475830078, -3.937694549560547, -3.7045326232910156, -3.4713706970214844, -3.238208770751953, -3.005047082901001, -2.7718851566314697, -2.5387232303619385, -2.3055615425109863, -2.072399616241455, -1.8392376899719238, -1.6060757637023926, -1.3729139566421509, -1.1397521495819092, -0.9065902233123779, -0.6734282970428467, -0.440266489982605, -0.20710468292236328, 0.02605724334716797, 0.25921911001205444, 0.4923809766769409, 0.7255428433418274, 0.9587047100067139, 1.1918666362762451, 1.4250284433364868, 1.6581902503967285, 1.8913521766662598, 2.124514102935791, 2.3576760292053223, 2.5908377170562744, 2.8239996433258057, 3.057161569595337, 3.290323257446289, 3.5234851837158203, 3.7566471099853516, 3.989809036254883, 4.222970962524414, 4.456132888793945, 4.689294815063477, 4.922456741333008, 5.155618190765381, 5.388780117034912, 5.621942043304443, 5.855103969573975, 6.088265895843506, 6.321427822113037, 6.55458927154541, 6.787751197814941, 7.020913124084473, 7.254075050354004, 7.487236976623535]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 6.0, 6.0, 5.0, 14.0, 11.0, 19.0, 32.0, 18.0, 32.0, 30.0, 40.0, 42.0, 41.0, 40.0, 52.0, 52.0, 41.0, 38.0, 58.0, 57.0, 39.0, 39.0, 50.0, 37.0, 27.0, 31.0, 21.0, 22.0, 23.0, 18.0, 9.0, 5.0, 8.0, 7.0, 5.0, 3.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7985286712646484, -1.7434810400009155, -1.6884334087371826, -1.6333857774734497, -1.5783381462097168, -1.5232905149459839, -1.468242883682251, -1.413195252418518, -1.3581476211547852, -1.3030999898910522, -1.2480523586273193, -1.1930047273635864, -1.1379570960998535, -1.0829094648361206, -1.0278618335723877, -0.9728142023086548, -0.9177665710449219, -0.862718939781189, -0.807671308517456, -0.7526236772537231, -0.6975760459899902, -0.6425284147262573, -0.5874807834625244, -0.5324331521987915, -0.4773855209350586, -0.4223378896713257, -0.3672902584075928, -0.31224262714385986, -0.25719499588012695, -0.20214736461639404, -0.14709973335266113, -0.09205210208892822, -0.03700447082519531, 0.018043160438537598, 0.07309079170227051, 0.12813842296600342, 0.18318605422973633, 0.23823368549346924, 0.29328131675720215, 0.34832894802093506, 0.40337657928466797, 0.4584242105484009, 0.5134718418121338, 0.5685194730758667, 0.6235671043395996, 0.6786147356033325, 0.7336623668670654, 0.7887099981307983, 0.8437576293945312, 0.8988052606582642, 0.9538528919219971, 1.00890052318573, 1.063948154449463, 1.1189957857131958, 1.1740434169769287, 1.2290910482406616, 1.2841386795043945, 1.3391863107681274, 1.3942339420318604, 1.4492815732955933, 1.5043292045593262, 1.559376835823059, 1.614424467086792, 1.669472098350525, 1.7245197296142578]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 11.0, 9.0, 16.0, 16.0, 40.0, 73.0, 120.0, 224.0, 517.0, 1668.0, 13157.0, 3902830.0, 268165.0, 5975.0, 954.0, 264.0, 112.0, 69.0, 30.0, 12.0, 7.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.10546875, -2.0498504638671875, -1.994232177734375, -1.9386138916015625, -1.88299560546875, -1.8273773193359375, -1.771759033203125, -1.7161407470703125, -1.6605224609375, -1.6049041748046875, -1.549285888671875, -1.4936676025390625, -1.43804931640625, -1.3824310302734375, -1.326812744140625, -1.2711944580078125, -1.215576171875, -1.1599578857421875, -1.104339599609375, -1.0487213134765625, -0.99310302734375, -0.9374847412109375, -0.881866455078125, -0.8262481689453125, -0.7706298828125, -0.7150115966796875, -0.659393310546875, -0.6037750244140625, -0.54815673828125, -0.4925384521484375, -0.436920166015625, -0.3813018798828125, -0.32568359375, -0.2700653076171875, -0.214447021484375, -0.1588287353515625, -0.10321044921875, -0.0475921630859375, 0.008026123046875, 0.0636444091796875, 0.1192626953125, 0.1748809814453125, 0.230499267578125, 0.2861175537109375, 0.34173583984375, 0.3973541259765625, 0.452972412109375, 0.5085906982421875, 0.564208984375, 0.6198272705078125, 0.675445556640625, 0.7310638427734375, 0.78668212890625, 0.8423004150390625, 0.897918701171875, 0.9535369873046875, 1.0091552734375, 1.0647735595703125, 1.120391845703125, 1.1760101318359375, 1.23162841796875, 1.2872467041015625, 1.342864990234375, 1.3984832763671875, 1.4541015625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 11.0, 17.0, 26.0, 56.0, 55.0, 102.0, 119.0, 156.0, 113.0, 111.0, 93.0, 62.0, 31.0, 20.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.161376953125, -0.15759658813476562, -0.15381622314453125, -0.15003585815429688, -0.1462554931640625, -0.14247512817382812, -0.13869476318359375, -0.13491439819335938, -0.131134033203125, -0.12735366821289062, -0.12357330322265625, -0.11979293823242188, -0.1160125732421875, -0.11223220825195312, -0.10845184326171875, -0.10467147827148438, -0.10089111328125, -0.09711074829101562, -0.09333038330078125, -0.08955001831054688, -0.0857696533203125, -0.08198928833007812, -0.07820892333984375, -0.07442855834960938, -0.070648193359375, -0.06686782836914062, -0.06308746337890625, -0.059307098388671875, -0.0555267333984375, -0.051746368408203125, -0.04796600341796875, -0.044185638427734375, -0.0404052734375, -0.036624908447265625, -0.03284454345703125, -0.029064178466796875, -0.0252838134765625, -0.021503448486328125, -0.01772308349609375, -0.013942718505859375, -0.010162353515625, -0.006381988525390625, -0.00260162353515625, 0.001178741455078125, 0.0049591064453125, 0.008739471435546875, 0.01251983642578125, 0.016300201416015625, 0.02008056640625, 0.023860931396484375, 0.02764129638671875, 0.031421661376953125, 0.0352020263671875, 0.038982391357421875, 0.04276275634765625, 0.046543121337890625, 0.050323486328125, 0.054103851318359375, 0.05788421630859375, 0.061664581298828125, 0.0654449462890625, 0.06922531127929688, 0.07300567626953125, 0.07678604125976562, 0.08056640625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 11.0, 20.0, 30.0, 64.0, 91.0, 234.0, 512.0, 1347.0, 6510.0, 227596.0, 3935048.0, 19224.0, 2310.0, 706.0, 287.0, 154.0, 75.0, 19.0, 20.0, 7.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.47265625, -1.434112548828125, -1.39556884765625, -1.357025146484375, -1.3184814453125, -1.279937744140625, -1.24139404296875, -1.202850341796875, -1.164306640625, -1.125762939453125, -1.08721923828125, -1.048675537109375, -1.0101318359375, -0.971588134765625, -0.93304443359375, -0.894500732421875, -0.85595703125, -0.817413330078125, -0.77886962890625, -0.740325927734375, -0.7017822265625, -0.663238525390625, -0.62469482421875, -0.586151123046875, -0.547607421875, -0.509063720703125, -0.47052001953125, -0.431976318359375, -0.3934326171875, -0.354888916015625, -0.31634521484375, -0.277801513671875, -0.2392578125, -0.200714111328125, -0.16217041015625, -0.123626708984375, -0.0850830078125, -0.046539306640625, -0.00799560546875, 0.030548095703125, 0.069091796875, 0.107635498046875, 0.14617919921875, 0.184722900390625, 0.2232666015625, 0.261810302734375, 0.30035400390625, 0.338897705078125, 0.37744140625, 0.415985107421875, 0.45452880859375, 0.493072509765625, 0.5316162109375, 0.570159912109375, 0.60870361328125, 0.647247314453125, 0.685791015625, 0.724334716796875, 0.76287841796875, 0.801422119140625, 0.8399658203125, 0.878509521484375, 0.91705322265625, 0.955596923828125, 0.994140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 8.0, 9.0, 14.0, 35.0, 63.0, 126.0, 298.0, 1186.0, 1692.0, 378.0, 124.0, 64.0, 23.0, 15.0, 10.0, 14.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.12624359130859375, -0.1207733154296875, -0.11530303955078125, -0.109832763671875, -0.10436248779296875, -0.0988922119140625, -0.09342193603515625, -0.08795166015625, -0.08248138427734375, -0.0770111083984375, -0.07154083251953125, -0.066070556640625, -0.06060028076171875, -0.0551300048828125, -0.04965972900390625, -0.044189453125, -0.03871917724609375, -0.0332489013671875, -0.02777862548828125, -0.022308349609375, -0.01683807373046875, -0.0113677978515625, -0.00589752197265625, -0.00042724609375, 0.00504302978515625, 0.0105133056640625, 0.01598358154296875, 0.021453857421875, 0.02692413330078125, 0.0323944091796875, 0.03786468505859375, 0.0433349609375, 0.04880523681640625, 0.0542755126953125, 0.05974578857421875, 0.065216064453125, 0.07068634033203125, 0.0761566162109375, 0.08162689208984375, 0.08709716796875, 0.09256744384765625, 0.0980377197265625, 0.10350799560546875, 0.108978271484375, 0.11444854736328125, 0.1199188232421875, 0.12538909912109375, 0.130859375, 0.13632965087890625, 0.1417999267578125, 0.14727020263671875, 0.152740478515625, 0.15821075439453125, 0.1636810302734375, 0.16915130615234375, 0.17462158203125, 0.18009185791015625, 0.1855621337890625, 0.19103240966796875, 0.196502685546875, 0.20197296142578125, 0.2074432373046875, 0.21291351318359375, 0.2183837890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 13.0, 31.0, 68.0, 205.0, 299.0, 230.0, 96.0, 27.0, 18.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7590133547782898, -0.7180695533752441, -0.6771257519721985, -0.6361819505691528, -0.595238208770752, -0.5542943477630615, -0.5133506059646606, -0.472406804561615, -0.43146300315856934, -0.3905192017555237, -0.349575400352478, -0.30863162875175476, -0.2676878273487091, -0.22674402594566345, -0.185800239443779, -0.14485645294189453, -0.10391265153884888, -0.06296885758638382, -0.022025063633918762, 0.018918730318546295, 0.05986252427101135, 0.100806325674057, 0.14175011217594147, 0.18269389867782593, 0.22363770008087158, 0.26458150148391724, 0.3055253028869629, 0.34646907448768616, 0.3874128758907318, 0.42835667729377747, 0.46930044889450073, 0.5102442502975464, 0.5511879920959473, 0.5921317934989929, 0.6330755949020386, 0.6740193963050842, 0.7149631977081299, 0.7559069395065308, 0.7968507409095764, 0.8377945423126221, 0.8787383437156677, 0.9196821451187134, 0.960625946521759, 1.0015697479248047, 1.0425134897232056, 1.083457350730896, 1.1244010925292969, 1.1653449535369873, 1.2062886953353882, 1.247232437133789, 1.2881762981414795, 1.3291200399398804, 1.3700639009475708, 1.4110076427459717, 1.451951503753662, 1.492895245552063, 1.5338389873504639, 1.5747827291488647, 1.6157265901565552, 1.656670331954956, 1.6976141929626465, 1.7385579347610474, 1.7795017957687378, 1.8204455375671387, 1.861389398574829]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 11.0, 10.0, 12.0, 18.0, 22.0, 30.0, 49.0, 42.0, 54.0, 71.0, 64.0, 64.0, 73.0, 85.0, 73.0, 59.0, 58.0, 50.0, 35.0, 27.0, 30.0, 18.0, 13.0, 12.0, 8.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.666449248790741, -0.6496491432189941, -0.6328489780426025, -0.6160488724708557, -0.5992487668991089, -0.5824486613273621, -0.5656485557556152, -0.5488483905792236, -0.5320482850074768, -0.51524817943573, -0.49844804406166077, -0.48164790868759155, -0.4648478031158447, -0.4480476975440979, -0.4312475621700287, -0.4144474267959595, -0.39764732122421265, -0.3808472156524658, -0.3640470802783966, -0.3472469449043274, -0.33044683933258057, -0.31364673376083374, -0.2968465983867645, -0.2800464630126953, -0.2632463574409485, -0.24644623696804047, -0.22964611649513245, -0.21284599602222443, -0.1960458755493164, -0.1792457550764084, -0.16244563460350037, -0.14564551413059235, -0.12884539365768433, -0.1120452731847763, -0.09524515271186829, -0.07844503223896027, -0.061644911766052246, -0.044844791293144226, -0.028044670820236206, -0.011244550347328186, 0.005555570125579834, 0.022355690598487854, 0.039155811071395874, 0.055955931544303894, 0.07275605201721191, 0.08955617249011993, 0.10635629296302795, 0.12315641343593597, 0.139956533908844, 0.15675665438175201, 0.17355677485466003, 0.19035689532756805, 0.20715701580047607, 0.2239571362733841, 0.24075725674629211, 0.25755739212036133, 0.27435749769210815, 0.291157603263855, 0.3079577386379242, 0.3247578740119934, 0.34155797958374023, 0.35835808515548706, 0.3751582205295563, 0.3919583559036255, 0.4087584614753723]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 9.0, 14.0, 15.0, 12.0, 29.0, 30.0, 45.0, 61.0, 98.0, 159.0, 210.0, 343.0, 632.0, 1043.0, 1930.0, 3901.0, 10547.0, 40247.0, 199709.0, 520126.0, 208035.0, 41827.0, 10891.0, 3980.0, 1907.0, 993.0, 620.0, 383.0, 222.0, 148.0, 115.0, 96.0, 46.0, 27.0, 25.0, 24.0, 14.0, 10.0, 11.0, 6.0, 6.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3291015625, -0.31668853759765625, -0.3042755126953125, -0.29186248779296875, -0.279449462890625, -0.26703643798828125, -0.2546234130859375, -0.24221038818359375, -0.22979736328125, -0.21738433837890625, -0.2049713134765625, -0.19255828857421875, -0.180145263671875, -0.16773223876953125, -0.1553192138671875, -0.14290618896484375, -0.1304931640625, -0.11808013916015625, -0.1056671142578125, -0.09325408935546875, -0.080841064453125, -0.06842803955078125, -0.0560150146484375, -0.04360198974609375, -0.03118896484375, -0.01877593994140625, -0.0063629150390625, 0.00605010986328125, 0.018463134765625, 0.03087615966796875, 0.0432891845703125, 0.05570220947265625, 0.068115234375, 0.08052825927734375, 0.0929412841796875, 0.10535430908203125, 0.117767333984375, 0.13018035888671875, 0.1425933837890625, 0.15500640869140625, 0.16741943359375, 0.17983245849609375, 0.1922454833984375, 0.20465850830078125, 0.217071533203125, 0.22948455810546875, 0.2418975830078125, 0.25431060791015625, 0.2667236328125, 0.27913665771484375, 0.2915496826171875, 0.30396270751953125, 0.316375732421875, 0.32878875732421875, 0.3412017822265625, 0.35361480712890625, 0.36602783203125, 0.37844085693359375, 0.3908538818359375, 0.40326690673828125, 0.415679931640625, 0.42809295654296875, 0.4405059814453125, 0.45291900634765625, 0.46533203125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 15.0, 18.0, 50.0, 53.0, 75.0, 115.0, 136.0, 128.0, 119.0, 121.0, 62.0, 49.0, 18.0, 10.0, 12.0, 6.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.16165637969970703, -0.15790748596191406, -0.1541585922241211, -0.15040969848632812, -0.14666080474853516, -0.1429119110107422, -0.13916301727294922, -0.13541412353515625, -0.13166522979736328, -0.1279163360595703, -0.12416744232177734, -0.12041854858398438, -0.1166696548461914, -0.11292076110839844, -0.10917186737060547, -0.1054229736328125, -0.10167407989501953, -0.09792518615722656, -0.0941762924194336, -0.09042739868164062, -0.08667850494384766, -0.08292961120605469, -0.07918071746826172, -0.07543182373046875, -0.07168292999267578, -0.06793403625488281, -0.06418514251708984, -0.060436248779296875, -0.056687355041503906, -0.05293846130371094, -0.04918956756591797, -0.045440673828125, -0.04169178009033203, -0.03794288635253906, -0.034193992614746094, -0.030445098876953125, -0.026696205139160156, -0.022947311401367188, -0.01919841766357422, -0.01544952392578125, -0.011700630187988281, -0.007951736450195312, -0.004202842712402344, -0.000453948974609375, 0.0032949447631835938, 0.0070438385009765625, 0.010792732238769531, 0.0145416259765625, 0.01829051971435547, 0.022039413452148438, 0.025788307189941406, 0.029537200927734375, 0.033286094665527344, 0.03703498840332031, 0.04078388214111328, 0.04453277587890625, 0.04828166961669922, 0.05203056335449219, 0.055779457092285156, 0.059528350830078125, 0.0632772445678711, 0.06702613830566406, 0.07077503204345703, 0.07452392578125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 16.0, 19.0, 17.0, 27.0, 52.0, 48.0, 108.0, 156.0, 254.0, 519.0, 828.0, 1727.0, 3266.0, 7296.0, 17375.0, 45056.0, 127405.0, 314724.0, 319485.0, 131384.0, 45941.0, 17982.0, 7663.0, 3416.0, 1681.0, 905.0, 492.0, 284.0, 145.0, 77.0, 72.0, 46.0, 29.0, 24.0, 10.0, 10.0, 7.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25732421875, -0.24902725219726562, -0.24073028564453125, -0.23243331909179688, -0.2241363525390625, -0.21583938598632812, -0.20754241943359375, -0.19924545288085938, -0.190948486328125, -0.18265151977539062, -0.17435455322265625, -0.16605758666992188, -0.1577606201171875, -0.14946365356445312, -0.14116668701171875, -0.13286972045898438, -0.12457275390625, -0.11627578735351562, -0.10797882080078125, -0.09968185424804688, -0.0913848876953125, -0.08308792114257812, -0.07479095458984375, -0.06649398803710938, -0.058197021484375, -0.049900054931640625, -0.04160308837890625, -0.033306121826171875, -0.0250091552734375, -0.016712188720703125, -0.00841522216796875, -0.000118255615234375, 0.0081787109375, 0.016475677490234375, 0.02477264404296875, 0.033069610595703125, 0.0413665771484375, 0.049663543701171875, 0.05796051025390625, 0.06625747680664062, 0.074554443359375, 0.08285140991210938, 0.09114837646484375, 0.09944534301757812, 0.1077423095703125, 0.11603927612304688, 0.12433624267578125, 0.13263320922851562, 0.14093017578125, 0.14922714233398438, 0.15752410888671875, 0.16582107543945312, 0.1741180419921875, 0.18241500854492188, 0.19071197509765625, 0.19900894165039062, 0.207305908203125, 0.21560287475585938, 0.22389984130859375, 0.23219680786132812, 0.2404937744140625, 0.24879074096679688, 0.25708770751953125, 0.2653846740722656, 0.273681640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 3.0, 6.0, 4.0, 6.0, 10.0, 12.0, 20.0, 19.0, 8.0, 29.0, 24.0, 35.0, 26.0, 28.0, 39.0, 39.0, 38.0, 50.0, 49.0, 48.0, 52.0, 45.0, 70.0, 41.0, 33.0, 41.0, 32.0, 33.0, 25.0, 22.0, 19.0, 13.0, 16.0, 15.0, 11.0, 11.0, 4.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305908203125, -0.29734039306640625, -0.2887725830078125, -0.28020477294921875, -0.271636962890625, -0.26306915283203125, -0.2545013427734375, -0.24593353271484375, -0.23736572265625, -0.22879791259765625, -0.2202301025390625, -0.21166229248046875, -0.203094482421875, -0.19452667236328125, -0.1859588623046875, -0.17739105224609375, -0.1688232421875, -0.16025543212890625, -0.1516876220703125, -0.14311981201171875, -0.134552001953125, -0.12598419189453125, -0.1174163818359375, -0.10884857177734375, -0.10028076171875, -0.09171295166015625, -0.0831451416015625, -0.07457733154296875, -0.066009521484375, -0.05744171142578125, -0.0488739013671875, -0.04030609130859375, -0.03173828125, -0.02317047119140625, -0.0146026611328125, -0.00603485107421875, 0.002532958984375, 0.01110076904296875, 0.0196685791015625, 0.02823638916015625, 0.03680419921875, 0.04537200927734375, 0.0539398193359375, 0.06250762939453125, 0.071075439453125, 0.07964324951171875, 0.0882110595703125, 0.09677886962890625, 0.1053466796875, 0.11391448974609375, 0.1224822998046875, 0.13105010986328125, 0.139617919921875, 0.14818572998046875, 0.1567535400390625, 0.16532135009765625, 0.17388916015625, 0.18245697021484375, 0.1910247802734375, 0.19959259033203125, 0.208160400390625, 0.21672821044921875, 0.2252960205078125, 0.23386383056640625, 0.242431640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 3.0, 18.0, 17.0, 15.0, 29.0, 33.0, 58.0, 81.0, 133.0, 225.0, 459.0, 883.0, 2428.0, 7986.0, 37289.0, 309848.0, 591453.0, 77626.0, 13689.0, 3507.0, 1395.0, 593.0, 299.0, 172.0, 110.0, 54.0, 44.0, 34.0, 15.0, 8.0, 14.0, 9.0, 6.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159912109375, -0.15423965454101562, -0.14856719970703125, -0.14289474487304688, -0.1372222900390625, -0.13154983520507812, -0.12587738037109375, -0.12020492553710938, -0.114532470703125, -0.10886001586914062, -0.10318756103515625, -0.09751510620117188, -0.0918426513671875, -0.08617019653320312, -0.08049774169921875, -0.07482528686523438, -0.06915283203125, -0.06348037719726562, -0.05780792236328125, -0.052135467529296875, -0.0464630126953125, -0.040790557861328125, -0.03511810302734375, -0.029445648193359375, -0.023773193359375, -0.018100738525390625, -0.01242828369140625, -0.006755828857421875, -0.0010833740234375, 0.004589080810546875, 0.01026153564453125, 0.015933990478515625, 0.0216064453125, 0.027278900146484375, 0.03295135498046875, 0.038623809814453125, 0.0442962646484375, 0.049968719482421875, 0.05564117431640625, 0.061313629150390625, 0.066986083984375, 0.07265853881835938, 0.07833099365234375, 0.08400344848632812, 0.0896759033203125, 0.09534835815429688, 0.10102081298828125, 0.10669326782226562, 0.11236572265625, 0.11803817749023438, 0.12371063232421875, 0.12938308715820312, 0.1350555419921875, 0.14072799682617188, 0.14640045166015625, 0.15207290649414062, 0.157745361328125, 0.16341781616210938, 0.16909027099609375, 0.17476272583007812, 0.1804351806640625, 0.18610763549804688, 0.19178009033203125, 0.19745254516601562, 0.203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 0.0, 6.0, 4.0, 7.0, 8.0, 15.0, 16.0, 15.0, 28.0, 48.0, 67.0, 64.0, 126.0, 160.0, 137.0, 65.0, 63.0, 44.0, 38.0, 33.0, 15.0, 10.0, 8.0, 7.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024056434631347656, -0.00023270398378372192, -0.00022484362125396729, -0.00021698325872421265, -0.000209122896194458, -0.00020126253366470337, -0.00019340217113494873, -0.0001855418086051941, -0.00017768144607543945, -0.00016982108354568481, -0.00016196072101593018, -0.00015410035848617554, -0.0001462399959564209, -0.00013837963342666626, -0.00013051927089691162, -0.00012265890836715698, -0.00011479854583740234, -0.0001069381833076477, -9.907782077789307e-05, -9.121745824813843e-05, -8.335709571838379e-05, -7.549673318862915e-05, -6.763637065887451e-05, -5.977600812911987e-05, -5.1915645599365234e-05, -4.4055283069610596e-05, -3.619492053985596e-05, -2.833455801010132e-05, -2.047419548034668e-05, -1.2613832950592041e-05, -4.753470420837402e-06, 3.1068921089172363e-06, 1.0967254638671875e-05, 1.8827617168426514e-05, 2.6687979698181152e-05, 3.454834222793579e-05, 4.240870475769043e-05, 5.026906728744507e-05, 5.812942981719971e-05, 6.598979234695435e-05, 7.385015487670898e-05, 8.171051740646362e-05, 8.957087993621826e-05, 9.74312424659729e-05, 0.00010529160499572754, 0.00011315196752548218, 0.00012101233005523682, 0.00012887269258499146, 0.0001367330551147461, 0.00014459341764450073, 0.00015245378017425537, 0.00016031414270401, 0.00016817450523376465, 0.0001760348677635193, 0.00018389523029327393, 0.00019175559282302856, 0.0001996159553527832, 0.00020747631788253784, 0.00021533668041229248, 0.00022319704294204712, 0.00023105740547180176, 0.0002389177680015564, 0.00024677813053131104, 0.0002546384930610657, 0.0002624988555908203]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 9.0, 12.0, 19.0, 25.0, 32.0, 56.0, 92.0, 172.0, 327.0, 634.0, 1472.0, 4094.0, 13976.0, 65347.0, 488514.0, 402532.0, 53065.0, 11907.0, 3594.0, 1316.0, 621.0, 321.0, 172.0, 79.0, 58.0, 40.0, 25.0, 17.0, 10.0, 4.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.19580078125, -0.19019699096679688, -0.18459320068359375, -0.17898941040039062, -0.1733856201171875, -0.16778182983398438, -0.16217803955078125, -0.15657424926757812, -0.150970458984375, -0.14536666870117188, -0.13976287841796875, -0.13415908813476562, -0.1285552978515625, -0.12295150756835938, -0.11734771728515625, -0.11174392700195312, -0.10614013671875, -0.10053634643554688, -0.09493255615234375, -0.08932876586914062, -0.0837249755859375, -0.07812118530273438, -0.07251739501953125, -0.06691360473632812, -0.061309814453125, -0.055706024169921875, -0.05010223388671875, -0.044498443603515625, -0.0388946533203125, -0.033290863037109375, -0.02768707275390625, -0.022083282470703125, -0.0164794921875, -0.010875701904296875, -0.00527191162109375, 0.000331878662109375, 0.0059356689453125, 0.011539459228515625, 0.01714324951171875, 0.022747039794921875, 0.028350830078125, 0.033954620361328125, 0.03955841064453125, 0.045162200927734375, 0.0507659912109375, 0.056369781494140625, 0.06197357177734375, 0.06757736206054688, 0.07318115234375, 0.07878494262695312, 0.08438873291015625, 0.08999252319335938, 0.0955963134765625, 0.10120010375976562, 0.10680389404296875, 0.11240768432617188, 0.118011474609375, 0.12361526489257812, 0.12921905517578125, 0.13482284545898438, 0.1404266357421875, 0.14603042602539062, 0.15163421630859375, 0.15723800659179688, 0.162841796875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 2.0, 2.0, 3.0, 6.0, 9.0, 15.0, 16.0, 21.0, 44.0, 56.0, 83.0, 111.0, 131.0, 139.0, 95.0, 85.0, 45.0, 36.0, 24.0, 22.0, 22.0, 10.0, 6.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.17431640625, -0.169464111328125, -0.16461181640625, -0.159759521484375, -0.1549072265625, -0.150054931640625, -0.14520263671875, -0.140350341796875, -0.135498046875, -0.130645751953125, -0.12579345703125, -0.120941162109375, -0.1160888671875, -0.111236572265625, -0.10638427734375, -0.101531982421875, -0.0966796875, -0.091827392578125, -0.08697509765625, -0.082122802734375, -0.0772705078125, -0.072418212890625, -0.06756591796875, -0.062713623046875, -0.057861328125, -0.053009033203125, -0.04815673828125, -0.043304443359375, -0.0384521484375, -0.033599853515625, -0.02874755859375, -0.023895263671875, -0.01904296875, -0.014190673828125, -0.00933837890625, -0.004486083984375, 0.0003662109375, 0.005218505859375, 0.01007080078125, 0.014923095703125, 0.019775390625, 0.024627685546875, 0.02947998046875, 0.034332275390625, 0.0391845703125, 0.044036865234375, 0.04888916015625, 0.053741455078125, 0.05859375, 0.063446044921875, 0.06829833984375, 0.073150634765625, 0.0780029296875, 0.082855224609375, 0.08770751953125, 0.092559814453125, 0.097412109375, 0.102264404296875, 0.10711669921875, 0.111968994140625, 0.1168212890625, 0.121673583984375, 0.12652587890625, 0.131378173828125, 0.13623046875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 18.0, 42.0, 61.0, 112.0, 171.0, 207.0, 161.0, 92.0, 56.0, 25.0, 17.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.602572202682495, -2.5162413120269775, -2.429910659790039, -2.3435797691345215, -2.257249116897583, -2.1709182262420654, -2.084587574005127, -1.9982566833496094, -1.9119259119033813, -1.8255951404571533, -1.7392643690109253, -1.6529335975646973, -1.5666027069091797, -1.4802720546722412, -1.3939411640167236, -1.3076103925704956, -1.2212796211242676, -1.1349488496780396, -1.0486180782318115, -0.9622872471809387, -0.8759564757347107, -0.7896257042884827, -0.7032948732376099, -0.6169641017913818, -0.5306333303451538, -0.4443025588989258, -0.35797175765037537, -0.27164095640182495, -0.18531018495559692, -0.0989794135093689, -0.012648582458496094, 0.07368218898773193, 0.16001319885253906, 0.24634398519992828, 0.3326747715473175, 0.4190055727958679, 0.505336344242096, 0.591667115688324, 0.6779979467391968, 0.7643287181854248, 0.8506594896316528, 0.9369902610778809, 1.0233210325241089, 1.109651803970337, 1.1959826946258545, 1.282313346862793, 1.3686442375183105, 1.4549750089645386, 1.5413057804107666, 1.6276365518569946, 1.7139673233032227, 1.8002982139587402, 1.8866288661956787, 1.9729597568511963, 2.0592904090881348, 2.1456212997436523, 2.23195219039917, 2.3182830810546875, 2.404613733291626, 2.4909446239471436, 2.577275276184082, 2.6636061668395996, 2.749937057495117, 2.8362677097320557, 2.922598361968994]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 3.0, 8.0, 7.0, 6.0, 8.0, 7.0, 12.0, 25.0, 28.0, 16.0, 25.0, 29.0, 34.0, 38.0, 38.0, 41.0, 57.0, 51.0, 41.0, 53.0, 48.0, 57.0, 41.0, 44.0, 31.0, 48.0, 31.0, 23.0, 32.0, 31.0, 19.0, 16.0, 12.0, 5.0, 3.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.524464726448059, -1.4742419719696045, -1.4240190982818604, -1.3737963438034058, -1.3235735893249512, -1.2733508348464966, -1.223128080368042, -1.1729052066802979, -1.1226824522018433, -1.0724596977233887, -1.0222368240356445, -0.9720140695571899, -0.9217913150787354, -0.8715685606002808, -0.8213457465171814, -0.771122932434082, -0.7209001779556274, -0.6706774234771729, -0.6204546093940735, -0.5702317953109741, -0.5200090408325195, -0.46978625655174255, -0.4195634722709656, -0.3693406879901886, -0.3191179037094116, -0.26889511942863464, -0.21867233514785767, -0.1684495508670807, -0.11822676658630371, -0.06800398230552673, -0.017781198024749756, 0.03244158625602722, 0.08266448974609375, 0.13288727402687073, 0.1831100583076477, 0.23333284258842468, 0.28355562686920166, 0.33377841114997864, 0.3840011954307556, 0.4342239797115326, 0.48444676399230957, 0.5346695184707642, 0.5848923325538635, 0.6351151466369629, 0.6853379011154175, 0.7355606555938721, 0.7857834696769714, 0.8360062837600708, 0.8862290382385254, 0.93645179271698, 0.9866746068000793, 1.0368974208831787, 1.0871201753616333, 1.137342929840088, 1.187565803527832, 1.2377885580062866, 1.2880113124847412, 1.3382340669631958, 1.3884568214416504, 1.4386796951293945, 1.4889024496078491, 1.5391252040863037, 1.5893480777740479, 1.6395708322525024, 1.689793586730957]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 7.0, 3.0, 4.0, 11.0, 9.0, 10.0, 16.0, 30.0, 30.0, 27.0, 52.0, 95.0, 131.0, 232.0, 432.0, 936.0, 2316.0, 7901.0, 52648.0, 3848182.0, 257270.0, 17536.0, 3957.0, 1325.0, 529.0, 276.0, 140.0, 73.0, 40.0, 22.0, 16.0, 7.0, 3.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.75048828125, -0.7294845581054688, -0.7084808349609375, -0.6874771118164062, -0.666473388671875, -0.6454696655273438, -0.6244659423828125, -0.6034622192382812, -0.58245849609375, -0.5614547729492188, -0.5404510498046875, -0.5194473266601562, -0.498443603515625, -0.47743988037109375, -0.4564361572265625, -0.43543243408203125, -0.4144287109375, -0.39342498779296875, -0.3724212646484375, -0.35141754150390625, -0.330413818359375, -0.30941009521484375, -0.2884063720703125, -0.26740264892578125, -0.24639892578125, -0.22539520263671875, -0.2043914794921875, -0.18338775634765625, -0.162384033203125, -0.14138031005859375, -0.1203765869140625, -0.09937286376953125, -0.078369140625, -0.05736541748046875, -0.0363616943359375, -0.01535797119140625, 0.005645751953125, 0.02664947509765625, 0.0476531982421875, 0.06865692138671875, 0.08966064453125, 0.11066436767578125, 0.1316680908203125, 0.15267181396484375, 0.173675537109375, 0.19467926025390625, 0.2156829833984375, 0.23668670654296875, 0.2576904296875, 0.27869415283203125, 0.2996978759765625, 0.32070159912109375, 0.341705322265625, 0.36270904541015625, 0.3837127685546875, 0.40471649169921875, 0.42572021484375, 0.44672393798828125, 0.4677276611328125, 0.48873138427734375, 0.509735107421875, 0.5307388305664062, 0.5517425537109375, 0.5727462768554688, 0.59375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 9.0, 18.0, 20.0, 50.0, 44.0, 64.0, 97.0, 122.0, 133.0, 112.0, 99.0, 76.0, 53.0, 40.0, 22.0, 11.0, 7.0, 9.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1622314453125, -0.15857982635498047, -0.15492820739746094, -0.1512765884399414, -0.14762496948242188, -0.14397335052490234, -0.1403217315673828, -0.13667011260986328, -0.13301849365234375, -0.12936687469482422, -0.1257152557373047, -0.12206363677978516, -0.11841201782226562, -0.1147603988647461, -0.11110877990722656, -0.10745716094970703, -0.1038055419921875, -0.10015392303466797, -0.09650230407714844, -0.0928506851196289, -0.08919906616210938, -0.08554744720458984, -0.08189582824707031, -0.07824420928955078, -0.07459259033203125, -0.07094097137451172, -0.06728935241699219, -0.06363773345947266, -0.059986114501953125, -0.056334495544433594, -0.05268287658691406, -0.04903125762939453, -0.045379638671875, -0.04172801971435547, -0.03807640075683594, -0.034424781799316406, -0.030773162841796875, -0.027121543884277344, -0.023469924926757812, -0.01981830596923828, -0.01616668701171875, -0.012515068054199219, -0.008863449096679688, -0.005211830139160156, -0.001560211181640625, 0.0020914077758789062, 0.0057430267333984375, 0.009394645690917969, 0.0130462646484375, 0.01669788360595703, 0.020349502563476562, 0.024001121520996094, 0.027652740478515625, 0.031304359436035156, 0.03495597839355469, 0.03860759735107422, 0.04225921630859375, 0.04591083526611328, 0.04956245422363281, 0.053214073181152344, 0.056865692138671875, 0.060517311096191406, 0.06416893005371094, 0.06782054901123047, 0.07147216796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 5.0, 12.0, 13.0, 31.0, 43.0, 99.0, 205.0, 428.0, 1036.0, 4303.0, 41038.0, 3953311.0, 183020.0, 8137.0, 1642.0, 500.0, 228.0, 116.0, 47.0, 29.0, 18.0, 15.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8515625, -0.8277053833007812, -0.8038482666015625, -0.7799911499023438, -0.756134033203125, -0.7322769165039062, -0.7084197998046875, -0.6845626831054688, -0.66070556640625, -0.6368484497070312, -0.6129913330078125, -0.5891342163085938, -0.565277099609375, -0.5414199829101562, -0.5175628662109375, -0.49370574951171875, -0.4698486328125, -0.44599151611328125, -0.4221343994140625, -0.39827728271484375, -0.374420166015625, -0.35056304931640625, -0.3267059326171875, -0.30284881591796875, -0.27899169921875, -0.25513458251953125, -0.2312774658203125, -0.20742034912109375, -0.183563232421875, -0.15970611572265625, -0.1358489990234375, -0.11199188232421875, -0.088134765625, -0.06427764892578125, -0.0404205322265625, -0.01656341552734375, 0.007293701171875, 0.03115081787109375, 0.0550079345703125, 0.07886505126953125, 0.10272216796875, 0.12657928466796875, 0.1504364013671875, 0.17429351806640625, 0.198150634765625, 0.22200775146484375, 0.2458648681640625, 0.26972198486328125, 0.2935791015625, 0.31743621826171875, 0.3412933349609375, 0.36515045166015625, 0.389007568359375, 0.41286468505859375, 0.4367218017578125, 0.46057891845703125, 0.48443603515625, 0.5082931518554688, 0.5321502685546875, 0.5560073852539062, 0.579864501953125, 0.6037216186523438, 0.6275787353515625, 0.6514358520507812, 0.67529296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 6.0, 7.0, 12.0, 24.0, 22.0, 39.0, 50.0, 55.0, 122.0, 221.0, 442.0, 1077.0, 1027.0, 407.0, 232.0, 99.0, 71.0, 49.0, 28.0, 17.0, 11.0, 8.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.09417724609375, -0.0916290283203125, -0.089080810546875, -0.0865325927734375, -0.083984375, -0.0814361572265625, -0.078887939453125, -0.0763397216796875, -0.07379150390625, -0.0712432861328125, -0.068695068359375, -0.0661468505859375, -0.0635986328125, -0.0610504150390625, -0.058502197265625, -0.0559539794921875, -0.05340576171875, -0.0508575439453125, -0.048309326171875, -0.0457611083984375, -0.043212890625, -0.0406646728515625, -0.038116455078125, -0.0355682373046875, -0.03302001953125, -0.0304718017578125, -0.027923583984375, -0.0253753662109375, -0.0228271484375, -0.0202789306640625, -0.017730712890625, -0.0151824951171875, -0.01263427734375, -0.0100860595703125, -0.007537841796875, -0.0049896240234375, -0.00244140625, 0.0001068115234375, 0.002655029296875, 0.0052032470703125, 0.00775146484375, 0.0102996826171875, 0.012847900390625, 0.0153961181640625, 0.0179443359375, 0.0204925537109375, 0.023040771484375, 0.0255889892578125, 0.02813720703125, 0.0306854248046875, 0.033233642578125, 0.0357818603515625, 0.038330078125, 0.0408782958984375, 0.043426513671875, 0.0459747314453125, 0.04852294921875, 0.0510711669921875, 0.053619384765625, 0.0561676025390625, 0.0587158203125, 0.0612640380859375, 0.063812255859375, 0.0663604736328125, 0.06890869140625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 13.0, 38.0, 66.0, 175.0, 256.0, 221.0, 130.0, 46.0, 26.0, 13.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.571729302406311, -0.5414240956306458, -0.5111188888549805, -0.4808137118816376, -0.4505085051059723, -0.420203298330307, -0.3898981213569641, -0.35959291458129883, -0.32928770780563354, -0.29898250102996826, -0.268677294254303, -0.23837211728096008, -0.2080669105052948, -0.17776170372962952, -0.14745651185512543, -0.11715131998062134, -0.08684611320495605, -0.05654091387987137, -0.026235714554786682, 0.004069484770298004, 0.03437468409538269, 0.06467989087104797, 0.09498508274555206, 0.12529027462005615, 0.15559548139572144, 0.18590068817138672, 0.2162058800458908, 0.2465110719203949, 0.2768162786960602, 0.30712148547172546, 0.33742666244506836, 0.36773186922073364, 0.3980370759963989, 0.4283422827720642, 0.4586474895477295, 0.4889526665210724, 0.5192579030990601, 0.5495630502700806, 0.5798682570457458, 0.6101734638214111, 0.6404786705970764, 0.6707838773727417, 0.701089084148407, 0.7313942909240723, 0.7616994380950928, 0.7920047044754028, 0.8223098516464233, 0.8526150584220886, 0.8829202651977539, 0.9132254719734192, 0.9435306787490845, 0.9738358855247498, 1.004141092300415, 1.0344462394714355, 1.0647515058517456, 1.0950566530227661, 1.1253619194030762, 1.1556670665740967, 1.1859723329544067, 1.2162774801254272, 1.2465827465057373, 1.2768878936767578, 1.3071931600570679, 1.3374983072280884, 1.3678034543991089]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 9.0, 4.0, 8.0, 12.0, 13.0, 12.0, 29.0, 28.0, 27.0, 27.0, 42.0, 46.0, 47.0, 56.0, 47.0, 56.0, 61.0, 63.0, 39.0, 47.0, 47.0, 46.0, 39.0, 29.0, 35.0, 34.0, 18.0, 18.0, 16.0, 11.0, 9.0, 10.0, 7.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2684744596481323, -0.2583796977996826, -0.2482849657535553, -0.23819021880626678, -0.22809547185897827, -0.21800072491168976, -0.20790597796440125, -0.19781121611595154, -0.18771648406982422, -0.1776217371225357, -0.1675269901752472, -0.15743224322795868, -0.14733749628067017, -0.13724274933338165, -0.12714800238609314, -0.11705324798822403, -0.10695849359035492, -0.0968637466430664, -0.0867689996957779, -0.07667425274848938, -0.06657950580120087, -0.056484755128622055, -0.04639000445604324, -0.03629525750875473, -0.026200510561466217, -0.016105763614177704, -0.0060110148042440414, 0.004083734005689621, 0.014178480952978134, 0.024273227900266647, 0.03436797857284546, 0.04446272552013397, 0.054557472467422485, 0.064652219414711, 0.07474696636199951, 0.08484171330928802, 0.09493646025657654, 0.10503120720386505, 0.11512596160173416, 0.12522071599960327, 0.1353154480457306, 0.1454101949930191, 0.15550494194030762, 0.16559968888759613, 0.17569443583488464, 0.18578918278217316, 0.19588392972946167, 0.20597869157791138, 0.2160734385251999, 0.2261681854724884, 0.23626293241977692, 0.24635767936706543, 0.25645244121551514, 0.26654717326164246, 0.27664193511009216, 0.2867366671562195, 0.2968314290046692, 0.3069261908531189, 0.3170209228992462, 0.3271156847476959, 0.33721041679382324, 0.34730517864227295, 0.35739991068840027, 0.36749467253685, 0.3775894045829773]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 9.0, 9.0, 19.0, 19.0, 28.0, 40.0, 59.0, 121.0, 203.0, 335.0, 584.0, 1075.0, 2136.0, 4981.0, 17027.0, 96249.0, 494325.0, 355162.0, 56831.0, 11720.0, 3924.0, 1733.0, 921.0, 422.0, 239.0, 142.0, 82.0, 59.0, 39.0, 25.0, 10.0, 6.0, 7.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3896484375, -0.37458038330078125, -0.3595123291015625, -0.34444427490234375, -0.329376220703125, -0.31430816650390625, -0.2992401123046875, -0.28417205810546875, -0.26910400390625, -0.25403594970703125, -0.2389678955078125, -0.22389984130859375, -0.208831787109375, -0.19376373291015625, -0.1786956787109375, -0.16362762451171875, -0.1485595703125, -0.13349151611328125, -0.1184234619140625, -0.10335540771484375, -0.088287353515625, -0.07321929931640625, -0.0581512451171875, -0.04308319091796875, -0.02801513671875, -0.01294708251953125, 0.0021209716796875, 0.01718902587890625, 0.032257080078125, 0.04732513427734375, 0.0623931884765625, 0.07746124267578125, 0.092529296875, 0.10759735107421875, 0.1226654052734375, 0.13773345947265625, 0.152801513671875, 0.16786956787109375, 0.1829376220703125, 0.19800567626953125, 0.21307373046875, 0.22814178466796875, 0.2432098388671875, 0.25827789306640625, 0.273345947265625, 0.28841400146484375, 0.3034820556640625, 0.31855010986328125, 0.3336181640625, 0.34868621826171875, 0.3637542724609375, 0.37882232666015625, 0.393890380859375, 0.40895843505859375, 0.4240264892578125, 0.43909454345703125, 0.45416259765625, 0.46923065185546875, 0.4842987060546875, 0.49936676025390625, 0.514434814453125, 0.5295028686523438, 0.5445709228515625, 0.5596389770507812, 0.57470703125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 14.0, 10.0, 24.0, 40.0, 56.0, 54.0, 99.0, 112.0, 138.0, 119.0, 103.0, 74.0, 56.0, 42.0, 23.0, 7.0, 10.0, 9.0, 6.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1612548828125, -0.15755748748779297, -0.15386009216308594, -0.1501626968383789, -0.14646530151367188, -0.14276790618896484, -0.1390705108642578, -0.13537311553955078, -0.13167572021484375, -0.12797832489013672, -0.12428092956542969, -0.12058353424072266, -0.11688613891601562, -0.1131887435913086, -0.10949134826660156, -0.10579395294189453, -0.1020965576171875, -0.09839916229248047, -0.09470176696777344, -0.0910043716430664, -0.08730697631835938, -0.08360958099365234, -0.07991218566894531, -0.07621479034423828, -0.07251739501953125, -0.06881999969482422, -0.06512260437011719, -0.061425209045410156, -0.057727813720703125, -0.054030418395996094, -0.05033302307128906, -0.04663562774658203, -0.042938232421875, -0.03924083709716797, -0.03554344177246094, -0.031846046447753906, -0.028148651123046875, -0.024451255798339844, -0.020753860473632812, -0.01705646514892578, -0.01335906982421875, -0.009661674499511719, -0.0059642791748046875, -0.0022668838500976562, 0.001430511474609375, 0.005127906799316406, 0.008825302124023438, 0.012522697448730469, 0.0162200927734375, 0.01991748809814453, 0.023614883422851562, 0.027312278747558594, 0.031009674072265625, 0.034707069396972656, 0.03840446472167969, 0.04210186004638672, 0.04579925537109375, 0.04949665069580078, 0.05319404602050781, 0.056891441345214844, 0.060588836669921875, 0.0642862319946289, 0.06798362731933594, 0.07168102264404297, 0.07537841796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 4.0, 5.0, 10.0, 21.0, 19.0, 33.0, 44.0, 74.0, 108.0, 188.0, 252.0, 402.0, 672.0, 1265.0, 2233.0, 4424.0, 9170.0, 21359.0, 55071.0, 151276.0, 329622.0, 283549.0, 114082.0, 42052.0, 16574.0, 7586.0, 3667.0, 1987.0, 1125.0, 618.0, 355.0, 249.0, 125.0, 94.0, 75.0, 53.0, 35.0, 18.0, 17.0, 9.0, 9.0, 7.0, 3.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.293701171875, -0.2855110168457031, -0.27732086181640625, -0.2691307067871094, -0.2609405517578125, -0.2527503967285156, -0.24456024169921875, -0.23637008666992188, -0.228179931640625, -0.21998977661132812, -0.21179962158203125, -0.20360946655273438, -0.1954193115234375, -0.18722915649414062, -0.17903900146484375, -0.17084884643554688, -0.16265869140625, -0.15446853637695312, -0.14627838134765625, -0.13808822631835938, -0.1298980712890625, -0.12170791625976562, -0.11351776123046875, -0.10532760620117188, -0.097137451171875, -0.08894729614257812, -0.08075714111328125, -0.07256698608398438, -0.0643768310546875, -0.056186676025390625, -0.04799652099609375, -0.039806365966796875, -0.0316162109375, -0.023426055908203125, -0.01523590087890625, -0.007045745849609375, 0.0011444091796875, 0.009334564208984375, 0.01752471923828125, 0.025714874267578125, 0.033905029296875, 0.042095184326171875, 0.05028533935546875, 0.058475494384765625, 0.0666656494140625, 0.07485580444335938, 0.08304595947265625, 0.09123611450195312, 0.09942626953125, 0.10761642456054688, 0.11580657958984375, 0.12399673461914062, 0.1321868896484375, 0.14037704467773438, 0.14856719970703125, 0.15675735473632812, 0.164947509765625, 0.17313766479492188, 0.18132781982421875, 0.18951797485351562, 0.1977081298828125, 0.20589828491210938, 0.21408843994140625, 0.22227859497070312, 0.23046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 6.0, 4.0, 8.0, 13.0, 11.0, 10.0, 23.0, 21.0, 17.0, 32.0, 34.0, 48.0, 36.0, 32.0, 50.0, 44.0, 52.0, 58.0, 51.0, 64.0, 47.0, 30.0, 52.0, 38.0, 32.0, 25.0, 22.0, 28.0, 15.0, 14.0, 19.0, 13.0, 12.0, 9.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.328125, -0.31884002685546875, -0.3095550537109375, -0.30027008056640625, -0.290985107421875, -0.28170013427734375, -0.2724151611328125, -0.26313018798828125, -0.25384521484375, -0.24456024169921875, -0.2352752685546875, -0.22599029541015625, -0.216705322265625, -0.20742034912109375, -0.1981353759765625, -0.18885040283203125, -0.1795654296875, -0.17028045654296875, -0.1609954833984375, -0.15171051025390625, -0.142425537109375, -0.13314056396484375, -0.1238555908203125, -0.11457061767578125, -0.10528564453125, -0.09600067138671875, -0.0867156982421875, -0.07743072509765625, -0.068145751953125, -0.05886077880859375, -0.0495758056640625, -0.04029083251953125, -0.031005859375, -0.02172088623046875, -0.0124359130859375, -0.00315093994140625, 0.006134033203125, 0.01541900634765625, 0.0247039794921875, 0.03398895263671875, 0.04327392578125, 0.05255889892578125, 0.0618438720703125, 0.07112884521484375, 0.080413818359375, 0.08969879150390625, 0.0989837646484375, 0.10826873779296875, 0.1175537109375, 0.12683868408203125, 0.1361236572265625, 0.14540863037109375, 0.154693603515625, 0.16397857666015625, 0.1732635498046875, 0.18254852294921875, 0.19183349609375, 0.20111846923828125, 0.2104034423828125, 0.21968841552734375, 0.228973388671875, 0.23825836181640625, 0.2475433349609375, 0.25682830810546875, 0.26611328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 6.0, 10.0, 3.0, 8.0, 19.0, 22.0, 35.0, 62.0, 89.0, 148.0, 253.0, 428.0, 799.0, 1544.0, 3312.0, 7824.0, 23844.0, 131292.0, 649907.0, 183152.0, 29129.0, 9078.0, 3731.0, 1756.0, 872.0, 511.0, 285.0, 146.0, 94.0, 55.0, 38.0, 29.0, 14.0, 13.0, 9.0, 4.0, 6.0, 4.0, 2.0, 0.0, 3.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.2235107421875, -0.21722793579101562, -0.21094512939453125, -0.20466232299804688, -0.1983795166015625, -0.19209671020507812, -0.18581390380859375, -0.17953109741210938, -0.173248291015625, -0.16696548461914062, -0.16068267822265625, -0.15439987182617188, -0.1481170654296875, -0.14183425903320312, -0.13555145263671875, -0.12926864624023438, -0.12298583984375, -0.11670303344726562, -0.11042022705078125, -0.10413742065429688, -0.0978546142578125, -0.09157180786132812, -0.08528900146484375, -0.07900619506835938, -0.072723388671875, -0.06644058227539062, -0.06015777587890625, -0.053874969482421875, -0.0475921630859375, -0.041309356689453125, -0.03502655029296875, -0.028743743896484375, -0.0224609375, -0.016178131103515625, -0.00989532470703125, -0.003612518310546875, 0.0026702880859375, 0.008953094482421875, 0.01523590087890625, 0.021518707275390625, 0.027801513671875, 0.034084320068359375, 0.04036712646484375, 0.046649932861328125, 0.0529327392578125, 0.059215545654296875, 0.06549835205078125, 0.07178115844726562, 0.07806396484375, 0.08434677124023438, 0.09062957763671875, 0.09691238403320312, 0.1031951904296875, 0.10947799682617188, 0.11576080322265625, 0.12204360961914062, 0.128326416015625, 0.13460922241210938, 0.14089202880859375, 0.14717483520507812, 0.1534576416015625, 0.15974044799804688, 0.16602325439453125, 0.17230606079101562, 0.1785888671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 3.0, 8.0, 2.0, 9.0, 10.0, 9.0, 8.0, 6.0, 19.0, 24.0, 29.0, 28.0, 35.0, 55.0, 62.0, 77.0, 76.0, 96.0, 80.0, 65.0, 54.0, 55.0, 37.0, 22.0, 24.0, 16.0, 14.0, 13.0, 12.0, 8.0, 7.0, 5.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0001423358917236328, -0.0001380518078804016, -0.0001337677240371704, -0.0001294836401939392, -0.000125199556350708, -0.0001209154725074768, -0.0001166313886642456, -0.0001123473048210144, -0.0001080632209777832, -0.000103779137134552, -9.94950532913208e-05, -9.52109694480896e-05, -9.09268856048584e-05, -8.66428017616272e-05, -8.2358717918396e-05, -7.80746340751648e-05, -7.37905502319336e-05, -6.950646638870239e-05, -6.522238254547119e-05, -6.093829870223999e-05, -5.665421485900879e-05, -5.237013101577759e-05, -4.808604717254639e-05, -4.3801963329315186e-05, -3.9517879486083984e-05, -3.523379564285278e-05, -3.094971179962158e-05, -2.666562795639038e-05, -2.238154411315918e-05, -1.809746026992798e-05, -1.3813376426696777e-05, -9.529292583465576e-06, -5.245208740234375e-06, -9.611248970031738e-07, 3.3229589462280273e-06, 7.6070427894592285e-06, 1.189112663269043e-05, 1.617521047592163e-05, 2.0459294319152832e-05, 2.4743378162384033e-05, 2.9027462005615234e-05, 3.3311545848846436e-05, 3.759562969207764e-05, 4.187971353530884e-05, 4.616379737854004e-05, 5.044788122177124e-05, 5.473196506500244e-05, 5.901604890823364e-05, 6.330013275146484e-05, 6.758421659469604e-05, 7.186830043792725e-05, 7.615238428115845e-05, 8.043646812438965e-05, 8.472055196762085e-05, 8.900463581085205e-05, 9.328871965408325e-05, 9.757280349731445e-05, 0.00010185688734054565, 0.00010614097118377686, 0.00011042505502700806, 0.00011470913887023926, 0.00011899322271347046, 0.00012327730655670166, 0.00012756139039993286, 0.00013184547424316406]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 13.0, 17.0, 4.0, 17.0, 24.0, 33.0, 53.0, 99.0, 144.0, 292.0, 519.0, 1017.0, 2351.0, 5801.0, 18017.0, 123646.0, 738199.0, 129638.0, 18034.0, 6019.0, 2352.0, 1095.0, 502.0, 232.0, 145.0, 96.0, 59.0, 39.0, 26.0, 14.0, 12.0, 7.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2247314453125, -0.2171154022216797, -0.20949935913085938, -0.20188331604003906, -0.19426727294921875, -0.18665122985839844, -0.17903518676757812, -0.1714191436767578, -0.1638031005859375, -0.1561870574951172, -0.14857101440429688, -0.14095497131347656, -0.13333892822265625, -0.12572288513183594, -0.11810684204101562, -0.11049079895019531, -0.102874755859375, -0.09525871276855469, -0.08764266967773438, -0.08002662658691406, -0.07241058349609375, -0.06479454040527344, -0.057178497314453125, -0.04956245422363281, -0.0419464111328125, -0.03433036804199219, -0.026714324951171875, -0.019098281860351562, -0.01148223876953125, -0.0038661956787109375, 0.003749847412109375, 0.011365890502929688, 0.01898193359375, 0.026597976684570312, 0.034214019775390625, 0.04183006286621094, 0.04944610595703125, 0.05706214904785156, 0.06467819213867188, 0.07229423522949219, 0.0799102783203125, 0.08752632141113281, 0.09514236450195312, 0.10275840759277344, 0.11037445068359375, 0.11799049377441406, 0.12560653686523438, 0.1332225799560547, 0.140838623046875, 0.1484546661376953, 0.15607070922851562, 0.16368675231933594, 0.17130279541015625, 0.17891883850097656, 0.18653488159179688, 0.1941509246826172, 0.2017669677734375, 0.2093830108642578, 0.21699905395507812, 0.22461509704589844, 0.23223114013671875, 0.23984718322753906, 0.24746322631835938, 0.2550792694091797, 0.2626953125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 5.0, 8.0, 10.0, 13.0, 26.0, 27.0, 41.0, 50.0, 56.0, 66.0, 93.0, 102.0, 91.0, 77.0, 76.0, 58.0, 54.0, 36.0, 26.0, 15.0, 16.0, 8.0, 10.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11285400390625, -0.10867595672607422, -0.10449790954589844, -0.10031986236572266, -0.09614181518554688, -0.0919637680053711, -0.08778572082519531, -0.08360767364501953, -0.07942962646484375, -0.07525157928466797, -0.07107353210449219, -0.0668954849243164, -0.06271743774414062, -0.058539390563964844, -0.05436134338378906, -0.05018329620361328, -0.0460052490234375, -0.04182720184326172, -0.03764915466308594, -0.033471107482910156, -0.029293060302734375, -0.025115013122558594, -0.020936965942382812, -0.01675891876220703, -0.01258087158203125, -0.008402824401855469, -0.0042247772216796875, -4.673004150390625e-05, 0.004131317138671875, 0.008309364318847656, 0.012487411499023438, 0.01666545867919922, 0.020843505859375, 0.02502155303955078, 0.029199600219726562, 0.033377647399902344, 0.037555694580078125, 0.041733741760253906, 0.04591178894042969, 0.05008983612060547, 0.05426788330078125, 0.05844593048095703, 0.06262397766113281, 0.0668020248413086, 0.07098007202148438, 0.07515811920166016, 0.07933616638183594, 0.08351421356201172, 0.0876922607421875, 0.09187030792236328, 0.09604835510253906, 0.10022640228271484, 0.10440444946289062, 0.1085824966430664, 0.11276054382324219, 0.11693859100341797, 0.12111663818359375, 0.12529468536376953, 0.1294727325439453, 0.1336507797241211, 0.13782882690429688, 0.14200687408447266, 0.14618492126464844, 0.15036296844482422, 0.154541015625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 11.0, 13.0, 35.0, 47.0, 61.0, 123.0, 160.0, 165.0, 158.0, 103.0, 50.0, 28.0, 20.0, 10.0, 7.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.9370779991149902, -3.846107244491577, -3.755136489868164, -3.664165735244751, -3.573194980621338, -3.4822239875793457, -3.3912532329559326, -3.3002824783325195, -3.2093117237091064, -3.1183409690856934, -3.0273702144622803, -2.936399459838867, -2.845428466796875, -2.754457712173462, -2.663486957550049, -2.5725162029266357, -2.4815454483032227, -2.3905746936798096, -2.2996039390563965, -2.2086331844329834, -2.1176624298095703, -2.026691436767578, -1.935720682144165, -1.844749927520752, -1.7537791728973389, -1.6628084182739258, -1.5718376636505127, -1.48086678981781, -1.389896035194397, -1.2989252805709839, -1.2079544067382812, -1.1169836521148682, -1.026012897491455, -0.935042142868042, -0.8440713286399841, -0.7531005144119263, -0.6621297597885132, -0.5711590051651001, -0.48018819093704224, -0.3892173767089844, -0.2982466220855713, -0.20727583765983582, -0.11630505323410034, -0.025334268808364868, 0.0656365156173706, 0.15660730004310608, 0.24757808446884155, 0.3385488986968994, 0.4295196533203125, 0.5204904079437256, 0.6114612221717834, 0.7024320363998413, 0.7934027910232544, 0.8843735456466675, 0.9753443598747253, 1.0663151741027832, 1.1572859287261963, 1.2482566833496094, 1.3392274379730225, 1.430198311805725, 1.5211690664291382, 1.6121398210525513, 1.703110694885254, 1.794081449508667, 1.88505220413208]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 5.0, 11.0, 9.0, 12.0, 26.0, 24.0, 31.0, 41.0, 54.0, 74.0, 61.0, 84.0, 65.0, 59.0, 58.0, 98.0, 49.0, 53.0, 44.0, 27.0, 29.0, 24.0, 14.0, 15.0, 12.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9354915618896484, -1.8664132356643677, -1.7973347902297974, -1.7282564640045166, -1.6591780185699463, -1.5900996923446655, -1.5210213661193848, -1.4519429206848145, -1.3828645944595337, -1.313786268234253, -1.2447078227996826, -1.1756294965744019, -1.106551170349121, -1.0374727249145508, -0.96839439868927, -0.8993160128593445, -0.830237627029419, -0.7611592411994934, -0.6920808553695679, -0.6230025291442871, -0.5539241433143616, -0.48484575748443604, -0.4157674014568329, -0.34668904542922974, -0.2776106595993042, -0.20853228867053986, -0.1394539177417755, -0.07037554681301117, -0.0012971758842468262, 0.06778120994567871, 0.13685956597328186, 0.205937922000885, 0.27501654624938965, 0.3440949320793152, 0.41317328810691833, 0.4822516441345215, 0.551330029964447, 0.6204084157943726, 0.6894867420196533, 0.7585651278495789, 0.8276435136795044, 0.8967218995094299, 0.9658002853393555, 1.0348786115646362, 1.103956937789917, 1.1730353832244873, 1.242113709449768, 1.3111920356750488, 1.3802704811096191, 1.4493488073349, 1.5184272527694702, 1.587505578994751, 1.6565840244293213, 1.725662350654602, 1.7947406768798828, 1.8638191223144531, 1.9328974485397339, 2.0019757747650146, 2.071054220199585, 2.1401326656341553, 2.2092108726501465, 2.278289318084717, 2.347367763519287, 2.4164459705352783, 2.4855244159698486]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 6.0, 17.0, 22.0, 27.0, 50.0, 60.0, 112.0, 177.0, 297.0, 562.0, 1131.0, 3010.0, 13173.0, 148357.0, 3888851.0, 119991.0, 13068.0, 3140.0, 1143.0, 494.0, 253.0, 129.0, 84.0, 45.0, 21.0, 20.0, 12.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82421875, -0.799591064453125, -0.77496337890625, -0.750335693359375, -0.7257080078125, -0.701080322265625, -0.67645263671875, -0.651824951171875, -0.627197265625, -0.602569580078125, -0.57794189453125, -0.553314208984375, -0.5286865234375, -0.504058837890625, -0.47943115234375, -0.454803466796875, -0.43017578125, -0.405548095703125, -0.38092041015625, -0.356292724609375, -0.3316650390625, -0.307037353515625, -0.28240966796875, -0.257781982421875, -0.233154296875, -0.208526611328125, -0.18389892578125, -0.159271240234375, -0.1346435546875, -0.110015869140625, -0.08538818359375, -0.060760498046875, -0.0361328125, -0.011505126953125, 0.01312255859375, 0.037750244140625, 0.0623779296875, 0.087005615234375, 0.11163330078125, 0.136260986328125, 0.160888671875, 0.185516357421875, 0.21014404296875, 0.234771728515625, 0.2593994140625, 0.284027099609375, 0.30865478515625, 0.333282470703125, 0.35791015625, 0.382537841796875, 0.40716552734375, 0.431793212890625, 0.4564208984375, 0.481048583984375, 0.50567626953125, 0.530303955078125, 0.554931640625, 0.579559326171875, 0.60418701171875, 0.628814697265625, 0.6534423828125, 0.678070068359375, 0.70269775390625, 0.727325439453125, 0.751953125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 10.0, 10.0, 32.0, 64.0, 106.0, 140.0, 150.0, 141.0, 138.0, 83.0, 48.0, 38.0, 14.0, 9.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1688232421875, -0.16385459899902344, -0.15888595581054688, -0.1539173126220703, -0.14894866943359375, -0.1439800262451172, -0.13901138305664062, -0.13404273986816406, -0.1290740966796875, -0.12410545349121094, -0.11913681030273438, -0.11416816711425781, -0.10919952392578125, -0.10423088073730469, -0.09926223754882812, -0.09429359436035156, -0.089324951171875, -0.08435630798339844, -0.07938766479492188, -0.07441902160644531, -0.06945037841796875, -0.06448173522949219, -0.059513092041015625, -0.05454444885253906, -0.0495758056640625, -0.04460716247558594, -0.039638519287109375, -0.03466987609863281, -0.02970123291015625, -0.024732589721679688, -0.019763946533203125, -0.014795303344726562, -0.00982666015625, -0.0048580169677734375, 0.000110626220703125, 0.0050792694091796875, 0.01004791259765625, 0.015016555786132812, 0.019985198974609375, 0.024953842163085938, 0.0299224853515625, 0.03489112854003906, 0.039859771728515625, 0.04482841491699219, 0.04979705810546875, 0.05476570129394531, 0.059734344482421875, 0.06470298767089844, 0.069671630859375, 0.07464027404785156, 0.07960891723632812, 0.08457756042480469, 0.08954620361328125, 0.09451484680175781, 0.09948348999023438, 0.10445213317871094, 0.1094207763671875, 0.11438941955566406, 0.11935806274414062, 0.12432670593261719, 0.12929534912109375, 0.1342639923095703, 0.13923263549804688, 0.14420127868652344, 0.149169921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 6.0, 5.0, 9.0, 19.0, 24.0, 43.0, 64.0, 159.0, 245.0, 509.0, 1098.0, 3186.0, 14164.0, 459957.0, 3680055.0, 27720.0, 4477.0, 1333.0, 546.0, 265.0, 155.0, 79.0, 78.0, 33.0, 16.0, 14.0, 4.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9404296875, -0.908172607421875, -0.87591552734375, -0.843658447265625, -0.8114013671875, -0.779144287109375, -0.74688720703125, -0.714630126953125, -0.682373046875, -0.650115966796875, -0.61785888671875, -0.585601806640625, -0.5533447265625, -0.521087646484375, -0.48883056640625, -0.456573486328125, -0.42431640625, -0.392059326171875, -0.35980224609375, -0.327545166015625, -0.2952880859375, -0.263031005859375, -0.23077392578125, -0.198516845703125, -0.166259765625, -0.134002685546875, -0.10174560546875, -0.069488525390625, -0.0372314453125, -0.004974365234375, 0.02728271484375, 0.059539794921875, 0.091796875, 0.124053955078125, 0.15631103515625, 0.188568115234375, 0.2208251953125, 0.253082275390625, 0.28533935546875, 0.317596435546875, 0.349853515625, 0.382110595703125, 0.41436767578125, 0.446624755859375, 0.4788818359375, 0.511138916015625, 0.54339599609375, 0.575653076171875, 0.60791015625, 0.640167236328125, 0.67242431640625, 0.704681396484375, 0.7369384765625, 0.769195556640625, 0.80145263671875, 0.833709716796875, 0.865966796875, 0.898223876953125, 0.93048095703125, 0.962738037109375, 0.9949951171875, 1.027252197265625, 1.05950927734375, 1.091766357421875, 1.1240234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 7.0, 14.0, 16.0, 23.0, 50.0, 110.0, 233.0, 757.0, 1792.0, 625.0, 223.0, 96.0, 45.0, 27.0, 12.0, 16.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.25439453125, -0.246307373046875, -0.23822021484375, -0.230133056640625, -0.2220458984375, -0.213958740234375, -0.20587158203125, -0.197784423828125, -0.189697265625, -0.181610107421875, -0.17352294921875, -0.165435791015625, -0.1573486328125, -0.149261474609375, -0.14117431640625, -0.133087158203125, -0.125, -0.116912841796875, -0.10882568359375, -0.100738525390625, -0.0926513671875, -0.084564208984375, -0.07647705078125, -0.068389892578125, -0.060302734375, -0.052215576171875, -0.04412841796875, -0.036041259765625, -0.0279541015625, -0.019866943359375, -0.01177978515625, -0.003692626953125, 0.00439453125, 0.012481689453125, 0.02056884765625, 0.028656005859375, 0.0367431640625, 0.044830322265625, 0.05291748046875, 0.061004638671875, 0.069091796875, 0.077178955078125, 0.08526611328125, 0.093353271484375, 0.1014404296875, 0.109527587890625, 0.11761474609375, 0.125701904296875, 0.1337890625, 0.141876220703125, 0.14996337890625, 0.158050537109375, 0.1661376953125, 0.174224853515625, 0.18231201171875, 0.190399169921875, 0.198486328125, 0.206573486328125, 0.21466064453125, 0.222747802734375, 0.2308349609375, 0.238922119140625, 0.24700927734375, 0.255096435546875, 0.26318359375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 14.0, 18.0, 56.0, 103.0, 234.0, 257.0, 174.0, 82.0, 27.0, 16.0, 7.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2767488956451416, -2.2123172283172607, -2.147885799407959, -2.083454132080078, -2.0190224647521973, -1.954590916633606, -1.8901593685150146, -1.8257277011871338, -1.761296033859253, -1.6968644857406616, -1.6324328184127808, -1.5680012702941895, -1.5035696029663086, -1.4391380548477173, -1.374706506729126, -1.3102748394012451, -1.2458432912826538, -1.1814117431640625, -1.1169800758361816, -1.0525485277175903, -0.9881168603897095, -0.9236853122711182, -0.8592537045478821, -0.794822096824646, -0.7303904891014099, -0.6659588813781738, -0.6015272736549377, -0.5370956659317017, -0.47266408801078796, -0.4082324802875519, -0.3438009023666382, -0.2793692946434021, -0.21493756771087646, -0.15050595998764038, -0.08607436716556549, -0.0216427743434906, 0.04278883337974548, 0.10722044110298157, 0.17165201902389526, 0.23608362674713135, 0.30051523447036743, 0.3649468421936035, 0.4293784499168396, 0.4938100278377533, 0.558241605758667, 0.6226732730865479, 0.6871048212051392, 0.7515364289283752, 0.8159680366516113, 0.8803996443748474, 0.9448312520980835, 1.0092628002166748, 1.0736944675445557, 1.138126015663147, 1.2025575637817383, 1.2669892311096191, 1.3314208984375, 1.3958524465560913, 1.4602841138839722, 1.5247156620025635, 1.5891473293304443, 1.6535788774490356, 1.718010425567627, 1.7824420928955078, 1.8468736410140991]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 7.0, 10.0, 9.0, 25.0, 27.0, 41.0, 62.0, 87.0, 92.0, 115.0, 109.0, 91.0, 80.0, 78.0, 54.0, 47.0, 31.0, 19.0, 11.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1883189678192139, -1.1507377624511719, -1.1131565570831299, -1.0755754709243774, -1.0379942655563354, -1.0004130601882935, -0.9628318548202515, -0.9252506494522095, -0.8876695036888123, -0.8500882983207703, -0.812507152557373, -0.774925947189331, -0.7373447418212891, -0.6997635960578918, -0.6621823906898499, -0.6246012449264526, -0.5870200395584106, -0.5494388341903687, -0.5118576884269714, -0.47427648305892944, -0.43669530749320984, -0.39911413192749023, -0.36153292655944824, -0.32395175099372864, -0.28637057542800903, -0.24878939986228943, -0.21120820939540863, -0.17362701892852783, -0.13604584336280823, -0.09846466779708862, -0.060883477330207825, -0.023302286863327026, 0.014278888702392578, 0.05186007171869278, 0.08944125473499298, 0.12702244520187378, 0.16460362076759338, 0.202184796333313, 0.2397659868001938, 0.2773471772670746, 0.3149283528327942, 0.3525095283985138, 0.3900907039642334, 0.4276719093322754, 0.465253084897995, 0.5028342604637146, 0.5404154658317566, 0.5779966115951538, 0.6155778169631958, 0.6531590223312378, 0.690740168094635, 0.728321373462677, 0.7659025192260742, 0.8034837245941162, 0.8410649299621582, 0.8786461353302002, 0.9162272810935974, 0.9538084864616394, 0.9913896322250366, 1.0289708375930786, 1.0665520429611206, 1.104133129119873, 1.141714334487915, 1.179295539855957, 1.216876745223999]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 3.0, 7.0, 9.0, 17.0, 17.0, 27.0, 43.0, 46.0, 77.0, 124.0, 174.0, 267.0, 416.0, 706.0, 1075.0, 1977.0, 3734.0, 9273.0, 39604.0, 258004.0, 557540.0, 138747.0, 22790.0, 6711.0, 2963.0, 1597.0, 914.0, 574.0, 386.0, 230.0, 156.0, 112.0, 68.0, 61.0, 30.0, 27.0, 14.0, 13.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.476806640625, -0.4605522155761719, -0.44429779052734375, -0.4280433654785156, -0.4117889404296875, -0.3955345153808594, -0.37928009033203125, -0.3630256652832031, -0.346771240234375, -0.3305168151855469, -0.31426239013671875, -0.2980079650878906, -0.2817535400390625, -0.2654991149902344, -0.24924468994140625, -0.23299026489257812, -0.21673583984375, -0.20048141479492188, -0.18422698974609375, -0.16797256469726562, -0.1517181396484375, -0.13546371459960938, -0.11920928955078125, -0.10295486450195312, -0.086700439453125, -0.07044601440429688, -0.05419158935546875, -0.037937164306640625, -0.0216827392578125, -0.005428314208984375, 0.01082611083984375, 0.027080535888671875, 0.0433349609375, 0.059589385986328125, 0.07584381103515625, 0.09209823608398438, 0.1083526611328125, 0.12460708618164062, 0.14086151123046875, 0.15711593627929688, 0.173370361328125, 0.18962478637695312, 0.20587921142578125, 0.22213363647460938, 0.2383880615234375, 0.2546424865722656, 0.27089691162109375, 0.2871513366699219, 0.30340576171875, 0.3196601867675781, 0.33591461181640625, 0.3521690368652344, 0.3684234619140625, 0.3846778869628906, 0.40093231201171875, 0.4171867370605469, 0.433441162109375, 0.4496955871582031, 0.46595001220703125, 0.4822044372558594, 0.4984588623046875, 0.5147132873535156, 0.5309677124023438, 0.5472221374511719, 0.5634765625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 12.0, 14.0, 37.0, 63.0, 141.0, 156.0, 182.0, 143.0, 100.0, 64.0, 46.0, 19.0, 8.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1695556640625, -0.16399574279785156, -0.15843582153320312, -0.1528759002685547, -0.14731597900390625, -0.1417560577392578, -0.13619613647460938, -0.13063621520996094, -0.1250762939453125, -0.11951637268066406, -0.11395645141601562, -0.10839653015136719, -0.10283660888671875, -0.09727668762207031, -0.09171676635742188, -0.08615684509277344, -0.080596923828125, -0.07503700256347656, -0.06947708129882812, -0.06391716003417969, -0.05835723876953125, -0.05279731750488281, -0.047237396240234375, -0.04167747497558594, -0.0361175537109375, -0.030557632446289062, -0.024997711181640625, -0.019437789916992188, -0.01387786865234375, -0.008317947387695312, -0.002758026123046875, 0.0028018951416015625, 0.00836181640625, 0.013921737670898438, 0.019481658935546875, 0.025041580200195312, 0.03060150146484375, 0.03616142272949219, 0.041721343994140625, 0.04728126525878906, 0.0528411865234375, 0.05840110778808594, 0.06396102905273438, 0.06952095031738281, 0.07508087158203125, 0.08064079284667969, 0.08620071411132812, 0.09176063537597656, 0.097320556640625, 0.10288047790527344, 0.10844039916992188, 0.11400032043457031, 0.11956024169921875, 0.1251201629638672, 0.13068008422851562, 0.13624000549316406, 0.1417999267578125, 0.14735984802246094, 0.15291976928710938, 0.1584796905517578, 0.16403961181640625, 0.1695995330810547, 0.17515945434570312, 0.18071937561035156, 0.186279296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 6.0, 10.0, 4.0, 9.0, 12.0, 22.0, 29.0, 38.0, 64.0, 86.0, 142.0, 200.0, 328.0, 586.0, 1258.0, 2566.0, 6184.0, 15527.0, 41713.0, 113204.0, 260662.0, 323149.0, 174397.0, 67310.0, 24340.0, 9284.0, 3768.0, 1674.0, 796.0, 430.0, 269.0, 170.0, 96.0, 61.0, 36.0, 35.0, 33.0, 22.0, 15.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23876953125, -0.2311248779296875, -0.223480224609375, -0.2158355712890625, -0.20819091796875, -0.2005462646484375, -0.192901611328125, -0.1852569580078125, -0.1776123046875, -0.1699676513671875, -0.162322998046875, -0.1546783447265625, -0.14703369140625, -0.1393890380859375, -0.131744384765625, -0.1240997314453125, -0.116455078125, -0.1088104248046875, -0.101165771484375, -0.0935211181640625, -0.08587646484375, -0.0782318115234375, -0.070587158203125, -0.0629425048828125, -0.0552978515625, -0.0476531982421875, -0.040008544921875, -0.0323638916015625, -0.02471923828125, -0.0170745849609375, -0.009429931640625, -0.0017852783203125, 0.005859375, 0.0135040283203125, 0.021148681640625, 0.0287933349609375, 0.03643798828125, 0.0440826416015625, 0.051727294921875, 0.0593719482421875, 0.0670166015625, 0.0746612548828125, 0.082305908203125, 0.0899505615234375, 0.09759521484375, 0.1052398681640625, 0.112884521484375, 0.1205291748046875, 0.128173828125, 0.1358184814453125, 0.143463134765625, 0.1511077880859375, 0.15875244140625, 0.1663970947265625, 0.174041748046875, 0.1816864013671875, 0.1893310546875, 0.1969757080078125, 0.204620361328125, 0.2122650146484375, 0.21990966796875, 0.2275543212890625, 0.235198974609375, 0.2428436279296875, 0.25048828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 12.0, 9.0, 9.0, 15.0, 20.0, 31.0, 30.0, 34.0, 27.0, 34.0, 48.0, 36.0, 48.0, 41.0, 54.0, 52.0, 63.0, 50.0, 37.0, 33.0, 38.0, 35.0, 34.0, 30.0, 27.0, 24.0, 27.0, 23.0, 19.0, 9.0, 12.0, 7.0, 11.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2705078125, -0.2620391845703125, -0.253570556640625, -0.2451019287109375, -0.23663330078125, -0.2281646728515625, -0.219696044921875, -0.2112274169921875, -0.2027587890625, -0.1942901611328125, -0.185821533203125, -0.1773529052734375, -0.16888427734375, -0.1604156494140625, -0.151947021484375, -0.1434783935546875, -0.135009765625, -0.1265411376953125, -0.118072509765625, -0.1096038818359375, -0.10113525390625, -0.0926666259765625, -0.084197998046875, -0.0757293701171875, -0.0672607421875, -0.0587921142578125, -0.050323486328125, -0.0418548583984375, -0.03338623046875, -0.0249176025390625, -0.016448974609375, -0.0079803466796875, 0.00048828125, 0.0089569091796875, 0.017425537109375, 0.0258941650390625, 0.03436279296875, 0.0428314208984375, 0.051300048828125, 0.0597686767578125, 0.0682373046875, 0.0767059326171875, 0.085174560546875, 0.0936431884765625, 0.10211181640625, 0.1105804443359375, 0.119049072265625, 0.1275177001953125, 0.135986328125, 0.1444549560546875, 0.152923583984375, 0.1613922119140625, 0.16986083984375, 0.1783294677734375, 0.186798095703125, 0.1952667236328125, 0.2037353515625, 0.2122039794921875, 0.220672607421875, 0.2291412353515625, 0.23760986328125, 0.2460784912109375, 0.254547119140625, 0.2630157470703125, 0.271484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 9.0, 30.0, 48.0, 91.0, 160.0, 377.0, 941.0, 3014.0, 17009.0, 199610.0, 743008.0, 72529.0, 8673.0, 1826.0, 642.0, 304.0, 123.0, 63.0, 39.0, 26.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29931640625, -0.29084205627441406, -0.2823677062988281, -0.2738933563232422, -0.26541900634765625, -0.2569446563720703, -0.24847030639648438, -0.23999595642089844, -0.2315216064453125, -0.22304725646972656, -0.21457290649414062, -0.2060985565185547, -0.19762420654296875, -0.1891498565673828, -0.18067550659179688, -0.17220115661621094, -0.163726806640625, -0.15525245666503906, -0.14677810668945312, -0.1383037567138672, -0.12982940673828125, -0.12135505676269531, -0.11288070678710938, -0.10440635681152344, -0.0959320068359375, -0.08745765686035156, -0.07898330688476562, -0.07050895690917969, -0.06203460693359375, -0.05356025695800781, -0.045085906982421875, -0.03661155700683594, -0.02813720703125, -0.019662857055664062, -0.011188507080078125, -0.0027141571044921875, 0.00576019287109375, 0.014234542846679688, 0.022708892822265625, 0.031183242797851562, 0.0396575927734375, 0.04813194274902344, 0.056606292724609375, 0.06508064270019531, 0.07355499267578125, 0.08202934265136719, 0.09050369262695312, 0.09897804260253906, 0.107452392578125, 0.11592674255371094, 0.12440109252929688, 0.1328754425048828, 0.14134979248046875, 0.1498241424560547, 0.15829849243164062, 0.16677284240722656, 0.1752471923828125, 0.18372154235839844, 0.19219589233398438, 0.2006702423095703, 0.20914459228515625, 0.2176189422607422, 0.22609329223632812, 0.23456764221191406, 0.2430419921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 0.0, 6.0, 3.0, 5.0, 12.0, 15.0, 15.0, 15.0, 22.0, 31.0, 36.0, 39.0, 71.0, 77.0, 121.0, 91.0, 90.0, 74.0, 45.0, 61.0, 34.0, 30.0, 21.0, 20.0, 17.0, 12.0, 8.0, 10.0, 9.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.00019252300262451172, -0.00018721632659435272, -0.00018190965056419373, -0.00017660297453403473, -0.00017129629850387573, -0.00016598962247371674, -0.00016068294644355774, -0.00015537627041339874, -0.00015006959438323975, -0.00014476291835308075, -0.00013945624232292175, -0.00013414956629276276, -0.00012884289026260376, -0.00012353621423244476, -0.00011822953820228577, -0.00011292286217212677, -0.00010761618614196777, -0.00010230951011180878, -9.700283408164978e-05, -9.169615805149078e-05, -8.638948202133179e-05, -8.108280599117279e-05, -7.57761299610138e-05, -7.04694539308548e-05, -6.51627779006958e-05, -5.9856101870536804e-05, -5.454942584037781e-05, -4.924274981021881e-05, -4.3936073780059814e-05, -3.862939774990082e-05, -3.332272171974182e-05, -2.8016045689582825e-05, -2.2709369659423828e-05, -1.740269362926483e-05, -1.2096017599105835e-05, -6.789341568946838e-06, -1.4826655387878418e-06, 3.824010491371155e-06, 9.130686521530151e-06, 1.4437362551689148e-05, 1.9744038581848145e-05, 2.505071461200714e-05, 3.0357390642166138e-05, 3.5664066672325134e-05, 4.097074270248413e-05, 4.627741873264313e-05, 5.1584094762802124e-05, 5.689077079296112e-05, 6.219744682312012e-05, 6.750412285327911e-05, 7.281079888343811e-05, 7.811747491359711e-05, 8.34241509437561e-05, 8.87308269739151e-05, 9.40375030040741e-05, 9.93441790342331e-05, 0.00010465085506439209, 0.00010995753109455109, 0.00011526420712471008, 0.00012057088315486908, 0.00012587755918502808, 0.00013118423521518707, 0.00013649091124534607, 0.00014179758727550507, 0.00014710426330566406]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 5.0, 9.0, 10.0, 9.0, 18.0, 28.0, 28.0, 51.0, 75.0, 115.0, 212.0, 475.0, 969.0, 2424.0, 6487.0, 22147.0, 113709.0, 573240.0, 267960.0, 43195.0, 10759.0, 3656.0, 1454.0, 670.0, 343.0, 179.0, 95.0, 67.0, 36.0, 28.0, 19.0, 22.0, 11.0, 14.0, 6.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.203125, -0.19759368896484375, -0.1920623779296875, -0.18653106689453125, -0.180999755859375, -0.17546844482421875, -0.1699371337890625, -0.16440582275390625, -0.15887451171875, -0.15334320068359375, -0.1478118896484375, -0.14228057861328125, -0.136749267578125, -0.13121795654296875, -0.1256866455078125, -0.12015533447265625, -0.1146240234375, -0.10909271240234375, -0.1035614013671875, -0.09803009033203125, -0.092498779296875, -0.08696746826171875, -0.0814361572265625, -0.07590484619140625, -0.07037353515625, -0.06484222412109375, -0.0593109130859375, -0.05377960205078125, -0.048248291015625, -0.04271697998046875, -0.0371856689453125, -0.03165435791015625, -0.026123046875, -0.02059173583984375, -0.0150604248046875, -0.00952911376953125, -0.003997802734375, 0.00153350830078125, 0.0070648193359375, 0.01259613037109375, 0.01812744140625, 0.02365875244140625, 0.0291900634765625, 0.03472137451171875, 0.040252685546875, 0.04578399658203125, 0.0513153076171875, 0.05684661865234375, 0.0623779296875, 0.06790924072265625, 0.0734405517578125, 0.07897186279296875, 0.084503173828125, 0.09003448486328125, 0.0955657958984375, 0.10109710693359375, 0.10662841796875, 0.11215972900390625, 0.1176910400390625, 0.12322235107421875, 0.128753662109375, 0.13428497314453125, 0.1398162841796875, 0.14534759521484375, 0.15087890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 5.0, 9.0, 11.0, 14.0, 22.0, 29.0, 29.0, 50.0, 45.0, 50.0, 80.0, 81.0, 83.0, 82.0, 82.0, 68.0, 50.0, 38.0, 31.0, 30.0, 19.0, 15.0, 12.0, 13.0, 7.0, 10.0, 4.0, 6.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10626220703125, -0.1024026870727539, -0.09854316711425781, -0.09468364715576172, -0.09082412719726562, -0.08696460723876953, -0.08310508728027344, -0.07924556732177734, -0.07538604736328125, -0.07152652740478516, -0.06766700744628906, -0.06380748748779297, -0.059947967529296875, -0.05608844757080078, -0.05222892761230469, -0.048369407653808594, -0.0445098876953125, -0.040650367736816406, -0.03679084777832031, -0.03293132781982422, -0.029071807861328125, -0.02521228790283203, -0.021352767944335938, -0.017493247985839844, -0.01363372802734375, -0.009774208068847656, -0.0059146881103515625, -0.0020551681518554688, 0.001804351806640625, 0.005663871765136719, 0.009523391723632812, 0.013382911682128906, 0.017242431640625, 0.021101951599121094, 0.024961471557617188, 0.02882099151611328, 0.032680511474609375, 0.03654003143310547, 0.04039955139160156, 0.044259071350097656, 0.04811859130859375, 0.051978111267089844, 0.05583763122558594, 0.05969715118408203, 0.06355667114257812, 0.06741619110107422, 0.07127571105957031, 0.0751352310180664, 0.0789947509765625, 0.0828542709350586, 0.08671379089355469, 0.09057331085205078, 0.09443283081054688, 0.09829235076904297, 0.10215187072753906, 0.10601139068603516, 0.10987091064453125, 0.11373043060302734, 0.11758995056152344, 0.12144947052001953, 0.12530899047851562, 0.12916851043701172, 0.1330280303955078, 0.1368875503540039, 0.1407470703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 32.0, 43.0, 119.0, 192.0, 222.0, 176.0, 109.0, 59.0, 26.0, 11.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.015063285827637, -5.893158912658691, -5.771254539489746, -5.649350166320801, -5.5274457931518555, -5.40554141998291, -5.283637046813965, -5.161733150482178, -5.039828777313232, -4.917924404144287, -4.796020030975342, -4.6741156578063965, -4.552211284637451, -4.430307388305664, -4.308403015136719, -4.186498641967773, -4.064594268798828, -3.942689895629883, -3.8207855224609375, -3.698881149291992, -3.576977014541626, -3.4550726413726807, -3.3331682682037354, -3.21126389503479, -3.0893592834472656, -2.9674549102783203, -2.845550537109375, -2.7236461639404297, -2.6017420291900635, -2.479837656021118, -2.357933282852173, -2.2360289096832275, -2.1141250133514404, -1.9922206401824951, -1.8703163862228394, -1.748412013053894, -1.6265077590942383, -1.504603385925293, -1.3826990127563477, -1.2607946395874023, -1.1388903856277466, -1.0169860124588013, -0.8950817584991455, -0.7731773853302002, -0.6512730717658997, -0.5293687582015991, -0.4074643850326538, -0.28556007146835327, -0.16365575790405273, -0.041751429438591, 0.08015289902687073, 0.20205724239349365, 0.3239615559577942, 0.4458658695220947, 0.56777024269104, 0.6896745562553406, 0.8115788698196411, 0.9334831833839417, 1.0553874969482422, 1.1772918701171875, 1.2991962432861328, 1.4211004972457886, 1.5430048704147339, 1.6649091243743896, 1.786813497543335]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 9.0, 4.0, 14.0, 9.0, 14.0, 13.0, 22.0, 17.0, 18.0, 33.0, 38.0, 33.0, 47.0, 44.0, 40.0, 51.0, 49.0, 42.0, 50.0, 45.0, 61.0, 51.0, 53.0, 34.0, 31.0, 26.0, 34.0, 24.0, 20.0, 14.0, 18.0, 10.0, 8.0, 7.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.8470747470855713, -1.7968776226043701, -1.746680498123169, -1.6964833736419678, -1.6462862491607666, -1.5960891246795654, -1.5458920001983643, -1.495694875717163, -1.445497751235962, -1.3953006267547607, -1.3451035022735596, -1.2949063777923584, -1.2447092533111572, -1.194512128829956, -1.1443150043487549, -1.0941178798675537, -1.0439207553863525, -0.9937236309051514, -0.9435265064239502, -0.893329381942749, -0.8431322574615479, -0.7929351329803467, -0.7427380084991455, -0.6925408840179443, -0.6423436403274536, -0.5921465158462524, -0.5419493913650513, -0.4917522668838501, -0.4415551424026489, -0.39135798811912537, -0.3411608636379242, -0.290963739156723, -0.24076664447784424, -0.19056951999664307, -0.1403723955154419, -0.09017525613307953, -0.03997813165187836, 0.010219007730484009, 0.06041613221168518, 0.11061325669288635, 0.16081038117408752, 0.2110075056552887, 0.26120463013648987, 0.3114017844200134, 0.3615989089012146, 0.41179603338241577, 0.46199315786361694, 0.5121902823448181, 0.5623874068260193, 0.6125845313072205, 0.6627816557884216, 0.7129787802696228, 0.763175904750824, 0.8133730888366699, 0.8635702133178711, 0.9137673377990723, 0.9639644622802734, 1.0141615867614746, 1.0643587112426758, 1.114555835723877, 1.1647529602050781, 1.2149500846862793, 1.2651472091674805, 1.3153443336486816, 1.3655414581298828]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 7.0, 9.0, 17.0, 22.0, 26.0, 43.0, 44.0, 85.0, 107.0, 164.0, 256.0, 495.0, 901.0, 2141.0, 6961.0, 43977.0, 3695548.0, 413808.0, 21723.0, 4623.0, 1568.0, 700.0, 383.0, 245.0, 145.0, 88.0, 54.0, 49.0, 34.0, 22.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62841796875, -0.608673095703125, -0.58892822265625, -0.569183349609375, -0.5494384765625, -0.529693603515625, -0.50994873046875, -0.490203857421875, -0.470458984375, -0.450714111328125, -0.43096923828125, -0.411224365234375, -0.3914794921875, -0.371734619140625, -0.35198974609375, -0.332244873046875, -0.3125, -0.292755126953125, -0.27301025390625, -0.253265380859375, -0.2335205078125, -0.213775634765625, -0.19403076171875, -0.174285888671875, -0.154541015625, -0.134796142578125, -0.11505126953125, -0.095306396484375, -0.0755615234375, -0.055816650390625, -0.03607177734375, -0.016326904296875, 0.00341796875, 0.023162841796875, 0.04290771484375, 0.062652587890625, 0.0823974609375, 0.102142333984375, 0.12188720703125, 0.141632080078125, 0.161376953125, 0.181121826171875, 0.20086669921875, 0.220611572265625, 0.2403564453125, 0.260101318359375, 0.27984619140625, 0.299591064453125, 0.3193359375, 0.339080810546875, 0.35882568359375, 0.378570556640625, 0.3983154296875, 0.418060302734375, 0.43780517578125, 0.457550048828125, 0.477294921875, 0.497039794921875, 0.51678466796875, 0.536529541015625, 0.5562744140625, 0.576019287109375, 0.59576416015625, 0.615509033203125, 0.63525390625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 4.0, 13.0, 21.0, 37.0, 85.0, 130.0, 152.0, 154.0, 127.0, 109.0, 72.0, 39.0, 22.0, 13.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1810302734375, -0.17525672912597656, -0.16948318481445312, -0.1637096405029297, -0.15793609619140625, -0.1521625518798828, -0.14638900756835938, -0.14061546325683594, -0.1348419189453125, -0.12906837463378906, -0.12329483032226562, -0.11752128601074219, -0.11174774169921875, -0.10597419738769531, -0.10020065307617188, -0.09442710876464844, -0.088653564453125, -0.08288002014160156, -0.07710647583007812, -0.07133293151855469, -0.06555938720703125, -0.05978584289550781, -0.054012298583984375, -0.04823875427246094, -0.0424652099609375, -0.03669166564941406, -0.030918121337890625, -0.025144577026367188, -0.01937103271484375, -0.013597488403320312, -0.007823944091796875, -0.0020503997802734375, 0.00372314453125, 0.009496688842773438, 0.015270233154296875, 0.021043777465820312, 0.02681732177734375, 0.03259086608886719, 0.038364410400390625, 0.04413795471191406, 0.0499114990234375, 0.05568504333496094, 0.061458587646484375, 0.06723213195800781, 0.07300567626953125, 0.07877922058105469, 0.08455276489257812, 0.09032630920410156, 0.096099853515625, 0.10187339782714844, 0.10764694213867188, 0.11342048645019531, 0.11919403076171875, 0.12496757507324219, 0.13074111938476562, 0.13651466369628906, 0.1422882080078125, 0.14806175231933594, 0.15383529663085938, 0.1596088409423828, 0.16538238525390625, 0.1711559295654297, 0.17692947387695312, 0.18270301818847656, 0.1884765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 10.0, 10.0, 9.0, 19.0, 25.0, 35.0, 43.0, 61.0, 75.0, 114.0, 151.0, 248.0, 358.0, 536.0, 847.0, 1632.0, 3737.0, 9599.0, 31719.0, 150967.0, 2844896.0, 1022017.0, 91255.0, 21975.0, 7133.0, 2954.0, 1489.0, 820.0, 437.0, 338.0, 221.0, 171.0, 108.0, 77.0, 50.0, 44.0, 27.0, 17.0, 17.0, 7.0, 6.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.250244140625, -0.24186325073242188, -0.23348236083984375, -0.22510147094726562, -0.2167205810546875, -0.20833969116210938, -0.19995880126953125, -0.19157791137695312, -0.183197021484375, -0.17481613159179688, -0.16643524169921875, -0.15805435180664062, -0.1496734619140625, -0.14129257202148438, -0.13291168212890625, -0.12453079223632812, -0.11614990234375, -0.10776901245117188, -0.09938812255859375, -0.09100723266601562, -0.0826263427734375, -0.07424545288085938, -0.06586456298828125, -0.057483673095703125, -0.049102783203125, -0.040721893310546875, -0.03234100341796875, -0.023960113525390625, -0.0155792236328125, -0.007198333740234375, 0.00118255615234375, 0.009563446044921875, 0.0179443359375, 0.026325225830078125, 0.03470611572265625, 0.043087005615234375, 0.0514678955078125, 0.059848785400390625, 0.06822967529296875, 0.07661056518554688, 0.084991455078125, 0.09337234497070312, 0.10175323486328125, 0.11013412475585938, 0.1185150146484375, 0.12689590454101562, 0.13527679443359375, 0.14365768432617188, 0.15203857421875, 0.16041946411132812, 0.16880035400390625, 0.17718124389648438, 0.1855621337890625, 0.19394302368164062, 0.20232391357421875, 0.21070480346679688, 0.219085693359375, 0.22746658325195312, 0.23584747314453125, 0.24422836303710938, 0.2526092529296875, 0.2609901428222656, 0.26937103271484375, 0.2777519226074219, 0.2861328125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 10.0, 19.0, 32.0, 44.0, 72.0, 152.0, 405.0, 1441.0, 1204.0, 331.0, 165.0, 82.0, 40.0, 26.0, 16.0, 7.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154296875, -0.1493091583251953, -0.14432144165039062, -0.13933372497558594, -0.13434600830078125, -0.12935829162597656, -0.12437057495117188, -0.11938285827636719, -0.1143951416015625, -0.10940742492675781, -0.10441970825195312, -0.09943199157714844, -0.09444427490234375, -0.08945655822753906, -0.08446884155273438, -0.07948112487792969, -0.074493408203125, -0.06950569152832031, -0.06451797485351562, -0.05953025817871094, -0.05454254150390625, -0.04955482482910156, -0.044567108154296875, -0.03957939147949219, -0.0345916748046875, -0.029603958129882812, -0.024616241455078125, -0.019628524780273438, -0.01464080810546875, -0.009653091430664062, -0.004665374755859375, 0.0003223419189453125, 0.00531005859375, 0.010297775268554688, 0.015285491943359375, 0.020273208618164062, 0.02526092529296875, 0.030248641967773438, 0.035236358642578125, 0.04022407531738281, 0.0452117919921875, 0.05019950866699219, 0.055187225341796875, 0.06017494201660156, 0.06516265869140625, 0.07015037536621094, 0.07513809204101562, 0.08012580871582031, 0.085113525390625, 0.09010124206542969, 0.09508895874023438, 0.10007667541503906, 0.10506439208984375, 0.11005210876464844, 0.11503982543945312, 0.12002754211425781, 0.1250152587890625, 0.1300029754638672, 0.13499069213867188, 0.13997840881347656, 0.14496612548828125, 0.14995384216308594, 0.15494155883789062, 0.1599292755126953, 0.1649169921875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 18.0, 35.0, 70.0, 115.0, 217.0, 236.0, 131.0, 90.0, 44.0, 17.0, 8.0, 7.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9648955464363098, -0.9337611794471741, -0.9026267528533936, -0.8714923858642578, -0.8403580188751221, -0.8092235922813416, -0.7780892252922058, -0.7469547986984253, -0.7158204317092896, -0.6846860647201538, -0.6535516381263733, -0.6224172711372375, -0.591282844543457, -0.5601484775543213, -0.5290141105651855, -0.4978797137737274, -0.4667453169822693, -0.43561092019081116, -0.404476523399353, -0.3733421564102173, -0.34220775961875916, -0.311073362827301, -0.2799389958381653, -0.24880459904670715, -0.21767020225524902, -0.1865358054637909, -0.15540142357349396, -0.12426703423261642, -0.09313264489173889, -0.06199824810028076, -0.030863866209983826, 0.00027051568031311035, 0.031404972076416016, 0.06253936141729355, 0.09367375075817108, 0.12480814009904861, 0.15594252943992615, 0.18707692623138428, 0.2182113081216812, 0.24934569001197815, 0.2804800868034363, 0.3116144835948944, 0.34274888038635254, 0.3738832473754883, 0.4050176441669464, 0.43615204095840454, 0.4672864079475403, 0.4984208047389984, 0.5295552015304565, 0.5606895685195923, 0.5918239951133728, 0.6229583621025085, 0.6540927886962891, 0.6852271556854248, 0.7163615226745605, 0.7474958896636963, 0.7786303162574768, 0.8097646832466125, 0.8408991098403931, 0.8720334768295288, 0.9031678438186646, 0.9343022704124451, 0.9654366374015808, 0.9965710639953613, 1.027705430984497]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 2.0, 9.0, 6.0, 13.0, 11.0, 16.0, 25.0, 23.0, 34.0, 34.0, 37.0, 38.0, 46.0, 52.0, 53.0, 60.0, 50.0, 53.0, 51.0, 54.0, 51.0, 42.0, 39.0, 40.0, 32.0, 23.0, 25.0, 19.0, 14.0, 13.0, 15.0, 3.0, 5.0, 4.0, 5.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3352075219154358, -0.321824848651886, -0.3084421753883362, -0.2950595021247864, -0.28167685866355896, -0.26829418540000916, -0.25491151213645935, -0.24152883887290955, -0.22814618051052094, -0.21476350724697113, -0.20138084888458252, -0.18799817562103271, -0.1746155023574829, -0.1612328439950943, -0.1478501707315445, -0.13446751236915588, -0.12108483910560608, -0.10770217329263687, -0.09431950747966766, -0.08093683421611786, -0.06755416840314865, -0.05417150259017944, -0.04078882932662964, -0.02740616351366043, -0.014023497700691223, -0.0006408300250768661, 0.01274183765053749, 0.026124507188796997, 0.039507173001766205, 0.05288983881473541, 0.06627251207828522, 0.07965517789125443, 0.09303784370422363, 0.10642050951719284, 0.11980317533016205, 0.13318584859371185, 0.14656850695610046, 0.15995118021965027, 0.17333385348320007, 0.18671652674674988, 0.2000991851091385, 0.2134818583726883, 0.2268645167350769, 0.2402471899986267, 0.2536298632621765, 0.2670125365257263, 0.2803952097892761, 0.29377785325050354, 0.30716052651405334, 0.32054319977760315, 0.33392587304115295, 0.34730851650238037, 0.3606911897659302, 0.37407386302948, 0.3874565362930298, 0.4008392095565796, 0.4142218828201294, 0.4276045560836792, 0.440987229347229, 0.4543699026107788, 0.4677525460720062, 0.48113521933555603, 0.49451789259910583, 0.5079005360603333, 0.5212832093238831]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 10.0, 9.0, 14.0, 28.0, 37.0, 55.0, 82.0, 122.0, 187.0, 266.0, 389.0, 640.0, 1075.0, 1883.0, 3900.0, 10214.0, 39248.0, 227427.0, 553411.0, 163899.0, 29613.0, 8269.0, 3462.0, 1656.0, 1013.0, 566.0, 341.0, 221.0, 146.0, 99.0, 76.0, 44.0, 49.0, 25.0, 17.0, 15.0, 11.0, 9.0, 8.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51708984375, -0.5006256103515625, -0.484161376953125, -0.4676971435546875, -0.45123291015625, -0.4347686767578125, -0.418304443359375, -0.4018402099609375, -0.3853759765625, -0.3689117431640625, -0.352447509765625, -0.3359832763671875, -0.31951904296875, -0.3030548095703125, -0.286590576171875, -0.2701263427734375, -0.253662109375, -0.2371978759765625, -0.220733642578125, -0.2042694091796875, -0.18780517578125, -0.1713409423828125, -0.154876708984375, -0.1384124755859375, -0.1219482421875, -0.1054840087890625, -0.089019775390625, -0.0725555419921875, -0.05609130859375, -0.0396270751953125, -0.023162841796875, -0.0066986083984375, 0.009765625, 0.0262298583984375, 0.042694091796875, 0.0591583251953125, 0.07562255859375, 0.0920867919921875, 0.108551025390625, 0.1250152587890625, 0.1414794921875, 0.1579437255859375, 0.174407958984375, 0.1908721923828125, 0.20733642578125, 0.2238006591796875, 0.240264892578125, 0.2567291259765625, 0.273193359375, 0.2896575927734375, 0.306121826171875, 0.3225860595703125, 0.33905029296875, 0.3555145263671875, 0.371978759765625, 0.3884429931640625, 0.4049072265625, 0.4213714599609375, 0.437835693359375, 0.4542999267578125, 0.47076416015625, 0.4872283935546875, 0.503692626953125, 0.5201568603515625, 0.53662109375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 7.0, 12.0, 24.0, 38.0, 75.0, 123.0, 151.0, 162.0, 146.0, 96.0, 70.0, 38.0, 28.0, 16.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1845703125, -0.17869949340820312, -0.17282867431640625, -0.16695785522460938, -0.1610870361328125, -0.15521621704101562, -0.14934539794921875, -0.14347457885742188, -0.137603759765625, -0.13173294067382812, -0.12586212158203125, -0.11999130249023438, -0.1141204833984375, -0.10824966430664062, -0.10237884521484375, -0.09650802612304688, -0.09063720703125, -0.08476638793945312, -0.07889556884765625, -0.07302474975585938, -0.0671539306640625, -0.061283111572265625, -0.05541229248046875, -0.049541473388671875, -0.043670654296875, -0.037799835205078125, -0.03192901611328125, -0.026058197021484375, -0.0201873779296875, -0.014316558837890625, -0.00844573974609375, -0.002574920654296875, 0.0032958984375, 0.009166717529296875, 0.01503753662109375, 0.020908355712890625, 0.0267791748046875, 0.032649993896484375, 0.03852081298828125, 0.044391632080078125, 0.050262451171875, 0.056133270263671875, 0.06200408935546875, 0.06787490844726562, 0.0737457275390625, 0.07961654663085938, 0.08548736572265625, 0.09135818481445312, 0.09722900390625, 0.10309982299804688, 0.10897064208984375, 0.11484146118164062, 0.1207122802734375, 0.12658309936523438, 0.13245391845703125, 0.13832473754882812, 0.144195556640625, 0.15006637573242188, 0.15593719482421875, 0.16180801391601562, 0.1676788330078125, 0.17354965209960938, 0.17942047119140625, 0.18529129028320312, 0.191162109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 1.0, 7.0, 7.0, 9.0, 18.0, 27.0, 30.0, 30.0, 49.0, 59.0, 77.0, 116.0, 184.0, 257.0, 447.0, 715.0, 1344.0, 2809.0, 6233.0, 14073.0, 33113.0, 79818.0, 179161.0, 290369.0, 237390.0, 115940.0, 48725.0, 20349.0, 8896.0, 3843.0, 1863.0, 1035.0, 540.0, 307.0, 187.0, 148.0, 109.0, 63.0, 64.0, 36.0, 23.0, 25.0, 14.0, 15.0, 6.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.204833984375, -0.1981658935546875, -0.191497802734375, -0.1848297119140625, -0.17816162109375, -0.1714935302734375, -0.164825439453125, -0.1581573486328125, -0.1514892578125, -0.1448211669921875, -0.138153076171875, -0.1314849853515625, -0.12481689453125, -0.1181488037109375, -0.111480712890625, -0.1048126220703125, -0.09814453125, -0.0914764404296875, -0.084808349609375, -0.0781402587890625, -0.07147216796875, -0.0648040771484375, -0.058135986328125, -0.0514678955078125, -0.0447998046875, -0.0381317138671875, -0.031463623046875, -0.0247955322265625, -0.01812744140625, -0.0114593505859375, -0.004791259765625, 0.0018768310546875, 0.008544921875, 0.0152130126953125, 0.021881103515625, 0.0285491943359375, 0.03521728515625, 0.0418853759765625, 0.048553466796875, 0.0552215576171875, 0.0618896484375, 0.0685577392578125, 0.075225830078125, 0.0818939208984375, 0.08856201171875, 0.0952301025390625, 0.101898193359375, 0.1085662841796875, 0.115234375, 0.1219024658203125, 0.128570556640625, 0.1352386474609375, 0.14190673828125, 0.1485748291015625, 0.155242919921875, 0.1619110107421875, 0.1685791015625, 0.1752471923828125, 0.181915283203125, 0.1885833740234375, 0.19525146484375, 0.2019195556640625, 0.208587646484375, 0.2152557373046875, 0.221923828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 9.0, 8.0, 12.0, 10.0, 4.0, 16.0, 12.0, 14.0, 15.0, 11.0, 23.0, 30.0, 21.0, 21.0, 38.0, 32.0, 35.0, 44.0, 20.0, 40.0, 31.0, 37.0, 53.0, 48.0, 40.0, 45.0, 35.0, 32.0, 35.0, 33.0, 21.0, 30.0, 18.0, 23.0, 15.0, 18.0, 15.0, 21.0, 5.0, 10.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.270263671875, -0.26224708557128906, -0.2542304992675781, -0.2462139129638672, -0.23819732666015625, -0.2301807403564453, -0.22216415405273438, -0.21414756774902344, -0.2061309814453125, -0.19811439514160156, -0.19009780883789062, -0.1820812225341797, -0.17406463623046875, -0.1660480499267578, -0.15803146362304688, -0.15001487731933594, -0.141998291015625, -0.13398170471191406, -0.12596511840820312, -0.11794853210449219, -0.10993194580078125, -0.10191535949707031, -0.09389877319335938, -0.08588218688964844, -0.0778656005859375, -0.06984901428222656, -0.061832427978515625, -0.05381584167480469, -0.04579925537109375, -0.03778266906738281, -0.029766082763671875, -0.021749496459960938, -0.01373291015625, -0.0057163238525390625, 0.002300262451171875, 0.010316848754882812, 0.01833343505859375, 0.026350021362304688, 0.034366607666015625, 0.04238319396972656, 0.0503997802734375, 0.05841636657714844, 0.06643295288085938, 0.07444953918457031, 0.08246612548828125, 0.09048271179199219, 0.09849929809570312, 0.10651588439941406, 0.114532470703125, 0.12254905700683594, 0.13056564331054688, 0.1385822296142578, 0.14659881591796875, 0.1546154022216797, 0.16263198852539062, 0.17064857482910156, 0.1786651611328125, 0.18668174743652344, 0.19469833374023438, 0.2027149200439453, 0.21073150634765625, 0.2187480926513672, 0.22676467895507812, 0.23478126525878906, 0.2427978515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 10.0, 12.0, 19.0, 24.0, 58.0, 105.0, 165.0, 416.0, 1016.0, 3122.0, 11667.0, 63763.0, 439215.0, 446483.0, 65424.0, 12011.0, 3137.0, 1004.0, 453.0, 197.0, 104.0, 63.0, 25.0, 15.0, 16.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1702880859375, -0.16441726684570312, -0.15854644775390625, -0.15267562866210938, -0.1468048095703125, -0.14093399047851562, -0.13506317138671875, -0.12919235229492188, -0.123321533203125, -0.11745071411132812, -0.11157989501953125, -0.10570907592773438, -0.0998382568359375, -0.09396743774414062, -0.08809661865234375, -0.08222579956054688, -0.07635498046875, -0.07048416137695312, -0.06461334228515625, -0.058742523193359375, -0.0528717041015625, -0.047000885009765625, -0.04113006591796875, -0.035259246826171875, -0.029388427734375, -0.023517608642578125, -0.01764678955078125, -0.011775970458984375, -0.0059051513671875, -3.4332275390625e-05, 0.00583648681640625, 0.011707305908203125, 0.017578125, 0.023448944091796875, 0.02931976318359375, 0.035190582275390625, 0.0410614013671875, 0.046932220458984375, 0.05280303955078125, 0.058673858642578125, 0.064544677734375, 0.07041549682617188, 0.07628631591796875, 0.08215713500976562, 0.0880279541015625, 0.09389877319335938, 0.09976959228515625, 0.10564041137695312, 0.11151123046875, 0.11738204956054688, 0.12325286865234375, 0.12912368774414062, 0.1349945068359375, 0.14086532592773438, 0.14673614501953125, 0.15260696411132812, 0.158477783203125, 0.16434860229492188, 0.17021942138671875, 0.17609024047851562, 0.1819610595703125, 0.18783187866210938, 0.19370269775390625, 0.19957351684570312, 0.2054443359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 10.0, 7.0, 8.0, 14.0, 19.0, 26.0, 24.0, 37.0, 37.0, 45.0, 42.0, 50.0, 78.0, 92.0, 76.0, 73.0, 51.0, 44.0, 42.0, 46.0, 32.0, 32.0, 26.0, 18.0, 10.0, 13.0, 9.0, 6.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0], "bins": [-0.00014710426330566406, -0.00014321133494377136, -0.00013931840658187866, -0.00013542547821998596, -0.00013153254985809326, -0.00012763962149620056, -0.00012374669313430786, -0.00011985376477241516, -0.00011596083641052246, -0.00011206790804862976, -0.00010817497968673706, -0.00010428205132484436, -0.00010038912296295166, -9.649619460105896e-05, -9.260326623916626e-05, -8.871033787727356e-05, -8.481740951538086e-05, -8.092448115348816e-05, -7.703155279159546e-05, -7.313862442970276e-05, -6.924569606781006e-05, -6.535276770591736e-05, -6.145983934402466e-05, -5.756691098213196e-05, -5.367398262023926e-05, -4.978105425834656e-05, -4.588812589645386e-05, -4.199519753456116e-05, -3.810226917266846e-05, -3.420934081077576e-05, -3.0316412448883057e-05, -2.6423484086990356e-05, -2.2530555725097656e-05, -1.8637627363204956e-05, -1.4744699001312256e-05, -1.0851770639419556e-05, -6.9588422775268555e-06, -3.0659139156341553e-06, 8.270144462585449e-07, 4.719942808151245e-06, 8.612871170043945e-06, 1.2505799531936646e-05, 1.6398727893829346e-05, 2.0291656255722046e-05, 2.4184584617614746e-05, 2.8077512979507446e-05, 3.1970441341400146e-05, 3.586336970329285e-05, 3.975629806518555e-05, 4.364922642707825e-05, 4.754215478897095e-05, 5.143508315086365e-05, 5.532801151275635e-05, 5.922093987464905e-05, 6.311386823654175e-05, 6.700679659843445e-05, 7.089972496032715e-05, 7.479265332221985e-05, 7.868558168411255e-05, 8.257851004600525e-05, 8.647143840789795e-05, 9.036436676979065e-05, 9.425729513168335e-05, 9.815022349357605e-05, 0.00010204315185546875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 5.0, 12.0, 21.0, 34.0, 62.0, 110.0, 236.0, 632.0, 2151.0, 11465.0, 102045.0, 746082.0, 165002.0, 16465.0, 2867.0, 793.0, 272.0, 128.0, 68.0, 33.0, 21.0, 15.0, 15.0, 6.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.208740234375, -0.20058441162109375, -0.1924285888671875, -0.18427276611328125, -0.176116943359375, -0.16796112060546875, -0.1598052978515625, -0.15164947509765625, -0.14349365234375, -0.13533782958984375, -0.1271820068359375, -0.11902618408203125, -0.110870361328125, -0.10271453857421875, -0.0945587158203125, -0.08640289306640625, -0.0782470703125, -0.07009124755859375, -0.0619354248046875, -0.05377960205078125, -0.045623779296875, -0.03746795654296875, -0.0293121337890625, -0.02115631103515625, -0.01300048828125, -0.00484466552734375, 0.0033111572265625, 0.01146697998046875, 0.019622802734375, 0.02777862548828125, 0.0359344482421875, 0.04409027099609375, 0.05224609375, 0.06040191650390625, 0.0685577392578125, 0.07671356201171875, 0.084869384765625, 0.09302520751953125, 0.1011810302734375, 0.10933685302734375, 0.11749267578125, 0.12564849853515625, 0.1338043212890625, 0.14196014404296875, 0.150115966796875, 0.15827178955078125, 0.1664276123046875, 0.17458343505859375, 0.1827392578125, 0.19089508056640625, 0.1990509033203125, 0.20720672607421875, 0.215362548828125, 0.22351837158203125, 0.2316741943359375, 0.23983001708984375, 0.24798583984375, 0.25614166259765625, 0.2642974853515625, 0.27245330810546875, 0.280609130859375, 0.28876495361328125, 0.2969207763671875, 0.30507659912109375, 0.313232421875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 9.0, 4.0, 10.0, 7.0, 7.0, 9.0, 14.0, 10.0, 14.0, 28.0, 23.0, 43.0, 33.0, 41.0, 53.0, 64.0, 67.0, 67.0, 54.0, 50.0, 58.0, 64.0, 41.0, 40.0, 30.0, 28.0, 28.0, 19.0, 10.0, 11.0, 11.0, 10.0, 10.0, 6.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.08319091796875, -0.0801401138305664, -0.07708930969238281, -0.07403850555419922, -0.07098770141601562, -0.06793689727783203, -0.06488609313964844, -0.061835289001464844, -0.05878448486328125, -0.055733680725097656, -0.05268287658691406, -0.04963207244873047, -0.046581268310546875, -0.04353046417236328, -0.04047966003417969, -0.037428855895996094, -0.0343780517578125, -0.031327247619628906, -0.028276443481445312, -0.02522563934326172, -0.022174835205078125, -0.01912403106689453, -0.016073226928710938, -0.013022422790527344, -0.00997161865234375, -0.006920814514160156, -0.0038700103759765625, -0.0008192062377929688, 0.002231597900390625, 0.005282402038574219, 0.008333206176757812, 0.011384010314941406, 0.014434814453125, 0.017485618591308594, 0.020536422729492188, 0.02358722686767578, 0.026638031005859375, 0.02968883514404297, 0.03273963928222656, 0.035790443420410156, 0.03884124755859375, 0.041892051696777344, 0.04494285583496094, 0.04799365997314453, 0.051044464111328125, 0.05409526824951172, 0.05714607238769531, 0.060196876525878906, 0.0632476806640625, 0.0662984848022461, 0.06934928894042969, 0.07240009307861328, 0.07545089721679688, 0.07850170135498047, 0.08155250549316406, 0.08460330963134766, 0.08765411376953125, 0.09070491790771484, 0.09375572204589844, 0.09680652618408203, 0.09985733032226562, 0.10290813446044922, 0.10595893859863281, 0.1090097427368164, 0.112060546875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 17.0, 36.0, 108.0, 316.0, 329.0, 129.0, 47.0, 13.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.66799545288086, -8.487131118774414, -8.306265830993652, -8.125401496887207, -7.9445366859436035, -7.763671875, -7.5828070640563965, -7.401942253112793, -7.221077919006348, -7.040213108062744, -6.859348297119141, -6.678483963012695, -6.497619152069092, -6.316754341125488, -6.135889530181885, -5.955024719238281, -5.774159908294678, -5.593295097351074, -5.412430286407471, -5.231565475463867, -5.050701141357422, -4.869836330413818, -4.688971519470215, -4.508106708526611, -4.327241897583008, -4.146377086639404, -3.96551251411438, -3.7846477031707764, -3.603783130645752, -3.4229183197021484, -3.242053508758545, -3.0611886978149414, -2.8803248405456543, -2.699460029602051, -2.5185954570770264, -2.337730646133423, -2.1568660736083984, -1.976001262664795, -1.7951364517211914, -1.6142717599868774, -1.4334070682525635, -1.2525423765182495, -1.0716776847839355, -0.890812873840332, -0.7099481821060181, -0.5290834903717041, -0.3482186794281006, -0.16735398769378662, 0.013510704040527344, 0.1943754255771637, 0.37524014711380005, 0.5561048984527588, 0.7369695901870728, 0.9178342819213867, 1.0986990928649902, 1.2795637845993042, 1.4604284763336182, 1.6412931680679321, 1.822157859802246, 2.0030226707458496, 2.183887481689453, 2.3647520542144775, 2.545616865158081, 2.7264814376831055, 2.907346248626709]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 10.0, 7.0, 6.0, 10.0, 18.0, 15.0, 15.0, 17.0, 28.0, 35.0, 34.0, 34.0, 25.0, 45.0, 34.0, 44.0, 56.0, 43.0, 43.0, 50.0, 39.0, 41.0, 39.0, 40.0, 32.0, 37.0, 30.0, 24.0, 35.0, 18.0, 14.0, 19.0, 10.0, 8.0, 8.0, 3.0, 4.0, 7.0, 3.0, 4.0, 7.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0], "bins": [-1.8163119554519653, -1.7647607326507568, -1.7132095098495483, -1.6616582870483398, -1.6101070642471313, -1.5585558414459229, -1.507004737854004, -1.4554533958435059, -1.403902292251587, -1.3523510694503784, -1.30079984664917, -1.2492486238479614, -1.197697401046753, -1.1461461782455444, -1.094594955444336, -1.043043851852417, -0.991492509841919, -0.9399412870407104, -0.888390064239502, -0.8368388414382935, -0.785287618637085, -0.7337363958358765, -0.6821852326393127, -0.6306340098381042, -0.5790827870368958, -0.5275315642356873, -0.47598034143447876, -0.42442914843559265, -0.37287792563438416, -0.32132670283317566, -0.26977550983428955, -0.21822428703308105, -0.1666731834411621, -0.11512196809053421, -0.06357075273990631, -0.012019544839859009, 0.03953167796134949, 0.09108290076255798, 0.1426340937614441, 0.1941853165626526, 0.24573653936386108, 0.2972877621650696, 0.3488389849662781, 0.4003901779651642, 0.4519414007663727, 0.5034925937652588, 0.5550438165664673, 0.6065950393676758, 0.6581462621688843, 0.7096974849700928, 0.7612487077713013, 0.8127999305725098, 0.8643511533737183, 0.9159023761749268, 0.9674535393714905, 1.0190048217773438, 1.0705559253692627, 1.1221071481704712, 1.1736583709716797, 1.2252095937728882, 1.2767608165740967, 1.3283120393753052, 1.3798632621765137, 1.4314143657684326, 1.4829657077789307]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 5.0, 7.0, 8.0, 23.0, 40.0, 63.0, 89.0, 206.0, 370.0, 808.0, 2435.0, 14435.0, 1829623.0, 2326201.0, 15542.0, 2661.0, 931.0, 420.0, 175.0, 88.0, 62.0, 34.0, 13.0, 12.0, 9.0, 2.0, 4.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.810546875, -0.7805328369140625, -0.750518798828125, -0.7205047607421875, -0.69049072265625, -0.6604766845703125, -0.630462646484375, -0.6004486083984375, -0.5704345703125, -0.5404205322265625, -0.510406494140625, -0.4803924560546875, -0.45037841796875, -0.4203643798828125, -0.390350341796875, -0.3603363037109375, -0.330322265625, -0.3003082275390625, -0.270294189453125, -0.2402801513671875, -0.21026611328125, -0.1802520751953125, -0.150238037109375, -0.1202239990234375, -0.0902099609375, -0.0601959228515625, -0.030181884765625, -0.0001678466796875, 0.02984619140625, 0.0598602294921875, 0.089874267578125, 0.1198883056640625, 0.14990234375, 0.1799163818359375, 0.209930419921875, 0.2399444580078125, 0.26995849609375, 0.2999725341796875, 0.329986572265625, 0.3600006103515625, 0.3900146484375, 0.4200286865234375, 0.450042724609375, 0.4800567626953125, 0.51007080078125, 0.5400848388671875, 0.570098876953125, 0.6001129150390625, 0.630126953125, 0.6601409912109375, 0.690155029296875, 0.7201690673828125, 0.75018310546875, 0.7801971435546875, 0.810211181640625, 0.8402252197265625, 0.8702392578125, 0.9002532958984375, 0.930267333984375, 0.9602813720703125, 0.99029541015625, 1.0203094482421875, 1.050323486328125, 1.0803375244140625, 1.1103515625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 10.0, 15.0, 23.0, 47.0, 85.0, 114.0, 144.0, 148.0, 140.0, 89.0, 65.0, 42.0, 37.0, 23.0, 4.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1929931640625, -0.1868610382080078, -0.18072891235351562, -0.17459678649902344, -0.16846466064453125, -0.16233253479003906, -0.15620040893554688, -0.1500682830810547, -0.1439361572265625, -0.1378040313720703, -0.13167190551757812, -0.12553977966308594, -0.11940765380859375, -0.11327552795410156, -0.10714340209960938, -0.10101127624511719, -0.094879150390625, -0.08874702453613281, -0.08261489868164062, -0.07648277282714844, -0.07035064697265625, -0.06421852111816406, -0.058086395263671875, -0.05195426940917969, -0.0458221435546875, -0.03969001770019531, -0.033557891845703125, -0.027425765991210938, -0.02129364013671875, -0.015161514282226562, -0.009029388427734375, -0.0028972625732421875, 0.00323486328125, 0.009366989135742188, 0.015499114990234375, 0.021631240844726562, 0.02776336669921875, 0.03389549255371094, 0.040027618408203125, 0.04615974426269531, 0.0522918701171875, 0.05842399597167969, 0.06455612182617188, 0.07068824768066406, 0.07682037353515625, 0.08295249938964844, 0.08908462524414062, 0.09521675109863281, 0.101348876953125, 0.10748100280761719, 0.11361312866210938, 0.11974525451660156, 0.12587738037109375, 0.13200950622558594, 0.13814163208007812, 0.1442737579345703, 0.1504058837890625, 0.1565380096435547, 0.16267013549804688, 0.16880226135253906, 0.17493438720703125, 0.18106651306152344, 0.18719863891601562, 0.1933307647705078, 0.199462890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 7.0, 1.0, 10.0, 17.0, 48.0, 98.0, 138.0, 277.0, 515.0, 1181.0, 2754.0, 7313.0, 26449.0, 171597.0, 3543986.0, 381241.0, 41760.0, 10384.0, 3576.0, 1457.0, 675.0, 337.0, 187.0, 110.0, 70.0, 35.0, 19.0, 19.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.352783203125, -0.34088134765625, -0.3289794921875, -0.31707763671875, -0.30517578125, -0.29327392578125, -0.2813720703125, -0.26947021484375, -0.257568359375, -0.24566650390625, -0.2337646484375, -0.22186279296875, -0.2099609375, -0.19805908203125, -0.1861572265625, -0.17425537109375, -0.162353515625, -0.15045166015625, -0.1385498046875, -0.12664794921875, -0.11474609375, -0.10284423828125, -0.0909423828125, -0.07904052734375, -0.067138671875, -0.05523681640625, -0.0433349609375, -0.03143310546875, -0.01953125, -0.00762939453125, 0.0042724609375, 0.01617431640625, 0.028076171875, 0.03997802734375, 0.0518798828125, 0.06378173828125, 0.07568359375, 0.08758544921875, 0.0994873046875, 0.11138916015625, 0.123291015625, 0.13519287109375, 0.1470947265625, 0.15899658203125, 0.1708984375, 0.18280029296875, 0.1947021484375, 0.20660400390625, 0.218505859375, 0.23040771484375, 0.2423095703125, 0.25421142578125, 0.26611328125, 0.27801513671875, 0.2899169921875, 0.30181884765625, 0.313720703125, 0.32562255859375, 0.3375244140625, 0.34942626953125, 0.361328125, 0.37322998046875, 0.3851318359375, 0.39703369140625, 0.408935546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 5.0, 15.0, 14.0, 36.0, 34.0, 75.0, 155.0, 311.0, 887.0, 1537.0, 494.0, 199.0, 104.0, 50.0, 38.0, 41.0, 19.0, 15.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136474609375, -0.13083839416503906, -0.12520217895507812, -0.11956596374511719, -0.11392974853515625, -0.10829353332519531, -0.10265731811523438, -0.09702110290527344, -0.0913848876953125, -0.08574867248535156, -0.08011245727539062, -0.07447624206542969, -0.06884002685546875, -0.06320381164550781, -0.057567596435546875, -0.05193138122558594, -0.046295166015625, -0.04065895080566406, -0.035022735595703125, -0.029386520385742188, -0.02375030517578125, -0.018114089965820312, -0.012477874755859375, -0.0068416595458984375, -0.0012054443359375, 0.0044307708740234375, 0.010066986083984375, 0.015703201293945312, 0.02133941650390625, 0.026975631713867188, 0.032611846923828125, 0.03824806213378906, 0.04388427734375, 0.04952049255371094, 0.055156707763671875, 0.06079292297363281, 0.06642913818359375, 0.07206535339355469, 0.07770156860351562, 0.08333778381347656, 0.0889739990234375, 0.09461021423339844, 0.10024642944335938, 0.10588264465332031, 0.11151885986328125, 0.11715507507324219, 0.12279129028320312, 0.12842750549316406, 0.134063720703125, 0.13969993591308594, 0.14533615112304688, 0.1509723663330078, 0.15660858154296875, 0.1622447967529297, 0.16788101196289062, 0.17351722717285156, 0.1791534423828125, 0.18478965759277344, 0.19042587280273438, 0.1960620880126953, 0.20169830322265625, 0.2073345184326172, 0.21297073364257812, 0.21860694885253906, 0.2242431640625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 28.0, 56.0, 147.0, 249.0, 244.0, 167.0, 68.0, 19.0, 14.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9786741733551025, -0.9270185232162476, -0.8753628730773926, -0.8237072229385376, -0.7720515727996826, -0.7203959226608276, -0.6687402725219727, -0.6170846223831177, -0.5654289722442627, -0.5137733221054077, -0.46211767196655273, -0.41046202182769775, -0.3588063716888428, -0.3071507513523102, -0.2554951012134552, -0.20383945107460022, -0.15218383073806763, -0.10052818059921265, -0.04887253791093826, 0.0027831047773361206, 0.0544387549161911, 0.10609439015388489, 0.15775004029273987, 0.20940569043159485, 0.26106134057044983, 0.3127169907093048, 0.3643726408481598, 0.4160282611846924, 0.46768391132354736, 0.5193395614624023, 0.5709952116012573, 0.6226508617401123, 0.6743065118789673, 0.7259621620178223, 0.7776178121566772, 0.8292734622955322, 0.8809291124343872, 0.9325847625732422, 0.9842404127120972, 1.0358960628509521, 1.0875517129898071, 1.139207363128662, 1.190863013267517, 1.242518663406372, 1.294174313545227, 1.345829963684082, 1.397485613822937, 1.449141263961792, 1.5007967948913574, 1.5524524450302124, 1.6041080951690674, 1.6557637453079224, 1.7074193954467773, 1.7590750455856323, 1.8107306957244873, 1.8623863458633423, 1.9140419960021973, 1.9656976461410522, 2.0173532962799072, 2.0690088272094727, 2.120664596557617, 2.1723201274871826, 2.223975896835327, 2.2756314277648926, 2.327287197113037]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 9.0, 11.0, 24.0, 24.0, 34.0, 34.0, 34.0, 49.0, 64.0, 72.0, 65.0, 78.0, 59.0, 62.0, 61.0, 73.0, 49.0, 45.0, 33.0, 26.0, 32.0, 13.0, 11.0, 8.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.8303853869438171, -0.8079603314399719, -0.7855352759361267, -0.7631101608276367, -0.7406851053237915, -0.7182600498199463, -0.6958349943161011, -0.6734099388122559, -0.6509848833084106, -0.6285598278045654, -0.6061347723007202, -0.583709716796875, -0.561284601688385, -0.5388595461845398, -0.5164344906806946, -0.49400943517684937, -0.4715843200683594, -0.44915926456451416, -0.42673417925834656, -0.40430912375450134, -0.38188403844833374, -0.3594589829444885, -0.3370339274406433, -0.3146088719367981, -0.2921837866306305, -0.2697587311267853, -0.24733364582061768, -0.22490859031677246, -0.20248351991176605, -0.18005844950675964, -0.15763339400291443, -0.13520832359790802, -0.11278319358825684, -0.09035812318325043, -0.06793306022882462, -0.045507997274398804, -0.023082926869392395, -0.0006578564643859863, 0.02176719903945923, 0.04419226944446564, 0.06661733984947205, 0.08904241025447845, 0.11146747320890427, 0.13389253616333008, 0.1563176065683365, 0.1787426769733429, 0.2011677324771881, 0.22359280288219452, 0.24601787328720093, 0.26844292879104614, 0.29086801409721375, 0.31329306960105896, 0.33571815490722656, 0.3581432104110718, 0.380568265914917, 0.4029933214187622, 0.4254184067249298, 0.447843462228775, 0.4702685475349426, 0.49269360303878784, 0.5151186585426331, 0.537543773651123, 0.5599688291549683, 0.5823938846588135, 0.6048189401626587]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 7.0, 8.0, 17.0, 25.0, 43.0, 50.0, 65.0, 118.0, 169.0, 231.0, 460.0, 792.0, 1561.0, 3323.0, 8983.0, 37737.0, 256102.0, 593411.0, 114300.0, 20015.0, 6049.0, 2376.0, 1141.0, 602.0, 317.0, 216.0, 130.0, 91.0, 64.0, 37.0, 42.0, 21.0, 15.0, 8.0, 2.0, 2.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.60546875, -0.5867233276367188, -0.5679779052734375, -0.5492324829101562, -0.530487060546875, -0.5117416381835938, -0.4929962158203125, -0.47425079345703125, -0.45550537109375, -0.43675994873046875, -0.4180145263671875, -0.39926910400390625, -0.380523681640625, -0.36177825927734375, -0.3430328369140625, -0.32428741455078125, -0.3055419921875, -0.28679656982421875, -0.2680511474609375, -0.24930572509765625, -0.230560302734375, -0.21181488037109375, -0.1930694580078125, -0.17432403564453125, -0.15557861328125, -0.13683319091796875, -0.1180877685546875, -0.09934234619140625, -0.080596923828125, -0.06185150146484375, -0.0431060791015625, -0.02436065673828125, -0.005615234375, 0.01313018798828125, 0.0318756103515625, 0.05062103271484375, 0.069366455078125, 0.08811187744140625, 0.1068572998046875, 0.12560272216796875, 0.14434814453125, 0.16309356689453125, 0.1818389892578125, 0.20058441162109375, 0.219329833984375, 0.23807525634765625, 0.2568206787109375, 0.27556610107421875, 0.2943115234375, 0.31305694580078125, 0.3318023681640625, 0.35054779052734375, 0.369293212890625, 0.38803863525390625, 0.4067840576171875, 0.42552947998046875, 0.44427490234375, 0.46302032470703125, 0.4817657470703125, 0.5005111694335938, 0.519256591796875, 0.5380020141601562, 0.5567474365234375, 0.5754928588867188, 0.59423828125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 14.0, 25.0, 39.0, 82.0, 125.0, 126.0, 147.0, 132.0, 117.0, 70.0, 45.0, 33.0, 17.0, 11.0, 5.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.195556640625, -0.1891632080078125, -0.182769775390625, -0.1763763427734375, -0.16998291015625, -0.1635894775390625, -0.157196044921875, -0.1508026123046875, -0.1444091796875, -0.1380157470703125, -0.131622314453125, -0.1252288818359375, -0.11883544921875, -0.1124420166015625, -0.106048583984375, -0.0996551513671875, -0.09326171875, -0.0868682861328125, -0.080474853515625, -0.0740814208984375, -0.06768798828125, -0.0612945556640625, -0.054901123046875, -0.0485076904296875, -0.0421142578125, -0.0357208251953125, -0.029327392578125, -0.0229339599609375, -0.01654052734375, -0.0101470947265625, -0.003753662109375, 0.0026397705078125, 0.009033203125, 0.0154266357421875, 0.021820068359375, 0.0282135009765625, 0.03460693359375, 0.0410003662109375, 0.047393798828125, 0.0537872314453125, 0.0601806640625, 0.0665740966796875, 0.072967529296875, 0.0793609619140625, 0.08575439453125, 0.0921478271484375, 0.098541259765625, 0.1049346923828125, 0.111328125, 0.1177215576171875, 0.124114990234375, 0.1305084228515625, 0.13690185546875, 0.1432952880859375, 0.149688720703125, 0.1560821533203125, 0.1624755859375, 0.1688690185546875, 0.175262451171875, 0.1816558837890625, 0.18804931640625, 0.1944427490234375, 0.200836181640625, 0.2072296142578125, 0.213623046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 9.0, 15.0, 14.0, 14.0, 22.0, 20.0, 42.0, 59.0, 69.0, 150.0, 229.0, 469.0, 1054.0, 3147.0, 11605.0, 57202.0, 317503.0, 511239.0, 115845.0, 21520.0, 5178.0, 1599.0, 674.0, 315.0, 150.0, 111.0, 81.0, 43.0, 46.0, 24.0, 23.0, 21.0, 9.0, 19.0, 8.0, 8.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.46875, -0.454193115234375, -0.43963623046875, -0.425079345703125, -0.4105224609375, -0.395965576171875, -0.38140869140625, -0.366851806640625, -0.352294921875, -0.337738037109375, -0.32318115234375, -0.308624267578125, -0.2940673828125, -0.279510498046875, -0.26495361328125, -0.250396728515625, -0.23583984375, -0.221282958984375, -0.20672607421875, -0.192169189453125, -0.1776123046875, -0.163055419921875, -0.14849853515625, -0.133941650390625, -0.119384765625, -0.104827880859375, -0.09027099609375, -0.075714111328125, -0.0611572265625, -0.046600341796875, -0.03204345703125, -0.017486572265625, -0.0029296875, 0.011627197265625, 0.02618408203125, 0.040740966796875, 0.0552978515625, 0.069854736328125, 0.08441162109375, 0.098968505859375, 0.113525390625, 0.128082275390625, 0.14263916015625, 0.157196044921875, 0.1717529296875, 0.186309814453125, 0.20086669921875, 0.215423583984375, 0.22998046875, 0.244537353515625, 0.25909423828125, 0.273651123046875, 0.2882080078125, 0.302764892578125, 0.31732177734375, 0.331878662109375, 0.346435546875, 0.360992431640625, 0.37554931640625, 0.390106201171875, 0.4046630859375, 0.419219970703125, 0.43377685546875, 0.448333740234375, 0.462890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 11.0, 6.0, 10.0, 10.0, 18.0, 24.0, 22.0, 30.0, 14.0, 35.0, 40.0, 50.0, 45.0, 48.0, 46.0, 57.0, 48.0, 51.0, 54.0, 53.0, 35.0, 34.0, 35.0, 36.0, 27.0, 23.0, 21.0, 18.0, 18.0, 9.0, 13.0, 14.0, 10.0, 6.0, 3.0, 5.0, 3.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.37451171875, -0.36356353759765625, -0.3526153564453125, -0.34166717529296875, -0.330718994140625, -0.31977081298828125, -0.3088226318359375, -0.29787445068359375, -0.28692626953125, -0.27597808837890625, -0.2650299072265625, -0.25408172607421875, -0.243133544921875, -0.23218536376953125, -0.2212371826171875, -0.21028900146484375, -0.1993408203125, -0.18839263916015625, -0.1774444580078125, -0.16649627685546875, -0.155548095703125, -0.14459991455078125, -0.1336517333984375, -0.12270355224609375, -0.11175537109375, -0.10080718994140625, -0.0898590087890625, -0.07891082763671875, -0.067962646484375, -0.05701446533203125, -0.0460662841796875, -0.03511810302734375, -0.024169921875, -0.01322174072265625, -0.0022735595703125, 0.00867462158203125, 0.019622802734375, 0.03057098388671875, 0.0415191650390625, 0.05246734619140625, 0.06341552734375, 0.07436370849609375, 0.0853118896484375, 0.09626007080078125, 0.107208251953125, 0.11815643310546875, 0.1291046142578125, 0.14005279541015625, 0.1510009765625, 0.16194915771484375, 0.1728973388671875, 0.18384552001953125, 0.194793701171875, 0.20574188232421875, 0.2166900634765625, 0.22763824462890625, 0.23858642578125, 0.24953460693359375, 0.2604827880859375, 0.27143096923828125, 0.282379150390625, 0.29332733154296875, 0.3042755126953125, 0.31522369384765625, 0.326171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 25.0, 68.0, 161.0, 700.0, 10872.0, 1032106.0, 4003.0, 424.0, 115.0, 41.0, 14.0, 13.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.55859375, -1.50164794921875, -1.4447021484375, -1.38775634765625, -1.330810546875, -1.27386474609375, -1.2169189453125, -1.15997314453125, -1.10302734375, -1.04608154296875, -0.9891357421875, -0.93218994140625, -0.875244140625, -0.81829833984375, -0.7613525390625, -0.70440673828125, -0.6474609375, -0.59051513671875, -0.5335693359375, -0.47662353515625, -0.419677734375, -0.36273193359375, -0.3057861328125, -0.24884033203125, -0.19189453125, -0.13494873046875, -0.0780029296875, -0.02105712890625, 0.035888671875, 0.09283447265625, 0.1497802734375, 0.20672607421875, 0.263671875, 0.32061767578125, 0.3775634765625, 0.43450927734375, 0.491455078125, 0.54840087890625, 0.6053466796875, 0.66229248046875, 0.71923828125, 0.77618408203125, 0.8331298828125, 0.89007568359375, 0.947021484375, 1.00396728515625, 1.0609130859375, 1.11785888671875, 1.1748046875, 1.23175048828125, 1.2886962890625, 1.34564208984375, 1.402587890625, 1.45953369140625, 1.5164794921875, 1.57342529296875, 1.63037109375, 1.68731689453125, 1.7442626953125, 1.80120849609375, 1.858154296875, 1.91510009765625, 1.9720458984375, 2.02899169921875, 2.0859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 11.0, 15.0, 17.0, 43.0, 69.0, 141.0, 263.0, 222.0, 94.0, 52.0, 28.0, 19.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000244140625, -0.00023428350687026978, -0.00022442638874053955, -0.00021456927061080933, -0.0002047121524810791, -0.00019485503435134888, -0.00018499791622161865, -0.00017514079809188843, -0.0001652836799621582, -0.00015542656183242798, -0.00014556944370269775, -0.00013571232557296753, -0.0001258552074432373, -0.00011599808931350708, -0.00010614097118377686, -9.628385305404663e-05, -8.64267349243164e-05, -7.656961679458618e-05, -6.671249866485596e-05, -5.685538053512573e-05, -4.699826240539551e-05, -3.714114427566528e-05, -2.728402614593506e-05, -1.7426908016204834e-05, -7.569789886474609e-06, 2.2873282432556152e-06, 1.214444637298584e-05, 2.2001564502716064e-05, 3.185868263244629e-05, 4.1715800762176514e-05, 5.157291889190674e-05, 6.143003702163696e-05, 7.128715515136719e-05, 8.114427328109741e-05, 9.100139141082764e-05, 0.00010085850954055786, 0.00011071562767028809, 0.00012057274580001831, 0.00013042986392974854, 0.00014028698205947876, 0.00015014410018920898, 0.0001600012183189392, 0.00016985833644866943, 0.00017971545457839966, 0.00018957257270812988, 0.0001994296908378601, 0.00020928680896759033, 0.00021914392709732056, 0.00022900104522705078, 0.000238858163356781, 0.00024871528148651123, 0.00025857239961624146, 0.0002684295177459717, 0.0002782866358757019, 0.00028814375400543213, 0.00029800087213516235, 0.0003078579902648926, 0.0003177151083946228, 0.00032757222652435303, 0.00033742934465408325, 0.0003472864627838135, 0.0003571435809135437, 0.0003670006990432739, 0.00037685781717300415, 0.0003867149353027344]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 10.0, 22.0, 30.0, 61.0, 121.0, 216.0, 480.0, 2249.0, 106633.0, 933783.0, 3766.0, 654.0, 243.0, 129.0, 71.0, 39.0, 25.0, 12.0, 8.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.28125, -1.241363525390625, -1.20147705078125, -1.161590576171875, -1.1217041015625, -1.081817626953125, -1.04193115234375, -1.002044677734375, -0.962158203125, -0.922271728515625, -0.88238525390625, -0.842498779296875, -0.8026123046875, -0.762725830078125, -0.72283935546875, -0.682952880859375, -0.64306640625, -0.603179931640625, -0.56329345703125, -0.523406982421875, -0.4835205078125, -0.443634033203125, -0.40374755859375, -0.363861083984375, -0.323974609375, -0.284088134765625, -0.24420166015625, -0.204315185546875, -0.1644287109375, -0.124542236328125, -0.08465576171875, -0.044769287109375, -0.0048828125, 0.035003662109375, 0.07489013671875, 0.114776611328125, 0.1546630859375, 0.194549560546875, 0.23443603515625, 0.274322509765625, 0.314208984375, 0.354095458984375, 0.39398193359375, 0.433868408203125, 0.4737548828125, 0.513641357421875, 0.55352783203125, 0.593414306640625, 0.63330078125, 0.673187255859375, 0.71307373046875, 0.752960205078125, 0.7928466796875, 0.832733154296875, 0.87261962890625, 0.912506103515625, 0.952392578125, 0.992279052734375, 1.03216552734375, 1.072052001953125, 1.1119384765625, 1.151824951171875, 1.19171142578125, 1.231597900390625, 1.271484375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 15.0, 63.0, 374.0, 424.0, 99.0, 18.0, 9.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1015625, -1.068267822265625, -1.03497314453125, -1.001678466796875, -0.9683837890625, -0.935089111328125, -0.90179443359375, -0.868499755859375, -0.835205078125, -0.801910400390625, -0.76861572265625, -0.735321044921875, -0.7020263671875, -0.668731689453125, -0.63543701171875, -0.602142333984375, -0.56884765625, -0.535552978515625, -0.50225830078125, -0.468963623046875, -0.4356689453125, -0.402374267578125, -0.36907958984375, -0.335784912109375, -0.302490234375, -0.269195556640625, -0.23590087890625, -0.202606201171875, -0.1693115234375, -0.136016845703125, -0.10272216796875, -0.069427490234375, -0.0361328125, -0.002838134765625, 0.03045654296875, 0.063751220703125, 0.0970458984375, 0.130340576171875, 0.16363525390625, 0.196929931640625, 0.230224609375, 0.263519287109375, 0.29681396484375, 0.330108642578125, 0.3634033203125, 0.396697998046875, 0.42999267578125, 0.463287353515625, 0.49658203125, 0.529876708984375, 0.56317138671875, 0.596466064453125, 0.6297607421875, 0.663055419921875, 0.69635009765625, 0.729644775390625, 0.762939453125, 0.796234130859375, 0.82952880859375, 0.862823486328125, 0.8961181640625, 0.929412841796875, 0.96270751953125, 0.996002197265625, 1.029296875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 43.0, 314.0, 498.0, 121.0, 20.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-22.58203125, -22.140111923217773, -21.698190689086914, -21.256271362304688, -20.814350128173828, -20.3724308013916, -19.930509567260742, -19.488590240478516, -19.046669006347656, -18.60474967956543, -18.16282844543457, -17.720909118652344, -17.278987884521484, -16.837068557739258, -16.3951473236084, -15.953227996826172, -15.511308670043945, -15.069388389587402, -14.62746810913086, -14.185547828674316, -13.743627548217773, -13.301708221435547, -12.859786987304688, -12.417867660522461, -11.975946426391602, -11.534026145935059, -11.092105865478516, -10.650185585021973, -10.20826530456543, -9.766345977783203, -9.324424743652344, -8.882505416870117, -8.440584182739258, -7.998663902282715, -7.556743621826172, -7.114823341369629, -6.672903537750244, -6.230983257293701, -5.789062976837158, -5.347143173217773, -4.9052228927612305, -4.4633026123046875, -4.0213823318481445, -3.5794622898101807, -3.137542247772217, -2.695621967315674, -2.253701686859131, -1.811781644821167, -1.3698616027832031, -0.9279414415359497, -0.4860212206840515, -0.04410099983215332, 0.3978191614151001, 0.8397393226623535, 1.2816596031188965, 1.7235796451568604, 2.1654999256134033, 2.6074202060699463, 3.04934024810791, 3.491260528564453, 3.933180809020996, 4.375101089477539, 4.817021369934082, 5.258941173553467, 5.70086145401001]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 12.0, 3.0, 7.0, 14.0, 22.0, 18.0, 29.0, 19.0, 31.0, 31.0, 47.0, 37.0, 47.0, 48.0, 37.0, 49.0, 48.0, 61.0, 53.0, 47.0, 44.0, 52.0, 31.0, 32.0, 26.0, 26.0, 23.0, 32.0, 12.0, 11.0, 11.0, 3.0, 7.0, 11.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.638761520385742, -2.5725622177124023, -2.5063629150390625, -2.4401638507843018, -2.373964548110962, -2.307765245437622, -2.2415659427642822, -2.1753666400909424, -2.1091675758361816, -2.042968273162842, -1.9767690896987915, -1.9105697870254517, -1.8443706035614014, -1.7781713008880615, -1.7119719982147217, -1.6457726955413818, -1.579573392868042, -1.5133740901947021, -1.4471749067306519, -1.380975604057312, -1.3147764205932617, -1.2485771179199219, -1.182377815246582, -1.1161785125732422, -1.049979329109192, -0.9837800860404968, -0.9175808429718018, -0.8513815402984619, -0.7851822972297668, -0.7189830541610718, -0.6527837514877319, -0.5865845084190369, -0.5203855037689209, -0.45418626070022583, -0.3879869878292084, -0.3217877149581909, -0.25558847188949585, -0.18938922882080078, -0.12318995594978333, -0.05699068307876587, 0.0092085599899292, 0.07540781795978546, 0.14160707592964172, 0.20780633389949799, 0.27400559186935425, 0.3402048349380493, 0.4064041078090668, 0.47260338068008423, 0.5388026237487793, 0.6050018668174744, 0.6712011098861694, 0.7374004125595093, 0.8035996556282043, 0.8697988986968994, 0.9359982013702393, 1.002197504043579, 1.0683966875076294, 1.1345959901809692, 1.2007951736450195, 1.2669944763183594, 1.3331937789916992, 1.3993929624557495, 1.4655922651290894, 1.5317914485931396, 1.5979907512664795]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 3.0, 7.0, 5.0, 12.0, 13.0, 21.0, 18.0, 28.0, 28.0, 39.0, 73.0, 80.0, 128.0, 173.0, 313.0, 514.0, 1040.0, 2297.0, 5985.0, 19137.0, 107879.0, 3781946.0, 230589.0, 29212.0, 8202.0, 3195.0, 1428.0, 692.0, 398.0, 220.0, 171.0, 117.0, 83.0, 61.0, 42.0, 37.0, 28.0, 27.0, 9.0, 9.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.52685546875, -0.5116462707519531, -0.49643707275390625, -0.4812278747558594, -0.4660186767578125, -0.4508094787597656, -0.43560028076171875, -0.4203910827636719, -0.405181884765625, -0.3899726867675781, -0.37476348876953125, -0.3595542907714844, -0.3443450927734375, -0.3291358947753906, -0.31392669677734375, -0.2987174987792969, -0.28350830078125, -0.2682991027832031, -0.25308990478515625, -0.23788070678710938, -0.2226715087890625, -0.20746231079101562, -0.19225311279296875, -0.17704391479492188, -0.161834716796875, -0.14662551879882812, -0.13141632080078125, -0.11620712280273438, -0.1009979248046875, -0.08578872680664062, -0.07057952880859375, -0.055370330810546875, -0.0401611328125, -0.024951934814453125, -0.00974273681640625, 0.005466461181640625, 0.0206756591796875, 0.035884857177734375, 0.05109405517578125, 0.06630325317382812, 0.081512451171875, 0.09672164916992188, 0.11193084716796875, 0.12714004516601562, 0.1423492431640625, 0.15755844116210938, 0.17276763916015625, 0.18797683715820312, 0.20318603515625, 0.21839523315429688, 0.23360443115234375, 0.24881362915039062, 0.2640228271484375, 0.2792320251464844, 0.29444122314453125, 0.3096504211425781, 0.324859619140625, 0.3400688171386719, 0.35527801513671875, 0.3704872131347656, 0.3856964111328125, 0.4009056091308594, 0.41611480712890625, 0.4313240051269531, 0.446533203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 6.0, 18.0, 42.0, 47.0, 87.0, 127.0, 132.0, 132.0, 112.0, 87.0, 72.0, 53.0, 30.0, 24.0, 12.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.20914649963378906, -0.20247268676757812, -0.1957988739013672, -0.18912506103515625, -0.1824512481689453, -0.17577743530273438, -0.16910362243652344, -0.1624298095703125, -0.15575599670410156, -0.14908218383789062, -0.1424083709716797, -0.13573455810546875, -0.1290607452392578, -0.12238693237304688, -0.11571311950683594, -0.109039306640625, -0.10236549377441406, -0.09569168090820312, -0.08901786804199219, -0.08234405517578125, -0.07567024230957031, -0.06899642944335938, -0.06232261657714844, -0.0556488037109375, -0.04897499084472656, -0.042301177978515625, -0.03562736511230469, -0.02895355224609375, -0.022279739379882812, -0.015605926513671875, -0.008932113647460938, -0.00225830078125, 0.0044155120849609375, 0.011089324951171875, 0.017763137817382812, 0.02443695068359375, 0.031110763549804688, 0.037784576416015625, 0.04445838928222656, 0.0511322021484375, 0.05780601501464844, 0.06447982788085938, 0.07115364074707031, 0.07782745361328125, 0.08450126647949219, 0.09117507934570312, 0.09784889221191406, 0.104522705078125, 0.11119651794433594, 0.11787033081054688, 0.12454414367675781, 0.13121795654296875, 0.1378917694091797, 0.14456558227539062, 0.15123939514160156, 0.1579132080078125, 0.16458702087402344, 0.17126083374023438, 0.1779346466064453, 0.18460845947265625, 0.1912822723388672, 0.19795608520507812, 0.20462989807128906, 0.2113037109375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 8.0, 16.0, 43.0, 58.0, 123.0, 252.0, 558.0, 1309.0, 3456.0, 11712.0, 65389.0, 3668535.0, 403704.0, 28658.0, 6591.0, 2176.0, 933.0, 407.0, 185.0, 70.0, 51.0, 21.0, 13.0, 8.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.349365234375, -0.3307762145996094, -0.31218719482421875, -0.2935981750488281, -0.2750091552734375, -0.2564201354980469, -0.23783111572265625, -0.21924209594726562, -0.200653076171875, -0.18206405639648438, -0.16347503662109375, -0.14488601684570312, -0.1262969970703125, -0.10770797729492188, -0.08911895751953125, -0.07052993774414062, -0.05194091796875, -0.033351898193359375, -0.01476287841796875, 0.003826141357421875, 0.0224151611328125, 0.041004180908203125, 0.05959320068359375, 0.07818222045898438, 0.096771240234375, 0.11536026000976562, 0.13394927978515625, 0.15253829956054688, 0.1711273193359375, 0.18971633911132812, 0.20830535888671875, 0.22689437866210938, 0.2454833984375, 0.2640724182128906, 0.28266143798828125, 0.3012504577636719, 0.3198394775390625, 0.3384284973144531, 0.35701751708984375, 0.3756065368652344, 0.394195556640625, 0.4127845764160156, 0.43137359619140625, 0.4499626159667969, 0.4685516357421875, 0.4871406555175781, 0.5057296752929688, 0.5243186950683594, 0.54290771484375, 0.5614967346191406, 0.5800857543945312, 0.5986747741699219, 0.6172637939453125, 0.6358528137207031, 0.6544418334960938, 0.6730308532714844, 0.691619873046875, 0.7102088928222656, 0.7287979125976562, 0.7473869323730469, 0.7659759521484375, 0.7845649719238281, 0.8031539916992188, 0.8217430114746094, 0.84033203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 4.0, 12.0, 8.0, 11.0, 16.0, 19.0, 29.0, 66.0, 76.0, 146.0, 317.0, 1304.0, 1388.0, 303.0, 142.0, 63.0, 55.0, 25.0, 17.0, 14.0, 12.0, 11.0, 5.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.158447265625, -0.15333938598632812, -0.14823150634765625, -0.14312362670898438, -0.1380157470703125, -0.13290786743164062, -0.12779998779296875, -0.12269210815429688, -0.117584228515625, -0.11247634887695312, -0.10736846923828125, -0.10226058959960938, -0.0971527099609375, -0.09204483032226562, -0.08693695068359375, -0.08182907104492188, -0.07672119140625, -0.07161331176757812, -0.06650543212890625, -0.061397552490234375, -0.0562896728515625, -0.051181793212890625, -0.04607391357421875, -0.040966033935546875, -0.035858154296875, -0.030750274658203125, -0.02564239501953125, -0.020534515380859375, -0.0154266357421875, -0.010318756103515625, -0.00521087646484375, -0.000102996826171875, 0.0050048828125, 0.010112762451171875, 0.01522064208984375, 0.020328521728515625, 0.0254364013671875, 0.030544281005859375, 0.03565216064453125, 0.040760040283203125, 0.045867919921875, 0.050975799560546875, 0.05608367919921875, 0.061191558837890625, 0.0662994384765625, 0.07140731811523438, 0.07651519775390625, 0.08162307739257812, 0.08673095703125, 0.09183883666992188, 0.09694671630859375, 0.10205459594726562, 0.1071624755859375, 0.11227035522460938, 0.11737823486328125, 0.12248611450195312, 0.127593994140625, 0.13270187377929688, 0.13780975341796875, 0.14291763305664062, 0.1480255126953125, 0.15313339233398438, 0.15824127197265625, 0.16334915161132812, 0.16845703125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 10.0, 35.0, 128.0, 288.0, 326.0, 153.0, 39.0, 19.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8991286754608154, -2.823695659637451, -2.748262882232666, -2.6728298664093018, -2.5973970890045166, -2.5219640731811523, -2.446531295776367, -2.371098279953003, -2.2956652641296387, -2.2202322483062744, -2.1447994709014893, -2.069366455078125, -1.9939335584640503, -1.9185006618499756, -1.8430677652359009, -1.7676348686218262, -1.6922019720077515, -1.6167690753936768, -1.541336178779602, -1.4659032821655273, -1.390470266342163, -1.3150373697280884, -1.2396044731140137, -1.1641714572906494, -1.0887386798858643, -1.0133057832717896, -0.9378728270530701, -0.8624399304389954, -0.7870069742202759, -0.7115740776062012, -0.6361411809921265, -0.560708224773407, -0.4852752685546875, -0.4098423421382904, -0.3344094157218933, -0.2589765191078186, -0.1835435926914215, -0.10811066627502441, -0.03267776966094971, 0.042755186557769775, 0.11818808317184448, 0.19362100958824158, 0.26905393600463867, 0.3444868326187134, 0.4199197590351105, 0.49535268545150757, 0.5707855820655823, 0.6462185382843018, 0.7216514348983765, 0.7970843315124512, 0.8725172877311707, 0.9479501843452454, 1.0233831405639648, 1.0988160371780396, 1.1742489337921143, 1.2496819496154785, 1.3251147270202637, 1.4005476236343384, 1.475980520248413, 1.5514135360717773, 1.626846432685852, 1.7022793292999268, 1.7777122259140015, 1.8531451225280762, 1.9285781383514404]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 11.0, 14.0, 7.0, 18.0, 14.0, 24.0, 24.0, 18.0, 46.0, 40.0, 54.0, 43.0, 59.0, 68.0, 62.0, 62.0, 60.0, 49.0, 51.0, 50.0, 33.0, 35.0, 23.0, 20.0, 22.0, 24.0, 22.0, 10.0, 14.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4988066554069519, -0.47856348752975464, -0.4583203196525574, -0.4380771517753601, -0.41783398389816284, -0.3975908160209656, -0.3773476183414459, -0.35710445046424866, -0.3368612825870514, -0.3166181147098541, -0.29637494683265686, -0.2761317789554596, -0.25588858127593994, -0.23564542829990387, -0.2154022455215454, -0.19515907764434814, -0.17491590976715088, -0.1546727418899536, -0.13442957401275635, -0.11418639123439789, -0.09394322335720062, -0.07370005548000336, -0.053456880152225494, -0.03321370482444763, -0.012970536947250366, 0.007272634655237198, 0.027515806257724762, 0.047758977860212326, 0.06800214946269989, 0.08824531733989716, 0.10848849266767502, 0.12873166799545288, 0.14897489547729492, 0.1692180633544922, 0.18946123123168945, 0.2097044140100479, 0.22994758188724518, 0.25019073486328125, 0.2704339325428009, 0.29067710041999817, 0.31092026829719543, 0.3311634361743927, 0.35140660405158997, 0.37164977192878723, 0.3918929696083069, 0.41213613748550415, 0.4323793053627014, 0.4526224732398987, 0.47286564111709595, 0.4931088089942932, 0.5133519768714905, 0.5335951447486877, 0.553838312625885, 0.5740814805030823, 0.5943246483802795, 0.6145678758621216, 0.6348110437393188, 0.6550542116165161, 0.6752973794937134, 0.6955405473709106, 0.7157837152481079, 0.7360268831253052, 0.7562700510025024, 0.7765132188796997, 0.796756386756897]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 13.0, 30.0, 51.0, 96.0, 164.0, 355.0, 694.0, 1662.0, 5166.0, 35752.0, 470136.0, 488842.0, 37080.0, 5377.0, 1653.0, 783.0, 336.0, 171.0, 85.0, 41.0, 24.0, 17.0, 15.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8505859375, -0.8240127563476562, -0.7974395751953125, -0.7708663940429688, -0.744293212890625, -0.7177200317382812, -0.6911468505859375, -0.6645736694335938, -0.63800048828125, -0.6114273071289062, -0.5848541259765625, -0.5582809448242188, -0.531707763671875, -0.5051345825195312, -0.4785614013671875, -0.45198822021484375, -0.4254150390625, -0.39884185791015625, -0.3722686767578125, -0.34569549560546875, -0.319122314453125, -0.29254913330078125, -0.2659759521484375, -0.23940277099609375, -0.21282958984375, -0.18625640869140625, -0.1596832275390625, -0.13311004638671875, -0.106536865234375, -0.07996368408203125, -0.0533905029296875, -0.02681732177734375, -0.000244140625, 0.02632904052734375, 0.0529022216796875, 0.07947540283203125, 0.106048583984375, 0.13262176513671875, 0.1591949462890625, 0.18576812744140625, 0.21234130859375, 0.23891448974609375, 0.2654876708984375, 0.29206085205078125, 0.318634033203125, 0.34520721435546875, 0.3717803955078125, 0.39835357666015625, 0.4249267578125, 0.45149993896484375, 0.4780731201171875, 0.5046463012695312, 0.531219482421875, 0.5577926635742188, 0.5843658447265625, 0.6109390258789062, 0.63751220703125, 0.6640853881835938, 0.6906585693359375, 0.7172317504882812, 0.743804931640625, 0.7703781127929688, 0.7969512939453125, 0.8235244750976562, 0.85009765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 16.0, 19.0, 61.0, 64.0, 91.0, 131.0, 131.0, 124.0, 118.0, 79.0, 61.0, 39.0, 27.0, 17.0, 10.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.213623046875, -0.2069263458251953, -0.20022964477539062, -0.19353294372558594, -0.18683624267578125, -0.18013954162597656, -0.17344284057617188, -0.1667461395263672, -0.1600494384765625, -0.1533527374267578, -0.14665603637695312, -0.13995933532714844, -0.13326263427734375, -0.12656593322753906, -0.11986923217773438, -0.11317253112792969, -0.106475830078125, -0.09977912902832031, -0.09308242797851562, -0.08638572692871094, -0.07968902587890625, -0.07299232482910156, -0.06629562377929688, -0.05959892272949219, -0.0529022216796875, -0.04620552062988281, -0.039508819580078125, -0.03281211853027344, -0.02611541748046875, -0.019418716430664062, -0.012722015380859375, -0.0060253143310546875, 0.00067138671875, 0.0073680877685546875, 0.014064788818359375, 0.020761489868164062, 0.02745819091796875, 0.03415489196777344, 0.040851593017578125, 0.04754829406738281, 0.0542449951171875, 0.06094169616699219, 0.06763839721679688, 0.07433509826660156, 0.08103179931640625, 0.08772850036621094, 0.09442520141601562, 0.10112190246582031, 0.107818603515625, 0.11451530456542969, 0.12121200561523438, 0.12790870666503906, 0.13460540771484375, 0.14130210876464844, 0.14799880981445312, 0.1546955108642578, 0.1613922119140625, 0.1680889129638672, 0.17478561401367188, 0.18148231506347656, 0.18817901611328125, 0.19487571716308594, 0.20157241821289062, 0.2082691192626953, 0.2149658203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 8.0, 17.0, 31.0, 33.0, 37.0, 56.0, 74.0, 119.0, 166.0, 381.0, 848.0, 2325.0, 8376.0, 34832.0, 162134.0, 508647.0, 256540.0, 55361.0, 12910.0, 3409.0, 1113.0, 442.0, 224.0, 129.0, 77.0, 55.0, 45.0, 29.0, 23.0, 36.0, 19.0, 9.0, 4.0, 8.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3720703125, -0.3590850830078125, -0.346099853515625, -0.3331146240234375, -0.32012939453125, -0.3071441650390625, -0.294158935546875, -0.2811737060546875, -0.2681884765625, -0.2552032470703125, -0.242218017578125, -0.2292327880859375, -0.21624755859375, -0.2032623291015625, -0.190277099609375, -0.1772918701171875, -0.164306640625, -0.1513214111328125, -0.138336181640625, -0.1253509521484375, -0.11236572265625, -0.0993804931640625, -0.086395263671875, -0.0734100341796875, -0.0604248046875, -0.0474395751953125, -0.034454345703125, -0.0214691162109375, -0.00848388671875, 0.0045013427734375, 0.017486572265625, 0.0304718017578125, 0.04345703125, 0.0564422607421875, 0.069427490234375, 0.0824127197265625, 0.09539794921875, 0.1083831787109375, 0.121368408203125, 0.1343536376953125, 0.1473388671875, 0.1603240966796875, 0.173309326171875, 0.1862945556640625, 0.19927978515625, 0.2122650146484375, 0.225250244140625, 0.2382354736328125, 0.251220703125, 0.2642059326171875, 0.277191162109375, 0.2901763916015625, 0.30316162109375, 0.3161468505859375, 0.329132080078125, 0.3421173095703125, 0.3551025390625, 0.3680877685546875, 0.381072998046875, 0.3940582275390625, 0.40704345703125, 0.4200286865234375, 0.433013916015625, 0.4459991455078125, 0.458984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 7.0, 4.0, 7.0, 4.0, 8.0, 8.0, 17.0, 21.0, 26.0, 23.0, 35.0, 25.0, 34.0, 34.0, 37.0, 39.0, 49.0, 35.0, 47.0, 35.0, 58.0, 37.0, 36.0, 36.0, 40.0, 28.0, 30.0, 27.0, 27.0, 35.0, 18.0, 17.0, 15.0, 17.0, 17.0, 8.0, 7.0, 5.0, 5.0, 6.0, 4.0, 6.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.3271484375, -0.3177528381347656, -0.30835723876953125, -0.2989616394042969, -0.2895660400390625, -0.2801704406738281, -0.27077484130859375, -0.2613792419433594, -0.251983642578125, -0.24258804321289062, -0.23319244384765625, -0.22379684448242188, -0.2144012451171875, -0.20500564575195312, -0.19561004638671875, -0.18621444702148438, -0.17681884765625, -0.16742324829101562, -0.15802764892578125, -0.14863204956054688, -0.1392364501953125, -0.12984085083007812, -0.12044525146484375, -0.11104965209960938, -0.101654052734375, -0.09225845336914062, -0.08286285400390625, -0.07346725463867188, -0.0640716552734375, -0.054676055908203125, -0.04528045654296875, -0.035884857177734375, -0.0264892578125, -0.017093658447265625, -0.00769805908203125, 0.001697540283203125, 0.0110931396484375, 0.020488739013671875, 0.02988433837890625, 0.039279937744140625, 0.048675537109375, 0.058071136474609375, 0.06746673583984375, 0.07686233520507812, 0.0862579345703125, 0.09565353393554688, 0.10504913330078125, 0.11444473266601562, 0.12384033203125, 0.13323593139648438, 0.14263153076171875, 0.15202713012695312, 0.1614227294921875, 0.17081832885742188, 0.18021392822265625, 0.18960952758789062, 0.199005126953125, 0.20840072631835938, 0.21779632568359375, 0.22719192504882812, 0.2365875244140625, 0.24598312377929688, 0.25537872314453125, 0.2647743225097656, 0.274169921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 2.0, 2.0, 8.0, 16.0, 14.0, 15.0, 35.0, 64.0, 128.0, 229.0, 514.0, 1166.0, 2940.0, 7705.0, 22952.0, 83436.0, 496849.0, 341062.0, 62661.0, 18326.0, 6147.0, 2404.0, 1029.0, 405.0, 209.0, 100.0, 43.0, 26.0, 15.0, 20.0, 10.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1800537109375, -0.17530250549316406, -0.17055130004882812, -0.1658000946044922, -0.16104888916015625, -0.1562976837158203, -0.15154647827148438, -0.14679527282714844, -0.1420440673828125, -0.13729286193847656, -0.13254165649414062, -0.1277904510498047, -0.12303924560546875, -0.11828804016113281, -0.11353683471679688, -0.10878562927246094, -0.104034423828125, -0.09928321838378906, -0.09453201293945312, -0.08978080749511719, -0.08502960205078125, -0.08027839660644531, -0.07552719116210938, -0.07077598571777344, -0.0660247802734375, -0.06127357482910156, -0.056522369384765625, -0.05177116394042969, -0.04701995849609375, -0.04226875305175781, -0.037517547607421875, -0.03276634216308594, -0.02801513671875, -0.023263931274414062, -0.018512725830078125, -0.013761520385742188, -0.00901031494140625, -0.0042591094970703125, 0.000492095947265625, 0.0052433013916015625, 0.0099945068359375, 0.014745712280273438, 0.019496917724609375, 0.024248123168945312, 0.02899932861328125, 0.03375053405761719, 0.038501739501953125, 0.04325294494628906, 0.048004150390625, 0.05275535583496094, 0.057506561279296875, 0.06225776672363281, 0.06700897216796875, 0.07176017761230469, 0.07651138305664062, 0.08126258850097656, 0.0860137939453125, 0.09076499938964844, 0.09551620483398438, 0.10026741027832031, 0.10501861572265625, 0.10976982116699219, 0.11452102661132812, 0.11927223205566406, 0.1240234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 9.0, 11.0, 9.0, 9.0, 14.0, 11.0, 13.0, 20.0, 32.0, 37.0, 36.0, 39.0, 57.0, 89.0, 107.0, 120.0, 73.0, 54.0, 51.0, 34.0, 27.0, 25.0, 12.0, 13.0, 9.0, 15.0, 19.0, 7.0, 10.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00016450881958007812, -0.00015978701412677765, -0.00015506520867347717, -0.0001503434032201767, -0.00014562159776687622, -0.00014089979231357574, -0.00013617798686027527, -0.0001314561814069748, -0.00012673437595367432, -0.00012201257050037384, -0.00011729076504707336, -0.00011256895959377289, -0.00010784715414047241, -0.00010312534868717194, -9.840354323387146e-05, -9.368173778057098e-05, -8.895993232727051e-05, -8.423812687397003e-05, -7.951632142066956e-05, -7.479451596736908e-05, -7.00727105140686e-05, -6.535090506076813e-05, -6.062909960746765e-05, -5.5907294154167175e-05, -5.11854887008667e-05, -4.646368324756622e-05, -4.174187779426575e-05, -3.702007234096527e-05, -3.2298266887664795e-05, -2.757646143436432e-05, -2.2854655981063843e-05, -1.8132850527763367e-05, -1.341104507446289e-05, -8.689239621162415e-06, -3.9674341678619385e-06, 7.543712854385376e-07, 5.476176738739014e-06, 1.019798219203949e-05, 1.4919787645339966e-05, 1.9641593098640442e-05, 2.4363398551940918e-05, 2.9085204005241394e-05, 3.380700945854187e-05, 3.8528814911842346e-05, 4.325062036514282e-05, 4.79724258184433e-05, 5.2694231271743774e-05, 5.741603672504425e-05, 6.213784217834473e-05, 6.68596476316452e-05, 7.158145308494568e-05, 7.630325853824615e-05, 8.102506399154663e-05, 8.574686944484711e-05, 9.046867489814758e-05, 9.519048035144806e-05, 9.991228580474854e-05, 0.00010463409125804901, 0.00010935589671134949, 0.00011407770216464996, 0.00011879950761795044, 0.00012352131307125092, 0.0001282431185245514, 0.00013296492397785187, 0.00013768672943115234]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 11.0, 9.0, 15.0, 17.0, 26.0, 46.0, 78.0, 125.0, 235.0, 433.0, 1039.0, 2738.0, 8811.0, 37405.0, 318717.0, 605406.0, 55273.0, 12177.0, 3556.0, 1279.0, 550.0, 238.0, 124.0, 73.0, 38.0, 35.0, 29.0, 13.0, 14.0, 9.0, 10.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1861572265625, -0.1797637939453125, -0.173370361328125, -0.1669769287109375, -0.16058349609375, -0.1541900634765625, -0.147796630859375, -0.1414031982421875, -0.135009765625, -0.1286163330078125, -0.122222900390625, -0.1158294677734375, -0.10943603515625, -0.1030426025390625, -0.096649169921875, -0.0902557373046875, -0.0838623046875, -0.0774688720703125, -0.071075439453125, -0.0646820068359375, -0.05828857421875, -0.0518951416015625, -0.045501708984375, -0.0391082763671875, -0.03271484375, -0.0263214111328125, -0.019927978515625, -0.0135345458984375, -0.00714111328125, -0.0007476806640625, 0.005645751953125, 0.0120391845703125, 0.0184326171875, 0.0248260498046875, 0.031219482421875, 0.0376129150390625, 0.04400634765625, 0.0503997802734375, 0.056793212890625, 0.0631866455078125, 0.069580078125, 0.0759735107421875, 0.082366943359375, 0.0887603759765625, 0.09515380859375, 0.1015472412109375, 0.107940673828125, 0.1143341064453125, 0.1207275390625, 0.1271209716796875, 0.133514404296875, 0.1399078369140625, 0.14630126953125, 0.1526947021484375, 0.159088134765625, 0.1654815673828125, 0.171875, 0.1782684326171875, 0.184661865234375, 0.1910552978515625, 0.19744873046875, 0.2038421630859375, 0.210235595703125, 0.2166290283203125, 0.2230224609375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 9.0, 7.0, 5.0, 8.0, 13.0, 17.0, 27.0, 22.0, 34.0, 53.0, 50.0, 112.0, 159.0, 128.0, 97.0, 63.0, 40.0, 28.0, 24.0, 22.0, 14.0, 8.0, 11.0, 8.0, 3.0, 10.0, 2.0, 2.0, 6.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1153564453125, -0.11072349548339844, -0.10609054565429688, -0.10145759582519531, -0.09682464599609375, -0.09219169616699219, -0.08755874633789062, -0.08292579650878906, -0.0782928466796875, -0.07365989685058594, -0.06902694702148438, -0.06439399719238281, -0.05976104736328125, -0.05512809753417969, -0.050495147705078125, -0.04586219787597656, -0.041229248046875, -0.03659629821777344, -0.031963348388671875, -0.027330398559570312, -0.02269744873046875, -0.018064498901367188, -0.013431549072265625, -0.008798599243164062, -0.0041656494140625, 0.0004673004150390625, 0.005100250244140625, 0.009733200073242188, 0.01436614990234375, 0.018999099731445312, 0.023632049560546875, 0.028264999389648438, 0.03289794921875, 0.03753089904785156, 0.042163848876953125, 0.04679679870605469, 0.05142974853515625, 0.05606269836425781, 0.060695648193359375, 0.06532859802246094, 0.0699615478515625, 0.07459449768066406, 0.07922744750976562, 0.08386039733886719, 0.08849334716796875, 0.09312629699707031, 0.09775924682617188, 0.10239219665527344, 0.107025146484375, 0.11165809631347656, 0.11629104614257812, 0.12092399597167969, 0.12555694580078125, 0.1301898956298828, 0.13482284545898438, 0.13945579528808594, 0.1440887451171875, 0.14872169494628906, 0.15335464477539062, 0.1579875946044922, 0.16262054443359375, 0.1672534942626953, 0.17188644409179688, 0.17651939392089844, 0.18115234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 14.0, 10.0, 24.0, 53.0, 97.0, 146.0, 164.0, 164.0, 131.0, 78.0, 52.0, 30.0, 25.0, 8.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0489306449890137, -0.9510831236839294, -0.8532356023788452, -0.7553880214691162, -0.6575405597686768, -0.5596929788589478, -0.4618454575538635, -0.3639979362487793, -0.26615041494369507, -0.16830289363861084, -0.07045535743236542, 0.027392178773880005, 0.12523970007896423, 0.22308722138404846, 0.3209347724914551, 0.4187822937965393, 0.5166298151016235, 0.6144773364067078, 0.712324857711792, 0.810172438621521, 0.9080199003219604, 1.0058674812316895, 1.103714942932129, 1.201562523841858, 1.299410104751587, 1.397257685661316, 1.4951051473617554, 1.5929527282714844, 1.6908001899719238, 1.7886477708816528, 1.8864953517913818, 1.9843428134918213, 2.0821902751922607, 2.1800377368927, 2.2778854370117188, 2.375732898712158, 2.4735803604125977, 2.571427822113037, 2.6692755222320557, 2.767122983932495, 2.8649704456329346, 2.962817907333374, 3.0606656074523926, 3.158513069152832, 3.2563605308532715, 3.354207992553711, 3.4520556926727295, 3.549903154373169, 3.6477508544921875, 3.745598316192627, 3.8434460163116455, 3.941293478012085, 4.0391411781311035, 4.136988639831543, 4.234836101531982, 4.332683563232422, 4.430531024932861, 4.528378486633301, 4.62622594833374, 4.72407341003418, 4.821921348571777, 4.919768810272217, 5.017616271972656, 5.115463733673096, 5.213311195373535]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 6.0, 9.0, 8.0, 9.0, 14.0, 16.0, 15.0, 14.0, 21.0, 12.0, 20.0, 21.0, 26.0, 27.0, 41.0, 29.0, 30.0, 26.0, 29.0, 31.0, 36.0, 29.0, 45.0, 39.0, 39.0, 49.0, 29.0, 32.0, 35.0, 26.0, 26.0, 28.0, 22.0, 24.0, 20.0, 25.0, 17.0, 14.0, 3.0, 10.0, 7.0, 9.0, 4.0, 2.0, 6.0, 3.0, 6.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0], "bins": [-1.4185442924499512, -1.375292420387268, -1.332040548324585, -1.2887885570526123, -1.2455366849899292, -1.202284812927246, -1.159032940864563, -1.1157810688018799, -1.0725290775299072, -1.0292772054672241, -0.9860252737998962, -0.9427734017372131, -0.8995214700698853, -0.8562695980072021, -0.813017725944519, -0.7697658538818359, -0.7265139818191528, -0.6832621097564697, -0.6400101780891418, -0.5967583060264587, -0.5535063743591309, -0.5102545022964478, -0.46700263023376465, -0.42375072836875916, -0.38049882650375366, -0.33724692463874817, -0.2939950227737427, -0.25074315071105957, -0.20749124884605408, -0.16423934698104858, -0.12098747491836548, -0.07773557305335999, -0.03448367118835449, 0.008768223226070404, 0.0520201176404953, 0.0952720046043396, 0.1385239064693451, 0.18177580833435059, 0.2250276803970337, 0.2682795822620392, 0.3115314841270447, 0.35478338599205017, 0.39803528785705566, 0.44128715991973877, 0.48453906178474426, 0.5277909636497498, 0.5710428357124329, 0.6142947673797607, 0.6575466394424438, 0.700798511505127, 0.7440504431724548, 0.7873023152351379, 0.8305542469024658, 0.8738061189651489, 0.917057991027832, 0.9603098630905151, 1.0035617351531982, 1.0468136072158813, 1.0900654792785645, 1.133317470550537, 1.1765693426132202, 1.2198212146759033, 1.2630730867385864, 1.3063249588012695, 1.3495769500732422]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 4.0, 13.0, 8.0, 12.0, 35.0, 49.0, 68.0, 137.0, 214.0, 462.0, 1155.0, 3329.0, 13327.0, 115172.0, 3987153.0, 59368.0, 9199.0, 2586.0, 921.0, 462.0, 237.0, 112.0, 91.0, 40.0, 42.0, 32.0, 7.0, 12.0, 9.0, 10.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92626953125, -0.8897781372070312, -0.8532867431640625, -0.8167953491210938, -0.780303955078125, -0.7438125610351562, -0.7073211669921875, -0.6708297729492188, -0.63433837890625, -0.5978469848632812, -0.5613555908203125, -0.5248641967773438, -0.488372802734375, -0.45188140869140625, -0.4153900146484375, -0.37889862060546875, -0.3424072265625, -0.30591583251953125, -0.2694244384765625, -0.23293304443359375, -0.196441650390625, -0.15995025634765625, -0.1234588623046875, -0.08696746826171875, -0.05047607421875, -0.01398468017578125, 0.0225067138671875, 0.05899810791015625, 0.095489501953125, 0.13198089599609375, 0.1684722900390625, 0.20496368408203125, 0.241455078125, 0.27794647216796875, 0.3144378662109375, 0.35092926025390625, 0.387420654296875, 0.42391204833984375, 0.4604034423828125, 0.49689483642578125, 0.53338623046875, 0.5698776245117188, 0.6063690185546875, 0.6428604125976562, 0.679351806640625, 0.7158432006835938, 0.7523345947265625, 0.7888259887695312, 0.8253173828125, 0.8618087768554688, 0.8983001708984375, 0.9347915649414062, 0.971282958984375, 1.0077743530273438, 1.0442657470703125, 1.0807571411132812, 1.11724853515625, 1.1537399291992188, 1.1902313232421875, 1.2267227172851562, 1.263214111328125, 1.2997055053710938, 1.3361968994140625, 1.3726882934570312, 1.4091796875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 12.0, 11.0, 22.0, 50.0, 60.0, 84.0, 113.0, 105.0, 123.0, 108.0, 97.0, 76.0, 60.0, 32.0, 20.0, 13.0, 10.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2115478515625, -0.20479202270507812, -0.19803619384765625, -0.19128036499023438, -0.1845245361328125, -0.17776870727539062, -0.17101287841796875, -0.16425704956054688, -0.157501220703125, -0.15074539184570312, -0.14398956298828125, -0.13723373413085938, -0.1304779052734375, -0.12372207641601562, -0.11696624755859375, -0.11021041870117188, -0.10345458984375, -0.09669876098632812, -0.08994293212890625, -0.08318710327148438, -0.0764312744140625, -0.06967544555664062, -0.06291961669921875, -0.056163787841796875, -0.049407958984375, -0.042652130126953125, -0.03589630126953125, -0.029140472412109375, -0.0223846435546875, -0.015628814697265625, -0.00887298583984375, -0.002117156982421875, 0.004638671875, 0.011394500732421875, 0.01815032958984375, 0.024906158447265625, 0.0316619873046875, 0.038417816162109375, 0.04517364501953125, 0.051929473876953125, 0.058685302734375, 0.06544113159179688, 0.07219696044921875, 0.07895278930664062, 0.0857086181640625, 0.09246444702148438, 0.09922027587890625, 0.10597610473632812, 0.11273193359375, 0.11948776245117188, 0.12624359130859375, 0.13299942016601562, 0.1397552490234375, 0.14651107788085938, 0.15326690673828125, 0.16002273559570312, 0.166778564453125, 0.17353439331054688, 0.18029022216796875, 0.18704605102539062, 0.1938018798828125, 0.20055770874023438, 0.20731353759765625, 0.21406936645507812, 0.2208251953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 15.0, 29.0, 49.0, 149.0, 314.0, 899.0, 2592.0, 8713.0, 49779.0, 3769192.0, 331935.0, 22727.0, 5182.0, 1699.0, 576.0, 259.0, 101.0, 43.0, 18.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.7800521850585938, -0.7519989013671875, -0.7239456176757812, -0.695892333984375, -0.6678390502929688, -0.6397857666015625, -0.6117324829101562, -0.58367919921875, -0.5556259155273438, -0.5275726318359375, -0.49951934814453125, -0.471466064453125, -0.44341278076171875, -0.4153594970703125, -0.38730621337890625, -0.3592529296875, -0.33119964599609375, -0.3031463623046875, -0.27509307861328125, -0.247039794921875, -0.21898651123046875, -0.1909332275390625, -0.16287994384765625, -0.13482666015625, -0.10677337646484375, -0.0787200927734375, -0.05066680908203125, -0.022613525390625, 0.00543975830078125, 0.0334930419921875, 0.06154632568359375, 0.089599609375, 0.11765289306640625, 0.1457061767578125, 0.17375946044921875, 0.201812744140625, 0.22986602783203125, 0.2579193115234375, 0.28597259521484375, 0.31402587890625, 0.34207916259765625, 0.3701324462890625, 0.39818572998046875, 0.426239013671875, 0.45429229736328125, 0.4823455810546875, 0.5103988647460938, 0.5384521484375, 0.5665054321289062, 0.5945587158203125, 0.6226119995117188, 0.650665283203125, 0.6787185668945312, 0.7067718505859375, 0.7348251342773438, 0.76287841796875, 0.7909317016601562, 0.8189849853515625, 0.8470382690429688, 0.875091552734375, 0.9031448364257812, 0.9311981201171875, 0.9592514038085938, 0.9873046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 5.0, 3.0, 4.0, 10.0, 10.0, 9.0, 12.0, 24.0, 45.0, 57.0, 103.0, 254.0, 2067.0, 945.0, 226.0, 104.0, 63.0, 41.0, 23.0, 20.0, 16.0, 2.0, 10.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218017578125, -0.21072006225585938, -0.20342254638671875, -0.19612503051757812, -0.1888275146484375, -0.18152999877929688, -0.17423248291015625, -0.16693496704101562, -0.159637451171875, -0.15233993530273438, -0.14504241943359375, -0.13774490356445312, -0.1304473876953125, -0.12314987182617188, -0.11585235595703125, -0.10855484008789062, -0.10125732421875, -0.09395980834960938, -0.08666229248046875, -0.07936477661132812, -0.0720672607421875, -0.06476974487304688, -0.05747222900390625, -0.050174713134765625, -0.042877197265625, -0.035579681396484375, -0.02828216552734375, -0.020984649658203125, -0.0136871337890625, -0.006389617919921875, 0.00090789794921875, 0.008205413818359375, 0.0155029296875, 0.022800445556640625, 0.03009796142578125, 0.037395477294921875, 0.0446929931640625, 0.051990509033203125, 0.05928802490234375, 0.06658554077148438, 0.073883056640625, 0.08118057250976562, 0.08847808837890625, 0.09577560424804688, 0.1030731201171875, 0.11037063598632812, 0.11766815185546875, 0.12496566772460938, 0.13226318359375, 0.13956069946289062, 0.14685821533203125, 0.15415573120117188, 0.1614532470703125, 0.16875076293945312, 0.17604827880859375, 0.18334579467773438, 0.190643310546875, 0.19794082641601562, 0.20523834228515625, 0.21253585815429688, 0.2198333740234375, 0.22713088989257812, 0.23442840576171875, 0.24172592163085938, 0.2490234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 10.0, 47.0, 223.0, 443.0, 224.0, 41.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.302762508392334, -4.188028335571289, -4.073294162750244, -3.958559989929199, -3.8438258171081543, -3.7290916442871094, -3.6143572330474854, -3.4996230602264404, -3.3848888874053955, -3.2701547145843506, -3.1554205417633057, -3.0406863689422607, -2.9259519577026367, -2.811217784881592, -2.696483612060547, -2.581749439239502, -2.467015266418457, -2.352281093597412, -2.237546920776367, -2.1228127479553223, -2.0080785751342773, -1.8933442831039429, -1.7786099910736084, -1.6638758182525635, -1.5491416454315186, -1.4344074726104736, -1.3196732997894287, -1.2049390077590942, -1.0902048349380493, -0.9754706621170044, -0.8607364296913147, -0.746002197265625, -0.6312682628631592, -0.5165340900421143, -0.40179985761642456, -0.28706565499305725, -0.17233145236968994, -0.05759727954864502, 0.05713695287704468, 0.17187118530273438, 0.2866053581237793, 0.4013395607471466, 0.5160737633705139, 0.6308079957962036, 0.7455421686172485, 0.8602763414382935, 0.9750105738639832, 1.0897448062896729, 1.2044789791107178, 1.3192131519317627, 1.4339473247528076, 1.548681616783142, 1.663415789604187, 1.778149962425232, 1.8928842544555664, 2.0076184272766113, 2.1223526000976562, 2.237086772918701, 2.351820945739746, 2.466555118560791, 2.581289291381836, 2.696023464202881, 2.810757875442505, 2.92549204826355, 3.0402262210845947]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 2.0, 9.0, 18.0, 27.0, 31.0, 45.0, 49.0, 57.0, 77.0, 79.0, 89.0, 67.0, 58.0, 61.0, 74.0, 75.0, 55.0, 41.0, 33.0, 18.0, 19.0, 9.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2582192420959473, -1.2260786294937134, -1.1939380168914795, -1.161797285079956, -1.1296566724777222, -1.0975160598754883, -1.0653754472732544, -1.0332348346710205, -1.001094102859497, -0.9689534902572632, -0.9368128180503845, -0.9046722054481506, -0.872531533241272, -0.8403909206390381, -0.8082503080368042, -0.7761096954345703, -0.7439690828323364, -0.7118284702301025, -0.6796877980232239, -0.64754718542099, -0.6154065132141113, -0.5832659006118774, -0.5511252880096436, -0.5189846754074097, -0.486844003200531, -0.45470336079597473, -0.42256271839141846, -0.39042210578918457, -0.3582814633846283, -0.326140820980072, -0.29400020837783813, -0.26185956597328186, -0.22971880435943604, -0.19757816195487976, -0.16543753445148468, -0.1332969069480896, -0.10115626454353333, -0.06901562213897705, -0.03687499463558197, -0.00473436713218689, 0.027406275272369385, 0.05954691022634506, 0.09168754518032074, 0.12382818013429642, 0.1559688150882721, 0.18810945749282837, 0.22025008499622345, 0.25239071249961853, 0.2845313549041748, 0.3166719973087311, 0.34881263971328735, 0.38095325231552124, 0.4130938947200775, 0.4452345371246338, 0.4773751497268677, 0.5095157623291016, 0.5416564345359802, 0.5737970471382141, 0.6059377193450928, 0.6380783319473267, 0.6702189445495605, 0.7023596167564392, 0.7345002293586731, 0.7666409015655518, 0.7987815141677856]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 12.0, 19.0, 27.0, 48.0, 91.0, 138.0, 256.0, 514.0, 1115.0, 2530.0, 7928.0, 40237.0, 316502.0, 569118.0, 89176.0, 14120.0, 3804.0, 1433.0, 683.0, 340.0, 167.0, 109.0, 57.0, 36.0, 32.0, 19.0, 7.0, 6.0, 12.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82666015625, -0.8017578125, -0.77685546875, -0.751953125, -0.72705078125, -0.7021484375, -0.67724609375, -0.65234375, -0.62744140625, -0.6025390625, -0.57763671875, -0.552734375, -0.52783203125, -0.5029296875, -0.47802734375, -0.453125, -0.42822265625, -0.4033203125, -0.37841796875, -0.353515625, -0.32861328125, -0.3037109375, -0.27880859375, -0.25390625, -0.22900390625, -0.2041015625, -0.17919921875, -0.154296875, -0.12939453125, -0.1044921875, -0.07958984375, -0.0546875, -0.02978515625, -0.0048828125, 0.02001953125, 0.044921875, 0.06982421875, 0.0947265625, 0.11962890625, 0.14453125, 0.16943359375, 0.1943359375, 0.21923828125, 0.244140625, 0.26904296875, 0.2939453125, 0.31884765625, 0.34375, 0.36865234375, 0.3935546875, 0.41845703125, 0.443359375, 0.46826171875, 0.4931640625, 0.51806640625, 0.54296875, 0.56787109375, 0.5927734375, 0.61767578125, 0.642578125, 0.66748046875, 0.6923828125, 0.71728515625, 0.7421875, 0.76708984375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 11.0, 21.0, 27.0, 66.0, 69.0, 124.0, 103.0, 122.0, 110.0, 98.0, 96.0, 59.0, 33.0, 25.0, 19.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2183837890625, -0.21126556396484375, -0.2041473388671875, -0.19702911376953125, -0.189910888671875, -0.18279266357421875, -0.1756744384765625, -0.16855621337890625, -0.16143798828125, -0.15431976318359375, -0.1472015380859375, -0.14008331298828125, -0.132965087890625, -0.12584686279296875, -0.1187286376953125, -0.11161041259765625, -0.1044921875, -0.09737396240234375, -0.0902557373046875, -0.08313751220703125, -0.076019287109375, -0.06890106201171875, -0.0617828369140625, -0.05466461181640625, -0.04754638671875, -0.04042816162109375, -0.0333099365234375, -0.02619171142578125, -0.019073486328125, -0.01195526123046875, -0.0048370361328125, 0.00228118896484375, 0.0093994140625, 0.01651763916015625, 0.0236358642578125, 0.03075408935546875, 0.037872314453125, 0.04499053955078125, 0.0521087646484375, 0.05922698974609375, 0.06634521484375, 0.07346343994140625, 0.0805816650390625, 0.08769989013671875, 0.094818115234375, 0.10193634033203125, 0.1090545654296875, 0.11617279052734375, 0.123291015625, 0.13040924072265625, 0.1375274658203125, 0.14464569091796875, 0.151763916015625, 0.15888214111328125, 0.1660003662109375, 0.17311859130859375, 0.18023681640625, 0.18735504150390625, 0.1944732666015625, 0.20159149169921875, 0.208709716796875, 0.21582794189453125, 0.2229461669921875, 0.23006439208984375, 0.2371826171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 2.0, 2.0, 11.0, 16.0, 21.0, 30.0, 26.0, 62.0, 94.0, 172.0, 284.0, 538.0, 1069.0, 2526.0, 6962.0, 24666.0, 111126.0, 442495.0, 351861.0, 78630.0, 18546.0, 5367.0, 2085.0, 906.0, 427.0, 241.0, 142.0, 78.0, 54.0, 38.0, 26.0, 14.0, 14.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.59375, -0.5788650512695312, -0.5639801025390625, -0.5490951538085938, -0.534210205078125, -0.5193252563476562, -0.5044403076171875, -0.48955535888671875, -0.47467041015625, -0.45978546142578125, -0.4449005126953125, -0.43001556396484375, -0.415130615234375, -0.40024566650390625, -0.3853607177734375, -0.37047576904296875, -0.3555908203125, -0.34070587158203125, -0.3258209228515625, -0.31093597412109375, -0.296051025390625, -0.28116607666015625, -0.2662811279296875, -0.25139617919921875, -0.23651123046875, -0.22162628173828125, -0.2067413330078125, -0.19185638427734375, -0.176971435546875, -0.16208648681640625, -0.1472015380859375, -0.13231658935546875, -0.117431640625, -0.10254669189453125, -0.0876617431640625, -0.07277679443359375, -0.057891845703125, -0.04300689697265625, -0.0281219482421875, -0.01323699951171875, 0.00164794921875, 0.01653289794921875, 0.0314178466796875, 0.04630279541015625, 0.061187744140625, 0.07607269287109375, 0.0909576416015625, 0.10584259033203125, 0.1207275390625, 0.13561248779296875, 0.1504974365234375, 0.16538238525390625, 0.180267333984375, 0.19515228271484375, 0.2100372314453125, 0.22492218017578125, 0.23980712890625, 0.25469207763671875, 0.2695770263671875, 0.28446197509765625, 0.299346923828125, 0.31423187255859375, 0.3291168212890625, 0.34400177001953125, 0.35888671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 12.0, 11.0, 15.0, 14.0, 16.0, 19.0, 24.0, 20.0, 24.0, 29.0, 39.0, 38.0, 61.0, 58.0, 50.0, 50.0, 54.0, 44.0, 42.0, 50.0, 53.0, 46.0, 30.0, 39.0, 29.0, 18.0, 25.0, 16.0, 14.0, 7.0, 5.0, 9.0, 6.0, 5.0, 7.0, 3.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.5322265625, -0.5175857543945312, -0.5029449462890625, -0.48830413818359375, -0.473663330078125, -0.45902252197265625, -0.4443817138671875, -0.42974090576171875, -0.41510009765625, -0.40045928955078125, -0.3858184814453125, -0.37117767333984375, -0.356536865234375, -0.34189605712890625, -0.3272552490234375, -0.31261444091796875, -0.2979736328125, -0.28333282470703125, -0.2686920166015625, -0.25405120849609375, -0.239410400390625, -0.22476959228515625, -0.2101287841796875, -0.19548797607421875, -0.18084716796875, -0.16620635986328125, -0.1515655517578125, -0.13692474365234375, -0.122283935546875, -0.10764312744140625, -0.0930023193359375, -0.07836151123046875, -0.063720703125, -0.04907989501953125, -0.0344390869140625, -0.01979827880859375, -0.005157470703125, 0.00948333740234375, 0.0241241455078125, 0.03876495361328125, 0.05340576171875, 0.06804656982421875, 0.0826873779296875, 0.09732818603515625, 0.111968994140625, 0.12660980224609375, 0.1412506103515625, 0.15589141845703125, 0.1705322265625, 0.18517303466796875, 0.1998138427734375, 0.21445465087890625, 0.229095458984375, 0.24373626708984375, 0.2583770751953125, 0.27301788330078125, 0.28765869140625, 0.30229949951171875, 0.3169403076171875, 0.33158111572265625, 0.346221923828125, 0.36086273193359375, 0.3755035400390625, 0.39014434814453125, 0.40478515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 9.0, 16.0, 20.0, 34.0, 67.0, 93.0, 190.0, 321.0, 600.0, 1100.0, 2270.0, 5515.0, 21053.0, 226973.0, 731310.0, 44129.0, 8691.0, 3044.0, 1433.0, 713.0, 383.0, 249.0, 142.0, 80.0, 41.0, 26.0, 22.0, 11.0, 4.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51611328125, -0.5005645751953125, -0.485015869140625, -0.4694671630859375, -0.45391845703125, -0.4383697509765625, -0.422821044921875, -0.4072723388671875, -0.3917236328125, -0.3761749267578125, -0.360626220703125, -0.3450775146484375, -0.32952880859375, -0.3139801025390625, -0.298431396484375, -0.2828826904296875, -0.267333984375, -0.2517852783203125, -0.236236572265625, -0.2206878662109375, -0.20513916015625, -0.1895904541015625, -0.174041748046875, -0.1584930419921875, -0.1429443359375, -0.1273956298828125, -0.111846923828125, -0.0962982177734375, -0.08074951171875, -0.0652008056640625, -0.049652099609375, -0.0341033935546875, -0.0185546875, -0.0030059814453125, 0.012542724609375, 0.0280914306640625, 0.04364013671875, 0.0591888427734375, 0.074737548828125, 0.0902862548828125, 0.1058349609375, 0.1213836669921875, 0.136932373046875, 0.1524810791015625, 0.16802978515625, 0.1835784912109375, 0.199127197265625, 0.2146759033203125, 0.230224609375, 0.2457733154296875, 0.261322021484375, 0.2768707275390625, 0.29241943359375, 0.3079681396484375, 0.323516845703125, 0.3390655517578125, 0.3546142578125, 0.3701629638671875, 0.385711669921875, 0.4012603759765625, 0.41680908203125, 0.4323577880859375, 0.447906494140625, 0.4634552001953125, 0.47900390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 6.0, 8.0, 12.0, 14.0, 22.0, 29.0, 37.0, 37.0, 38.0, 60.0, 95.0, 128.0, 125.0, 82.0, 59.0, 47.0, 40.0, 26.0, 21.0, 20.0, 14.0, 18.0, 14.0, 6.0, 3.0, 3.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018084049224853516, -0.00017577968537807465, -0.00017071887850761414, -0.00016565807163715363, -0.00016059726476669312, -0.0001555364578962326, -0.0001504756510257721, -0.00014541484415531158, -0.00014035403728485107, -0.00013529323041439056, -0.00013023242354393005, -0.00012517161667346954, -0.00012011080980300903, -0.00011505000293254852, -0.00010998919606208801, -0.0001049283891916275, -9.986758232116699e-05, -9.480677545070648e-05, -8.974596858024597e-05, -8.468516170978546e-05, -7.962435483932495e-05, -7.456354796886444e-05, -6.950274109840393e-05, -6.444193422794342e-05, -5.938112735748291e-05, -5.43203204870224e-05, -4.925951361656189e-05, -4.419870674610138e-05, -3.913789987564087e-05, -3.407709300518036e-05, -2.901628613471985e-05, -2.395547926425934e-05, -1.8894672393798828e-05, -1.3833865523338318e-05, -8.773058652877808e-06, -3.7122517824172974e-06, 1.3485550880432129e-06, 6.409361958503723e-06, 1.1470168828964233e-05, 1.6530975699424744e-05, 2.1591782569885254e-05, 2.6652589440345764e-05, 3.1713396310806274e-05, 3.6774203181266785e-05, 4.1835010051727295e-05, 4.6895816922187805e-05, 5.1956623792648315e-05, 5.7017430663108826e-05, 6.207823753356934e-05, 6.713904440402985e-05, 7.219985127449036e-05, 7.726065814495087e-05, 8.232146501541138e-05, 8.738227188587189e-05, 9.24430787563324e-05, 9.750388562679291e-05, 0.00010256469249725342, 0.00010762549936771393, 0.00011268630623817444, 0.00011774711310863495, 0.00012280791997909546, 0.00012786872684955597, 0.00013292953372001648, 0.000137990340590477, 0.0001430511474609375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 4.0, 6.0, 12.0, 39.0, 78.0, 294.0, 1586.0, 22131.0, 997571.0, 24661.0, 1675.0, 312.0, 101.0, 22.0, 18.0, 12.0, 5.0, 6.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.0687103271484375, -1.025115966796875, -0.9815216064453125, -0.93792724609375, -0.8943328857421875, -0.850738525390625, -0.8071441650390625, -0.7635498046875, -0.7199554443359375, -0.676361083984375, -0.6327667236328125, -0.58917236328125, -0.5455780029296875, -0.501983642578125, -0.4583892822265625, -0.414794921875, -0.3712005615234375, -0.327606201171875, -0.2840118408203125, -0.24041748046875, -0.1968231201171875, -0.153228759765625, -0.1096343994140625, -0.0660400390625, -0.0224456787109375, 0.021148681640625, 0.0647430419921875, 0.10833740234375, 0.1519317626953125, 0.195526123046875, 0.2391204833984375, 0.28271484375, 0.3263092041015625, 0.369903564453125, 0.4134979248046875, 0.45709228515625, 0.5006866455078125, 0.544281005859375, 0.5878753662109375, 0.6314697265625, 0.6750640869140625, 0.718658447265625, 0.7622528076171875, 0.80584716796875, 0.8494415283203125, 0.893035888671875, 0.9366302490234375, 0.980224609375, 1.0238189697265625, 1.067413330078125, 1.1110076904296875, 1.15460205078125, 1.1981964111328125, 1.241790771484375, 1.2853851318359375, 1.3289794921875, 1.3725738525390625, 1.416168212890625, 1.4597625732421875, 1.50335693359375, 1.5469512939453125, 1.590545654296875, 1.6341400146484375, 1.677734375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 8.0, 18.0, 21.0, 43.0, 92.0, 130.0, 224.0, 216.0, 93.0, 51.0, 32.0, 13.0, 13.0, 7.0, 9.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67578125, -0.6563034057617188, -0.6368255615234375, -0.6173477172851562, -0.597869873046875, -0.5783920288085938, -0.5589141845703125, -0.5394363403320312, -0.51995849609375, -0.5004806518554688, -0.4810028076171875, -0.46152496337890625, -0.442047119140625, -0.42256927490234375, -0.4030914306640625, -0.38361358642578125, -0.3641357421875, -0.34465789794921875, -0.3251800537109375, -0.30570220947265625, -0.286224365234375, -0.26674652099609375, -0.2472686767578125, -0.22779083251953125, -0.20831298828125, -0.18883514404296875, -0.1693572998046875, -0.14987945556640625, -0.130401611328125, -0.11092376708984375, -0.0914459228515625, -0.07196807861328125, -0.052490234375, -0.03301239013671875, -0.0135345458984375, 0.00594329833984375, 0.025421142578125, 0.04489898681640625, 0.0643768310546875, 0.08385467529296875, 0.10333251953125, 0.12281036376953125, 0.1422882080078125, 0.16176605224609375, 0.181243896484375, 0.20072174072265625, 0.2201995849609375, 0.23967742919921875, 0.2591552734375, 0.27863311767578125, 0.2981109619140625, 0.31758880615234375, 0.337066650390625, 0.35654449462890625, 0.3760223388671875, 0.39550018310546875, 0.41497802734375, 0.43445587158203125, 0.4539337158203125, 0.47341156005859375, 0.492889404296875, 0.5123672485351562, 0.5318450927734375, 0.5513229370117188, 0.57080078125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 18.0, 64.0, 170.0, 339.0, 263.0, 110.0, 28.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.45939826965332, -9.105244636535645, -8.751090049743652, -8.396936416625977, -8.0427827835083, -7.688628673553467, -7.334474563598633, -6.980320930480957, -6.626167297363281, -6.272013187408447, -5.9178595542907715, -5.5637054443359375, -5.209551811218262, -4.855397701263428, -4.501243591308594, -4.147089958190918, -3.792935848236084, -3.438781976699829, -3.084628105163574, -2.7304739952087402, -2.3763203620910645, -2.0221662521362305, -1.6680123805999756, -1.3138585090637207, -0.9597046375274658, -0.6055507659912109, -0.2513968348503113, 0.10275709629058838, 0.45691096782684326, 0.8110648393630981, 1.1652188301086426, 1.5193727016448975, 1.8735265731811523, 2.2276804447174072, 2.581834316253662, 2.935988426208496, 3.290142059326172, 3.644296169281006, 3.9984500408172607, 4.352603912353516, 4.706757545471191, 5.060911655426025, 5.415065288543701, 5.769219398498535, 6.123373031616211, 6.477527141571045, 6.831681251525879, 7.185834884643555, 7.539988994598389, 7.894143104553223, 8.248296737670898, 8.602450370788574, 8.956604957580566, 9.310758590698242, 9.664912223815918, 10.019065856933594, 10.373220443725586, 10.727374076843262, 11.081528663635254, 11.43568229675293, 11.789835929870605, 12.143989562988281, 12.498144149780273, 12.85229778289795, 13.206451416015625]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 6.0, 5.0, 11.0, 10.0, 14.0, 17.0, 20.0, 21.0, 24.0, 25.0, 34.0, 25.0, 36.0, 55.0, 31.0, 47.0, 53.0, 44.0, 48.0, 57.0, 50.0, 32.0, 37.0, 34.0, 38.0, 29.0, 25.0, 29.0, 16.0, 27.0, 22.0, 16.0, 11.0, 7.0, 10.0, 9.0, 8.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.656383514404297, -2.5737974643707275, -2.491211414337158, -2.408625364303589, -2.3260393142700195, -2.24345326423645, -2.160867214202881, -2.0782811641693115, -1.9956951141357422, -1.9131090641021729, -1.8305230140686035, -1.7479369640350342, -1.6653509140014648, -1.5827648639678955, -1.5001788139343262, -1.4175927639007568, -1.335006833076477, -1.2524207830429077, -1.1698347330093384, -1.087248682975769, -1.0046626329421997, -0.9220765829086304, -0.8394905924797058, -0.7569045424461365, -0.6743184924125671, -0.5917324423789978, -0.5091463923454285, -0.4265603721141815, -0.3439743220806122, -0.26138827204704285, -0.1788022518157959, -0.09621620178222656, -0.013630151748657227, 0.06895589083433151, 0.15154193341732025, 0.2341279685497284, 0.31671401858329773, 0.39930006861686707, 0.481886088848114, 0.5644721388816833, 0.6470581889152527, 0.729644238948822, 0.8122302889823914, 0.8948162794113159, 0.9774023294448853, 1.0599883794784546, 1.142574429512024, 1.2251604795455933, 1.3077465295791626, 1.390332579612732, 1.4729186296463013, 1.5555046796798706, 1.63809072971344, 1.7206767797470093, 1.803262710571289, 1.8858487606048584, 1.9684348106384277, 2.051020860671997, 2.1336069107055664, 2.2161929607391357, 2.298779010772705, 2.3813650608062744, 2.4639511108398438, 2.546537160873413, 2.6291232109069824]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 5.0, 5.0, 4.0, 10.0, 12.0, 11.0, 14.0, 21.0, 30.0, 43.0, 62.0, 82.0, 158.0, 228.0, 453.0, 743.0, 1506.0, 3103.0, 6959.0, 18541.0, 67397.0, 972181.0, 3001107.0, 84466.0, 21808.0, 7904.0, 3448.0, 1697.0, 869.0, 504.0, 309.0, 193.0, 111.0, 79.0, 64.0, 51.0, 32.0, 18.0, 13.0, 6.0, 7.0, 8.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.64501953125, -0.6242599487304688, -0.6035003662109375, -0.5827407836914062, -0.561981201171875, -0.5412216186523438, -0.5204620361328125, -0.49970245361328125, -0.47894287109375, -0.45818328857421875, -0.4374237060546875, -0.41666412353515625, -0.395904541015625, -0.37514495849609375, -0.3543853759765625, -0.33362579345703125, -0.3128662109375, -0.29210662841796875, -0.2713470458984375, -0.25058746337890625, -0.229827880859375, -0.20906829833984375, -0.1883087158203125, -0.16754913330078125, -0.14678955078125, -0.12602996826171875, -0.1052703857421875, -0.08451080322265625, -0.063751220703125, -0.04299163818359375, -0.0222320556640625, -0.00147247314453125, 0.019287109375, 0.04004669189453125, 0.0608062744140625, 0.08156585693359375, 0.102325439453125, 0.12308502197265625, 0.1438446044921875, 0.16460418701171875, 0.18536376953125, 0.20612335205078125, 0.2268829345703125, 0.24764251708984375, 0.268402099609375, 0.28916168212890625, 0.3099212646484375, 0.33068084716796875, 0.3514404296875, 0.37220001220703125, 0.3929595947265625, 0.41371917724609375, 0.434478759765625, 0.45523834228515625, 0.4759979248046875, 0.49675750732421875, 0.51751708984375, 0.5382766723632812, 0.5590362548828125, 0.5797958374023438, 0.600555419921875, 0.6213150024414062, 0.6420745849609375, 0.6628341674804688, 0.68359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 8.0, 11.0, 20.0, 27.0, 39.0, 67.0, 92.0, 90.0, 105.0, 97.0, 110.0, 97.0, 71.0, 59.0, 47.0, 22.0, 21.0, 10.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243408203125, -0.23590469360351562, -0.22840118408203125, -0.22089767456054688, -0.2133941650390625, -0.20589065551757812, -0.19838714599609375, -0.19088363647460938, -0.183380126953125, -0.17587661743164062, -0.16837310791015625, -0.16086959838867188, -0.1533660888671875, -0.14586257934570312, -0.13835906982421875, -0.13085556030273438, -0.12335205078125, -0.11584854125976562, -0.10834503173828125, -0.10084152221679688, -0.0933380126953125, -0.08583450317382812, -0.07833099365234375, -0.07082748413085938, -0.063323974609375, -0.055820465087890625, -0.04831695556640625, -0.040813446044921875, -0.0333099365234375, -0.025806427001953125, -0.01830291748046875, -0.010799407958984375, -0.0032958984375, 0.004207611083984375, 0.01171112060546875, 0.019214630126953125, 0.0267181396484375, 0.034221649169921875, 0.04172515869140625, 0.049228668212890625, 0.056732177734375, 0.06423568725585938, 0.07173919677734375, 0.07924270629882812, 0.0867462158203125, 0.09424972534179688, 0.10175323486328125, 0.10925674438476562, 0.11676025390625, 0.12426376342773438, 0.13176727294921875, 0.13927078247070312, 0.1467742919921875, 0.15427780151367188, 0.16178131103515625, 0.16928482055664062, 0.176788330078125, 0.18429183959960938, 0.19179534912109375, 0.19929885864257812, 0.2068023681640625, 0.21430587768554688, 0.22180938720703125, 0.22931289672851562, 0.23681640625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 12.0, 13.0, 33.0, 72.0, 199.0, 504.0, 1481.0, 6229.0, 37971.0, 3392088.0, 722060.0, 27021.0, 4654.0, 1265.0, 413.0, 154.0, 65.0, 18.0, 17.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21484375, -1.1742401123046875, -1.133636474609375, -1.0930328369140625, -1.05242919921875, -1.0118255615234375, -0.971221923828125, -0.9306182861328125, -0.8900146484375, -0.8494110107421875, -0.808807373046875, -0.7682037353515625, -0.72760009765625, -0.6869964599609375, -0.646392822265625, -0.6057891845703125, -0.565185546875, -0.5245819091796875, -0.483978271484375, -0.4433746337890625, -0.40277099609375, -0.3621673583984375, -0.321563720703125, -0.2809600830078125, -0.2403564453125, -0.1997528076171875, -0.159149169921875, -0.1185455322265625, -0.07794189453125, -0.0373382568359375, 0.003265380859375, 0.0438690185546875, 0.08447265625, 0.1250762939453125, 0.165679931640625, 0.2062835693359375, 0.24688720703125, 0.2874908447265625, 0.328094482421875, 0.3686981201171875, 0.4093017578125, 0.4499053955078125, 0.490509033203125, 0.5311126708984375, 0.57171630859375, 0.6123199462890625, 0.652923583984375, 0.6935272216796875, 0.734130859375, 0.7747344970703125, 0.815338134765625, 0.8559417724609375, 0.89654541015625, 0.9371490478515625, 0.977752685546875, 1.0183563232421875, 1.0589599609375, 1.0995635986328125, 1.140167236328125, 1.1807708740234375, 1.22137451171875, 1.2619781494140625, 1.302581787109375, 1.3431854248046875, 1.3837890625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 5.0, 4.0, 4.0, 7.0, 5.0, 13.0, 24.0, 31.0, 53.0, 65.0, 102.0, 221.0, 1093.0, 1825.0, 283.0, 107.0, 75.0, 40.0, 35.0, 16.0, 13.0, 16.0, 5.0, 4.0, 5.0, 5.0, 7.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33984375, -0.3272895812988281, -0.31473541259765625, -0.3021812438964844, -0.2896270751953125, -0.2770729064941406, -0.26451873779296875, -0.2519645690917969, -0.239410400390625, -0.22685623168945312, -0.21430206298828125, -0.20174789428710938, -0.1891937255859375, -0.17663955688476562, -0.16408538818359375, -0.15153121948242188, -0.13897705078125, -0.12642288208007812, -0.11386871337890625, -0.10131454467773438, -0.0887603759765625, -0.07620620727539062, -0.06365203857421875, -0.051097869873046875, -0.038543701171875, -0.025989532470703125, -0.01343536376953125, -0.000881195068359375, 0.0116729736328125, 0.024227142333984375, 0.03678131103515625, 0.049335479736328125, 0.0618896484375, 0.07444381713867188, 0.08699798583984375, 0.09955215454101562, 0.1121063232421875, 0.12466049194335938, 0.13721466064453125, 0.14976882934570312, 0.162322998046875, 0.17487716674804688, 0.18743133544921875, 0.19998550415039062, 0.2125396728515625, 0.22509384155273438, 0.23764801025390625, 0.2502021789550781, 0.26275634765625, 0.2753105163574219, 0.28786468505859375, 0.3004188537597656, 0.3129730224609375, 0.3255271911621094, 0.33808135986328125, 0.3506355285644531, 0.363189697265625, 0.3757438659667969, 0.38829803466796875, 0.4008522033691406, 0.4134063720703125, 0.4259605407714844, 0.43851470947265625, 0.4510688781738281, 0.463623046875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 19.0, 34.0, 86.0, 191.0, 224.0, 225.0, 115.0, 51.0, 34.0, 19.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3231747150421143, -3.218048572540283, -3.112922191619873, -3.007796049118042, -2.902669668197632, -2.797543525695801, -2.6924171447753906, -2.5872910022735596, -2.4821648597717285, -2.3770387172698975, -2.2719123363494873, -2.1667861938476562, -2.061659812927246, -1.956533670425415, -1.8514074087142944, -1.7462811470031738, -1.6411547660827637, -1.536028504371643, -1.4309022426605225, -1.3257761001586914, -1.2206497192382812, -1.1155235767364502, -1.0103973150253296, -0.905271053314209, -0.8001447916030884, -0.6950185298919678, -0.5898922681808472, -0.48476606607437134, -0.37963980436325073, -0.2745135426521301, -0.1693873405456543, -0.06426107883453369, 0.040865421295166016, 0.14599166810512543, 0.25111791491508484, 0.35624414682388306, 0.46137040853500366, 0.5664966702461243, 0.6716228723526001, 0.7767491340637207, 0.8818753957748413, 0.9870016574859619, 1.0921279191970825, 1.1972541809082031, 1.3023803234100342, 1.4075067043304443, 1.5126328468322754, 1.617759108543396, 1.7228853702545166, 1.8280116319656372, 1.9331378936767578, 2.038264036178589, 2.143390417098999, 2.24851655960083, 2.3536429405212402, 2.4587690830230713, 2.5638952255249023, 2.6690213680267334, 2.7741477489471436, 2.8792738914489746, 2.9844002723693848, 3.089526414871216, 3.194652557373047, 3.299778938293457, 3.404905319213867]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 10.0, 7.0, 6.0, 22.0, 30.0, 40.0, 39.0, 47.0, 67.0, 66.0, 71.0, 64.0, 73.0, 83.0, 62.0, 55.0, 48.0, 48.0, 42.0, 29.0, 28.0, 18.0, 20.0, 13.0, 8.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.770959734916687, -1.7147836685180664, -1.6586076021194458, -1.6024315357208252, -1.5462554693222046, -1.490079402923584, -1.4339032173156738, -1.3777271509170532, -1.3215510845184326, -1.265375018119812, -1.2091989517211914, -1.1530228853225708, -1.0968468189239502, -1.04067063331604, -0.9844946265220642, -0.9283185005187988, -0.872142493724823, -0.8159664273262024, -0.7597903609275818, -0.7036142349243164, -0.6474381685256958, -0.5912621021270752, -0.5350860357284546, -0.4789099395275116, -0.422733873128891, -0.3665578067302704, -0.3103817105293274, -0.2542056441307068, -0.198029562830925, -0.1418534815311432, -0.08567741513252258, -0.02950131893157959, 0.026674747467041016, 0.08285082876682281, 0.13902691006660461, 0.19520297646522522, 0.2513790726661682, 0.3075551390647888, 0.3637312054634094, 0.4199073016643524, 0.476083368062973, 0.532259464263916, 0.5884355306625366, 0.6446115970611572, 0.7007876634597778, 0.7569637298583984, 0.813139796257019, 0.8693159222602844, 0.925491988658905, 0.9816680550575256, 1.037844181060791, 1.0940202474594116, 1.1501963138580322, 1.2063723802566528, 1.2625484466552734, 1.318724513053894, 1.3749005794525146, 1.4310766458511353, 1.4872527122497559, 1.5434287786483765, 1.599604845046997, 1.6557810306549072, 1.7119569778442383, 1.7681331634521484, 1.824309229850769]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 8.0, 14.0, 14.0, 40.0, 55.0, 78.0, 150.0, 240.0, 443.0, 839.0, 1832.0, 4399.0, 11926.0, 36931.0, 121726.0, 325676.0, 344572.0, 136771.0, 40782.0, 13277.0, 4790.0, 1928.0, 942.0, 465.0, 249.0, 149.0, 94.0, 53.0, 34.0, 28.0, 20.0, 6.0, 6.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.523590087890625, -0.50616455078125, -0.488739013671875, -0.4713134765625, -0.453887939453125, -0.43646240234375, -0.419036865234375, -0.401611328125, -0.384185791015625, -0.36676025390625, -0.349334716796875, -0.3319091796875, -0.314483642578125, -0.29705810546875, -0.279632568359375, -0.26220703125, -0.244781494140625, -0.22735595703125, -0.209930419921875, -0.1925048828125, -0.175079345703125, -0.15765380859375, -0.140228271484375, -0.122802734375, -0.105377197265625, -0.08795166015625, -0.070526123046875, -0.0531005859375, -0.035675048828125, -0.01824951171875, -0.000823974609375, 0.0166015625, 0.034027099609375, 0.05145263671875, 0.068878173828125, 0.0863037109375, 0.103729248046875, 0.12115478515625, 0.138580322265625, 0.156005859375, 0.173431396484375, 0.19085693359375, 0.208282470703125, 0.2257080078125, 0.243133544921875, 0.26055908203125, 0.277984619140625, 0.29541015625, 0.312835693359375, 0.33026123046875, 0.347686767578125, 0.3651123046875, 0.382537841796875, 0.39996337890625, 0.417388916015625, 0.434814453125, 0.452239990234375, 0.46966552734375, 0.487091064453125, 0.5045166015625, 0.521942138671875, 0.53936767578125, 0.556793212890625, 0.57421875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 4.0, 8.0, 19.0, 24.0, 36.0, 47.0, 66.0, 73.0, 82.0, 89.0, 105.0, 97.0, 88.0, 73.0, 53.0, 44.0, 35.0, 28.0, 13.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2445068359375, -0.23673439025878906, -0.22896194458007812, -0.2211894989013672, -0.21341705322265625, -0.2056446075439453, -0.19787216186523438, -0.19009971618652344, -0.1823272705078125, -0.17455482482910156, -0.16678237915039062, -0.1590099334716797, -0.15123748779296875, -0.1434650421142578, -0.13569259643554688, -0.12792015075683594, -0.120147705078125, -0.11237525939941406, -0.10460281372070312, -0.09683036804199219, -0.08905792236328125, -0.08128547668457031, -0.07351303100585938, -0.06574058532714844, -0.0579681396484375, -0.05019569396972656, -0.042423248291015625, -0.03465080261230469, -0.02687835693359375, -0.019105911254882812, -0.011333465576171875, -0.0035610198974609375, 0.00421142578125, 0.011983871459960938, 0.019756317138671875, 0.027528762817382812, 0.03530120849609375, 0.04307365417480469, 0.050846099853515625, 0.05861854553222656, 0.0663909912109375, 0.07416343688964844, 0.08193588256835938, 0.08970832824707031, 0.09748077392578125, 0.10525321960449219, 0.11302566528320312, 0.12079811096191406, 0.128570556640625, 0.13634300231933594, 0.14411544799804688, 0.1518878936767578, 0.15966033935546875, 0.1674327850341797, 0.17520523071289062, 0.18297767639160156, 0.1907501220703125, 0.19852256774902344, 0.20629501342773438, 0.2140674591064453, 0.22183990478515625, 0.2296123504638672, 0.23738479614257812, 0.24515724182128906, 0.2529296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 15.0, 31.0, 16.0, 28.0, 40.0, 93.0, 152.0, 238.0, 520.0, 1152.0, 3193.0, 10409.0, 39899.0, 185991.0, 512596.0, 226883.0, 48624.0, 12278.0, 3815.0, 1338.0, 581.0, 272.0, 142.0, 87.0, 33.0, 50.0, 32.0, 15.0, 9.0, 5.0, 8.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.822265625, -0.8003768920898438, -0.7784881591796875, -0.7565994262695312, -0.734710693359375, -0.7128219604492188, -0.6909332275390625, -0.6690444946289062, -0.64715576171875, -0.6252670288085938, -0.6033782958984375, -0.5814895629882812, -0.559600830078125, -0.5377120971679688, -0.5158233642578125, -0.49393463134765625, -0.4720458984375, -0.45015716552734375, -0.4282684326171875, -0.40637969970703125, -0.384490966796875, -0.36260223388671875, -0.3407135009765625, -0.31882476806640625, -0.29693603515625, -0.27504730224609375, -0.2531585693359375, -0.23126983642578125, -0.209381103515625, -0.18749237060546875, -0.1656036376953125, -0.14371490478515625, -0.121826171875, -0.09993743896484375, -0.0780487060546875, -0.05615997314453125, -0.034271240234375, -0.01238250732421875, 0.0095062255859375, 0.03139495849609375, 0.05328369140625, 0.07517242431640625, 0.0970611572265625, 0.11894989013671875, 0.140838623046875, 0.16272735595703125, 0.1846160888671875, 0.20650482177734375, 0.2283935546875, 0.25028228759765625, 0.2721710205078125, 0.29405975341796875, 0.315948486328125, 0.33783721923828125, 0.3597259521484375, 0.38161468505859375, 0.40350341796875, 0.42539215087890625, 0.4472808837890625, 0.46916961669921875, 0.491058349609375, 0.5129470825195312, 0.5348358154296875, 0.5567245483398438, 0.57861328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 9.0, 3.0, 7.0, 3.0, 5.0, 10.0, 8.0, 12.0, 11.0, 14.0, 18.0, 18.0, 33.0, 43.0, 37.0, 32.0, 28.0, 36.0, 42.0, 51.0, 57.0, 46.0, 54.0, 36.0, 48.0, 34.0, 38.0, 32.0, 39.0, 28.0, 32.0, 21.0, 21.0, 19.0, 20.0, 15.0, 5.0, 9.0, 10.0, 4.0, 4.0, 5.0, 6.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.7353515625, -0.7147979736328125, -0.694244384765625, -0.6736907958984375, -0.65313720703125, -0.6325836181640625, -0.612030029296875, -0.5914764404296875, -0.5709228515625, -0.5503692626953125, -0.529815673828125, -0.5092620849609375, -0.48870849609375, -0.4681549072265625, -0.447601318359375, -0.4270477294921875, -0.406494140625, -0.3859405517578125, -0.365386962890625, -0.3448333740234375, -0.32427978515625, -0.3037261962890625, -0.283172607421875, -0.2626190185546875, -0.2420654296875, -0.2215118408203125, -0.200958251953125, -0.1804046630859375, -0.15985107421875, -0.1392974853515625, -0.118743896484375, -0.0981903076171875, -0.07763671875, -0.0570831298828125, -0.036529541015625, -0.0159759521484375, 0.00457763671875, 0.0251312255859375, 0.045684814453125, 0.0662384033203125, 0.0867919921875, 0.1073455810546875, 0.127899169921875, 0.1484527587890625, 0.16900634765625, 0.1895599365234375, 0.210113525390625, 0.2306671142578125, 0.251220703125, 0.2717742919921875, 0.292327880859375, 0.3128814697265625, 0.33343505859375, 0.3539886474609375, 0.374542236328125, 0.3950958251953125, 0.4156494140625, 0.4362030029296875, 0.456756591796875, 0.4773101806640625, 0.49786376953125, 0.5184173583984375, 0.538970947265625, 0.5595245361328125, 0.580078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 8.0, 15.0, 15.0, 15.0, 17.0, 37.0, 31.0, 80.0, 111.0, 198.0, 373.0, 809.0, 1866.0, 6098.0, 31591.0, 427606.0, 532380.0, 36644.0, 6859.0, 2015.0, 819.0, 416.0, 196.0, 140.0, 67.0, 52.0, 44.0, 20.0, 14.0, 10.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7412109375, -0.7147750854492188, -0.6883392333984375, -0.6619033813476562, -0.635467529296875, -0.6090316772460938, -0.5825958251953125, -0.5561599731445312, -0.52972412109375, -0.5032882690429688, -0.4768524169921875, -0.45041656494140625, -0.423980712890625, -0.39754486083984375, -0.3711090087890625, -0.34467315673828125, -0.3182373046875, -0.29180145263671875, -0.2653656005859375, -0.23892974853515625, -0.212493896484375, -0.18605804443359375, -0.1596221923828125, -0.13318634033203125, -0.10675048828125, -0.08031463623046875, -0.0538787841796875, -0.02744293212890625, -0.001007080078125, 0.02542877197265625, 0.0518646240234375, 0.07830047607421875, 0.104736328125, 0.13117218017578125, 0.1576080322265625, 0.18404388427734375, 0.210479736328125, 0.23691558837890625, 0.2633514404296875, 0.28978729248046875, 0.31622314453125, 0.34265899658203125, 0.3690948486328125, 0.39553070068359375, 0.421966552734375, 0.44840240478515625, 0.4748382568359375, 0.5012741088867188, 0.5277099609375, 0.5541458129882812, 0.5805816650390625, 0.6070175170898438, 0.633453369140625, 0.6598892211914062, 0.6863250732421875, 0.7127609252929688, 0.73919677734375, 0.7656326293945312, 0.7920684814453125, 0.8185043334960938, 0.844940185546875, 0.8713760375976562, 0.8978118896484375, 0.9242477416992188, 0.95068359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 9.0, 15.0, 33.0, 49.0, 73.0, 92.0, 147.0, 143.0, 142.0, 106.0, 59.0, 42.0, 34.0, 14.0, 8.0, 7.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020682811737060547, -0.00019803829491138458, -0.0001892484724521637, -0.0001804586499929428, -0.00017166882753372192, -0.00016287900507450104, -0.00015408918261528015, -0.00014529936015605927, -0.00013650953769683838, -0.0001277197152376175, -0.0001189298927783966, -0.00011014007031917572, -0.00010135024785995483, -9.256042540073395e-05, -8.377060294151306e-05, -7.498078048229218e-05, -6.619095802307129e-05, -5.74011355638504e-05, -4.8611313104629517e-05, -3.982149064540863e-05, -3.1031668186187744e-05, -2.2241845726966858e-05, -1.3452023267745972e-05, -4.6622008085250854e-06, 4.127621650695801e-06, 1.2917444109916687e-05, 2.1707266569137573e-05, 3.049708902835846e-05, 3.9286911487579346e-05, 4.807673394680023e-05, 5.686655640602112e-05, 6.5656378865242e-05, 7.444620132446289e-05, 8.323602378368378e-05, 9.202584624290466e-05, 0.00010081566870212555, 0.00010960549116134644, 0.00011839531362056732, 0.0001271851360797882, 0.0001359749585390091, 0.00014476478099822998, 0.00015355460345745087, 0.00016234442591667175, 0.00017113424837589264, 0.00017992407083511353, 0.0001887138932943344, 0.0001975037157535553, 0.00020629353821277618, 0.00021508336067199707, 0.00022387318313121796, 0.00023266300559043884, 0.00024145282804965973, 0.0002502426505088806, 0.0002590324729681015, 0.0002678222954273224, 0.0002766121178865433, 0.00028540194034576416, 0.00029419176280498505, 0.00030298158526420593, 0.0003117714077234268, 0.0003205612301826477, 0.0003293510526418686, 0.0003381408751010895, 0.00034693069756031036, 0.00035572052001953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 11.0, 13.0, 31.0, 62.0, 82.0, 238.0, 656.0, 2895.0, 41978.0, 927433.0, 70110.0, 3779.0, 778.0, 252.0, 97.0, 50.0, 30.0, 14.0, 13.0, 9.0, 3.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1533203125, -1.112945556640625, -1.07257080078125, -1.032196044921875, -0.9918212890625, -0.951446533203125, -0.91107177734375, -0.870697021484375, -0.830322265625, -0.789947509765625, -0.74957275390625, -0.709197998046875, -0.6688232421875, -0.628448486328125, -0.58807373046875, -0.547698974609375, -0.50732421875, -0.466949462890625, -0.42657470703125, -0.386199951171875, -0.3458251953125, -0.305450439453125, -0.26507568359375, -0.224700927734375, -0.184326171875, -0.143951416015625, -0.10357666015625, -0.063201904296875, -0.0228271484375, 0.017547607421875, 0.05792236328125, 0.098297119140625, 0.138671875, 0.179046630859375, 0.21942138671875, 0.259796142578125, 0.3001708984375, 0.340545654296875, 0.38092041015625, 0.421295166015625, 0.461669921875, 0.502044677734375, 0.54241943359375, 0.582794189453125, 0.6231689453125, 0.663543701171875, 0.70391845703125, 0.744293212890625, 0.78466796875, 0.825042724609375, 0.86541748046875, 0.905792236328125, 0.9461669921875, 0.986541748046875, 1.02691650390625, 1.067291259765625, 1.107666015625, 1.148040771484375, 1.18841552734375, 1.228790283203125, 1.2691650390625, 1.309539794921875, 1.34991455078125, 1.390289306640625, 1.4306640625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 4.0, 11.0, 11.0, 20.0, 16.0, 31.0, 69.0, 131.0, 164.0, 209.0, 118.0, 73.0, 55.0, 31.0, 16.0, 19.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97119140625, -0.9379806518554688, -0.9047698974609375, -0.8715591430664062, -0.838348388671875, -0.8051376342773438, -0.7719268798828125, -0.7387161254882812, -0.70550537109375, -0.6722946166992188, -0.6390838623046875, -0.6058731079101562, -0.572662353515625, -0.5394515991210938, -0.5062408447265625, -0.47303009033203125, -0.4398193359375, -0.40660858154296875, -0.3733978271484375, -0.34018707275390625, -0.306976318359375, -0.27376556396484375, -0.2405548095703125, -0.20734405517578125, -0.17413330078125, -0.14092254638671875, -0.1077117919921875, -0.07450103759765625, -0.041290283203125, -0.00807952880859375, 0.0251312255859375, 0.05834197998046875, 0.091552734375, 0.12476348876953125, 0.1579742431640625, 0.19118499755859375, 0.224395751953125, 0.25760650634765625, 0.2908172607421875, 0.32402801513671875, 0.35723876953125, 0.39044952392578125, 0.4236602783203125, 0.45687103271484375, 0.490081787109375, 0.5232925415039062, 0.5565032958984375, 0.5897140502929688, 0.6229248046875, 0.6561355590820312, 0.6893463134765625, 0.7225570678710938, 0.755767822265625, 0.7889785766601562, 0.8221893310546875, 0.8554000854492188, 0.88861083984375, 0.9218215942382812, 0.9550323486328125, 0.9882431030273438, 1.021453857421875, 1.0546646118164062, 1.0878753662109375, 1.1210861206054688, 1.154296875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 12.0, 90.0, 344.0, 413.0, 116.0, 24.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.767391204833984, -22.011369705200195, -21.255348205566406, -20.499326705932617, -19.743305206298828, -18.98728370666504, -18.23126220703125, -17.475242614746094, -16.719219207763672, -15.963197708129883, -15.207176208496094, -14.451154708862305, -13.695133209228516, -12.939111709594727, -12.183091163635254, -11.427069664001465, -10.671049118041992, -9.915027618408203, -9.159006118774414, -8.402984619140625, -7.646963596343994, -6.890942096710205, -6.134921073913574, -5.378899574279785, -4.622878074645996, -3.866856575012207, -3.110835313796997, -2.354814052581787, -1.598792552947998, -0.842771053314209, -0.08675003051757812, 0.6692714691162109, 1.4252910614013672, 2.1813125610351562, 2.937333822250366, 3.693355083465576, 4.449376583099365, 5.205398082733154, 5.961419105529785, 6.717440605163574, 7.473462104797363, 8.229483604431152, 8.985505104064941, 9.741525650024414, 10.497547149658203, 11.253568649291992, 12.009590148925781, 12.76561164855957, 13.52163314819336, 14.277654647827148, 15.033676147460938, 15.789697647094727, 16.545719146728516, 17.301740646362305, 18.057762145996094, 18.81378173828125, 19.569805145263672, 20.32582664489746, 21.08184814453125, 21.83786964416504, 22.593891143798828, 23.349912643432617, 24.105934143066406, 24.861953735351562, 25.61797523498535]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 5.0, 14.0, 10.0, 17.0, 18.0, 25.0, 19.0, 35.0, 45.0, 49.0, 59.0, 50.0, 58.0, 62.0, 38.0, 54.0, 56.0, 74.0, 64.0, 50.0, 36.0, 32.0, 24.0, 23.0, 24.0, 20.0, 7.0, 7.0, 4.0, 8.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.075491905212402, -4.907909870147705, -4.740327835083008, -4.5727458000183105, -4.405163764953613, -4.237581729888916, -4.069999694824219, -3.9024174213409424, -3.734835386276245, -3.567253351211548, -3.3996713161468506, -3.232089042663574, -3.064507007598877, -2.8969249725341797, -2.7293429374694824, -2.561760902404785, -2.394178867340088, -2.2265968322753906, -2.0590147972106934, -1.8914326429367065, -1.7238506078720093, -1.556268572807312, -1.3886864185333252, -1.221104383468628, -1.0535223484039307, -0.8859403133392334, -0.7183582186698914, -0.5507761240005493, -0.38319408893585205, -0.21561205387115479, -0.04802989959716797, 0.1195521354675293, 0.28713417053222656, 0.4547162353992462, 0.6222983002662659, 0.7898803949356079, 0.9574624300003052, 1.1250444650650024, 1.2926266193389893, 1.4602086544036865, 1.6277906894683838, 1.795372724533081, 1.9629547595977783, 2.1305370330810547, 2.298119068145752, 2.465701103210449, 2.6332831382751465, 2.8008651733398438, 2.968447208404541, 3.1360292434692383, 3.3036112785339355, 3.471193313598633, 3.63877534866333, 3.8063573837280273, 3.9739396572113037, 4.141521453857422, 4.309103965759277, 4.476686000823975, 4.644268035888672, 4.811850070953369, 4.979432106018066, 5.147014141082764, 5.314596176147461, 5.482178688049316, 5.6497602462768555]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 4.0, 3.0, 6.0, 8.0, 11.0, 11.0, 30.0, 43.0, 54.0, 91.0, 142.0, 244.0, 388.0, 649.0, 1335.0, 2518.0, 5431.0, 13695.0, 50699.0, 3624151.0, 436531.0, 37200.0, 11031.0, 4836.0, 2312.0, 1188.0, 628.0, 392.0, 227.0, 146.0, 93.0, 68.0, 46.0, 20.0, 11.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8095703125, -0.786376953125, -0.76318359375, -0.739990234375, -0.716796875, -0.693603515625, -0.67041015625, -0.647216796875, -0.6240234375, -0.600830078125, -0.57763671875, -0.554443359375, -0.53125, -0.508056640625, -0.48486328125, -0.461669921875, -0.4384765625, -0.415283203125, -0.39208984375, -0.368896484375, -0.345703125, -0.322509765625, -0.29931640625, -0.276123046875, -0.2529296875, -0.229736328125, -0.20654296875, -0.183349609375, -0.16015625, -0.136962890625, -0.11376953125, -0.090576171875, -0.0673828125, -0.044189453125, -0.02099609375, 0.002197265625, 0.025390625, 0.048583984375, 0.07177734375, 0.094970703125, 0.1181640625, 0.141357421875, 0.16455078125, 0.187744140625, 0.2109375, 0.234130859375, 0.25732421875, 0.280517578125, 0.3037109375, 0.326904296875, 0.35009765625, 0.373291015625, 0.396484375, 0.419677734375, 0.44287109375, 0.466064453125, 0.4892578125, 0.512451171875, 0.53564453125, 0.558837890625, 0.58203125, 0.605224609375, 0.62841796875, 0.651611328125, 0.6748046875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 9.0, 16.0, 11.0, 28.0, 33.0, 36.0, 53.0, 69.0, 83.0, 73.0, 72.0, 88.0, 74.0, 71.0, 63.0, 51.0, 36.0, 43.0, 32.0, 17.0, 11.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26904296875, -0.2606468200683594, -0.25225067138671875, -0.24385452270507812, -0.2354583740234375, -0.22706222534179688, -0.21866607666015625, -0.21026992797851562, -0.201873779296875, -0.19347763061523438, -0.18508148193359375, -0.17668533325195312, -0.1682891845703125, -0.15989303588867188, -0.15149688720703125, -0.14310073852539062, -0.13470458984375, -0.12630844116210938, -0.11791229248046875, -0.10951614379882812, -0.1011199951171875, -0.09272384643554688, -0.08432769775390625, -0.07593154907226562, -0.067535400390625, -0.059139251708984375, -0.05074310302734375, -0.042346954345703125, -0.0339508056640625, -0.025554656982421875, -0.01715850830078125, -0.008762359619140625, -0.0003662109375, 0.008029937744140625, 0.01642608642578125, 0.024822235107421875, 0.0332183837890625, 0.041614532470703125, 0.05001068115234375, 0.058406829833984375, 0.066802978515625, 0.07519912719726562, 0.08359527587890625, 0.09199142456054688, 0.1003875732421875, 0.10878372192382812, 0.11717987060546875, 0.12557601928710938, 0.13397216796875, 0.14236831665039062, 0.15076446533203125, 0.15916061401367188, 0.1675567626953125, 0.17595291137695312, 0.18434906005859375, 0.19274520874023438, 0.201141357421875, 0.20953750610351562, 0.21793365478515625, 0.22632980346679688, 0.2347259521484375, 0.24312210083007812, 0.25151824951171875, 0.2599143981933594, 0.268310546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 13.0, 17.0, 18.0, 29.0, 42.0, 59.0, 99.0, 147.0, 255.0, 462.0, 671.0, 1218.0, 2302.0, 5021.0, 13952.0, 63936.0, 3916653.0, 154351.0, 21495.0, 6880.0, 2967.0, 1492.0, 854.0, 508.0, 286.0, 188.0, 98.0, 70.0, 38.0, 31.0, 24.0, 18.0, 14.0, 12.0, 13.0, 5.0, 4.0, 5.0, 3.0, 5.0, 1.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.86279296875, -0.8337173461914062, -0.8046417236328125, -0.7755661010742188, -0.746490478515625, -0.7174148559570312, -0.6883392333984375, -0.6592636108398438, -0.63018798828125, -0.6011123657226562, -0.5720367431640625, -0.5429611206054688, -0.513885498046875, -0.48480987548828125, -0.4557342529296875, -0.42665863037109375, -0.3975830078125, -0.36850738525390625, -0.3394317626953125, -0.31035614013671875, -0.281280517578125, -0.25220489501953125, -0.2231292724609375, -0.19405364990234375, -0.16497802734375, -0.13590240478515625, -0.1068267822265625, -0.07775115966796875, -0.048675537109375, -0.01959991455078125, 0.0094757080078125, 0.03855133056640625, 0.067626953125, 0.09670257568359375, 0.1257781982421875, 0.15485382080078125, 0.183929443359375, 0.21300506591796875, 0.2420806884765625, 0.27115631103515625, 0.30023193359375, 0.32930755615234375, 0.3583831787109375, 0.38745880126953125, 0.416534423828125, 0.44561004638671875, 0.4746856689453125, 0.5037612915039062, 0.5328369140625, 0.5619125366210938, 0.5909881591796875, 0.6200637817382812, 0.649139404296875, 0.6782150268554688, 0.7072906494140625, 0.7363662719726562, 0.76544189453125, 0.7945175170898438, 0.8235931396484375, 0.8526687622070312, 0.881744384765625, 0.9108200073242188, 0.9398956298828125, 0.9689712524414062, 0.998046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 15.0, 22.0, 40.0, 97.0, 2787.0, 917.0, 96.0, 38.0, 20.0, 15.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1929931640625, -0.1828136444091797, -0.17263412475585938, -0.16245460510253906, -0.15227508544921875, -0.14209556579589844, -0.13191604614257812, -0.12173652648925781, -0.1115570068359375, -0.10137748718261719, -0.09119796752929688, -0.08101844787597656, -0.07083892822265625, -0.06065940856933594, -0.050479888916015625, -0.04030036926269531, -0.030120849609375, -0.019941329956054688, -0.009761810302734375, 0.0004177093505859375, 0.01059722900390625, 0.020776748657226562, 0.030956268310546875, 0.04113578796386719, 0.0513153076171875, 0.06149482727050781, 0.07167434692382812, 0.08185386657714844, 0.09203338623046875, 0.10221290588378906, 0.11239242553710938, 0.12257194519042969, 0.13275146484375, 0.1429309844970703, 0.15311050415039062, 0.16329002380371094, 0.17346954345703125, 0.18364906311035156, 0.19382858276367188, 0.2040081024169922, 0.2141876220703125, 0.2243671417236328, 0.23454666137695312, 0.24472618103027344, 0.25490570068359375, 0.26508522033691406, 0.2752647399902344, 0.2854442596435547, 0.295623779296875, 0.3058032989501953, 0.3159828186035156, 0.32616233825683594, 0.33634185791015625, 0.34652137756347656, 0.3567008972167969, 0.3668804168701172, 0.3770599365234375, 0.3872394561767578, 0.3974189758300781, 0.40759849548339844, 0.41777801513671875, 0.42795753479003906, 0.4381370544433594, 0.4483165740966797, 0.45849609375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 18.0, 33.0, 61.0, 138.0, 207.0, 236.0, 155.0, 97.0, 30.0, 11.0, 12.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.230276107788086, -2.186631441116333, -2.142986536026001, -2.099341869354248, -2.055697202682495, -2.012052297592163, -1.9684076309204102, -1.9247629642486572, -1.8811181783676147, -1.8374733924865723, -1.7938287258148193, -1.7501839399337769, -1.7065391540527344, -1.6628944873809814, -1.619249701499939, -1.5756049156188965, -1.5319602489471436, -1.488315463066101, -1.4446707963943481, -1.4010260105133057, -1.3573813438415527, -1.3137365579605103, -1.2700917720794678, -1.2264471054077148, -1.1828023195266724, -1.1391575336456299, -1.095512866973877, -1.0518680810928345, -1.008223295211792, -0.9645786285400391, -0.9209338426589966, -0.8772891163825989, -0.8336445093154907, -0.789999783039093, -0.7463550567626953, -0.7027102708816528, -0.6590655446052551, -0.6154208183288574, -0.5717760324478149, -0.5281313061714172, -0.48448657989501953, -0.4408418536186218, -0.39719709753990173, -0.35355234146118164, -0.30990761518478394, -0.26626288890838623, -0.22261813282966614, -0.17897337675094604, -0.13532865047454834, -0.09168390929698944, -0.04803916811943054, -0.004394426941871643, 0.039250314235687256, 0.08289505541324615, 0.12653979659080505, 0.17018455266952515, 0.21382927894592285, 0.25747400522232056, 0.30111876130104065, 0.34476351737976074, 0.38840824365615845, 0.43205296993255615, 0.47569772601127625, 0.5193424820899963, 0.562987208366394]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 2.0, 8.0, 11.0, 7.0, 18.0, 11.0, 9.0, 25.0, 19.0, 27.0, 27.0, 31.0, 38.0, 38.0, 35.0, 45.0, 35.0, 54.0, 47.0, 41.0, 43.0, 48.0, 37.0, 49.0, 31.0, 32.0, 45.0, 35.0, 14.0, 24.0, 18.0, 20.0, 14.0, 7.0, 9.0, 10.0, 5.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3721722960472107, -0.3590085208415985, -0.34584471583366394, -0.33268094062805176, -0.3195171356201172, -0.306353360414505, -0.2931895852088928, -0.28002578020095825, -0.2668619751930237, -0.2536981999874115, -0.24053439497947693, -0.22737061977386475, -0.21420681476593018, -0.201043039560318, -0.18787924945354462, -0.17471545934677124, -0.16155168414115906, -0.14838789403438568, -0.1352241039276123, -0.12206032127141953, -0.10889653116464615, -0.09573274105787277, -0.08256895840167999, -0.06940516829490662, -0.05624137818813324, -0.04307758808135986, -0.029913801699876785, -0.016750015318393707, -0.003586225211620331, 0.009577564895153046, 0.022741347551345825, 0.0359051376581192, 0.04906892776489258, 0.062232717871665955, 0.07539650797843933, 0.08856029063463211, 0.10172408074140549, 0.11488787084817886, 0.12805165350437164, 0.14121544361114502, 0.1543792337179184, 0.16754302382469177, 0.18070681393146515, 0.19387060403823853, 0.2070343792438507, 0.22019818425178528, 0.23336195945739746, 0.24652574956417084, 0.2596895396709442, 0.2728533148765564, 0.28601711988449097, 0.29918089509010315, 0.3123447000980377, 0.3255084753036499, 0.3386722803115845, 0.35183605551719666, 0.36499983072280884, 0.378163605928421, 0.3913274109363556, 0.4044911861419678, 0.41765499114990234, 0.4308187663555145, 0.4439825415611267, 0.4571463465690613, 0.47031015157699585]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 0.0, 2.0, 10.0, 11.0, 13.0, 21.0, 37.0, 42.0, 76.0, 123.0, 215.0, 354.0, 707.0, 1599.0, 3896.0, 11599.0, 37594.0, 125948.0, 327696.0, 340876.0, 136551.0, 41020.0, 12400.0, 4305.0, 1731.0, 756.0, 386.0, 213.0, 128.0, 85.0, 50.0, 31.0, 28.0, 9.0, 13.0, 10.0, 8.0, 4.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6611328125, -0.6404953002929688, -0.6198577880859375, -0.5992202758789062, -0.578582763671875, -0.5579452514648438, -0.5373077392578125, -0.5166702270507812, -0.49603271484375, -0.47539520263671875, -0.4547576904296875, -0.43412017822265625, -0.413482666015625, -0.39284515380859375, -0.3722076416015625, -0.35157012939453125, -0.3309326171875, -0.31029510498046875, -0.2896575927734375, -0.26902008056640625, -0.248382568359375, -0.22774505615234375, -0.2071075439453125, -0.18647003173828125, -0.16583251953125, -0.14519500732421875, -0.1245574951171875, -0.10391998291015625, -0.083282470703125, -0.06264495849609375, -0.0420074462890625, -0.02136993408203125, -0.000732421875, 0.01990509033203125, 0.0405426025390625, 0.06118011474609375, 0.081817626953125, 0.10245513916015625, 0.1230926513671875, 0.14373016357421875, 0.16436767578125, 0.18500518798828125, 0.2056427001953125, 0.22628021240234375, 0.246917724609375, 0.26755523681640625, 0.2881927490234375, 0.30883026123046875, 0.3294677734375, 0.35010528564453125, 0.3707427978515625, 0.39138031005859375, 0.412017822265625, 0.43265533447265625, 0.4532928466796875, 0.47393035888671875, 0.49456787109375, 0.5152053833007812, 0.5358428955078125, 0.5564804077148438, 0.577117919921875, 0.5977554321289062, 0.6183929443359375, 0.6390304565429688, 0.65966796875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 7.0, 13.0, 20.0, 17.0, 28.0, 44.0, 37.0, 52.0, 43.0, 71.0, 73.0, 81.0, 69.0, 86.0, 58.0, 61.0, 53.0, 50.0, 20.0, 34.0, 28.0, 13.0, 14.0, 10.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27197265625, -0.2635307312011719, -0.25508880615234375, -0.24664688110351562, -0.2382049560546875, -0.22976303100585938, -0.22132110595703125, -0.21287918090820312, -0.204437255859375, -0.19599533081054688, -0.18755340576171875, -0.17911148071289062, -0.1706695556640625, -0.16222763061523438, -0.15378570556640625, -0.14534378051757812, -0.13690185546875, -0.12845993041992188, -0.12001800537109375, -0.11157608032226562, -0.1031341552734375, -0.09469223022460938, -0.08625030517578125, -0.07780838012695312, -0.069366455078125, -0.060924530029296875, -0.05248260498046875, -0.044040679931640625, -0.0355987548828125, -0.027156829833984375, -0.01871490478515625, -0.010272979736328125, -0.0018310546875, 0.006610870361328125, 0.01505279541015625, 0.023494720458984375, 0.0319366455078125, 0.040378570556640625, 0.04882049560546875, 0.057262420654296875, 0.065704345703125, 0.07414627075195312, 0.08258819580078125, 0.09103012084960938, 0.0994720458984375, 0.10791397094726562, 0.11635589599609375, 0.12479782104492188, 0.13323974609375, 0.14168167114257812, 0.15012359619140625, 0.15856552124023438, 0.1670074462890625, 0.17544937133789062, 0.18389129638671875, 0.19233322143554688, 0.200775146484375, 0.20921707153320312, 0.21765899658203125, 0.22610092163085938, 0.2345428466796875, 0.24298477172851562, 0.25142669677734375, 0.2598686218261719, 0.268310546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 9.0, 5.0, 10.0, 17.0, 38.0, 31.0, 50.0, 78.0, 163.0, 305.0, 633.0, 1581.0, 5011.0, 21695.0, 133127.0, 591421.0, 244889.0, 37935.0, 7670.0, 2174.0, 836.0, 363.0, 204.0, 118.0, 64.0, 44.0, 28.0, 11.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8779296875, -0.845001220703125, -0.81207275390625, -0.779144287109375, -0.7462158203125, -0.713287353515625, -0.68035888671875, -0.647430419921875, -0.614501953125, -0.581573486328125, -0.54864501953125, -0.515716552734375, -0.4827880859375, -0.449859619140625, -0.41693115234375, -0.384002685546875, -0.35107421875, -0.318145751953125, -0.28521728515625, -0.252288818359375, -0.2193603515625, -0.186431884765625, -0.15350341796875, -0.120574951171875, -0.087646484375, -0.054718017578125, -0.02178955078125, 0.011138916015625, 0.0440673828125, 0.076995849609375, 0.10992431640625, 0.142852783203125, 0.17578125, 0.208709716796875, 0.24163818359375, 0.274566650390625, 0.3074951171875, 0.340423583984375, 0.37335205078125, 0.406280517578125, 0.439208984375, 0.472137451171875, 0.50506591796875, 0.537994384765625, 0.5709228515625, 0.603851318359375, 0.63677978515625, 0.669708251953125, 0.70263671875, 0.735565185546875, 0.76849365234375, 0.801422119140625, 0.8343505859375, 0.867279052734375, 0.90020751953125, 0.933135986328125, 0.966064453125, 0.998992919921875, 1.03192138671875, 1.064849853515625, 1.0977783203125, 1.130706787109375, 1.16363525390625, 1.196563720703125, 1.2294921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 6.0, 9.0, 12.0, 4.0, 7.0, 9.0, 18.0, 33.0, 17.0, 37.0, 21.0, 33.0, 34.0, 44.0, 36.0, 31.0, 58.0, 36.0, 54.0, 47.0, 37.0, 55.0, 50.0, 32.0, 45.0, 32.0, 41.0, 30.0, 32.0, 21.0, 15.0, 15.0, 16.0, 9.0, 6.0, 4.0, 6.0, 6.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0048828125, -0.971282958984375, -0.93768310546875, -0.904083251953125, -0.8704833984375, -0.836883544921875, -0.80328369140625, -0.769683837890625, -0.736083984375, -0.702484130859375, -0.66888427734375, -0.635284423828125, -0.6016845703125, -0.568084716796875, -0.53448486328125, -0.500885009765625, -0.46728515625, -0.433685302734375, -0.40008544921875, -0.366485595703125, -0.3328857421875, -0.299285888671875, -0.26568603515625, -0.232086181640625, -0.198486328125, -0.164886474609375, -0.13128662109375, -0.097686767578125, -0.0640869140625, -0.030487060546875, 0.00311279296875, 0.036712646484375, 0.0703125, 0.103912353515625, 0.13751220703125, 0.171112060546875, 0.2047119140625, 0.238311767578125, 0.27191162109375, 0.305511474609375, 0.339111328125, 0.372711181640625, 0.40631103515625, 0.439910888671875, 0.4735107421875, 0.507110595703125, 0.54071044921875, 0.574310302734375, 0.60791015625, 0.641510009765625, 0.67510986328125, 0.708709716796875, 0.7423095703125, 0.775909423828125, 0.80950927734375, 0.843109130859375, 0.876708984375, 0.910308837890625, 0.94390869140625, 0.977508544921875, 1.0111083984375, 1.044708251953125, 1.07830810546875, 1.111907958984375, 1.1455078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 16.0, 24.0, 38.0, 92.0, 229.0, 504.0, 1921.0, 21454.0, 968124.0, 52081.0, 2914.0, 680.0, 247.0, 96.0, 58.0, 32.0, 15.0, 9.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.83203125, -2.76397705078125, -2.6959228515625, -2.62786865234375, -2.559814453125, -2.49176025390625, -2.4237060546875, -2.35565185546875, -2.28759765625, -2.21954345703125, -2.1514892578125, -2.08343505859375, -2.015380859375, -1.94732666015625, -1.8792724609375, -1.81121826171875, -1.7431640625, -1.67510986328125, -1.6070556640625, -1.53900146484375, -1.470947265625, -1.40289306640625, -1.3348388671875, -1.26678466796875, -1.19873046875, -1.13067626953125, -1.0626220703125, -0.99456787109375, -0.926513671875, -0.85845947265625, -0.7904052734375, -0.72235107421875, -0.654296875, -0.58624267578125, -0.5181884765625, -0.45013427734375, -0.382080078125, -0.31402587890625, -0.2459716796875, -0.17791748046875, -0.10986328125, -0.04180908203125, 0.0262451171875, 0.09429931640625, 0.162353515625, 0.23040771484375, 0.2984619140625, 0.36651611328125, 0.4345703125, 0.50262451171875, 0.5706787109375, 0.63873291015625, 0.706787109375, 0.77484130859375, 0.8428955078125, 0.91094970703125, 0.97900390625, 1.04705810546875, 1.1151123046875, 1.18316650390625, 1.251220703125, 1.31927490234375, 1.3873291015625, 1.45538330078125, 1.5234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 18.0, 11.0, 21.0, 31.0, 51.0, 64.0, 92.0, 134.0, 137.0, 139.0, 98.0, 72.0, 46.0, 33.0, 17.0, 22.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019347667694091797, -0.0001862887293100357, -0.00017910078167915344, -0.00017191283404827118, -0.00016472488641738892, -0.00015753693878650665, -0.0001503489911556244, -0.00014316104352474213, -0.00013597309589385986, -0.0001287851482629776, -0.00012159720063209534, -0.00011440925300121307, -0.00010722130537033081, -0.00010003335773944855, -9.284541010856628e-05, -8.565746247768402e-05, -7.846951484680176e-05, -7.12815672159195e-05, -6.409361958503723e-05, -5.690567195415497e-05, -4.9717724323272705e-05, -4.252977669239044e-05, -3.534182906150818e-05, -2.8153881430625916e-05, -2.0965933799743652e-05, -1.377798616886139e-05, -6.590038537979126e-06, 5.979090929031372e-07, 7.7858567237854e-06, 1.4973804354667664e-05, 2.2161751985549927e-05, 2.934969961643219e-05, 3.653764724731445e-05, 4.3725594878196716e-05, 5.091354250907898e-05, 5.810149013996124e-05, 6.52894377708435e-05, 7.247738540172577e-05, 7.966533303260803e-05, 8.68532806634903e-05, 9.404122829437256e-05, 0.00010122917592525482, 0.00010841712355613708, 0.00011560507118701935, 0.0001227930188179016, 0.00012998096644878387, 0.00013716891407966614, 0.0001443568617105484, 0.00015154480934143066, 0.00015873275697231293, 0.0001659207046031952, 0.00017310865223407745, 0.00018029659986495972, 0.00018748454749584198, 0.00019467249512672424, 0.0002018604427576065, 0.00020904839038848877, 0.00021623633801937103, 0.0002234242856502533, 0.00023061223328113556, 0.00023780018091201782, 0.0002449881285429001, 0.00025217607617378235, 0.0002593640238046646, 0.0002665519714355469]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 17.0, 26.0, 28.0, 52.0, 120.0, 221.0, 621.0, 2740.0, 33137.0, 916818.0, 88921.0, 4406.0, 877.0, 291.0, 117.0, 51.0, 34.0, 19.0, 15.0, 11.0, 12.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0625, -1.0175323486328125, -0.972564697265625, -0.9275970458984375, -0.88262939453125, -0.8376617431640625, -0.792694091796875, -0.7477264404296875, -0.7027587890625, -0.6577911376953125, -0.612823486328125, -0.5678558349609375, -0.52288818359375, -0.4779205322265625, -0.432952880859375, -0.3879852294921875, -0.343017578125, -0.2980499267578125, -0.253082275390625, -0.2081146240234375, -0.16314697265625, -0.1181793212890625, -0.073211669921875, -0.0282440185546875, 0.0167236328125, 0.0616912841796875, 0.106658935546875, 0.1516265869140625, 0.19659423828125, 0.2415618896484375, 0.286529541015625, 0.3314971923828125, 0.37646484375, 0.4214324951171875, 0.466400146484375, 0.5113677978515625, 0.55633544921875, 0.6013031005859375, 0.646270751953125, 0.6912384033203125, 0.7362060546875, 0.7811737060546875, 0.826141357421875, 0.8711090087890625, 0.91607666015625, 0.9610443115234375, 1.006011962890625, 1.0509796142578125, 1.095947265625, 1.1409149169921875, 1.185882568359375, 1.2308502197265625, 1.27581787109375, 1.3207855224609375, 1.365753173828125, 1.4107208251953125, 1.4556884765625, 1.5006561279296875, 1.545623779296875, 1.5905914306640625, 1.63555908203125, 1.6805267333984375, 1.725494384765625, 1.7704620361328125, 1.8154296875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 9.0, 21.0, 34.0, 66.0, 107.0, 149.0, 171.0, 164.0, 103.0, 65.0, 37.0, 18.0, 14.0, 12.0, 8.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4638671875, -1.4173736572265625, -1.370880126953125, -1.3243865966796875, -1.27789306640625, -1.2313995361328125, -1.184906005859375, -1.1384124755859375, -1.0919189453125, -1.0454254150390625, -0.998931884765625, -0.9524383544921875, -0.90594482421875, -0.8594512939453125, -0.812957763671875, -0.7664642333984375, -0.719970703125, -0.6734771728515625, -0.626983642578125, -0.5804901123046875, -0.53399658203125, -0.4875030517578125, -0.441009521484375, -0.3945159912109375, -0.3480224609375, -0.3015289306640625, -0.255035400390625, -0.2085418701171875, -0.16204833984375, -0.1155548095703125, -0.069061279296875, -0.0225677490234375, 0.02392578125, 0.0704193115234375, 0.116912841796875, 0.1634063720703125, 0.20989990234375, 0.2563934326171875, 0.302886962890625, 0.3493804931640625, 0.3958740234375, 0.4423675537109375, 0.488861083984375, 0.5353546142578125, 0.58184814453125, 0.6283416748046875, 0.674835205078125, 0.7213287353515625, 0.767822265625, 0.8143157958984375, 0.860809326171875, 0.9073028564453125, 0.95379638671875, 1.0002899169921875, 1.046783447265625, 1.0932769775390625, 1.1397705078125, 1.1862640380859375, 1.232757568359375, 1.2792510986328125, 1.32574462890625, 1.3722381591796875, 1.418731689453125, 1.4652252197265625, 1.51171875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 13.0, 25.0, 37.0, 102.0, 119.0, 185.0, 190.0, 137.0, 89.0, 46.0, 25.0, 12.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.667972564697266, -12.285761833190918, -11.903550148010254, -11.521339416503906, -11.139127731323242, -10.756916999816895, -10.374706268310547, -9.992494583129883, -9.610283851623535, -9.228073120117188, -8.845861434936523, -8.463650703430176, -8.081439971923828, -7.699228286743164, -7.317017555236816, -6.9348063468933105, -6.552595138549805, -6.170383930206299, -5.788172721862793, -5.405961990356445, -5.0237507820129395, -4.641539573669434, -4.259328842163086, -3.87711763381958, -3.494906425476074, -3.1126952171325684, -2.7304842472076416, -2.348273277282715, -1.966062068939209, -1.5838509798049927, -1.2016398906707764, -0.8194289207458496, -0.43721771240234375, -0.05500662326812744, 0.32720446586608887, 0.7094155550003052, 1.0916266441345215, 1.4738377332687378, 1.856048822402954, 2.238259792327881, 2.6204710006713867, 3.0026822090148926, 3.3848931789398193, 3.767104148864746, 4.149315357208252, 4.531526565551758, 4.9137372970581055, 5.295948505401611, 5.678159713745117, 6.060370922088623, 6.442582130432129, 6.824792861938477, 7.207004070281982, 7.589215278625488, 7.971426010131836, 8.3536376953125, 8.735848426818848, 9.118059158325195, 9.50027084350586, 9.882481575012207, 10.264692306518555, 10.646903991699219, 11.029114723205566, 11.411325454711914, 11.793537139892578]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 8.0, 8.0, 14.0, 16.0, 19.0, 21.0, 20.0, 37.0, 22.0, 28.0, 30.0, 47.0, 56.0, 55.0, 53.0, 39.0, 48.0, 54.0, 42.0, 53.0, 37.0, 24.0, 34.0, 30.0, 29.0, 24.0, 18.0, 22.0, 17.0, 12.0, 11.0, 15.0, 9.0, 8.0, 7.0, 4.0, 6.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.865495204925537, -4.699230194091797, -4.532965660095215, -4.366700649261475, -4.200435638427734, -4.034171104431152, -3.867906093597412, -3.701641321182251, -3.53537654876709, -3.3691117763519287, -3.2028470039367676, -3.0365819931030273, -2.870317220687866, -2.704052448272705, -2.537787437438965, -2.3715226650238037, -2.2052578926086426, -2.0389931201934814, -1.8727282285690308, -1.70646333694458, -1.540198564529419, -1.3739337921142578, -1.2076689004898071, -1.0414040088653564, -0.8751392364501953, -0.7088744044303894, -0.5426095724105835, -0.3763447403907776, -0.21007990837097168, -0.04381507635116577, 0.12244975566864014, 0.2887146472930908, 0.45497989654541016, 0.6212447285652161, 0.787509560585022, 0.9537743926048279, 1.1200392246246338, 1.286303997039795, 1.4525688886642456, 1.6188337802886963, 1.7850985527038574, 1.9513633251190186, 2.1176280975341797, 2.28389310836792, 2.450157880783081, 2.616422653198242, 2.7826876640319824, 2.9489524364471436, 3.1152172088623047, 3.281481981277466, 3.447746753692627, 3.614011764526367, 3.7802765369415283, 3.9465413093566895, 4.11280632019043, 4.279070854187012, 4.445335865020752, 4.611600875854492, 4.777865409851074, 4.9441304206848145, 5.110395431518555, 5.276659965515137, 5.442924976348877, 5.609189987182617, 5.775454521179199]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 5.0, 12.0, 12.0, 27.0, 46.0, 87.0, 236.0, 526.0, 1580.0, 5741.0, 37047.0, 3994146.0, 138902.0, 11619.0, 2716.0, 872.0, 351.0, 169.0, 62.0, 41.0, 28.0, 24.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2255859375, -1.1739044189453125, -1.122222900390625, -1.0705413818359375, -1.01885986328125, -0.9671783447265625, -0.915496826171875, -0.8638153076171875, -0.8121337890625, -0.7604522705078125, -0.708770751953125, -0.6570892333984375, -0.60540771484375, -0.5537261962890625, -0.502044677734375, -0.4503631591796875, -0.398681640625, -0.3470001220703125, -0.295318603515625, -0.2436370849609375, -0.19195556640625, -0.1402740478515625, -0.088592529296875, -0.0369110107421875, 0.0147705078125, 0.0664520263671875, 0.118133544921875, 0.1698150634765625, 0.22149658203125, 0.2731781005859375, 0.324859619140625, 0.3765411376953125, 0.42822265625, 0.4799041748046875, 0.531585693359375, 0.5832672119140625, 0.63494873046875, 0.6866302490234375, 0.738311767578125, 0.7899932861328125, 0.8416748046875, 0.8933563232421875, 0.945037841796875, 0.9967193603515625, 1.04840087890625, 1.1000823974609375, 1.151763916015625, 1.2034454345703125, 1.255126953125, 1.3068084716796875, 1.358489990234375, 1.4101715087890625, 1.46185302734375, 1.5135345458984375, 1.565216064453125, 1.6168975830078125, 1.6685791015625, 1.7202606201171875, 1.771942138671875, 1.8236236572265625, 1.87530517578125, 1.9269866943359375, 1.978668212890625, 2.0303497314453125, 2.08203125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 14.0, 13.0, 25.0, 32.0, 31.0, 47.0, 32.0, 48.0, 46.0, 72.0, 68.0, 82.0, 62.0, 57.0, 64.0, 46.0, 47.0, 47.0, 26.0, 27.0, 20.0, 23.0, 13.0, 11.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.286865234375, -0.2781219482421875, -0.269378662109375, -0.2606353759765625, -0.25189208984375, -0.2431488037109375, -0.234405517578125, -0.2256622314453125, -0.2169189453125, -0.2081756591796875, -0.199432373046875, -0.1906890869140625, -0.18194580078125, -0.1732025146484375, -0.164459228515625, -0.1557159423828125, -0.14697265625, -0.1382293701171875, -0.129486083984375, -0.1207427978515625, -0.11199951171875, -0.1032562255859375, -0.094512939453125, -0.0857696533203125, -0.0770263671875, -0.0682830810546875, -0.059539794921875, -0.0507965087890625, -0.04205322265625, -0.0333099365234375, -0.024566650390625, -0.0158233642578125, -0.007080078125, 0.0016632080078125, 0.010406494140625, 0.0191497802734375, 0.02789306640625, 0.0366363525390625, 0.045379638671875, 0.0541229248046875, 0.0628662109375, 0.0716094970703125, 0.080352783203125, 0.0890960693359375, 0.09783935546875, 0.1065826416015625, 0.115325927734375, 0.1240692138671875, 0.1328125, 0.1415557861328125, 0.150299072265625, 0.1590423583984375, 0.16778564453125, 0.1765289306640625, 0.185272216796875, 0.1940155029296875, 0.2027587890625, 0.2115020751953125, 0.220245361328125, 0.2289886474609375, 0.23773193359375, 0.2464752197265625, 0.255218505859375, 0.2639617919921875, 0.272705078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 9.0, 10.0, 17.0, 17.0, 25.0, 39.0, 49.0, 76.0, 115.0, 145.0, 208.0, 304.0, 444.0, 598.0, 925.0, 1383.0, 2270.0, 3587.0, 6167.0, 11823.0, 25267.0, 68059.0, 314410.0, 3466621.0, 194881.0, 51919.0, 20764.0, 10018.0, 5279.0, 3014.0, 1991.0, 1247.0, 839.0, 548.0, 357.0, 246.0, 177.0, 112.0, 85.0, 63.0, 56.0, 30.0, 25.0, 20.0, 12.0, 14.0, 5.0, 6.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.53857421875, -0.520843505859375, -0.50311279296875, -0.485382080078125, -0.4676513671875, -0.449920654296875, -0.43218994140625, -0.414459228515625, -0.396728515625, -0.378997802734375, -0.36126708984375, -0.343536376953125, -0.3258056640625, -0.308074951171875, -0.29034423828125, -0.272613525390625, -0.2548828125, -0.237152099609375, -0.21942138671875, -0.201690673828125, -0.1839599609375, -0.166229248046875, -0.14849853515625, -0.130767822265625, -0.113037109375, -0.095306396484375, -0.07757568359375, -0.059844970703125, -0.0421142578125, -0.024383544921875, -0.00665283203125, 0.011077880859375, 0.02880859375, 0.046539306640625, 0.06427001953125, 0.082000732421875, 0.0997314453125, 0.117462158203125, 0.13519287109375, 0.152923583984375, 0.170654296875, 0.188385009765625, 0.20611572265625, 0.223846435546875, 0.2415771484375, 0.259307861328125, 0.27703857421875, 0.294769287109375, 0.3125, 0.330230712890625, 0.34796142578125, 0.365692138671875, 0.3834228515625, 0.401153564453125, 0.41888427734375, 0.436614990234375, 0.454345703125, 0.472076416015625, 0.48980712890625, 0.507537841796875, 0.5252685546875, 0.542999267578125, 0.56072998046875, 0.578460693359375, 0.59619140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 10.0, 12.0, 10.0, 30.0, 27.0, 44.0, 65.0, 161.0, 391.0, 2691.0, 332.0, 132.0, 66.0, 29.0, 20.0, 10.0, 8.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258056640625, -0.24957656860351562, -0.24109649658203125, -0.23261642456054688, -0.2241363525390625, -0.21565628051757812, -0.20717620849609375, -0.19869613647460938, -0.190216064453125, -0.18173599243164062, -0.17325592041015625, -0.16477584838867188, -0.1562957763671875, -0.14781570434570312, -0.13933563232421875, -0.13085556030273438, -0.12237548828125, -0.11389541625976562, -0.10541534423828125, -0.09693527221679688, -0.0884552001953125, -0.07997512817382812, -0.07149505615234375, -0.06301498413085938, -0.054534912109375, -0.046054840087890625, -0.03757476806640625, -0.029094696044921875, -0.0206146240234375, -0.012134552001953125, -0.00365447998046875, 0.004825592041015625, 0.0133056640625, 0.021785736083984375, 0.03026580810546875, 0.038745880126953125, 0.0472259521484375, 0.055706024169921875, 0.06418609619140625, 0.07266616821289062, 0.081146240234375, 0.08962631225585938, 0.09810638427734375, 0.10658645629882812, 0.1150665283203125, 0.12354660034179688, 0.13202667236328125, 0.14050674438476562, 0.14898681640625, 0.15746688842773438, 0.16594696044921875, 0.17442703247070312, 0.1829071044921875, 0.19138717651367188, 0.19986724853515625, 0.20834732055664062, 0.216827392578125, 0.22530746459960938, 0.23378753662109375, 0.24226760864257812, 0.2507476806640625, 0.2592277526855469, 0.26770782470703125, 0.2761878967285156, 0.28466796875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 13.0, 62.0, 437.0, 433.0, 54.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.496169924736023, -1.3140807151794434, -1.1319915056228638, -0.949902355670929, -0.7678131461143494, -0.5857239365577698, -0.40363478660583496, -0.22154557704925537, -0.03945636749267578, 0.14263282716274261, 0.324722021818161, 0.5068112015724182, 0.6889004111289978, 0.8709896206855774, 1.0530787706375122, 1.2351679801940918, 1.4172571897506714, 1.599346399307251, 1.7814356088638306, 1.9635248184204102, 2.1456139087677, 2.3277032375335693, 2.5097923278808594, 2.6918816566467285, 2.8739707469940186, 3.0560598373413086, 3.2381491661071777, 3.4202382564544678, 3.602327585220337, 3.784416675567627, 3.966506004333496, 4.148594856262207, 4.330684185028076, 4.512773513793945, 4.694862365722656, 4.876951694488525, 5.0590410232543945, 5.241130352020264, 5.423219203948975, 5.605308532714844, 5.787397861480713, 5.969487190246582, 6.151576042175293, 6.333665370941162, 6.515754699707031, 6.6978440284729, 6.879932880401611, 7.0620222091674805, 7.244111061096191, 7.4262003898620605, 7.6082892417907715, 7.790378570556641, 7.97246789932251, 8.154557228088379, 8.33664608001709, 8.518735885620117, 8.700824737548828, 8.882913589477539, 9.065003395080566, 9.247092247009277, 9.429181098937988, 9.611270904541016, 9.793359756469727, 9.975448608398438, 10.157538414001465]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 9.0, 3.0, 11.0, 8.0, 9.0, 12.0, 10.0, 18.0, 21.0, 35.0, 24.0, 37.0, 29.0, 29.0, 39.0, 32.0, 42.0, 37.0, 40.0, 30.0, 42.0, 30.0, 37.0, 36.0, 35.0, 27.0, 26.0, 34.0, 34.0, 25.0, 16.0, 22.0, 18.0, 15.0, 13.0, 12.0, 17.0, 9.0, 11.0, 11.0, 7.0, 3.0, 6.0, 8.0, 4.0, 3.0, 2.0, 5.0, 5.0, 0.0, 3.0, 2.0], "bins": [-0.6169381737709045, -0.5983559489250183, -0.5797737836837769, -0.5611915588378906, -0.5426093339920044, -0.5240271091461182, -0.5054449439048767, -0.4868627190589905, -0.46828052401542664, -0.4496983289718628, -0.43111610412597656, -0.4125339090824127, -0.3939517140388489, -0.37536948919296265, -0.3567872941493988, -0.33820509910583496, -0.31962287425994873, -0.3010406792163849, -0.28245845437049866, -0.2638762593269348, -0.24529404938220978, -0.22671183943748474, -0.2081296443939209, -0.18954743444919586, -0.17096522450447083, -0.1523830145597458, -0.13380080461502075, -0.11521860957145691, -0.09663639962673187, -0.07805418968200684, -0.059471987187862396, -0.04088978469371796, -0.022307515144348145, -0.0037253089249134064, 0.014856897294521332, 0.03343910351395607, 0.05202130973339081, 0.07060351967811584, 0.08918572217226028, 0.10776792466640472, 0.12635013461112976, 0.1449323445558548, 0.16351455450057983, 0.18209674954414368, 0.2006789594888687, 0.21926116943359375, 0.2378433644771576, 0.25642555952072144, 0.27500778436660767, 0.2935899794101715, 0.31217220425605774, 0.3307543992996216, 0.3493366241455078, 0.36791881918907166, 0.3865010142326355, 0.40508323907852173, 0.42366543412208557, 0.4422476291656494, 0.46082985401153564, 0.4794120490550995, 0.49799424409866333, 0.5165764689445496, 0.5351586937904358, 0.5537408590316772, 0.5723230838775635]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 24.0, 21.0, 38.0, 52.0, 88.0, 145.0, 226.0, 391.0, 728.0, 1449.0, 2899.0, 6961.0, 17046.0, 45485.0, 121144.0, 264252.0, 310132.0, 169206.0, 65818.0, 24735.0, 9658.0, 4007.0, 1915.0, 945.0, 484.0, 290.0, 145.0, 79.0, 57.0, 44.0, 20.0, 16.0, 14.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.55517578125, -0.5389366149902344, -0.5226974487304688, -0.5064582824707031, -0.4902191162109375, -0.4739799499511719, -0.45774078369140625, -0.4415016174316406, -0.425262451171875, -0.4090232849121094, -0.39278411865234375, -0.3765449523925781, -0.3603057861328125, -0.3440666198730469, -0.32782745361328125, -0.3115882873535156, -0.29534912109375, -0.2791099548339844, -0.26287078857421875, -0.24663162231445312, -0.2303924560546875, -0.21415328979492188, -0.19791412353515625, -0.18167495727539062, -0.165435791015625, -0.14919662475585938, -0.13295745849609375, -0.11671829223632812, -0.1004791259765625, -0.08423995971679688, -0.06800079345703125, -0.051761627197265625, -0.0355224609375, -0.019283294677734375, -0.00304412841796875, 0.013195037841796875, 0.0294342041015625, 0.045673370361328125, 0.06191253662109375, 0.07815170288085938, 0.094390869140625, 0.11063003540039062, 0.12686920166015625, 0.14310836791992188, 0.1593475341796875, 0.17558670043945312, 0.19182586669921875, 0.20806503295898438, 0.22430419921875, 0.24054336547851562, 0.25678253173828125, 0.2730216979980469, 0.2892608642578125, 0.3055000305175781, 0.32173919677734375, 0.3379783630371094, 0.354217529296875, 0.3704566955566406, 0.38669586181640625, 0.4029350280761719, 0.4191741943359375, 0.4354133605957031, 0.45165252685546875, 0.4678916931152344, 0.484130859375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 10.0, 10.0, 9.0, 20.0, 24.0, 20.0, 20.0, 32.0, 51.0, 54.0, 48.0, 57.0, 65.0, 55.0, 69.0, 71.0, 57.0, 53.0, 48.0, 41.0, 34.0, 22.0, 22.0, 21.0, 25.0, 18.0, 9.0, 12.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28515625, -0.2760581970214844, -0.26696014404296875, -0.2578620910644531, -0.2487640380859375, -0.23966598510742188, -0.23056793212890625, -0.22146987915039062, -0.212371826171875, -0.20327377319335938, -0.19417572021484375, -0.18507766723632812, -0.1759796142578125, -0.16688156127929688, -0.15778350830078125, -0.14868545532226562, -0.13958740234375, -0.13048934936523438, -0.12139129638671875, -0.11229324340820312, -0.1031951904296875, -0.09409713745117188, -0.08499908447265625, -0.07590103149414062, -0.066802978515625, -0.057704925537109375, -0.04860687255859375, -0.039508819580078125, -0.0304107666015625, -0.021312713623046875, -0.01221466064453125, -0.003116607666015625, 0.0059814453125, 0.015079498291015625, 0.02417755126953125, 0.033275604248046875, 0.0423736572265625, 0.051471710205078125, 0.06056976318359375, 0.06966781616210938, 0.078765869140625, 0.08786392211914062, 0.09696197509765625, 0.10606002807617188, 0.1151580810546875, 0.12425613403320312, 0.13335418701171875, 0.14245223999023438, 0.15155029296875, 0.16064834594726562, 0.16974639892578125, 0.17884445190429688, 0.1879425048828125, 0.19704055786132812, 0.20613861083984375, 0.21523666381835938, 0.224334716796875, 0.23343276977539062, 0.24253082275390625, 0.2516288757324219, 0.2607269287109375, 0.2698249816894531, 0.27892303466796875, 0.2880210876464844, 0.297119140625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 9.0, 6.0, 8.0, 19.0, 16.0, 26.0, 42.0, 55.0, 109.0, 159.0, 349.0, 689.0, 1799.0, 6395.0, 41874.0, 495114.0, 454202.0, 38321.0, 6078.0, 1792.0, 697.0, 333.0, 174.0, 116.0, 61.0, 33.0, 27.0, 15.0, 9.0, 7.0, 8.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.123046875, -1.0798187255859375, -1.036590576171875, -0.9933624267578125, -0.95013427734375, -0.9069061279296875, -0.863677978515625, -0.8204498291015625, -0.7772216796875, -0.7339935302734375, -0.690765380859375, -0.6475372314453125, -0.60430908203125, -0.5610809326171875, -0.517852783203125, -0.4746246337890625, -0.431396484375, -0.3881683349609375, -0.344940185546875, -0.3017120361328125, -0.25848388671875, -0.2152557373046875, -0.172027587890625, -0.1287994384765625, -0.0855712890625, -0.0423431396484375, 0.000885009765625, 0.0441131591796875, 0.08734130859375, 0.1305694580078125, 0.173797607421875, 0.2170257568359375, 0.26025390625, 0.3034820556640625, 0.346710205078125, 0.3899383544921875, 0.43316650390625, 0.4763946533203125, 0.519622802734375, 0.5628509521484375, 0.6060791015625, 0.6493072509765625, 0.692535400390625, 0.7357635498046875, 0.77899169921875, 0.8222198486328125, 0.865447998046875, 0.9086761474609375, 0.951904296875, 0.9951324462890625, 1.038360595703125, 1.0815887451171875, 1.12481689453125, 1.1680450439453125, 1.211273193359375, 1.2545013427734375, 1.2977294921875, 1.3409576416015625, 1.384185791015625, 1.4274139404296875, 1.47064208984375, 1.5138702392578125, 1.557098388671875, 1.6003265380859375, 1.6435546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 3.0, 5.0, 3.0, 6.0, 8.0, 8.0, 16.0, 19.0, 14.0, 28.0, 33.0, 34.0, 40.0, 59.0, 48.0, 45.0, 41.0, 45.0, 49.0, 49.0, 44.0, 47.0, 41.0, 33.0, 44.0, 40.0, 28.0, 27.0, 28.0, 28.0, 13.0, 14.0, 14.0, 6.0, 12.0, 6.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.072265625, -1.03314208984375, -0.9940185546875, -0.95489501953125, -0.915771484375, -0.87664794921875, -0.8375244140625, -0.79840087890625, -0.75927734375, -0.72015380859375, -0.6810302734375, -0.64190673828125, -0.602783203125, -0.56365966796875, -0.5245361328125, -0.48541259765625, -0.4462890625, -0.40716552734375, -0.3680419921875, -0.32891845703125, -0.289794921875, -0.25067138671875, -0.2115478515625, -0.17242431640625, -0.13330078125, -0.09417724609375, -0.0550537109375, -0.01593017578125, 0.023193359375, 0.06231689453125, 0.1014404296875, 0.14056396484375, 0.1796875, 0.21881103515625, 0.2579345703125, 0.29705810546875, 0.336181640625, 0.37530517578125, 0.4144287109375, 0.45355224609375, 0.49267578125, 0.53179931640625, 0.5709228515625, 0.61004638671875, 0.649169921875, 0.68829345703125, 0.7274169921875, 0.76654052734375, 0.8056640625, 0.84478759765625, 0.8839111328125, 0.92303466796875, 0.962158203125, 1.00128173828125, 1.0404052734375, 1.07952880859375, 1.11865234375, 1.15777587890625, 1.1968994140625, 1.23602294921875, 1.275146484375, 1.31427001953125, 1.3533935546875, 1.39251708984375, 1.431640625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 9.0, 19.0, 26.0, 56.0, 90.0, 160.0, 322.0, 901.0, 3154.0, 37849.0, 921936.0, 77569.0, 4518.0, 1113.0, 410.0, 198.0, 82.0, 48.0, 31.0, 23.0, 14.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9423828125, -1.8933258056640625, -1.844268798828125, -1.7952117919921875, -1.74615478515625, -1.6970977783203125, -1.648040771484375, -1.5989837646484375, -1.5499267578125, -1.5008697509765625, -1.451812744140625, -1.4027557373046875, -1.35369873046875, -1.3046417236328125, -1.255584716796875, -1.2065277099609375, -1.157470703125, -1.1084136962890625, -1.059356689453125, -1.0102996826171875, -0.96124267578125, -0.9121856689453125, -0.863128662109375, -0.8140716552734375, -0.7650146484375, -0.7159576416015625, -0.666900634765625, -0.6178436279296875, -0.56878662109375, -0.5197296142578125, -0.470672607421875, -0.4216156005859375, -0.37255859375, -0.3235015869140625, -0.274444580078125, -0.2253875732421875, -0.17633056640625, -0.1272735595703125, -0.078216552734375, -0.0291595458984375, 0.0198974609375, 0.0689544677734375, 0.118011474609375, 0.1670684814453125, 0.21612548828125, 0.2651824951171875, 0.314239501953125, 0.3632965087890625, 0.412353515625, 0.4614105224609375, 0.510467529296875, 0.5595245361328125, 0.60858154296875, 0.6576385498046875, 0.706695556640625, 0.7557525634765625, 0.8048095703125, 0.8538665771484375, 0.902923583984375, 0.9519805908203125, 1.00103759765625, 1.0500946044921875, 1.099151611328125, 1.1482086181640625, 1.197265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 13.0, 21.0, 52.0, 60.0, 99.0, 136.0, 154.0, 137.0, 136.0, 60.0, 47.0, 30.0, 20.0, 12.0, 10.0, 3.0, 5.0, 4.0, 2.0, 1.0], "bins": [-0.0002639293670654297, -0.00025871768593788147, -0.00025350600481033325, -0.00024829432368278503, -0.00024308264255523682, -0.0002378709614276886, -0.00023265928030014038, -0.00022744759917259216, -0.00022223591804504395, -0.00021702423691749573, -0.0002118125557899475, -0.0002066008746623993, -0.00020138919353485107, -0.00019617751240730286, -0.00019096583127975464, -0.00018575415015220642, -0.0001805424690246582, -0.00017533078789710999, -0.00017011910676956177, -0.00016490742564201355, -0.00015969574451446533, -0.00015448406338691711, -0.0001492723822593689, -0.00014406070113182068, -0.00013884902000427246, -0.00013363733887672424, -0.00012842565774917603, -0.0001232139766216278, -0.00011800229549407959, -0.00011279061436653137, -0.00010757893323898315, -0.00010236725211143494, -9.715557098388672e-05, -9.19438898563385e-05, -8.673220872879028e-05, -8.152052760124207e-05, -7.630884647369385e-05, -7.109716534614563e-05, -6.588548421859741e-05, -6.0673803091049194e-05, -5.5462121963500977e-05, -5.025044083595276e-05, -4.503875970840454e-05, -3.982707858085632e-05, -3.4615397453308105e-05, -2.9403716325759888e-05, -2.419203519821167e-05, -1.8980354070663452e-05, -1.3768672943115234e-05, -8.556991815567017e-06, -3.345310688018799e-06, 1.866370439529419e-06, 7.078051567077637e-06, 1.2289732694625854e-05, 1.7501413822174072e-05, 2.271309494972229e-05, 2.7924776077270508e-05, 3.3136457204818726e-05, 3.834813833236694e-05, 4.355981945991516e-05, 4.877150058746338e-05, 5.39831817150116e-05, 5.9194862842559814e-05, 6.440654397010803e-05, 6.961822509765625e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 7.0, 6.0, 17.0, 14.0, 31.0, 43.0, 84.0, 137.0, 272.0, 575.0, 1511.0, 5738.0, 52369.0, 803248.0, 169575.0, 11046.0, 2264.0, 797.0, 346.0, 174.0, 101.0, 71.0, 34.0, 25.0, 12.0, 13.0, 10.0, 10.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.125, -1.0915985107421875, -1.058197021484375, -1.0247955322265625, -0.99139404296875, -0.9579925537109375, -0.924591064453125, -0.8911895751953125, -0.8577880859375, -0.8243865966796875, -0.790985107421875, -0.7575836181640625, -0.72418212890625, -0.6907806396484375, -0.657379150390625, -0.6239776611328125, -0.590576171875, -0.5571746826171875, -0.523773193359375, -0.4903717041015625, -0.45697021484375, -0.4235687255859375, -0.390167236328125, -0.3567657470703125, -0.3233642578125, -0.2899627685546875, -0.256561279296875, -0.2231597900390625, -0.18975830078125, -0.1563568115234375, -0.122955322265625, -0.0895538330078125, -0.05615234375, -0.0227508544921875, 0.010650634765625, 0.0440521240234375, 0.07745361328125, 0.1108551025390625, 0.144256591796875, 0.1776580810546875, 0.2110595703125, 0.2444610595703125, 0.277862548828125, 0.3112640380859375, 0.34466552734375, 0.3780670166015625, 0.411468505859375, 0.4448699951171875, 0.478271484375, 0.5116729736328125, 0.545074462890625, 0.5784759521484375, 0.61187744140625, 0.6452789306640625, 0.678680419921875, 0.7120819091796875, 0.7454833984375, 0.7788848876953125, 0.812286376953125, 0.8456878662109375, 0.87908935546875, 0.9124908447265625, 0.945892333984375, 0.9792938232421875, 1.0126953125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 16.0, 55.0, 96.0, 182.0, 189.0, 204.0, 111.0, 72.0, 37.0, 18.0, 7.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8294525146484375, -0.773162841796875, -0.7168731689453125, -0.66058349609375, -0.6042938232421875, -0.548004150390625, -0.4917144775390625, -0.4354248046875, -0.3791351318359375, -0.322845458984375, -0.2665557861328125, -0.21026611328125, -0.1539764404296875, -0.097686767578125, -0.0413970947265625, 0.014892578125, 0.0711822509765625, 0.127471923828125, 0.1837615966796875, 0.24005126953125, 0.2963409423828125, 0.352630615234375, 0.4089202880859375, 0.4652099609375, 0.5214996337890625, 0.577789306640625, 0.6340789794921875, 0.69036865234375, 0.7466583251953125, 0.802947998046875, 0.8592376708984375, 0.91552734375, 0.9718170166015625, 1.028106689453125, 1.0843963623046875, 1.14068603515625, 1.1969757080078125, 1.253265380859375, 1.3095550537109375, 1.3658447265625, 1.4221343994140625, 1.478424072265625, 1.5347137451171875, 1.59100341796875, 1.6472930908203125, 1.703582763671875, 1.7598724365234375, 1.816162109375, 1.8724517822265625, 1.928741455078125, 1.9850311279296875, 2.04132080078125, 2.0976104736328125, 2.153900146484375, 2.2101898193359375, 2.2664794921875, 2.3227691650390625, 2.379058837890625, 2.4353485107421875, 2.49163818359375, 2.5479278564453125, 2.604217529296875, 2.6605072021484375, 2.716796875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 20.0, 71.0, 213.0, 363.0, 240.0, 62.0, 26.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.64280700683594, -39.80159378051758, -38.96038055419922, -38.119171142578125, -37.277957916259766, -36.436744689941406, -35.59553527832031, -34.75432205200195, -33.913108825683594, -33.071895599365234, -32.230682373046875, -31.38947296142578, -30.548259735107422, -29.707046508789062, -28.865835189819336, -28.02462387084961, -27.18341064453125, -26.34219741821289, -25.500986099243164, -24.659774780273438, -23.818561553955078, -22.97734832763672, -22.136137008666992, -21.294925689697266, -20.453712463378906, -19.612499237060547, -18.77128791809082, -17.930076599121094, -17.088863372802734, -16.247650146484375, -15.406438827514648, -14.565226554870605, -13.724013328552246, -12.882801055908203, -12.04158878326416, -11.200376510620117, -10.359164237976074, -9.517951965332031, -8.676739692687988, -7.835527420043945, -6.994315147399902, -6.153102874755859, -5.311890602111816, -4.470678329467773, -3.6294660568237305, -2.7882537841796875, -1.9470415115356445, -1.1058292388916016, -0.2646169662475586, 0.5765953063964844, 1.4178075790405273, 2.2590198516845703, 3.1002321243286133, 3.9414443969726562, 4.782656669616699, 5.623868942260742, 6.465081214904785, 7.306293487548828, 8.147505760192871, 8.988718032836914, 9.829930305480957, 10.671142578125, 11.512354850769043, 12.353567123413086, 13.194779396057129]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 8.0, 7.0, 9.0, 9.0, 13.0, 11.0, 17.0, 25.0, 30.0, 33.0, 37.0, 34.0, 35.0, 51.0, 53.0, 62.0, 54.0, 50.0, 55.0, 53.0, 63.0, 42.0, 51.0, 32.0, 25.0, 31.0, 21.0, 25.0, 17.0, 11.0, 11.0, 10.0, 3.0, 5.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.026670455932617, -5.824587821960449, -5.6225056648254395, -5.42042350769043, -5.218340873718262, -5.016258239746094, -4.814176082611084, -4.612093925476074, -4.410011291503906, -4.207928657531738, -4.0058465003967285, -3.8037641048431396, -3.601681709289551, -3.399599313735962, -3.197516918182373, -2.995434522628784, -2.7933521270751953, -2.5912697315216064, -2.3891873359680176, -2.1871049404144287, -1.9850225448608398, -1.782940149307251, -1.580857753753662, -1.3787753582000732, -1.1766929626464844, -0.9746105670928955, -0.7725281715393066, -0.5704457759857178, -0.3683633804321289, -0.16628098487854004, 0.03580141067504883, 0.2378838062286377, 0.43996667861938477, 0.6420490741729736, 0.8441314697265625, 1.0462138652801514, 1.2482962608337402, 1.450378656387329, 1.652461051940918, 1.8545434474945068, 2.0566258430480957, 2.2587082386016846, 2.4607906341552734, 2.6628730297088623, 2.864955425262451, 3.06703782081604, 3.269120216369629, 3.4712026119232178, 3.6732850074768066, 3.8753674030303955, 4.077449798583984, 4.279532432556152, 4.481614589691162, 4.683696746826172, 4.88577938079834, 5.087862014770508, 5.289944171905518, 5.492026329040527, 5.694108963012695, 5.896191596984863, 6.098273754119873, 6.300355911254883, 6.502438545227051, 6.704521179199219, 6.9066033363342285]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 10.0, 12.0, 18.0, 21.0, 37.0, 85.0, 123.0, 221.0, 473.0, 1112.0, 3041.0, 11142.0, 86111.0, 4035176.0, 44899.0, 7723.0, 2255.0, 868.0, 428.0, 210.0, 109.0, 72.0, 51.0, 37.0, 15.0, 7.0, 11.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8130722045898438, -0.7662811279296875, -0.7194900512695312, -0.672698974609375, -0.6259078979492188, -0.5791168212890625, -0.5323257446289062, -0.48553466796875, -0.43874359130859375, -0.3919525146484375, -0.34516143798828125, -0.298370361328125, -0.25157928466796875, -0.2047882080078125, -0.15799713134765625, -0.1112060546875, -0.06441497802734375, -0.0176239013671875, 0.02916717529296875, 0.075958251953125, 0.12274932861328125, 0.1695404052734375, 0.21633148193359375, 0.26312255859375, 0.30991363525390625, 0.3567047119140625, 0.40349578857421875, 0.450286865234375, 0.49707794189453125, 0.5438690185546875, 0.5906600952148438, 0.637451171875, 0.6842422485351562, 0.7310333251953125, 0.7778244018554688, 0.824615478515625, 0.8714065551757812, 0.9181976318359375, 0.9649887084960938, 1.01177978515625, 1.0585708618164062, 1.1053619384765625, 1.1521530151367188, 1.198944091796875, 1.2457351684570312, 1.2925262451171875, 1.3393173217773438, 1.3861083984375, 1.4328994750976562, 1.4796905517578125, 1.5264816284179688, 1.573272705078125, 1.6200637817382812, 1.6668548583984375, 1.7136459350585938, 1.76043701171875, 1.8072280883789062, 1.8540191650390625, 1.9008102416992188, 1.947601318359375, 1.9943923950195312, 2.0411834716796875, 2.0879745483398438, 2.134765625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 6.0, 4.0, 9.0, 11.0, 17.0, 17.0, 37.0, 42.0, 40.0, 63.0, 75.0, 86.0, 80.0, 71.0, 77.0, 72.0, 58.0, 62.0, 47.0, 27.0, 25.0, 18.0, 11.0, 14.0, 6.0, 7.0, 9.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.2942619323730469, -0.28163909912109375, -0.2690162658691406, -0.2563934326171875, -0.24377059936523438, -0.23114776611328125, -0.21852493286132812, -0.205902099609375, -0.19327926635742188, -0.18065643310546875, -0.16803359985351562, -0.1554107666015625, -0.14278793334960938, -0.13016510009765625, -0.11754226684570312, -0.10491943359375, -0.09229660034179688, -0.07967376708984375, -0.06705093383789062, -0.0544281005859375, -0.041805267333984375, -0.02918243408203125, -0.016559600830078125, -0.003936767578125, 0.008686065673828125, 0.02130889892578125, 0.033931732177734375, 0.0465545654296875, 0.059177398681640625, 0.07180023193359375, 0.08442306518554688, 0.0970458984375, 0.10966873168945312, 0.12229156494140625, 0.13491439819335938, 0.1475372314453125, 0.16016006469726562, 0.17278289794921875, 0.18540573120117188, 0.198028564453125, 0.21065139770507812, 0.22327423095703125, 0.23589706420898438, 0.2485198974609375, 0.2611427307128906, 0.27376556396484375, 0.2863883972167969, 0.29901123046875, 0.3116340637207031, 0.32425689697265625, 0.3368797302246094, 0.3495025634765625, 0.3621253967285156, 0.37474822998046875, 0.3873710632324219, 0.399993896484375, 0.4126167297363281, 0.42523956298828125, 0.4378623962402344, 0.4504852294921875, 0.4631080627441406, 0.47573089599609375, 0.4883537292480469, 0.5009765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 4.0, 5.0, 11.0, 14.0, 19.0, 34.0, 43.0, 43.0, 76.0, 98.0, 194.0, 274.0, 465.0, 714.0, 1412.0, 3083.0, 8039.0, 28261.0, 222537.0, 3847756.0, 58605.0, 13417.0, 4611.0, 2041.0, 1048.0, 511.0, 317.0, 214.0, 160.0, 93.0, 50.0, 37.0, 18.0, 27.0, 15.0, 9.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90869140625, -0.8753128051757812, -0.8419342041015625, -0.8085556030273438, -0.775177001953125, -0.7417984008789062, -0.7084197998046875, -0.6750411987304688, -0.64166259765625, -0.6082839965820312, -0.5749053955078125, -0.5415267944335938, -0.508148193359375, -0.47476959228515625, -0.4413909912109375, -0.40801239013671875, -0.3746337890625, -0.34125518798828125, -0.3078765869140625, -0.27449798583984375, -0.241119384765625, -0.20774078369140625, -0.1743621826171875, -0.14098358154296875, -0.10760498046875, -0.07422637939453125, -0.0408477783203125, -0.00746917724609375, 0.025909423828125, 0.05928802490234375, 0.0926666259765625, 0.12604522705078125, 0.159423828125, 0.19280242919921875, 0.2261810302734375, 0.25955963134765625, 0.292938232421875, 0.32631683349609375, 0.3596954345703125, 0.39307403564453125, 0.42645263671875, 0.45983123779296875, 0.4932098388671875, 0.5265884399414062, 0.559967041015625, 0.5933456420898438, 0.6267242431640625, 0.6601028442382812, 0.6934814453125, 0.7268600463867188, 0.7602386474609375, 0.7936172485351562, 0.826995849609375, 0.8603744506835938, 0.8937530517578125, 0.9271316528320312, 0.96051025390625, 0.9938888549804688, 1.0272674560546875, 1.0606460571289062, 1.094024658203125, 1.1274032592773438, 1.1607818603515625, 1.1941604614257812, 1.2275390625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 12.0, 23.0, 26.0, 59.0, 125.0, 2823.0, 771.0, 125.0, 43.0, 25.0, 9.0, 8.0, 8.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389404296875, -0.3779449462890625, -0.366485595703125, -0.3550262451171875, -0.34356689453125, -0.3321075439453125, -0.320648193359375, -0.3091888427734375, -0.2977294921875, -0.2862701416015625, -0.274810791015625, -0.2633514404296875, -0.25189208984375, -0.2404327392578125, -0.228973388671875, -0.2175140380859375, -0.2060546875, -0.1945953369140625, -0.183135986328125, -0.1716766357421875, -0.16021728515625, -0.1487579345703125, -0.137298583984375, -0.1258392333984375, -0.1143798828125, -0.1029205322265625, -0.091461181640625, -0.0800018310546875, -0.06854248046875, -0.0570831298828125, -0.045623779296875, -0.0341644287109375, -0.022705078125, -0.0112457275390625, 0.000213623046875, 0.0116729736328125, 0.02313232421875, 0.0345916748046875, 0.046051025390625, 0.0575103759765625, 0.0689697265625, 0.0804290771484375, 0.091888427734375, 0.1033477783203125, 0.11480712890625, 0.1262664794921875, 0.137725830078125, 0.1491851806640625, 0.16064453125, 0.1721038818359375, 0.183563232421875, 0.1950225830078125, 0.20648193359375, 0.2179412841796875, 0.229400634765625, 0.2408599853515625, 0.2523193359375, 0.2637786865234375, 0.275238037109375, 0.2866973876953125, 0.29815673828125, 0.3096160888671875, 0.321075439453125, 0.3325347900390625, 0.343994140625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 11.0, 10.0, 13.0, 39.0, 105.0, 141.0, 168.0, 180.0, 145.0, 79.0, 56.0, 29.0, 14.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0764315128326416, -1.0300545692443848, -0.9836775064468384, -0.9373005628585815, -0.8909235596656799, -0.8445465564727783, -0.7981696128845215, -0.7517926096916199, -0.7054156064987183, -0.6590386033058167, -0.612661600112915, -0.5662846565246582, -0.5199076533317566, -0.473530650138855, -0.42715367674827576, -0.38077670335769653, -0.3343997001647949, -0.2880226969718933, -0.2416457235813141, -0.19526873528957367, -0.14889174699783325, -0.10251475870609283, -0.05613777041435242, -0.009760797023773193, 0.03661620616912842, 0.08299319446086884, 0.12937018275260925, 0.17574717104434967, 0.2221241593360901, 0.2685011625289917, 0.3148781359195709, 0.36125510931015015, 0.4076322317123413, 0.4540092349052429, 0.5003862380981445, 0.5467631816864014, 0.593140184879303, 0.6395171880722046, 0.6858941316604614, 0.732271134853363, 0.7786481380462646, 0.8250251412391663, 0.8714021444320679, 0.9177790880203247, 0.9641560912132263, 1.010533094406128, 1.0569100379943848, 1.1032869815826416, 1.149664044380188, 1.1960409879684448, 1.2424180507659912, 1.288794994354248, 1.3351719379425049, 1.3815490007400513, 1.427925944328308, 1.4743030071258545, 1.5206799507141113, 1.5670568943023682, 1.6134339570999146, 1.6598109006881714, 1.7061879634857178, 1.7525649070739746, 1.7989418506622314, 1.8453187942504883, 1.8916958570480347]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 5.0, 8.0, 11.0, 9.0, 17.0, 21.0, 27.0, 28.0, 34.0, 45.0, 57.0, 48.0, 57.0, 54.0, 41.0, 53.0, 55.0, 62.0, 61.0, 46.0, 51.0, 40.0, 38.0, 23.0, 25.0, 18.0, 17.0, 12.0, 15.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6839041709899902, -0.6615318655967712, -0.6391595005989075, -0.6167871952056885, -0.5944148302078247, -0.5720425248146057, -0.5496701598167419, -0.527297854423523, -0.5049254894256592, -0.4825531542301178, -0.4601808190345764, -0.43780848383903503, -0.41543614864349365, -0.39306381344795227, -0.3706914782524109, -0.3483191728591919, -0.3259468376636505, -0.30357450246810913, -0.28120216727256775, -0.25882983207702637, -0.23645749688148499, -0.2140851616859436, -0.19171284139156342, -0.16934050619602203, -0.14696817100048065, -0.12459583580493927, -0.10222350060939789, -0.0798511728644371, -0.05747883766889572, -0.03510650247335434, -0.012734174728393555, 0.009638160467147827, 0.03201049566268921, 0.05438283085823059, 0.07675516605377197, 0.09912749379873276, 0.12149982899427414, 0.14387217164039612, 0.1662444919347763, 0.1886168271303177, 0.21098916232585907, 0.23336149752140045, 0.25573381781578064, 0.278106153011322, 0.3004784882068634, 0.3228508234024048, 0.34522315859794617, 0.36759549379348755, 0.38996782898902893, 0.4123401641845703, 0.4347124993801117, 0.4570848345756531, 0.47945716977119446, 0.5018295049667358, 0.5242018103599548, 0.5465741753578186, 0.5689464807510376, 0.5913187861442566, 0.6136911511421204, 0.6360634565353394, 0.6584358215332031, 0.6808081269264221, 0.7031804919242859, 0.7255527973175049, 0.7479251623153687]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 10.0, 8.0, 9.0, 22.0, 23.0, 26.0, 56.0, 57.0, 112.0, 190.0, 275.0, 455.0, 800.0, 1498.0, 2942.0, 6742.0, 16695.0, 47506.0, 146472.0, 355567.0, 301881.0, 108231.0, 35520.0, 12816.0, 5217.0, 2448.0, 1227.0, 665.0, 397.0, 227.0, 134.0, 88.0, 65.0, 58.0, 35.0, 23.0, 19.0, 12.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.58447265625, -0.5655364990234375, -0.546600341796875, -0.5276641845703125, -0.50872802734375, -0.4897918701171875, -0.470855712890625, -0.4519195556640625, -0.4329833984375, -0.4140472412109375, -0.395111083984375, -0.3761749267578125, -0.35723876953125, -0.3383026123046875, -0.319366455078125, -0.3004302978515625, -0.281494140625, -0.2625579833984375, -0.243621826171875, -0.2246856689453125, -0.20574951171875, -0.1868133544921875, -0.167877197265625, -0.1489410400390625, -0.1300048828125, -0.1110687255859375, -0.092132568359375, -0.0731964111328125, -0.05426025390625, -0.0353240966796875, -0.016387939453125, 0.0025482177734375, 0.021484375, 0.0404205322265625, 0.059356689453125, 0.0782928466796875, 0.09722900390625, 0.1161651611328125, 0.135101318359375, 0.1540374755859375, 0.1729736328125, 0.1919097900390625, 0.210845947265625, 0.2297821044921875, 0.24871826171875, 0.2676544189453125, 0.286590576171875, 0.3055267333984375, 0.324462890625, 0.3433990478515625, 0.362335205078125, 0.3812713623046875, 0.40020751953125, 0.4191436767578125, 0.438079833984375, 0.4570159912109375, 0.4759521484375, 0.4948883056640625, 0.513824462890625, 0.5327606201171875, 0.55169677734375, 0.5706329345703125, 0.589569091796875, 0.6085052490234375, 0.62744140625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 14.0, 15.0, 18.0, 17.0, 22.0, 32.0, 40.0, 49.0, 57.0, 72.0, 66.0, 74.0, 69.0, 57.0, 62.0, 51.0, 57.0, 34.0, 43.0, 27.0, 22.0, 23.0, 20.0, 12.0, 9.0, 4.0, 6.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28564453125, -0.27442169189453125, -0.2631988525390625, -0.25197601318359375, -0.240753173828125, -0.22953033447265625, -0.2183074951171875, -0.20708465576171875, -0.19586181640625, -0.18463897705078125, -0.1734161376953125, -0.16219329833984375, -0.150970458984375, -0.13974761962890625, -0.1285247802734375, -0.11730194091796875, -0.1060791015625, -0.09485626220703125, -0.0836334228515625, -0.07241058349609375, -0.061187744140625, -0.04996490478515625, -0.0387420654296875, -0.02751922607421875, -0.01629638671875, -0.00507354736328125, 0.0061492919921875, 0.01737213134765625, 0.028594970703125, 0.03981781005859375, 0.0510406494140625, 0.06226348876953125, 0.073486328125, 0.08470916748046875, 0.0959320068359375, 0.10715484619140625, 0.118377685546875, 0.12960052490234375, 0.1408233642578125, 0.15204620361328125, 0.16326904296875, 0.17449188232421875, 0.1857147216796875, 0.19693756103515625, 0.208160400390625, 0.21938323974609375, 0.2306060791015625, 0.24182891845703125, 0.2530517578125, 0.26427459716796875, 0.2754974365234375, 0.28672027587890625, 0.297943115234375, 0.30916595458984375, 0.3203887939453125, 0.33161163330078125, 0.34283447265625, 0.35405731201171875, 0.3652801513671875, 0.37650299072265625, 0.387725830078125, 0.39894866943359375, 0.4101715087890625, 0.42139434814453125, 0.4326171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 10.0, 7.0, 11.0, 19.0, 15.0, 31.0, 52.0, 61.0, 104.0, 164.0, 248.0, 398.0, 864.0, 2175.0, 8246.0, 64091.0, 608164.0, 326135.0, 29689.0, 4822.0, 1541.0, 686.0, 320.0, 214.0, 159.0, 107.0, 65.0, 37.0, 27.0, 23.0, 15.0, 12.0, 11.0, 6.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.32421875, -1.287261962890625, -1.25030517578125, -1.213348388671875, -1.1763916015625, -1.139434814453125, -1.10247802734375, -1.065521240234375, -1.028564453125, -0.991607666015625, -0.95465087890625, -0.917694091796875, -0.8807373046875, -0.843780517578125, -0.80682373046875, -0.769866943359375, -0.73291015625, -0.695953369140625, -0.65899658203125, -0.622039794921875, -0.5850830078125, -0.548126220703125, -0.51116943359375, -0.474212646484375, -0.437255859375, -0.400299072265625, -0.36334228515625, -0.326385498046875, -0.2894287109375, -0.252471923828125, -0.21551513671875, -0.178558349609375, -0.1416015625, -0.104644775390625, -0.06768798828125, -0.030731201171875, 0.0062255859375, 0.043182373046875, 0.08013916015625, 0.117095947265625, 0.154052734375, 0.191009521484375, 0.22796630859375, 0.264923095703125, 0.3018798828125, 0.338836669921875, 0.37579345703125, 0.412750244140625, 0.44970703125, 0.486663818359375, 0.52362060546875, 0.560577392578125, 0.5975341796875, 0.634490966796875, 0.67144775390625, 0.708404541015625, 0.745361328125, 0.782318115234375, 0.81927490234375, 0.856231689453125, 0.8931884765625, 0.930145263671875, 0.96710205078125, 1.004058837890625, 1.041015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 4.0, 4.0, 5.0, 9.0, 6.0, 10.0, 13.0, 19.0, 17.0, 21.0, 21.0, 19.0, 30.0, 37.0, 29.0, 39.0, 36.0, 37.0, 52.0, 38.0, 42.0, 47.0, 46.0, 35.0, 36.0, 33.0, 33.0, 29.0, 31.0, 23.0, 30.0, 27.0, 24.0, 24.0, 18.0, 10.0, 21.0, 10.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 6.0, 0.0, 3.0], "bins": [-1.2255859375, -1.1900177001953125, -1.154449462890625, -1.1188812255859375, -1.08331298828125, -1.0477447509765625, -1.012176513671875, -0.9766082763671875, -0.9410400390625, -0.9054718017578125, -0.869903564453125, -0.8343353271484375, -0.79876708984375, -0.7631988525390625, -0.727630615234375, -0.6920623779296875, -0.656494140625, -0.6209259033203125, -0.585357666015625, -0.5497894287109375, -0.51422119140625, -0.4786529541015625, -0.443084716796875, -0.4075164794921875, -0.3719482421875, -0.3363800048828125, -0.300811767578125, -0.2652435302734375, -0.22967529296875, -0.1941070556640625, -0.158538818359375, -0.1229705810546875, -0.08740234375, -0.0518341064453125, -0.016265869140625, 0.0193023681640625, 0.05487060546875, 0.0904388427734375, 0.126007080078125, 0.1615753173828125, 0.1971435546875, 0.2327117919921875, 0.268280029296875, 0.3038482666015625, 0.33941650390625, 0.3749847412109375, 0.410552978515625, 0.4461212158203125, 0.481689453125, 0.5172576904296875, 0.552825927734375, 0.5883941650390625, 0.62396240234375, 0.6595306396484375, 0.695098876953125, 0.7306671142578125, 0.7662353515625, 0.8018035888671875, 0.837371826171875, 0.8729400634765625, 0.90850830078125, 0.9440765380859375, 0.979644775390625, 1.0152130126953125, 1.05078125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 8.0, 15.0, 27.0, 41.0, 61.0, 134.0, 296.0, 1079.0, 6821.0, 604075.0, 428641.0, 5875.0, 923.0, 282.0, 101.0, 54.0, 40.0, 19.0, 20.0, 15.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6904296875, -1.64208984375, -1.59375, -1.54541015625, -1.4970703125, -1.44873046875, -1.400390625, -1.35205078125, -1.3037109375, -1.25537109375, -1.20703125, -1.15869140625, -1.1103515625, -1.06201171875, -1.013671875, -0.96533203125, -0.9169921875, -0.86865234375, -0.8203125, -0.77197265625, -0.7236328125, -0.67529296875, -0.626953125, -0.57861328125, -0.5302734375, -0.48193359375, -0.43359375, -0.38525390625, -0.3369140625, -0.28857421875, -0.240234375, -0.19189453125, -0.1435546875, -0.09521484375, -0.046875, 0.00146484375, 0.0498046875, 0.09814453125, 0.146484375, 0.19482421875, 0.2431640625, 0.29150390625, 0.33984375, 0.38818359375, 0.4365234375, 0.48486328125, 0.533203125, 0.58154296875, 0.6298828125, 0.67822265625, 0.7265625, 0.77490234375, 0.8232421875, 0.87158203125, 0.919921875, 0.96826171875, 1.0166015625, 1.06494140625, 1.11328125, 1.16162109375, 1.2099609375, 1.25830078125, 1.306640625, 1.35498046875, 1.4033203125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 9.0, 15.0, 15.0, 22.0, 34.0, 44.0, 44.0, 57.0, 103.0, 98.0, 108.0, 109.0, 76.0, 77.0, 53.0, 39.0, 25.0, 15.0, 12.0, 11.0, 10.0, 3.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.580352783203125e-05, -6.271898746490479e-05, -5.963444709777832e-05, -5.6549906730651855e-05, -5.346536636352539e-05, -5.0380825996398926e-05, -4.729628562927246e-05, -4.4211745262145996e-05, -4.112720489501953e-05, -3.8042664527893066e-05, -3.49581241607666e-05, -3.187358379364014e-05, -2.8789043426513672e-05, -2.5704503059387207e-05, -2.2619962692260742e-05, -1.9535422325134277e-05, -1.6450881958007812e-05, -1.3366341590881348e-05, -1.0281801223754883e-05, -7.197260856628418e-06, -4.112720489501953e-06, -1.0281801223754883e-06, 2.0563602447509766e-06, 5.140900611877441e-06, 8.225440979003906e-06, 1.1309981346130371e-05, 1.4394521713256836e-05, 1.74790620803833e-05, 2.0563602447509766e-05, 2.364814281463623e-05, 2.6732683181762695e-05, 2.981722354888916e-05, 3.2901763916015625e-05, 3.598630428314209e-05, 3.9070844650268555e-05, 4.215538501739502e-05, 4.5239925384521484e-05, 4.832446575164795e-05, 5.1409006118774414e-05, 5.449354648590088e-05, 5.7578086853027344e-05, 6.066262722015381e-05, 6.374716758728027e-05, 6.683170795440674e-05, 6.99162483215332e-05, 7.300078868865967e-05, 7.608532905578613e-05, 7.91698694229126e-05, 8.225440979003906e-05, 8.533895015716553e-05, 8.842349052429199e-05, 9.150803089141846e-05, 9.459257125854492e-05, 9.767711162567139e-05, 0.00010076165199279785, 0.00010384619235992432, 0.00010693073272705078, 0.00011001527309417725, 0.00011309981346130371, 0.00011618435382843018, 0.00011926889419555664, 0.0001223534345626831, 0.00012543797492980957, 0.00012852251529693604, 0.0001316070556640625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 15.0, 18.0, 27.0, 53.0, 104.0, 171.0, 377.0, 1086.0, 4070.0, 40275.0, 864895.0, 127688.0, 7259.0, 1503.0, 497.0, 215.0, 109.0, 58.0, 35.0, 30.0, 18.0, 12.0, 6.0, 10.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.041015625, -1.0109786987304688, -0.9809417724609375, -0.9509048461914062, -0.920867919921875, -0.8908309936523438, -0.8607940673828125, -0.8307571411132812, -0.80072021484375, -0.7706832885742188, -0.7406463623046875, -0.7106094360351562, -0.680572509765625, -0.6505355834960938, -0.6204986572265625, -0.5904617309570312, -0.5604248046875, -0.5303878784179688, -0.5003509521484375, -0.47031402587890625, -0.440277099609375, -0.41024017333984375, -0.3802032470703125, -0.35016632080078125, -0.32012939453125, -0.29009246826171875, -0.2600555419921875, -0.23001861572265625, -0.199981689453125, -0.16994476318359375, -0.1399078369140625, -0.10987091064453125, -0.079833984375, -0.04979705810546875, -0.0197601318359375, 0.01027679443359375, 0.040313720703125, 0.07035064697265625, 0.1003875732421875, 0.13042449951171875, 0.16046142578125, 0.19049835205078125, 0.2205352783203125, 0.25057220458984375, 0.280609130859375, 0.31064605712890625, 0.3406829833984375, 0.37071990966796875, 0.4007568359375, 0.43079376220703125, 0.4608306884765625, 0.49086761474609375, 0.520904541015625, 0.5509414672851562, 0.5809783935546875, 0.6110153198242188, 0.64105224609375, 0.6710891723632812, 0.7011260986328125, 0.7311630249023438, 0.761199951171875, 0.7912368774414062, 0.8212738037109375, 0.8513107299804688, 0.88134765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 17.0, 16.0, 21.0, 35.0, 30.0, 59.0, 57.0, 67.0, 82.0, 107.0, 84.0, 79.0, 69.0, 53.0, 46.0, 49.0, 32.0, 19.0, 8.0, 16.0, 9.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40673828125, -0.3888702392578125, -0.371002197265625, -0.3531341552734375, -0.33526611328125, -0.3173980712890625, -0.299530029296875, -0.2816619873046875, -0.2637939453125, -0.2459259033203125, -0.228057861328125, -0.2101898193359375, -0.19232177734375, -0.1744537353515625, -0.156585693359375, -0.1387176513671875, -0.120849609375, -0.1029815673828125, -0.085113525390625, -0.0672454833984375, -0.04937744140625, -0.0315093994140625, -0.013641357421875, 0.0042266845703125, 0.0220947265625, 0.0399627685546875, 0.057830810546875, 0.0756988525390625, 0.09356689453125, 0.1114349365234375, 0.129302978515625, 0.1471710205078125, 0.1650390625, 0.1829071044921875, 0.200775146484375, 0.2186431884765625, 0.23651123046875, 0.2543792724609375, 0.272247314453125, 0.2901153564453125, 0.3079833984375, 0.3258514404296875, 0.343719482421875, 0.3615875244140625, 0.37945556640625, 0.3973236083984375, 0.415191650390625, 0.4330596923828125, 0.450927734375, 0.4687957763671875, 0.486663818359375, 0.5045318603515625, 0.52239990234375, 0.5402679443359375, 0.558135986328125, 0.5760040283203125, 0.5938720703125, 0.6117401123046875, 0.629608154296875, 0.6474761962890625, 0.66534423828125, 0.6832122802734375, 0.701080322265625, 0.7189483642578125, 0.73681640625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 8.0, 36.0, 50.0, 119.0, 159.0, 197.0, 164.0, 114.0, 79.0, 39.0, 18.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.68136978149414, -13.344270706176758, -13.007170677185059, -12.67007064819336, -12.332971572875977, -11.995872497558594, -11.658772468566895, -11.321672439575195, -10.984573364257812, -10.64747428894043, -10.31037425994873, -9.973274230957031, -9.636175155639648, -9.299076080322266, -8.961976051330566, -8.624876022338867, -8.287776947021484, -7.950677394866943, -7.613577842712402, -7.276478290557861, -6.93937873840332, -6.602279186248779, -6.265179634094238, -5.928080081939697, -5.590980529785156, -5.253880977630615, -4.916781425476074, -4.579681873321533, -4.242582321166992, -3.905482769012451, -3.56838321685791, -3.231283664703369, -2.8941831588745117, -2.5570836067199707, -2.2199840545654297, -1.8828845024108887, -1.5457849502563477, -1.2086853981018066, -0.8715858459472656, -0.5344862937927246, -0.1973867416381836, 0.13971281051635742, 0.47681236267089844, 0.8139119148254395, 1.1510114669799805, 1.4881110191345215, 1.8252105712890625, 2.1623101234436035, 2.4994096755981445, 2.8365092277526855, 3.1736087799072266, 3.5107083320617676, 3.8478078842163086, 4.18490743637085, 4.522006988525391, 4.859106540679932, 5.196206092834473, 5.533305644989014, 5.870405197143555, 6.207504749298096, 6.544604301452637, 6.881703853607178, 7.218803405761719, 7.55590295791626, 7.893002510070801]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 13.0, 14.0, 14.0, 27.0, 26.0, 26.0, 26.0, 41.0, 33.0, 38.0, 52.0, 57.0, 55.0, 43.0, 58.0, 66.0, 52.0, 49.0, 49.0, 39.0, 36.0, 31.0, 26.0, 17.0, 13.0, 24.0, 12.0, 7.0, 11.0, 6.0, 6.0, 6.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.996451377868652, -6.802894592285156, -6.60933780670166, -6.415781021118164, -6.222224235534668, -6.028667449951172, -5.835110664367676, -5.64155387878418, -5.447997093200684, -5.2544403076171875, -5.060883522033691, -4.867326736450195, -4.673769950866699, -4.480213165283203, -4.286656379699707, -4.093099594116211, -3.899543285369873, -3.705986499786377, -3.512429714202881, -3.3188729286193848, -3.1253161430358887, -2.9317593574523926, -2.7382028102874756, -2.5446460247039795, -2.3510892391204834, -2.1575324535369873, -1.9639756679534912, -1.7704190015792847, -1.5768622159957886, -1.3833054304122925, -1.189748764038086, -0.9961919784545898, -0.802635669708252, -0.6090788841247559, -0.41552215814590454, -0.22196543216705322, -0.02840864658355713, 0.16514813899993896, 0.3587048053741455, 0.5522615909576416, 0.7458183765411377, 0.9393751621246338, 1.1329319477081299, 1.3264886140823364, 1.5200453996658325, 1.7136021852493286, 1.9071588516235352, 2.1007156372070312, 2.2942724227905273, 2.4878292083740234, 2.6813859939575195, 2.8749427795410156, 3.0684995651245117, 3.262056350708008, 3.455612897872925, 3.649169683456421, 3.842726469039917, 4.036283016204834, 4.22983980178833, 4.423396587371826, 4.616953372955322, 4.810510158538818, 5.0040669441223145, 5.1976237297058105, 5.391180515289307]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 8.0, 18.0, 27.0, 41.0, 75.0, 117.0, 217.0, 343.0, 661.0, 1340.0, 2996.0, 7882.0, 25669.0, 150951.0, 3824361.0, 141725.0, 24570.0, 7401.0, 2975.0, 1287.0, 687.0, 366.0, 185.0, 118.0, 68.0, 53.0, 36.0, 34.0, 26.0, 10.0, 9.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.85205078125, -0.8266067504882812, -0.8011627197265625, -0.7757186889648438, -0.750274658203125, -0.7248306274414062, -0.6993865966796875, -0.6739425659179688, -0.64849853515625, -0.6230545043945312, -0.5976104736328125, -0.5721664428710938, -0.546722412109375, -0.5212783813476562, -0.4958343505859375, -0.47039031982421875, -0.4449462890625, -0.41950225830078125, -0.3940582275390625, -0.36861419677734375, -0.343170166015625, -0.31772613525390625, -0.2922821044921875, -0.26683807373046875, -0.24139404296875, -0.21595001220703125, -0.1905059814453125, -0.16506195068359375, -0.139617919921875, -0.11417388916015625, -0.0887298583984375, -0.06328582763671875, -0.037841796875, -0.01239776611328125, 0.0130462646484375, 0.03849029541015625, 0.063934326171875, 0.08937835693359375, 0.1148223876953125, 0.14026641845703125, 0.16571044921875, 0.19115447998046875, 0.2165985107421875, 0.24204254150390625, 0.267486572265625, 0.29293060302734375, 0.3183746337890625, 0.34381866455078125, 0.3692626953125, 0.39470672607421875, 0.4201507568359375, 0.44559478759765625, 0.471038818359375, 0.49648284912109375, 0.5219268798828125, 0.5473709106445312, 0.57281494140625, 0.5982589721679688, 0.6237030029296875, 0.6491470336914062, 0.674591064453125, 0.7000350952148438, 0.7254791259765625, 0.7509231567382812, 0.7763671875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 11.0, 12.0, 21.0, 15.0, 32.0, 33.0, 58.0, 68.0, 77.0, 75.0, 88.0, 87.0, 70.0, 65.0, 54.0, 46.0, 36.0, 39.0, 35.0, 17.0, 6.0, 12.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.385986328125, -0.37351226806640625, -0.3610382080078125, -0.34856414794921875, -0.336090087890625, -0.32361602783203125, -0.3111419677734375, -0.29866790771484375, -0.28619384765625, -0.27371978759765625, -0.2612457275390625, -0.24877166748046875, -0.236297607421875, -0.22382354736328125, -0.2113494873046875, -0.19887542724609375, -0.1864013671875, -0.17392730712890625, -0.1614532470703125, -0.14897918701171875, -0.136505126953125, -0.12403106689453125, -0.1115570068359375, -0.09908294677734375, -0.08660888671875, -0.07413482666015625, -0.0616607666015625, -0.04918670654296875, -0.036712646484375, -0.02423858642578125, -0.0117645263671875, 0.00070953369140625, 0.01318359375, 0.02565765380859375, 0.0381317138671875, 0.05060577392578125, 0.063079833984375, 0.07555389404296875, 0.0880279541015625, 0.10050201416015625, 0.11297607421875, 0.12545013427734375, 0.1379241943359375, 0.15039825439453125, 0.162872314453125, 0.17534637451171875, 0.1878204345703125, 0.20029449462890625, 0.2127685546875, 0.22524261474609375, 0.2377166748046875, 0.25019073486328125, 0.262664794921875, 0.27513885498046875, 0.2876129150390625, 0.30008697509765625, 0.31256103515625, 0.32503509521484375, 0.3375091552734375, 0.34998321533203125, 0.362457275390625, 0.37493133544921875, 0.3874053955078125, 0.39987945556640625, 0.412353515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 11.0, 23.0, 18.0, 39.0, 61.0, 111.0, 179.0, 342.0, 606.0, 1019.0, 2118.0, 4533.0, 10827.0, 30115.0, 108972.0, 3136119.0, 773247.0, 83628.0, 25076.0, 9302.0, 3899.0, 1855.0, 946.0, 492.0, 273.0, 167.0, 117.0, 61.0, 44.0, 29.0, 19.0, 13.0, 9.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6015625, -0.5838241577148438, -0.5660858154296875, -0.5483474731445312, -0.530609130859375, -0.5128707885742188, -0.4951324462890625, -0.47739410400390625, -0.45965576171875, -0.44191741943359375, -0.4241790771484375, -0.40644073486328125, -0.388702392578125, -0.37096405029296875, -0.3532257080078125, -0.33548736572265625, -0.3177490234375, -0.30001068115234375, -0.2822723388671875, -0.26453399658203125, -0.246795654296875, -0.22905731201171875, -0.2113189697265625, -0.19358062744140625, -0.17584228515625, -0.15810394287109375, -0.1403656005859375, -0.12262725830078125, -0.104888916015625, -0.08715057373046875, -0.0694122314453125, -0.05167388916015625, -0.033935546875, -0.01619720458984375, 0.0015411376953125, 0.01927947998046875, 0.037017822265625, 0.05475616455078125, 0.0724945068359375, 0.09023284912109375, 0.10797119140625, 0.12570953369140625, 0.1434478759765625, 0.16118621826171875, 0.178924560546875, 0.19666290283203125, 0.2144012451171875, 0.23213958740234375, 0.2498779296875, 0.26761627197265625, 0.2853546142578125, 0.30309295654296875, 0.320831298828125, 0.33856964111328125, 0.3563079833984375, 0.37404632568359375, 0.39178466796875, 0.40952301025390625, 0.4272613525390625, 0.44499969482421875, 0.462738037109375, 0.48047637939453125, 0.4982147216796875, 0.5159530639648438, 0.53369140625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 9.0, 13.0, 19.0, 18.0, 23.0, 40.0, 63.0, 83.0, 191.0, 365.0, 2428.0, 413.0, 147.0, 83.0, 62.0, 33.0, 17.0, 23.0, 11.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31298828125, -0.3023872375488281, -0.29178619384765625, -0.2811851501464844, -0.2705841064453125, -0.2599830627441406, -0.24938201904296875, -0.23878097534179688, -0.228179931640625, -0.21757888793945312, -0.20697784423828125, -0.19637680053710938, -0.1857757568359375, -0.17517471313476562, -0.16457366943359375, -0.15397262573242188, -0.14337158203125, -0.13277053833007812, -0.12216949462890625, -0.11156845092773438, -0.1009674072265625, -0.09036636352539062, -0.07976531982421875, -0.06916427612304688, -0.058563232421875, -0.047962188720703125, -0.03736114501953125, -0.026760101318359375, -0.0161590576171875, -0.005558013916015625, 0.00504302978515625, 0.015644073486328125, 0.0262451171875, 0.036846160888671875, 0.04744720458984375, 0.058048248291015625, 0.0686492919921875, 0.07925033569335938, 0.08985137939453125, 0.10045242309570312, 0.111053466796875, 0.12165451049804688, 0.13225555419921875, 0.14285659790039062, 0.1534576416015625, 0.16405868530273438, 0.17465972900390625, 0.18526077270507812, 0.19586181640625, 0.20646286010742188, 0.21706390380859375, 0.22766494750976562, 0.2382659912109375, 0.24886703491210938, 0.25946807861328125, 0.2700691223144531, 0.280670166015625, 0.2912712097167969, 0.30187225341796875, 0.3124732971191406, 0.3230743408203125, 0.3336753845214844, 0.34427642822265625, 0.3548774719238281, 0.365478515625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 12.0, 31.0, 66.0, 135.0, 241.0, 230.0, 144.0, 82.0, 37.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-4.896330833435059, -4.804879188537598, -4.713428020477295, -4.621976375579834, -4.530524730682373, -4.43907356262207, -4.347621917724609, -4.256170272827148, -4.164719104766846, -4.073267459869385, -3.981816053390503, -3.890364646911621, -3.7989132404327393, -3.7074618339538574, -3.6160101890563965, -3.5245587825775146, -3.433107376098633, -3.341655969619751, -3.25020432472229, -3.158752918243408, -3.0673015117645264, -2.9758501052856445, -2.8843984603881836, -2.7929470539093018, -2.701495409011841, -2.610044002532959, -2.518592357635498, -2.427140951156616, -2.3356895446777344, -2.2442381381988525, -2.1527864933013916, -2.0613350868225098, -1.969883680343628, -1.8784321546554565, -1.7869807481765747, -1.6955292224884033, -1.6040778160095215, -1.51262629032135, -1.4211747646331787, -1.3297233581542969, -1.2382718324661255, -1.146820306777954, -1.0553689002990723, -0.9639173746109009, -0.872465968132019, -0.7810144424438477, -0.689562976360321, -0.5981115102767944, -0.5066600441932678, -0.4152085781097412, -0.3237571120262146, -0.2323056161403656, -0.140854150056839, -0.04940268397331238, 0.04204881191253662, 0.13350027799606323, 0.22495174407958984, 0.31640321016311646, 0.40785467624664307, 0.49930617213249207, 0.5907576084136963, 0.6822091341018677, 0.7736606001853943, 0.8651120662689209, 0.9565635323524475]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 4.0, 6.0, 10.0, 9.0, 17.0, 23.0, 15.0, 19.0, 23.0, 26.0, 32.0, 43.0, 41.0, 44.0, 36.0, 42.0, 42.0, 41.0, 38.0, 29.0, 33.0, 48.0, 31.0, 29.0, 45.0, 34.0, 25.0, 30.0, 30.0, 21.0, 22.0, 21.0, 12.0, 13.0, 12.0, 11.0, 9.0, 3.0, 3.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8800595998764038, -0.851436972618103, -0.8228143453598022, -0.7941917181015015, -0.7655691504478455, -0.7369465231895447, -0.7083238959312439, -0.6797012686729431, -0.6510787010192871, -0.6224560737609863, -0.5938334465026855, -0.5652108192443848, -0.5365882515907288, -0.507965624332428, -0.4793429970741272, -0.4507203698158264, -0.42209774255752563, -0.39347511529922485, -0.36485251784324646, -0.3362298905849457, -0.3076072931289673, -0.2789846658706665, -0.2503620386123657, -0.22173942625522614, -0.19311681389808655, -0.16449420154094696, -0.13587158918380737, -0.10724896192550659, -0.078626349568367, -0.05000373721122742, -0.021381109952926636, 0.007241502404212952, 0.035864055156707764, 0.06448666751384735, 0.09310928732156754, 0.12173190712928772, 0.1503545194864273, 0.1789771318435669, 0.20759975910186768, 0.23622237145900726, 0.26484498381614685, 0.29346761107444763, 0.322090208530426, 0.3507128357887268, 0.3793354630470276, 0.407958060503006, 0.43658068776130676, 0.46520328521728516, 0.49382591247558594, 0.5224485397338867, 0.5510711669921875, 0.5796937942504883, 0.6083163619041443, 0.6369389891624451, 0.6655616164207458, 0.6941842436790466, 0.7228068113327026, 0.7514294385910034, 0.7800520658493042, 0.808674693107605, 0.837297260761261, 0.8659198880195618, 0.8945425152778625, 0.9231651425361633, 0.9517877697944641]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 15.0, 9.0, 21.0, 35.0, 45.0, 73.0, 135.0, 287.0, 657.0, 1853.0, 7058.0, 41327.0, 353408.0, 552926.0, 75124.0, 11293.0, 2670.0, 882.0, 345.0, 149.0, 97.0, 57.0, 22.0, 17.0, 10.0, 9.0, 2.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.3232421875, -1.2885513305664062, -1.2538604736328125, -1.2191696166992188, -1.184478759765625, -1.1497879028320312, -1.1150970458984375, -1.0804061889648438, -1.04571533203125, -1.0110244750976562, -0.9763336181640625, -0.9416427612304688, -0.906951904296875, -0.8722610473632812, -0.8375701904296875, -0.8028793334960938, -0.7681884765625, -0.7334976196289062, -0.6988067626953125, -0.6641159057617188, -0.629425048828125, -0.5947341918945312, -0.5600433349609375, -0.5253524780273438, -0.49066162109375, -0.45597076416015625, -0.4212799072265625, -0.38658905029296875, -0.351898193359375, -0.31720733642578125, -0.2825164794921875, -0.24782562255859375, -0.213134765625, -0.17844390869140625, -0.1437530517578125, -0.10906219482421875, -0.074371337890625, -0.03968048095703125, -0.0049896240234375, 0.02970123291015625, 0.06439208984375, 0.09908294677734375, 0.1337738037109375, 0.16846466064453125, 0.203155517578125, 0.23784637451171875, 0.2725372314453125, 0.30722808837890625, 0.3419189453125, 0.37660980224609375, 0.4113006591796875, 0.44599151611328125, 0.480682373046875, 0.5153732299804688, 0.5500640869140625, 0.5847549438476562, 0.61944580078125, 0.6541366577148438, 0.6888275146484375, 0.7235183715820312, 0.758209228515625, 0.7929000854492188, 0.8275909423828125, 0.8622817993164062, 0.89697265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 5.0, 13.0, 11.0, 15.0, 15.0, 34.0, 41.0, 33.0, 49.0, 64.0, 71.0, 85.0, 101.0, 84.0, 74.0, 65.0, 59.0, 40.0, 30.0, 24.0, 22.0, 13.0, 16.0, 9.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.40283203125, -0.39003753662109375, -0.3772430419921875, -0.36444854736328125, -0.351654052734375, -0.33885955810546875, -0.3260650634765625, -0.31327056884765625, -0.30047607421875, -0.28768157958984375, -0.2748870849609375, -0.26209259033203125, -0.249298095703125, -0.23650360107421875, -0.2237091064453125, -0.21091461181640625, -0.1981201171875, -0.18532562255859375, -0.1725311279296875, -0.15973663330078125, -0.146942138671875, -0.13414764404296875, -0.1213531494140625, -0.10855865478515625, -0.09576416015625, -0.08296966552734375, -0.0701751708984375, -0.05738067626953125, -0.044586181640625, -0.03179168701171875, -0.0189971923828125, -0.00620269775390625, 0.006591796875, 0.01938629150390625, 0.0321807861328125, 0.04497528076171875, 0.057769775390625, 0.07056427001953125, 0.0833587646484375, 0.09615325927734375, 0.10894775390625, 0.12174224853515625, 0.1345367431640625, 0.14733123779296875, 0.160125732421875, 0.17292022705078125, 0.1857147216796875, 0.19850921630859375, 0.2113037109375, 0.22409820556640625, 0.2368927001953125, 0.24968719482421875, 0.262481689453125, 0.27527618408203125, 0.2880706787109375, 0.30086517333984375, 0.31365966796875, 0.32645416259765625, 0.3392486572265625, 0.35204315185546875, 0.364837646484375, 0.37763214111328125, 0.3904266357421875, 0.40322113037109375, 0.416015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 3.0, 4.0, 6.0, 3.0, 12.0, 14.0, 19.0, 26.0, 43.0, 56.0, 83.0, 117.0, 206.0, 337.0, 618.0, 1305.0, 3867.0, 20112.0, 237737.0, 696834.0, 74010.0, 8721.0, 2235.0, 941.0, 480.0, 241.0, 159.0, 120.0, 67.0, 55.0, 32.0, 20.0, 12.0, 14.0, 19.0, 6.0, 7.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.390625, -1.352294921875, -1.31396484375, -1.275634765625, -1.2373046875, -1.198974609375, -1.16064453125, -1.122314453125, -1.083984375, -1.045654296875, -1.00732421875, -0.968994140625, -0.9306640625, -0.892333984375, -0.85400390625, -0.815673828125, -0.77734375, -0.739013671875, -0.70068359375, -0.662353515625, -0.6240234375, -0.585693359375, -0.54736328125, -0.509033203125, -0.470703125, -0.432373046875, -0.39404296875, -0.355712890625, -0.3173828125, -0.279052734375, -0.24072265625, -0.202392578125, -0.1640625, -0.125732421875, -0.08740234375, -0.049072265625, -0.0107421875, 0.027587890625, 0.06591796875, 0.104248046875, 0.142578125, 0.180908203125, 0.21923828125, 0.257568359375, 0.2958984375, 0.334228515625, 0.37255859375, 0.410888671875, 0.44921875, 0.487548828125, 0.52587890625, 0.564208984375, 0.6025390625, 0.640869140625, 0.67919921875, 0.717529296875, 0.755859375, 0.794189453125, 0.83251953125, 0.870849609375, 0.9091796875, 0.947509765625, 0.98583984375, 1.024169921875, 1.0625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 1.0, 9.0, 9.0, 8.0, 12.0, 19.0, 22.0, 26.0, 25.0, 31.0, 32.0, 35.0, 30.0, 41.0, 44.0, 45.0, 53.0, 54.0, 55.0, 57.0, 44.0, 37.0, 36.0, 39.0, 35.0, 25.0, 27.0, 22.0, 19.0, 24.0, 17.0, 19.0, 7.0, 6.0, 11.0, 7.0, 3.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3759765625, -1.33538818359375, -1.2947998046875, -1.25421142578125, -1.213623046875, -1.17303466796875, -1.1324462890625, -1.09185791015625, -1.05126953125, -1.01068115234375, -0.9700927734375, -0.92950439453125, -0.888916015625, -0.84832763671875, -0.8077392578125, -0.76715087890625, -0.7265625, -0.68597412109375, -0.6453857421875, -0.60479736328125, -0.564208984375, -0.52362060546875, -0.4830322265625, -0.44244384765625, -0.40185546875, -0.36126708984375, -0.3206787109375, -0.28009033203125, -0.239501953125, -0.19891357421875, -0.1583251953125, -0.11773681640625, -0.0771484375, -0.03656005859375, 0.0040283203125, 0.04461669921875, 0.085205078125, 0.12579345703125, 0.1663818359375, 0.20697021484375, 0.24755859375, 0.28814697265625, 0.3287353515625, 0.36932373046875, 0.409912109375, 0.45050048828125, 0.4910888671875, 0.53167724609375, 0.572265625, 0.61285400390625, 0.6534423828125, 0.69403076171875, 0.734619140625, 0.77520751953125, 0.8157958984375, 0.85638427734375, 0.89697265625, 0.93756103515625, 0.9781494140625, 1.01873779296875, 1.059326171875, 1.09991455078125, 1.1405029296875, 1.18109130859375, 1.2216796875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 6.0, 4.0, 6.0, 14.0, 16.0, 53.0, 57.0, 98.0, 164.0, 339.0, 811.0, 2367.0, 12241.0, 191496.0, 783181.0, 49622.0, 5513.0, 1411.0, 540.0, 235.0, 152.0, 65.0, 55.0, 32.0, 21.0, 14.0, 8.0, 4.0, 2.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.48575592041015625, -0.4685821533203125, -0.45140838623046875, -0.434234619140625, -0.41706085205078125, -0.3998870849609375, -0.38271331787109375, -0.36553955078125, -0.34836578369140625, -0.3311920166015625, -0.31401824951171875, -0.296844482421875, -0.27967071533203125, -0.2624969482421875, -0.24532318115234375, -0.2281494140625, -0.21097564697265625, -0.1938018798828125, -0.17662811279296875, -0.159454345703125, -0.14228057861328125, -0.1251068115234375, -0.10793304443359375, -0.09075927734375, -0.07358551025390625, -0.0564117431640625, -0.03923797607421875, -0.022064208984375, -0.00489044189453125, 0.0122833251953125, 0.02945709228515625, 0.046630859375, 0.06380462646484375, 0.0809783935546875, 0.09815216064453125, 0.115325927734375, 0.13249969482421875, 0.1496734619140625, 0.16684722900390625, 0.18402099609375, 0.20119476318359375, 0.2183685302734375, 0.23554229736328125, 0.252716064453125, 0.26988983154296875, 0.2870635986328125, 0.30423736572265625, 0.3214111328125, 0.33858489990234375, 0.3557586669921875, 0.37293243408203125, 0.390106201171875, 0.40727996826171875, 0.4244537353515625, 0.44162750244140625, 0.45880126953125, 0.47597503662109375, 0.4931488037109375, 0.5103225708007812, 0.527496337890625, 0.5446701049804688, 0.5618438720703125, 0.5790176391601562, 0.59619140625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 12.0, 8.0, 7.0, 19.0, 25.0, 38.0, 45.0, 62.0, 63.0, 110.0, 115.0, 133.0, 80.0, 62.0, 59.0, 35.0, 24.0, 28.0, 19.0, 19.0, 12.0, 9.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.606910705566406e-05, -8.32732766866684e-05, -8.047744631767273e-05, -7.768161594867706e-05, -7.48857855796814e-05, -7.208995521068573e-05, -6.929412484169006e-05, -6.64982944726944e-05, -6.370246410369873e-05, -6.0906633734703064e-05, -5.81108033657074e-05, -5.531497299671173e-05, -5.2519142627716064e-05, -4.97233122587204e-05, -4.692748188972473e-05, -4.4131651520729065e-05, -4.13358211517334e-05, -3.853999078273773e-05, -3.5744160413742065e-05, -3.29483300447464e-05, -3.0152499675750732e-05, -2.7356669306755066e-05, -2.45608389377594e-05, -2.1765008568763733e-05, -1.8969178199768066e-05, -1.61733478307724e-05, -1.3377517461776733e-05, -1.0581687092781067e-05, -7.7858567237854e-06, -4.990026354789734e-06, -2.1941959857940674e-06, 6.016343832015991e-07, 3.3974647521972656e-06, 6.193295121192932e-06, 8.989125490188599e-06, 1.1784955859184265e-05, 1.4580786228179932e-05, 1.7376616597175598e-05, 2.0172446966171265e-05, 2.296827733516693e-05, 2.5764107704162598e-05, 2.8559938073158264e-05, 3.135576844215393e-05, 3.41515988111496e-05, 3.6947429180145264e-05, 3.974325954914093e-05, 4.25390899181366e-05, 4.533492028713226e-05, 4.813075065612793e-05, 5.0926581025123596e-05, 5.372241139411926e-05, 5.651824176311493e-05, 5.9314072132110596e-05, 6.210990250110626e-05, 6.490573287010193e-05, 6.77015632390976e-05, 7.049739360809326e-05, 7.329322397708893e-05, 7.60890543460846e-05, 7.888488471508026e-05, 8.168071508407593e-05, 8.44765454530716e-05, 8.727237582206726e-05, 9.006820619106293e-05, 9.28640365600586e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 9.0, 18.0, 24.0, 51.0, 110.0, 297.0, 1002.0, 5397.0, 275253.0, 754245.0, 10063.0, 1409.0, 407.0, 133.0, 77.0, 29.0, 15.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0908203125, -1.0622024536132812, -1.0335845947265625, -1.0049667358398438, -0.976348876953125, -0.9477310180664062, -0.9191131591796875, -0.8904953002929688, -0.86187744140625, -0.8332595825195312, -0.8046417236328125, -0.7760238647460938, -0.747406005859375, -0.7187881469726562, -0.6901702880859375, -0.6615524291992188, -0.6329345703125, -0.6043167114257812, -0.5756988525390625, -0.5470809936523438, -0.518463134765625, -0.48984527587890625, -0.4612274169921875, -0.43260955810546875, -0.40399169921875, -0.37537384033203125, -0.3467559814453125, -0.31813812255859375, -0.289520263671875, -0.26090240478515625, -0.2322845458984375, -0.20366668701171875, -0.175048828125, -0.14643096923828125, -0.1178131103515625, -0.08919525146484375, -0.060577392578125, -0.03195953369140625, -0.0033416748046875, 0.02527618408203125, 0.05389404296875, 0.08251190185546875, 0.1111297607421875, 0.13974761962890625, 0.168365478515625, 0.19698333740234375, 0.2256011962890625, 0.25421905517578125, 0.2828369140625, 0.31145477294921875, 0.3400726318359375, 0.36869049072265625, 0.397308349609375, 0.42592620849609375, 0.4545440673828125, 0.48316192626953125, 0.51177978515625, 0.5403976440429688, 0.5690155029296875, 0.5976333618164062, 0.626251220703125, 0.6548690795898438, 0.6834869384765625, 0.7121047973632812, 0.74072265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 8.0, 3.0, 10.0, 16.0, 15.0, 34.0, 35.0, 42.0, 74.0, 64.0, 86.0, 109.0, 125.0, 90.0, 59.0, 63.0, 43.0, 36.0, 25.0, 16.0, 12.0, 10.0, 10.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4189453125, -0.40431976318359375, -0.3896942138671875, -0.37506866455078125, -0.360443115234375, -0.34581756591796875, -0.3311920166015625, -0.31656646728515625, -0.30194091796875, -0.28731536865234375, -0.2726898193359375, -0.25806427001953125, -0.243438720703125, -0.22881317138671875, -0.2141876220703125, -0.19956207275390625, -0.1849365234375, -0.17031097412109375, -0.1556854248046875, -0.14105987548828125, -0.126434326171875, -0.11180877685546875, -0.0971832275390625, -0.08255767822265625, -0.06793212890625, -0.05330657958984375, -0.0386810302734375, -0.02405548095703125, -0.009429931640625, 0.00519561767578125, 0.0198211669921875, 0.03444671630859375, 0.049072265625, 0.06369781494140625, 0.0783233642578125, 0.09294891357421875, 0.107574462890625, 0.12220001220703125, 0.1368255615234375, 0.15145111083984375, 0.16607666015625, 0.18070220947265625, 0.1953277587890625, 0.20995330810546875, 0.224578857421875, 0.23920440673828125, 0.2538299560546875, 0.26845550537109375, 0.2830810546875, 0.29770660400390625, 0.3123321533203125, 0.32695770263671875, 0.341583251953125, 0.35620880126953125, 0.3708343505859375, 0.38545989990234375, 0.40008544921875, 0.41471099853515625, 0.4293365478515625, 0.44396209716796875, 0.458587646484375, 0.47321319580078125, 0.4878387451171875, 0.5024642944335938, 0.51708984375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 11.0, 53.0, 114.0, 248.0, 274.0, 167.0, 84.0, 25.0, 13.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.16891860961914, -15.74285888671875, -15.316798210144043, -14.890738487243652, -14.464678764343262, -14.038618087768555, -13.612558364868164, -13.186498641967773, -12.760438919067383, -12.334379196166992, -11.908318519592285, -11.482258796691895, -11.056199073791504, -10.630138397216797, -10.204078674316406, -9.778018951416016, -9.351958274841309, -8.925898551940918, -8.499837875366211, -8.07377815246582, -7.64771842956543, -7.221658229827881, -6.795598030090332, -6.369538307189941, -5.943478107452393, -5.517417907714844, -5.091358184814453, -4.665297985076904, -4.2392377853393555, -3.813178062438965, -3.387117862701416, -2.9610579013824463, -2.534998893737793, -2.1089389324188232, -1.682878851890564, -1.2568187713623047, -0.830758810043335, -0.40469884872436523, 0.021361351013183594, 0.4474213123321533, 0.873481273651123, 1.2995412349700928, 1.725601315498352, 2.1516613960266113, 2.577721357345581, 3.003781318664551, 3.4298415184020996, 3.8559014797210693, 4.281961441040039, 4.708021640777588, 5.1340813636779785, 5.560141563415527, 5.986201286315918, 6.412261486053467, 6.838321685791016, 7.264381408691406, 7.690441608428955, 8.116501808166504, 8.542561531066895, 8.968622207641602, 9.394681930541992, 9.820741653442383, 10.246801376342773, 10.67286205291748, 11.098921775817871]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 7.0, 10.0, 6.0, 7.0, 7.0, 22.0, 22.0, 21.0, 24.0, 38.0, 27.0, 29.0, 44.0, 49.0, 32.0, 50.0, 57.0, 55.0, 62.0, 55.0, 51.0, 46.0, 34.0, 45.0, 33.0, 23.0, 30.0, 22.0, 21.0, 19.0, 7.0, 7.0, 8.0, 4.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.240418434143066, -5.056118011474609, -4.8718180656433105, -4.687518119812012, -4.503217697143555, -4.318917274475098, -4.134617328643799, -3.950317144393921, -3.766016960144043, -3.581716775894165, -3.397416591644287, -3.213116407394409, -3.0288162231445312, -2.8445160388946533, -2.6602158546447754, -2.4759156703948975, -2.2916154861450195, -2.1073153018951416, -1.9230151176452637, -1.7387149333953857, -1.5544147491455078, -1.3701145648956299, -1.185814380645752, -1.001514196395874, -0.8172140121459961, -0.6329138278961182, -0.44861364364624023, -0.2643134593963623, -0.08001327514648438, 0.10428690910339355, 0.2885870933532715, 0.4728872776031494, 0.6571869850158691, 0.8414871692657471, 1.025787353515625, 1.210087537765503, 1.3943877220153809, 1.5786879062652588, 1.7629880905151367, 1.9472882747650146, 2.1315884590148926, 2.3158886432647705, 2.5001888275146484, 2.6844890117645264, 2.8687891960144043, 3.0530893802642822, 3.23738956451416, 3.421689748764038, 3.605989933013916, 3.790290117263794, 3.974590301513672, 4.158890724182129, 4.343190670013428, 4.527490615844727, 4.711791038513184, 4.896091461181641, 5.0803914070129395, 5.264691352844238, 5.448991775512695, 5.633292198181152, 5.817592144012451, 6.00189208984375, 6.186192512512207, 6.370492935180664, 6.554792881011963]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 7.0, 4.0, 16.0, 10.0, 19.0, 21.0, 31.0, 64.0, 89.0, 187.0, 380.0, 893.0, 3178.0, 17053.0, 313648.0, 3768992.0, 78342.0, 8243.0, 1822.0, 601.0, 269.0, 153.0, 81.0, 57.0, 33.0, 26.0, 17.0, 12.0, 14.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.130859375, -1.097900390625, -1.06494140625, -1.031982421875, -0.9990234375, -0.966064453125, -0.93310546875, -0.900146484375, -0.8671875, -0.834228515625, -0.80126953125, -0.768310546875, -0.7353515625, -0.702392578125, -0.66943359375, -0.636474609375, -0.603515625, -0.570556640625, -0.53759765625, -0.504638671875, -0.4716796875, -0.438720703125, -0.40576171875, -0.372802734375, -0.33984375, -0.306884765625, -0.27392578125, -0.240966796875, -0.2080078125, -0.175048828125, -0.14208984375, -0.109130859375, -0.076171875, -0.043212890625, -0.01025390625, 0.022705078125, 0.0556640625, 0.088623046875, 0.12158203125, 0.154541015625, 0.1875, 0.220458984375, 0.25341796875, 0.286376953125, 0.3193359375, 0.352294921875, 0.38525390625, 0.418212890625, 0.451171875, 0.484130859375, 0.51708984375, 0.550048828125, 0.5830078125, 0.615966796875, 0.64892578125, 0.681884765625, 0.71484375, 0.747802734375, 0.78076171875, 0.813720703125, 0.8466796875, 0.879638671875, 0.91259765625, 0.945556640625, 0.978515625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 10.0, 12.0, 16.0, 26.0, 27.0, 41.0, 52.0, 63.0, 77.0, 75.0, 73.0, 95.0, 83.0, 81.0, 62.0, 51.0, 43.0, 27.0, 28.0, 15.0, 16.0, 11.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.339111328125, -0.3261260986328125, -0.313140869140625, -0.3001556396484375, -0.28717041015625, -0.2741851806640625, -0.261199951171875, -0.2482147216796875, -0.2352294921875, -0.2222442626953125, -0.209259033203125, -0.1962738037109375, -0.18328857421875, -0.1703033447265625, -0.157318115234375, -0.1443328857421875, -0.13134765625, -0.1183624267578125, -0.105377197265625, -0.0923919677734375, -0.07940673828125, -0.0664215087890625, -0.053436279296875, -0.0404510498046875, -0.0274658203125, -0.0144805908203125, -0.001495361328125, 0.0114898681640625, 0.02447509765625, 0.0374603271484375, 0.050445556640625, 0.0634307861328125, 0.076416015625, 0.0894012451171875, 0.102386474609375, 0.1153717041015625, 0.12835693359375, 0.1413421630859375, 0.154327392578125, 0.1673126220703125, 0.1802978515625, 0.1932830810546875, 0.206268310546875, 0.2192535400390625, 0.23223876953125, 0.2452239990234375, 0.258209228515625, 0.2711944580078125, 0.2841796875, 0.2971649169921875, 0.310150146484375, 0.3231353759765625, 0.33612060546875, 0.3491058349609375, 0.362091064453125, 0.3750762939453125, 0.3880615234375, 0.4010467529296875, 0.414031982421875, 0.4270172119140625, 0.44000244140625, 0.4529876708984375, 0.465972900390625, 0.4789581298828125, 0.491943359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 3.0, 10.0, 5.0, 13.0, 13.0, 21.0, 21.0, 38.0, 77.0, 107.0, 179.0, 333.0, 828.0, 2679.0, 12223.0, 95268.0, 3615477.0, 431747.0, 28249.0, 4844.0, 1223.0, 427.0, 189.0, 105.0, 67.0, 29.0, 18.0, 15.0, 15.0, 11.0, 10.0, 8.0, 3.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77392578125, -0.7438430786132812, -0.7137603759765625, -0.6836776733398438, -0.653594970703125, -0.6235122680664062, -0.5934295654296875, -0.5633468627929688, -0.53326416015625, -0.5031814575195312, -0.4730987548828125, -0.44301605224609375, -0.412933349609375, -0.38285064697265625, -0.3527679443359375, -0.32268524169921875, -0.2926025390625, -0.26251983642578125, -0.2324371337890625, -0.20235443115234375, -0.172271728515625, -0.14218902587890625, -0.1121063232421875, -0.08202362060546875, -0.05194091796875, -0.02185821533203125, 0.0082244873046875, 0.03830718994140625, 0.068389892578125, 0.09847259521484375, 0.1285552978515625, 0.15863800048828125, 0.188720703125, 0.21880340576171875, 0.2488861083984375, 0.27896881103515625, 0.309051513671875, 0.33913421630859375, 0.3692169189453125, 0.39929962158203125, 0.42938232421875, 0.45946502685546875, 0.4895477294921875, 0.5196304321289062, 0.549713134765625, 0.5797958374023438, 0.6098785400390625, 0.6399612426757812, 0.6700439453125, 0.7001266479492188, 0.7302093505859375, 0.7602920532226562, 0.790374755859375, 0.8204574584960938, 0.8505401611328125, 0.8806228637695312, 0.91070556640625, 0.9407882690429688, 0.9708709716796875, 1.0009536743164062, 1.031036376953125, 1.0611190795898438, 1.0912017822265625, 1.1212844848632812, 1.1513671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 4.0, 8.0, 13.0, 11.0, 17.0, 23.0, 45.0, 65.0, 138.0, 285.0, 649.0, 1361.0, 766.0, 331.0, 146.0, 77.0, 38.0, 25.0, 15.0, 15.0, 17.0, 7.0, 6.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2529296875, -1.222808837890625, -1.19268798828125, -1.162567138671875, -1.1324462890625, -1.102325439453125, -1.07220458984375, -1.042083740234375, -1.011962890625, -0.981842041015625, -0.95172119140625, -0.921600341796875, -0.8914794921875, -0.861358642578125, -0.83123779296875, -0.801116943359375, -0.77099609375, -0.740875244140625, -0.71075439453125, -0.680633544921875, -0.6505126953125, -0.620391845703125, -0.59027099609375, -0.560150146484375, -0.530029296875, -0.499908447265625, -0.46978759765625, -0.439666748046875, -0.4095458984375, -0.379425048828125, -0.34930419921875, -0.319183349609375, -0.2890625, -0.258941650390625, -0.22882080078125, -0.198699951171875, -0.1685791015625, -0.138458251953125, -0.10833740234375, -0.078216552734375, -0.048095703125, -0.017974853515625, 0.01214599609375, 0.042266845703125, 0.0723876953125, 0.102508544921875, 0.13262939453125, 0.162750244140625, 0.19287109375, 0.222991943359375, 0.25311279296875, 0.283233642578125, 0.3133544921875, 0.343475341796875, 0.37359619140625, 0.403717041015625, 0.433837890625, 0.463958740234375, 0.49407958984375, 0.524200439453125, 0.5543212890625, 0.584442138671875, 0.61456298828125, 0.644683837890625, 0.6748046875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 6.0, 8.0, 14.0, 32.0, 69.0, 172.0, 209.0, 217.0, 138.0, 64.0, 30.0, 14.0, 6.0, 2.0, 7.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.639715194702148, -8.412349700927734, -8.184985160827637, -7.957619667053223, -7.730254173278809, -7.502889156341553, -7.275524139404297, -7.048158645629883, -6.820793628692627, -6.593428611755371, -6.366063117980957, -6.138698101043701, -5.911333084106445, -5.683967590332031, -5.456602573394775, -5.2292375564575195, -5.0018720626831055, -4.77450704574585, -4.5471415519714355, -4.31977653503418, -4.092411041259766, -3.8650460243225098, -3.637681007385254, -3.410315752029419, -3.182950496673584, -2.955585241317749, -2.728219985961914, -2.500854969024658, -2.2734897136688232, -2.0461244583129883, -1.8187593221664429, -1.5913941860198975, -1.3640289306640625, -1.1366636753082275, -0.9092985391616821, -0.6819333434104919, -0.45456814765930176, -0.2272028923034668, 0.00016224384307861328, 0.22752737998962402, 0.454892635345459, 0.6822578310966492, 0.9096230268478394, 1.1369881629943848, 1.3643534183502197, 1.5917186737060547, 1.8190838098526, 2.0464489459991455, 2.2738142013549805, 2.5011794567108154, 2.7285447120666504, 2.9559097290039062, 3.183274984359741, 3.410640239715576, 3.638005256652832, 3.865370512008667, 4.092735767364502, 4.320100784301758, 4.547466278076172, 4.774831295013428, 5.002196311950684, 5.229561805725098, 5.4569268226623535, 5.684291839599609, 5.911657333374023]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 7.0, 9.0, 4.0, 21.0, 24.0, 25.0, 26.0, 36.0, 50.0, 66.0, 55.0, 66.0, 70.0, 60.0, 65.0, 75.0, 55.0, 64.0, 54.0, 25.0, 24.0, 29.0, 22.0, 15.0, 17.0, 8.0, 7.0, 5.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.453827857971191, -4.315446376800537, -4.177064895629883, -4.0386834144592285, -3.900301933288574, -3.76192045211792, -3.6235389709472656, -3.4851574897766113, -3.346776008605957, -3.2083945274353027, -3.0700130462646484, -2.931631565093994, -2.79325008392334, -2.6548686027526855, -2.5164871215820312, -2.378105640411377, -2.2397241592407227, -2.1013426780700684, -1.962961196899414, -1.8245797157287598, -1.6861982345581055, -1.5478167533874512, -1.4094352722167969, -1.2710537910461426, -1.1326723098754883, -0.994290828704834, -0.8559093475341797, -0.7175278663635254, -0.5791463851928711, -0.4407649040222168, -0.3023834228515625, -0.1640019416809082, -0.025620460510253906, 0.11276102066040039, 0.2511425018310547, 0.389523983001709, 0.5279054641723633, 0.6662869453430176, 0.8046684265136719, 0.9430499076843262, 1.0814313888549805, 1.2198128700256348, 1.358194351196289, 1.4965758323669434, 1.6349573135375977, 1.773338794708252, 1.9117202758789062, 2.0501017570495605, 2.188483238220215, 2.326864719390869, 2.4652462005615234, 2.6036276817321777, 2.742009162902832, 2.8803906440734863, 3.0187721252441406, 3.157153606414795, 3.295535087585449, 3.4339165687561035, 3.572298049926758, 3.710679531097412, 3.8490610122680664, 3.9874424934387207, 4.125823974609375, 4.264205455780029, 4.402586936950684]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 11.0, 8.0, 13.0, 15.0, 28.0, 45.0, 72.0, 135.0, 228.0, 433.0, 790.0, 1660.0, 3467.0, 8098.0, 21052.0, 62056.0, 196013.0, 421623.0, 222423.0, 70072.0, 23789.0, 9002.0, 3823.0, 1765.0, 874.0, 414.0, 253.0, 152.0, 97.0, 51.0, 34.0, 18.0, 20.0, 11.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45166015625, -0.43637847900390625, -0.4210968017578125, -0.40581512451171875, -0.390533447265625, -0.37525177001953125, -0.3599700927734375, -0.34468841552734375, -0.32940673828125, -0.31412506103515625, -0.2988433837890625, -0.28356170654296875, -0.268280029296875, -0.25299835205078125, -0.2377166748046875, -0.22243499755859375, -0.2071533203125, -0.19187164306640625, -0.1765899658203125, -0.16130828857421875, -0.146026611328125, -0.13074493408203125, -0.1154632568359375, -0.10018157958984375, -0.08489990234375, -0.06961822509765625, -0.0543365478515625, -0.03905487060546875, -0.023773193359375, -0.00849151611328125, 0.0067901611328125, 0.02207183837890625, 0.037353515625, 0.05263519287109375, 0.0679168701171875, 0.08319854736328125, 0.098480224609375, 0.11376190185546875, 0.1290435791015625, 0.14432525634765625, 0.15960693359375, 0.17488861083984375, 0.1901702880859375, 0.20545196533203125, 0.220733642578125, 0.23601531982421875, 0.2512969970703125, 0.26657867431640625, 0.2818603515625, 0.29714202880859375, 0.3124237060546875, 0.32770538330078125, 0.342987060546875, 0.35826873779296875, 0.3735504150390625, 0.38883209228515625, 0.40411376953125, 0.41939544677734375, 0.4346771240234375, 0.44995880126953125, 0.465240478515625, 0.48052215576171875, 0.4958038330078125, 0.5110855102539062, 0.5263671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 7.0, 6.0, 9.0, 10.0, 11.0, 24.0, 33.0, 35.0, 32.0, 49.0, 45.0, 51.0, 56.0, 67.0, 57.0, 68.0, 57.0, 56.0, 50.0, 49.0, 37.0, 42.0, 31.0, 31.0, 20.0, 11.0, 8.0, 11.0, 9.0, 8.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.331298828125, -0.32183074951171875, -0.3123626708984375, -0.30289459228515625, -0.293426513671875, -0.28395843505859375, -0.2744903564453125, -0.26502227783203125, -0.25555419921875, -0.24608612060546875, -0.2366180419921875, -0.22714996337890625, -0.217681884765625, -0.20821380615234375, -0.1987457275390625, -0.18927764892578125, -0.1798095703125, -0.17034149169921875, -0.1608734130859375, -0.15140533447265625, -0.141937255859375, -0.13246917724609375, -0.1230010986328125, -0.11353302001953125, -0.10406494140625, -0.09459686279296875, -0.0851287841796875, -0.07566070556640625, -0.066192626953125, -0.05672454833984375, -0.0472564697265625, -0.03778839111328125, -0.0283203125, -0.01885223388671875, -0.0093841552734375, 8.392333984375e-05, 0.009552001953125, 0.01902008056640625, 0.0284881591796875, 0.03795623779296875, 0.04742431640625, 0.05689239501953125, 0.0663604736328125, 0.07582855224609375, 0.085296630859375, 0.09476470947265625, 0.1042327880859375, 0.11370086669921875, 0.1231689453125, 0.13263702392578125, 0.1421051025390625, 0.15157318115234375, 0.161041259765625, 0.17050933837890625, 0.1799774169921875, 0.18944549560546875, 0.19891357421875, 0.20838165283203125, 0.2178497314453125, 0.22731781005859375, 0.236785888671875, 0.24625396728515625, 0.2557220458984375, 0.26519012451171875, 0.274658203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 9.0, 14.0, 15.0, 18.0, 38.0, 50.0, 87.0, 103.0, 209.0, 408.0, 838.0, 1896.0, 6923.0, 76940.0, 850735.0, 98240.0, 8041.0, 2073.0, 904.0, 415.0, 203.0, 134.0, 95.0, 56.0, 37.0, 21.0, 20.0, 17.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0248565673828125, -0.986236572265625, -0.9476165771484375, -0.90899658203125, -0.8703765869140625, -0.831756591796875, -0.7931365966796875, -0.7545166015625, -0.7158966064453125, -0.677276611328125, -0.6386566162109375, -0.60003662109375, -0.5614166259765625, -0.522796630859375, -0.4841766357421875, -0.445556640625, -0.4069366455078125, -0.368316650390625, -0.3296966552734375, -0.29107666015625, -0.2524566650390625, -0.213836669921875, -0.1752166748046875, -0.1365966796875, -0.0979766845703125, -0.059356689453125, -0.0207366943359375, 0.01788330078125, 0.0565032958984375, 0.095123291015625, 0.1337432861328125, 0.17236328125, 0.2109832763671875, 0.249603271484375, 0.2882232666015625, 0.32684326171875, 0.3654632568359375, 0.404083251953125, 0.4427032470703125, 0.4813232421875, 0.5199432373046875, 0.558563232421875, 0.5971832275390625, 0.63580322265625, 0.6744232177734375, 0.713043212890625, 0.7516632080078125, 0.790283203125, 0.8289031982421875, 0.867523193359375, 0.9061431884765625, 0.94476318359375, 0.9833831787109375, 1.022003173828125, 1.0606231689453125, 1.0992431640625, 1.1378631591796875, 1.176483154296875, 1.2151031494140625, 1.25372314453125, 1.2923431396484375, 1.330963134765625, 1.3695831298828125, 1.408203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 3.0, 3.0, 13.0, 21.0, 13.0, 19.0, 26.0, 29.0, 36.0, 39.0, 53.0, 44.0, 47.0, 76.0, 59.0, 59.0, 62.0, 63.0, 50.0, 51.0, 36.0, 47.0, 41.0, 24.0, 28.0, 19.0, 13.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3857421875, -1.3437042236328125, -1.301666259765625, -1.2596282958984375, -1.21759033203125, -1.1755523681640625, -1.133514404296875, -1.0914764404296875, -1.0494384765625, -1.0074005126953125, -0.965362548828125, -0.9233245849609375, -0.88128662109375, -0.8392486572265625, -0.797210693359375, -0.7551727294921875, -0.713134765625, -0.6710968017578125, -0.629058837890625, -0.5870208740234375, -0.54498291015625, -0.5029449462890625, -0.460906982421875, -0.4188690185546875, -0.3768310546875, -0.3347930908203125, -0.292755126953125, -0.2507171630859375, -0.20867919921875, -0.1666412353515625, -0.124603271484375, -0.0825653076171875, -0.04052734375, 0.0015106201171875, 0.043548583984375, 0.0855865478515625, 0.12762451171875, 0.1696624755859375, 0.211700439453125, 0.2537384033203125, 0.2957763671875, 0.3378143310546875, 0.379852294921875, 0.4218902587890625, 0.46392822265625, 0.5059661865234375, 0.548004150390625, 0.5900421142578125, 0.632080078125, 0.6741180419921875, 0.716156005859375, 0.7581939697265625, 0.80023193359375, 0.8422698974609375, 0.884307861328125, 0.9263458251953125, 0.9683837890625, 1.0104217529296875, 1.052459716796875, 1.0944976806640625, 1.13653564453125, 1.1785736083984375, 1.220611572265625, 1.2626495361328125, 1.3046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 8.0, 8.0, 17.0, 22.0, 29.0, 50.0, 72.0, 181.0, 422.0, 1565.0, 10596.0, 732056.0, 294460.0, 7188.0, 1169.0, 376.0, 160.0, 68.0, 45.0, 26.0, 9.0, 6.0, 11.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80224609375, -0.7762985229492188, -0.7503509521484375, -0.7244033813476562, -0.698455810546875, -0.6725082397460938, -0.6465606689453125, -0.6206130981445312, -0.59466552734375, -0.5687179565429688, -0.5427703857421875, -0.5168228149414062, -0.490875244140625, -0.46492767333984375, -0.4389801025390625, -0.41303253173828125, -0.3870849609375, -0.36113739013671875, -0.3351898193359375, -0.30924224853515625, -0.283294677734375, -0.25734710693359375, -0.2313995361328125, -0.20545196533203125, -0.17950439453125, -0.15355682373046875, -0.1276092529296875, -0.10166168212890625, -0.075714111328125, -0.04976654052734375, -0.0238189697265625, 0.00212860107421875, 0.028076171875, 0.05402374267578125, 0.0799713134765625, 0.10591888427734375, 0.131866455078125, 0.15781402587890625, 0.1837615966796875, 0.20970916748046875, 0.23565673828125, 0.26160430908203125, 0.2875518798828125, 0.31349945068359375, 0.339447021484375, 0.36539459228515625, 0.3913421630859375, 0.41728973388671875, 0.4432373046875, 0.46918487548828125, 0.4951324462890625, 0.5210800170898438, 0.547027587890625, 0.5729751586914062, 0.5989227294921875, 0.6248703002929688, 0.65081787109375, 0.6767654418945312, 0.7027130126953125, 0.7286605834960938, 0.754608154296875, 0.7805557250976562, 0.8065032958984375, 0.8324508666992188, 0.8583984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 5.0, 3.0, 11.0, 15.0, 13.0, 18.0, 20.0, 41.0, 42.0, 51.0, 86.0, 137.0, 138.0, 107.0, 71.0, 54.0, 37.0, 32.0, 24.0, 18.0, 14.0, 12.0, 7.0, 9.0, 7.0, 6.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.600950241088867e-05, -8.296500891447067e-05, -7.992051541805267e-05, -7.687602192163467e-05, -7.383152842521667e-05, -7.078703492879868e-05, -6.774254143238068e-05, -6.469804793596268e-05, -6.165355443954468e-05, -5.860906094312668e-05, -5.556456744670868e-05, -5.252007395029068e-05, -4.947558045387268e-05, -4.643108695745468e-05, -4.338659346103668e-05, -4.034209996461868e-05, -3.7297606468200684e-05, -3.4253112971782684e-05, -3.1208619475364685e-05, -2.8164125978946686e-05, -2.5119632482528687e-05, -2.2075138986110687e-05, -1.9030645489692688e-05, -1.598615199327469e-05, -1.294165849685669e-05, -9.89716500043869e-06, -6.852671504020691e-06, -3.8081780076026917e-06, -7.636845111846924e-07, 2.280808985233307e-06, 5.325302481651306e-06, 8.369795978069305e-06, 1.1414289474487305e-05, 1.4458782970905304e-05, 1.7503276467323303e-05, 2.0547769963741302e-05, 2.3592263460159302e-05, 2.66367569565773e-05, 2.96812504529953e-05, 3.27257439494133e-05, 3.57702374458313e-05, 3.88147309422493e-05, 4.18592244386673e-05, 4.49037179350853e-05, 4.7948211431503296e-05, 5.0992704927921295e-05, 5.4037198424339294e-05, 5.7081691920757294e-05, 6.012618541717529e-05, 6.317067891359329e-05, 6.621517241001129e-05, 6.925966590642929e-05, 7.230415940284729e-05, 7.534865289926529e-05, 7.839314639568329e-05, 8.143763989210129e-05, 8.448213338851929e-05, 8.752662688493729e-05, 9.057112038135529e-05, 9.361561387777328e-05, 9.666010737419128e-05, 9.970460087060928e-05, 0.00010274909436702728, 0.00010579358786344528, 0.00010883808135986328]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 6.0, 1.0, 7.0, 5.0, 10.0, 11.0, 24.0, 24.0, 63.0, 111.0, 213.0, 479.0, 1143.0, 3869.0, 27808.0, 786863.0, 212717.0, 11258.0, 2365.0, 836.0, 324.0, 172.0, 84.0, 56.0, 28.0, 27.0, 17.0, 6.0, 10.0, 7.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.63427734375, -0.6149444580078125, -0.595611572265625, -0.5762786865234375, -0.55694580078125, -0.5376129150390625, -0.518280029296875, -0.4989471435546875, -0.4796142578125, -0.4602813720703125, -0.440948486328125, -0.4216156005859375, -0.40228271484375, -0.3829498291015625, -0.363616943359375, -0.3442840576171875, -0.324951171875, -0.3056182861328125, -0.286285400390625, -0.2669525146484375, -0.24761962890625, -0.2282867431640625, -0.208953857421875, -0.1896209716796875, -0.1702880859375, -0.1509552001953125, -0.131622314453125, -0.1122894287109375, -0.09295654296875, -0.0736236572265625, -0.054290771484375, -0.0349578857421875, -0.015625, 0.0037078857421875, 0.023040771484375, 0.0423736572265625, 0.06170654296875, 0.0810394287109375, 0.100372314453125, 0.1197052001953125, 0.1390380859375, 0.1583709716796875, 0.177703857421875, 0.1970367431640625, 0.21636962890625, 0.2357025146484375, 0.255035400390625, 0.2743682861328125, 0.293701171875, 0.3130340576171875, 0.332366943359375, 0.3516998291015625, 0.37103271484375, 0.3903656005859375, 0.409698486328125, 0.4290313720703125, 0.4483642578125, 0.4676971435546875, 0.487030029296875, 0.5063629150390625, 0.52569580078125, 0.5450286865234375, 0.564361572265625, 0.5836944580078125, 0.60302734375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 6.0, 9.0, 10.0, 15.0, 16.0, 33.0, 46.0, 48.0, 102.0, 119.0, 122.0, 129.0, 91.0, 71.0, 57.0, 31.0, 29.0, 17.0, 18.0, 16.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5712890625, -0.553314208984375, -0.53533935546875, -0.517364501953125, -0.4993896484375, -0.481414794921875, -0.46343994140625, -0.445465087890625, -0.427490234375, -0.409515380859375, -0.39154052734375, -0.373565673828125, -0.3555908203125, -0.337615966796875, -0.31964111328125, -0.301666259765625, -0.28369140625, -0.265716552734375, -0.24774169921875, -0.229766845703125, -0.2117919921875, -0.193817138671875, -0.17584228515625, -0.157867431640625, -0.139892578125, -0.121917724609375, -0.10394287109375, -0.085968017578125, -0.0679931640625, -0.050018310546875, -0.03204345703125, -0.014068603515625, 0.00390625, 0.021881103515625, 0.03985595703125, 0.057830810546875, 0.0758056640625, 0.093780517578125, 0.11175537109375, 0.129730224609375, 0.147705078125, 0.165679931640625, 0.18365478515625, 0.201629638671875, 0.2196044921875, 0.237579345703125, 0.25555419921875, 0.273529052734375, 0.29150390625, 0.309478759765625, 0.32745361328125, 0.345428466796875, 0.3634033203125, 0.381378173828125, 0.39935302734375, 0.417327880859375, 0.435302734375, 0.453277587890625, 0.47125244140625, 0.489227294921875, 0.5072021484375, 0.525177001953125, 0.54315185546875, 0.561126708984375, 0.5791015625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 40.0, 63.0, 106.0, 206.0, 227.0, 151.0, 100.0, 38.0, 26.0, 9.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.062172889709473, -3.8374850749969482, -3.612797260284424, -3.3881092071533203, -3.163421392440796, -2.9387335777282715, -2.714045763015747, -2.4893579483032227, -2.264669895172119, -2.0399820804595947, -1.8152941465377808, -1.5906063318252563, -1.3659183979034424, -1.141230583190918, -0.9165427684783936, -0.6918548345565796, -0.4671671390533447, -0.24247927963733673, -0.017791420221328735, 0.20689642429351807, 0.43158429861068726, 0.6562721729278564, 0.8809599876403809, 1.1056479215621948, 1.3303357362747192, 1.5550235509872437, 1.7797114849090576, 2.004399299621582, 2.2290871143341064, 2.453774929046631, 2.6784629821777344, 2.903150796890259, 3.127838611602783, 3.3525264263153076, 3.577214241027832, 3.8019022941589355, 4.026589870452881, 4.251277923583984, 4.47596549987793, 4.700653553009033, 4.925341606140137, 5.15002965927124, 5.3747172355651855, 5.599405288696289, 5.824092864990234, 6.048780918121338, 6.273468971252441, 6.498156547546387, 6.722844123840332, 6.9475321769714355, 7.172219753265381, 7.396907806396484, 7.62159538269043, 7.846283435821533, 8.070971488952637, 8.295659065246582, 8.520347595214844, 8.745035171508789, 8.96972370147705, 9.194411277770996, 9.419098854064941, 9.643787384033203, 9.868474960327148, 10.093162536621094, 10.317850112915039]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 11.0, 15.0, 14.0, 25.0, 27.0, 63.0, 45.0, 60.0, 96.0, 121.0, 94.0, 94.0, 63.0, 84.0, 55.0, 36.0, 28.0, 26.0, 16.0, 13.0, 6.0, 7.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.118273735046387, -7.866584300994873, -7.614894866943359, -7.3632049560546875, -7.111515522003174, -6.85982608795166, -6.608136177062988, -6.356446743011475, -6.104757308959961, -5.853067874908447, -5.601378440856934, -5.349688529968262, -5.097999095916748, -4.846309661865234, -4.5946197509765625, -4.342930316925049, -4.091240882873535, -3.8395514488220215, -3.5878617763519287, -3.336172103881836, -3.0844826698303223, -2.8327932357788086, -2.581103563308716, -2.329413890838623, -2.0777244567871094, -1.8260349035263062, -1.574345350265503, -1.3226557970046997, -1.0709662437438965, -0.8192766904830933, -0.56758713722229, -0.3158975839614868, -0.0642085075378418, 0.18748104572296143, 0.43917059898376465, 0.6908601522445679, 0.9425497055053711, 1.1942392587661743, 1.4459288120269775, 1.6976183652877808, 1.949307918548584, 2.2009973526000977, 2.4526870250701904, 2.704376697540283, 2.956066131591797, 3.2077555656433105, 3.4594452381134033, 3.711134910583496, 3.9628243446350098, 4.214513778686523, 4.466203689575195, 4.717893123626709, 4.969582557678223, 5.221271991729736, 5.47296142578125, 5.724651336669922, 5.9763407707214355, 6.228030204772949, 6.479720115661621, 6.731409549713135, 6.983098983764648, 7.234788417816162, 7.486477851867676, 7.738167762756348, 7.989857196807861]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 7.0, 12.0, 19.0, 25.0, 40.0, 71.0, 102.0, 281.0, 680.0, 2043.0, 9548.0, 105822.0, 3836436.0, 220713.0, 14139.0, 2868.0, 852.0, 315.0, 146.0, 57.0, 34.0, 24.0, 12.0, 7.0, 6.0, 11.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.091796875, -1.0649032592773438, -1.0380096435546875, -1.0111160278320312, -0.984222412109375, -0.9573287963867188, -0.9304351806640625, -0.9035415649414062, -0.87664794921875, -0.8497543334960938, -0.8228607177734375, -0.7959671020507812, -0.769073486328125, -0.7421798706054688, -0.7152862548828125, -0.6883926391601562, -0.6614990234375, -0.6346054077148438, -0.6077117919921875, -0.5808181762695312, -0.553924560546875, -0.5270309448242188, -0.5001373291015625, -0.47324371337890625, -0.44635009765625, -0.41945648193359375, -0.3925628662109375, -0.36566925048828125, -0.338775634765625, -0.31188201904296875, -0.2849884033203125, -0.25809478759765625, -0.231201171875, -0.20430755615234375, -0.1774139404296875, -0.15052032470703125, -0.123626708984375, -0.09673309326171875, -0.0698394775390625, -0.04294586181640625, -0.01605224609375, 0.01084136962890625, 0.0377349853515625, 0.06462860107421875, 0.091522216796875, 0.11841583251953125, 0.1453094482421875, 0.17220306396484375, 0.1990966796875, 0.22599029541015625, 0.2528839111328125, 0.27977752685546875, 0.306671142578125, 0.33356475830078125, 0.3604583740234375, 0.38735198974609375, 0.41424560546875, 0.44113922119140625, 0.4680328369140625, 0.49492645263671875, 0.521820068359375, 0.5487136840820312, 0.5756072998046875, 0.6025009155273438, 0.62939453125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 13.0, 14.0, 36.0, 68.0, 98.0, 121.0, 139.0, 155.0, 128.0, 85.0, 75.0, 36.0, 23.0, 10.0, 11.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77587890625, -0.7543792724609375, -0.732879638671875, -0.7113800048828125, -0.68988037109375, -0.6683807373046875, -0.646881103515625, -0.6253814697265625, -0.6038818359375, -0.5823822021484375, -0.560882568359375, -0.5393829345703125, -0.51788330078125, -0.4963836669921875, -0.474884033203125, -0.4533843994140625, -0.431884765625, -0.4103851318359375, -0.388885498046875, -0.3673858642578125, -0.34588623046875, -0.3243865966796875, -0.302886962890625, -0.2813873291015625, -0.2598876953125, -0.2383880615234375, -0.216888427734375, -0.1953887939453125, -0.17388916015625, -0.1523895263671875, -0.130889892578125, -0.1093902587890625, -0.087890625, -0.0663909912109375, -0.044891357421875, -0.0233917236328125, -0.00189208984375, 0.0196075439453125, 0.041107177734375, 0.0626068115234375, 0.0841064453125, 0.1056060791015625, 0.127105712890625, 0.1486053466796875, 0.17010498046875, 0.1916046142578125, 0.213104248046875, 0.2346038818359375, 0.256103515625, 0.2776031494140625, 0.299102783203125, 0.3206024169921875, 0.34210205078125, 0.3636016845703125, 0.385101318359375, 0.4066009521484375, 0.4281005859375, 0.4496002197265625, 0.471099853515625, 0.4925994873046875, 0.51409912109375, 0.5355987548828125, 0.557098388671875, 0.5785980224609375, 0.60009765625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 3.0, 6.0, 9.0, 26.0, 44.0, 70.0, 160.0, 438.0, 1198.0, 4702.0, 27905.0, 557137.0, 3515552.0, 74160.0, 9540.0, 2199.0, 689.0, 261.0, 93.0, 36.0, 23.0, 15.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59521484375, -0.5684280395507812, -0.5416412353515625, -0.5148544311523438, -0.488067626953125, -0.46128082275390625, -0.4344940185546875, -0.40770721435546875, -0.38092041015625, -0.35413360595703125, -0.3273468017578125, -0.30055999755859375, -0.273773193359375, -0.24698638916015625, -0.2201995849609375, -0.19341278076171875, -0.1666259765625, -0.13983917236328125, -0.1130523681640625, -0.08626556396484375, -0.059478759765625, -0.03269195556640625, -0.0059051513671875, 0.02088165283203125, 0.04766845703125, 0.07445526123046875, 0.1012420654296875, 0.12802886962890625, 0.154815673828125, 0.18160247802734375, 0.2083892822265625, 0.23517608642578125, 0.261962890625, 0.28874969482421875, 0.3155364990234375, 0.34232330322265625, 0.369110107421875, 0.39589691162109375, 0.4226837158203125, 0.44947052001953125, 0.47625732421875, 0.5030441284179688, 0.5298309326171875, 0.5566177368164062, 0.583404541015625, 0.6101913452148438, 0.6369781494140625, 0.6637649536132812, 0.6905517578125, 0.7173385620117188, 0.7441253662109375, 0.7709121704101562, 0.797698974609375, 0.8244857788085938, 0.8512725830078125, 0.8780593872070312, 0.90484619140625, 0.9316329956054688, 0.9584197998046875, 0.9852066040039062, 1.011993408203125, 1.0387802124023438, 1.0655670166015625, 1.0923538208007812, 1.119140625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 8.0, 13.0, 15.0, 19.0, 32.0, 33.0, 77.0, 132.0, 261.0, 569.0, 1195.0, 928.0, 383.0, 182.0, 79.0, 42.0, 30.0, 15.0, 26.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.81201171875, -0.7892913818359375, -0.766571044921875, -0.7438507080078125, -0.72113037109375, -0.6984100341796875, -0.675689697265625, -0.6529693603515625, -0.6302490234375, -0.6075286865234375, -0.584808349609375, -0.5620880126953125, -0.53936767578125, -0.5166473388671875, -0.493927001953125, -0.4712066650390625, -0.448486328125, -0.4257659912109375, -0.403045654296875, -0.3803253173828125, -0.35760498046875, -0.3348846435546875, -0.312164306640625, -0.2894439697265625, -0.2667236328125, -0.2440032958984375, -0.221282958984375, -0.1985626220703125, -0.17584228515625, -0.1531219482421875, -0.130401611328125, -0.1076812744140625, -0.0849609375, -0.0622406005859375, -0.039520263671875, -0.0167999267578125, 0.00592041015625, 0.0286407470703125, 0.051361083984375, 0.0740814208984375, 0.0968017578125, 0.1195220947265625, 0.142242431640625, 0.1649627685546875, 0.18768310546875, 0.2104034423828125, 0.233123779296875, 0.2558441162109375, 0.278564453125, 0.3012847900390625, 0.324005126953125, 0.3467254638671875, 0.36944580078125, 0.3921661376953125, 0.414886474609375, 0.4376068115234375, 0.4603271484375, 0.4830474853515625, 0.505767822265625, 0.5284881591796875, 0.55120849609375, 0.5739288330078125, 0.596649169921875, 0.6193695068359375, 0.64208984375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 5.0, 11.0, 52.0, 131.0, 336.0, 321.0, 97.0, 24.0, 3.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.753754615783691, -10.455516815185547, -10.157278060913086, -9.859040260314941, -9.560802459716797, -9.262564659118652, -8.964326858520508, -8.666088104248047, -8.367850303649902, -8.069612503051758, -7.771374225616455, -7.473135948181152, -7.174898147583008, -6.876660346984863, -6.5784220695495605, -6.280183792114258, -5.981945991516113, -5.683708190917969, -5.385469913482666, -5.087231636047363, -4.788993835449219, -4.490756034851074, -4.1925177574157715, -3.894279718399048, -3.596041679382324, -3.2978036403656006, -2.999565601348877, -2.7013275623321533, -2.4030895233154297, -2.104851484298706, -1.8066134452819824, -1.5083754062652588, -1.2101364135742188, -0.9118983745574951, -0.6136603355407715, -0.31542229652404785, -0.01718425750732422, 0.2810537815093994, 0.579291820526123, 0.8775298595428467, 1.1757678985595703, 1.474005937576294, 1.7722439765930176, 2.070482015609741, 2.368720054626465, 2.6669580936431885, 2.965196132659912, 3.2634341716766357, 3.5616722106933594, 3.859910249710083, 4.158148288726807, 4.456386566162109, 4.754624366760254, 5.052862167358398, 5.351100444793701, 5.649338722229004, 5.947576522827148, 6.245814323425293, 6.544052600860596, 6.842290878295898, 7.140528678894043, 7.4387664794921875, 7.73700475692749, 8.035243034362793, 8.333480834960938]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 11.0, 17.0, 11.0, 14.0, 24.0, 31.0, 40.0, 48.0, 58.0, 61.0, 71.0, 66.0, 65.0, 72.0, 69.0, 60.0, 51.0, 59.0, 37.0, 31.0, 22.0, 21.0, 15.0, 8.0, 11.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5510036945343018, -3.4221067428588867, -3.2932097911834717, -3.1643128395080566, -3.0354161262512207, -2.9065191745758057, -2.7776222229003906, -2.6487252712249756, -2.5198283195495605, -2.3909313678741455, -2.2620344161987305, -2.1331377029418945, -2.0042407512664795, -1.8753437995910645, -1.7464468479156494, -1.6175498962402344, -1.4886531829833984, -1.3597562313079834, -1.230859398841858, -1.1019624471664429, -0.9730655550956726, -0.8441686630249023, -0.7152717113494873, -0.586374819278717, -0.4574779272079468, -0.3285810351371765, -0.19968411326408386, -0.07078719139099121, 0.05810970067977905, 0.18700659275054932, 0.31590354442596436, 0.4448004364967346, 0.573697566986084, 0.7025944590568542, 0.8314913511276245, 0.9603883028030396, 1.089285135269165, 1.21818208694458, 1.3470790386199951, 1.4759759902954102, 1.6048728227615356, 1.7337697744369507, 1.8626666069030762, 1.9915635585784912, 2.1204605102539062, 2.249357223510742, 2.3782544136047363, 2.5071511268615723, 2.6360480785369873, 2.7649450302124023, 2.8938419818878174, 3.0227389335632324, 3.1516356468200684, 3.2805325984954834, 3.4094295501708984, 3.5383265018463135, 3.6672234535217285, 3.7961204051971436, 3.9250173568725586, 4.0539140701293945, 4.182811260223389, 4.311707973480225, 4.440605163574219, 4.569501876831055, 4.698398590087891]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 8.0, 15.0, 17.0, 18.0, 33.0, 55.0, 70.0, 118.0, 195.0, 325.0, 570.0, 1031.0, 1995.0, 4132.0, 8867.0, 21742.0, 61317.0, 196840.0, 425841.0, 216274.0, 66683.0, 23658.0, 9586.0, 4473.0, 2084.0, 1141.0, 577.0, 359.0, 190.0, 117.0, 78.0, 49.0, 25.0, 16.0, 12.0, 10.0, 9.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.50732421875, -0.49304962158203125, -0.4787750244140625, -0.46450042724609375, -0.450225830078125, -0.43595123291015625, -0.4216766357421875, -0.40740203857421875, -0.39312744140625, -0.37885284423828125, -0.3645782470703125, -0.35030364990234375, -0.336029052734375, -0.32175445556640625, -0.3074798583984375, -0.29320526123046875, -0.2789306640625, -0.26465606689453125, -0.2503814697265625, -0.23610687255859375, -0.221832275390625, -0.20755767822265625, -0.1932830810546875, -0.17900848388671875, -0.16473388671875, -0.15045928955078125, -0.1361846923828125, -0.12191009521484375, -0.107635498046875, -0.09336090087890625, -0.0790863037109375, -0.06481170654296875, -0.050537109375, -0.03626251220703125, -0.0219879150390625, -0.00771331787109375, 0.006561279296875, 0.02083587646484375, 0.0351104736328125, 0.04938507080078125, 0.06365966796875, 0.07793426513671875, 0.0922088623046875, 0.10648345947265625, 0.120758056640625, 0.13503265380859375, 0.1493072509765625, 0.16358184814453125, 0.1778564453125, 0.19213104248046875, 0.2064056396484375, 0.22068023681640625, 0.234954833984375, 0.24922943115234375, 0.2635040283203125, 0.27777862548828125, 0.29205322265625, 0.30632781982421875, 0.3206024169921875, 0.33487701416015625, 0.349151611328125, 0.36342620849609375, 0.3777008056640625, 0.39197540283203125, 0.40625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 12.0, 15.0, 24.0, 31.0, 44.0, 46.0, 68.0, 64.0, 60.0, 79.0, 85.0, 86.0, 79.0, 59.0, 53.0, 51.0, 39.0, 23.0, 24.0, 18.0, 12.0, 5.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.48388671875, -0.4719276428222656, -0.45996856689453125, -0.4480094909667969, -0.4360504150390625, -0.4240913391113281, -0.41213226318359375, -0.4001731872558594, -0.388214111328125, -0.3762550354003906, -0.36429595947265625, -0.3523368835449219, -0.3403778076171875, -0.3284187316894531, -0.31645965576171875, -0.3045005798339844, -0.29254150390625, -0.2805824279785156, -0.26862335205078125, -0.2566642761230469, -0.2447052001953125, -0.23274612426757812, -0.22078704833984375, -0.20882797241210938, -0.196868896484375, -0.18490982055664062, -0.17295074462890625, -0.16099166870117188, -0.1490325927734375, -0.13707351684570312, -0.12511444091796875, -0.11315536499023438, -0.1011962890625, -0.08923721313476562, -0.07727813720703125, -0.06531906127929688, -0.0533599853515625, -0.041400909423828125, -0.02944183349609375, -0.017482757568359375, -0.005523681640625, 0.006435394287109375, 0.01839447021484375, 0.030353546142578125, 0.0423126220703125, 0.054271697998046875, 0.06623077392578125, 0.07818984985351562, 0.09014892578125, 0.10210800170898438, 0.11406707763671875, 0.12602615356445312, 0.1379852294921875, 0.14994430541992188, 0.16190338134765625, 0.17386245727539062, 0.185821533203125, 0.19778060913085938, 0.20973968505859375, 0.22169876098632812, 0.2336578369140625, 0.24561691284179688, 0.25757598876953125, 0.2695350646972656, 0.281494140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 9.0, 2.0, 8.0, 18.0, 18.0, 25.0, 40.0, 75.0, 108.0, 258.0, 519.0, 1325.0, 5005.0, 45453.0, 784854.0, 194458.0, 12450.0, 2441.0, 744.0, 345.0, 170.0, 85.0, 51.0, 30.0, 20.0, 11.0, 11.0, 6.0, 2.0, 2.0, 4.0, 7.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.619140625, -1.5812530517578125, -1.543365478515625, -1.5054779052734375, -1.46759033203125, -1.4297027587890625, -1.391815185546875, -1.3539276123046875, -1.3160400390625, -1.2781524658203125, -1.240264892578125, -1.2023773193359375, -1.16448974609375, -1.1266021728515625, -1.088714599609375, -1.0508270263671875, -1.012939453125, -0.9750518798828125, -0.937164306640625, -0.8992767333984375, -0.86138916015625, -0.8235015869140625, -0.785614013671875, -0.7477264404296875, -0.7098388671875, -0.6719512939453125, -0.634063720703125, -0.5961761474609375, -0.55828857421875, -0.5204010009765625, -0.482513427734375, -0.4446258544921875, -0.40673828125, -0.3688507080078125, -0.330963134765625, -0.2930755615234375, -0.25518798828125, -0.2173004150390625, -0.179412841796875, -0.1415252685546875, -0.1036376953125, -0.0657501220703125, -0.027862548828125, 0.0100250244140625, 0.04791259765625, 0.0858001708984375, 0.123687744140625, 0.1615753173828125, 0.199462890625, 0.2373504638671875, 0.275238037109375, 0.3131256103515625, 0.35101318359375, 0.3889007568359375, 0.426788330078125, 0.4646759033203125, 0.5025634765625, 0.5404510498046875, 0.578338623046875, 0.6162261962890625, 0.65411376953125, 0.6920013427734375, 0.729888916015625, 0.7677764892578125, 0.8056640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 11.0, 10.0, 10.0, 12.0, 26.0, 28.0, 34.0, 35.0, 46.0, 39.0, 52.0, 61.0, 61.0, 62.0, 55.0, 66.0, 61.0, 49.0, 53.0, 47.0, 35.0, 27.0, 31.0, 24.0, 20.0, 11.0, 10.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1182403564453125, -1.082183837890625, -1.0461273193359375, -1.01007080078125, -0.9740142822265625, -0.937957763671875, -0.9019012451171875, -0.8658447265625, -0.8297882080078125, -0.793731689453125, -0.7576751708984375, -0.72161865234375, -0.6855621337890625, -0.649505615234375, -0.6134490966796875, -0.577392578125, -0.5413360595703125, -0.505279541015625, -0.4692230224609375, -0.43316650390625, -0.3971099853515625, -0.361053466796875, -0.3249969482421875, -0.2889404296875, -0.2528839111328125, -0.216827392578125, -0.1807708740234375, -0.14471435546875, -0.1086578369140625, -0.072601318359375, -0.0365447998046875, -0.00048828125, 0.0355682373046875, 0.071624755859375, 0.1076812744140625, 0.14373779296875, 0.1797943115234375, 0.215850830078125, 0.2519073486328125, 0.2879638671875, 0.3240203857421875, 0.360076904296875, 0.3961334228515625, 0.43218994140625, 0.4682464599609375, 0.504302978515625, 0.5403594970703125, 0.576416015625, 0.6124725341796875, 0.648529052734375, 0.6845855712890625, 0.72064208984375, 0.7566986083984375, 0.792755126953125, 0.8288116455078125, 0.8648681640625, 0.9009246826171875, 0.936981201171875, 0.9730377197265625, 1.00909423828125, 1.0451507568359375, 1.081207275390625, 1.1172637939453125, 1.1533203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 11.0, 11.0, 37.0, 82.0, 173.0, 692.0, 5337.0, 895511.0, 143496.0, 2469.0, 422.0, 152.0, 58.0, 30.0, 21.0, 7.0, 9.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0234375, -0.991302490234375, -0.95916748046875, -0.927032470703125, -0.8948974609375, -0.862762451171875, -0.83062744140625, -0.798492431640625, -0.766357421875, -0.734222412109375, -0.70208740234375, -0.669952392578125, -0.6378173828125, -0.605682373046875, -0.57354736328125, -0.541412353515625, -0.50927734375, -0.477142333984375, -0.44500732421875, -0.412872314453125, -0.3807373046875, -0.348602294921875, -0.31646728515625, -0.284332275390625, -0.252197265625, -0.220062255859375, -0.18792724609375, -0.155792236328125, -0.1236572265625, -0.091522216796875, -0.05938720703125, -0.027252197265625, 0.0048828125, 0.037017822265625, 0.06915283203125, 0.101287841796875, 0.1334228515625, 0.165557861328125, 0.19769287109375, 0.229827880859375, 0.261962890625, 0.294097900390625, 0.32623291015625, 0.358367919921875, 0.3905029296875, 0.422637939453125, 0.45477294921875, 0.486907958984375, 0.51904296875, 0.551177978515625, 0.58331298828125, 0.615447998046875, 0.6475830078125, 0.679718017578125, 0.71185302734375, 0.743988037109375, 0.776123046875, 0.808258056640625, 0.84039306640625, 0.872528076171875, 0.9046630859375, 0.936798095703125, 0.96893310546875, 1.001068115234375, 1.033203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 7.0, 8.0, 3.0, 5.0, 11.0, 14.0, 14.0, 24.0, 29.0, 38.0, 44.0, 49.0, 62.0, 89.0, 99.0, 84.0, 84.0, 82.0, 46.0, 47.0, 34.0, 18.0, 17.0, 20.0, 12.0, 14.0, 4.0, 11.0, 6.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.18832015991211e-05, -6.989296525716782e-05, -6.790272891521454e-05, -6.591249257326126e-05, -6.392225623130798e-05, -6.19320198893547e-05, -5.994178354740143e-05, -5.795154720544815e-05, -5.596131086349487e-05, -5.3971074521541595e-05, -5.198083817958832e-05, -4.999060183763504e-05, -4.800036549568176e-05, -4.6010129153728485e-05, -4.401989281177521e-05, -4.202965646982193e-05, -4.003942012786865e-05, -3.8049183785915375e-05, -3.60589474439621e-05, -3.406871110200882e-05, -3.207847476005554e-05, -3.0088238418102264e-05, -2.8098002076148987e-05, -2.610776573419571e-05, -2.411752939224243e-05, -2.2127293050289154e-05, -2.0137056708335876e-05, -1.81468203663826e-05, -1.615658402442932e-05, -1.4166347682476044e-05, -1.2176111340522766e-05, -1.0185874998569489e-05, -8.195638656616211e-06, -6.205402314662933e-06, -4.215165972709656e-06, -2.224929630756378e-06, -2.3469328880310059e-07, 1.755543053150177e-06, 3.7457793951034546e-06, 5.736015737056732e-06, 7.72625207901001e-06, 9.716488420963287e-06, 1.1706724762916565e-05, 1.3696961104869843e-05, 1.568719744682312e-05, 1.7677433788776398e-05, 1.9667670130729675e-05, 2.1657906472682953e-05, 2.364814281463623e-05, 2.5638379156589508e-05, 2.7628615498542786e-05, 2.9618851840496063e-05, 3.160908818244934e-05, 3.359932452440262e-05, 3.5589560866355896e-05, 3.7579797208309174e-05, 3.957003355026245e-05, 4.156026989221573e-05, 4.3550506234169006e-05, 4.5540742576122284e-05, 4.753097891807556e-05, 4.952121526002884e-05, 5.151145160198212e-05, 5.3501687943935394e-05, 5.549192428588867e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 9.0, 15.0, 20.0, 47.0, 77.0, 109.0, 270.0, 644.0, 2156.0, 12432.0, 345578.0, 665005.0, 18082.0, 2715.0, 778.0, 282.0, 137.0, 63.0, 41.0, 29.0, 14.0, 12.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40576171875, -0.38890838623046875, -0.3720550537109375, -0.35520172119140625, -0.338348388671875, -0.32149505615234375, -0.3046417236328125, -0.28778839111328125, -0.27093505859375, -0.25408172607421875, -0.2372283935546875, -0.22037506103515625, -0.203521728515625, -0.18666839599609375, -0.1698150634765625, -0.15296173095703125, -0.1361083984375, -0.11925506591796875, -0.1024017333984375, -0.08554840087890625, -0.068695068359375, -0.05184173583984375, -0.0349884033203125, -0.01813507080078125, -0.00128173828125, 0.01557159423828125, 0.0324249267578125, 0.04927825927734375, 0.066131591796875, 0.08298492431640625, 0.0998382568359375, 0.11669158935546875, 0.133544921875, 0.15039825439453125, 0.1672515869140625, 0.18410491943359375, 0.200958251953125, 0.21781158447265625, 0.2346649169921875, 0.25151824951171875, 0.26837158203125, 0.28522491455078125, 0.3020782470703125, 0.31893157958984375, 0.335784912109375, 0.35263824462890625, 0.3694915771484375, 0.38634490966796875, 0.4031982421875, 0.42005157470703125, 0.4369049072265625, 0.45375823974609375, 0.470611572265625, 0.48746490478515625, 0.5043182373046875, 0.5211715698242188, 0.53802490234375, 0.5548782348632812, 0.5717315673828125, 0.5885848999023438, 0.605438232421875, 0.6222915649414062, 0.6391448974609375, 0.6559982299804688, 0.6728515625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 12.0, 10.0, 12.0, 17.0, 20.0, 31.0, 27.0, 38.0, 47.0, 71.0, 64.0, 65.0, 70.0, 76.0, 66.0, 69.0, 62.0, 54.0, 33.0, 30.0, 31.0, 17.0, 15.0, 8.0, 12.0, 12.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.283203125, -0.2750988006591797, -0.2669944763183594, -0.25889015197753906, -0.25078582763671875, -0.24268150329589844, -0.23457717895507812, -0.2264728546142578, -0.2183685302734375, -0.2102642059326172, -0.20215988159179688, -0.19405555725097656, -0.18595123291015625, -0.17784690856933594, -0.16974258422851562, -0.1616382598876953, -0.153533935546875, -0.1454296112060547, -0.13732528686523438, -0.12922096252441406, -0.12111663818359375, -0.11301231384277344, -0.10490798950195312, -0.09680366516113281, -0.0886993408203125, -0.08059501647949219, -0.07249069213867188, -0.06438636779785156, -0.05628204345703125, -0.04817771911621094, -0.040073394775390625, -0.03196907043457031, -0.02386474609375, -0.015760421752929688, -0.007656097412109375, 0.0004482269287109375, 0.00855255126953125, 0.016656875610351562, 0.024761199951171875, 0.03286552429199219, 0.0409698486328125, 0.04907417297363281, 0.057178497314453125, 0.06528282165527344, 0.07338714599609375, 0.08149147033691406, 0.08959579467773438, 0.09770011901855469, 0.105804443359375, 0.11390876770019531, 0.12201309204101562, 0.13011741638183594, 0.13822174072265625, 0.14632606506347656, 0.15443038940429688, 0.1625347137451172, 0.1706390380859375, 0.1787433624267578, 0.18684768676757812, 0.19495201110839844, 0.20305633544921875, 0.21116065979003906, 0.21926498413085938, 0.2273693084716797, 0.2354736328125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 1.0, 21.0, 147.0, 463.0, 282.0, 59.0, 13.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.77346420288086, -20.297883987426758, -19.822303771972656, -19.346725463867188, -18.871145248413086, -18.395565032958984, -17.919984817504883, -17.444406509399414, -16.968826293945312, -16.49324607849121, -16.01766586303711, -15.542086601257324, -15.066507339477539, -14.590927124023438, -14.115347862243652, -13.63976764678955, -13.164188385009766, -12.688608169555664, -12.213028907775879, -11.737448692321777, -11.261869430541992, -10.78628921508789, -10.310709953308105, -9.835129737854004, -9.359549522399902, -8.8839693069458, -8.408390045166016, -7.932810306549072, -7.457230567932129, -6.981650352478027, -6.506071090698242, -6.030490875244141, -5.5549116134643555, -5.079331874847412, -4.603752136230469, -4.128172397613525, -3.652592658996582, -3.1770126819610596, -2.701432943344116, -2.225853204727173, -1.7502734661102295, -1.2746937274932861, -0.799113929271698, -0.32353413105010986, 0.1520456075668335, 0.6276254653930664, 1.1032052040100098, 1.5787849426269531, 2.0543646812438965, 2.52994441986084, 3.005524158477783, 3.4811038970947266, 3.95668363571167, 4.432263374328613, 4.907843589782715, 5.3834228515625, 5.859003067016602, 6.334582805633545, 6.810162544250488, 7.285742282867432, 7.761322021484375, 8.236902236938477, 8.712481498718262, 9.188061714172363, 9.663640975952148]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 2.0, 5.0, 8.0, 12.0, 16.0, 23.0, 19.0, 19.0, 22.0, 26.0, 32.0, 40.0, 42.0, 45.0, 45.0, 57.0, 54.0, 63.0, 58.0, 64.0, 41.0, 43.0, 37.0, 42.0, 38.0, 26.0, 19.0, 18.0, 17.0, 8.0, 17.0, 16.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.266371726989746, -5.125722885131836, -4.985073566436768, -4.844424724578857, -4.703775405883789, -4.563126564025879, -4.422477722167969, -4.2818284034729, -4.14117956161499, -4.00053071975708, -3.8598814010620117, -3.7192325592041016, -3.5785834789276123, -3.437934398651123, -3.297285318374634, -3.1566362380981445, -3.0159871578216553, -2.875338077545166, -2.7346889972686768, -2.5940399169921875, -2.4533910751342773, -2.312741994857788, -2.172092914581299, -2.0314438343048096, -1.8907948732376099, -1.7501457929611206, -1.609496831893921, -1.4688477516174316, -1.3281986713409424, -1.1875497102737427, -1.0469006299972534, -0.9062516093254089, -0.7656025886535645, -0.62495356798172, -0.4843045175075531, -0.34365546703338623, -0.20300644636154175, -0.062357425689697266, 0.07829165458679199, 0.21894067525863647, 0.35958969593048096, 0.5002387166023254, 0.6408877372741699, 0.7815368175506592, 0.9221858382225037, 1.0628348588943481, 1.2034839391708374, 1.344132900238037, 1.4847819805145264, 1.6254310607910156, 1.7660800218582153, 1.9067291021347046, 2.0473780632019043, 2.1880271434783936, 2.328676223754883, 2.469325304031372, 2.6099743843078613, 2.7506234645843506, 2.89127254486084, 3.03192138671875, 3.1725704669952393, 3.3132195472717285, 3.4538686275482178, 3.594517707824707, 3.735166549682617]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 14.0, 15.0, 25.0, 31.0, 62.0, 102.0, 157.0, 289.0, 534.0, 1178.0, 3078.0, 9942.0, 41256.0, 326890.0, 2927550.0, 787342.0, 72424.0, 15550.0, 4613.0, 1674.0, 694.0, 381.0, 208.0, 101.0, 57.0, 29.0, 28.0, 16.0, 10.0, 10.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42236328125, -0.40943145751953125, -0.3964996337890625, -0.38356781005859375, -0.370635986328125, -0.35770416259765625, -0.3447723388671875, -0.33184051513671875, -0.31890869140625, -0.30597686767578125, -0.2930450439453125, -0.28011322021484375, -0.267181396484375, -0.25424957275390625, -0.2413177490234375, -0.22838592529296875, -0.2154541015625, -0.20252227783203125, -0.1895904541015625, -0.17665863037109375, -0.163726806640625, -0.15079498291015625, -0.1378631591796875, -0.12493133544921875, -0.11199951171875, -0.09906768798828125, -0.0861358642578125, -0.07320404052734375, -0.060272216796875, -0.04734039306640625, -0.0344085693359375, -0.02147674560546875, -0.008544921875, 0.00438690185546875, 0.0173187255859375, 0.03025054931640625, 0.043182373046875, 0.05611419677734375, 0.0690460205078125, 0.08197784423828125, 0.09490966796875, 0.10784149169921875, 0.1207733154296875, 0.13370513916015625, 0.146636962890625, 0.15956878662109375, 0.1725006103515625, 0.18543243408203125, 0.1983642578125, 0.21129608154296875, 0.2242279052734375, 0.23715972900390625, 0.250091552734375, 0.26302337646484375, 0.2759552001953125, 0.28888702392578125, 0.30181884765625, 0.31475067138671875, 0.3276824951171875, 0.34061431884765625, 0.353546142578125, 0.36647796630859375, 0.3794097900390625, 0.39234161376953125, 0.4052734375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 6.0, 10.0, 13.0, 16.0, 27.0, 32.0, 42.0, 36.0, 61.0, 67.0, 75.0, 81.0, 73.0, 89.0, 69.0, 56.0, 46.0, 41.0, 39.0, 34.0, 28.0, 18.0, 8.0, 11.0, 11.0, 9.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.3710136413574219, -0.36141204833984375, -0.3518104553222656, -0.3422088623046875, -0.3326072692871094, -0.32300567626953125, -0.3134040832519531, -0.303802490234375, -0.2942008972167969, -0.28459930419921875, -0.2749977111816406, -0.2653961181640625, -0.2557945251464844, -0.24619293212890625, -0.23659133911132812, -0.22698974609375, -0.21738815307617188, -0.20778656005859375, -0.19818496704101562, -0.1885833740234375, -0.17898178100585938, -0.16938018798828125, -0.15977859497070312, -0.150177001953125, -0.14057540893554688, -0.13097381591796875, -0.12137222290039062, -0.1117706298828125, -0.10216903686523438, -0.09256744384765625, -0.08296585083007812, -0.0733642578125, -0.06376266479492188, -0.05416107177734375, -0.044559478759765625, -0.0349578857421875, -0.025356292724609375, -0.01575469970703125, -0.006153106689453125, 0.003448486328125, 0.013050079345703125, 0.02265167236328125, 0.032253265380859375, 0.0418548583984375, 0.051456451416015625, 0.06105804443359375, 0.07065963745117188, 0.08026123046875, 0.08986282348632812, 0.09946441650390625, 0.10906600952148438, 0.1186676025390625, 0.12826919555664062, 0.13787078857421875, 0.14747238159179688, 0.157073974609375, 0.16667556762695312, 0.17627716064453125, 0.18587875366210938, 0.1954803466796875, 0.20508193969726562, 0.21468353271484375, 0.22428512573242188, 0.23388671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 16.0, 22.0, 33.0, 33.0, 73.0, 81.0, 148.0, 342.0, 1127.0, 9970.0, 477526.0, 3667697.0, 34132.0, 2268.0, 460.0, 167.0, 83.0, 44.0, 23.0, 13.0, 15.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0888671875, -1.0528106689453125, -1.016754150390625, -0.9806976318359375, -0.94464111328125, -0.9085845947265625, -0.872528076171875, -0.8364715576171875, -0.8004150390625, -0.7643585205078125, -0.728302001953125, -0.6922454833984375, -0.65618896484375, -0.6201324462890625, -0.584075927734375, -0.5480194091796875, -0.511962890625, -0.4759063720703125, -0.439849853515625, -0.4037933349609375, -0.36773681640625, -0.3316802978515625, -0.295623779296875, -0.2595672607421875, -0.2235107421875, -0.1874542236328125, -0.151397705078125, -0.1153411865234375, -0.07928466796875, -0.0432281494140625, -0.007171630859375, 0.0288848876953125, 0.06494140625, 0.1009979248046875, 0.137054443359375, 0.1731109619140625, 0.20916748046875, 0.2452239990234375, 0.281280517578125, 0.3173370361328125, 0.3533935546875, 0.3894500732421875, 0.425506591796875, 0.4615631103515625, 0.49761962890625, 0.5336761474609375, 0.569732666015625, 0.6057891845703125, 0.641845703125, 0.6779022216796875, 0.713958740234375, 0.7500152587890625, 0.78607177734375, 0.8221282958984375, 0.858184814453125, 0.8942413330078125, 0.9302978515625, 0.9663543701171875, 1.002410888671875, 1.0384674072265625, 1.07452392578125, 1.1105804443359375, 1.146636962890625, 1.1826934814453125, 1.21875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 13.0, 10.0, 24.0, 27.0, 68.0, 87.0, 135.0, 301.0, 580.0, 939.0, 824.0, 493.0, 216.0, 129.0, 63.0, 57.0, 30.0, 19.0, 12.0, 10.0, 9.0, 7.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0], "bins": [-1.0576171875, -1.0345573425292969, -1.0114974975585938, -0.9884376525878906, -0.9653778076171875, -0.9423179626464844, -0.9192581176757812, -0.8961982727050781, -0.873138427734375, -0.8500785827636719, -0.8270187377929688, -0.8039588928222656, -0.7808990478515625, -0.7578392028808594, -0.7347793579101562, -0.7117195129394531, -0.68865966796875, -0.6655998229980469, -0.6425399780273438, -0.6194801330566406, -0.5964202880859375, -0.5733604431152344, -0.5503005981445312, -0.5272407531738281, -0.504180908203125, -0.4811210632324219, -0.45806121826171875, -0.4350013732910156, -0.4119415283203125, -0.3888816833496094, -0.36582183837890625, -0.3427619934082031, -0.3197021484375, -0.2966423034667969, -0.27358245849609375, -0.2505226135253906, -0.2274627685546875, -0.20440292358398438, -0.18134307861328125, -0.15828323364257812, -0.135223388671875, -0.11216354370117188, -0.08910369873046875, -0.06604385375976562, -0.0429840087890625, -0.019924163818359375, 0.00313568115234375, 0.026195526123046875, 0.04925537109375, 0.07231521606445312, 0.09537506103515625, 0.11843490600585938, 0.1414947509765625, 0.16455459594726562, 0.18761444091796875, 0.21067428588867188, 0.233734130859375, 0.2567939758300781, 0.27985382080078125, 0.3029136657714844, 0.3259735107421875, 0.3490333557128906, 0.37209320068359375, 0.3951530456542969, 0.418212890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 16.0, 40.0, 158.0, 385.0, 281.0, 88.0, 20.0, 8.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.395563125610352, -10.035148620605469, -9.674735069274902, -9.31432056427002, -8.953906059265137, -8.59349250793457, -8.233078002929688, -7.872663497924805, -7.51224946975708, -7.1518354415893555, -6.791420936584473, -6.431006908416748, -6.070592880249023, -5.710178375244141, -5.349764347076416, -4.989350318908691, -4.628935813903809, -4.268521785736084, -3.908107280731201, -3.5476932525634766, -3.187278985977173, -2.826864719390869, -2.4664506912231445, -2.106036424636841, -1.745622158050537, -1.3852078914642334, -1.0247937440872192, -0.6643795967102051, -0.30396533012390137, 0.056448936462402344, 0.41686296463012695, 0.7772772312164307, 1.137690544128418, 1.4981048107147217, 1.8585189580917358, 2.21893310546875, 2.5793473720550537, 2.9397616386413574, 3.300175666809082, 3.6605899333953857, 4.0210041999816895, 4.381418228149414, 4.741832733154297, 5.1022467613220215, 5.462660789489746, 5.823075294494629, 6.1834893226623535, 6.543903350830078, 6.904317855834961, 7.2647318840026855, 7.625146389007568, 7.985560417175293, 8.345974922180176, 8.706388473510742, 9.066802978515625, 9.427217483520508, 9.78763198852539, 10.148046493530273, 10.50846004486084, 10.868874549865723, 11.229289054870605, 11.589702606201172, 11.950117111206055, 12.310531616210938, 12.670945167541504]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 10.0, 12.0, 18.0, 19.0, 27.0, 24.0, 45.0, 38.0, 61.0, 45.0, 55.0, 57.0, 69.0, 70.0, 77.0, 72.0, 47.0, 52.0, 52.0, 38.0, 20.0, 16.0, 22.0, 18.0, 7.0, 12.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8141088485717773, -2.705805778503418, -2.5975029468536377, -2.4891998767852783, -2.380897045135498, -2.2725939750671387, -2.1642911434173584, -2.055988073348999, -1.9476852416992188, -1.839382290840149, -1.731079339981079, -1.6227763891220093, -1.5144734382629395, -1.40617036819458, -1.2978675365447998, -1.1895644664764404, -1.0812615156173706, -0.9729585647583008, -0.864655613899231, -0.7563526630401611, -0.6480497121810913, -0.5397467017173767, -0.4314437508583069, -0.32314079999923706, -0.21483784914016724, -0.10653489083051682, 0.001768067479133606, 0.11007103323936462, 0.21837398409843445, 0.32667696475982666, 0.4349799156188965, 0.5432828664779663, 0.6515858173370361, 0.759888768196106, 0.8681917190551758, 0.9764946699142456, 1.0847976207733154, 1.1931006908416748, 1.301403522491455, 1.4097065925598145, 1.5180094242095947, 1.6263123750686646, 1.7346153259277344, 1.8429182767868042, 1.951221227645874, 2.0595242977142334, 2.1678271293640137, 2.276130199432373, 2.3844332695007324, 2.492736339569092, 2.601039171218872, 2.7093422412872314, 2.8176450729370117, 2.925948143005371, 3.0342509746551514, 3.1425540447235107, 3.250856876373291, 3.3591599464416504, 3.4674627780914307, 3.57576584815979, 3.6840686798095703, 3.7923717498779297, 3.90067458152771, 4.00897741317749, 4.11728048324585]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 13.0, 23.0, 24.0, 42.0, 85.0, 111.0, 186.0, 289.0, 533.0, 1167.0, 2444.0, 5955.0, 15085.0, 43016.0, 126343.0, 331182.0, 328722.0, 125116.0, 42330.0, 15234.0, 5932.0, 2339.0, 1067.0, 533.0, 310.0, 178.0, 108.0, 64.0, 53.0, 24.0, 10.0, 16.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434814453125, -0.4220237731933594, -0.40923309326171875, -0.3964424133300781, -0.3836517333984375, -0.3708610534667969, -0.35807037353515625, -0.3452796936035156, -0.332489013671875, -0.3196983337402344, -0.30690765380859375, -0.2941169738769531, -0.2813262939453125, -0.2685356140136719, -0.25574493408203125, -0.24295425415039062, -0.23016357421875, -0.21737289428710938, -0.20458221435546875, -0.19179153442382812, -0.1790008544921875, -0.16621017456054688, -0.15341949462890625, -0.14062881469726562, -0.127838134765625, -0.11504745483398438, -0.10225677490234375, -0.08946609497070312, -0.0766754150390625, -0.06388473510742188, -0.05109405517578125, -0.038303375244140625, -0.0255126953125, -0.012722015380859375, 6.866455078125e-05, 0.012859344482421875, 0.0256500244140625, 0.038440704345703125, 0.05123138427734375, 0.06402206420898438, 0.076812744140625, 0.08960342407226562, 0.10239410400390625, 0.11518478393554688, 0.1279754638671875, 0.14076614379882812, 0.15355682373046875, 0.16634750366210938, 0.17913818359375, 0.19192886352539062, 0.20471954345703125, 0.21751022338867188, 0.2303009033203125, 0.24309158325195312, 0.25588226318359375, 0.2686729431152344, 0.281463623046875, 0.2942543029785156, 0.30704498291015625, 0.3198356628417969, 0.3326263427734375, 0.3454170227050781, 0.35820770263671875, 0.3709983825683594, 0.3837890625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 9.0, 11.0, 11.0, 18.0, 17.0, 18.0, 24.0, 31.0, 37.0, 30.0, 34.0, 43.0, 48.0, 54.0, 52.0, 69.0, 57.0, 44.0, 45.0, 53.0, 45.0, 44.0, 23.0, 34.0, 20.0, 25.0, 18.0, 17.0, 12.0, 9.0, 12.0, 7.0, 4.0, 7.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1953125, -0.18858718872070312, -0.18186187744140625, -0.17513656616210938, -0.1684112548828125, -0.16168594360351562, -0.15496063232421875, -0.14823532104492188, -0.141510009765625, -0.13478469848632812, -0.12805938720703125, -0.12133407592773438, -0.1146087646484375, -0.10788345336914062, -0.10115814208984375, -0.09443283081054688, -0.08770751953125, -0.08098220825195312, -0.07425689697265625, -0.06753158569335938, -0.0608062744140625, -0.054080963134765625, -0.04735565185546875, -0.040630340576171875, -0.033905029296875, -0.027179718017578125, -0.02045440673828125, -0.013729095458984375, -0.0070037841796875, -0.000278472900390625, 0.00644683837890625, 0.013172149658203125, 0.0198974609375, 0.026622772216796875, 0.03334808349609375, 0.040073394775390625, 0.0467987060546875, 0.053524017333984375, 0.06024932861328125, 0.06697463989257812, 0.073699951171875, 0.08042526245117188, 0.08715057373046875, 0.09387588500976562, 0.1006011962890625, 0.10732650756835938, 0.11405181884765625, 0.12077713012695312, 0.12750244140625, 0.13422775268554688, 0.14095306396484375, 0.14767837524414062, 0.1544036865234375, 0.16112899780273438, 0.16785430908203125, 0.17457962036132812, 0.181304931640625, 0.18803024291992188, 0.19475555419921875, 0.20148086547851562, 0.2082061767578125, 0.21493148803710938, 0.22165679931640625, 0.22838211059570312, 0.235107421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 6.0, 8.0, 11.0, 14.0, 15.0, 24.0, 32.0, 54.0, 73.0, 107.0, 189.0, 250.0, 407.0, 680.0, 1163.0, 2266.0, 5906.0, 29706.0, 318977.0, 624739.0, 49663.0, 8013.0, 2752.0, 1369.0, 753.0, 501.0, 298.0, 188.0, 116.0, 93.0, 55.0, 40.0, 27.0, 17.0, 13.0, 4.0, 10.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6513671875, -0.6264266967773438, -0.6014862060546875, -0.5765457153320312, -0.551605224609375, -0.5266647338867188, -0.5017242431640625, -0.47678375244140625, -0.45184326171875, -0.42690277099609375, -0.4019622802734375, -0.37702178955078125, -0.352081298828125, -0.32714080810546875, -0.3022003173828125, -0.27725982666015625, -0.2523193359375, -0.22737884521484375, -0.2024383544921875, -0.17749786376953125, -0.152557373046875, -0.12761688232421875, -0.1026763916015625, -0.07773590087890625, -0.05279541015625, -0.02785491943359375, -0.0029144287109375, 0.02202606201171875, 0.046966552734375, 0.07190704345703125, 0.0968475341796875, 0.12178802490234375, 0.146728515625, 0.17166900634765625, 0.1966094970703125, 0.22154998779296875, 0.246490478515625, 0.27143096923828125, 0.2963714599609375, 0.32131195068359375, 0.34625244140625, 0.37119293212890625, 0.3961334228515625, 0.42107391357421875, 0.446014404296875, 0.47095489501953125, 0.4958953857421875, 0.5208358764648438, 0.5457763671875, 0.5707168579101562, 0.5956573486328125, 0.6205978393554688, 0.645538330078125, 0.6704788208007812, 0.6954193115234375, 0.7203598022460938, 0.74530029296875, 0.7702407836914062, 0.7951812744140625, 0.8201217651367188, 0.845062255859375, 0.8700027465820312, 0.8949432373046875, 0.9198837280273438, 0.94482421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 4.0, 12.0, 11.0, 6.0, 14.0, 17.0, 25.0, 23.0, 35.0, 36.0, 47.0, 30.0, 42.0, 40.0, 60.0, 56.0, 50.0, 68.0, 45.0, 48.0, 46.0, 52.0, 38.0, 26.0, 32.0, 24.0, 16.0, 18.0, 20.0, 12.0, 12.0, 3.0, 6.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.91162109375, -0.88262939453125, -0.8536376953125, -0.82464599609375, -0.795654296875, -0.76666259765625, -0.7376708984375, -0.70867919921875, -0.6796875, -0.65069580078125, -0.6217041015625, -0.59271240234375, -0.563720703125, -0.53472900390625, -0.5057373046875, -0.47674560546875, -0.44775390625, -0.41876220703125, -0.3897705078125, -0.36077880859375, -0.331787109375, -0.30279541015625, -0.2738037109375, -0.24481201171875, -0.2158203125, -0.18682861328125, -0.1578369140625, -0.12884521484375, -0.099853515625, -0.07086181640625, -0.0418701171875, -0.01287841796875, 0.01611328125, 0.04510498046875, 0.0740966796875, 0.10308837890625, 0.132080078125, 0.16107177734375, 0.1900634765625, 0.21905517578125, 0.248046875, 0.27703857421875, 0.3060302734375, 0.33502197265625, 0.364013671875, 0.39300537109375, 0.4219970703125, 0.45098876953125, 0.47998046875, 0.50897216796875, 0.5379638671875, 0.56695556640625, 0.595947265625, 0.62493896484375, 0.6539306640625, 0.68292236328125, 0.7119140625, 0.74090576171875, 0.7698974609375, 0.79888916015625, 0.827880859375, 0.85687255859375, 0.8858642578125, 0.91485595703125, 0.94384765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 8.0, 9.0, 12.0, 18.0, 31.0, 45.0, 59.0, 90.0, 157.0, 263.0, 517.0, 1306.0, 4858.0, 36763.0, 693387.0, 285819.0, 19924.0, 3196.0, 1049.0, 431.0, 223.0, 107.0, 70.0, 45.0, 51.0, 32.0, 22.0, 19.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30908203125, -0.2996788024902344, -0.29027557373046875, -0.2808723449707031, -0.2714691162109375, -0.2620658874511719, -0.25266265869140625, -0.24325942993164062, -0.233856201171875, -0.22445297241210938, -0.21504974365234375, -0.20564651489257812, -0.1962432861328125, -0.18684005737304688, -0.17743682861328125, -0.16803359985351562, -0.15863037109375, -0.14922714233398438, -0.13982391357421875, -0.13042068481445312, -0.1210174560546875, -0.11161422729492188, -0.10221099853515625, -0.09280776977539062, -0.083404541015625, -0.07400131225585938, -0.06459808349609375, -0.055194854736328125, -0.0457916259765625, -0.036388397216796875, -0.02698516845703125, -0.017581939697265625, -0.0081787109375, 0.001224517822265625, 0.01062774658203125, 0.020030975341796875, 0.0294342041015625, 0.038837432861328125, 0.04824066162109375, 0.057643890380859375, 0.067047119140625, 0.07645034790039062, 0.08585357666015625, 0.09525680541992188, 0.1046600341796875, 0.11406326293945312, 0.12346649169921875, 0.13286972045898438, 0.14227294921875, 0.15167617797851562, 0.16107940673828125, 0.17048263549804688, 0.1798858642578125, 0.18928909301757812, 0.19869232177734375, 0.20809555053710938, 0.217498779296875, 0.22690200805664062, 0.23630523681640625, 0.24570846557617188, 0.2551116943359375, 0.2645149230957031, 0.27391815185546875, 0.2833213806152344, 0.292724609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 14.0, 11.0, 15.0, 15.0, 22.0, 22.0, 25.0, 34.0, 48.0, 70.0, 70.0, 99.0, 83.0, 79.0, 77.0, 55.0, 58.0, 33.0, 26.0, 23.0, 21.0, 13.0, 15.0, 12.0, 8.0, 6.0, 10.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.604194641113281e-05, -6.37182965874672e-05, -6.139464676380157e-05, -5.9070996940135956e-05, -5.674734711647034e-05, -5.442369729280472e-05, -5.21000474691391e-05, -4.977639764547348e-05, -4.745274782180786e-05, -4.512909799814224e-05, -4.2805448174476624e-05, -4.0481798350811005e-05, -3.8158148527145386e-05, -3.583449870347977e-05, -3.351084887981415e-05, -3.118719905614853e-05, -2.886354923248291e-05, -2.653989940881729e-05, -2.4216249585151672e-05, -2.1892599761486053e-05, -1.9568949937820435e-05, -1.7245300114154816e-05, -1.4921650290489197e-05, -1.2598000466823578e-05, -1.0274350643157959e-05, -7.95070081949234e-06, -5.627050995826721e-06, -3.3034011721611023e-06, -9.797513484954834e-07, 1.3438984751701355e-06, 3.6675482988357544e-06, 5.991198122501373e-06, 8.314847946166992e-06, 1.0638497769832611e-05, 1.296214759349823e-05, 1.528579741716385e-05, 1.7609447240829468e-05, 1.9933097064495087e-05, 2.2256746888160706e-05, 2.4580396711826324e-05, 2.6904046535491943e-05, 2.9227696359157562e-05, 3.155134618282318e-05, 3.38749960064888e-05, 3.619864583015442e-05, 3.852229565382004e-05, 4.084594547748566e-05, 4.3169595301151276e-05, 4.5493245124816895e-05, 4.7816894948482513e-05, 5.014054477214813e-05, 5.246419459581375e-05, 5.478784441947937e-05, 5.711149424314499e-05, 5.943514406681061e-05, 6.175879389047623e-05, 6.408244371414185e-05, 6.640609353780746e-05, 6.872974336147308e-05, 7.10533931851387e-05, 7.337704300880432e-05, 7.570069283246994e-05, 7.802434265613556e-05, 8.034799247980118e-05, 8.26716423034668e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 15.0, 11.0, 10.0, 20.0, 27.0, 29.0, 49.0, 76.0, 98.0, 128.0, 200.0, 307.0, 564.0, 982.0, 1916.0, 4571.0, 13771.0, 67545.0, 650384.0, 257735.0, 34546.0, 8911.0, 3072.0, 1398.0, 784.0, 448.0, 303.0, 187.0, 113.0, 103.0, 65.0, 51.0, 41.0, 20.0, 18.0, 11.0, 14.0, 5.0, 6.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.2322998046875, -0.22542953491210938, -0.21855926513671875, -0.21168899536132812, -0.2048187255859375, -0.19794845581054688, -0.19107818603515625, -0.18420791625976562, -0.177337646484375, -0.17046737670898438, -0.16359710693359375, -0.15672683715820312, -0.1498565673828125, -0.14298629760742188, -0.13611602783203125, -0.12924575805664062, -0.12237548828125, -0.11550521850585938, -0.10863494873046875, -0.10176467895507812, -0.0948944091796875, -0.08802413940429688, -0.08115386962890625, -0.07428359985351562, -0.067413330078125, -0.060543060302734375, -0.05367279052734375, -0.046802520751953125, -0.0399322509765625, -0.033061981201171875, -0.02619171142578125, -0.019321441650390625, -0.012451171875, -0.005580902099609375, 0.00128936767578125, 0.008159637451171875, 0.0150299072265625, 0.021900177001953125, 0.02877044677734375, 0.035640716552734375, 0.042510986328125, 0.049381256103515625, 0.05625152587890625, 0.06312179565429688, 0.0699920654296875, 0.07686233520507812, 0.08373260498046875, 0.09060287475585938, 0.09747314453125, 0.10434341430664062, 0.11121368408203125, 0.11808395385742188, 0.1249542236328125, 0.13182449340820312, 0.13869476318359375, 0.14556503295898438, 0.152435302734375, 0.15930557250976562, 0.16617584228515625, 0.17304611206054688, 0.1799163818359375, 0.18678665161132812, 0.19365692138671875, 0.20052719116210938, 0.2073974609375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 8.0, 5.0, 6.0, 10.0, 7.0, 14.0, 20.0, 28.0, 28.0, 37.0, 48.0, 46.0, 64.0, 72.0, 75.0, 75.0, 74.0, 63.0, 59.0, 52.0, 46.0, 28.0, 27.0, 23.0, 16.0, 16.0, 15.0, 6.0, 6.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2313232421875, -0.22442626953125, -0.217529296875, -0.21063232421875, -0.2037353515625, -0.19683837890625, -0.18994140625, -0.18304443359375, -0.1761474609375, -0.16925048828125, -0.162353515625, -0.15545654296875, -0.1485595703125, -0.14166259765625, -0.134765625, -0.12786865234375, -0.1209716796875, -0.11407470703125, -0.107177734375, -0.10028076171875, -0.0933837890625, -0.08648681640625, -0.07958984375, -0.07269287109375, -0.0657958984375, -0.05889892578125, -0.052001953125, -0.04510498046875, -0.0382080078125, -0.03131103515625, -0.0244140625, -0.01751708984375, -0.0106201171875, -0.00372314453125, 0.003173828125, 0.01007080078125, 0.0169677734375, 0.02386474609375, 0.03076171875, 0.03765869140625, 0.0445556640625, 0.05145263671875, 0.058349609375, 0.06524658203125, 0.0721435546875, 0.07904052734375, 0.0859375, 0.09283447265625, 0.0997314453125, 0.10662841796875, 0.113525390625, 0.12042236328125, 0.1273193359375, 0.13421630859375, 0.14111328125, 0.14801025390625, 0.1549072265625, 0.16180419921875, 0.168701171875, 0.17559814453125, 0.1824951171875, 0.18939208984375, 0.1962890625, 0.20318603515625, 0.2100830078125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 17.0, 29.0, 93.0, 230.0, 316.0, 193.0, 60.0, 30.0, 10.0, 8.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.631749153137207, -6.396434307098389, -6.16111946105957, -5.92580509185791, -5.690490245819092, -5.455175399780273, -5.219860553741455, -4.984545707702637, -4.749230861663818, -4.513916015625, -4.278601169586182, -4.043286323547363, -3.807971715927124, -3.5726571083068848, -3.3373422622680664, -3.102027416229248, -2.866712808609009, -2.6313979625701904, -2.396083354949951, -2.160768508911133, -1.9254536628723145, -1.6901389360427856, -1.4548242092132568, -1.2195093631744385, -0.9841946363449097, -0.7488798499107361, -0.5135650634765625, -0.2782503366470337, -0.04293555021286011, 0.19237923622131348, 0.4276939630508423, 0.6630088090896606, 0.8983235359191895, 1.1336382627487183, 1.3689531087875366, 1.6042678356170654, 1.8395826816558838, 2.074897289276123, 2.3102121353149414, 2.5455269813537598, 2.780841827392578, 3.0161566734313965, 3.2514712810516357, 3.486786127090454, 3.7221009731292725, 3.9574155807495117, 4.19273042678833, 4.428045272827148, 4.663359642028809, 4.898674488067627, 5.133989334106445, 5.3693037033081055, 5.604618549346924, 5.839933395385742, 6.0752482414245605, 6.310563087463379, 6.545877933502197, 6.781192779541016, 7.016507625579834, 7.251822471618652, 7.4871368408203125, 7.722451686859131, 7.957766532897949, 8.19308090209961, 8.428396224975586]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 6.0, 3.0, 6.0, 8.0, 4.0, 15.0, 16.0, 17.0, 12.0, 15.0, 19.0, 24.0, 21.0, 44.0, 38.0, 41.0, 44.0, 61.0, 65.0, 72.0, 73.0, 46.0, 27.0, 48.0, 29.0, 24.0, 34.0, 32.0, 21.0, 16.0, 24.0, 27.0, 17.0, 10.0, 10.0, 7.0, 11.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.701176643371582, -2.6003732681274414, -2.4995696544647217, -2.398766279220581, -2.2979626655578613, -2.1971592903137207, -2.09635591506958, -1.99555242061615, -1.8947489261627197, -1.7939454317092896, -1.6931419372558594, -1.5923385620117188, -1.4915350675582886, -1.3907315731048584, -1.2899281978607178, -1.1891247034072876, -1.0883212089538574, -0.9875177145004272, -0.8867142796516418, -0.7859108448028564, -0.6851073503494263, -0.5843038558959961, -0.4835004210472107, -0.3826969861984253, -0.2818934917449951, -0.18109002709388733, -0.08028656244277954, 0.020516902208328247, 0.12132036685943604, 0.2221238613128662, 0.3229272961616516, 0.423730731010437, 0.5245342254638672, 0.6253377199172974, 0.7261411547660828, 0.8269445896148682, 0.9277480840682983, 1.0285515785217285, 1.1293549537658691, 1.2301584482192993, 1.3309619426727295, 1.4317654371261597, 1.5325689315795898, 1.6333723068237305, 1.7341758012771606, 1.8349792957305908, 1.9357826709747314, 2.036586284637451, 2.137389659881592, 2.2381930351257324, 2.338996648788452, 2.4398000240325928, 2.5406036376953125, 2.641407012939453, 2.7422103881835938, 2.8430137634277344, 2.943817377090454, 3.0446207523345947, 3.1454243659973145, 3.246227741241455, 3.3470311164855957, 3.4478347301483154, 3.548638105392456, 3.649441719055176, 3.7502450942993164]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 27.0, 18.0, 34.0, 86.0, 160.0, 308.0, 624.0, 1425.0, 3611.0, 11059.0, 41428.0, 259560.0, 2376539.0, 1336972.0, 125466.0, 24991.0, 7160.0, 2611.0, 1114.0, 494.0, 242.0, 138.0, 80.0, 43.0, 22.0, 17.0, 13.0, 13.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0], "bins": [-0.42236328125, -0.4120197296142578, -0.4016761779785156, -0.39133262634277344, -0.38098907470703125, -0.37064552307128906, -0.3603019714355469, -0.3499584197998047, -0.3396148681640625, -0.3292713165283203, -0.3189277648925781, -0.30858421325683594, -0.29824066162109375, -0.28789710998535156, -0.2775535583496094, -0.2672100067138672, -0.256866455078125, -0.2465229034423828, -0.23617935180664062, -0.22583580017089844, -0.21549224853515625, -0.20514869689941406, -0.19480514526367188, -0.1844615936279297, -0.1741180419921875, -0.1637744903564453, -0.15343093872070312, -0.14308738708496094, -0.13274383544921875, -0.12240028381347656, -0.11205673217773438, -0.10171318054199219, -0.09136962890625, -0.08102607727050781, -0.07068252563476562, -0.06033897399902344, -0.04999542236328125, -0.03965187072753906, -0.029308319091796875, -0.018964767456054688, -0.0086212158203125, 0.0017223358154296875, 0.012065887451171875, 0.022409439086914062, 0.03275299072265625, 0.04309654235839844, 0.053440093994140625, 0.06378364562988281, 0.074127197265625, 0.08447074890136719, 0.09481430053710938, 0.10515785217285156, 0.11550140380859375, 0.12584495544433594, 0.13618850708007812, 0.1465320587158203, 0.1568756103515625, 0.1672191619873047, 0.17756271362304688, 0.18790626525878906, 0.19824981689453125, 0.20859336853027344, 0.21893692016601562, 0.2292804718017578, 0.2396240234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 13.0, 8.0, 6.0, 13.0, 23.0, 22.0, 25.0, 25.0, 39.0, 28.0, 45.0, 49.0, 53.0, 54.0, 52.0, 37.0, 55.0, 35.0, 49.0, 38.0, 41.0, 51.0, 32.0, 35.0, 34.0, 24.0, 20.0, 20.0, 11.0, 11.0, 9.0, 11.0, 7.0, 2.0, 4.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1822509765625, -0.17580413818359375, -0.1693572998046875, -0.16291046142578125, -0.156463623046875, -0.15001678466796875, -0.1435699462890625, -0.13712310791015625, -0.13067626953125, -0.12422943115234375, -0.1177825927734375, -0.11133575439453125, -0.104888916015625, -0.09844207763671875, -0.0919952392578125, -0.08554840087890625, -0.0791015625, -0.07265472412109375, -0.0662078857421875, -0.05976104736328125, -0.053314208984375, -0.04686737060546875, -0.0404205322265625, -0.03397369384765625, -0.02752685546875, -0.02108001708984375, -0.0146331787109375, -0.00818634033203125, -0.001739501953125, 0.00470733642578125, 0.0111541748046875, 0.01760101318359375, 0.0240478515625, 0.03049468994140625, 0.0369415283203125, 0.04338836669921875, 0.049835205078125, 0.05628204345703125, 0.0627288818359375, 0.06917572021484375, 0.07562255859375, 0.08206939697265625, 0.0885162353515625, 0.09496307373046875, 0.101409912109375, 0.10785675048828125, 0.1143035888671875, 0.12075042724609375, 0.127197265625, 0.13364410400390625, 0.1400909423828125, 0.14653778076171875, 0.152984619140625, 0.15943145751953125, 0.1658782958984375, 0.17232513427734375, 0.17877197265625, 0.18521881103515625, 0.1916656494140625, 0.19811248779296875, 0.204559326171875, 0.21100616455078125, 0.2174530029296875, 0.22389984130859375, 0.2303466796875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 6.0, 2.0, 8.0, 23.0, 22.0, 40.0, 44.0, 88.0, 159.0, 295.0, 618.0, 1547.0, 4347.0, 15948.0, 82112.0, 1180197.0, 2719138.0, 153564.0, 25637.0, 6447.0, 2175.0, 892.0, 405.0, 225.0, 122.0, 82.0, 50.0, 29.0, 20.0, 12.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.344482421875, -0.3307838439941406, -0.31708526611328125, -0.3033866882324219, -0.2896881103515625, -0.2759895324707031, -0.26229095458984375, -0.24859237670898438, -0.234893798828125, -0.22119522094726562, -0.20749664306640625, -0.19379806518554688, -0.1800994873046875, -0.16640090942382812, -0.15270233154296875, -0.13900375366210938, -0.12530517578125, -0.11160659790039062, -0.09790802001953125, -0.08420944213867188, -0.0705108642578125, -0.056812286376953125, -0.04311370849609375, -0.029415130615234375, -0.015716552734375, -0.002017974853515625, 0.01168060302734375, 0.025379180908203125, 0.0390777587890625, 0.052776336669921875, 0.06647491455078125, 0.08017349243164062, 0.0938720703125, 0.10757064819335938, 0.12126922607421875, 0.13496780395507812, 0.1486663818359375, 0.16236495971679688, 0.17606353759765625, 0.18976211547851562, 0.203460693359375, 0.21715927124023438, 0.23085784912109375, 0.24455642700195312, 0.2582550048828125, 0.2719535827636719, 0.28565216064453125, 0.2993507385253906, 0.31304931640625, 0.3267478942871094, 0.34044647216796875, 0.3541450500488281, 0.3678436279296875, 0.3815422058105469, 0.39524078369140625, 0.4089393615722656, 0.422637939453125, 0.4363365173339844, 0.45003509521484375, 0.4637336730957031, 0.4774322509765625, 0.4911308288574219, 0.5048294067382812, 0.5185279846191406, 0.5322265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 10.0, 12.0, 13.0, 16.0, 22.0, 37.0, 61.0, 82.0, 161.0, 239.0, 407.0, 717.0, 838.0, 571.0, 366.0, 171.0, 110.0, 79.0, 40.0, 31.0, 22.0, 12.0, 18.0, 12.0, 5.0, 9.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3916015625, -0.375457763671875, -0.35931396484375, -0.343170166015625, -0.3270263671875, -0.310882568359375, -0.29473876953125, -0.278594970703125, -0.262451171875, -0.246307373046875, -0.23016357421875, -0.214019775390625, -0.1978759765625, -0.181732177734375, -0.16558837890625, -0.149444580078125, -0.13330078125, -0.117156982421875, -0.10101318359375, -0.084869384765625, -0.0687255859375, -0.052581787109375, -0.03643798828125, -0.020294189453125, -0.004150390625, 0.011993408203125, 0.02813720703125, 0.044281005859375, 0.0604248046875, 0.076568603515625, 0.09271240234375, 0.108856201171875, 0.125, 0.141143798828125, 0.15728759765625, 0.173431396484375, 0.1895751953125, 0.205718994140625, 0.22186279296875, 0.238006591796875, 0.254150390625, 0.270294189453125, 0.28643798828125, 0.302581787109375, 0.3187255859375, 0.334869384765625, 0.35101318359375, 0.367156982421875, 0.38330078125, 0.399444580078125, 0.41558837890625, 0.431732177734375, 0.4478759765625, 0.464019775390625, 0.48016357421875, 0.496307373046875, 0.512451171875, 0.528594970703125, 0.54473876953125, 0.560882568359375, 0.5770263671875, 0.593170166015625, 0.60931396484375, 0.625457763671875, 0.6416015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 27.0, 62.0, 159.0, 346.0, 247.0, 116.0, 18.0, 7.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.518516540527344, -8.265787124633789, -8.013056755065918, -7.760326862335205, -7.507596969604492, -7.254867076873779, -7.002137184143066, -6.749407768249512, -6.496677398681641, -6.243947505950928, -5.991217613220215, -5.738487720489502, -5.485757827758789, -5.233027935028076, -4.980298042297363, -4.727568626403809, -4.474838733673096, -4.222108840942383, -3.96937894821167, -3.716649055480957, -3.463919162750244, -3.2111892700195312, -2.9584596157073975, -2.7057297229766846, -2.4529998302459717, -2.200269937515259, -1.947540044784546, -1.6948102712631226, -1.4420803785324097, -1.1893504858016968, -0.9366207122802734, -0.6838908195495605, -0.43116092681884766, -0.17843106389045715, 0.07429879903793335, 0.32702863216400146, 0.5797585248947144, 0.8324884176254272, 1.0852181911468506, 1.3379480838775635, 1.5906779766082764, 1.8434078693389893, 2.096137762069702, 2.348867416381836, 2.601597309112549, 2.8543272018432617, 3.1070570945739746, 3.3597869873046875, 3.6125168800354004, 3.8652467727661133, 4.117976665496826, 4.370706558227539, 4.623436450958252, 4.876166343688965, 5.1288957595825195, 5.381626129150391, 5.634355545043945, 5.887085437774658, 6.139815330505371, 6.392545223236084, 6.645275115966797, 6.89800500869751, 7.150734901428223, 7.403464317321777, 7.656194686889648]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 11.0, 15.0, 13.0, 21.0, 22.0, 28.0, 26.0, 39.0, 52.0, 61.0, 46.0, 46.0, 57.0, 56.0, 69.0, 50.0, 62.0, 41.0, 54.0, 34.0, 25.0, 33.0, 26.0, 15.0, 24.0, 16.0, 16.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.970703125, -1.888615369796753, -1.8065276145935059, -1.7244398593902588, -1.6423521041870117, -1.5602643489837646, -1.4781767129898071, -1.39608895778656, -1.314001202583313, -1.231913447380066, -1.1498256921768188, -1.0677379369735718, -0.9856502413749695, -0.9035624861717224, -0.8214747905731201, -0.739387035369873, -0.657299280166626, -0.5752115249633789, -0.4931237995624542, -0.41103607416152954, -0.32894831895828247, -0.2468605637550354, -0.16477283835411072, -0.08268511295318604, -0.0005973577499389648, 0.08149038255214691, 0.1635781228542328, 0.24566586315631866, 0.32775360345840454, 0.4098413586616516, 0.4919290840625763, 0.574016809463501, 0.656104326248169, 0.738192081451416, 0.8202798366546631, 0.9023675322532654, 0.9844552874565125, 1.0665431022644043, 1.1486307382583618, 1.2307184934616089, 1.312806248664856, 1.394894003868103, 1.47698175907135, 1.5590695142745972, 1.6411571502685547, 1.7232449054718018, 1.8053326606750488, 1.887420415878296, 1.969508171081543, 2.05159592628479, 2.133683681488037, 2.215771436691284, 2.2978591918945312, 2.3799469470977783, 2.4620347023010254, 2.5441222190856934, 2.6262102127075195, 2.7082979679107666, 2.7903857231140137, 2.8724734783172607, 2.954561233520508, 3.036648988723755, 3.118736743927002, 3.20082426071167, 3.282912015914917]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 15.0, 10.0, 15.0, 20.0, 47.0, 44.0, 65.0, 150.0, 256.0, 421.0, 865.0, 1564.0, 3130.0, 7145.0, 18222.0, 51281.0, 155912.0, 374972.0, 282270.0, 97298.0, 32671.0, 12029.0, 5084.0, 2300.0, 1195.0, 674.0, 352.0, 207.0, 111.0, 72.0, 48.0, 26.0, 22.0, 15.0, 11.0, 3.0, 4.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.3449516296386719, -0.33296966552734375, -0.3209877014160156, -0.3090057373046875, -0.2970237731933594, -0.28504180908203125, -0.2730598449707031, -0.261077880859375, -0.24909591674804688, -0.23711395263671875, -0.22513198852539062, -0.2131500244140625, -0.20116806030273438, -0.18918609619140625, -0.17720413208007812, -0.16522216796875, -0.15324020385742188, -0.14125823974609375, -0.12927627563476562, -0.1172943115234375, -0.10531234741210938, -0.09333038330078125, -0.08134841918945312, -0.069366455078125, -0.057384490966796875, -0.04540252685546875, -0.033420562744140625, -0.0214385986328125, -0.009456634521484375, 0.00252532958984375, 0.014507293701171875, 0.0264892578125, 0.038471221923828125, 0.05045318603515625, 0.062435150146484375, 0.0744171142578125, 0.08639907836914062, 0.09838104248046875, 0.11036300659179688, 0.122344970703125, 0.13432693481445312, 0.14630889892578125, 0.15829086303710938, 0.1702728271484375, 0.18225479125976562, 0.19423675537109375, 0.20621871948242188, 0.21820068359375, 0.23018264770507812, 0.24216461181640625, 0.2541465759277344, 0.2661285400390625, 0.2781105041503906, 0.29009246826171875, 0.3020744323730469, 0.314056396484375, 0.3260383605957031, 0.33802032470703125, 0.3500022888183594, 0.3619842529296875, 0.3739662170410156, 0.38594818115234375, 0.3979301452636719, 0.409912109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 4.0, 14.0, 12.0, 9.0, 13.0, 14.0, 21.0, 22.0, 28.0, 22.0, 38.0, 37.0, 31.0, 46.0, 56.0, 62.0, 58.0, 35.0, 54.0, 45.0, 54.0, 45.0, 29.0, 33.0, 44.0, 21.0, 22.0, 20.0, 25.0, 15.0, 11.0, 10.0, 15.0, 5.0, 7.0, 6.0, 4.0, 2.0, 6.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.17333984375, -0.16707801818847656, -0.16081619262695312, -0.1545543670654297, -0.14829254150390625, -0.1420307159423828, -0.13576889038085938, -0.12950706481933594, -0.1232452392578125, -0.11698341369628906, -0.11072158813476562, -0.10445976257324219, -0.09819793701171875, -0.09193611145019531, -0.08567428588867188, -0.07941246032714844, -0.073150634765625, -0.06688880920410156, -0.060626983642578125, -0.05436515808105469, -0.04810333251953125, -0.04184150695800781, -0.035579681396484375, -0.029317855834960938, -0.0230560302734375, -0.016794204711914062, -0.010532379150390625, -0.0042705535888671875, 0.00199127197265625, 0.008253097534179688, 0.014514923095703125, 0.020776748657226562, 0.02703857421875, 0.03330039978027344, 0.039562225341796875, 0.04582405090332031, 0.05208587646484375, 0.05834770202636719, 0.06460952758789062, 0.07087135314941406, 0.0771331787109375, 0.08339500427246094, 0.08965682983398438, 0.09591865539550781, 0.10218048095703125, 0.10844230651855469, 0.11470413208007812, 0.12096595764160156, 0.127227783203125, 0.13348960876464844, 0.13975143432617188, 0.1460132598876953, 0.15227508544921875, 0.1585369110107422, 0.16479873657226562, 0.17106056213378906, 0.1773223876953125, 0.18358421325683594, 0.18984603881835938, 0.1961078643798828, 0.20236968994140625, 0.2086315155029297, 0.21489334106445312, 0.22115516662597656, 0.2274169921875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 8.0, 6.0, 18.0, 25.0, 27.0, 64.0, 78.0, 109.0, 207.0, 440.0, 823.0, 1715.0, 5589.0, 44368.0, 808156.0, 169996.0, 11675.0, 2815.0, 1099.0, 538.0, 307.0, 190.0, 111.0, 61.0, 48.0, 26.0, 16.0, 8.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96337890625, -0.9309616088867188, -0.8985443115234375, -0.8661270141601562, -0.833709716796875, -0.8012924194335938, -0.7688751220703125, -0.7364578247070312, -0.70404052734375, -0.6716232299804688, -0.6392059326171875, -0.6067886352539062, -0.574371337890625, -0.5419540405273438, -0.5095367431640625, -0.47711944580078125, -0.4447021484375, -0.41228485107421875, -0.3798675537109375, -0.34745025634765625, -0.315032958984375, -0.28261566162109375, -0.2501983642578125, -0.21778106689453125, -0.18536376953125, -0.15294647216796875, -0.1205291748046875, -0.08811187744140625, -0.055694580078125, -0.02327728271484375, 0.0091400146484375, 0.04155731201171875, 0.073974609375, 0.10639190673828125, 0.1388092041015625, 0.17122650146484375, 0.203643798828125, 0.23606109619140625, 0.2684783935546875, 0.30089569091796875, 0.33331298828125, 0.36573028564453125, 0.3981475830078125, 0.43056488037109375, 0.462982177734375, 0.49539947509765625, 0.5278167724609375, 0.5602340698242188, 0.5926513671875, 0.6250686645507812, 0.6574859619140625, 0.6899032592773438, 0.722320556640625, 0.7547378540039062, 0.7871551513671875, 0.8195724487304688, 0.85198974609375, 0.8844070434570312, 0.9168243408203125, 0.9492416381835938, 0.981658935546875, 1.0140762329101562, 1.0464935302734375, 1.0789108276367188, 1.111328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 9.0, 5.0, 6.0, 14.0, 25.0, 25.0, 29.0, 39.0, 40.0, 60.0, 49.0, 67.0, 65.0, 78.0, 66.0, 73.0, 66.0, 51.0, 49.0, 34.0, 39.0, 25.0, 20.0, 14.0, 15.0, 10.0, 8.0, 5.0, 6.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.251953125, -1.2189559936523438, -1.1859588623046875, -1.1529617309570312, -1.119964599609375, -1.0869674682617188, -1.0539703369140625, -1.0209732055664062, -0.98797607421875, -0.9549789428710938, -0.9219818115234375, -0.8889846801757812, -0.855987548828125, -0.8229904174804688, -0.7899932861328125, -0.7569961547851562, -0.7239990234375, -0.6910018920898438, -0.6580047607421875, -0.6250076293945312, -0.592010498046875, -0.5590133666992188, -0.5260162353515625, -0.49301910400390625, -0.46002197265625, -0.42702484130859375, -0.3940277099609375, -0.36103057861328125, -0.328033447265625, -0.29503631591796875, -0.2620391845703125, -0.22904205322265625, -0.196044921875, -0.16304779052734375, -0.1300506591796875, -0.09705352783203125, -0.064056396484375, -0.03105926513671875, 0.0019378662109375, 0.03493499755859375, 0.06793212890625, 0.10092926025390625, 0.1339263916015625, 0.16692352294921875, 0.199920654296875, 0.23291778564453125, 0.2659149169921875, 0.29891204833984375, 0.3319091796875, 0.36490631103515625, 0.3979034423828125, 0.43090057373046875, 0.463897705078125, 0.49689483642578125, 0.5298919677734375, 0.5628890991210938, 0.59588623046875, 0.6288833618164062, 0.6618804931640625, 0.6948776245117188, 0.727874755859375, 0.7608718872070312, 0.7938690185546875, 0.8268661499023438, 0.85986328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 7.0, 3.0, 8.0, 16.0, 11.0, 22.0, 31.0, 44.0, 73.0, 83.0, 132.0, 270.0, 714.0, 2641.0, 20919.0, 704131.0, 303041.0, 13282.0, 1881.0, 621.0, 247.0, 135.0, 54.0, 59.0, 37.0, 30.0, 19.0, 14.0, 10.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.376708984375, -0.3649024963378906, -0.35309600830078125, -0.3412895202636719, -0.3294830322265625, -0.3176765441894531, -0.30587005615234375, -0.2940635681152344, -0.282257080078125, -0.2704505920410156, -0.25864410400390625, -0.24683761596679688, -0.2350311279296875, -0.22322463989257812, -0.21141815185546875, -0.19961166381835938, -0.18780517578125, -0.17599868774414062, -0.16419219970703125, -0.15238571166992188, -0.1405792236328125, -0.12877273559570312, -0.11696624755859375, -0.10515975952148438, -0.093353271484375, -0.08154678344726562, -0.06974029541015625, -0.057933807373046875, -0.0461273193359375, -0.034320831298828125, -0.02251434326171875, -0.010707855224609375, 0.0010986328125, 0.012905120849609375, 0.02471160888671875, 0.036518096923828125, 0.0483245849609375, 0.060131072998046875, 0.07193756103515625, 0.08374404907226562, 0.095550537109375, 0.10735702514648438, 0.11916351318359375, 0.13097000122070312, 0.1427764892578125, 0.15458297729492188, 0.16638946533203125, 0.17819595336914062, 0.19000244140625, 0.20180892944335938, 0.21361541748046875, 0.22542190551757812, 0.2372283935546875, 0.24903488159179688, 0.26084136962890625, 0.2726478576660156, 0.284454345703125, 0.2962608337402344, 0.30806732177734375, 0.3198738098144531, 0.3316802978515625, 0.3434867858886719, 0.35529327392578125, 0.3670997619628906, 0.37890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 2.0, 4.0, 6.0, 8.0, 8.0, 17.0, 16.0, 20.0, 26.0, 47.0, 60.0, 73.0, 102.0, 117.0, 105.0, 98.0, 90.0, 54.0, 34.0, 27.0, 27.0, 14.0, 10.0, 8.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.863210678100586e-05, -8.602812886238098e-05, -8.34241509437561e-05, -8.082017302513123e-05, -7.821619510650635e-05, -7.561221718788147e-05, -7.300823926925659e-05, -7.040426135063171e-05, -6.780028343200684e-05, -6.519630551338196e-05, -6.259232759475708e-05, -5.99883496761322e-05, -5.7384371757507324e-05, -5.4780393838882446e-05, -5.217641592025757e-05, -4.957243800163269e-05, -4.696846008300781e-05, -4.4364482164382935e-05, -4.176050424575806e-05, -3.915652632713318e-05, -3.65525484085083e-05, -3.394857048988342e-05, -3.1344592571258545e-05, -2.8740614652633667e-05, -2.613663673400879e-05, -2.353265881538391e-05, -2.0928680896759033e-05, -1.8324702978134155e-05, -1.5720725059509277e-05, -1.31167471408844e-05, -1.0512769222259521e-05, -7.908791303634644e-06, -5.304813385009766e-06, -2.7008354663848877e-06, -9.685754776000977e-08, 2.507120370864868e-06, 5.111098289489746e-06, 7.715076208114624e-06, 1.0319054126739502e-05, 1.292303204536438e-05, 1.5527009963989258e-05, 1.8130987882614136e-05, 2.0734965801239014e-05, 2.333894371986389e-05, 2.594292163848877e-05, 2.8546899557113647e-05, 3.1150877475738525e-05, 3.37548553943634e-05, 3.635883331298828e-05, 3.896281123161316e-05, 4.156678915023804e-05, 4.4170767068862915e-05, 4.677474498748779e-05, 4.937872290611267e-05, 5.198270082473755e-05, 5.458667874336243e-05, 5.7190656661987305e-05, 5.979463458061218e-05, 6.239861249923706e-05, 6.500259041786194e-05, 6.760656833648682e-05, 7.02105462551117e-05, 7.281452417373657e-05, 7.541850209236145e-05, 7.802248001098633e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 8.0, 7.0, 13.0, 10.0, 23.0, 34.0, 45.0, 76.0, 95.0, 184.0, 302.0, 533.0, 1133.0, 2919.0, 11169.0, 72517.0, 777542.0, 156713.0, 18038.0, 4161.0, 1461.0, 633.0, 341.0, 221.0, 120.0, 82.0, 49.0, 42.0, 34.0, 14.0, 13.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.238037109375, -0.2302703857421875, -0.222503662109375, -0.2147369384765625, -0.20697021484375, -0.1992034912109375, -0.191436767578125, -0.1836700439453125, -0.1759033203125, -0.1681365966796875, -0.160369873046875, -0.1526031494140625, -0.14483642578125, -0.1370697021484375, -0.129302978515625, -0.1215362548828125, -0.11376953125, -0.1060028076171875, -0.098236083984375, -0.0904693603515625, -0.08270263671875, -0.0749359130859375, -0.067169189453125, -0.0594024658203125, -0.0516357421875, -0.0438690185546875, -0.036102294921875, -0.0283355712890625, -0.02056884765625, -0.0128021240234375, -0.005035400390625, 0.0027313232421875, 0.010498046875, 0.0182647705078125, 0.026031494140625, 0.0337982177734375, 0.04156494140625, 0.0493316650390625, 0.057098388671875, 0.0648651123046875, 0.0726318359375, 0.0803985595703125, 0.088165283203125, 0.0959320068359375, 0.10369873046875, 0.1114654541015625, 0.119232177734375, 0.1269989013671875, 0.134765625, 0.1425323486328125, 0.150299072265625, 0.1580657958984375, 0.16583251953125, 0.1735992431640625, 0.181365966796875, 0.1891326904296875, 0.1968994140625, 0.2046661376953125, 0.212432861328125, 0.2201995849609375, 0.22796630859375, 0.2357330322265625, 0.243499755859375, 0.2512664794921875, 0.259033203125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 6.0, 2.0, 5.0, 3.0, 6.0, 10.0, 7.0, 9.0, 17.0, 21.0, 24.0, 50.0, 59.0, 88.0, 104.0, 140.0, 129.0, 100.0, 79.0, 38.0, 30.0, 21.0, 13.0, 9.0, 5.0, 7.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1881103515625, -0.1801013946533203, -0.17209243774414062, -0.16408348083496094, -0.15607452392578125, -0.14806556701660156, -0.14005661010742188, -0.1320476531982422, -0.1240386962890625, -0.11602973937988281, -0.10802078247070312, -0.10001182556152344, -0.09200286865234375, -0.08399391174316406, -0.07598495483398438, -0.06797599792480469, -0.059967041015625, -0.05195808410644531, -0.043949127197265625, -0.03594017028808594, -0.02793121337890625, -0.019922256469726562, -0.011913299560546875, -0.0039043426513671875, 0.0041046142578125, 0.012113571166992188, 0.020122528076171875, 0.028131484985351562, 0.03614044189453125, 0.04414939880371094, 0.052158355712890625, 0.06016731262207031, 0.06817626953125, 0.07618522644042969, 0.08419418334960938, 0.09220314025878906, 0.10021209716796875, 0.10822105407714844, 0.11623001098632812, 0.12423896789550781, 0.1322479248046875, 0.1402568817138672, 0.14826583862304688, 0.15627479553222656, 0.16428375244140625, 0.17229270935058594, 0.18030166625976562, 0.1883106231689453, 0.196319580078125, 0.2043285369873047, 0.21233749389648438, 0.22034645080566406, 0.22835540771484375, 0.23636436462402344, 0.24437332153320312, 0.2523822784423828, 0.2603912353515625, 0.2684001922607422, 0.2764091491699219, 0.28441810607910156, 0.29242706298828125, 0.30043601989746094, 0.3084449768066406, 0.3164539337158203, 0.324462890625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 7.0, 10.0, 7.0, 24.0, 47.0, 73.0, 119.0, 197.0, 218.0, 118.0, 69.0, 45.0, 22.0, 8.0, 10.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.646583080291748, -3.521165609359741, -3.3957483768463135, -3.2703309059143066, -3.1449134349823, -3.019495964050293, -2.8940787315368652, -2.7686612606048584, -2.6432437896728516, -2.5178263187408447, -2.392409086227417, -2.26699161529541, -2.1415741443634033, -2.0161566734313965, -1.8907394409179688, -1.765321969985962, -1.6399047374725342, -1.514487385749817, -1.38906991481781, -1.2636525630950928, -1.138235092163086, -1.0128177404403687, -0.8874003887176514, -0.7619829773902893, -0.6365655660629272, -0.5111481547355652, -0.3857307732105255, -0.26031339168548584, -0.13489598035812378, -0.009478569030761719, 0.11593878269195557, 0.24135619401931763, 0.3667736053466797, 0.49219101667404175, 0.6176084280014038, 0.7430257797241211, 0.8684431910514832, 0.9938606023788452, 1.1192779541015625, 1.2446954250335693, 1.3701127767562866, 1.495530128479004, 1.6209475994110107, 1.746364951133728, 1.8717823028564453, 1.9971997737884521, 2.122617244720459, 2.2480344772338867, 2.3734519481658936, 2.4988694190979004, 2.624286651611328, 2.749704122543335, 2.875121593475342, 3.0005388259887695, 3.1259562969207764, 3.251373767852783, 3.376791000366211, 3.5022084712982178, 3.6276257038116455, 3.7530431747436523, 3.878460645675659, 4.003878116607666, 4.129295349121094, 4.2547125816345215, 4.380130290985107]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 3.0, 5.0, 11.0, 12.0, 15.0, 10.0, 17.0, 13.0, 15.0, 20.0, 41.0, 30.0, 37.0, 30.0, 46.0, 56.0, 68.0, 65.0, 66.0, 60.0, 41.0, 41.0, 41.0, 30.0, 25.0, 35.0, 22.0, 18.0, 23.0, 16.0, 13.0, 13.0, 17.0, 11.0, 6.0, 7.0, 12.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5675745010375977, -2.4754998683929443, -2.383425235748291, -2.2913506031036377, -2.1992759704589844, -2.10720157623291, -2.0151267051696777, -1.9230523109436035, -1.8309776782989502, -1.7389030456542969, -1.6468284130096436, -1.5547537803649902, -1.4626792669296265, -1.3706046342849731, -1.2785300016403198, -1.186455488204956, -1.0943807363510132, -1.0023061037063599, -0.9102315306663513, -0.818156898021698, -0.7260823249816895, -0.6340076923370361, -0.5419330596923828, -0.44985848665237427, -0.35778385400772095, -0.26570925116539, -0.1736346334218979, -0.08156001567840576, 0.010514587163925171, 0.1025891900062561, 0.19466382265090942, 0.28673839569091797, 0.3788130283355713, 0.4708876311779022, 0.5629622340202332, 0.6550368666648865, 0.747111439704895, 0.8391860723495483, 0.9312607049942017, 1.0233352184295654, 1.1154098510742188, 1.207484483718872, 1.2995591163635254, 1.3916337490081787, 1.4837082624435425, 1.5757828950881958, 1.6678575277328491, 1.759932041168213, 1.8520067930221558, 1.944081425666809, 2.036155939102173, 2.128230571746826, 2.2203052043914795, 2.312379837036133, 2.404454469680786, 2.4965291023254395, 2.5886037349700928, 2.680678367614746, 2.7727530002593994, 2.8648276329040527, 2.956902265548706, 3.0489768981933594, 3.1410512924194336, 3.233125925064087, 3.3252005577087402]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 7.0, 8.0, 14.0, 21.0, 33.0, 62.0, 121.0, 204.0, 371.0, 756.0, 1862.0, 5478.0, 23259.0, 240094.0, 3166117.0, 702509.0, 41566.0, 7669.0, 2309.0, 870.0, 390.0, 228.0, 124.0, 77.0, 51.0, 25.0, 18.0, 16.0, 12.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3115234375, -0.29938507080078125, -0.2872467041015625, -0.27510833740234375, -0.262969970703125, -0.25083160400390625, -0.2386932373046875, -0.22655487060546875, -0.21441650390625, -0.20227813720703125, -0.1901397705078125, -0.17800140380859375, -0.165863037109375, -0.15372467041015625, -0.1415863037109375, -0.12944793701171875, -0.1173095703125, -0.10517120361328125, -0.0930328369140625, -0.08089447021484375, -0.068756103515625, -0.05661773681640625, -0.0444793701171875, -0.03234100341796875, -0.02020263671875, -0.00806427001953125, 0.0040740966796875, 0.01621246337890625, 0.028350830078125, 0.04048919677734375, 0.0526275634765625, 0.06476593017578125, 0.076904296875, 0.08904266357421875, 0.1011810302734375, 0.11331939697265625, 0.125457763671875, 0.13759613037109375, 0.1497344970703125, 0.16187286376953125, 0.17401123046875, 0.18614959716796875, 0.1982879638671875, 0.21042633056640625, 0.222564697265625, 0.23470306396484375, 0.2468414306640625, 0.25897979736328125, 0.2711181640625, 0.28325653076171875, 0.2953948974609375, 0.30753326416015625, 0.319671630859375, 0.33180999755859375, 0.3439483642578125, 0.35608673095703125, 0.36822509765625, 0.38036346435546875, 0.3925018310546875, 0.40464019775390625, 0.416778564453125, 0.42891693115234375, 0.4410552978515625, 0.45319366455078125, 0.46533203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 9.0, 10.0, 8.0, 9.0, 12.0, 23.0, 18.0, 29.0, 30.0, 28.0, 41.0, 43.0, 46.0, 58.0, 49.0, 57.0, 53.0, 53.0, 50.0, 46.0, 55.0, 38.0, 61.0, 23.0, 24.0, 27.0, 19.0, 15.0, 18.0, 9.0, 9.0, 3.0, 13.0, 6.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155517578125, -0.14900588989257812, -0.14249420166015625, -0.13598251342773438, -0.1294708251953125, -0.12295913696289062, -0.11644744873046875, -0.10993576049804688, -0.103424072265625, -0.09691238403320312, -0.09040069580078125, -0.08388900756835938, -0.0773773193359375, -0.07086563110351562, -0.06435394287109375, -0.057842254638671875, -0.05133056640625, -0.044818878173828125, -0.03830718994140625, -0.031795501708984375, -0.0252838134765625, -0.018772125244140625, -0.01226043701171875, -0.005748748779296875, 0.000762939453125, 0.007274627685546875, 0.01378631591796875, 0.020298004150390625, 0.0268096923828125, 0.033321380615234375, 0.03983306884765625, 0.046344757080078125, 0.0528564453125, 0.059368133544921875, 0.06587982177734375, 0.07239151000976562, 0.0789031982421875, 0.08541488647460938, 0.09192657470703125, 0.09843826293945312, 0.104949951171875, 0.11146163940429688, 0.11797332763671875, 0.12448501586914062, 0.1309967041015625, 0.13750839233398438, 0.14402008056640625, 0.15053176879882812, 0.15704345703125, 0.16355514526367188, 0.17006683349609375, 0.17657852172851562, 0.1830902099609375, 0.18960189819335938, 0.19611358642578125, 0.20262527465820312, 0.209136962890625, 0.21564865112304688, 0.22216033935546875, 0.22867202758789062, 0.2351837158203125, 0.24169540405273438, 0.24820709228515625, 0.2547187805175781, 0.26123046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 4.0, 9.0, 19.0, 20.0, 31.0, 41.0, 85.0, 153.0, 308.0, 531.0, 1345.0, 4520.0, 23105.0, 312748.0, 3648657.0, 177909.0, 18173.0, 4066.0, 1318.0, 563.0, 249.0, 171.0, 89.0, 56.0, 37.0, 27.0, 16.0, 7.0, 8.0, 6.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.490478515625, -0.4743537902832031, -0.45822906494140625, -0.4421043395996094, -0.4259796142578125, -0.4098548889160156, -0.39373016357421875, -0.3776054382324219, -0.361480712890625, -0.3453559875488281, -0.32923126220703125, -0.3131065368652344, -0.2969818115234375, -0.2808570861816406, -0.26473236083984375, -0.24860763549804688, -0.23248291015625, -0.21635818481445312, -0.20023345947265625, -0.18410873413085938, -0.1679840087890625, -0.15185928344726562, -0.13573455810546875, -0.11960983276367188, -0.103485107421875, -0.08736038208007812, -0.07123565673828125, -0.055110931396484375, -0.0389862060546875, -0.022861480712890625, -0.00673675537109375, 0.009387969970703125, 0.0255126953125, 0.041637420654296875, 0.05776214599609375, 0.07388687133789062, 0.0900115966796875, 0.10613632202148438, 0.12226104736328125, 0.13838577270507812, 0.154510498046875, 0.17063522338867188, 0.18675994873046875, 0.20288467407226562, 0.2190093994140625, 0.23513412475585938, 0.25125885009765625, 0.2673835754394531, 0.28350830078125, 0.2996330261230469, 0.31575775146484375, 0.3318824768066406, 0.3480072021484375, 0.3641319274902344, 0.38025665283203125, 0.3963813781738281, 0.412506103515625, 0.4286308288574219, 0.44475555419921875, 0.4608802795410156, 0.4770050048828125, 0.4931297302246094, 0.5092544555664062, 0.5253791809082031, 0.54150390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 2.0, 10.0, 7.0, 15.0, 17.0, 31.0, 46.0, 74.0, 101.0, 165.0, 282.0, 506.0, 734.0, 708.0, 523.0, 305.0, 175.0, 104.0, 92.0, 53.0, 27.0, 18.0, 13.0, 13.0, 12.0, 9.0, 6.0, 10.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.318359375, -0.3056449890136719, -0.29293060302734375, -0.2802162170410156, -0.2675018310546875, -0.2547874450683594, -0.24207305908203125, -0.22935867309570312, -0.216644287109375, -0.20392990112304688, -0.19121551513671875, -0.17850112915039062, -0.1657867431640625, -0.15307235717773438, -0.14035797119140625, -0.12764358520507812, -0.11492919921875, -0.10221481323242188, -0.08950042724609375, -0.07678604125976562, -0.0640716552734375, -0.051357269287109375, -0.03864288330078125, -0.025928497314453125, -0.013214111328125, -0.000499725341796875, 0.01221466064453125, 0.024929046630859375, 0.0376434326171875, 0.050357818603515625, 0.06307220458984375, 0.07578659057617188, 0.0885009765625, 0.10121536254882812, 0.11392974853515625, 0.12664413452148438, 0.1393585205078125, 0.15207290649414062, 0.16478729248046875, 0.17750167846679688, 0.190216064453125, 0.20293045043945312, 0.21564483642578125, 0.22835922241210938, 0.2410736083984375, 0.2537879943847656, 0.26650238037109375, 0.2792167663574219, 0.29193115234375, 0.3046455383300781, 0.31735992431640625, 0.3300743103027344, 0.3427886962890625, 0.3555030822753906, 0.36821746826171875, 0.3809318542480469, 0.393646240234375, 0.4063606262207031, 0.41907501220703125, 0.4317893981933594, 0.4445037841796875, 0.4572181701660156, 0.46993255615234375, 0.4826469421386719, 0.495361328125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 15.0, 23.0, 65.0, 214.0, 319.0, 211.0, 87.0, 29.0, 9.0, 5.0, 9.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.889784812927246, -7.703793525695801, -7.517802715301514, -7.331811428070068, -7.145820140838623, -6.959829330444336, -6.773838043212891, -6.587846755981445, -6.40185546875, -6.215864181518555, -6.029873371124268, -5.843882083892822, -5.657890796661377, -5.47189998626709, -5.2859086990356445, -5.099917411804199, -4.913926601409912, -4.727935314178467, -4.54194450378418, -4.355953216552734, -4.169961929321289, -3.983970880508423, -3.7979798316955566, -3.6119885444641113, -3.425997495651245, -3.240006446838379, -3.0540151596069336, -2.8680241107940674, -2.682033061981201, -2.496041774749756, -2.3100507259368896, -2.1240596771240234, -1.93806791305542, -1.7520767450332642, -1.5660855770111084, -1.3800945281982422, -1.1941033601760864, -1.0081121921539307, -0.8221211433410645, -0.6361299753189087, -0.45013880729675293, -0.26414766907691956, -0.07815653085708618, 0.1078345775604248, 0.29382574558258057, 0.47981691360473633, 0.6658079624176025, 0.8517991304397583, 1.037790298461914, 1.2237814664840698, 1.4097726345062256, 1.5957636833190918, 1.7817548513412476, 1.9677460193634033, 2.1537370681762695, 2.339728355407715, 2.525719404220581, 2.7117104530334473, 2.8977017402648926, 3.083692789077759, 3.269683837890625, 3.4556751251220703, 3.6416661739349365, 3.8276572227478027, 4.013648509979248]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 8.0, 11.0, 17.0, 13.0, 16.0, 23.0, 26.0, 28.0, 41.0, 43.0, 44.0, 59.0, 45.0, 58.0, 65.0, 42.0, 52.0, 54.0, 54.0, 39.0, 55.0, 24.0, 26.0, 32.0, 16.0, 23.0, 17.0, 17.0, 13.0, 6.0, 7.0, 4.0, 1.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9379534721374512, -1.8723942041397095, -1.8068349361419678, -1.741275668144226, -1.6757164001464844, -1.6101572513580322, -1.5445979833602905, -1.4790387153625488, -1.4134794473648071, -1.3479201793670654, -1.2823609113693237, -1.216801643371582, -1.1512424945831299, -1.0856831073760986, -1.0201239585876465, -0.9545646905899048, -0.8890054225921631, -0.8234461545944214, -0.7578868865966797, -0.6923276782035828, -0.6267684102058411, -0.5612091422080994, -0.49564990401268005, -0.43009066581726074, -0.36453139781951904, -0.29897212982177734, -0.23341289162635803, -0.16785363852977753, -0.10229438543319702, -0.03673511743545532, 0.02882412075996399, 0.0943833589553833, 0.1599423885345459, 0.2255016416311264, 0.2910608947277069, 0.3566201329231262, 0.4221794009208679, 0.4877386689186096, 0.5532978773117065, 0.6188571453094482, 0.6844164133071899, 0.7499756813049316, 0.8155349493026733, 0.8810941576957703, 0.946653425693512, 1.0122127532958984, 1.0777719020843506, 1.1433311700820923, 1.208890438079834, 1.2744497060775757, 1.3400089740753174, 1.405568242073059, 1.4711275100708008, 1.536686658859253, 1.6022459268569946, 1.6678051948547363, 1.733364462852478, 1.7989237308502197, 1.8644829988479614, 1.9300422668457031, 1.9956014156341553, 2.0611608028411865, 2.1267199516296387, 2.19227933883667, 2.257838487625122]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 7.0, 4.0, 7.0, 3.0, 19.0, 20.0, 30.0, 37.0, 70.0, 108.0, 188.0, 391.0, 885.0, 2115.0, 6216.0, 23633.0, 110082.0, 446751.0, 356541.0, 76301.0, 16998.0, 4987.0, 1709.0, 695.0, 342.0, 154.0, 98.0, 49.0, 33.0, 23.0, 17.0, 6.0, 8.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.50244140625, -0.4871635437011719, -0.47188568115234375, -0.4566078186035156, -0.4413299560546875, -0.4260520935058594, -0.41077423095703125, -0.3954963684082031, -0.380218505859375, -0.3649406433105469, -0.34966278076171875, -0.3343849182128906, -0.3191070556640625, -0.3038291931152344, -0.28855133056640625, -0.2732734680175781, -0.25799560546875, -0.24271774291992188, -0.22743988037109375, -0.21216201782226562, -0.1968841552734375, -0.18160629272460938, -0.16632843017578125, -0.15105056762695312, -0.135772705078125, -0.12049484252929688, -0.10521697998046875, -0.08993911743164062, -0.0746612548828125, -0.059383392333984375, -0.04410552978515625, -0.028827667236328125, -0.0135498046875, 0.001728057861328125, 0.01700592041015625, 0.032283782958984375, 0.0475616455078125, 0.06283950805664062, 0.07811737060546875, 0.09339523315429688, 0.108673095703125, 0.12395095825195312, 0.13922882080078125, 0.15450668334960938, 0.1697845458984375, 0.18506240844726562, 0.20034027099609375, 0.21561813354492188, 0.23089599609375, 0.24617385864257812, 0.26145172119140625, 0.2767295837402344, 0.2920074462890625, 0.3072853088378906, 0.32256317138671875, 0.3378410339355469, 0.353118896484375, 0.3683967590332031, 0.38367462158203125, 0.3989524841308594, 0.4142303466796875, 0.4295082092285156, 0.44478607177734375, 0.4600639343261719, 0.475341796875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 8.0, 11.0, 11.0, 13.0, 15.0, 21.0, 16.0, 28.0, 26.0, 37.0, 32.0, 48.0, 59.0, 63.0, 53.0, 46.0, 51.0, 59.0, 50.0, 50.0, 51.0, 47.0, 42.0, 25.0, 28.0, 24.0, 21.0, 20.0, 7.0, 12.0, 5.0, 7.0, 7.0, 9.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1572265625, -0.15021896362304688, -0.14321136474609375, -0.13620376586914062, -0.1291961669921875, -0.12218856811523438, -0.11518096923828125, -0.10817337036132812, -0.101165771484375, -0.09415817260742188, -0.08715057373046875, -0.08014297485351562, -0.0731353759765625, -0.06612777709960938, -0.05912017822265625, -0.052112579345703125, -0.04510498046875, -0.038097381591796875, -0.03108978271484375, -0.024082183837890625, -0.0170745849609375, -0.010066986083984375, -0.00305938720703125, 0.003948211669921875, 0.010955810546875, 0.017963409423828125, 0.02497100830078125, 0.031978607177734375, 0.0389862060546875, 0.045993804931640625, 0.05300140380859375, 0.060009002685546875, 0.0670166015625, 0.07402420043945312, 0.08103179931640625, 0.08803939819335938, 0.0950469970703125, 0.10205459594726562, 0.10906219482421875, 0.11606979370117188, 0.123077392578125, 0.13008499145507812, 0.13709259033203125, 0.14410018920898438, 0.1511077880859375, 0.15811538696289062, 0.16512298583984375, 0.17213058471679688, 0.17913818359375, 0.18614578247070312, 0.19315338134765625, 0.20016098022460938, 0.2071685791015625, 0.21417617797851562, 0.22118377685546875, 0.22819137573242188, 0.235198974609375, 0.24220657348632812, 0.24921417236328125, 0.2562217712402344, 0.2632293701171875, 0.2702369689941406, 0.27724456787109375, 0.2842521667480469, 0.291259765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 11.0, 13.0, 19.0, 19.0, 30.0, 59.0, 64.0, 110.0, 190.0, 372.0, 815.0, 2305.0, 8158.0, 41149.0, 281695.0, 616222.0, 78070.0, 13457.0, 3577.0, 1104.0, 447.0, 227.0, 150.0, 97.0, 58.0, 40.0, 24.0, 16.0, 12.0, 12.0, 4.0, 6.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5711593627929688, -0.5539398193359375, -0.5367202758789062, -0.519500732421875, -0.5022811889648438, -0.4850616455078125, -0.46784210205078125, -0.45062255859375, -0.43340301513671875, -0.4161834716796875, -0.39896392822265625, -0.381744384765625, -0.36452484130859375, -0.3473052978515625, -0.33008575439453125, -0.3128662109375, -0.29564666748046875, -0.2784271240234375, -0.26120758056640625, -0.243988037109375, -0.22676849365234375, -0.2095489501953125, -0.19232940673828125, -0.17510986328125, -0.15789031982421875, -0.1406707763671875, -0.12345123291015625, -0.106231689453125, -0.08901214599609375, -0.0717926025390625, -0.05457305908203125, -0.037353515625, -0.02013397216796875, -0.0029144287109375, 0.01430511474609375, 0.031524658203125, 0.04874420166015625, 0.0659637451171875, 0.08318328857421875, 0.10040283203125, 0.11762237548828125, 0.1348419189453125, 0.15206146240234375, 0.169281005859375, 0.18650054931640625, 0.2037200927734375, 0.22093963623046875, 0.2381591796875, 0.25537872314453125, 0.2725982666015625, 0.28981781005859375, 0.307037353515625, 0.32425689697265625, 0.3414764404296875, 0.35869598388671875, 0.37591552734375, 0.39313507080078125, 0.4103546142578125, 0.42757415771484375, 0.444793701171875, 0.46201324462890625, 0.4792327880859375, 0.49645233154296875, 0.513671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 11.0, 7.0, 14.0, 9.0, 16.0, 30.0, 37.0, 28.0, 42.0, 42.0, 56.0, 59.0, 60.0, 62.0, 62.0, 62.0, 61.0, 61.0, 47.0, 40.0, 38.0, 32.0, 20.0, 21.0, 15.0, 17.0, 14.0, 10.0, 1.0, 7.0, 7.0, 2.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.90234375, -0.8760910034179688, -0.8498382568359375, -0.8235855102539062, -0.797332763671875, -0.7710800170898438, -0.7448272705078125, -0.7185745239257812, -0.69232177734375, -0.6660690307617188, -0.6398162841796875, -0.6135635375976562, -0.587310791015625, -0.5610580444335938, -0.5348052978515625, -0.5085525512695312, -0.4822998046875, -0.45604705810546875, -0.4297943115234375, -0.40354156494140625, -0.377288818359375, -0.35103607177734375, -0.3247833251953125, -0.29853057861328125, -0.27227783203125, -0.24602508544921875, -0.2197723388671875, -0.19351959228515625, -0.167266845703125, -0.14101409912109375, -0.1147613525390625, -0.08850860595703125, -0.062255859375, -0.03600311279296875, -0.0097503662109375, 0.01650238037109375, 0.042755126953125, 0.06900787353515625, 0.0952606201171875, 0.12151336669921875, 0.14776611328125, 0.17401885986328125, 0.2002716064453125, 0.22652435302734375, 0.252777099609375, 0.27902984619140625, 0.3052825927734375, 0.33153533935546875, 0.3577880859375, 0.38404083251953125, 0.4102935791015625, 0.43654632568359375, 0.462799072265625, 0.48905181884765625, 0.5153045654296875, 0.5415573120117188, 0.56781005859375, 0.5940628051757812, 0.6203155517578125, 0.6465682983398438, 0.672821044921875, 0.6990737915039062, 0.7253265380859375, 0.7515792846679688, 0.77783203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 9.0, 15.0, 9.0, 11.0, 35.0, 46.0, 88.0, 142.0, 238.0, 636.0, 1704.0, 6870.0, 39260.0, 380875.0, 565805.0, 42429.0, 7180.0, 1884.0, 678.0, 272.0, 133.0, 86.0, 41.0, 27.0, 17.0, 13.0, 12.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.195556640625, -0.1896343231201172, -0.18371200561523438, -0.17778968811035156, -0.17186737060546875, -0.16594505310058594, -0.16002273559570312, -0.1541004180908203, -0.1481781005859375, -0.1422557830810547, -0.13633346557617188, -0.13041114807128906, -0.12448883056640625, -0.11856651306152344, -0.11264419555664062, -0.10672187805175781, -0.100799560546875, -0.09487724304199219, -0.08895492553710938, -0.08303260803222656, -0.07711029052734375, -0.07118797302246094, -0.06526565551757812, -0.05934333801269531, -0.0534210205078125, -0.04749870300292969, -0.041576385498046875, -0.03565406799316406, -0.02973175048828125, -0.023809432983398438, -0.017887115478515625, -0.011964797973632812, -0.00604248046875, -0.0001201629638671875, 0.005802154541015625, 0.011724472045898438, 0.01764678955078125, 0.023569107055664062, 0.029491424560546875, 0.03541374206542969, 0.0413360595703125, 0.04725837707519531, 0.053180694580078125, 0.05910301208496094, 0.06502532958984375, 0.07094764709472656, 0.07686996459960938, 0.08279228210449219, 0.088714599609375, 0.09463691711425781, 0.10055923461914062, 0.10648155212402344, 0.11240386962890625, 0.11832618713378906, 0.12424850463867188, 0.1301708221435547, 0.1360931396484375, 0.1420154571533203, 0.14793777465820312, 0.15386009216308594, 0.15978240966796875, 0.16570472717285156, 0.17162704467773438, 0.1775493621826172, 0.1834716796875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 9.0, 9.0, 12.0, 17.0, 21.0, 38.0, 44.0, 49.0, 65.0, 95.0, 89.0, 98.0, 96.0, 83.0, 74.0, 40.0, 38.0, 33.0, 25.0, 8.0, 15.0, 5.0, 7.0, 5.0, 3.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.607439041137695e-05, -4.4452957808971405e-05, -4.283152520656586e-05, -4.121009260416031e-05, -3.958866000175476e-05, -3.796722739934921e-05, -3.6345794796943665e-05, -3.4724362194538116e-05, -3.310292959213257e-05, -3.148149698972702e-05, -2.9860064387321472e-05, -2.8238631784915924e-05, -2.6617199182510376e-05, -2.4995766580104828e-05, -2.337433397769928e-05, -2.175290137529373e-05, -2.0131468772888184e-05, -1.8510036170482635e-05, -1.6888603568077087e-05, -1.526717096567154e-05, -1.3645738363265991e-05, -1.2024305760860443e-05, -1.0402873158454895e-05, -8.781440556049347e-06, -7.160007953643799e-06, -5.538575351238251e-06, -3.917142748832703e-06, -2.2957101464271545e-06, -6.742775440216064e-07, 9.471550583839417e-07, 2.5685876607894897e-06, 4.190020263195038e-06, 5.811452865600586e-06, 7.432885468006134e-06, 9.054318070411682e-06, 1.067575067281723e-05, 1.2297183275222778e-05, 1.3918615877628326e-05, 1.5540048480033875e-05, 1.7161481082439423e-05, 1.878291368484497e-05, 2.040434628725052e-05, 2.2025778889656067e-05, 2.3647211492061615e-05, 2.5268644094467163e-05, 2.689007669687271e-05, 2.851150929927826e-05, 3.0132941901683807e-05, 3.1754374504089355e-05, 3.3375807106494904e-05, 3.499723970890045e-05, 3.6618672311306e-05, 3.824010491371155e-05, 3.9861537516117096e-05, 4.1482970118522644e-05, 4.310440272092819e-05, 4.472583532333374e-05, 4.634726792573929e-05, 4.7968700528144836e-05, 4.9590133130550385e-05, 5.121156573295593e-05, 5.283299833536148e-05, 5.445443093776703e-05, 5.607586354017258e-05, 5.7697296142578125e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 10.0, 4.0, 13.0, 8.0, 23.0, 48.0, 89.0, 234.0, 713.0, 3887.0, 50881.0, 906619.0, 79655.0, 5028.0, 853.0, 267.0, 92.0, 54.0, 33.0, 25.0, 9.0, 10.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28271484375, -0.27207183837890625, -0.2614288330078125, -0.25078582763671875, -0.240142822265625, -0.22949981689453125, -0.2188568115234375, -0.20821380615234375, -0.19757080078125, -0.18692779541015625, -0.1762847900390625, -0.16564178466796875, -0.154998779296875, -0.14435577392578125, -0.1337127685546875, -0.12306976318359375, -0.1124267578125, -0.10178375244140625, -0.0911407470703125, -0.08049774169921875, -0.069854736328125, -0.05921173095703125, -0.0485687255859375, -0.03792572021484375, -0.02728271484375, -0.01663970947265625, -0.0059967041015625, 0.00464630126953125, 0.015289306640625, 0.02593231201171875, 0.0365753173828125, 0.04721832275390625, 0.057861328125, 0.06850433349609375, 0.0791473388671875, 0.08979034423828125, 0.100433349609375, 0.11107635498046875, 0.1217193603515625, 0.13236236572265625, 0.14300537109375, 0.15364837646484375, 0.1642913818359375, 0.17493438720703125, 0.185577392578125, 0.19622039794921875, 0.2068634033203125, 0.21750640869140625, 0.2281494140625, 0.23879241943359375, 0.2494354248046875, 0.26007843017578125, 0.270721435546875, 0.28136444091796875, 0.2920074462890625, 0.30265045166015625, 0.31329345703125, 0.32393646240234375, 0.3345794677734375, 0.34522247314453125, 0.355865478515625, 0.36650848388671875, 0.3771514892578125, 0.38779449462890625, 0.3984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 8.0, 4.0, 12.0, 19.0, 21.0, 36.0, 49.0, 69.0, 83.0, 105.0, 104.0, 115.0, 89.0, 91.0, 44.0, 34.0, 25.0, 27.0, 20.0, 10.0, 9.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1514892578125, -0.14542007446289062, -0.13935089111328125, -0.13328170776367188, -0.1272125244140625, -0.12114334106445312, -0.11507415771484375, -0.10900497436523438, -0.102935791015625, -0.09686660766601562, -0.09079742431640625, -0.08472824096679688, -0.0786590576171875, -0.07258987426757812, -0.06652069091796875, -0.060451507568359375, -0.05438232421875, -0.048313140869140625, -0.04224395751953125, -0.036174774169921875, -0.0301055908203125, -0.024036407470703125, -0.01796722412109375, -0.011898040771484375, -0.005828857421875, 0.000240325927734375, 0.00630950927734375, 0.012378692626953125, 0.0184478759765625, 0.024517059326171875, 0.03058624267578125, 0.036655426025390625, 0.042724609375, 0.048793792724609375, 0.05486297607421875, 0.060932159423828125, 0.0670013427734375, 0.07307052612304688, 0.07913970947265625, 0.08520889282226562, 0.091278076171875, 0.09734725952148438, 0.10341644287109375, 0.10948562622070312, 0.1155548095703125, 0.12162399291992188, 0.12769317626953125, 0.13376235961914062, 0.13983154296875, 0.14590072631835938, 0.15196990966796875, 0.15803909301757812, 0.1641082763671875, 0.17017745971679688, 0.17624664306640625, 0.18231582641601562, 0.188385009765625, 0.19445419311523438, 0.20052337646484375, 0.20659255981445312, 0.2126617431640625, 0.21873092651367188, 0.22480010986328125, 0.23086929321289062, 0.2369384765625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 14.0, 18.0, 46.0, 88.0, 151.0, 271.0, 199.0, 97.0, 46.0, 29.0, 7.0, 8.0, 4.0, 5.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4549970626831055, -4.326457500457764, -4.19791841506958, -4.069378852844238, -3.9408395290374756, -3.812300205230713, -3.683760643005371, -3.5552213191986084, -3.4266819953918457, -3.298142671585083, -3.169603109359741, -3.0410637855529785, -2.912524461746216, -2.783985137939453, -2.6554455757141113, -2.5269062519073486, -2.398366689682007, -2.269827365875244, -2.1412878036499023, -2.0127484798431396, -1.884209156036377, -1.7556697130203247, -1.6271302700042725, -1.4985909461975098, -1.3700515031814575, -1.2415120601654053, -1.1129727363586426, -0.9844332933425903, -0.8558939099311829, -0.7273545265197754, -0.5988150835037231, -0.4702757000923157, -0.3417363166809082, -0.21319691836833954, -0.08465752005577087, 0.043881893157958984, 0.17242127656936646, 0.3009606599807739, 0.42950010299682617, 0.5580394864082336, 0.6865788698196411, 0.8151182532310486, 0.943657636642456, 1.0721970796585083, 1.2007365226745605, 1.3292758464813232, 1.4578152894973755, 1.5863547325134277, 1.7148940563201904, 1.8434334993362427, 1.9719728231430054, 2.1005122661590576, 2.2290515899658203, 2.357591152191162, 2.486130475997925, 2.6146697998046875, 2.7432093620300293, 2.871748685836792, 3.000288248062134, 3.1288275718688965, 3.257366895675659, 3.385906219482422, 3.5144457817077637, 3.6429851055145264, 3.771524429321289]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 8.0, 2.0, 14.0, 18.0, 17.0, 23.0, 21.0, 34.0, 32.0, 43.0, 60.0, 59.0, 80.0, 104.0, 115.0, 71.0, 70.0, 36.0, 43.0, 40.0, 29.0, 20.0, 16.0, 15.0, 11.0, 9.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6192779541015625, -4.4971842765808105, -4.375090599060059, -4.252996444702148, -4.1309027671813965, -4.0088090896606445, -3.8867154121398926, -3.7646217346191406, -3.6425278186798096, -3.5204341411590576, -3.3983402252197266, -3.2762465476989746, -3.1541528701782227, -3.0320589542388916, -2.9099652767181396, -2.7878713607788086, -2.6657776832580566, -2.5436840057373047, -2.4215900897979736, -2.2994964122772217, -2.1774024963378906, -2.0553088188171387, -1.9332151412963867, -1.8111213445663452, -1.6890275478363037, -1.5669337511062622, -1.4448399543762207, -1.3227462768554688, -1.2006524801254272, -1.0785586833953857, -0.956464946269989, -0.8343712091445923, -0.7122771739959717, -0.5901833772659302, -0.46808964014053345, -0.34599587321281433, -0.22390210628509521, -0.10180830955505371, 0.020285427570343018, 0.14237916469573975, 0.26447296142578125, 0.38656672835350037, 0.5086604952812195, 0.6307542324066162, 0.7528480291366577, 0.8749418258666992, 0.997035562992096, 1.1191293001174927, 1.2412230968475342, 1.3633168935775757, 1.4854106903076172, 1.6075043678283691, 1.7295981645584106, 1.8516919612884521, 1.973785638809204, 2.095879554748535, 2.217973232269287, 2.340066909790039, 2.46216082572937, 2.584254503250122, 2.706348419189453, 2.828442096710205, 2.950535774230957, 3.072629451751709, 3.19472336769104]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 4.0, 2.0, 5.0, 10.0, 10.0, 15.0, 32.0, 56.0, 68.0, 125.0, 192.0, 316.0, 601.0, 984.0, 1821.0, 4340.0, 12114.0, 51170.0, 322979.0, 2020976.0, 1511338.0, 215208.0, 35854.0, 9134.0, 3465.0, 1569.0, 790.0, 394.0, 277.0, 142.0, 87.0, 61.0, 53.0, 22.0, 17.0, 14.0, 9.0, 11.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2261962890625, -0.21910476684570312, -0.21201324462890625, -0.20492172241210938, -0.1978302001953125, -0.19073867797851562, -0.18364715576171875, -0.17655563354492188, -0.169464111328125, -0.16237258911132812, -0.15528106689453125, -0.14818954467773438, -0.1410980224609375, -0.13400650024414062, -0.12691497802734375, -0.11982345581054688, -0.11273193359375, -0.10564041137695312, -0.09854888916015625, -0.09145736694335938, -0.0843658447265625, -0.07727432250976562, -0.07018280029296875, -0.06309127807617188, -0.055999755859375, -0.048908233642578125, -0.04181671142578125, -0.034725189208984375, -0.0276336669921875, -0.020542144775390625, -0.01345062255859375, -0.006359100341796875, 0.000732421875, 0.007823944091796875, 0.01491546630859375, 0.022006988525390625, 0.0290985107421875, 0.036190032958984375, 0.04328155517578125, 0.050373077392578125, 0.057464599609375, 0.06455612182617188, 0.07164764404296875, 0.07873916625976562, 0.0858306884765625, 0.09292221069335938, 0.10001373291015625, 0.10710525512695312, 0.11419677734375, 0.12128829956054688, 0.12837982177734375, 0.13547134399414062, 0.1425628662109375, 0.14965438842773438, 0.15674591064453125, 0.16383743286132812, 0.170928955078125, 0.17802047729492188, 0.18511199951171875, 0.19220352172851562, 0.1992950439453125, 0.20638656616210938, 0.21347808837890625, 0.22056961059570312, 0.2276611328125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 5.0, 14.0, 12.0, 11.0, 8.0, 16.0, 13.0, 19.0, 23.0, 40.0, 30.0, 56.0, 40.0, 45.0, 49.0, 41.0, 53.0, 51.0, 49.0, 49.0, 42.0, 51.0, 26.0, 43.0, 33.0, 33.0, 17.0, 16.0, 21.0, 16.0, 13.0, 13.0, 11.0, 6.0, 3.0, 10.0, 2.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1588134765625, -0.15280532836914062, -0.14679718017578125, -0.14078903198242188, -0.1347808837890625, -0.12877273559570312, -0.12276458740234375, -0.11675643920898438, -0.110748291015625, -0.10474014282226562, -0.09873199462890625, -0.09272384643554688, -0.0867156982421875, -0.08070755004882812, -0.07469940185546875, -0.06869125366210938, -0.06268310546875, -0.056674957275390625, -0.05066680908203125, -0.044658660888671875, -0.0386505126953125, -0.032642364501953125, -0.02663421630859375, -0.020626068115234375, -0.014617919921875, -0.008609771728515625, -0.00260162353515625, 0.003406524658203125, 0.0094146728515625, 0.015422821044921875, 0.02143096923828125, 0.027439117431640625, 0.033447265625, 0.039455413818359375, 0.04546356201171875, 0.051471710205078125, 0.0574798583984375, 0.06348800659179688, 0.06949615478515625, 0.07550430297851562, 0.081512451171875, 0.08752059936523438, 0.09352874755859375, 0.09953689575195312, 0.1055450439453125, 0.11155319213867188, 0.11756134033203125, 0.12356948852539062, 0.12957763671875, 0.13558578491210938, 0.14159393310546875, 0.14760208129882812, 0.1536102294921875, 0.15961837768554688, 0.16562652587890625, 0.17163467407226562, 0.177642822265625, 0.18365097045898438, 0.18965911865234375, 0.19566726684570312, 0.2016754150390625, 0.20768356323242188, 0.21369171142578125, 0.21969985961914062, 0.2257080078125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 12.0, 12.0, 14.0, 25.0, 39.0, 69.0, 125.0, 278.0, 616.0, 1696.0, 7777.0, 80966.0, 3441166.0, 632076.0, 23806.0, 3694.0, 996.0, 398.0, 193.0, 129.0, 61.0, 43.0, 26.0, 13.0, 12.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59130859375, -0.5747756958007812, -0.5582427978515625, -0.5417098999023438, -0.525177001953125, -0.5086441040039062, -0.4921112060546875, -0.47557830810546875, -0.45904541015625, -0.44251251220703125, -0.4259796142578125, -0.40944671630859375, -0.392913818359375, -0.37638092041015625, -0.3598480224609375, -0.34331512451171875, -0.3267822265625, -0.31024932861328125, -0.2937164306640625, -0.27718353271484375, -0.260650634765625, -0.24411773681640625, -0.2275848388671875, -0.21105194091796875, -0.19451904296875, -0.17798614501953125, -0.1614532470703125, -0.14492034912109375, -0.128387451171875, -0.11185455322265625, -0.0953216552734375, -0.07878875732421875, -0.062255859375, -0.04572296142578125, -0.0291900634765625, -0.01265716552734375, 0.003875732421875, 0.02040863037109375, 0.0369415283203125, 0.05347442626953125, 0.07000732421875, 0.08654022216796875, 0.1030731201171875, 0.11960601806640625, 0.136138916015625, 0.15267181396484375, 0.1692047119140625, 0.18573760986328125, 0.2022705078125, 0.21880340576171875, 0.2353363037109375, 0.25186920166015625, 0.268402099609375, 0.28493499755859375, 0.3014678955078125, 0.31800079345703125, 0.33453369140625, 0.35106658935546875, 0.3675994873046875, 0.38413238525390625, 0.400665283203125, 0.41719818115234375, 0.4337310791015625, 0.45026397705078125, 0.466796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 7.0, 8.0, 22.0, 24.0, 39.0, 64.0, 141.0, 288.0, 503.0, 861.0, 940.0, 557.0, 255.0, 145.0, 79.0, 42.0, 45.0, 19.0, 16.0, 4.0, 4.0, 9.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400146484375, -0.3841590881347656, -0.36817169189453125, -0.3521842956542969, -0.3361968994140625, -0.3202095031738281, -0.30422210693359375, -0.2882347106933594, -0.272247314453125, -0.2562599182128906, -0.24027252197265625, -0.22428512573242188, -0.2082977294921875, -0.19231033325195312, -0.17632293701171875, -0.16033554077148438, -0.14434814453125, -0.12836074829101562, -0.11237335205078125, -0.09638595581054688, -0.0803985595703125, -0.06441116333007812, -0.04842376708984375, -0.032436370849609375, -0.016448974609375, -0.000461578369140625, 0.01552581787109375, 0.031513214111328125, 0.0475006103515625, 0.06348800659179688, 0.07947540283203125, 0.09546279907226562, 0.1114501953125, 0.12743759155273438, 0.14342498779296875, 0.15941238403320312, 0.1753997802734375, 0.19138717651367188, 0.20737457275390625, 0.22336196899414062, 0.239349365234375, 0.2553367614746094, 0.27132415771484375, 0.2873115539550781, 0.3032989501953125, 0.3192863464355469, 0.33527374267578125, 0.3512611389160156, 0.36724853515625, 0.3832359313964844, 0.39922332763671875, 0.4152107238769531, 0.4311981201171875, 0.4471855163574219, 0.46317291259765625, 0.4791603088378906, 0.495147705078125, 0.5111351013183594, 0.5271224975585938, 0.5431098937988281, 0.5590972900390625, 0.5750846862792969, 0.5910720825195312, 0.6070594787597656, 0.623046875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 11.0, 18.0, 69.0, 147.0, 260.0, 263.0, 114.0, 64.0, 32.0, 15.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.004892349243164, -5.853524684906006, -5.702157497406006, -5.550789833068848, -5.399422645568848, -5.2480549812316895, -5.096687316894531, -4.945320129394531, -4.793952465057373, -4.642584800720215, -4.491217613220215, -4.339849948883057, -4.188482761383057, -4.037115097045898, -3.8857476711273193, -3.7343802452087402, -3.583012819290161, -3.431645393371582, -3.280277967453003, -3.128910541534424, -2.9775428771972656, -2.8261754512786865, -2.6748080253601074, -2.523440361022949, -2.372073173522949, -2.22070574760437, -2.069338321685791, -1.9179707765579224, -1.7666032314300537, -1.6152358055114746, -1.4638683795928955, -1.3125008344650269, -1.1611332893371582, -1.009765863418579, -0.8583983182907104, -0.7070308923721313, -0.5556634068489075, -0.4042959213256836, -0.2529284954071045, -0.10156095027923584, 0.04980647563934326, 0.20117394626140594, 0.35254141688346863, 0.5039088726043701, 0.655276358127594, 0.8066438436508179, 0.958011269569397, 1.1093788146972656, 1.2607462406158447, 1.4121136665344238, 1.5634812116622925, 1.7148486375808716, 1.8662161827087402, 2.0175836086273193, 2.1689510345458984, 2.3203186988830566, 2.4716858863830566, 2.6230533123016357, 2.774420738220215, 2.925788402557373, 3.077155828475952, 3.2285232543945312, 3.3798906803131104, 3.5312581062316895, 3.6826257705688477]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 11.0, 13.0, 14.0, 18.0, 20.0, 34.0, 37.0, 29.0, 46.0, 50.0, 41.0, 64.0, 49.0, 50.0, 65.0, 60.0, 60.0, 48.0, 48.0, 40.0, 40.0, 30.0, 23.0, 19.0, 13.0, 13.0, 9.0, 12.0, 5.0, 9.0, 4.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5020151138305664, -1.4444628953933716, -1.3869106769561768, -1.3293583393096924, -1.2718061208724976, -1.2142539024353027, -1.156701683998108, -1.099149465560913, -1.0415971279144287, -0.9840449094772339, -0.9264926314353943, -0.8689404129981995, -0.8113881349563599, -0.753835916519165, -0.6962836980819702, -0.6387314200401306, -0.5811792016029358, -0.523626983165741, -0.46607470512390137, -0.40852248668670654, -0.35097020864486694, -0.2934179902076721, -0.2358657419681549, -0.1783134937286377, -0.12076124548912048, -0.06320899724960327, -0.0056567564606666565, 0.05189548432826996, 0.10944773256778717, 0.1669999659061432, 0.2245522141456604, 0.2821044623851776, 0.3396567106246948, 0.39720895886421204, 0.45476120710372925, 0.5123134255409241, 0.5698657035827637, 0.6274179220199585, 0.6849701404571533, 0.7425224184989929, 0.8000746965408325, 0.8576269149780273, 0.9151791930198669, 0.9727314114570618, 1.0302836894989014, 1.0878359079360962, 1.145388126373291, 1.2029404640197754, 1.2604925632476807, 1.3180447816848755, 1.3755970001220703, 1.4331493377685547, 1.4907015562057495, 1.5482537746429443, 1.6058059930801392, 1.663358211517334, 1.7209105491638184, 1.7784627676010132, 1.836014986038208, 1.8935673236846924, 1.9511195421218872, 2.008671760559082, 2.0662240982055664, 2.1237761974334717, 2.181328535079956]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 11.0, 25.0, 44.0, 88.0, 168.0, 433.0, 1176.0, 4394.0, 22638.0, 166375.0, 652224.0, 171126.0, 23301.0, 4535.0, 1201.0, 448.0, 176.0, 80.0, 61.0, 17.0, 12.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3798828125, -0.361358642578125, -0.34283447265625, -0.324310302734375, -0.3057861328125, -0.287261962890625, -0.26873779296875, -0.250213623046875, -0.231689453125, -0.213165283203125, -0.19464111328125, -0.176116943359375, -0.1575927734375, -0.139068603515625, -0.12054443359375, -0.102020263671875, -0.08349609375, -0.064971923828125, -0.04644775390625, -0.027923583984375, -0.0093994140625, 0.009124755859375, 0.02764892578125, 0.046173095703125, 0.064697265625, 0.083221435546875, 0.10174560546875, 0.120269775390625, 0.1387939453125, 0.157318115234375, 0.17584228515625, 0.194366455078125, 0.212890625, 0.231414794921875, 0.24993896484375, 0.268463134765625, 0.2869873046875, 0.305511474609375, 0.32403564453125, 0.342559814453125, 0.361083984375, 0.379608154296875, 0.39813232421875, 0.416656494140625, 0.4351806640625, 0.453704833984375, 0.47222900390625, 0.490753173828125, 0.50927734375, 0.527801513671875, 0.54632568359375, 0.564849853515625, 0.5833740234375, 0.601898193359375, 0.62042236328125, 0.638946533203125, 0.657470703125, 0.675994873046875, 0.69451904296875, 0.713043212890625, 0.7315673828125, 0.750091552734375, 0.76861572265625, 0.787139892578125, 0.8056640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 13.0, 11.0, 17.0, 11.0, 18.0, 20.0, 24.0, 40.0, 61.0, 46.0, 49.0, 43.0, 35.0, 55.0, 39.0, 61.0, 38.0, 51.0, 51.0, 38.0, 35.0, 38.0, 28.0, 30.0, 22.0, 19.0, 17.0, 15.0, 10.0, 10.0, 11.0, 8.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.196044921875, -0.1895313262939453, -0.18301773071289062, -0.17650413513183594, -0.16999053955078125, -0.16347694396972656, -0.15696334838867188, -0.1504497528076172, -0.1439361572265625, -0.1374225616455078, -0.13090896606445312, -0.12439537048339844, -0.11788177490234375, -0.11136817932128906, -0.10485458374023438, -0.09834098815917969, -0.091827392578125, -0.08531379699707031, -0.07880020141601562, -0.07228660583496094, -0.06577301025390625, -0.05925941467285156, -0.052745819091796875, -0.04623222351074219, -0.0397186279296875, -0.03320503234863281, -0.026691436767578125, -0.020177841186523438, -0.01366424560546875, -0.0071506500244140625, -0.000637054443359375, 0.0058765411376953125, 0.01239013671875, 0.018903732299804688, 0.025417327880859375, 0.03193092346191406, 0.03844451904296875, 0.04495811462402344, 0.051471710205078125, 0.05798530578613281, 0.0644989013671875, 0.07101249694824219, 0.07752609252929688, 0.08403968811035156, 0.09055328369140625, 0.09706687927246094, 0.10358047485351562, 0.11009407043457031, 0.116607666015625, 0.12312126159667969, 0.12963485717773438, 0.13614845275878906, 0.14266204833984375, 0.14917564392089844, 0.15568923950195312, 0.1622028350830078, 0.1687164306640625, 0.1752300262451172, 0.18174362182617188, 0.18825721740722656, 0.19477081298828125, 0.20128440856933594, 0.20779800415039062, 0.2143115997314453, 0.2208251953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 8.0, 9.0, 10.0, 11.0, 16.0, 22.0, 25.0, 38.0, 67.0, 76.0, 100.0, 125.0, 211.0, 300.0, 443.0, 734.0, 1265.0, 3076.0, 9974.0, 45894.0, 287425.0, 607616.0, 69895.0, 13635.0, 3777.0, 1546.0, 753.0, 440.0, 313.0, 202.0, 161.0, 111.0, 70.0, 49.0, 38.0, 27.0, 23.0, 18.0, 17.0, 3.0, 4.0, 5.0, 3.0, 5.0, 6.0, 2.0, 5.0, 0.0, 0.0, 3.0, 1.0, 3.0], "bins": [-0.492431640625, -0.47756195068359375, -0.4626922607421875, -0.44782257080078125, -0.432952880859375, -0.41808319091796875, -0.4032135009765625, -0.38834381103515625, -0.37347412109375, -0.35860443115234375, -0.3437347412109375, -0.32886505126953125, -0.313995361328125, -0.29912567138671875, -0.2842559814453125, -0.26938629150390625, -0.2545166015625, -0.23964691162109375, -0.2247772216796875, -0.20990753173828125, -0.195037841796875, -0.18016815185546875, -0.1652984619140625, -0.15042877197265625, -0.13555908203125, -0.12068939208984375, -0.1058197021484375, -0.09095001220703125, -0.076080322265625, -0.06121063232421875, -0.0463409423828125, -0.03147125244140625, -0.0166015625, -0.00173187255859375, 0.0131378173828125, 0.02800750732421875, 0.042877197265625, 0.05774688720703125, 0.0726165771484375, 0.08748626708984375, 0.10235595703125, 0.11722564697265625, 0.1320953369140625, 0.14696502685546875, 0.161834716796875, 0.17670440673828125, 0.1915740966796875, 0.20644378662109375, 0.2213134765625, 0.23618316650390625, 0.2510528564453125, 0.26592254638671875, 0.280792236328125, 0.29566192626953125, 0.3105316162109375, 0.32540130615234375, 0.34027099609375, 0.35514068603515625, 0.3700103759765625, 0.38488006591796875, 0.399749755859375, 0.41461944580078125, 0.4294891357421875, 0.44435882568359375, 0.459228515625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 9.0, 12.0, 13.0, 14.0, 20.0, 34.0, 27.0, 25.0, 36.0, 44.0, 36.0, 41.0, 59.0, 55.0, 61.0, 56.0, 57.0, 45.0, 58.0, 54.0, 47.0, 29.0, 27.0, 20.0, 24.0, 22.0, 10.0, 9.0, 12.0, 10.0, 8.0, 5.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.9697265625, -0.9449844360351562, -0.9202423095703125, -0.8955001831054688, -0.870758056640625, -0.8460159301757812, -0.8212738037109375, -0.7965316772460938, -0.77178955078125, -0.7470474243164062, -0.7223052978515625, -0.6975631713867188, -0.672821044921875, -0.6480789184570312, -0.6233367919921875, -0.5985946655273438, -0.5738525390625, -0.5491104125976562, -0.5243682861328125, -0.49962615966796875, -0.474884033203125, -0.45014190673828125, -0.4253997802734375, -0.40065765380859375, -0.37591552734375, -0.35117340087890625, -0.3264312744140625, -0.30168914794921875, -0.276947021484375, -0.25220489501953125, -0.2274627685546875, -0.20272064208984375, -0.177978515625, -0.15323638916015625, -0.1284942626953125, -0.10375213623046875, -0.079010009765625, -0.05426788330078125, -0.0295257568359375, -0.00478363037109375, 0.01995849609375, 0.04470062255859375, 0.0694427490234375, 0.09418487548828125, 0.118927001953125, 0.14366912841796875, 0.1684112548828125, 0.19315338134765625, 0.2178955078125, 0.24263763427734375, 0.2673797607421875, 0.29212188720703125, 0.316864013671875, 0.34160614013671875, 0.3663482666015625, 0.39109039306640625, 0.41583251953125, 0.44057464599609375, 0.4653167724609375, 0.49005889892578125, 0.514801025390625, 0.5395431518554688, 0.5642852783203125, 0.5890274047851562, 0.61376953125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 7.0, 5.0, 17.0, 19.0, 25.0, 30.0, 54.0, 101.0, 175.0, 383.0, 698.0, 1858.0, 5313.0, 19472.0, 97365.0, 755584.0, 133170.0, 23898.0, 6396.0, 2199.0, 874.0, 395.0, 190.0, 127.0, 55.0, 43.0, 21.0, 20.0, 12.0, 7.0, 10.0, 6.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1561279296875, -0.15102195739746094, -0.14591598510742188, -0.1408100128173828, -0.13570404052734375, -0.1305980682373047, -0.12549209594726562, -0.12038612365722656, -0.1152801513671875, -0.11017417907714844, -0.10506820678710938, -0.09996223449707031, -0.09485626220703125, -0.08975028991699219, -0.08464431762695312, -0.07953834533691406, -0.074432373046875, -0.06932640075683594, -0.06422042846679688, -0.05911445617675781, -0.05400848388671875, -0.04890251159667969, -0.043796539306640625, -0.03869056701660156, -0.0335845947265625, -0.028478622436523438, -0.023372650146484375, -0.018266677856445312, -0.01316070556640625, -0.008054733276367188, -0.002948760986328125, 0.0021572113037109375, 0.00726318359375, 0.012369155883789062, 0.017475128173828125, 0.022581100463867188, 0.02768707275390625, 0.03279304504394531, 0.037899017333984375, 0.04300498962402344, 0.0481109619140625, 0.05321693420410156, 0.058322906494140625, 0.06342887878417969, 0.06853485107421875, 0.07364082336425781, 0.07874679565429688, 0.08385276794433594, 0.088958740234375, 0.09406471252441406, 0.09917068481445312, 0.10427665710449219, 0.10938262939453125, 0.11448860168457031, 0.11959457397460938, 0.12470054626464844, 0.1298065185546875, 0.13491249084472656, 0.14001846313476562, 0.1451244354248047, 0.15023040771484375, 0.1553363800048828, 0.16044235229492188, 0.16554832458496094, 0.170654296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 2.0, 5.0, 6.0, 7.0, 9.0, 18.0, 9.0, 15.0, 21.0, 31.0, 30.0, 27.0, 46.0, 59.0, 78.0, 79.0, 104.0, 97.0, 62.0, 59.0, 49.0, 41.0, 22.0, 30.0, 13.0, 16.0, 13.0, 12.0, 10.0, 6.0, 7.0, 9.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.790855407714844e-05, -3.657303750514984e-05, -3.5237520933151245e-05, -3.390200436115265e-05, -3.256648778915405e-05, -3.1230971217155457e-05, -2.989545464515686e-05, -2.8559938073158264e-05, -2.7224421501159668e-05, -2.5888904929161072e-05, -2.4553388357162476e-05, -2.321787178516388e-05, -2.1882355213165283e-05, -2.0546838641166687e-05, -1.921132206916809e-05, -1.7875805497169495e-05, -1.65402889251709e-05, -1.5204772353172302e-05, -1.3869255781173706e-05, -1.253373920917511e-05, -1.1198222637176514e-05, -9.862706065177917e-06, -8.527189493179321e-06, -7.191672921180725e-06, -5.856156349182129e-06, -4.520639777183533e-06, -3.1851232051849365e-06, -1.8496066331863403e-06, -5.140900611877441e-07, 8.21426510810852e-07, 2.1569430828094482e-06, 3.4924596548080444e-06, 4.827976226806641e-06, 6.163492798805237e-06, 7.499009370803833e-06, 8.83452594280243e-06, 1.0170042514801025e-05, 1.1505559086799622e-05, 1.2841075658798218e-05, 1.4176592230796814e-05, 1.551210880279541e-05, 1.6847625374794006e-05, 1.8183141946792603e-05, 1.95186585187912e-05, 2.0854175090789795e-05, 2.218969166278839e-05, 2.3525208234786987e-05, 2.4860724806785583e-05, 2.619624137878418e-05, 2.7531757950782776e-05, 2.8867274522781372e-05, 3.0202791094779968e-05, 3.1538307666778564e-05, 3.287382423877716e-05, 3.420934081077576e-05, 3.554485738277435e-05, 3.688037395477295e-05, 3.8215890526771545e-05, 3.955140709877014e-05, 4.088692367076874e-05, 4.2222440242767334e-05, 4.355795681476593e-05, 4.4893473386764526e-05, 4.622898995876312e-05, 4.756450653076172e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 9.0, 5.0, 8.0, 25.0, 34.0, 43.0, 58.0, 131.0, 220.0, 466.0, 746.0, 1775.0, 4897.0, 16905.0, 77418.0, 684306.0, 210685.0, 36188.0, 8986.0, 3062.0, 1212.0, 587.0, 310.0, 174.0, 105.0, 66.0, 41.0, 21.0, 23.0, 17.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.141357421875, -0.1367626190185547, -0.13216781616210938, -0.12757301330566406, -0.12297821044921875, -0.11838340759277344, -0.11378860473632812, -0.10919380187988281, -0.1045989990234375, -0.10000419616699219, -0.09540939331054688, -0.09081459045410156, -0.08621978759765625, -0.08162498474121094, -0.07703018188476562, -0.07243537902832031, -0.067840576171875, -0.06324577331542969, -0.058650970458984375, -0.05405616760253906, -0.04946136474609375, -0.04486656188964844, -0.040271759033203125, -0.03567695617675781, -0.0310821533203125, -0.026487350463867188, -0.021892547607421875, -0.017297744750976562, -0.01270294189453125, -0.008108139038085938, -0.003513336181640625, 0.0010814666748046875, 0.00567626953125, 0.010271072387695312, 0.014865875244140625, 0.019460678100585938, 0.02405548095703125, 0.028650283813476562, 0.033245086669921875, 0.03783988952636719, 0.0424346923828125, 0.04702949523925781, 0.051624298095703125, 0.05621910095214844, 0.06081390380859375, 0.06540870666503906, 0.07000350952148438, 0.07459831237792969, 0.079193115234375, 0.08378791809082031, 0.08838272094726562, 0.09297752380371094, 0.09757232666015625, 0.10216712951660156, 0.10676193237304688, 0.11135673522949219, 0.1159515380859375, 0.12054634094238281, 0.12514114379882812, 0.12973594665527344, 0.13433074951171875, 0.13892555236816406, 0.14352035522460938, 0.1481151580810547, 0.1527099609375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 7.0, 6.0, 11.0, 12.0, 17.0, 25.0, 26.0, 36.0, 43.0, 57.0, 81.0, 97.0, 103.0, 93.0, 67.0, 84.0, 51.0, 29.0, 43.0, 16.0, 14.0, 15.0, 11.0, 11.0, 5.0, 5.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.142578125, -0.13804054260253906, -0.13350296020507812, -0.1289653778076172, -0.12442779541015625, -0.11989021301269531, -0.11535263061523438, -0.11081504821777344, -0.1062774658203125, -0.10173988342285156, -0.09720230102539062, -0.09266471862792969, -0.08812713623046875, -0.08358955383300781, -0.07905197143554688, -0.07451438903808594, -0.069976806640625, -0.06543922424316406, -0.060901641845703125, -0.05636405944824219, -0.05182647705078125, -0.04728889465332031, -0.042751312255859375, -0.03821372985839844, -0.0336761474609375, -0.029138565063476562, -0.024600982666015625, -0.020063400268554688, -0.01552581787109375, -0.010988235473632812, -0.006450653076171875, -0.0019130706787109375, 0.00262451171875, 0.0071620941162109375, 0.011699676513671875, 0.016237258911132812, 0.02077484130859375, 0.025312423706054688, 0.029850006103515625, 0.03438758850097656, 0.0389251708984375, 0.04346275329589844, 0.048000335693359375, 0.05253791809082031, 0.05707550048828125, 0.06161308288574219, 0.06615066528320312, 0.07068824768066406, 0.075225830078125, 0.07976341247558594, 0.08430099487304688, 0.08883857727050781, 0.09337615966796875, 0.09791374206542969, 0.10245132446289062, 0.10698890686035156, 0.1115264892578125, 0.11606407165527344, 0.12060165405273438, 0.1251392364501953, 0.12967681884765625, 0.1342144012451172, 0.13875198364257812, 0.14328956604003906, 0.1478271484375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 9.0, 17.0, 36.0, 53.0, 80.0, 135.0, 299.0, 134.0, 79.0, 55.0, 34.0, 21.0, 9.0, 9.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.667967677116394, -1.5528870820999146, -1.437806487083435, -1.322725772857666, -1.2076451778411865, -1.092564582824707, -0.9774839878082275, -0.862403392791748, -0.7473227977752686, -0.6322422027587891, -0.5171616077423096, -0.4020809531211853, -0.2870003581047058, -0.17191976308822632, -0.05683910846710205, 0.05824148654937744, 0.17332208156585693, 0.2884026765823364, 0.4034833014011383, 0.5185639262199402, 0.6336445212364197, 0.7487251162528992, 0.8638057708740234, 0.9788863658905029, 1.0939669609069824, 1.209047555923462, 1.3241281509399414, 1.439208745956421, 1.5542893409729004, 1.6693699359893799, 1.784450650215149, 1.8995312452316284, 2.0146117210388184, 2.129692316055298, 2.2447729110717773, 2.359853506088257, 2.4749341011047363, 2.590014696121216, 2.7050952911376953, 2.820176124572754, 2.9352564811706543, 3.050337076187134, 3.1654176712036133, 3.2804982662200928, 3.3955788612365723, 3.5106594562530518, 3.6257400512695312, 3.74082088470459, 3.8559014797210693, 3.970982074737549, 4.086062908172607, 4.201143264770508, 4.316224098205566, 4.431304454803467, 4.546385288238525, 4.661465644836426, 4.776546478271484, 4.891627311706543, 5.006707668304443, 5.121788501739502, 5.236868858337402, 5.351949691772461, 5.467030048370361, 5.58211088180542, 5.69719123840332]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 6.0, 9.0, 15.0, 11.0, 17.0, 20.0, 22.0, 21.0, 33.0, 30.0, 28.0, 36.0, 55.0, 71.0, 117.0, 100.0, 75.0, 55.0, 38.0, 39.0, 26.0, 23.0, 28.0, 18.0, 18.0, 12.0, 19.0, 18.0, 8.0, 4.0, 6.0, 3.0, 8.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.255918502807617, -3.162818670272827, -3.069719076156616, -2.976619243621826, -2.8835196495056152, -2.790419816970825, -2.697319984436035, -2.604220390319824, -2.5111207962036133, -2.4180209636688232, -2.3249213695526123, -2.2318215370178223, -2.1387219429016113, -2.0456221103668213, -1.9525223970413208, -1.8594226837158203, -1.7663228511810303, -1.6732231378555298, -1.5801234245300293, -1.4870235919952393, -1.3939239978790283, -1.3008241653442383, -1.2077244520187378, -1.1146247386932373, -1.0215250253677368, -0.9284253120422363, -0.8353255987167358, -0.7422258257865906, -0.6491261124610901, -0.5560263991355896, -0.46292662620544434, -0.36982691287994385, -0.27672719955444336, -0.18362747132778168, -0.09052774310112, 0.002572000026702881, 0.09567171335220337, 0.18877142667770386, 0.2818711996078491, 0.3749709129333496, 0.4680706262588501, 0.5611703395843506, 0.6542700529098511, 0.7473698258399963, 0.8404695391654968, 0.9335692524909973, 1.0266690254211426, 1.119768738746643, 1.2128684520721436, 1.305968165397644, 1.3990678787231445, 1.4921677112579346, 1.5852673053741455, 1.6783671379089355, 1.771466851234436, 1.8645665645599365, 1.957666277885437, 2.0507659912109375, 2.1438658237457275, 2.2369654178619385, 2.3300652503967285, 2.4231648445129395, 2.5162646770477295, 2.6093645095825195, 2.7024641036987305]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 20.0, 27.0, 63.0, 100.0, 199.0, 404.0, 905.0, 2325.0, 7695.0, 46829.0, 582114.0, 2893537.0, 600060.0, 48367.0, 7695.0, 2201.0, 863.0, 406.0, 174.0, 114.0, 69.0, 33.0, 22.0, 18.0, 7.0, 5.0, 7.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.43359375, -0.42314720153808594, -0.4127006530761719, -0.4022541046142578, -0.39180755615234375, -0.3813610076904297, -0.3709144592285156, -0.36046791076660156, -0.3500213623046875, -0.33957481384277344, -0.3291282653808594, -0.3186817169189453, -0.30823516845703125, -0.2977886199951172, -0.2873420715332031, -0.27689552307128906, -0.266448974609375, -0.25600242614746094, -0.24555587768554688, -0.2351093292236328, -0.22466278076171875, -0.2142162322998047, -0.20376968383789062, -0.19332313537597656, -0.1828765869140625, -0.17243003845214844, -0.16198348999023438, -0.1515369415283203, -0.14109039306640625, -0.1306438446044922, -0.12019729614257812, -0.10975074768066406, -0.09930419921875, -0.08885765075683594, -0.07841110229492188, -0.06796455383300781, -0.05751800537109375, -0.04707145690917969, -0.036624908447265625, -0.026178359985351562, -0.0157318115234375, -0.0052852630615234375, 0.005161285400390625, 0.015607833862304688, 0.02605438232421875, 0.03650093078613281, 0.046947479248046875, 0.05739402770996094, 0.067840576171875, 0.07828712463378906, 0.08873367309570312, 0.09918022155761719, 0.10962677001953125, 0.12007331848144531, 0.13051986694335938, 0.14096641540527344, 0.1514129638671875, 0.16185951232910156, 0.17230606079101562, 0.1827526092529297, 0.19319915771484375, 0.2036457061767578, 0.21409225463867188, 0.22453880310058594, 0.2349853515625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 11.0, 13.0, 11.0, 13.0, 18.0, 23.0, 37.0, 38.0, 51.0, 45.0, 53.0, 39.0, 41.0, 49.0, 54.0, 37.0, 49.0, 44.0, 56.0, 53.0, 42.0, 33.0, 39.0, 27.0, 25.0, 13.0, 21.0, 14.0, 10.0, 10.0, 10.0, 1.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.208984375, -0.20225143432617188, -0.19551849365234375, -0.18878555297851562, -0.1820526123046875, -0.17531967163085938, -0.16858673095703125, -0.16185379028320312, -0.155120849609375, -0.14838790893554688, -0.14165496826171875, -0.13492202758789062, -0.1281890869140625, -0.12145614624023438, -0.11472320556640625, -0.10799026489257812, -0.10125732421875, -0.09452438354492188, -0.08779144287109375, -0.08105850219726562, -0.0743255615234375, -0.06759262084960938, -0.06085968017578125, -0.054126739501953125, -0.047393798828125, -0.040660858154296875, -0.03392791748046875, -0.027194976806640625, -0.0204620361328125, -0.013729095458984375, -0.00699615478515625, -0.000263214111328125, 0.0064697265625, 0.013202667236328125, 0.01993560791015625, 0.026668548583984375, 0.0334014892578125, 0.040134429931640625, 0.04686737060546875, 0.053600311279296875, 0.060333251953125, 0.06706619262695312, 0.07379913330078125, 0.08053207397460938, 0.0872650146484375, 0.09399795532226562, 0.10073089599609375, 0.10746383666992188, 0.11419677734375, 0.12092971801757812, 0.12766265869140625, 0.13439559936523438, 0.1411285400390625, 0.14786148071289062, 0.15459442138671875, 0.16132736206054688, 0.168060302734375, 0.17479324340820312, 0.18152618408203125, 0.18825912475585938, 0.1949920654296875, 0.20172500610351562, 0.20845794677734375, 0.21519088745117188, 0.221923828125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 13.0, 11.0, 14.0, 16.0, 47.0, 82.0, 176.0, 360.0, 1252.0, 8411.0, 384872.0, 3760117.0, 35130.0, 2681.0, 585.0, 250.0, 125.0, 58.0, 36.0, 13.0, 14.0, 9.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0207595825195312, -0.9965972900390625, -0.9724349975585938, -0.948272705078125, -0.9241104125976562, -0.8999481201171875, -0.8757858276367188, -0.85162353515625, -0.8274612426757812, -0.8032989501953125, -0.7791366577148438, -0.754974365234375, -0.7308120727539062, -0.7066497802734375, -0.6824874877929688, -0.6583251953125, -0.6341629028320312, -0.6100006103515625, -0.5858383178710938, -0.561676025390625, -0.5375137329101562, -0.5133514404296875, -0.48918914794921875, -0.46502685546875, -0.44086456298828125, -0.4167022705078125, -0.39253997802734375, -0.368377685546875, -0.34421539306640625, -0.3200531005859375, -0.29589080810546875, -0.271728515625, -0.24756622314453125, -0.2234039306640625, -0.19924163818359375, -0.175079345703125, -0.15091705322265625, -0.1267547607421875, -0.10259246826171875, -0.07843017578125, -0.05426788330078125, -0.0301055908203125, -0.00594329833984375, 0.018218994140625, 0.04238128662109375, 0.0665435791015625, 0.09070587158203125, 0.1148681640625, 0.13903045654296875, 0.1631927490234375, 0.18735504150390625, 0.211517333984375, 0.23567962646484375, 0.2598419189453125, 0.28400421142578125, 0.30816650390625, 0.33232879638671875, 0.3564910888671875, 0.38065338134765625, 0.404815673828125, 0.42897796630859375, 0.4531402587890625, 0.47730255126953125, 0.50146484375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 9.0, 4.0, 6.0, 19.0, 18.0, 25.0, 39.0, 96.0, 150.0, 275.0, 495.0, 788.0, 812.0, 603.0, 328.0, 196.0, 84.0, 55.0, 24.0, 17.0, 14.0, 12.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.751953125, -0.7349205017089844, -0.7178878784179688, -0.7008552551269531, -0.6838226318359375, -0.6667900085449219, -0.6497573852539062, -0.6327247619628906, -0.615692138671875, -0.5986595153808594, -0.5816268920898438, -0.5645942687988281, -0.5475616455078125, -0.5305290222167969, -0.5134963989257812, -0.4964637756347656, -0.47943115234375, -0.4623985290527344, -0.44536590576171875, -0.4283332824707031, -0.4113006591796875, -0.3942680358886719, -0.37723541259765625, -0.3602027893066406, -0.343170166015625, -0.3261375427246094, -0.30910491943359375, -0.2920722961425781, -0.2750396728515625, -0.2580070495605469, -0.24097442626953125, -0.22394180297851562, -0.2069091796875, -0.18987655639648438, -0.17284393310546875, -0.15581130981445312, -0.1387786865234375, -0.12174606323242188, -0.10471343994140625, -0.08768081665039062, -0.070648193359375, -0.053615570068359375, -0.03658294677734375, -0.019550323486328125, -0.0025177001953125, 0.014514923095703125, 0.03154754638671875, 0.048580169677734375, 0.06561279296875, 0.08264541625976562, 0.09967803955078125, 0.11671066284179688, 0.1337432861328125, 0.15077590942382812, 0.16780853271484375, 0.18484115600585938, 0.201873779296875, 0.21890640258789062, 0.23593902587890625, 0.2529716491699219, 0.2700042724609375, 0.2870368957519531, 0.30406951904296875, 0.3211021423339844, 0.338134765625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 16.0, 32.0, 99.0, 271.0, 339.0, 158.0, 50.0, 18.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.036361694335938, -7.841573238372803, -7.646785259246826, -7.451996803283691, -7.257208824157715, -7.06242036819458, -6.867631912231445, -6.672843933105469, -6.478055953979492, -6.283267498016357, -6.088479518890381, -5.893691062927246, -5.6989030838012695, -5.504114627838135, -5.309326171875, -5.114538192749023, -4.919749736785889, -4.724961280822754, -4.530173301696777, -4.335384845733643, -4.140596866607666, -3.9458084106445312, -3.7510201930999756, -3.55623197555542, -3.3614437580108643, -3.1666555404663086, -2.971867322921753, -2.7770791053771973, -2.5822906494140625, -2.387502670288086, -2.192714214324951, -1.9979259967803955, -1.8031377792358398, -1.6083495616912842, -1.4135613441467285, -1.2187730073928833, -1.0239847898483276, -0.829196572303772, -0.6344082355499268, -0.4396200180053711, -0.24483180046081543, -0.05004355311393738, 0.14474469423294067, 0.3395329713821411, 0.5343211889266968, 0.7291094064712524, 0.9238977432250977, 1.1186859607696533, 1.313474178314209, 1.5082623958587646, 1.7030506134033203, 1.8978389501571655, 2.0926270484924316, 2.2874155044555664, 2.482203722000122, 2.6769919395446777, 2.8717801570892334, 3.066568374633789, 3.2613565921783447, 3.4561448097229004, 3.650933265686035, 3.8457212448120117, 4.0405097007751465, 4.235298156738281, 4.430086135864258]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 8.0, 6.0, 5.0, 7.0, 10.0, 7.0, 12.0, 17.0, 24.0, 19.0, 23.0, 41.0, 24.0, 32.0, 51.0, 49.0, 56.0, 66.0, 49.0, 48.0, 68.0, 66.0, 42.0, 31.0, 35.0, 30.0, 35.0, 27.0, 27.0, 23.0, 19.0, 15.0, 9.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.259957790374756, -2.196604013442993, -2.1332499980926514, -2.0698962211608887, -2.006542205810547, -1.9431883096694946, -1.8798344135284424, -1.8164806365966797, -1.753126621246338, -1.6897727251052856, -1.6264188289642334, -1.5630649328231812, -1.499711036682129, -1.4363571405410767, -1.3730032444000244, -1.3096494674682617, -1.2462955713272095, -1.1829416751861572, -1.119587779045105, -1.0562338829040527, -0.9928799867630005, -0.9295260906219482, -0.8661722540855408, -0.8028183579444885, -0.7394644618034363, -0.676110565662384, -0.6127566695213318, -0.5494028329849243, -0.4860489070415497, -0.42269501090049744, -0.3593411445617676, -0.29598724842071533, -0.23263335227966309, -0.16927945613861084, -0.10592557489871979, -0.042571693658828735, 0.02078220248222351, 0.08413609862327576, 0.14748996496200562, 0.21084386110305786, 0.2741977572441101, 0.33755165338516235, 0.4009055495262146, 0.46425941586494446, 0.5276132822036743, 0.5909671783447266, 0.6543210744857788, 0.717674970626831, 0.7810288667678833, 0.8443827629089355, 0.9077366590499878, 0.97109055519104, 1.0344444513320923, 1.0977983474731445, 1.1611521244049072, 1.224506139755249, 1.2878599166870117, 1.351213812828064, 1.4145677089691162, 1.4779216051101685, 1.5412755012512207, 1.604629397392273, 1.6679832935333252, 1.731337070465088, 1.7946910858154297]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 3.0, 6.0, 17.0, 38.0, 83.0, 255.0, 749.0, 3044.0, 17307.0, 171678.0, 744108.0, 96776.0, 11402.0, 2175.0, 596.0, 199.0, 69.0, 31.0, 10.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68017578125, -0.6553421020507812, -0.6305084228515625, -0.6056747436523438, -0.580841064453125, -0.5560073852539062, -0.5311737060546875, -0.5063400268554688, -0.48150634765625, -0.45667266845703125, -0.4318389892578125, -0.40700531005859375, -0.382171630859375, -0.35733795166015625, -0.3325042724609375, -0.30767059326171875, -0.2828369140625, -0.25800323486328125, -0.2331695556640625, -0.20833587646484375, -0.183502197265625, -0.15866851806640625, -0.1338348388671875, -0.10900115966796875, -0.08416748046875, -0.05933380126953125, -0.0345001220703125, -0.00966644287109375, 0.015167236328125, 0.04000091552734375, 0.0648345947265625, 0.08966827392578125, 0.114501953125, 0.13933563232421875, 0.1641693115234375, 0.18900299072265625, 0.213836669921875, 0.23867034912109375, 0.2635040283203125, 0.28833770751953125, 0.31317138671875, 0.33800506591796875, 0.3628387451171875, 0.38767242431640625, 0.412506103515625, 0.43733978271484375, 0.4621734619140625, 0.48700714111328125, 0.5118408203125, 0.5366744995117188, 0.5615081787109375, 0.5863418579101562, 0.611175537109375, 0.6360092163085938, 0.6608428955078125, 0.6856765747070312, 0.71051025390625, 0.7353439331054688, 0.7601776123046875, 0.7850112915039062, 0.809844970703125, 0.8346786499023438, 0.8595123291015625, 0.8843460083007812, 0.9091796875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 6.0, 6.0, 10.0, 8.0, 14.0, 13.0, 23.0, 35.0, 36.0, 38.0, 49.0, 36.0, 48.0, 51.0, 54.0, 68.0, 47.0, 44.0, 44.0, 46.0, 54.0, 43.0, 39.0, 31.0, 34.0, 20.0, 18.0, 23.0, 20.0, 11.0, 4.0, 10.0, 5.0, 4.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23046875, -0.2235698699951172, -0.21667098999023438, -0.20977210998535156, -0.20287322998046875, -0.19597434997558594, -0.18907546997070312, -0.1821765899658203, -0.1752777099609375, -0.1683788299560547, -0.16147994995117188, -0.15458106994628906, -0.14768218994140625, -0.14078330993652344, -0.13388442993164062, -0.1269855499267578, -0.120086669921875, -0.11318778991699219, -0.10628890991210938, -0.09939002990722656, -0.09249114990234375, -0.08559226989746094, -0.07869338989257812, -0.07179450988769531, -0.0648956298828125, -0.05799674987792969, -0.051097869873046875, -0.04419898986816406, -0.03730010986328125, -0.030401229858398438, -0.023502349853515625, -0.016603469848632812, -0.00970458984375, -0.0028057098388671875, 0.004093170166015625, 0.010992050170898438, 0.01789093017578125, 0.024789810180664062, 0.031688690185546875, 0.03858757019042969, 0.0454864501953125, 0.05238533020019531, 0.059284210205078125, 0.06618309020996094, 0.07308197021484375, 0.07998085021972656, 0.08687973022460938, 0.09377861022949219, 0.100677490234375, 0.10757637023925781, 0.11447525024414062, 0.12137413024902344, 0.12827301025390625, 0.13517189025878906, 0.14207077026367188, 0.1489696502685547, 0.1558685302734375, 0.1627674102783203, 0.16966629028320312, 0.17656517028808594, 0.18346405029296875, 0.19036293029785156, 0.19726181030273438, 0.2041606903076172, 0.2110595703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 9.0, 5.0, 14.0, 14.0, 15.0, 23.0, 26.0, 49.0, 60.0, 87.0, 108.0, 192.0, 251.0, 416.0, 659.0, 1210.0, 2752.0, 10571.0, 115692.0, 847735.0, 56743.0, 7091.0, 2122.0, 1026.0, 581.0, 317.0, 209.0, 153.0, 126.0, 87.0, 50.0, 40.0, 33.0, 17.0, 20.0, 10.0, 8.0, 7.0, 2.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6660614013671875, -0.644134521484375, -0.6222076416015625, -0.60028076171875, -0.5783538818359375, -0.556427001953125, -0.5345001220703125, -0.5125732421875, -0.4906463623046875, -0.468719482421875, -0.4467926025390625, -0.42486572265625, -0.4029388427734375, -0.381011962890625, -0.3590850830078125, -0.337158203125, -0.3152313232421875, -0.293304443359375, -0.2713775634765625, -0.24945068359375, -0.2275238037109375, -0.205596923828125, -0.1836700439453125, -0.1617431640625, -0.1398162841796875, -0.117889404296875, -0.0959625244140625, -0.07403564453125, -0.0521087646484375, -0.030181884765625, -0.0082550048828125, 0.013671875, 0.0355987548828125, 0.057525634765625, 0.0794525146484375, 0.10137939453125, 0.1233062744140625, 0.145233154296875, 0.1671600341796875, 0.1890869140625, 0.2110137939453125, 0.232940673828125, 0.2548675537109375, 0.27679443359375, 0.2987213134765625, 0.320648193359375, 0.3425750732421875, 0.364501953125, 0.3864288330078125, 0.408355712890625, 0.4302825927734375, 0.45220947265625, 0.4741363525390625, 0.496063232421875, 0.5179901123046875, 0.5399169921875, 0.5618438720703125, 0.583770751953125, 0.6056976318359375, 0.62762451171875, 0.6495513916015625, 0.671478271484375, 0.6934051513671875, 0.71533203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 7.0, 10.0, 13.0, 19.0, 26.0, 17.0, 25.0, 38.0, 46.0, 63.0, 66.0, 60.0, 67.0, 56.0, 66.0, 64.0, 55.0, 51.0, 43.0, 36.0, 46.0, 24.0, 18.0, 13.0, 11.0, 8.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.88671875, -0.8603744506835938, -0.8340301513671875, -0.8076858520507812, -0.781341552734375, -0.7549972534179688, -0.7286529541015625, -0.7023086547851562, -0.67596435546875, -0.6496200561523438, -0.6232757568359375, -0.5969314575195312, -0.570587158203125, -0.5442428588867188, -0.5178985595703125, -0.49155426025390625, -0.4652099609375, -0.43886566162109375, -0.4125213623046875, -0.38617706298828125, -0.359832763671875, -0.33348846435546875, -0.3071441650390625, -0.28079986572265625, -0.25445556640625, -0.22811126708984375, -0.2017669677734375, -0.17542266845703125, -0.149078369140625, -0.12273406982421875, -0.0963897705078125, -0.07004547119140625, -0.043701171875, -0.01735687255859375, 0.0089874267578125, 0.03533172607421875, 0.061676025390625, 0.08802032470703125, 0.1143646240234375, 0.14070892333984375, 0.16705322265625, 0.19339752197265625, 0.2197418212890625, 0.24608612060546875, 0.272430419921875, 0.29877471923828125, 0.3251190185546875, 0.35146331787109375, 0.3778076171875, 0.40415191650390625, 0.4304962158203125, 0.45684051513671875, 0.483184814453125, 0.5095291137695312, 0.5358734130859375, 0.5622177124023438, 0.58856201171875, 0.6149063110351562, 0.6412506103515625, 0.6675949096679688, 0.693939208984375, 0.7202835083007812, 0.7466278076171875, 0.7729721069335938, 0.79931640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 10.0, 6.0, 21.0, 15.0, 14.0, 27.0, 32.0, 58.0, 70.0, 153.0, 303.0, 691.0, 2270.0, 14764.0, 825589.0, 193110.0, 8715.0, 1606.0, 502.0, 219.0, 116.0, 74.0, 46.0, 48.0, 18.0, 19.0, 11.0, 13.0, 7.0, 5.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283447265625, -0.2739601135253906, -0.26447296142578125, -0.2549858093261719, -0.2454986572265625, -0.23601150512695312, -0.22652435302734375, -0.21703720092773438, -0.207550048828125, -0.19806289672851562, -0.18857574462890625, -0.17908859252929688, -0.1696014404296875, -0.16011428833007812, -0.15062713623046875, -0.14113998413085938, -0.13165283203125, -0.12216567993164062, -0.11267852783203125, -0.10319137573242188, -0.0937042236328125, -0.08421707153320312, -0.07472991943359375, -0.06524276733398438, -0.055755615234375, -0.046268463134765625, -0.03678131103515625, -0.027294158935546875, -0.0178070068359375, -0.008319854736328125, 0.00116729736328125, 0.010654449462890625, 0.0201416015625, 0.029628753662109375, 0.03911590576171875, 0.048603057861328125, 0.0580902099609375, 0.06757736206054688, 0.07706451416015625, 0.08655166625976562, 0.096038818359375, 0.10552597045898438, 0.11501312255859375, 0.12450027465820312, 0.1339874267578125, 0.14347457885742188, 0.15296173095703125, 0.16244888305664062, 0.17193603515625, 0.18142318725585938, 0.19091033935546875, 0.20039749145507812, 0.2098846435546875, 0.21937179565429688, 0.22885894775390625, 0.23834609985351562, 0.247833251953125, 0.2573204040527344, 0.26680755615234375, 0.2762947082519531, 0.2857818603515625, 0.2952690124511719, 0.30475616455078125, 0.3142433166503906, 0.32373046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 5.0, 8.0, 8.0, 12.0, 12.0, 18.0, 10.0, 19.0, 46.0, 51.0, 62.0, 91.0, 87.0, 122.0, 99.0, 93.0, 65.0, 39.0, 36.0, 16.0, 15.0, 15.0, 14.0, 18.0, 4.0, 5.0, 7.0, 7.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.257129669189453e-05, -5.0951726734638214e-05, -4.93321567773819e-05, -4.771258682012558e-05, -4.609301686286926e-05, -4.4473446905612946e-05, -4.285387694835663e-05, -4.123430699110031e-05, -3.9614737033843994e-05, -3.799516707658768e-05, -3.637559711933136e-05, -3.475602716207504e-05, -3.3136457204818726e-05, -3.151688724756241e-05, -2.989731729030609e-05, -2.8277747333049774e-05, -2.6658177375793457e-05, -2.503860741853714e-05, -2.3419037461280823e-05, -2.1799467504024506e-05, -2.017989754676819e-05, -1.856032758951187e-05, -1.6940757632255554e-05, -1.5321187674999237e-05, -1.370161771774292e-05, -1.2082047760486603e-05, -1.0462477803230286e-05, -8.842907845973969e-06, -7.223337888717651e-06, -5.603767931461334e-06, -3.984197974205017e-06, -2.3646280169487e-06, -7.450580596923828e-07, 8.745118975639343e-07, 2.4940818548202515e-06, 4.113651812076569e-06, 5.733221769332886e-06, 7.352791726589203e-06, 8.97236168384552e-06, 1.0591931641101837e-05, 1.2211501598358154e-05, 1.3831071555614471e-05, 1.545064151287079e-05, 1.7070211470127106e-05, 1.8689781427383423e-05, 2.030935138463974e-05, 2.1928921341896057e-05, 2.3548491299152374e-05, 2.516806125640869e-05, 2.678763121366501e-05, 2.8407201170921326e-05, 3.0026771128177643e-05, 3.164634108543396e-05, 3.326591104269028e-05, 3.4885480999946594e-05, 3.650505095720291e-05, 3.812462091445923e-05, 3.9744190871715546e-05, 4.136376082897186e-05, 4.298333078622818e-05, 4.46029007434845e-05, 4.6222470700740814e-05, 4.784204065799713e-05, 4.946161061525345e-05, 5.1081180572509766e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 5.0, 6.0, 7.0, 3.0, 11.0, 4.0, 17.0, 14.0, 16.0, 20.0, 31.0, 34.0, 54.0, 91.0, 97.0, 137.0, 241.0, 292.0, 530.0, 913.0, 1650.0, 3594.0, 9150.0, 32668.0, 219903.0, 695584.0, 59824.0, 13508.0, 4910.0, 2295.0, 1143.0, 616.0, 357.0, 228.0, 158.0, 111.0, 80.0, 56.0, 51.0, 36.0, 22.0, 18.0, 19.0, 15.0, 11.0, 5.0, 7.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1221923828125, -0.11850929260253906, -0.11482620239257812, -0.11114311218261719, -0.10746002197265625, -0.10377693176269531, -0.10009384155273438, -0.09641075134277344, -0.0927276611328125, -0.08904457092285156, -0.08536148071289062, -0.08167839050292969, -0.07799530029296875, -0.07431221008300781, -0.07062911987304688, -0.06694602966308594, -0.063262939453125, -0.05957984924316406, -0.055896759033203125, -0.05221366882324219, -0.04853057861328125, -0.04484748840332031, -0.041164398193359375, -0.03748130798339844, -0.0337982177734375, -0.030115127563476562, -0.026432037353515625, -0.022748947143554688, -0.01906585693359375, -0.015382766723632812, -0.011699676513671875, -0.008016586303710938, -0.00433349609375, -0.0006504058837890625, 0.003032684326171875, 0.0067157745361328125, 0.01039886474609375, 0.014081954956054688, 0.017765045166015625, 0.021448135375976562, 0.0251312255859375, 0.028814315795898438, 0.032497406005859375, 0.03618049621582031, 0.03986358642578125, 0.04354667663574219, 0.047229766845703125, 0.05091285705566406, 0.054595947265625, 0.05827903747558594, 0.061962127685546875, 0.06564521789550781, 0.06932830810546875, 0.07301139831542969, 0.07669448852539062, 0.08037757873535156, 0.0840606689453125, 0.08774375915527344, 0.09142684936523438, 0.09510993957519531, 0.09879302978515625, 0.10247611999511719, 0.10615921020507812, 0.10984230041503906, 0.113525390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 1.0, 4.0, 6.0, 3.0, 4.0, 3.0, 7.0, 3.0, 12.0, 15.0, 24.0, 36.0, 36.0, 39.0, 56.0, 88.0, 114.0, 119.0, 110.0, 74.0, 41.0, 45.0, 38.0, 22.0, 17.0, 20.0, 14.0, 8.0, 5.0, 4.0, 6.0, 7.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.1317138671875, -0.12735557556152344, -0.12299728393554688, -0.11863899230957031, -0.11428070068359375, -0.10992240905761719, -0.10556411743164062, -0.10120582580566406, -0.0968475341796875, -0.09248924255371094, -0.08813095092773438, -0.08377265930175781, -0.07941436767578125, -0.07505607604980469, -0.07069778442382812, -0.06633949279785156, -0.061981201171875, -0.05762290954589844, -0.053264617919921875, -0.04890632629394531, -0.04454803466796875, -0.04018974304199219, -0.035831451416015625, -0.03147315979003906, -0.0271148681640625, -0.022756576538085938, -0.018398284912109375, -0.014039993286132812, -0.00968170166015625, -0.0053234100341796875, -0.000965118408203125, 0.0033931732177734375, 0.00775146484375, 0.012109756469726562, 0.016468048095703125, 0.020826339721679688, 0.02518463134765625, 0.029542922973632812, 0.033901214599609375, 0.03825950622558594, 0.0426177978515625, 0.04697608947753906, 0.051334381103515625, 0.05569267272949219, 0.06005096435546875, 0.06440925598144531, 0.06876754760742188, 0.07312583923339844, 0.077484130859375, 0.08184242248535156, 0.08620071411132812, 0.09055900573730469, 0.09491729736328125, 0.09927558898925781, 0.10363388061523438, 0.10799217224121094, 0.1123504638671875, 0.11670875549316406, 0.12106704711914062, 0.1254253387451172, 0.12978363037109375, 0.1341419219970703, 0.13850021362304688, 0.14285850524902344, 0.147216796875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 5.0, 9.0, 20.0, 74.0, 328.0, 375.0, 122.0, 39.0, 13.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.278661727905273, -8.05510425567627, -7.831547260284424, -7.607990264892578, -7.384432792663574, -7.1608757972717285, -6.937318801879883, -6.713761329650879, -6.490203857421875, -6.266646862030029, -6.043089389801025, -5.81953239440918, -5.595974922180176, -5.37241792678833, -5.148860931396484, -4.9253034591674805, -4.701746463775635, -4.478189468383789, -4.254631996154785, -4.0310750007629395, -3.8075175285339355, -3.58396053314209, -3.360403299331665, -3.1368460655212402, -2.9132888317108154, -2.6897315979003906, -2.466174364089966, -2.242617130279541, -2.0190601348876953, -1.795502781867981, -1.5719456672668457, -1.348388433456421, -1.124830722808838, -0.9012734889984131, -0.6777163147926331, -0.454159140586853, -0.23060190677642822, -0.007044672966003418, 0.21651244163513184, 0.44006967544555664, 0.6636269092559814, 0.8871841430664062, 1.110741376876831, 1.3342984914779663, 1.5578557252883911, 1.781412959098816, 2.004970073699951, 2.228527307510376, 2.452084541320801, 2.6756417751312256, 2.8991990089416504, 3.122756004333496, 3.3463134765625, 3.5698704719543457, 3.7934277057647705, 4.016984939575195, 4.240542411804199, 4.464099407196045, 4.687656879425049, 4.9112138748168945, 5.134771347045898, 5.358328342437744, 5.58188533782959, 5.805442810058594, 6.0289998054504395]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 4.0, 7.0, 8.0, 9.0, 12.0, 12.0, 13.0, 19.0, 8.0, 15.0, 19.0, 20.0, 12.0, 27.0, 29.0, 24.0, 32.0, 45.0, 95.0, 126.0, 94.0, 38.0, 49.0, 30.0, 22.0, 23.0, 26.0, 23.0, 22.0, 22.0, 21.0, 14.0, 17.0, 5.0, 15.0, 5.0, 4.0, 6.0, 3.0, 7.0, 2.0, 1.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.2721033096313477, -2.2023508548736572, -2.132598400115967, -2.0628459453582764, -1.9930933713912964, -1.923340916633606, -1.853588342666626, -1.7838358879089355, -1.7140834331512451, -1.6443309783935547, -1.5745785236358643, -1.5048259496688843, -1.4350734949111938, -1.3653210401535034, -1.2955684661865234, -1.225816011428833, -1.1560635566711426, -1.0863111019134521, -1.0165586471557617, -0.9468060731887817, -0.8770536184310913, -0.8073011636734009, -0.7375486493110657, -0.6677961349487305, -0.59804368019104, -0.5282912254333496, -0.4585387110710144, -0.3887862265110016, -0.31903374195098877, -0.24928125739097595, -0.17952877283096313, -0.10977628827095032, -0.0400238037109375, 0.029728680849075317, 0.09948116540908813, 0.16923364996910095, 0.23898613452911377, 0.3087386190891266, 0.3784911036491394, 0.4482435882091522, 0.517996072769165, 0.5877485275268555, 0.6575010418891907, 0.7272535562515259, 0.7970060110092163, 0.8667584657669067, 0.9365109801292419, 1.0062634944915771, 1.0760159492492676, 1.145768404006958, 1.2155208587646484, 1.2852734327316284, 1.3550258874893188, 1.4247783422470093, 1.4945309162139893, 1.5642833709716797, 1.6340358257293701, 1.7037882804870605, 1.773540735244751, 1.843293309211731, 1.9130457639694214, 1.9827982187271118, 2.052550792694092, 2.1223032474517822, 2.1920557022094727]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 10.0, 11.0, 12.0, 14.0, 21.0, 21.0, 41.0, 63.0, 99.0, 156.0, 251.0, 422.0, 616.0, 1141.0, 2124.0, 4101.0, 8998.0, 23922.0, 86803.0, 390340.0, 1334910.0, 1636801.0, 531639.0, 119144.0, 31300.0, 10724.0, 4825.0, 2394.0, 1314.0, 795.0, 435.0, 300.0, 189.0, 121.0, 72.0, 35.0, 34.0, 27.0, 21.0, 14.0, 4.0, 6.0, 1.0, 6.0, 7.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.223388671875, -0.21544265747070312, -0.20749664306640625, -0.19955062866210938, -0.1916046142578125, -0.18365859985351562, -0.17571258544921875, -0.16776657104492188, -0.159820556640625, -0.15187454223632812, -0.14392852783203125, -0.13598251342773438, -0.1280364990234375, -0.12009048461914062, -0.11214447021484375, -0.10419845581054688, -0.09625244140625, -0.08830642700195312, -0.08036041259765625, -0.07241439819335938, -0.0644683837890625, -0.056522369384765625, -0.04857635498046875, -0.040630340576171875, -0.032684326171875, -0.024738311767578125, -0.01679229736328125, -0.008846282958984375, -0.0009002685546875, 0.007045745849609375, 0.01499176025390625, 0.022937774658203125, 0.0308837890625, 0.038829803466796875, 0.04677581787109375, 0.054721832275390625, 0.0626678466796875, 0.07061386108398438, 0.07855987548828125, 0.08650588989257812, 0.094451904296875, 0.10239791870117188, 0.11034393310546875, 0.11828994750976562, 0.1262359619140625, 0.13418197631835938, 0.14212799072265625, 0.15007400512695312, 0.15802001953125, 0.16596603393554688, 0.17391204833984375, 0.18185806274414062, 0.1898040771484375, 0.19775009155273438, 0.20569610595703125, 0.21364212036132812, 0.221588134765625, 0.22953414916992188, 0.23748016357421875, 0.24542617797851562, 0.2533721923828125, 0.2613182067871094, 0.26926422119140625, 0.2772102355957031, 0.28515625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 8.0, 4.0, 11.0, 10.0, 18.0, 28.0, 21.0, 26.0, 43.0, 35.0, 47.0, 46.0, 51.0, 56.0, 63.0, 53.0, 55.0, 49.0, 43.0, 41.0, 46.0, 31.0, 40.0, 23.0, 25.0, 26.0, 12.0, 21.0, 14.0, 12.0, 10.0, 9.0, 8.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2012939453125, -0.1949748992919922, -0.18865585327148438, -0.18233680725097656, -0.17601776123046875, -0.16969871520996094, -0.16337966918945312, -0.1570606231689453, -0.1507415771484375, -0.1444225311279297, -0.13810348510742188, -0.13178443908691406, -0.12546539306640625, -0.11914634704589844, -0.11282730102539062, -0.10650825500488281, -0.100189208984375, -0.09387016296386719, -0.08755111694335938, -0.08123207092285156, -0.07491302490234375, -0.06859397888183594, -0.062274932861328125, -0.05595588684082031, -0.0496368408203125, -0.04331779479980469, -0.036998748779296875, -0.030679702758789062, -0.02436065673828125, -0.018041610717773438, -0.011722564697265625, -0.0054035186767578125, 0.00091552734375, 0.0072345733642578125, 0.013553619384765625, 0.019872665405273438, 0.02619171142578125, 0.03251075744628906, 0.038829803466796875, 0.04514884948730469, 0.0514678955078125, 0.05778694152832031, 0.06410598754882812, 0.07042503356933594, 0.07674407958984375, 0.08306312561035156, 0.08938217163085938, 0.09570121765136719, 0.102020263671875, 0.10833930969238281, 0.11465835571289062, 0.12097740173339844, 0.12729644775390625, 0.13361549377441406, 0.13993453979492188, 0.1462535858154297, 0.1525726318359375, 0.1588916778564453, 0.16521072387695312, 0.17152976989746094, 0.17784881591796875, 0.18416786193847656, 0.19048690795898438, 0.1968059539794922, 0.203125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 5.0, 7.0, 5.0, 8.0, 15.0, 16.0, 23.0, 34.0, 45.0, 79.0, 124.0, 223.0, 350.0, 674.0, 1594.0, 5063.0, 45674.0, 3830812.0, 293565.0, 11207.0, 2566.0, 984.0, 464.0, 264.0, 162.0, 90.0, 74.0, 39.0, 36.0, 22.0, 18.0, 10.0, 6.0, 6.0, 6.0, 2.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95703125, -0.925872802734375, -0.89471435546875, -0.863555908203125, -0.8323974609375, -0.801239013671875, -0.77008056640625, -0.738922119140625, -0.707763671875, -0.676605224609375, -0.64544677734375, -0.614288330078125, -0.5831298828125, -0.551971435546875, -0.52081298828125, -0.489654541015625, -0.45849609375, -0.427337646484375, -0.39617919921875, -0.365020751953125, -0.3338623046875, -0.302703857421875, -0.27154541015625, -0.240386962890625, -0.209228515625, -0.178070068359375, -0.14691162109375, -0.115753173828125, -0.0845947265625, -0.053436279296875, -0.02227783203125, 0.008880615234375, 0.0400390625, 0.071197509765625, 0.10235595703125, 0.133514404296875, 0.1646728515625, 0.195831298828125, 0.22698974609375, 0.258148193359375, 0.289306640625, 0.320465087890625, 0.35162353515625, 0.382781982421875, 0.4139404296875, 0.445098876953125, 0.47625732421875, 0.507415771484375, 0.53857421875, 0.569732666015625, 0.60089111328125, 0.632049560546875, 0.6632080078125, 0.694366455078125, 0.72552490234375, 0.756683349609375, 0.787841796875, 0.819000244140625, 0.85015869140625, 0.881317138671875, 0.9124755859375, 0.943634033203125, 0.97479248046875, 1.005950927734375, 1.037109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 9.0, 10.0, 12.0, 19.0, 26.0, 40.0, 42.0, 58.0, 72.0, 119.0, 147.0, 220.0, 306.0, 405.0, 512.0, 514.0, 432.0, 319.0, 219.0, 163.0, 116.0, 78.0, 64.0, 49.0, 37.0, 19.0, 16.0, 14.0, 6.0, 0.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52294921875, -0.5060043334960938, -0.4890594482421875, -0.47211456298828125, -0.455169677734375, -0.43822479248046875, -0.4212799072265625, -0.40433502197265625, -0.38739013671875, -0.37044525146484375, -0.3535003662109375, -0.33655548095703125, -0.319610595703125, -0.30266571044921875, -0.2857208251953125, -0.26877593994140625, -0.2518310546875, -0.23488616943359375, -0.2179412841796875, -0.20099639892578125, -0.184051513671875, -0.16710662841796875, -0.1501617431640625, -0.13321685791015625, -0.11627197265625, -0.09932708740234375, -0.0823822021484375, -0.06543731689453125, -0.048492431640625, -0.03154754638671875, -0.0146026611328125, 0.00234222412109375, 0.019287109375, 0.03623199462890625, 0.0531768798828125, 0.07012176513671875, 0.087066650390625, 0.10401153564453125, 0.1209564208984375, 0.13790130615234375, 0.15484619140625, 0.17179107666015625, 0.1887359619140625, 0.20568084716796875, 0.222625732421875, 0.23957061767578125, 0.2565155029296875, 0.27346038818359375, 0.2904052734375, 0.30735015869140625, 0.3242950439453125, 0.34123992919921875, 0.358184814453125, 0.37512969970703125, 0.3920745849609375, 0.40901947021484375, 0.42596435546875, 0.44290924072265625, 0.4598541259765625, 0.47679901123046875, 0.493743896484375, 0.5106887817382812, 0.5276336669921875, 0.5445785522460938, 0.5615234375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 11.0, 21.0, 39.0, 68.0, 109.0, 172.0, 196.0, 133.0, 81.0, 54.0, 36.0, 21.0, 11.0, 11.0, 2.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.19105339050293, -4.985244274139404, -4.779434680938721, -4.573625564575195, -4.367815971374512, -4.162006855010986, -3.956197500228882, -3.7503881454467773, -3.544578790664673, -3.3387694358825684, -3.132960081100464, -2.9271507263183594, -2.721341609954834, -2.5155320167541504, -2.309722900390625, -2.1039135456085205, -1.898104190826416, -1.6922948360443115, -1.486485481262207, -1.280676245689392, -1.0748668909072876, -0.8690575361251831, -0.6632483005523682, -0.45743894577026367, -0.2516295909881592, -0.045820266008377075, 0.15998905897140503, 0.36579835414886475, 0.5716077089309692, 0.7774170637130737, 0.9832262992858887, 1.1890356540679932, 1.3948450088500977, 1.6006543636322021, 1.8064637184143066, 2.012272834777832, 2.2180824279785156, 2.423891544342041, 2.6297008991241455, 2.83551025390625, 3.0413196086883545, 3.247128963470459, 3.4529383182525635, 3.658747673034668, 3.8645567893981934, 4.070366382598877, 4.276175498962402, 4.481985092163086, 4.687794208526611, 4.893603324890137, 5.09941291809082, 5.305222034454346, 5.511031627655029, 5.716840744018555, 5.922650337219238, 6.128459453582764, 6.334268569946289, 6.5400776863098145, 6.745887279510498, 6.951696395874023, 7.157505989074707, 7.363315105438232, 7.569124221801758, 7.774933815002441, 7.980743408203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 4.0, 5.0, 9.0, 6.0, 8.0, 9.0, 14.0, 13.0, 16.0, 18.0, 17.0, 31.0, 29.0, 39.0, 44.0, 29.0, 53.0, 52.0, 54.0, 64.0, 77.0, 70.0, 48.0, 46.0, 41.0, 43.0, 28.0, 30.0, 24.0, 19.0, 16.0, 18.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9535839557647705, -3.8372952938079834, -3.7210066318511963, -3.604717969894409, -3.488429546356201, -3.372140884399414, -3.255852222442627, -3.13956356048584, -3.0232748985290527, -2.9069862365722656, -2.7906975746154785, -2.6744089126586914, -2.5581202507019043, -2.441831588745117, -2.325543165206909, -2.209254503250122, -2.092965841293335, -1.9766771793365479, -1.8603885173797607, -1.7440999746322632, -1.627811312675476, -1.511522650718689, -1.3952341079711914, -1.2789454460144043, -1.1626567840576172, -1.04636812210083, -0.9300795197486877, -0.8137909173965454, -0.6975022554397583, -0.5812135934829712, -0.46492499113082886, -0.3486363887786865, -0.2323474884033203, -0.11605885624885559, 0.00022977590560913086, 0.11651840806007385, 0.23280704021453857, 0.3490957021713257, 0.465384304523468, 0.5816729068756104, 0.6979615688323975, 0.8142502307891846, 0.9305388331413269, 1.0468274354934692, 1.1631160974502563, 1.2794047594070435, 1.395693302154541, 1.5119819641113281, 1.6282706260681152, 1.7445592880249023, 1.8608479499816895, 1.977136492729187, 2.0934252738952637, 2.209713935852051, 2.326002359390259, 2.442291021347046, 2.558579683303833, 2.67486834526062, 2.7911570072174072, 2.9074456691741943, 3.0237340927124023, 3.1400227546691895, 3.2563114166259766, 3.3726000785827637, 3.488888740539551]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 12.0, 15.0, 18.0, 17.0, 17.0, 61.0, 82.0, 118.0, 285.0, 516.0, 1019.0, 2313.0, 5802.0, 17493.0, 75563.0, 600815.0, 279186.0, 45369.0, 12030.0, 4226.0, 1812.0, 829.0, 392.0, 221.0, 133.0, 59.0, 42.0, 32.0, 17.0, 15.0, 13.0, 8.0, 0.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.44873046875, -0.4354705810546875, -0.422210693359375, -0.4089508056640625, -0.39569091796875, -0.3824310302734375, -0.369171142578125, -0.3559112548828125, -0.3426513671875, -0.3293914794921875, -0.316131591796875, -0.3028717041015625, -0.28961181640625, -0.2763519287109375, -0.263092041015625, -0.2498321533203125, -0.236572265625, -0.2233123779296875, -0.210052490234375, -0.1967926025390625, -0.18353271484375, -0.1702728271484375, -0.157012939453125, -0.1437530517578125, -0.1304931640625, -0.1172332763671875, -0.103973388671875, -0.0907135009765625, -0.07745361328125, -0.0641937255859375, -0.050933837890625, -0.0376739501953125, -0.0244140625, -0.0111541748046875, 0.002105712890625, 0.0153656005859375, 0.02862548828125, 0.0418853759765625, 0.055145263671875, 0.0684051513671875, 0.0816650390625, 0.0949249267578125, 0.108184814453125, 0.1214447021484375, 0.13470458984375, 0.1479644775390625, 0.161224365234375, 0.1744842529296875, 0.187744140625, 0.2010040283203125, 0.214263916015625, 0.2275238037109375, 0.24078369140625, 0.2540435791015625, 0.267303466796875, 0.2805633544921875, 0.2938232421875, 0.3070831298828125, 0.320343017578125, 0.3336029052734375, 0.34686279296875, 0.3601226806640625, 0.373382568359375, 0.3866424560546875, 0.39990234375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 18.0, 8.0, 18.0, 27.0, 35.0, 61.0, 69.0, 78.0, 60.0, 79.0, 74.0, 75.0, 80.0, 66.0, 57.0, 43.0, 39.0, 22.0, 29.0, 16.0, 7.0, 11.0, 11.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.357666015625, -0.3466835021972656, -0.33570098876953125, -0.3247184753417969, -0.3137359619140625, -0.3027534484863281, -0.29177093505859375, -0.2807884216308594, -0.269805908203125, -0.2588233947753906, -0.24784088134765625, -0.23685836791992188, -0.2258758544921875, -0.21489334106445312, -0.20391082763671875, -0.19292831420898438, -0.18194580078125, -0.17096328735351562, -0.15998077392578125, -0.14899826049804688, -0.1380157470703125, -0.12703323364257812, -0.11605072021484375, -0.10506820678710938, -0.094085693359375, -0.08310317993164062, -0.07212066650390625, -0.061138153076171875, -0.0501556396484375, -0.039173126220703125, -0.02819061279296875, -0.017208099365234375, -0.0062255859375, 0.004756927490234375, 0.01573944091796875, 0.026721954345703125, 0.0377044677734375, 0.048686981201171875, 0.05966949462890625, 0.07065200805664062, 0.081634521484375, 0.09261703491210938, 0.10359954833984375, 0.11458206176757812, 0.1255645751953125, 0.13654708862304688, 0.14752960205078125, 0.15851211547851562, 0.16949462890625, 0.18047714233398438, 0.19145965576171875, 0.20244216918945312, 0.2134246826171875, 0.22440719604492188, 0.23538970947265625, 0.24637222290039062, 0.257354736328125, 0.2683372497558594, 0.27931976318359375, 0.2903022766113281, 0.3012847900390625, 0.3122673034667969, 0.32324981689453125, 0.3342323303222656, 0.34521484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 2.0, 6.0, 5.0, 10.0, 7.0, 11.0, 17.0, 25.0, 28.0, 38.0, 58.0, 77.0, 103.0, 178.0, 298.0, 518.0, 1064.0, 2798.0, 12085.0, 103665.0, 875529.0, 41615.0, 6480.0, 1905.0, 758.0, 422.0, 280.0, 179.0, 118.0, 79.0, 57.0, 33.0, 13.0, 24.0, 12.0, 9.0, 9.0, 10.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.44677734375, -0.432037353515625, -0.41729736328125, -0.402557373046875, -0.3878173828125, -0.373077392578125, -0.35833740234375, -0.343597412109375, -0.328857421875, -0.314117431640625, -0.29937744140625, -0.284637451171875, -0.2698974609375, -0.255157470703125, -0.24041748046875, -0.225677490234375, -0.2109375, -0.196197509765625, -0.18145751953125, -0.166717529296875, -0.1519775390625, -0.137237548828125, -0.12249755859375, -0.107757568359375, -0.093017578125, -0.078277587890625, -0.06353759765625, -0.048797607421875, -0.0340576171875, -0.019317626953125, -0.00457763671875, 0.010162353515625, 0.02490234375, 0.039642333984375, 0.05438232421875, 0.069122314453125, 0.0838623046875, 0.098602294921875, 0.11334228515625, 0.128082275390625, 0.142822265625, 0.157562255859375, 0.17230224609375, 0.187042236328125, 0.2017822265625, 0.216522216796875, 0.23126220703125, 0.246002197265625, 0.2607421875, 0.275482177734375, 0.29022216796875, 0.304962158203125, 0.3197021484375, 0.334442138671875, 0.34918212890625, 0.363922119140625, 0.378662109375, 0.393402099609375, 0.40814208984375, 0.422882080078125, 0.4376220703125, 0.452362060546875, 0.46710205078125, 0.481842041015625, 0.49658203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 1.0, 2.0, 5.0, 8.0, 9.0, 6.0, 8.0, 13.0, 8.0, 20.0, 20.0, 18.0, 21.0, 35.0, 35.0, 40.0, 76.0, 86.0, 99.0, 94.0, 74.0, 61.0, 50.0, 32.0, 30.0, 27.0, 21.0, 17.0, 14.0, 14.0, 13.0, 8.0, 5.0, 9.0, 9.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.94775390625, -0.9168624877929688, -0.8859710693359375, -0.8550796508789062, -0.824188232421875, -0.7932968139648438, -0.7624053955078125, -0.7315139770507812, -0.70062255859375, -0.6697311401367188, -0.6388397216796875, -0.6079483032226562, -0.577056884765625, -0.5461654663085938, -0.5152740478515625, -0.48438262939453125, -0.4534912109375, -0.42259979248046875, -0.3917083740234375, -0.36081695556640625, -0.329925537109375, -0.29903411865234375, -0.2681427001953125, -0.23725128173828125, -0.20635986328125, -0.17546844482421875, -0.1445770263671875, -0.11368560791015625, -0.082794189453125, -0.05190277099609375, -0.0210113525390625, 0.00988006591796875, 0.040771484375, 0.07166290283203125, 0.1025543212890625, 0.13344573974609375, 0.164337158203125, 0.19522857666015625, 0.2261199951171875, 0.25701141357421875, 0.28790283203125, 0.31879425048828125, 0.3496856689453125, 0.38057708740234375, 0.411468505859375, 0.44235992431640625, 0.4732513427734375, 0.5041427612304688, 0.5350341796875, 0.5659255981445312, 0.5968170166015625, 0.6277084350585938, 0.658599853515625, 0.6894912719726562, 0.7203826904296875, 0.7512741088867188, 0.78216552734375, 0.8130569458007812, 0.8439483642578125, 0.8748397827148438, 0.905731201171875, 0.9366226196289062, 0.9675140380859375, 0.9984054565429688, 1.029296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 3.0, 3.0, 5.0, 10.0, 16.0, 21.0, 21.0, 41.0, 45.0, 95.0, 127.0, 213.0, 301.0, 529.0, 1025.0, 2245.0, 5719.0, 18097.0, 80383.0, 830374.0, 80882.0, 17847.0, 5730.0, 2287.0, 1078.0, 574.0, 336.0, 179.0, 97.0, 75.0, 36.0, 47.0, 33.0, 17.0, 11.0, 12.0, 5.0, 6.0, 5.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.058685302734375, -0.05682229995727539, -0.05495929718017578, -0.05309629440307617, -0.05123329162597656, -0.04937028884887695, -0.047507286071777344, -0.045644283294677734, -0.043781280517578125, -0.041918277740478516, -0.040055274963378906, -0.0381922721862793, -0.03632926940917969, -0.03446626663208008, -0.03260326385498047, -0.03074026107788086, -0.02887725830078125, -0.02701425552368164, -0.02515125274658203, -0.023288249969482422, -0.021425247192382812, -0.019562244415283203, -0.017699241638183594, -0.015836238861083984, -0.013973236083984375, -0.012110233306884766, -0.010247230529785156, -0.008384227752685547, -0.0065212249755859375, -0.004658222198486328, -0.0027952194213867188, -0.0009322166442871094, 0.0009307861328125, 0.0027937889099121094, 0.004656791687011719, 0.006519794464111328, 0.008382797241210938, 0.010245800018310547, 0.012108802795410156, 0.013971805572509766, 0.015834808349609375, 0.017697811126708984, 0.019560813903808594, 0.021423816680908203, 0.023286819458007812, 0.025149822235107422, 0.02701282501220703, 0.02887582778930664, 0.03073883056640625, 0.03260183334350586, 0.03446483612060547, 0.03632783889770508, 0.03819084167480469, 0.0400538444519043, 0.041916847229003906, 0.043779850006103516, 0.045642852783203125, 0.047505855560302734, 0.049368858337402344, 0.05123186111450195, 0.05309486389160156, 0.05495786666870117, 0.05682086944580078, 0.05868387222290039, 0.060546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 10.0, 3.0, 8.0, 5.0, 9.0, 8.0, 16.0, 12.0, 9.0, 17.0, 19.0, 22.0, 44.0, 35.0, 44.0, 52.0, 61.0, 88.0, 98.0, 73.0, 61.0, 47.0, 46.0, 43.0, 24.0, 28.0, 16.0, 14.0, 14.0, 12.0, 7.0, 8.0, 8.0, 7.0, 6.0, 2.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.777576446533203e-05, -2.6756897568702698e-05, -2.5738030672073364e-05, -2.471916377544403e-05, -2.3700296878814697e-05, -2.2681429982185364e-05, -2.166256308555603e-05, -2.0643696188926697e-05, -1.9624829292297363e-05, -1.860596239566803e-05, -1.7587095499038696e-05, -1.6568228602409363e-05, -1.554936170578003e-05, -1.4530494809150696e-05, -1.3511627912521362e-05, -1.2492761015892029e-05, -1.1473894119262695e-05, -1.0455027222633362e-05, -9.436160326004028e-06, -8.417293429374695e-06, -7.398426532745361e-06, -6.379559636116028e-06, -5.360692739486694e-06, -4.341825842857361e-06, -3.3229589462280273e-06, -2.304092049598694e-06, -1.2852251529693604e-06, -2.6635825634002686e-07, 7.525086402893066e-07, 1.7713755369186401e-06, 2.7902424335479736e-06, 3.809109330177307e-06, 4.827976226806641e-06, 5.846843123435974e-06, 6.865710020065308e-06, 7.884576916694641e-06, 8.903443813323975e-06, 9.922310709953308e-06, 1.0941177606582642e-05, 1.1960044503211975e-05, 1.2978911399841309e-05, 1.3997778296470642e-05, 1.5016645193099976e-05, 1.603551208972931e-05, 1.7054378986358643e-05, 1.8073245882987976e-05, 1.909211277961731e-05, 2.0110979676246643e-05, 2.1129846572875977e-05, 2.214871346950531e-05, 2.3167580366134644e-05, 2.4186447262763977e-05, 2.520531415939331e-05, 2.6224181056022644e-05, 2.7243047952651978e-05, 2.826191484928131e-05, 2.9280781745910645e-05, 3.0299648642539978e-05, 3.131851553916931e-05, 3.2337382435798645e-05, 3.335624933242798e-05, 3.437511622905731e-05, 3.5393983125686646e-05, 3.641285002231598e-05, 3.743171691894531e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 8.0, 6.0, 4.0, 5.0, 15.0, 15.0, 20.0, 38.0, 38.0, 49.0, 76.0, 122.0, 160.0, 274.0, 429.0, 657.0, 1168.0, 2083.0, 3902.0, 8168.0, 19381.0, 58434.0, 701748.0, 180560.0, 41538.0, 15091.0, 6753.0, 3246.0, 1772.0, 1002.0, 649.0, 377.0, 236.0, 156.0, 100.0, 76.0, 50.0, 26.0, 31.0, 19.0, 15.0, 8.0, 9.0, 9.0, 9.0, 5.0, 1.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.03924560546875, -0.03801393508911133, -0.036782264709472656, -0.035550594329833984, -0.03431892395019531, -0.03308725357055664, -0.03185558319091797, -0.030623912811279297, -0.029392242431640625, -0.028160572052001953, -0.02692890167236328, -0.02569723129272461, -0.024465560913085938, -0.023233890533447266, -0.022002220153808594, -0.020770549774169922, -0.01953887939453125, -0.018307209014892578, -0.017075538635253906, -0.015843868255615234, -0.014612197875976562, -0.01338052749633789, -0.012148857116699219, -0.010917186737060547, -0.009685516357421875, -0.008453845977783203, -0.007222175598144531, -0.005990505218505859, -0.0047588348388671875, -0.0035271644592285156, -0.0022954940795898438, -0.0010638236999511719, 0.0001678466796875, 0.0013995170593261719, 0.0026311874389648438, 0.0038628578186035156, 0.0050945281982421875, 0.006326198577880859, 0.007557868957519531, 0.008789539337158203, 0.010021209716796875, 0.011252880096435547, 0.012484550476074219, 0.01371622085571289, 0.014947891235351562, 0.016179561614990234, 0.017411231994628906, 0.018642902374267578, 0.01987457275390625, 0.021106243133544922, 0.022337913513183594, 0.023569583892822266, 0.024801254272460938, 0.02603292465209961, 0.02726459503173828, 0.028496265411376953, 0.029727935791015625, 0.030959606170654297, 0.03219127655029297, 0.03342294692993164, 0.03465461730957031, 0.035886287689208984, 0.037117958068847656, 0.03834962844848633, 0.039581298828125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 4.0, 9.0, 18.0, 21.0, 21.0, 21.0, 31.0, 53.0, 52.0, 80.0, 95.0, 121.0, 83.0, 76.0, 67.0, 55.0, 42.0, 27.0, 29.0, 19.0, 18.0, 15.0, 5.0, 5.0, 2.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.096435546875, -0.0938119888305664, -0.09118843078613281, -0.08856487274169922, -0.08594131469726562, -0.08331775665283203, -0.08069419860839844, -0.07807064056396484, -0.07544708251953125, -0.07282352447509766, -0.07019996643066406, -0.06757640838623047, -0.06495285034179688, -0.06232929229736328, -0.05970573425292969, -0.057082176208496094, -0.0544586181640625, -0.051835060119628906, -0.04921150207519531, -0.04658794403076172, -0.043964385986328125, -0.04134082794189453, -0.03871726989746094, -0.036093711853027344, -0.03347015380859375, -0.030846595764160156, -0.028223037719726562, -0.02559947967529297, -0.022975921630859375, -0.02035236358642578, -0.017728805541992188, -0.015105247497558594, -0.012481689453125, -0.009858131408691406, -0.0072345733642578125, -0.004611015319824219, -0.001987457275390625, 0.0006361007690429688, 0.0032596588134765625, 0.005883216857910156, 0.00850677490234375, 0.011130332946777344, 0.013753890991210938, 0.01637744903564453, 0.019001007080078125, 0.02162456512451172, 0.024248123168945312, 0.026871681213378906, 0.0294952392578125, 0.032118797302246094, 0.03474235534667969, 0.03736591339111328, 0.039989471435546875, 0.04261302947998047, 0.04523658752441406, 0.047860145568847656, 0.05048370361328125, 0.053107261657714844, 0.05573081970214844, 0.05835437774658203, 0.060977935791015625, 0.06360149383544922, 0.06622505187988281, 0.0688486099243164, 0.07147216796875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 18.0, 45.0, 83.0, 407.0, 280.0, 95.0, 29.0, 22.0, 4.0, 3.0, 2.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.082947731018066, -3.925687789916992, -3.768427848815918, -3.6111679077148438, -3.4539079666137695, -3.2966480255126953, -3.1393883228302, -2.982128381729126, -2.8248684406280518, -2.6676084995269775, -2.5103485584259033, -2.353088617324829, -2.195828914642334, -2.0385689735412598, -1.8813090324401855, -1.7240490913391113, -1.566789150238037, -1.409529209136963, -1.2522692680358887, -1.095009446144104, -0.9377495050430298, -0.7804895639419556, -0.6232296824455261, -0.4659698009490967, -0.30870985984802246, -0.15144994854927063, 0.005809962749481201, 0.16306987404823303, 0.32032978534698486, 0.4775897264480591, 0.6348496079444885, 0.792109489440918, 0.949368953704834, 1.1066288948059082, 1.2638888359069824, 1.421148657798767, 1.5784085988998413, 1.7356685400009155, 1.8929283618927002, 2.0501883029937744, 2.2074482440948486, 2.364708185195923, 2.521968126296997, 2.6792280673980713, 2.8364877700805664, 2.9937477111816406, 3.151007652282715, 3.308267593383789, 3.4655275344848633, 3.6227874755859375, 3.7800474166870117, 3.937307357788086, 4.09456729888916, 4.251827239990234, 4.409087181091309, 4.566347122192383, 4.723607063293457, 4.880867004394531, 5.0381269454956055, 5.19538688659668, 5.352646827697754, 5.509906768798828, 5.667166709899902, 5.824426651000977, 5.981686115264893]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 13.0, 7.0, 9.0, 13.0, 16.0, 11.0, 15.0, 9.0, 16.0, 12.0, 20.0, 21.0, 21.0, 46.0, 135.0, 199.0, 149.0, 32.0, 30.0, 16.0, 24.0, 22.0, 18.0, 24.0, 12.0, 12.0, 14.0, 10.0, 15.0, 9.0, 9.0, 4.0, 4.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-2.3717689514160156, -2.303168773651123, -2.2345685958862305, -2.165968179702759, -2.097368001937866, -2.0287678241729736, -1.960167646408081, -1.8915674686431885, -1.8229671716690063, -1.7543669939041138, -1.6857666969299316, -1.617166519165039, -1.5485663414001465, -1.4799660444259644, -1.4113658666610718, -1.3427655696868896, -1.274165391921997, -1.2055652141571045, -1.1369649171829224, -1.0683647394180298, -0.9997645020484924, -0.9311642646789551, -0.8625640869140625, -0.7939638495445251, -0.7253636121749878, -0.6567633748054504, -0.5881631374359131, -0.5195629596710205, -0.45096272230148315, -0.3823624849319458, -0.31376227736473083, -0.24516206979751587, -0.17656159400939941, -0.10796137154102325, -0.039361149072647095, 0.029239073395729065, 0.09783929586410522, 0.16643953323364258, 0.23503974080085754, 0.3036399483680725, 0.37224018573760986, 0.4408404231071472, 0.5094406604766846, 0.5780408382415771, 0.6466410756111145, 0.7152413129806519, 0.7838414907455444, 0.8524417281150818, 0.9210419654846191, 0.9896422028541565, 1.0582424402236938, 1.1268426179885864, 1.1954429149627686, 1.2640430927276611, 1.3326432704925537, 1.4012434482574463, 1.4698437452316284, 1.538443922996521, 1.6070442199707031, 1.6756443977355957, 1.7442445755004883, 1.8128448724746704, 1.881445050239563, 1.9500453472137451, 2.0186455249786377]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 5.0, 6.0, 10.0, 9.0, 15.0, 12.0, 15.0, 16.0, 22.0, 27.0, 40.0, 38.0, 34.0, 47.0, 125.0, 253.0, 61.0, 25.0, 38.0, 38.0, 25.0, 23.0, 24.0, 15.0, 11.0, 11.0, 8.0, 7.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1572265625, -0.15047836303710938, -0.14373016357421875, -0.13698196411132812, -0.1302337646484375, -0.12348556518554688, -0.11673736572265625, -0.10998916625976562, -0.103240966796875, -0.09649276733398438, -0.08974456787109375, -0.08299636840820312, -0.0762481689453125, -0.06949996948242188, -0.06275177001953125, -0.056003570556640625, -0.04925537109375, -0.042507171630859375, -0.03575897216796875, -0.029010772705078125, -0.0222625732421875, -0.015514373779296875, -0.00876617431640625, -0.002017974853515625, 0.004730224609375, 0.011478424072265625, 0.01822662353515625, 0.024974822998046875, 0.0317230224609375, 0.038471221923828125, 0.04521942138671875, 0.051967620849609375, 0.0587158203125, 0.06546401977539062, 0.07221221923828125, 0.07896041870117188, 0.0857086181640625, 0.09245681762695312, 0.09920501708984375, 0.10595321655273438, 0.112701416015625, 0.11944961547851562, 0.12619781494140625, 0.13294601440429688, 0.1396942138671875, 0.14644241333007812, 0.15319061279296875, 0.15993881225585938, 0.16668701171875, 0.17343521118164062, 0.18018341064453125, 0.18693161010742188, 0.1936798095703125, 0.20042800903320312, 0.20717620849609375, 0.21392440795898438, 0.220672607421875, 0.22742080688476562, 0.23416900634765625, 0.24091720581054688, 0.2476654052734375, 0.2544136047363281, 0.26116180419921875, 0.2679100036621094, 0.274658203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 8.0, 17.0, 16.0, 25.0, 56.0, 86.0, 264.0, 750.0, 4065.0, 8262953.0, 116026.0, 3163.0, 665.0, 240.0, 105.0, 53.0, 25.0, 14.0, 15.0, 9.0, 10.0, 10.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.584643602371216, -2.4921183586120605, -2.399592876434326, -2.307067632675171, -2.2145423889160156, -2.1220169067382812, -2.029491662979126, -1.9369663000106812, -1.8444409370422363, -1.7519155740737915, -1.6593903303146362, -1.5668649673461914, -1.4743396043777466, -1.3818142414093018, -1.2892889976501465, -1.1967636346817017, -1.1042383909225464, -1.0117130279541016, -0.9191877245903015, -0.8266624212265015, -0.7341370582580566, -0.6416117548942566, -0.5490864515304565, -0.4565610885620117, -0.36403578519821167, -0.27151045203208923, -0.178985133767128, -0.08645981550216675, 0.0060655176639556885, 0.09859085083007812, 0.19111615419387817, 0.283641517162323, 0.37616682052612305, 0.4686921536922455, 0.5612174868583679, 0.653742790222168, 0.7462681531906128, 0.8387934565544128, 0.9313187599182129, 1.0238441228866577, 1.1163694858551025, 1.2088948488235474, 1.3014200925827026, 1.3939454555511475, 1.4864708185195923, 1.578996181488037, 1.6715214252471924, 1.7640467882156372, 1.8565720319747925, 1.9490973949432373, 2.0416226387023926, 2.134148120880127, 2.2266733646392822, 2.3191986083984375, 2.411724090576172, 2.504249334335327, 2.5967745780944824, 2.6892998218536377, 2.781825304031372, 2.8743505477905273, 2.9668757915496826, 3.059401273727417, 3.1519265174865723, 3.2444519996643066, 3.336977243423462]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 5.0, 10.0, 2.0, 6.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 3.0, 5.0, 5.0, 5.0, 7.0, 6.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.9421043395996094, -3.840648651123047, -3.7391929626464844, -3.637737274169922, -3.5362815856933594, -3.434825897216797, -3.3333702087402344, -3.231914520263672, -3.1304588317871094, -3.029003143310547, -2.9275474548339844, -2.826091766357422, -2.7246360778808594, -2.623180389404297, -2.5217247009277344, -2.420269012451172, -2.3188135623931885, -2.217357873916626, -2.1159021854400635, -2.014446496963501, -1.9129908084869385, -1.811535120010376, -1.710079550743103, -1.6086238622665405, -1.507168173789978, -1.4057124853134155, -1.304256796836853, -1.20280122756958, -1.1013455390930176, -0.9998897910118103, -0.8984341621398926, -0.7969784736633301, -0.6955227851867676, -0.5940670967102051, -0.49261143803596497, -0.39115577936172485, -0.28970009088516235, -0.18824440240859985, -0.08678877353668213, 0.014666914939880371, 0.11612260341644287, 0.21757827699184418, 0.3190339505672455, 0.4204896092414856, 0.5219452977180481, 0.6234009861946106, 0.7248566150665283, 0.8263123035430908, 0.9277679920196533, 1.0292236804962158, 1.1306793689727783, 1.2321350574493408, 1.3335907459259033, 1.4350464344024658, 1.5365020036697388, 1.6379576921463013, 1.7394133806228638, 1.8408690690994263, 1.9423247575759888, 2.0437803268432617, 2.145236015319824, 2.2466917037963867, 2.348147392272949, 2.4496030807495117, 2.551058769226074]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 9.0, 11.0, 14.0, 20.0, 25.0, 28.0, 41.0, 46.0, 79.0, 107.0, 211.0, 288.0, 506.0, 1206.0, 3217.0, 9794.0, 33183.0, 120212.0, 227162.0, 90185.0, 25357.0, 7633.0, 2618.0, 1037.0, 489.0, 254.0, 175.0, 98.0, 68.0, 49.0, 32.0, 24.0, 20.0, 21.0, 6.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9892578125, -1.93304443359375, -1.8768310546875, -1.82061767578125, -1.764404296875, -1.70819091796875, -1.6519775390625, -1.59576416015625, -1.53955078125, -1.48333740234375, -1.4271240234375, -1.37091064453125, -1.314697265625, -1.25848388671875, -1.2022705078125, -1.14605712890625, -1.08984375, -1.03363037109375, -0.9774169921875, -0.92120361328125, -0.864990234375, -0.80877685546875, -0.7525634765625, -0.69635009765625, -0.64013671875, -0.58392333984375, -0.5277099609375, -0.47149658203125, -0.415283203125, -0.35906982421875, -0.3028564453125, -0.24664306640625, -0.1904296875, -0.13421630859375, -0.0780029296875, -0.02178955078125, 0.034423828125, 0.09063720703125, 0.1468505859375, 0.20306396484375, 0.25927734375, 0.31549072265625, 0.3717041015625, 0.42791748046875, 0.484130859375, 0.54034423828125, 0.5965576171875, 0.65277099609375, 0.708984375, 0.76519775390625, 0.8214111328125, 0.87762451171875, 0.933837890625, 0.99005126953125, 1.0462646484375, 1.10247802734375, 1.15869140625, 1.21490478515625, 1.2711181640625, 1.32733154296875, 1.383544921875, 1.43975830078125, 1.4959716796875, 1.55218505859375, 1.6083984375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 6.0, 3.0, 10.0, 5.0, 12.0, 16.0, 30.0, 40.0, 54.0, 59.0, 55.0, 72.0, 76.0, 76.0, 101.0, 81.0, 66.0, 50.0, 53.0, 31.0, 27.0, 14.0, 18.0, 6.0, 9.0, 9.0, 8.0, 4.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.3583984375, -0.348358154296875, -0.33831787109375, -0.328277587890625, -0.3182373046875, -0.308197021484375, -0.29815673828125, -0.288116455078125, -0.278076171875, -0.268035888671875, -0.25799560546875, -0.247955322265625, -0.2379150390625, -0.227874755859375, -0.21783447265625, -0.207794189453125, -0.19775390625, -0.187713623046875, -0.17767333984375, -0.167633056640625, -0.1575927734375, -0.147552490234375, -0.13751220703125, -0.127471923828125, -0.117431640625, -0.107391357421875, -0.09735107421875, -0.087310791015625, -0.0772705078125, -0.067230224609375, -0.05718994140625, -0.047149658203125, -0.037109375, -0.027069091796875, -0.01702880859375, -0.006988525390625, 0.0030517578125, 0.013092041015625, 0.02313232421875, 0.033172607421875, 0.043212890625, 0.053253173828125, 0.06329345703125, 0.073333740234375, 0.0833740234375, 0.093414306640625, 0.10345458984375, 0.113494873046875, 0.12353515625, 0.133575439453125, 0.14361572265625, 0.153656005859375, 0.1636962890625, 0.173736572265625, 0.18377685546875, 0.193817138671875, 0.203857421875, 0.213897705078125, 0.22393798828125, 0.233978271484375, 0.2440185546875, 0.254058837890625, 0.26409912109375, 0.274139404296875, 0.2841796875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 10.0, 19.0, 33.0, 81.0, 96.0, 93.0, 67.0, 35.0, 9.0, 12.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.1596553325653076, -3.085617780685425, -3.011580228805542, -2.937542676925659, -2.8635051250457764, -2.7894675731658936, -2.7154300212860107, -2.641392707824707, -2.567355155944824, -2.4933176040649414, -2.4192800521850586, -2.345242500305176, -2.271204948425293, -2.19716739654541, -2.1231298446655273, -2.0490922927856445, -1.9750547409057617, -1.901017189025879, -1.826979637145996, -1.7529420852661133, -1.6789045333862305, -1.6048669815063477, -1.5308295488357544, -1.4567919969558716, -1.3827544450759888, -1.308716893196106, -1.2346793413162231, -1.1606417894363403, -1.086604356765747, -1.0125668048858643, -0.9385292530059814, -0.8644917011260986, -0.7904542684555054, -0.7164167165756226, -0.6423791646957397, -0.5683416724205017, -0.4943041205406189, -0.4202665686607361, -0.34622904658317566, -0.27219152450561523, -0.19815397262573242, -0.1241164356470108, -0.050078898668289185, 0.023958638310432434, 0.09799617528915405, 0.17203372716903687, 0.2460712492465973, 0.3201087713241577, 0.3941463232040405, 0.46818387508392334, 0.5422214269638062, 0.6162589192390442, 0.690296471118927, 0.7643340229988098, 0.8383715152740479, 0.9124090671539307, 0.9864466190338135, 1.0604841709136963, 1.134521722793579, 1.208559274673462, 1.2825968265533447, 1.3566343784332275, 1.4306718111038208, 1.5047093629837036, 1.5787469148635864]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 10.0, 15.0, 14.0, 35.0, 55.0, 116.0, 98.0, 50.0, 26.0, 14.0, 11.0, 7.0, 6.0, 1.0, 1.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.063533067703247, -2.007631301879883, -1.951729416847229, -1.8958276510238647, -1.839925765991211, -1.7840240001678467, -1.7281222343444824, -1.6722203493118286, -1.6163185834884644, -1.5604168176651, -1.5045149326324463, -1.448613166809082, -1.3927112817764282, -1.336809515953064, -1.2809076309204102, -1.225005865097046, -1.1691040992736816, -1.1132023334503174, -1.0573004484176636, -1.0013986825942993, -0.9454968571662903, -0.8895950317382812, -0.8336932063102722, -0.7777913808822632, -0.7218894958496094, -0.6659876704216003, -0.6100858449935913, -0.554184079170227, -0.498282253742218, -0.442380428314209, -0.38647860288619995, -0.3305768072605133, -0.27467501163482666, -0.21877320110797882, -0.16287139058113098, -0.10696956515312195, -0.05106775462627411, 0.0048340559005737305, 0.060735881328582764, 0.11663767695426941, 0.17253950238227844, 0.22844131290912628, 0.2843431234359741, 0.34024494886398315, 0.3961467742919922, 0.45204856991767883, 0.5079504251480103, 0.5638521909713745, 0.6197540163993835, 0.6756558418273926, 0.7315576672554016, 0.7874594926834106, 0.8433612585067749, 0.8992630839347839, 0.955164909362793, 1.0110666751861572, 1.066968560218811, 1.1228703260421753, 1.178772211074829, 1.2346739768981934, 1.2905758619308472, 1.3464776277542114, 1.4023795127868652, 1.4582812786102295, 1.5141830444335938]}, "eval/loss": 4.216550350189209, "eval/wer": 2.3908964696548987, "eval/runtime": 932.3753, "eval/samples_per_second": 2.834, "eval/steps_per_second": 0.237, "train/train_runtime": 5668.958, "train/train_samples_per_second": 5.034, "train/train_steps_per_second": 0.105, "train/total_flos": 0.0, "train/train_loss": 4.277455122382553} \ No newline at end of file +{"train/loss": 4.2767, "train/learning_rate": 2.1276595744680853e-06, "train/epoch": 1.0, "train/global_step": 594, "_runtime": 6892, "_timestamp": 1646194276, "_step": 596, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 9.0, 923.0, 85.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.87272644042969, -32.01921463012695, -20.16570472717285, -8.31219482421875, 3.5413169860839844, 15.394828796386719, 27.248336791992188, 39.10185241699219, 50.955360412597656, 62.80887222290039, 74.66238403320312, 86.5158920288086, 98.36940002441406, 110.22291564941406, 122.07642364501953, 133.929931640625, 145.783447265625, 157.636962890625, 169.49046325683594, 181.34397888183594, 193.19749450683594, 205.05099487304688, 216.90451049804688, 228.75802612304688, 240.61154174804688, 252.46505737304688, 264.3185729980469, 276.17205810546875, 288.02557373046875, 299.87908935546875, 311.73260498046875, 323.58612060546875, 335.4396057128906, 347.2931213378906, 359.1466369628906, 371.0001220703125, 382.8536376953125, 394.7071533203125, 406.5606689453125, 418.4141845703125, 430.2677001953125, 442.1212158203125, 453.9747314453125, 465.8282470703125, 477.6817321777344, 489.5352478027344, 501.3887634277344, 513.2423095703125, 525.0957641601562, 536.9492797851562, 548.8027954101562, 560.6563110351562, 572.5098266601562, 584.3633422851562, 596.216796875, 608.0703125, 619.9238891601562, 631.7774047851562, 643.6309204101562, 655.4844360351562, 667.3379516601562, 679.1914672851562, 691.044921875, 702.8984375, 714.751953125]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 6.0, 4.0, 8.0, 11.0, 17.0, 16.0, 17.0, 21.0, 28.0, 22.0, 38.0, 39.0, 49.0, 43.0, 54.0, 38.0, 54.0, 53.0, 52.0, 53.0, 51.0, 42.0, 36.0, 42.0, 33.0, 34.0, 42.0, 24.0, 20.0, 8.0, 9.0, 12.0, 5.0, 6.0, 1.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.28767395019531, -48.571067810058594, -46.854461669921875, -45.137855529785156, -43.42124938964844, -41.70464324951172, -39.988037109375, -38.27143096923828, -36.55482482910156, -34.838218688964844, -33.121612548828125, -31.405006408691406, -29.688400268554688, -27.97179412841797, -26.25518798828125, -24.53858184814453, -22.821977615356445, -21.105371475219727, -19.388765335083008, -17.67215919494629, -15.95555305480957, -14.238947868347168, -12.52234172821045, -10.80573558807373, -9.089129447937012, -7.372523307800293, -5.655917167663574, -3.9393115043640137, -2.222705364227295, -0.5060997009277344, 1.2105064392089844, 2.927112579345703, 4.643718719482422, 6.360324859619141, 8.07693099975586, 9.793537139892578, 11.510143280029297, 13.2267484664917, 14.943354606628418, 16.659961700439453, 18.376567840576172, 20.09317398071289, 21.80978012084961, 23.526386260986328, 25.242992401123047, 26.959598541259766, 28.676204681396484, 30.392810821533203, 32.109413146972656, 33.826019287109375, 35.542625427246094, 37.25923156738281, 38.97583770751953, 40.69244384765625, 42.40904998779297, 44.12565612792969, 45.842262268066406, 47.558868408203125, 49.275474548339844, 50.99208068847656, 52.70868682861328, 54.42529296875, 56.14189910888672, 57.85850524902344, 59.575111389160156]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 9.0, 10.0, 4.0, 12.0, 16.0, 9.0, 12.0, 19.0, 23.0, 19.0, 24.0, 36.0, 27.0, 38.0, 25.0, 35.0, 33.0, 40.0, 37.0, 39.0, 41.0, 29.0, 38.0, 46.0, 28.0, 43.0, 35.0, 32.0, 28.0, 31.0, 29.0, 25.0, 31.0, 17.0, 21.0, 10.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.64453125, -1.59210205078125, -1.5396728515625, -1.48724365234375, -1.434814453125, -1.38238525390625, -1.3299560546875, -1.27752685546875, -1.22509765625, -1.17266845703125, -1.1202392578125, -1.06781005859375, -1.015380859375, -0.96295166015625, -0.9105224609375, -0.85809326171875, -0.8056640625, -0.75323486328125, -0.7008056640625, -0.64837646484375, -0.595947265625, -0.54351806640625, -0.4910888671875, -0.43865966796875, -0.38623046875, -0.33380126953125, -0.2813720703125, -0.22894287109375, -0.176513671875, -0.12408447265625, -0.0716552734375, -0.01922607421875, 0.033203125, 0.08563232421875, 0.1380615234375, 0.19049072265625, 0.242919921875, 0.29534912109375, 0.3477783203125, 0.40020751953125, 0.45263671875, 0.50506591796875, 0.5574951171875, 0.60992431640625, 0.662353515625, 0.71478271484375, 0.7672119140625, 0.81964111328125, 0.8720703125, 0.92449951171875, 0.9769287109375, 1.02935791015625, 1.081787109375, 1.13421630859375, 1.1866455078125, 1.23907470703125, 1.29150390625, 1.34393310546875, 1.3963623046875, 1.44879150390625, 1.501220703125, 1.55364990234375, 1.6060791015625, 1.65850830078125, 1.7109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 9.0, 10.0, 16.0, 17.0, 22.0, 27.0, 30.0, 48.0, 65.0, 93.0, 82.0, 140.0, 221.0, 317.0, 511.0, 797.0, 1340.0, 2651.0, 7074.0, 28746.0, 255415.0, 3042783.0, 777788.0, 57020.0, 10956.0, 3779.0, 1617.0, 921.0, 563.0, 375.0, 237.0, 190.0, 113.0, 89.0, 54.0, 42.0, 26.0, 22.0, 12.0, 12.0, 7.0, 5.0, 6.0, 10.0, 10.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.796875, -8.5277099609375, -8.258544921875, -7.9893798828125, -7.72021484375, -7.4510498046875, -7.181884765625, -6.9127197265625, -6.6435546875, -6.3743896484375, -6.105224609375, -5.8360595703125, -5.56689453125, -5.2977294921875, -5.028564453125, -4.7593994140625, -4.490234375, -4.2210693359375, -3.951904296875, -3.6827392578125, -3.41357421875, -3.1444091796875, -2.875244140625, -2.6060791015625, -2.3369140625, -2.0677490234375, -1.798583984375, -1.5294189453125, -1.26025390625, -0.9910888671875, -0.721923828125, -0.4527587890625, -0.18359375, 0.0855712890625, 0.354736328125, 0.6239013671875, 0.89306640625, 1.1622314453125, 1.431396484375, 1.7005615234375, 1.9697265625, 2.2388916015625, 2.508056640625, 2.7772216796875, 3.04638671875, 3.3155517578125, 3.584716796875, 3.8538818359375, 4.123046875, 4.3922119140625, 4.661376953125, 4.9305419921875, 5.19970703125, 5.4688720703125, 5.738037109375, 6.0072021484375, 6.2763671875, 6.5455322265625, 6.814697265625, 7.0838623046875, 7.35302734375, 7.6221923828125, 7.891357421875, 8.1605224609375, 8.4296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 15.0, 18.0, 40.0, 65.0, 100.0, 182.0, 312.0, 521.0, 780.0, 720.0, 504.0, 298.0, 161.0, 115.0, 90.0, 47.0, 32.0, 21.0, 17.0, 7.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.3828125, -12.04638671875, -11.7099609375, -11.37353515625, -11.037109375, -10.70068359375, -10.3642578125, -10.02783203125, -9.69140625, -9.35498046875, -9.0185546875, -8.68212890625, -8.345703125, -8.00927734375, -7.6728515625, -7.33642578125, -7.0, -6.66357421875, -6.3271484375, -5.99072265625, -5.654296875, -5.31787109375, -4.9814453125, -4.64501953125, -4.30859375, -3.97216796875, -3.6357421875, -3.29931640625, -2.962890625, -2.62646484375, -2.2900390625, -1.95361328125, -1.6171875, -1.28076171875, -0.9443359375, -0.60791015625, -0.271484375, 0.06494140625, 0.4013671875, 0.73779296875, 1.07421875, 1.41064453125, 1.7470703125, 2.08349609375, 2.419921875, 2.75634765625, 3.0927734375, 3.42919921875, 3.765625, 4.10205078125, 4.4384765625, 4.77490234375, 5.111328125, 5.44775390625, 5.7841796875, 6.12060546875, 6.45703125, 6.79345703125, 7.1298828125, 7.46630859375, 7.802734375, 8.13916015625, 8.4755859375, 8.81201171875, 9.1484375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 8.0, 9.0, 10.0, 13.0, 31.0, 52.0, 94.0, 156.0, 366.0, 691.0, 1758.0, 8100.0, 1546976.0, 2622237.0, 9988.0, 2071.0, 774.0, 431.0, 208.0, 105.0, 80.0, 41.0, 18.0, 11.0, 5.0, 15.0, 11.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.25, -36.15576171875, -35.0615234375, -33.96728515625, -32.873046875, -31.77880859375, -30.6845703125, -29.59033203125, -28.49609375, -27.40185546875, -26.3076171875, -25.21337890625, -24.119140625, -23.02490234375, -21.9306640625, -20.83642578125, -19.7421875, -18.64794921875, -17.5537109375, -16.45947265625, -15.365234375, -14.27099609375, -13.1767578125, -12.08251953125, -10.98828125, -9.89404296875, -8.7998046875, -7.70556640625, -6.611328125, -5.51708984375, -4.4228515625, -3.32861328125, -2.234375, -1.14013671875, -0.0458984375, 1.04833984375, 2.142578125, 3.23681640625, 4.3310546875, 5.42529296875, 6.51953125, 7.61376953125, 8.7080078125, 9.80224609375, 10.896484375, 11.99072265625, 13.0849609375, 14.17919921875, 15.2734375, 16.36767578125, 17.4619140625, 18.55615234375, 19.650390625, 20.74462890625, 21.8388671875, 22.93310546875, 24.02734375, 25.12158203125, 26.2158203125, 27.31005859375, 28.404296875, 29.49853515625, 30.5927734375, 31.68701171875, 32.78125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 384.0, 620.0, 11.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-496.1153564453125, -487.0934143066406, -478.07147216796875, -469.04949951171875, -460.0275573730469, -451.005615234375, -441.9836730957031, -432.96173095703125, -423.93975830078125, -414.9178161621094, -405.8958740234375, -396.8739013671875, -387.8519592285156, -378.83001708984375, -369.8080749511719, -360.7861328125, -351.7641906738281, -342.74224853515625, -333.7203063964844, -324.6983337402344, -315.6763916015625, -306.6544494628906, -297.63250732421875, -288.6105651855469, -279.588623046875, -270.5666809082031, -261.54473876953125, -252.5227813720703, -243.50082397460938, -234.4788818359375, -225.45693969726562, -216.43499755859375, -207.41305541992188, -198.39111328125, -189.36915588378906, -180.3472137451172, -171.32525634765625, -162.30331420898438, -153.2813720703125, -144.25942993164062, -135.2374725341797, -126.21552276611328, -117.19357299804688, -108.171630859375, -99.1496810913086, -90.12773132324219, -81.10578918457031, -72.0838394165039, -63.0618896484375, -54.039939880371094, -45.01799392700195, -35.99604797363281, -26.974098205566406, -17.9521484375, -8.93020248413086, 0.09174346923828125, 9.113693237304688, 18.13564109802246, 27.157588958740234, 36.179534912109375, 45.20148468017578, 54.22343444824219, 63.24538040161133, 72.26732635498047, 81.28927612304688]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 5.0, 10.0, 15.0, 20.0, 25.0, 26.0, 29.0, 32.0, 45.0, 48.0, 48.0, 61.0, 62.0, 58.0, 74.0, 74.0, 61.0, 57.0, 45.0, 42.0, 30.0, 32.0, 28.0, 17.0, 16.0, 10.0, 8.0, 8.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.311134338378906, -54.782867431640625, -53.254600524902344, -51.72633361816406, -50.19806671142578, -48.6697998046875, -47.14153289794922, -45.61326599121094, -44.084999084472656, -42.556732177734375, -41.028465270996094, -39.50019836425781, -37.97193145751953, -36.44366455078125, -34.91539764404297, -33.38713073730469, -31.85886573791504, -30.330598831176758, -28.802331924438477, -27.274065017700195, -25.745798110961914, -24.217531204223633, -22.689266204833984, -21.160999298095703, -19.632732391357422, -18.10446548461914, -16.57619857788086, -15.047931671142578, -13.519664764404297, -11.991397857666016, -10.46313190460205, -8.93486499786377, -7.406597137451172, -5.878330230712891, -4.350063323974609, -2.8217968940734863, -1.293529987335205, 0.23473691940307617, 1.7630033493041992, 3.2912702560424805, 4.819537162780762, 6.347804069519043, 7.876070976257324, 9.404336929321289, 10.93260383605957, 12.460870742797852, 13.989137649536133, 15.517404556274414, 17.045671463012695, 18.573938369750977, 20.102205276489258, 21.63047218322754, 23.15873908996582, 24.6870059967041, 26.21527099609375, 27.74353790283203, 29.271804809570312, 30.800071716308594, 32.328338623046875, 33.856605529785156, 35.38487243652344, 36.91313934326172, 38.44140625, 39.96967315673828, 41.49794006347656]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 4.0, 6.0, 4.0, 5.0, 8.0, 12.0, 8.0, 12.0, 22.0, 18.0, 18.0, 19.0, 22.0, 20.0, 25.0, 27.0, 36.0, 37.0, 29.0, 32.0, 31.0, 49.0, 35.0, 47.0, 31.0, 41.0, 42.0, 30.0, 32.0, 37.0, 36.0, 28.0, 31.0, 23.0, 15.0, 22.0, 16.0, 22.0, 11.0, 14.0, 12.0, 3.0, 4.0, 10.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.771484375, -1.717926025390625, -1.66436767578125, -1.610809326171875, -1.5572509765625, -1.503692626953125, -1.45013427734375, -1.396575927734375, -1.343017578125, -1.289459228515625, -1.23590087890625, -1.182342529296875, -1.1287841796875, -1.075225830078125, -1.02166748046875, -0.968109130859375, -0.91455078125, -0.860992431640625, -0.80743408203125, -0.753875732421875, -0.7003173828125, -0.646759033203125, -0.59320068359375, -0.539642333984375, -0.486083984375, -0.432525634765625, -0.37896728515625, -0.325408935546875, -0.2718505859375, -0.218292236328125, -0.16473388671875, -0.111175537109375, -0.0576171875, -0.004058837890625, 0.04949951171875, 0.103057861328125, 0.1566162109375, 0.210174560546875, 0.26373291015625, 0.317291259765625, 0.370849609375, 0.424407958984375, 0.47796630859375, 0.531524658203125, 0.5850830078125, 0.638641357421875, 0.69219970703125, 0.745758056640625, 0.79931640625, 0.852874755859375, 0.90643310546875, 0.959991455078125, 1.0135498046875, 1.067108154296875, 1.12066650390625, 1.174224853515625, 1.227783203125, 1.281341552734375, 1.33489990234375, 1.388458251953125, 1.4420166015625, 1.495574951171875, 1.54913330078125, 1.602691650390625, 1.65625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 9.0, 18.0, 21.0, 34.0, 38.0, 64.0, 92.0, 137.0, 190.0, 302.0, 368.0, 608.0, 833.0, 1344.0, 1884.0, 2947.0, 4315.0, 6756.0, 10448.0, 16068.0, 24776.0, 39014.0, 60683.0, 93016.0, 137368.0, 178796.0, 155979.0, 109966.0, 71956.0, 46150.0, 29586.0, 19178.0, 11938.0, 7947.0, 5279.0, 3415.0, 2324.0, 1537.0, 1019.0, 700.0, 457.0, 320.0, 222.0, 117.0, 118.0, 63.0, 55.0, 43.0, 26.0, 17.0, 9.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1435546875, -0.13916397094726562, -0.13477325439453125, -0.13038253784179688, -0.1259918212890625, -0.12160110473632812, -0.11721038818359375, -0.11281967163085938, -0.108428955078125, -0.10403823852539062, -0.09964752197265625, -0.09525680541992188, -0.0908660888671875, -0.08647537231445312, -0.08208465576171875, -0.07769393920898438, -0.07330322265625, -0.06891250610351562, -0.06452178955078125, -0.060131072998046875, -0.0557403564453125, -0.051349639892578125, -0.04695892333984375, -0.042568206787109375, -0.038177490234375, -0.033786773681640625, -0.02939605712890625, -0.025005340576171875, -0.0206146240234375, -0.016223907470703125, -0.01183319091796875, -0.007442474365234375, -0.0030517578125, 0.001338958740234375, 0.00572967529296875, 0.010120391845703125, 0.0145111083984375, 0.018901824951171875, 0.02329254150390625, 0.027683258056640625, 0.032073974609375, 0.036464691162109375, 0.04085540771484375, 0.045246124267578125, 0.0496368408203125, 0.054027557373046875, 0.05841827392578125, 0.06280899047851562, 0.06719970703125, 0.07159042358398438, 0.07598114013671875, 0.08037185668945312, 0.0847625732421875, 0.08915328979492188, 0.09354400634765625, 0.09793472290039062, 0.102325439453125, 0.10671615600585938, 0.11110687255859375, 0.11549758911132812, 0.1198883056640625, 0.12427902221679688, 0.12866973876953125, 0.13306045532226562, 0.137451171875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 8.0, 7.0, 11.0, 13.0, 13.0, 14.0, 23.0, 17.0, 19.0, 16.0, 29.0, 21.0, 33.0, 35.0, 29.0, 37.0, 22.0, 35.0, 44.0, 38.0, 1060.0, 35.0, 36.0, 34.0, 42.0, 34.0, 31.0, 32.0, 37.0, 18.0, 26.0, 13.0, 25.0, 16.0, 23.0, 11.0, 15.0, 9.0, 9.0, 8.0, 15.0, 4.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.1064453125, -1.072662353515625, -1.03887939453125, -1.005096435546875, -0.9713134765625, -0.937530517578125, -0.90374755859375, -0.869964599609375, -0.836181640625, -0.802398681640625, -0.76861572265625, -0.734832763671875, -0.7010498046875, -0.667266845703125, -0.63348388671875, -0.599700927734375, -0.56591796875, -0.532135009765625, -0.49835205078125, -0.464569091796875, -0.4307861328125, -0.397003173828125, -0.36322021484375, -0.329437255859375, -0.295654296875, -0.261871337890625, -0.22808837890625, -0.194305419921875, -0.1605224609375, -0.126739501953125, -0.09295654296875, -0.059173583984375, -0.025390625, 0.008392333984375, 0.04217529296875, 0.075958251953125, 0.1097412109375, 0.143524169921875, 0.17730712890625, 0.211090087890625, 0.244873046875, 0.278656005859375, 0.31243896484375, 0.346221923828125, 0.3800048828125, 0.413787841796875, 0.44757080078125, 0.481353759765625, 0.51513671875, 0.548919677734375, 0.58270263671875, 0.616485595703125, 0.6502685546875, 0.684051513671875, 0.71783447265625, 0.751617431640625, 0.785400390625, 0.819183349609375, 0.85296630859375, 0.886749267578125, 0.9205322265625, 0.954315185546875, 0.98809814453125, 1.021881103515625, 1.0556640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 6.0, 4.0, 10.0, 6.0, 11.0, 20.0, 26.0, 41.0, 59.0, 90.0, 124.0, 165.0, 296.0, 388.0, 599.0, 903.0, 1322.0, 2070.0, 3231.0, 4965.0, 7650.0, 11672.0, 18476.0, 27734.0, 42064.0, 62696.0, 89930.0, 121550.0, 979118.0, 348097.0, 115483.0, 85317.0, 58969.0, 39578.0, 26107.0, 16836.0, 11080.0, 7076.0, 4592.0, 2938.0, 1968.0, 1263.0, 883.0, 563.0, 373.0, 258.0, 174.0, 122.0, 78.0, 38.0, 35.0, 28.0, 18.0, 12.0, 8.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.0828857421875, -0.08028888702392578, -0.07769203186035156, -0.07509517669677734, -0.07249832153320312, -0.0699014663696289, -0.06730461120605469, -0.06470775604248047, -0.06211090087890625, -0.05951404571533203, -0.05691719055175781, -0.054320335388183594, -0.051723480224609375, -0.049126625061035156, -0.04652976989746094, -0.04393291473388672, -0.0413360595703125, -0.03873920440673828, -0.03614234924316406, -0.033545494079589844, -0.030948638916015625, -0.028351783752441406, -0.025754928588867188, -0.02315807342529297, -0.02056121826171875, -0.01796436309814453, -0.015367507934570312, -0.012770652770996094, -0.010173797607421875, -0.007576942443847656, -0.0049800872802734375, -0.0023832321166992188, 0.000213623046875, 0.0028104782104492188, 0.0054073333740234375, 0.008004188537597656, 0.010601043701171875, 0.013197898864746094, 0.015794754028320312, 0.01839160919189453, 0.02098846435546875, 0.02358531951904297, 0.026182174682617188, 0.028779029846191406, 0.031375885009765625, 0.033972740173339844, 0.03656959533691406, 0.03916645050048828, 0.0417633056640625, 0.04436016082763672, 0.04695701599121094, 0.049553871154785156, 0.052150726318359375, 0.054747581481933594, 0.05734443664550781, 0.05994129180908203, 0.06253814697265625, 0.06513500213623047, 0.06773185729980469, 0.0703287124633789, 0.07292556762695312, 0.07552242279052734, 0.07811927795410156, 0.08071613311767578, 0.08331298828125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 1.0, 6.0, 4.0, 11.0, 10.0, 6.0, 9.0, 8.0, 11.0, 13.0, 23.0, 23.0, 27.0, 45.0, 37.0, 59.0, 75.0, 70.0, 99.0, 88.0, 67.0, 46.0, 44.0, 32.0, 31.0, 23.0, 26.0, 21.0, 16.0, 10.0, 12.0, 7.0, 4.0, 2.0, 6.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00447845458984375, -0.004344522953033447, -0.0042105913162231445, -0.004076659679412842, -0.003942728042602539, -0.0038087964057922363, -0.0036748647689819336, -0.003540933132171631, -0.003407001495361328, -0.0032730698585510254, -0.0031391382217407227, -0.00300520658493042, -0.002871274948120117, -0.0027373433113098145, -0.0026034116744995117, -0.002469480037689209, -0.0023355484008789062, -0.0022016167640686035, -0.0020676851272583008, -0.001933753490447998, -0.0017998218536376953, -0.0016658902168273926, -0.0015319585800170898, -0.0013980269432067871, -0.0012640953063964844, -0.0011301636695861816, -0.000996232032775879, -0.0008623003959655762, -0.0007283687591552734, -0.0005944371223449707, -0.00046050548553466797, -0.00032657384872436523, -0.0001926422119140625, -5.8710575103759766e-05, 7.522106170654297e-05, 0.0002091526985168457, 0.00034308433532714844, 0.00047701597213745117, 0.0006109476089477539, 0.0007448792457580566, 0.0008788108825683594, 0.0010127425193786621, 0.0011466741561889648, 0.0012806057929992676, 0.0014145374298095703, 0.001548469066619873, 0.0016824007034301758, 0.0018163323402404785, 0.0019502639770507812, 0.002084195613861084, 0.0022181272506713867, 0.0023520588874816895, 0.002485990524291992, 0.002619922161102295, 0.0027538537979125977, 0.0028877854347229004, 0.003021717071533203, 0.003155648708343506, 0.0032895803451538086, 0.0034235119819641113, 0.003557443618774414, 0.003691375255584717, 0.0038253068923950195, 0.003959238529205322, 0.004093170166015625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 11.0, 11.0, 7.0, 15.0, 19.0, 18.0, 21.0, 19.0, 29.0, 53.0, 43.0, 86.0, 92.0, 126.0, 211.0, 289.0, 490.0, 1299.0, 944716.0, 98725.0, 851.0, 475.0, 252.0, 197.0, 108.0, 101.0, 56.0, 37.0, 33.0, 24.0, 25.0, 14.0, 19.0, 13.0, 14.0, 7.0, 11.0, 12.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08233642578125, -0.07957935333251953, -0.07682228088378906, -0.0740652084350586, -0.07130813598632812, -0.06855106353759766, -0.06579399108886719, -0.06303691864013672, -0.06027984619140625, -0.05752277374267578, -0.05476570129394531, -0.052008628845214844, -0.049251556396484375, -0.046494483947753906, -0.04373741149902344, -0.04098033905029297, -0.0382232666015625, -0.03546619415283203, -0.03270912170410156, -0.029952049255371094, -0.027194976806640625, -0.024437904357910156, -0.021680831909179688, -0.01892375946044922, -0.01616668701171875, -0.013409614562988281, -0.010652542114257812, -0.007895469665527344, -0.005138397216796875, -0.0023813247680664062, 0.0003757476806640625, 0.0031328201293945312, 0.005889892578125, 0.008646965026855469, 0.011404037475585938, 0.014161109924316406, 0.016918182373046875, 0.019675254821777344, 0.022432327270507812, 0.02518939971923828, 0.02794647216796875, 0.03070354461669922, 0.03346061706542969, 0.036217689514160156, 0.038974761962890625, 0.041731834411621094, 0.04448890686035156, 0.04724597930908203, 0.0500030517578125, 0.05276012420654297, 0.05551719665527344, 0.058274269104003906, 0.061031341552734375, 0.06378841400146484, 0.06654548645019531, 0.06930255889892578, 0.07205963134765625, 0.07481670379638672, 0.07757377624511719, 0.08033084869384766, 0.08308792114257812, 0.0858449935913086, 0.08860206604003906, 0.09135913848876953, 0.0941162109375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 223.0, 794.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10006608814001083, -0.09713046997785568, -0.09419485181570053, -0.09125923365354538, -0.08832362294197083, -0.08538800477981567, -0.08245238661766052, -0.07951676845550537, -0.07658115029335022, -0.07364553213119507, -0.07070991396903992, -0.06777429580688477, -0.06483867764472961, -0.06190306320786476, -0.05896744877099991, -0.05603183060884476, -0.053096212446689606, -0.050160594284534454, -0.0472249761223793, -0.04428936168551445, -0.0413537435233593, -0.03841812536120415, -0.035482510924339294, -0.03254689276218414, -0.02961127460002899, -0.02667565643787384, -0.023740040138363838, -0.020804423838853836, -0.017868805676698685, -0.014933188445866108, -0.011997571215033531, -0.009061954915523529, -0.006126329302787781, -0.003190712071955204, -0.00025509484112262726, 0.0026805223897099495, 0.005616139620542526, 0.008551756851375103, 0.01148737408220768, 0.014422990381717682, 0.017358608543872833, 0.020294226706027985, 0.023229843005537987, 0.02616545930504799, 0.02910107746720314, 0.03203669562935829, 0.034972310066223145, 0.037907928228378296, 0.04084354639053345, 0.0437791645526886, 0.04671478271484375, 0.0496503971517086, 0.052586015313863754, 0.055521633476018906, 0.05845724791288376, 0.06139286607503891, 0.06432848423719406, 0.06726410239934921, 0.07019972056150436, 0.07313533872365952, 0.07607094943523407, 0.07900656759738922, 0.08194218575954437, 0.08487780392169952, 0.08781342208385468]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 13.0, 15.0, 31.0, 25.0, 34.0, 36.0, 42.0, 49.0, 68.0, 82.0, 87.0, 73.0, 63.0, 68.0, 48.0, 53.0, 41.0, 42.0, 32.0, 23.0, 24.0, 19.0, 7.0, 8.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004254341125488281, -0.004040941596031189, -0.0038275420665740967, -0.0036141425371170044, -0.003400743007659912, -0.00318734347820282, -0.0029739439487457275, -0.0027605444192886353, -0.002547144889831543, -0.0023337453603744507, -0.0021203458309173584, -0.0019069463014602661, -0.0016935467720031738, -0.0014801472425460815, -0.0012667477130889893, -0.001053348183631897, -0.0008399486541748047, -0.0006265491247177124, -0.0004131495952606201, -0.00019975006580352783, 1.3649463653564453e-05, 0.00022704899311065674, 0.000440448522567749, 0.0006538480520248413, 0.0008672475814819336, 0.0010806471109390259, 0.0012940466403961182, 0.0015074461698532104, 0.0017208456993103027, 0.001934245228767395, 0.0021476447582244873, 0.0023610442876815796, 0.002574443817138672, 0.002787843346595764, 0.0030012428760528564, 0.0032146424055099487, 0.003428041934967041, 0.0036414414644241333, 0.0038548409938812256, 0.004068240523338318, 0.00428164005279541, 0.0044950395822525024, 0.004708439111709595, 0.004921838641166687, 0.005135238170623779, 0.005348637700080872, 0.005562037229537964, 0.005775436758995056, 0.0059888362884521484, 0.006202235817909241, 0.006415635347366333, 0.006629034876823425, 0.006842434406280518, 0.00705583393573761, 0.007269233465194702, 0.007482632994651794, 0.007696032524108887, 0.007909432053565979, 0.008122831583023071, 0.008336231112480164, 0.008549630641937256, 0.008763030171394348, 0.00897642970085144, 0.009189829230308533, 0.009403228759765625]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 4.0, 6.0, 4.0, 5.0, 8.0, 12.0, 8.0, 12.0, 22.0, 18.0, 18.0, 19.0, 22.0, 20.0, 25.0, 27.0, 36.0, 37.0, 29.0, 32.0, 31.0, 50.0, 34.0, 47.0, 31.0, 41.0, 42.0, 30.0, 32.0, 38.0, 35.0, 28.0, 31.0, 23.0, 15.0, 22.0, 16.0, 21.0, 12.0, 14.0, 12.0, 3.0, 4.0, 10.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.771484375, -1.717926025390625, -1.66436767578125, -1.610809326171875, -1.5572509765625, -1.503692626953125, -1.45013427734375, -1.396575927734375, -1.343017578125, -1.289459228515625, -1.23590087890625, -1.182342529296875, -1.1287841796875, -1.075225830078125, -1.02166748046875, -0.968109130859375, -0.91455078125, -0.860992431640625, -0.80743408203125, -0.753875732421875, -0.7003173828125, -0.646759033203125, -0.59320068359375, -0.539642333984375, -0.486083984375, -0.432525634765625, -0.37896728515625, -0.325408935546875, -0.2718505859375, -0.218292236328125, -0.16473388671875, -0.111175537109375, -0.0576171875, -0.004058837890625, 0.04949951171875, 0.103057861328125, 0.1566162109375, 0.210174560546875, 0.26373291015625, 0.317291259765625, 0.370849609375, 0.424407958984375, 0.47796630859375, 0.531524658203125, 0.5850830078125, 0.638641357421875, 0.69219970703125, 0.745758056640625, 0.79931640625, 0.852874755859375, 0.90643310546875, 0.959991455078125, 1.0135498046875, 1.067108154296875, 1.12066650390625, 1.174224853515625, 1.227783203125, 1.281341552734375, 1.33489990234375, 1.388458251953125, 1.4420166015625, 1.495574951171875, 1.54913330078125, 1.602691650390625, 1.65625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 20.0, 31.0, 21.0, 34.0, 47.0, 54.0, 74.0, 98.0, 153.0, 186.0, 232.0, 319.0, 486.0, 627.0, 853.0, 1198.0, 1703.0, 2583.0, 3726.0, 5796.0, 9347.0, 16432.0, 34837.0, 92764.0, 262451.0, 352889.0, 152828.0, 52539.0, 22456.0, 11931.0, 7066.0, 4491.0, 2947.0, 2084.0, 1505.0, 1044.0, 702.0, 537.0, 364.0, 293.0, 218.0, 162.0, 117.0, 77.0, 61.0, 46.0, 41.0, 20.0, 21.0, 14.0, 11.0, 9.0, 7.0, 2.0, 4.0, 1.0], "bins": [-4.81640625, -4.67144775390625, -4.5264892578125, -4.38153076171875, -4.236572265625, -4.09161376953125, -3.9466552734375, -3.80169677734375, -3.65673828125, -3.51177978515625, -3.3668212890625, -3.22186279296875, -3.076904296875, -2.93194580078125, -2.7869873046875, -2.64202880859375, -2.4970703125, -2.35211181640625, -2.2071533203125, -2.06219482421875, -1.917236328125, -1.77227783203125, -1.6273193359375, -1.48236083984375, -1.33740234375, -1.19244384765625, -1.0474853515625, -0.90252685546875, -0.757568359375, -0.61260986328125, -0.4676513671875, -0.32269287109375, -0.177734375, -0.03277587890625, 0.1121826171875, 0.25714111328125, 0.402099609375, 0.54705810546875, 0.6920166015625, 0.83697509765625, 0.98193359375, 1.12689208984375, 1.2718505859375, 1.41680908203125, 1.561767578125, 1.70672607421875, 1.8516845703125, 1.99664306640625, 2.1416015625, 2.28656005859375, 2.4315185546875, 2.57647705078125, 2.721435546875, 2.86639404296875, 3.0113525390625, 3.15631103515625, 3.30126953125, 3.44622802734375, 3.5911865234375, 3.73614501953125, 3.881103515625, 4.02606201171875, 4.1710205078125, 4.31597900390625, 4.4609375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 2.0, 4.0, 6.0, 10.0, 10.0, 5.0, 12.0, 8.0, 21.0, 13.0, 18.0, 25.0, 36.0, 30.0, 35.0, 33.0, 60.0, 60.0, 93.0, 203.0, 281.0, 1295.0, 193.0, 136.0, 85.0, 65.0, 54.0, 39.0, 39.0, 31.0, 23.0, 28.0, 21.0, 7.0, 13.0, 14.0, 13.0, 10.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7734375, -5.5811767578125, -5.388916015625, -5.1966552734375, -5.00439453125, -4.8121337890625, -4.619873046875, -4.4276123046875, -4.2353515625, -4.0430908203125, -3.850830078125, -3.6585693359375, -3.46630859375, -3.2740478515625, -3.081787109375, -2.8895263671875, -2.697265625, -2.5050048828125, -2.312744140625, -2.1204833984375, -1.92822265625, -1.7359619140625, -1.543701171875, -1.3514404296875, -1.1591796875, -0.9669189453125, -0.774658203125, -0.5823974609375, -0.39013671875, -0.1978759765625, -0.005615234375, 0.1866455078125, 0.37890625, 0.5711669921875, 0.763427734375, 0.9556884765625, 1.14794921875, 1.3402099609375, 1.532470703125, 1.7247314453125, 1.9169921875, 2.1092529296875, 2.301513671875, 2.4937744140625, 2.68603515625, 2.8782958984375, 3.070556640625, 3.2628173828125, 3.455078125, 3.6473388671875, 3.839599609375, 4.0318603515625, 4.22412109375, 4.4163818359375, 4.608642578125, 4.8009033203125, 4.9931640625, 5.1854248046875, 5.377685546875, 5.5699462890625, 5.76220703125, 5.9544677734375, 6.146728515625, 6.3389892578125, 6.53125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 8.0, 4.0, 4.0, 12.0, 8.0, 13.0, 16.0, 21.0, 19.0, 16.0, 20.0, 34.0, 54.0, 64.0, 104.0, 177.0, 458.0, 1468.0, 45252.0, 3068675.0, 27089.0, 1273.0, 373.0, 168.0, 94.0, 54.0, 44.0, 25.0, 36.0, 21.0, 14.0, 16.0, 8.0, 7.0, 12.0, 8.0, 3.0, 7.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.375, -20.6494140625, -19.923828125, -19.1982421875, -18.47265625, -17.7470703125, -17.021484375, -16.2958984375, -15.5703125, -14.8447265625, -14.119140625, -13.3935546875, -12.66796875, -11.9423828125, -11.216796875, -10.4912109375, -9.765625, -9.0400390625, -8.314453125, -7.5888671875, -6.86328125, -6.1376953125, -5.412109375, -4.6865234375, -3.9609375, -3.2353515625, -2.509765625, -1.7841796875, -1.05859375, -0.3330078125, 0.392578125, 1.1181640625, 1.84375, 2.5693359375, 3.294921875, 4.0205078125, 4.74609375, 5.4716796875, 6.197265625, 6.9228515625, 7.6484375, 8.3740234375, 9.099609375, 9.8251953125, 10.55078125, 11.2763671875, 12.001953125, 12.7275390625, 13.453125, 14.1787109375, 14.904296875, 15.6298828125, 16.35546875, 17.0810546875, 17.806640625, 18.5322265625, 19.2578125, 19.9833984375, 20.708984375, 21.4345703125, 22.16015625, 22.8857421875, 23.611328125, 24.3369140625, 25.0625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 16.0, 990.0, 11.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.18864440917969, -31.492420196533203, -25.79619598388672, -20.099971771240234, -14.40374755859375, -8.707523345947266, -3.0112991333007812, 2.684925079345703, 8.381149291992188, 14.077373504638672, 19.773597717285156, 25.46982192993164, 31.166046142578125, 36.86227035522461, 42.558494567871094, 48.25471878051758, 53.95094299316406, 59.64716720581055, 65.34339141845703, 71.03961181640625, 76.73583984375, 82.43206787109375, 88.12828826904297, 93.82450866699219, 99.52073669433594, 105.21696472167969, 110.9131851196289, 116.60940551757812, 122.30563354492188, 128.00186157226562, 133.69808959960938, 139.39430236816406, 145.09054565429688, 150.78677368164062, 156.48300170898438, 162.17921447753906, 167.8754425048828, 173.57167053222656, 179.26788330078125, 184.964111328125, 190.66033935546875, 196.3565673828125, 202.05279541015625, 207.74900817871094, 213.4452362060547, 219.14146423339844, 224.83767700195312, 230.53390502929688, 236.23013305664062, 241.92636108398438, 247.62258911132812, 253.3188018798828, 259.0150146484375, 264.71124267578125, 270.407470703125, 276.10369873046875, 281.7999267578125, 287.49615478515625, 293.1923828125, 298.88861083984375, 304.5848388671875, 310.2810363769531, 315.9772644042969, 321.6734924316406, 327.3697204589844]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 1.0, 8.0, 8.0, 3.0, 8.0, 8.0, 17.0, 9.0, 15.0, 12.0, 14.0, 21.0, 18.0, 25.0, 27.0, 27.0, 37.0, 43.0, 45.0, 46.0, 43.0, 40.0, 54.0, 38.0, 38.0, 40.0, 39.0, 32.0, 30.0, 30.0, 27.0, 21.0, 18.0, 25.0, 23.0, 13.0, 15.0, 15.0, 11.0, 10.0, 16.0, 4.0, 9.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-17.912866592407227, -17.33602523803711, -16.759183883666992, -16.182342529296875, -15.605502128601074, -15.028660774230957, -14.451820373535156, -13.874979019165039, -13.298137664794922, -12.721296310424805, -12.144454956054688, -11.567614555358887, -10.99077320098877, -10.413931846618652, -9.837091445922852, -9.260250091552734, -8.683408737182617, -8.1065673828125, -7.529726505279541, -6.952885627746582, -6.376044273376465, -5.799202919006348, -5.222362041473389, -4.64552116394043, -4.0686798095703125, -3.4918386936187744, -2.9149975776672363, -2.3381564617156982, -1.7613153457641602, -1.184474229812622, -0.607633113861084, -0.030792236328125, 0.5460491180419922, 1.1228902339935303, 1.6997313499450684, 2.2765724658966064, 2.8534135818481445, 3.4302546977996826, 4.007095813751221, 4.58393669128418, 5.160778045654297, 5.737619400024414, 6.314460277557373, 6.891301155090332, 7.468142509460449, 8.044983863830566, 8.621824264526367, 9.198665618896484, 9.775506973266602, 10.352348327636719, 10.929189682006836, 11.506030082702637, 12.082871437072754, 12.659712791442871, 13.236553192138672, 13.813394546508789, 14.390235900878906, 14.967077255249023, 15.54391860961914, 16.120759963989258, 16.697601318359375, 17.27444076538086, 17.851282119750977, 18.428123474121094, 19.00496482849121]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 5.0, 4.0, 9.0, 11.0, 11.0, 12.0, 16.0, 14.0, 13.0, 17.0, 21.0, 21.0, 30.0, 30.0, 33.0, 33.0, 31.0, 45.0, 42.0, 46.0, 45.0, 36.0, 36.0, 29.0, 43.0, 43.0, 34.0, 44.0, 28.0, 42.0, 21.0, 21.0, 17.0, 24.0, 11.0, 18.0, 13.0, 13.0, 10.0, 5.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.056640625, -1.9964141845703125, -1.936187744140625, -1.8759613037109375, -1.81573486328125, -1.7555084228515625, -1.695281982421875, -1.6350555419921875, -1.5748291015625, -1.5146026611328125, -1.454376220703125, -1.3941497802734375, -1.33392333984375, -1.2736968994140625, -1.213470458984375, -1.1532440185546875, -1.093017578125, -1.0327911376953125, -0.972564697265625, -0.9123382568359375, -0.85211181640625, -0.7918853759765625, -0.731658935546875, -0.6714324951171875, -0.6112060546875, -0.5509796142578125, -0.490753173828125, -0.4305267333984375, -0.37030029296875, -0.3100738525390625, -0.249847412109375, -0.1896209716796875, -0.12939453125, -0.0691680908203125, -0.008941650390625, 0.0512847900390625, 0.11151123046875, 0.1717376708984375, 0.231964111328125, 0.2921905517578125, 0.3524169921875, 0.4126434326171875, 0.472869873046875, 0.5330963134765625, 0.59332275390625, 0.6535491943359375, 0.713775634765625, 0.7740020751953125, 0.834228515625, 0.8944549560546875, 0.954681396484375, 1.0149078369140625, 1.07513427734375, 1.1353607177734375, 1.195587158203125, 1.2558135986328125, 1.3160400390625, 1.3762664794921875, 1.436492919921875, 1.4967193603515625, 1.55694580078125, 1.6171722412109375, 1.677398681640625, 1.7376251220703125, 1.7978515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 4.0, 9.0, 9.0, 10.0, 14.0, 25.0, 16.0, 33.0, 38.0, 53.0, 56.0, 76.0, 114.0, 136.0, 190.0, 239.0, 372.0, 667.0, 1309.0, 3744.0, 14348.0, 86752.0, 1009503.0, 2735835.0, 293498.0, 34926.0, 7347.0, 2291.0, 956.0, 499.0, 321.0, 226.0, 164.0, 107.0, 95.0, 63.0, 58.0, 55.0, 25.0, 16.0, 12.0, 14.0, 15.0, 8.0, 5.0, 4.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.296875, -7.0557861328125, -6.814697265625, -6.5736083984375, -6.33251953125, -6.0914306640625, -5.850341796875, -5.6092529296875, -5.3681640625, -5.1270751953125, -4.885986328125, -4.6448974609375, -4.40380859375, -4.1627197265625, -3.921630859375, -3.6805419921875, -3.439453125, -3.1983642578125, -2.957275390625, -2.7161865234375, -2.47509765625, -2.2340087890625, -1.992919921875, -1.7518310546875, -1.5107421875, -1.2696533203125, -1.028564453125, -0.7874755859375, -0.54638671875, -0.3052978515625, -0.064208984375, 0.1768798828125, 0.41796875, 0.6590576171875, 0.900146484375, 1.1412353515625, 1.38232421875, 1.6234130859375, 1.864501953125, 2.1055908203125, 2.3466796875, 2.5877685546875, 2.828857421875, 3.0699462890625, 3.31103515625, 3.5521240234375, 3.793212890625, 4.0343017578125, 4.275390625, 4.5164794921875, 4.757568359375, 4.9986572265625, 5.23974609375, 5.4808349609375, 5.721923828125, 5.9630126953125, 6.2041015625, 6.4451904296875, 6.686279296875, 6.9273681640625, 7.16845703125, 7.4095458984375, 7.650634765625, 7.8917236328125, 8.1328125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 16.0, 14.0, 27.0, 33.0, 58.0, 54.0, 119.0, 163.0, 187.0, 309.0, 424.0, 480.0, 552.0, 454.0, 335.0, 261.0, 173.0, 136.0, 82.0, 60.0, 33.0, 26.0, 23.0, 15.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.30743408203125, -7.0797119140625, -6.85198974609375, -6.624267578125, -6.39654541015625, -6.1688232421875, -5.94110107421875, -5.71337890625, -5.48565673828125, -5.2579345703125, -5.03021240234375, -4.802490234375, -4.57476806640625, -4.3470458984375, -4.11932373046875, -3.8916015625, -3.66387939453125, -3.4361572265625, -3.20843505859375, -2.980712890625, -2.75299072265625, -2.5252685546875, -2.29754638671875, -2.06982421875, -1.84210205078125, -1.6143798828125, -1.38665771484375, -1.158935546875, -0.93121337890625, -0.7034912109375, -0.47576904296875, -0.248046875, -0.02032470703125, 0.2073974609375, 0.43511962890625, 0.662841796875, 0.89056396484375, 1.1182861328125, 1.34600830078125, 1.57373046875, 1.80145263671875, 2.0291748046875, 2.25689697265625, 2.484619140625, 2.71234130859375, 2.9400634765625, 3.16778564453125, 3.3955078125, 3.62322998046875, 3.8509521484375, 4.07867431640625, 4.306396484375, 4.53411865234375, 4.7618408203125, 4.98956298828125, 5.21728515625, 5.44500732421875, 5.6727294921875, 5.90045166015625, 6.128173828125, 6.35589599609375, 6.5836181640625, 6.81134033203125, 7.0390625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 11.0, 17.0, 26.0, 39.0, 104.0, 139.0, 310.0, 635.0, 1623.0, 4740.0, 34518.0, 791175.0, 3156677.0, 186934.0, 12707.0, 2775.0, 987.0, 428.0, 201.0, 103.0, 64.0, 29.0, 15.0, 8.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8984375, -15.3902587890625, -14.882080078125, -14.3739013671875, -13.86572265625, -13.3575439453125, -12.849365234375, -12.3411865234375, -11.8330078125, -11.3248291015625, -10.816650390625, -10.3084716796875, -9.80029296875, -9.2921142578125, -8.783935546875, -8.2757568359375, -7.767578125, -7.2593994140625, -6.751220703125, -6.2430419921875, -5.73486328125, -5.2266845703125, -4.718505859375, -4.2103271484375, -3.7021484375, -3.1939697265625, -2.685791015625, -2.1776123046875, -1.66943359375, -1.1612548828125, -0.653076171875, -0.1448974609375, 0.36328125, 0.8714599609375, 1.379638671875, 1.8878173828125, 2.39599609375, 2.9041748046875, 3.412353515625, 3.9205322265625, 4.4287109375, 4.9368896484375, 5.445068359375, 5.9532470703125, 6.46142578125, 6.9696044921875, 7.477783203125, 7.9859619140625, 8.494140625, 9.0023193359375, 9.510498046875, 10.0186767578125, 10.52685546875, 11.0350341796875, 11.543212890625, 12.0513916015625, 12.5595703125, 13.0677490234375, 13.575927734375, 14.0841064453125, 14.59228515625, 15.1004638671875, 15.608642578125, 16.1168212890625, 16.625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 9.0, 185.0, 564.0, 234.0, 23.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.34942626953125, -60.21497344970703, -56.08051681518555, -51.94606399536133, -47.811607360839844, -43.677154541015625, -39.542701721191406, -35.40824890136719, -31.273792266845703, -27.13933753967285, -23.0048828125, -18.87042999267578, -14.73597526550293, -10.601520538330078, -6.467067718505859, -2.332612991333008, 1.8018417358398438, 5.936295986175537, 10.07075023651123, 14.205204010009766, 18.339658737182617, 22.47411346435547, 26.608566284179688, 30.74302101135254, 34.87747573852539, 39.01192855834961, 43.146385192871094, 47.28083801269531, 51.41529083251953, 55.549747467041016, 59.684200286865234, 63.81865692138672, 67.95310974121094, 72.08756256103516, 76.22201538085938, 80.35647583007812, 84.49092864990234, 88.62538146972656, 92.75983428955078, 96.894287109375, 101.02874755859375, 105.16320037841797, 109.29765319824219, 113.43211364746094, 117.56656646728516, 121.70101928710938, 125.8354721069336, 129.9699249267578, 134.1043701171875, 138.23883056640625, 142.37327575683594, 146.5077362060547, 150.64218139648438, 154.77664184570312, 158.91110229492188, 163.04554748535156, 167.1800079345703, 171.31446838378906, 175.44891357421875, 179.5833740234375, 183.7178192138672, 187.85227966308594, 191.98672485351562, 196.12118530273438, 200.25564575195312]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 10.0, 9.0, 10.0, 10.0, 12.0, 12.0, 16.0, 24.0, 25.0, 18.0, 21.0, 24.0, 28.0, 30.0, 21.0, 36.0, 35.0, 39.0, 33.0, 44.0, 34.0, 48.0, 46.0, 40.0, 38.0, 32.0, 37.0, 36.0, 23.0, 24.0, 29.0, 24.0, 24.0, 18.0, 17.0, 19.0, 15.0, 6.0, 11.0, 6.0, 7.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.43444061279297, -17.770204544067383, -17.105968475341797, -16.44173240661621, -15.777497291564941, -15.113261222839355, -14.449026107788086, -13.7847900390625, -13.120553970336914, -12.456317901611328, -11.792081832885742, -11.127846717834473, -10.463610649108887, -9.7993745803833, -9.135139465332031, -8.470903396606445, -7.806667327880859, -7.142431259155273, -6.478195667266846, -5.813960075378418, -5.149724006652832, -4.485487937927246, -3.8212523460388184, -3.1570167541503906, -2.4927806854248047, -1.8285448551177979, -1.164309024810791, -0.5000731945037842, 0.16416263580322266, 0.8283984661102295, 1.4926342964172363, 2.156869888305664, 2.82110595703125, 3.485341787338257, 4.149577617645264, 4.813813209533691, 5.478049278259277, 6.142285346984863, 6.806520938873291, 7.470756530761719, 8.134992599487305, 8.79922866821289, 9.463464736938477, 10.127699851989746, 10.791935920715332, 11.456171989440918, 12.120407104492188, 12.784643173217773, 13.44887924194336, 14.113115310668945, 14.777351379394531, 15.4415864944458, 16.105823516845703, 16.770057678222656, 17.434293746948242, 18.098529815673828, 18.762765884399414, 19.427001953125, 20.091238021850586, 20.755474090576172, 21.419708251953125, 22.08394432067871, 22.748180389404297, 23.412416458129883, 24.07665252685547]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 8.0, 5.0, 6.0, 7.0, 4.0, 13.0, 17.0, 19.0, 16.0, 17.0, 19.0, 24.0, 25.0, 30.0, 30.0, 36.0, 34.0, 42.0, 31.0, 49.0, 43.0, 36.0, 45.0, 40.0, 28.0, 34.0, 40.0, 43.0, 36.0, 33.0, 26.0, 27.0, 22.0, 17.0, 19.0, 15.0, 11.0, 12.0, 10.0, 12.0, 7.0, 4.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-2.1484375, -2.0880889892578125, -2.027740478515625, -1.9673919677734375, -1.90704345703125, -1.8466949462890625, -1.786346435546875, -1.7259979248046875, -1.6656494140625, -1.6053009033203125, -1.544952392578125, -1.4846038818359375, -1.42425537109375, -1.3639068603515625, -1.303558349609375, -1.2432098388671875, -1.182861328125, -1.1225128173828125, -1.062164306640625, -1.0018157958984375, -0.94146728515625, -0.8811187744140625, -0.820770263671875, -0.7604217529296875, -0.7000732421875, -0.6397247314453125, -0.579376220703125, -0.5190277099609375, -0.45867919921875, -0.3983306884765625, -0.337982177734375, -0.2776336669921875, -0.21728515625, -0.1569366455078125, -0.096588134765625, -0.0362396240234375, 0.02410888671875, 0.0844573974609375, 0.144805908203125, 0.2051544189453125, 0.2655029296875, 0.3258514404296875, 0.386199951171875, 0.4465484619140625, 0.50689697265625, 0.5672454833984375, 0.627593994140625, 0.6879425048828125, 0.748291015625, 0.8086395263671875, 0.868988037109375, 0.9293365478515625, 0.98968505859375, 1.0500335693359375, 1.110382080078125, 1.1707305908203125, 1.2310791015625, 1.2914276123046875, 1.351776123046875, 1.4121246337890625, 1.47247314453125, 1.5328216552734375, 1.593170166015625, 1.6535186767578125, 1.7138671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 3.0, 7.0, 13.0, 13.0, 16.0, 32.0, 52.0, 62.0, 116.0, 164.0, 247.0, 352.0, 591.0, 852.0, 1297.0, 1962.0, 3019.0, 4765.0, 7474.0, 12053.0, 18645.0, 29798.0, 46195.0, 72207.0, 108329.0, 150231.0, 174010.0, 139787.0, 97493.0, 64958.0, 41244.0, 26483.0, 16597.0, 10596.0, 6726.0, 4348.0, 2747.0, 1777.0, 1087.0, 755.0, 473.0, 312.0, 213.0, 152.0, 97.0, 70.0, 51.0, 23.0, 29.0, 10.0, 9.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.1514892578125, -0.14694976806640625, -0.1424102783203125, -0.13787078857421875, -0.133331298828125, -0.12879180908203125, -0.1242523193359375, -0.11971282958984375, -0.11517333984375, -0.11063385009765625, -0.1060943603515625, -0.10155487060546875, -0.097015380859375, -0.09247589111328125, -0.0879364013671875, -0.08339691162109375, -0.078857421875, -0.07431793212890625, -0.0697784423828125, -0.06523895263671875, -0.060699462890625, -0.05615997314453125, -0.0516204833984375, -0.04708099365234375, -0.04254150390625, -0.03800201416015625, -0.0334625244140625, -0.02892303466796875, -0.024383544921875, -0.01984405517578125, -0.0153045654296875, -0.01076507568359375, -0.0062255859375, -0.00168609619140625, 0.0028533935546875, 0.00739288330078125, 0.011932373046875, 0.01647186279296875, 0.0210113525390625, 0.02555084228515625, 0.03009033203125, 0.03462982177734375, 0.0391693115234375, 0.04370880126953125, 0.048248291015625, 0.05278778076171875, 0.0573272705078125, 0.06186676025390625, 0.06640625, 0.07094573974609375, 0.0754852294921875, 0.08002471923828125, 0.084564208984375, 0.08910369873046875, 0.0936431884765625, 0.09818267822265625, 0.10272216796875, 0.10726165771484375, 0.1118011474609375, 0.11634063720703125, 0.120880126953125, 0.12541961669921875, 0.1299591064453125, 0.13449859619140625, 0.1390380859375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 1.0, 6.0, 9.0, 7.0, 11.0, 11.0, 20.0, 14.0, 14.0, 22.0, 24.0, 27.0, 32.0, 31.0, 32.0, 26.0, 37.0, 41.0, 41.0, 46.0, 40.0, 1059.0, 41.0, 54.0, 41.0, 30.0, 41.0, 23.0, 23.0, 34.0, 24.0, 22.0, 22.0, 16.0, 8.0, 16.0, 15.0, 13.0, 12.0, 8.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.15234375, -1.1144866943359375, -1.076629638671875, -1.0387725830078125, -1.00091552734375, -0.9630584716796875, -0.925201416015625, -0.8873443603515625, -0.8494873046875, -0.8116302490234375, -0.773773193359375, -0.7359161376953125, -0.69805908203125, -0.6602020263671875, -0.622344970703125, -0.5844879150390625, -0.546630859375, -0.5087738037109375, -0.470916748046875, -0.4330596923828125, -0.39520263671875, -0.3573455810546875, -0.319488525390625, -0.2816314697265625, -0.2437744140625, -0.2059173583984375, -0.168060302734375, -0.1302032470703125, -0.09234619140625, -0.0544891357421875, -0.016632080078125, 0.0212249755859375, 0.05908203125, 0.0969390869140625, 0.134796142578125, 0.1726531982421875, 0.21051025390625, 0.2483673095703125, 0.286224365234375, 0.3240814208984375, 0.3619384765625, 0.3997955322265625, 0.437652587890625, 0.4755096435546875, 0.51336669921875, 0.5512237548828125, 0.589080810546875, 0.6269378662109375, 0.664794921875, 0.7026519775390625, 0.740509033203125, 0.7783660888671875, 0.81622314453125, 0.8540802001953125, 0.891937255859375, 0.9297943115234375, 0.9676513671875, 1.0055084228515625, 1.043365478515625, 1.0812225341796875, 1.11907958984375, 1.1569366455078125, 1.194793701171875, 1.2326507568359375, 1.2705078125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 8.0, 16.0, 23.0, 47.0, 49.0, 87.0, 121.0, 196.0, 259.0, 441.0, 663.0, 953.0, 1463.0, 2219.0, 3434.0, 5250.0, 8079.0, 12198.0, 18608.0, 28453.0, 42461.0, 62764.0, 89319.0, 121533.0, 962313.0, 359881.0, 115088.0, 84708.0, 59468.0, 39972.0, 26812.0, 17309.0, 11500.0, 7359.0, 4858.0, 3186.0, 2015.0, 1292.0, 913.0, 601.0, 376.0, 237.0, 185.0, 145.0, 97.0, 59.0, 34.0, 22.0, 26.0, 13.0, 8.0, 7.0, 2.0, 2.0], "bins": [-0.09521484375, -0.09248828887939453, -0.08976173400878906, -0.0870351791381836, -0.08430862426757812, -0.08158206939697266, -0.07885551452636719, -0.07612895965576172, -0.07340240478515625, -0.07067584991455078, -0.06794929504394531, -0.06522274017333984, -0.062496185302734375, -0.059769630432128906, -0.05704307556152344, -0.05431652069091797, -0.0515899658203125, -0.04886341094970703, -0.04613685607910156, -0.043410301208496094, -0.040683746337890625, -0.037957191467285156, -0.03523063659667969, -0.03250408172607422, -0.02977752685546875, -0.02705097198486328, -0.024324417114257812, -0.021597862243652344, -0.018871307373046875, -0.016144752502441406, -0.013418197631835938, -0.010691642761230469, -0.007965087890625, -0.005238533020019531, -0.0025119781494140625, 0.00021457672119140625, 0.002941131591796875, 0.005667686462402344, 0.008394241333007812, 0.011120796203613281, 0.01384735107421875, 0.01657390594482422, 0.019300460815429688, 0.022027015686035156, 0.024753570556640625, 0.027480125427246094, 0.030206680297851562, 0.03293323516845703, 0.0356597900390625, 0.03838634490966797, 0.04111289978027344, 0.043839454650878906, 0.046566009521484375, 0.049292564392089844, 0.05201911926269531, 0.05474567413330078, 0.05747222900390625, 0.06019878387451172, 0.06292533874511719, 0.06565189361572266, 0.06837844848632812, 0.0711050033569336, 0.07383155822753906, 0.07655811309814453, 0.07928466796875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 8.0, 6.0, 6.0, 6.0, 6.0, 7.0, 12.0, 24.0, 33.0, 29.0, 46.0, 59.0, 115.0, 113.0, 113.0, 104.0, 94.0, 41.0, 51.0, 27.0, 27.0, 21.0, 13.0, 6.0, 6.0, 5.0, 6.0, 4.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009185791015625, -0.008950889110565186, -0.008715987205505371, -0.008481085300445557, -0.008246183395385742, -0.008011281490325928, -0.007776379585266113, -0.007541477680206299, -0.007306575775146484, -0.00707167387008667, -0.0068367719650268555, -0.006601870059967041, -0.0063669681549072266, -0.006132066249847412, -0.005897164344787598, -0.005662262439727783, -0.005427360534667969, -0.005192458629608154, -0.00495755672454834, -0.004722654819488525, -0.004487752914428711, -0.0042528510093688965, -0.004017949104309082, -0.0037830471992492676, -0.003548145294189453, -0.0033132433891296387, -0.0030783414840698242, -0.0028434395790100098, -0.0026085376739501953, -0.002373635768890381, -0.0021387338638305664, -0.001903831958770752, -0.0016689300537109375, -0.001434028148651123, -0.0011991262435913086, -0.0009642243385314941, -0.0007293224334716797, -0.0004944205284118652, -0.0002595186233520508, -2.4616718292236328e-05, 0.00021028518676757812, 0.0004451870918273926, 0.000680088996887207, 0.0009149909019470215, 0.001149892807006836, 0.0013847947120666504, 0.0016196966171264648, 0.0018545985221862793, 0.0020895004272460938, 0.002324402332305908, 0.0025593042373657227, 0.002794206142425537, 0.0030291080474853516, 0.003264009952545166, 0.0034989118576049805, 0.003733813762664795, 0.003968715667724609, 0.004203617572784424, 0.004438519477844238, 0.004673421382904053, 0.004908323287963867, 0.005143225193023682, 0.005378127098083496, 0.0056130290031433105, 0.005847930908203125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 7.0, 5.0, 3.0, 7.0, 4.0, 13.0, 11.0, 22.0, 24.0, 23.0, 31.0, 46.0, 71.0, 97.0, 189.0, 408.0, 1771.0, 1042453.0, 2436.0, 405.0, 187.0, 98.0, 62.0, 44.0, 42.0, 17.0, 14.0, 13.0, 11.0, 7.0, 13.0, 6.0, 1.0, 6.0, 1.0, 0.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138916015625, -0.1336822509765625, -0.128448486328125, -0.1232147216796875, -0.11798095703125, -0.1127471923828125, -0.107513427734375, -0.1022796630859375, -0.0970458984375, -0.0918121337890625, -0.086578369140625, -0.0813446044921875, -0.07611083984375, -0.0708770751953125, -0.065643310546875, -0.0604095458984375, -0.05517578125, -0.0499420166015625, -0.044708251953125, -0.0394744873046875, -0.03424072265625, -0.0290069580078125, -0.023773193359375, -0.0185394287109375, -0.0133056640625, -0.0080718994140625, -0.002838134765625, 0.0023956298828125, 0.00762939453125, 0.0128631591796875, 0.018096923828125, 0.0233306884765625, 0.028564453125, 0.0337982177734375, 0.039031982421875, 0.0442657470703125, 0.04949951171875, 0.0547332763671875, 0.059967041015625, 0.0652008056640625, 0.0704345703125, 0.0756683349609375, 0.080902099609375, 0.0861358642578125, 0.09136962890625, 0.0966033935546875, 0.101837158203125, 0.1070709228515625, 0.1123046875, 0.1175384521484375, 0.122772216796875, 0.1280059814453125, 0.13323974609375, 0.1384735107421875, 0.143707275390625, 0.1489410400390625, 0.1541748046875, 0.1594085693359375, 0.164642333984375, 0.1698760986328125, 0.17510986328125, 0.1803436279296875, 0.185577392578125, 0.1908111572265625, 0.196044921875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1009.0, 7.0, 0.0, 0.0, 1.0], "bins": [-0.2553044557571411, -0.2510179281234741, -0.24673143029212952, -0.24244491755962372, -0.23815840482711792, -0.23387187719345093, -0.22958537936210632, -0.22529885172843933, -0.22101233899593353, -0.21672582626342773, -0.21243931353092194, -0.20815280079841614, -0.20386628806591034, -0.19957977533340454, -0.19529324769973755, -0.19100673496723175, -0.18672022223472595, -0.18243370950222015, -0.17814719676971436, -0.17386068403720856, -0.16957417130470276, -0.16528764367103577, -0.16100114583969116, -0.15671461820602417, -0.15242812037467957, -0.14814160764217377, -0.14385509490966797, -0.13956858217716217, -0.13528206944465637, -0.13099554181098938, -0.12670904397964478, -0.12242252379655838, -0.11813601106405258, -0.11384949833154678, -0.10956298559904099, -0.10527646541595459, -0.10098995268344879, -0.096703439950943, -0.0924169272184372, -0.0881304144859314, -0.0838439017534256, -0.0795573890209198, -0.075270876288414, -0.0709843635559082, -0.06669784337282181, -0.06241133064031601, -0.05812481790781021, -0.05383830517530441, -0.04955178499221802, -0.04526527225971222, -0.04097875580191612, -0.036692243069410324, -0.03240572661161423, -0.02811921387910843, -0.02383270114660263, -0.019546186551451683, -0.015259671956300735, -0.010973157361149788, -0.006686643697321415, -0.002400130033493042, 0.0018863845616579056, 0.006172899156808853, 0.010459411889314651, 0.014745926484465599, 0.019032441079616547]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 10.0, 12.0, 12.0, 25.0, 23.0, 35.0, 47.0, 40.0, 46.0, 68.0, 62.0, 58.0, 67.0, 57.0, 51.0, 50.0, 48.0, 45.0, 41.0, 24.0, 29.0, 32.0, 28.0, 16.0, 23.0, 14.0, 9.0, 11.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005879044532775879, -0.005641903728246689, -0.005404762923717499, -0.005167622119188309, -0.004930481314659119, -0.004693340510129929, -0.0044561997056007385, -0.0042190589010715485, -0.003981918096542358, -0.0037447772920131683, -0.0035076364874839783, -0.003270495682954788, -0.003033354878425598, -0.002796214073896408, -0.002559073269367218, -0.002321932464838028, -0.002084791660308838, -0.0018476508557796478, -0.0016105100512504578, -0.0013733692467212677, -0.0011362284421920776, -0.0008990876376628876, -0.0006619468331336975, -0.00042480602860450745, -0.00018766522407531738, 4.947558045387268e-05, 0.00028661638498306274, 0.0005237571895122528, 0.0007608979940414429, 0.000998038798570633, 0.001235179603099823, 0.001472320407629013, 0.0017094612121582031, 0.0019466020166873932, 0.0021837428212165833, 0.0024208836257457733, 0.0026580244302749634, 0.0028951652348041534, 0.0031323060393333435, 0.0033694468438625336, 0.0036065876483917236, 0.0038437284529209137, 0.004080869257450104, 0.004318010061979294, 0.004555150866508484, 0.004792291671037674, 0.005029432475566864, 0.005266573280096054, 0.005503714084625244, 0.005740854889154434, 0.005977995693683624, 0.006215136498212814, 0.006452277302742004, 0.0066894181072711945, 0.0069265589118003845, 0.007163699716329575, 0.007400840520858765, 0.007637981325387955, 0.007875122129917145, 0.008112262934446335, 0.008349403738975525, 0.008586544543504715, 0.008823685348033905, 0.009060826152563095, 0.009297966957092285]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 8.0, 5.0, 6.0, 7.0, 4.0, 13.0, 17.0, 19.0, 16.0, 17.0, 19.0, 24.0, 25.0, 30.0, 30.0, 36.0, 34.0, 42.0, 31.0, 49.0, 43.0, 36.0, 45.0, 40.0, 28.0, 34.0, 41.0, 42.0, 36.0, 33.0, 26.0, 27.0, 22.0, 17.0, 19.0, 15.0, 11.0, 12.0, 10.0, 12.0, 7.0, 4.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-2.1484375, -2.0880889892578125, -2.027740478515625, -1.9673919677734375, -1.90704345703125, -1.8466949462890625, -1.786346435546875, -1.7259979248046875, -1.6656494140625, -1.6053009033203125, -1.544952392578125, -1.4846038818359375, -1.42425537109375, -1.3639068603515625, -1.303558349609375, -1.2432098388671875, -1.182861328125, -1.1225128173828125, -1.062164306640625, -1.0018157958984375, -0.94146728515625, -0.8811187744140625, -0.820770263671875, -0.7604217529296875, -0.7000732421875, -0.6397247314453125, -0.579376220703125, -0.5190277099609375, -0.45867919921875, -0.3983306884765625, -0.337982177734375, -0.2776336669921875, -0.21728515625, -0.1569366455078125, -0.096588134765625, -0.0362396240234375, 0.02410888671875, 0.0844573974609375, 0.144805908203125, 0.2051544189453125, 0.2655029296875, 0.3258514404296875, 0.386199951171875, 0.4465484619140625, 0.50689697265625, 0.5672454833984375, 0.627593994140625, 0.6879425048828125, 0.748291015625, 0.8086395263671875, 0.868988037109375, 0.9293365478515625, 0.98968505859375, 1.0500335693359375, 1.110382080078125, 1.1707305908203125, 1.2310791015625, 1.2914276123046875, 1.351776123046875, 1.4121246337890625, 1.47247314453125, 1.5328216552734375, 1.593170166015625, 1.6535186767578125, 1.7138671875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 6.0, 15.0, 6.0, 10.0, 25.0, 31.0, 34.0, 38.0, 69.0, 95.0, 142.0, 190.0, 308.0, 444.0, 690.0, 1130.0, 2149.0, 4236.0, 9189.0, 20676.0, 47248.0, 108628.0, 219055.0, 288835.0, 186593.0, 88453.0, 38236.0, 16556.0, 7320.0, 3550.0, 1757.0, 1008.0, 633.0, 395.0, 256.0, 164.0, 109.0, 73.0, 56.0, 44.0, 36.0, 25.0, 21.0, 7.0, 10.0, 3.0, 5.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0], "bins": [-2.39453125, -2.324859619140625, -2.25518798828125, -2.185516357421875, -2.1158447265625, -2.046173095703125, -1.97650146484375, -1.906829833984375, -1.837158203125, -1.767486572265625, -1.69781494140625, -1.628143310546875, -1.5584716796875, -1.488800048828125, -1.41912841796875, -1.349456787109375, -1.27978515625, -1.210113525390625, -1.14044189453125, -1.070770263671875, -1.0010986328125, -0.931427001953125, -0.86175537109375, -0.792083740234375, -0.722412109375, -0.652740478515625, -0.58306884765625, -0.513397216796875, -0.4437255859375, -0.374053955078125, -0.30438232421875, -0.234710693359375, -0.1650390625, -0.095367431640625, -0.02569580078125, 0.043975830078125, 0.1136474609375, 0.183319091796875, 0.25299072265625, 0.322662353515625, 0.392333984375, 0.462005615234375, 0.53167724609375, 0.601348876953125, 0.6710205078125, 0.740692138671875, 0.81036376953125, 0.880035400390625, 0.94970703125, 1.019378662109375, 1.08905029296875, 1.158721923828125, 1.2283935546875, 1.298065185546875, 1.36773681640625, 1.437408447265625, 1.507080078125, 1.576751708984375, 1.64642333984375, 1.716094970703125, 1.7857666015625, 1.855438232421875, 1.92510986328125, 1.994781494140625, 2.064453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 13.0, 11.0, 15.0, 17.0, 17.0, 22.0, 23.0, 31.0, 28.0, 43.0, 37.0, 55.0, 71.0, 99.0, 145.0, 236.0, 1339.0, 218.0, 125.0, 86.0, 56.0, 40.0, 39.0, 42.0, 31.0, 30.0, 17.0, 27.0, 21.0, 11.0, 20.0, 8.0, 16.0, 7.0, 8.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.8671875, -6.6549072265625, -6.442626953125, -6.2303466796875, -6.01806640625, -5.8057861328125, -5.593505859375, -5.3812255859375, -5.1689453125, -4.9566650390625, -4.744384765625, -4.5321044921875, -4.31982421875, -4.1075439453125, -3.895263671875, -3.6829833984375, -3.470703125, -3.2584228515625, -3.046142578125, -2.8338623046875, -2.62158203125, -2.4093017578125, -2.197021484375, -1.9847412109375, -1.7724609375, -1.5601806640625, -1.347900390625, -1.1356201171875, -0.92333984375, -0.7110595703125, -0.498779296875, -0.2864990234375, -0.07421875, 0.1380615234375, 0.350341796875, 0.5626220703125, 0.77490234375, 0.9871826171875, 1.199462890625, 1.4117431640625, 1.6240234375, 1.8363037109375, 2.048583984375, 2.2608642578125, 2.47314453125, 2.6854248046875, 2.897705078125, 3.1099853515625, 3.322265625, 3.5345458984375, 3.746826171875, 3.9591064453125, 4.17138671875, 4.3836669921875, 4.595947265625, 4.8082275390625, 5.0205078125, 5.2327880859375, 5.445068359375, 5.6573486328125, 5.86962890625, 6.0819091796875, 6.294189453125, 6.5064697265625, 6.71875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 9.0, 12.0, 5.0, 23.0, 10.0, 20.0, 16.0, 38.0, 40.0, 49.0, 53.0, 81.0, 146.0, 239.0, 440.0, 1196.0, 5456.0, 161564.0, 2896274.0, 74126.0, 3914.0, 931.0, 372.0, 201.0, 114.0, 64.0, 64.0, 51.0, 47.0, 24.0, 17.0, 21.0, 11.0, 14.0, 13.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-14.0, -13.568115234375, -13.13623046875, -12.704345703125, -12.2724609375, -11.840576171875, -11.40869140625, -10.976806640625, -10.544921875, -10.113037109375, -9.68115234375, -9.249267578125, -8.8173828125, -8.385498046875, -7.95361328125, -7.521728515625, -7.08984375, -6.657958984375, -6.22607421875, -5.794189453125, -5.3623046875, -4.930419921875, -4.49853515625, -4.066650390625, -3.634765625, -3.202880859375, -2.77099609375, -2.339111328125, -1.9072265625, -1.475341796875, -1.04345703125, -0.611572265625, -0.1796875, 0.252197265625, 0.68408203125, 1.115966796875, 1.5478515625, 1.979736328125, 2.41162109375, 2.843505859375, 3.275390625, 3.707275390625, 4.13916015625, 4.571044921875, 5.0029296875, 5.434814453125, 5.86669921875, 6.298583984375, 6.73046875, 7.162353515625, 7.59423828125, 8.026123046875, 8.4580078125, 8.889892578125, 9.32177734375, 9.753662109375, 10.185546875, 10.617431640625, 11.04931640625, 11.481201171875, 11.9130859375, 12.344970703125, 12.77685546875, 13.208740234375, 13.640625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 12.0, 333.0, 617.0, 51.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.640289306640625, -40.293643951416016, -37.946998596191406, -35.60034942626953, -33.25370407104492, -30.907058715820312, -28.56041145324707, -26.213764190673828, -23.86711883544922, -21.52047348022461, -19.173826217651367, -16.827178955078125, -14.480533599853516, -12.13388729095459, -9.787240982055664, -7.440593719482422, -5.0939483642578125, -2.7473020553588867, -0.40065574645996094, 1.9459905624389648, 4.292636871337891, 6.639283180236816, 8.985929489135742, 11.332576751708984, 13.679222106933594, 16.025867462158203, 18.372514724731445, 20.719161987304688, 23.065807342529297, 25.412452697753906, 27.75909996032715, 30.10574722290039, 32.452392578125, 34.79903793334961, 37.14568328857422, 39.492332458496094, 41.8389778137207, 44.18562316894531, 46.53227233886719, 48.8789176940918, 51.225563049316406, 53.572208404541016, 55.918853759765625, 58.2655029296875, 60.61214828491211, 62.95879364013672, 65.3054428100586, 67.65208435058594, 69.99873352050781, 72.34538269042969, 74.69202423095703, 77.0386734008789, 79.38531494140625, 81.73196411132812, 84.07861328125, 86.42526245117188, 88.77190399169922, 91.1185531616211, 93.46519470214844, 95.81184387207031, 98.15849304199219, 100.50513458251953, 102.8517837524414, 105.19842529296875, 107.54507446289062]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 6.0, 5.0, 5.0, 12.0, 9.0, 14.0, 12.0, 20.0, 20.0, 20.0, 20.0, 33.0, 31.0, 28.0, 41.0, 28.0, 36.0, 34.0, 44.0, 34.0, 41.0, 43.0, 39.0, 50.0, 38.0, 37.0, 35.0, 35.0, 31.0, 34.0, 24.0, 18.0, 20.0, 18.0, 21.0, 10.0, 10.0, 4.0, 6.0, 12.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.50856590270996, -22.797746658325195, -22.086929321289062, -21.376110076904297, -20.665292739868164, -19.9544734954834, -19.243656158447266, -18.5328369140625, -17.822017669677734, -17.11119842529297, -16.400381088256836, -15.68956184387207, -14.978744506835938, -14.267925262451172, -13.557106971740723, -12.846288681030273, -12.13547134399414, -11.424653053283691, -10.713834762573242, -10.003015518188477, -9.292198181152344, -8.581378936767578, -7.870560646057129, -7.15974235534668, -6.4489240646362305, -5.738105773925781, -5.027287483215332, -4.316468715667725, -3.6056504249572754, -2.894832134246826, -2.1840133666992188, -1.4731950759887695, -0.7623748779296875, -0.05155646800994873, 0.65926194190979, 1.3700804710388184, 2.0808987617492676, 2.791717052459717, 3.502535820007324, 4.213354110717773, 4.924172401428223, 5.634990692138672, 6.345808982849121, 7.0566277503967285, 7.767446041107178, 8.478263854980469, 9.189083099365234, 9.899901390075684, 10.610719680786133, 11.321537971496582, 12.032356262207031, 12.743175506591797, 13.45399284362793, 14.164812088012695, 14.875630378723145, 15.586448669433594, 16.29726791381836, 17.008087158203125, 17.718904495239258, 18.429723739624023, 19.140541076660156, 19.851360321044922, 20.562179565429688, 21.27299690246582, 21.983814239501953]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 5.0, 8.0, 14.0, 15.0, 15.0, 15.0, 26.0, 25.0, 14.0, 32.0, 22.0, 47.0, 25.0, 33.0, 42.0, 42.0, 39.0, 52.0, 39.0, 38.0, 43.0, 38.0, 33.0, 40.0, 27.0, 38.0, 36.0, 28.0, 22.0, 24.0, 17.0, 15.0, 21.0, 12.0, 8.0, 12.0, 9.0, 11.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2265625, -2.1622314453125, -2.097900390625, -2.0335693359375, -1.96923828125, -1.9049072265625, -1.840576171875, -1.7762451171875, -1.7119140625, -1.6475830078125, -1.583251953125, -1.5189208984375, -1.45458984375, -1.3902587890625, -1.325927734375, -1.2615966796875, -1.197265625, -1.1329345703125, -1.068603515625, -1.0042724609375, -0.93994140625, -0.8756103515625, -0.811279296875, -0.7469482421875, -0.6826171875, -0.6182861328125, -0.553955078125, -0.4896240234375, -0.42529296875, -0.3609619140625, -0.296630859375, -0.2322998046875, -0.16796875, -0.1036376953125, -0.039306640625, 0.0250244140625, 0.08935546875, 0.1536865234375, 0.218017578125, 0.2823486328125, 0.3466796875, 0.4110107421875, 0.475341796875, 0.5396728515625, 0.60400390625, 0.6683349609375, 0.732666015625, 0.7969970703125, 0.861328125, 0.9256591796875, 0.989990234375, 1.0543212890625, 1.11865234375, 1.1829833984375, 1.247314453125, 1.3116455078125, 1.3759765625, 1.4403076171875, 1.504638671875, 1.5689697265625, 1.63330078125, 1.6976318359375, 1.761962890625, 1.8262939453125, 1.890625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 10.0, 1.0, 9.0, 4.0, 10.0, 10.0, 7.0, 15.0, 22.0, 27.0, 31.0, 42.0, 42.0, 53.0, 63.0, 90.0, 101.0, 177.0, 360.0, 729.0, 1995.0, 7463.0, 34270.0, 219243.0, 1903308.0, 1781364.0, 201846.0, 32184.0, 6980.0, 1997.0, 763.0, 317.0, 191.0, 128.0, 74.0, 52.0, 58.0, 38.0, 43.0, 36.0, 30.0, 20.0, 17.0, 12.0, 13.0, 8.0, 7.0, 4.0, 8.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0], "bins": [-6.97265625, -6.7674560546875, -6.562255859375, -6.3570556640625, -6.15185546875, -5.9466552734375, -5.741455078125, -5.5362548828125, -5.3310546875, -5.1258544921875, -4.920654296875, -4.7154541015625, -4.51025390625, -4.3050537109375, -4.099853515625, -3.8946533203125, -3.689453125, -3.4842529296875, -3.279052734375, -3.0738525390625, -2.86865234375, -2.6634521484375, -2.458251953125, -2.2530517578125, -2.0478515625, -1.8426513671875, -1.637451171875, -1.4322509765625, -1.22705078125, -1.0218505859375, -0.816650390625, -0.6114501953125, -0.40625, -0.2010498046875, 0.004150390625, 0.2093505859375, 0.41455078125, 0.6197509765625, 0.824951171875, 1.0301513671875, 1.2353515625, 1.4405517578125, 1.645751953125, 1.8509521484375, 2.05615234375, 2.2613525390625, 2.466552734375, 2.6717529296875, 2.876953125, 3.0821533203125, 3.287353515625, 3.4925537109375, 3.69775390625, 3.9029541015625, 4.108154296875, 4.3133544921875, 4.5185546875, 4.7237548828125, 4.928955078125, 5.1341552734375, 5.33935546875, 5.5445556640625, 5.749755859375, 5.9549560546875, 6.16015625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 10.0, 10.0, 6.0, 24.0, 16.0, 40.0, 43.0, 59.0, 81.0, 151.0, 188.0, 267.0, 393.0, 422.0, 487.0, 475.0, 354.0, 300.0, 234.0, 151.0, 116.0, 72.0, 56.0, 33.0, 24.0, 16.0, 16.0, 7.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.41796875, -7.203857421875, -6.98974609375, -6.775634765625, -6.5615234375, -6.347412109375, -6.13330078125, -5.919189453125, -5.705078125, -5.490966796875, -5.27685546875, -5.062744140625, -4.8486328125, -4.634521484375, -4.42041015625, -4.206298828125, -3.9921875, -3.778076171875, -3.56396484375, -3.349853515625, -3.1357421875, -2.921630859375, -2.70751953125, -2.493408203125, -2.279296875, -2.065185546875, -1.85107421875, -1.636962890625, -1.4228515625, -1.208740234375, -0.99462890625, -0.780517578125, -0.56640625, -0.352294921875, -0.13818359375, 0.075927734375, 0.2900390625, 0.504150390625, 0.71826171875, 0.932373046875, 1.146484375, 1.360595703125, 1.57470703125, 1.788818359375, 2.0029296875, 2.217041015625, 2.43115234375, 2.645263671875, 2.859375, 3.073486328125, 3.28759765625, 3.501708984375, 3.7158203125, 3.929931640625, 4.14404296875, 4.358154296875, 4.572265625, 4.786376953125, 5.00048828125, 5.214599609375, 5.4287109375, 5.642822265625, 5.85693359375, 6.071044921875, 6.28515625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 1.0, 8.0, 6.0, 13.0, 21.0, 41.0, 63.0, 83.0, 129.0, 237.0, 445.0, 951.0, 2098.0, 6399.0, 28303.0, 163798.0, 1136871.0, 2321547.0, 445705.0, 67888.0, 13294.0, 3548.0, 1405.0, 647.0, 314.0, 166.0, 96.0, 78.0, 35.0, 26.0, 21.0, 8.0, 7.0, 6.0, 10.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.75, -9.44775390625, -9.1455078125, -8.84326171875, -8.541015625, -8.23876953125, -7.9365234375, -7.63427734375, -7.33203125, -7.02978515625, -6.7275390625, -6.42529296875, -6.123046875, -5.82080078125, -5.5185546875, -5.21630859375, -4.9140625, -4.61181640625, -4.3095703125, -4.00732421875, -3.705078125, -3.40283203125, -3.1005859375, -2.79833984375, -2.49609375, -2.19384765625, -1.8916015625, -1.58935546875, -1.287109375, -0.98486328125, -0.6826171875, -0.38037109375, -0.078125, 0.22412109375, 0.5263671875, 0.82861328125, 1.130859375, 1.43310546875, 1.7353515625, 2.03759765625, 2.33984375, 2.64208984375, 2.9443359375, 3.24658203125, 3.548828125, 3.85107421875, 4.1533203125, 4.45556640625, 4.7578125, 5.06005859375, 5.3623046875, 5.66455078125, 5.966796875, 6.26904296875, 6.5712890625, 6.87353515625, 7.17578125, 7.47802734375, 7.7802734375, 8.08251953125, 8.384765625, 8.68701171875, 8.9892578125, 9.29150390625, 9.59375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 25.0, 98.0, 258.0, 326.0, 219.0, 72.0, 13.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.46650695800781, -58.83403778076172, -56.201568603515625, -53.569095611572266, -50.93662643432617, -48.30415725708008, -45.67168426513672, -43.039215087890625, -40.40674591064453, -37.77427673339844, -35.141807556152344, -32.509334564208984, -29.87686538696289, -27.244396209716797, -24.61192512512207, -21.979454040527344, -19.34698486328125, -16.714515686035156, -14.08204460144043, -11.44957447052002, -8.81710433959961, -6.184634208679199, -3.552164077758789, -0.9196929931640625, 1.7127761840820312, 4.345246315002441, 6.977716445922852, 9.610186576843262, 12.242656707763672, 14.875126838684082, 17.507596969604492, 20.14006805419922, 22.77252960205078, 25.404998779296875, 28.0374698638916, 30.669940948486328, 33.30241012573242, 35.934879302978516, 38.567352294921875, 41.19982147216797, 43.83229064941406, 46.464759826660156, 49.09722900390625, 51.72970199584961, 54.3621711730957, 56.9946403503418, 59.627113342285156, 62.25958251953125, 64.89205169677734, 67.52452087402344, 70.15699005126953, 72.78945922851562, 75.42193603515625, 78.05440521240234, 80.68687438964844, 83.31934356689453, 85.95181274414062, 88.58428192138672, 91.21675109863281, 93.8492202758789, 96.481689453125, 99.11416625976562, 101.74663543701172, 104.37910461425781, 107.0115737915039]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 6.0, 4.0, 10.0, 12.0, 9.0, 12.0, 26.0, 20.0, 20.0, 31.0, 21.0, 16.0, 31.0, 37.0, 38.0, 48.0, 32.0, 33.0, 41.0, 48.0, 33.0, 35.0, 59.0, 49.0, 40.0, 31.0, 42.0, 42.0, 25.0, 24.0, 31.0, 24.0, 12.0, 13.0, 10.0, 10.0, 7.0, 5.0, 8.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.72806739807129, -19.070178985595703, -18.412290573120117, -17.75440216064453, -17.096513748168945, -16.43862533569336, -15.78073787689209, -15.122849464416504, -14.464961051940918, -13.807072639465332, -13.149184226989746, -12.49129581451416, -11.83340835571289, -11.175519943237305, -10.517631530761719, -9.859743118286133, -9.201854705810547, -8.543966293334961, -7.886077880859375, -7.228189945220947, -6.570301532745361, -5.912413120269775, -5.254525184631348, -4.596636772155762, -3.938748359680176, -3.28085994720459, -2.622971773147583, -1.9650834798812866, -1.3071951866149902, -0.6493067741394043, 0.008581399917602539, 0.6664695739746094, 1.3243560791015625, 1.9822443723678589, 2.6401326656341553, 3.298020839691162, 3.955909252166748, 4.613797664642334, 5.271685600280762, 5.929574012756348, 6.587462425231934, 7.2453508377075195, 7.9032392501831055, 8.561127662658691, 9.219015121459961, 9.876903533935547, 10.534791946411133, 11.192680358886719, 11.850568771362305, 12.50845718383789, 13.166345596313477, 13.824234008789062, 14.482122421264648, 15.140010833740234, 15.797898292541504, 16.455787658691406, 17.11367416381836, 17.771562576293945, 18.42945098876953, 19.087339401245117, 19.745227813720703, 20.40311622619629, 21.061004638671875, 21.718891143798828, 22.376781463623047]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 4.0, 4.0, 4.0, 7.0, 12.0, 11.0, 12.0, 18.0, 17.0, 21.0, 21.0, 25.0, 31.0, 30.0, 31.0, 22.0, 31.0, 34.0, 36.0, 41.0, 28.0, 34.0, 37.0, 40.0, 38.0, 43.0, 40.0, 28.0, 37.0, 37.0, 28.0, 30.0, 20.0, 26.0, 20.0, 17.0, 12.0, 15.0, 9.0, 7.0, 10.0, 3.0, 14.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-2.142578125, -2.08154296875, -2.0205078125, -1.95947265625, -1.8984375, -1.83740234375, -1.7763671875, -1.71533203125, -1.654296875, -1.59326171875, -1.5322265625, -1.47119140625, -1.41015625, -1.34912109375, -1.2880859375, -1.22705078125, -1.166015625, -1.10498046875, -1.0439453125, -0.98291015625, -0.921875, -0.86083984375, -0.7998046875, -0.73876953125, -0.677734375, -0.61669921875, -0.5556640625, -0.49462890625, -0.43359375, -0.37255859375, -0.3115234375, -0.25048828125, -0.189453125, -0.12841796875, -0.0673828125, -0.00634765625, 0.0546875, 0.11572265625, 0.1767578125, 0.23779296875, 0.298828125, 0.35986328125, 0.4208984375, 0.48193359375, 0.54296875, 0.60400390625, 0.6650390625, 0.72607421875, 0.787109375, 0.84814453125, 0.9091796875, 0.97021484375, 1.03125, 1.09228515625, 1.1533203125, 1.21435546875, 1.275390625, 1.33642578125, 1.3974609375, 1.45849609375, 1.51953125, 1.58056640625, 1.6416015625, 1.70263671875, 1.763671875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 19.0, 33.0, 23.0, 50.0, 61.0, 95.0, 125.0, 183.0, 289.0, 403.0, 570.0, 909.0, 1426.0, 2156.0, 3420.0, 5263.0, 8540.0, 13568.0, 21859.0, 35456.0, 58108.0, 93199.0, 141067.0, 185834.0, 165895.0, 115909.0, 73661.0, 45489.0, 27867.0, 17350.0, 10715.0, 6789.0, 4159.0, 2723.0, 1798.0, 1135.0, 759.0, 541.0, 333.0, 220.0, 153.0, 117.0, 78.0, 50.0, 41.0, 27.0, 17.0, 15.0, 13.0, 9.0, 7.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.1781005859375, -0.17266273498535156, -0.16722488403320312, -0.1617870330810547, -0.15634918212890625, -0.1509113311767578, -0.14547348022460938, -0.14003562927246094, -0.1345977783203125, -0.12915992736816406, -0.12372207641601562, -0.11828422546386719, -0.11284637451171875, -0.10740852355957031, -0.10197067260742188, -0.09653282165527344, -0.091094970703125, -0.08565711975097656, -0.08021926879882812, -0.07478141784667969, -0.06934356689453125, -0.06390571594238281, -0.058467864990234375, -0.05303001403808594, -0.0475921630859375, -0.04215431213378906, -0.036716461181640625, -0.03127861022949219, -0.02584075927734375, -0.020402908325195312, -0.014965057373046875, -0.009527206420898438, -0.00408935546875, 0.0013484954833984375, 0.006786346435546875, 0.012224197387695312, 0.01766204833984375, 0.023099899291992188, 0.028537750244140625, 0.03397560119628906, 0.0394134521484375, 0.04485130310058594, 0.050289154052734375, 0.05572700500488281, 0.06116485595703125, 0.06660270690917969, 0.07204055786132812, 0.07747840881347656, 0.082916259765625, 0.08835411071777344, 0.09379196166992188, 0.09922981262207031, 0.10466766357421875, 0.11010551452636719, 0.11554336547851562, 0.12098121643066406, 0.1264190673828125, 0.13185691833496094, 0.13729476928710938, 0.1427326202392578, 0.14817047119140625, 0.1536083221435547, 0.15904617309570312, 0.16448402404785156, 0.169921875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 0.0, 7.0, 5.0, 9.0, 3.0, 15.0, 11.0, 14.0, 13.0, 17.0, 21.0, 18.0, 21.0, 30.0, 38.0, 24.0, 33.0, 38.0, 37.0, 33.0, 35.0, 35.0, 1067.0, 39.0, 43.0, 43.0, 33.0, 30.0, 39.0, 20.0, 34.0, 27.0, 28.0, 28.0, 16.0, 25.0, 22.0, 10.0, 9.0, 10.0, 7.0, 14.0, 4.0, 7.0, 2.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.3251953125, -1.285980224609375, -1.24676513671875, -1.207550048828125, -1.1683349609375, -1.129119873046875, -1.08990478515625, -1.050689697265625, -1.011474609375, -0.972259521484375, -0.93304443359375, -0.893829345703125, -0.8546142578125, -0.815399169921875, -0.77618408203125, -0.736968994140625, -0.69775390625, -0.658538818359375, -0.61932373046875, -0.580108642578125, -0.5408935546875, -0.501678466796875, -0.46246337890625, -0.423248291015625, -0.384033203125, -0.344818115234375, -0.30560302734375, -0.266387939453125, -0.2271728515625, -0.187957763671875, -0.14874267578125, -0.109527587890625, -0.0703125, -0.031097412109375, 0.00811767578125, 0.047332763671875, 0.0865478515625, 0.125762939453125, 0.16497802734375, 0.204193115234375, 0.243408203125, 0.282623291015625, 0.32183837890625, 0.361053466796875, 0.4002685546875, 0.439483642578125, 0.47869873046875, 0.517913818359375, 0.55712890625, 0.596343994140625, 0.63555908203125, 0.674774169921875, 0.7139892578125, 0.753204345703125, 0.79241943359375, 0.831634521484375, 0.870849609375, 0.910064697265625, 0.94927978515625, 0.988494873046875, 1.0277099609375, 1.066925048828125, 1.10614013671875, 1.145355224609375, 1.1845703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 14.0, 6.0, 11.0, 17.0, 30.0, 46.0, 63.0, 85.0, 125.0, 171.0, 244.0, 380.0, 535.0, 784.0, 1187.0, 1759.0, 2761.0, 4036.0, 6308.0, 9897.0, 14883.0, 22735.0, 34770.0, 51569.0, 73868.0, 102172.0, 143104.0, 1160210.0, 140182.0, 101772.0, 73388.0, 50689.0, 34267.0, 22324.0, 14631.0, 9461.0, 6316.0, 4090.0, 2750.0, 1779.0, 1235.0, 794.0, 539.0, 362.0, 262.0, 181.0, 124.0, 84.0, 45.0, 26.0, 18.0, 17.0, 10.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0], "bins": [-0.09136962890625, -0.08846759796142578, -0.08556556701660156, -0.08266353607177734, -0.07976150512695312, -0.0768594741821289, -0.07395744323730469, -0.07105541229248047, -0.06815338134765625, -0.06525135040283203, -0.06234931945800781, -0.059447288513183594, -0.056545257568359375, -0.053643226623535156, -0.05074119567871094, -0.04783916473388672, -0.0449371337890625, -0.04203510284423828, -0.03913307189941406, -0.036231040954589844, -0.033329010009765625, -0.030426979064941406, -0.027524948120117188, -0.02462291717529297, -0.02172088623046875, -0.01881885528564453, -0.015916824340820312, -0.013014793395996094, -0.010112762451171875, -0.007210731506347656, -0.0043087005615234375, -0.0014066696166992188, 0.001495361328125, 0.004397392272949219, 0.0072994232177734375, 0.010201454162597656, 0.013103485107421875, 0.016005516052246094, 0.018907546997070312, 0.02180957794189453, 0.02471160888671875, 0.02761363983154297, 0.030515670776367188, 0.033417701721191406, 0.036319732666015625, 0.039221763610839844, 0.04212379455566406, 0.04502582550048828, 0.0479278564453125, 0.05082988739013672, 0.05373191833496094, 0.056633949279785156, 0.059535980224609375, 0.062438011169433594, 0.06534004211425781, 0.06824207305908203, 0.07114410400390625, 0.07404613494873047, 0.07694816589355469, 0.0798501968383789, 0.08275222778320312, 0.08565425872802734, 0.08855628967285156, 0.09145832061767578, 0.0943603515625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 6.0, 6.0, 5.0, 10.0, 9.0, 14.0, 13.0, 18.0, 19.0, 29.0, 22.0, 37.0, 36.0, 64.0, 108.0, 107.0, 146.0, 98.0, 56.0, 40.0, 32.0, 21.0, 23.0, 19.0, 14.0, 10.0, 10.0, 8.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00475311279296875, -0.0045830607414245605, -0.004413008689880371, -0.004242956638336182, -0.004072904586791992, -0.0039028525352478027, -0.0037328004837036133, -0.003562748432159424, -0.0033926963806152344, -0.003222644329071045, -0.0030525922775268555, -0.002882540225982666, -0.0027124881744384766, -0.002542436122894287, -0.0023723840713500977, -0.002202332019805908, -0.0020322799682617188, -0.0018622279167175293, -0.0016921758651733398, -0.0015221238136291504, -0.001352071762084961, -0.0011820197105407715, -0.001011967658996582, -0.0008419156074523926, -0.0006718635559082031, -0.0005018115043640137, -0.0003317594528198242, -0.00016170740127563477, 8.344650268554688e-06, 0.00017839670181274414, 0.0003484487533569336, 0.000518500804901123, 0.0006885528564453125, 0.000858604907989502, 0.0010286569595336914, 0.0011987090110778809, 0.0013687610626220703, 0.0015388131141662598, 0.0017088651657104492, 0.0018789172172546387, 0.002048969268798828, 0.0022190213203430176, 0.002389073371887207, 0.0025591254234313965, 0.002729177474975586, 0.0028992295265197754, 0.003069281578063965, 0.0032393336296081543, 0.0034093856811523438, 0.003579437732696533, 0.0037494897842407227, 0.003919541835784912, 0.0040895938873291016, 0.004259645938873291, 0.0044296979904174805, 0.00459975004196167, 0.004769802093505859, 0.004939854145050049, 0.005109906196594238, 0.005279958248138428, 0.005450010299682617, 0.005620062351226807, 0.005790114402770996, 0.0059601664543151855, 0.006130218505859375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 6.0, 13.0, 15.0, 13.0, 10.0, 14.0, 25.0, 27.0, 38.0, 57.0, 78.0, 141.0, 262.0, 718.0, 39117.0, 1002712.0, 4178.0, 460.0, 168.0, 145.0, 80.0, 64.0, 57.0, 32.0, 25.0, 22.0, 10.0, 19.0, 8.0, 10.0, 10.0, 1.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1676025390625, -0.16298484802246094, -0.15836715698242188, -0.1537494659423828, -0.14913177490234375, -0.1445140838623047, -0.13989639282226562, -0.13527870178222656, -0.1306610107421875, -0.12604331970214844, -0.12142562866210938, -0.11680793762207031, -0.11219024658203125, -0.10757255554199219, -0.10295486450195312, -0.09833717346191406, -0.093719482421875, -0.08910179138183594, -0.08448410034179688, -0.07986640930175781, -0.07524871826171875, -0.07063102722167969, -0.06601333618164062, -0.06139564514160156, -0.0567779541015625, -0.05216026306152344, -0.047542572021484375, -0.04292488098144531, -0.03830718994140625, -0.03368949890136719, -0.029071807861328125, -0.024454116821289062, -0.01983642578125, -0.015218734741210938, -0.010601043701171875, -0.0059833526611328125, -0.00136566162109375, 0.0032520294189453125, 0.007869720458984375, 0.012487411499023438, 0.0171051025390625, 0.021722793579101562, 0.026340484619140625, 0.030958175659179688, 0.03557586669921875, 0.04019355773925781, 0.044811248779296875, 0.04942893981933594, 0.054046630859375, 0.05866432189941406, 0.06328201293945312, 0.06789970397949219, 0.07251739501953125, 0.07713508605957031, 0.08175277709960938, 0.08637046813964844, 0.0909881591796875, 0.09560585021972656, 0.10022354125976562, 0.10484123229980469, 0.10945892333984375, 0.11407661437988281, 0.11869430541992188, 0.12331199645996094, 0.1279296875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 30.0, 860.0, 128.0], "bins": [-0.20568373799324036, -0.20240294933319092, -0.19912216067314148, -0.19584137201309204, -0.1925605684518814, -0.18927977979183197, -0.18599899113178253, -0.1827182024717331, -0.17943741381168365, -0.17615662515163422, -0.17287583649158478, -0.16959503293037415, -0.1663142442703247, -0.16303345561027527, -0.15975266695022583, -0.1564718782901764, -0.15319107472896576, -0.14991028606891632, -0.14662949740886688, -0.14334869384765625, -0.1400679051876068, -0.13678711652755737, -0.13350632786750793, -0.1302255392074585, -0.12694475054740906, -0.12366396188735962, -0.12038316577672958, -0.11710237711668015, -0.1138215884566307, -0.11054079234600067, -0.10726000368595123, -0.1039792150259018, -0.10069841146469116, -0.09741762280464172, -0.09413682669401169, -0.09085603803396225, -0.08757524937391281, -0.08429445326328278, -0.08101366460323334, -0.0777328759431839, -0.07445207983255386, -0.07117129117250443, -0.06789049506187439, -0.06460970640182495, -0.061328914016485214, -0.05804812163114548, -0.05476733297109604, -0.0514865405857563, -0.04820575192570686, -0.044924959540367126, -0.04164417088031769, -0.03836337849497795, -0.035082586109638214, -0.031801797449588776, -0.02852100506424904, -0.025240212678909302, -0.021959422156214714, -0.018678631633520126, -0.01539783924818039, -0.012117048725485802, -0.00883625727146864, -0.005555465817451477, -0.0022746752947568893, 0.0010061170905828476, 0.004286907147616148]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 4.0, 10.0, 14.0, 11.0, 13.0, 10.0, 18.0, 19.0, 33.0, 41.0, 31.0, 39.0, 39.0, 50.0, 42.0, 48.0, 56.0, 51.0, 51.0, 41.0, 41.0, 40.0, 30.0, 42.0, 25.0, 29.0, 29.0, 30.0, 27.0, 15.0, 14.0, 13.0, 10.0, 6.0, 8.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004167735576629639, -0.0040216511115431786, -0.0038755666464567184, -0.0037294821813702583, -0.0035833977162837982, -0.003437313251197338, -0.003291228786110878, -0.003145144321024418, -0.0029990598559379578, -0.0028529753908514977, -0.0027068909257650375, -0.0025608064606785774, -0.0024147219955921173, -0.002268637530505657, -0.002122553065419197, -0.001976468600332737, -0.0018303841352462769, -0.0016842996701598167, -0.0015382152050733566, -0.0013921307399868965, -0.0012460462749004364, -0.0010999618098139763, -0.0009538773447275162, -0.0008077928796410561, -0.000661708414554596, -0.0005156239494681358, -0.0003695394843816757, -0.0002234550192952156, -7.737055420875549e-05, 6.871391087770462e-05, 0.00021479837596416473, 0.00036088284105062485, 0.000506967306137085, 0.0006530517712235451, 0.0007991362363100052, 0.0009452207013964653, 0.0010913051664829254, 0.0012373896315693855, 0.0013834740966558456, 0.0015295585617423058, 0.0016756430268287659, 0.001821727491915226, 0.001967811957001686, 0.002113896422088146, 0.0022599808871746063, 0.0024060653522610664, 0.0025521498173475266, 0.0026982342824339867, 0.0028443187475204468, 0.002990403212606907, 0.003136487677693367, 0.003282572142779827, 0.0034286566078662872, 0.0035747410729527473, 0.0037208255380392075, 0.0038669100031256676, 0.004012994468212128, 0.004159078933298588, 0.004305163398385048, 0.004451247863471508, 0.004597332328557968, 0.004743416793644428, 0.004889501258730888, 0.0050355857238173485, 0.005181670188903809]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 4.0, 4.0, 4.0, 7.0, 12.0, 11.0, 12.0, 18.0, 17.0, 21.0, 21.0, 25.0, 31.0, 30.0, 31.0, 22.0, 31.0, 34.0, 36.0, 41.0, 28.0, 34.0, 37.0, 40.0, 38.0, 42.0, 41.0, 28.0, 37.0, 37.0, 28.0, 30.0, 20.0, 26.0, 20.0, 17.0, 12.0, 15.0, 9.0, 7.0, 10.0, 3.0, 14.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-2.142578125, -2.08154296875, -2.0205078125, -1.95947265625, -1.8984375, -1.83740234375, -1.7763671875, -1.71533203125, -1.654296875, -1.59326171875, -1.5322265625, -1.47119140625, -1.41015625, -1.34912109375, -1.2880859375, -1.22705078125, -1.166015625, -1.10498046875, -1.0439453125, -0.98291015625, -0.921875, -0.86083984375, -0.7998046875, -0.73876953125, -0.677734375, -0.61669921875, -0.5556640625, -0.49462890625, -0.43359375, -0.37255859375, -0.3115234375, -0.25048828125, -0.189453125, -0.12841796875, -0.0673828125, -0.00634765625, 0.0546875, 0.11572265625, 0.1767578125, 0.23779296875, 0.298828125, 0.35986328125, 0.4208984375, 0.48193359375, 0.54296875, 0.60400390625, 0.6650390625, 0.72607421875, 0.787109375, 0.84814453125, 0.9091796875, 0.97021484375, 1.03125, 1.09228515625, 1.1533203125, 1.21435546875, 1.275390625, 1.33642578125, 1.3974609375, 1.45849609375, 1.51953125, 1.58056640625, 1.6416015625, 1.70263671875, 1.763671875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [6.0, 3.0, 3.0, 1.0, 15.0, 12.0, 25.0, 8.0, 25.0, 30.0, 44.0, 70.0, 113.0, 115.0, 161.0, 229.0, 354.0, 529.0, 732.0, 1190.0, 1913.0, 2933.0, 4782.0, 7807.0, 13144.0, 23014.0, 41011.0, 76952.0, 145981.0, 262305.0, 213285.0, 113387.0, 59613.0, 32331.0, 18260.0, 10701.0, 6350.0, 3910.0, 2447.0, 1550.0, 1035.0, 670.0, 476.0, 313.0, 221.0, 166.0, 104.0, 62.0, 57.0, 30.0, 28.0, 26.0, 16.0, 5.0, 7.0, 8.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.521484375, -1.470428466796875, -1.41937255859375, -1.368316650390625, -1.3172607421875, -1.266204833984375, -1.21514892578125, -1.164093017578125, -1.113037109375, -1.061981201171875, -1.01092529296875, -0.959869384765625, -0.9088134765625, -0.857757568359375, -0.80670166015625, -0.755645751953125, -0.70458984375, -0.653533935546875, -0.60247802734375, -0.551422119140625, -0.5003662109375, -0.449310302734375, -0.39825439453125, -0.347198486328125, -0.296142578125, -0.245086669921875, -0.19403076171875, -0.142974853515625, -0.0919189453125, -0.040863037109375, 0.01019287109375, 0.061248779296875, 0.1123046875, 0.163360595703125, 0.21441650390625, 0.265472412109375, 0.3165283203125, 0.367584228515625, 0.41864013671875, 0.469696044921875, 0.520751953125, 0.571807861328125, 0.62286376953125, 0.673919677734375, 0.7249755859375, 0.776031494140625, 0.82708740234375, 0.878143310546875, 0.92919921875, 0.980255126953125, 1.03131103515625, 1.082366943359375, 1.1334228515625, 1.184478759765625, 1.23553466796875, 1.286590576171875, 1.337646484375, 1.388702392578125, 1.43975830078125, 1.490814208984375, 1.5418701171875, 1.592926025390625, 1.64398193359375, 1.695037841796875, 1.74609375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 8.0, 2.0, 6.0, 3.0, 3.0, 10.0, 10.0, 18.0, 21.0, 19.0, 21.0, 23.0, 25.0, 28.0, 34.0, 35.0, 46.0, 41.0, 54.0, 65.0, 125.0, 249.0, 1483.0, 185.0, 91.0, 73.0, 54.0, 40.0, 33.0, 38.0, 31.0, 33.0, 24.0, 23.0, 22.0, 17.0, 14.0, 8.0, 13.0, 7.0, 3.0, 2.0, 5.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.49609375, -7.26422119140625, -7.0323486328125, -6.80047607421875, -6.568603515625, -6.33673095703125, -6.1048583984375, -5.87298583984375, -5.64111328125, -5.40924072265625, -5.1773681640625, -4.94549560546875, -4.713623046875, -4.48175048828125, -4.2498779296875, -4.01800537109375, -3.7861328125, -3.55426025390625, -3.3223876953125, -3.09051513671875, -2.858642578125, -2.62677001953125, -2.3948974609375, -2.16302490234375, -1.93115234375, -1.69927978515625, -1.4674072265625, -1.23553466796875, -1.003662109375, -0.77178955078125, -0.5399169921875, -0.30804443359375, -0.076171875, 0.15570068359375, 0.3875732421875, 0.61944580078125, 0.851318359375, 1.08319091796875, 1.3150634765625, 1.54693603515625, 1.77880859375, 2.01068115234375, 2.2425537109375, 2.47442626953125, 2.706298828125, 2.93817138671875, 3.1700439453125, 3.40191650390625, 3.6337890625, 3.86566162109375, 4.0975341796875, 4.32940673828125, 4.561279296875, 4.79315185546875, 5.0250244140625, 5.25689697265625, 5.48876953125, 5.72064208984375, 5.9525146484375, 6.18438720703125, 6.416259765625, 6.64813232421875, 6.8800048828125, 7.11187744140625, 7.34375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 11.0, 10.0, 14.0, 15.0, 22.0, 21.0, 26.0, 57.0, 53.0, 90.0, 106.0, 148.0, 240.0, 540.0, 1347.0, 7412.0, 128309.0, 2867335.0, 129520.0, 7669.0, 1406.0, 505.0, 282.0, 123.0, 94.0, 68.0, 52.0, 44.0, 34.0, 37.0, 23.0, 23.0, 14.0, 11.0, 9.0, 6.0, 3.0, 3.0, 6.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.765625, -11.3798828125, -10.994140625, -10.6083984375, -10.22265625, -9.8369140625, -9.451171875, -9.0654296875, -8.6796875, -8.2939453125, -7.908203125, -7.5224609375, -7.13671875, -6.7509765625, -6.365234375, -5.9794921875, -5.59375, -5.2080078125, -4.822265625, -4.4365234375, -4.05078125, -3.6650390625, -3.279296875, -2.8935546875, -2.5078125, -2.1220703125, -1.736328125, -1.3505859375, -0.96484375, -0.5791015625, -0.193359375, 0.1923828125, 0.578125, 0.9638671875, 1.349609375, 1.7353515625, 2.12109375, 2.5068359375, 2.892578125, 3.2783203125, 3.6640625, 4.0498046875, 4.435546875, 4.8212890625, 5.20703125, 5.5927734375, 5.978515625, 6.3642578125, 6.75, 7.1357421875, 7.521484375, 7.9072265625, 8.29296875, 8.6787109375, 9.064453125, 9.4501953125, 9.8359375, 10.2216796875, 10.607421875, 10.9931640625, 11.37890625, 11.7646484375, 12.150390625, 12.5361328125, 12.921875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [329.0, 683.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.175058841705322, -0.6615290641784668, 3.8520007133483887, 8.365530014038086, 12.879060745239258, 17.39259147644043, 21.90612030029297, 26.419649124145508, 30.93317985534668, 35.44670867919922, 39.96023941040039, 44.47377014160156, 48.98729705810547, 53.500831604003906, 58.01435852050781, 62.52788543701172, 67.04141998291016, 71.55494689941406, 76.0684814453125, 80.5820083618164, 85.09553527832031, 89.60906982421875, 94.12259674072266, 98.63612365722656, 103.149658203125, 107.6631851196289, 112.17671966552734, 116.69024658203125, 121.20378112792969, 125.7173080444336, 130.2308349609375, 134.74436950683594, 139.25790405273438, 143.7714385986328, 148.2849578857422, 152.79849243164062, 157.31202697753906, 161.8255615234375, 166.33908081054688, 170.8526153564453, 175.36614990234375, 179.8796844482422, 184.39320373535156, 188.90673828125, 193.42027282714844, 197.93380737304688, 202.44732666015625, 206.9608612060547, 211.47438049316406, 215.9879150390625, 220.50143432617188, 225.0149688720703, 229.52850341796875, 234.04202270507812, 238.55555725097656, 243.069091796875, 247.58261108398438, 252.0961456298828, 256.60968017578125, 261.1231994628906, 265.63671875, 270.1502685546875, 274.6637878417969, 279.17730712890625, 283.69085693359375]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 4.0, 6.0, 5.0, 8.0, 10.0, 9.0, 9.0, 22.0, 21.0, 23.0, 21.0, 27.0, 33.0, 32.0, 36.0, 33.0, 27.0, 33.0, 38.0, 49.0, 42.0, 44.0, 40.0, 41.0, 27.0, 29.0, 34.0, 29.0, 27.0, 37.0, 21.0, 31.0, 25.0, 18.0, 17.0, 15.0, 16.0, 13.0, 8.0, 11.0, 5.0, 10.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.62816047668457, -21.891433715820312, -21.154705047607422, -20.417978286743164, -19.681249618530273, -18.944522857666016, -18.207794189453125, -17.471067428588867, -16.73434066772461, -15.997612953186035, -15.260885238647461, -14.524158477783203, -13.787429809570312, -13.050703048706055, -12.31397533416748, -11.577247619628906, -10.840518951416016, -10.103791236877441, -9.367063522338867, -8.63033676147461, -7.893608570098877, -7.156880855560303, -6.420153617858887, -5.6834259033203125, -4.946698188781738, -4.209970474243164, -3.473242998123169, -2.736515522003174, -1.9997878074645996, -1.2630600929260254, -0.5263328552246094, 0.21039485931396484, 0.9471244812011719, 1.6838520765304565, 2.420579671859741, 3.1573071479797363, 3.8940348625183105, 4.630762577056885, 5.367489814758301, 6.104217529296875, 6.840945243835449, 7.577672958374023, 8.314400672912598, 9.051128387451172, 9.78785514831543, 10.52458381652832, 11.261310577392578, 11.998038291931152, 12.734766006469727, 13.4714937210083, 14.208221435546875, 14.944948196411133, 15.681676864624023, 16.41840362548828, 17.155132293701172, 17.89185905456543, 18.628585815429688, 19.365312576293945, 20.102041244506836, 20.838768005371094, 21.575496673583984, 22.312223434448242, 23.0489501953125, 23.78567886352539, 24.52240753173828]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 5.0, 10.0, 12.0, 13.0, 8.0, 17.0, 26.0, 20.0, 28.0, 22.0, 38.0, 32.0, 21.0, 32.0, 32.0, 29.0, 41.0, 42.0, 31.0, 44.0, 46.0, 32.0, 45.0, 40.0, 30.0, 32.0, 34.0, 43.0, 26.0, 21.0, 15.0, 21.0, 26.0, 10.0, 15.0, 6.0, 7.0, 12.0, 4.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.271484375, -2.204864501953125, -2.13824462890625, -2.071624755859375, -2.0050048828125, -1.938385009765625, -1.87176513671875, -1.805145263671875, -1.738525390625, -1.671905517578125, -1.60528564453125, -1.538665771484375, -1.4720458984375, -1.405426025390625, -1.33880615234375, -1.272186279296875, -1.20556640625, -1.138946533203125, -1.07232666015625, -1.005706787109375, -0.9390869140625, -0.872467041015625, -0.80584716796875, -0.739227294921875, -0.672607421875, -0.605987548828125, -0.53936767578125, -0.472747802734375, -0.4061279296875, -0.339508056640625, -0.27288818359375, -0.206268310546875, -0.1396484375, -0.073028564453125, -0.00640869140625, 0.060211181640625, 0.1268310546875, 0.193450927734375, 0.26007080078125, 0.326690673828125, 0.393310546875, 0.459930419921875, 0.52655029296875, 0.593170166015625, 0.6597900390625, 0.726409912109375, 0.79302978515625, 0.859649658203125, 0.92626953125, 0.992889404296875, 1.05950927734375, 1.126129150390625, 1.1927490234375, 1.259368896484375, 1.32598876953125, 1.392608642578125, 1.459228515625, 1.525848388671875, 1.59246826171875, 1.659088134765625, 1.7257080078125, 1.792327880859375, 1.85894775390625, 1.925567626953125, 1.9921875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 8.0, 7.0, 11.0, 17.0, 16.0, 14.0, 27.0, 20.0, 31.0, 35.0, 42.0, 55.0, 53.0, 115.0, 176.0, 423.0, 1101.0, 4434.0, 23342.0, 196136.0, 2258493.0, 1562776.0, 125082.0, 16731.0, 3262.0, 929.0, 350.0, 152.0, 94.0, 71.0, 47.0, 40.0, 29.0, 23.0, 34.0, 18.0, 14.0, 8.0, 16.0, 6.0, 9.0, 7.0, 10.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.5546875, -8.3023681640625, -8.050048828125, -7.7977294921875, -7.54541015625, -7.2930908203125, -7.040771484375, -6.7884521484375, -6.5361328125, -6.2838134765625, -6.031494140625, -5.7791748046875, -5.52685546875, -5.2745361328125, -5.022216796875, -4.7698974609375, -4.517578125, -4.2652587890625, -4.012939453125, -3.7606201171875, -3.50830078125, -3.2559814453125, -3.003662109375, -2.7513427734375, -2.4990234375, -2.2467041015625, -1.994384765625, -1.7420654296875, -1.48974609375, -1.2374267578125, -0.985107421875, -0.7327880859375, -0.48046875, -0.2281494140625, 0.024169921875, 0.2764892578125, 0.52880859375, 0.7811279296875, 1.033447265625, 1.2857666015625, 1.5380859375, 1.7904052734375, 2.042724609375, 2.2950439453125, 2.54736328125, 2.7996826171875, 3.052001953125, 3.3043212890625, 3.556640625, 3.8089599609375, 4.061279296875, 4.3135986328125, 4.56591796875, 4.8182373046875, 5.070556640625, 5.3228759765625, 5.5751953125, 5.8275146484375, 6.079833984375, 6.3321533203125, 6.58447265625, 6.8367919921875, 7.089111328125, 7.3414306640625, 7.59375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 12.0, 16.0, 14.0, 25.0, 39.0, 50.0, 86.0, 110.0, 146.0, 227.0, 328.0, 463.0, 512.0, 514.0, 429.0, 364.0, 218.0, 168.0, 93.0, 82.0, 44.0, 26.0, 26.0, 20.0, 22.0, 14.0, 9.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5390625, -9.30059814453125, -9.0621337890625, -8.82366943359375, -8.585205078125, -8.34674072265625, -8.1082763671875, -7.86981201171875, -7.63134765625, -7.39288330078125, -7.1544189453125, -6.91595458984375, -6.677490234375, -6.43902587890625, -6.2005615234375, -5.96209716796875, -5.7236328125, -5.48516845703125, -5.2467041015625, -5.00823974609375, -4.769775390625, -4.53131103515625, -4.2928466796875, -4.05438232421875, -3.81591796875, -3.57745361328125, -3.3389892578125, -3.10052490234375, -2.862060546875, -2.62359619140625, -2.3851318359375, -2.14666748046875, -1.908203125, -1.66973876953125, -1.4312744140625, -1.19281005859375, -0.954345703125, -0.71588134765625, -0.4774169921875, -0.23895263671875, -0.00048828125, 0.23797607421875, 0.4764404296875, 0.71490478515625, 0.953369140625, 1.19183349609375, 1.4302978515625, 1.66876220703125, 1.9072265625, 2.14569091796875, 2.3841552734375, 2.62261962890625, 2.861083984375, 3.09954833984375, 3.3380126953125, 3.57647705078125, 3.81494140625, 4.05340576171875, 4.2918701171875, 4.53033447265625, 4.768798828125, 5.00726318359375, 5.2457275390625, 5.48419189453125, 5.72265625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 15.0, 13.0, 27.0, 32.0, 36.0, 65.0, 121.0, 220.0, 443.0, 1115.0, 3871.0, 22346.0, 259739.0, 2821632.0, 1005699.0, 67540.0, 8075.0, 1950.0, 657.0, 302.0, 142.0, 84.0, 47.0, 46.0, 22.0, 16.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.921875, -11.458740234375, -10.99560546875, -10.532470703125, -10.0693359375, -9.606201171875, -9.14306640625, -8.679931640625, -8.216796875, -7.753662109375, -7.29052734375, -6.827392578125, -6.3642578125, -5.901123046875, -5.43798828125, -4.974853515625, -4.51171875, -4.048583984375, -3.58544921875, -3.122314453125, -2.6591796875, -2.196044921875, -1.73291015625, -1.269775390625, -0.806640625, -0.343505859375, 0.11962890625, 0.582763671875, 1.0458984375, 1.509033203125, 1.97216796875, 2.435302734375, 2.8984375, 3.361572265625, 3.82470703125, 4.287841796875, 4.7509765625, 5.214111328125, 5.67724609375, 6.140380859375, 6.603515625, 7.066650390625, 7.52978515625, 7.992919921875, 8.4560546875, 8.919189453125, 9.38232421875, 9.845458984375, 10.30859375, 10.771728515625, 11.23486328125, 11.697998046875, 12.1611328125, 12.624267578125, 13.08740234375, 13.550537109375, 14.013671875, 14.476806640625, 14.93994140625, 15.403076171875, 15.8662109375, 16.329345703125, 16.79248046875, 17.255615234375, 17.71875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 8.0, 14.0, 28.0, 51.0, 53.0, 73.0, 119.0, 116.0, 118.0, 106.0, 92.0, 76.0, 58.0, 37.0, 29.0, 14.0, 8.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.619972229003906, -32.55096435546875, -31.48195457458496, -30.412946701049805, -29.343936920166016, -28.27492904663086, -27.205921173095703, -26.136913299560547, -25.067903518676758, -23.9988956451416, -22.929885864257812, -21.860877990722656, -20.7918701171875, -19.72286033630371, -18.653852462768555, -17.584842681884766, -16.51583480834961, -15.446825981140137, -14.377817153930664, -13.308809280395508, -12.239800453186035, -11.170791625976562, -10.101783752441406, -9.032774925231934, -7.963766098022461, -6.894757270812988, -5.825748920440674, -4.756740570068359, -3.6877317428588867, -2.618722915649414, -1.5497145652770996, -0.48070621490478516, 0.5882987976074219, 1.6573073863983154, 2.726315975189209, 3.7953245639801025, 4.864333152770996, 5.933341979980469, 7.002350330352783, 8.071358680725098, 9.14036750793457, 10.209376335144043, 11.278385162353516, 12.347393035888672, 13.416401863098145, 14.485410690307617, 15.554418563842773, 16.623428344726562, 17.69243621826172, 18.761444091796875, 19.830453872680664, 20.89946174621582, 21.96847152709961, 23.037479400634766, 24.106487274169922, 25.175495147705078, 26.244504928588867, 27.313512802124023, 28.382522583007812, 29.45153045654297, 30.520538330078125, 31.589548110961914, 32.6585578918457, 33.72756576538086, 34.796573638916016]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 5.0, 10.0, 9.0, 12.0, 18.0, 25.0, 17.0, 14.0, 28.0, 21.0, 31.0, 38.0, 24.0, 31.0, 34.0, 27.0, 37.0, 48.0, 29.0, 44.0, 39.0, 36.0, 28.0, 50.0, 39.0, 36.0, 26.0, 33.0, 19.0, 20.0, 21.0, 16.0, 17.0, 17.0, 13.0, 12.0, 9.0, 15.0, 9.0, 4.0, 6.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.896915435791016, -17.28498077392578, -16.673046112060547, -16.061113357543945, -15.449178695678711, -14.837244033813477, -14.225310325622559, -13.61337661743164, -13.001441955566406, -12.389507293701172, -11.777573585510254, -11.165639877319336, -10.553705215454102, -9.941770553588867, -9.32983684539795, -8.717903137207031, -8.105968475341797, -7.494034290313721, -6.8821001052856445, -6.270165920257568, -5.658231735229492, -5.046297550201416, -4.43436336517334, -3.8224291801452637, -3.2104949951171875, -2.5985608100891113, -1.9866266250610352, -1.374692440032959, -0.7627582550048828, -0.15082406997680664, 0.46111011505126953, 1.0730443000793457, 1.6849784851074219, 2.296912670135498, 2.908846855163574, 3.5207810401916504, 4.132715225219727, 4.744649410247803, 5.356583595275879, 5.968517780303955, 6.580451965332031, 7.192386150360107, 7.804320335388184, 8.416254043579102, 9.028188705444336, 9.64012336730957, 10.252057075500488, 10.863990783691406, 11.47592544555664, 12.087860107421875, 12.699793815612793, 13.311727523803711, 13.923662185668945, 14.53559684753418, 15.147530555725098, 15.759464263916016, 16.37139892578125, 16.983333587646484, 17.59526824951172, 18.20720100402832, 18.819135665893555, 19.43107032775879, 20.04300308227539, 20.654937744140625, 21.26687240600586]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 5.0, 8.0, 6.0, 7.0, 9.0, 9.0, 13.0, 12.0, 10.0, 22.0, 24.0, 28.0, 16.0, 25.0, 25.0, 24.0, 38.0, 34.0, 36.0, 32.0, 32.0, 42.0, 43.0, 39.0, 36.0, 38.0, 42.0, 42.0, 39.0, 38.0, 30.0, 36.0, 21.0, 20.0, 19.0, 8.0, 21.0, 12.0, 10.0, 15.0, 8.0, 6.0, 8.0, 3.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0546875, -1.98779296875, -1.9208984375, -1.85400390625, -1.787109375, -1.72021484375, -1.6533203125, -1.58642578125, -1.51953125, -1.45263671875, -1.3857421875, -1.31884765625, -1.251953125, -1.18505859375, -1.1181640625, -1.05126953125, -0.984375, -0.91748046875, -0.8505859375, -0.78369140625, -0.716796875, -0.64990234375, -0.5830078125, -0.51611328125, -0.44921875, -0.38232421875, -0.3154296875, -0.24853515625, -0.181640625, -0.11474609375, -0.0478515625, 0.01904296875, 0.0859375, 0.15283203125, 0.2197265625, 0.28662109375, 0.353515625, 0.42041015625, 0.4873046875, 0.55419921875, 0.62109375, 0.68798828125, 0.7548828125, 0.82177734375, 0.888671875, 0.95556640625, 1.0224609375, 1.08935546875, 1.15625, 1.22314453125, 1.2900390625, 1.35693359375, 1.423828125, 1.49072265625, 1.5576171875, 1.62451171875, 1.69140625, 1.75830078125, 1.8251953125, 1.89208984375, 1.958984375, 2.02587890625, 2.0927734375, 2.15966796875, 2.2265625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 5.0, 7.0, 6.0, 10.0, 10.0, 8.0, 21.0, 28.0, 48.0, 73.0, 92.0, 152.0, 204.0, 285.0, 434.0, 658.0, 980.0, 1482.0, 2379.0, 3783.0, 5842.0, 9769.0, 16207.0, 26892.0, 44298.0, 72399.0, 114122.0, 165984.0, 188432.0, 145525.0, 95994.0, 59206.0, 36125.0, 21946.0, 13157.0, 8198.0, 4932.0, 3060.0, 1972.0, 1295.0, 845.0, 521.0, 391.0, 238.0, 171.0, 105.0, 83.0, 55.0, 43.0, 26.0, 15.0, 17.0, 10.0, 10.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.1907958984375, -0.1848888397216797, -0.17898178100585938, -0.17307472229003906, -0.16716766357421875, -0.16126060485839844, -0.15535354614257812, -0.1494464874267578, -0.1435394287109375, -0.1376323699951172, -0.13172531127929688, -0.12581825256347656, -0.11991119384765625, -0.11400413513183594, -0.10809707641601562, -0.10219001770019531, -0.096282958984375, -0.09037590026855469, -0.08446884155273438, -0.07856178283691406, -0.07265472412109375, -0.06674766540527344, -0.060840606689453125, -0.05493354797363281, -0.0490264892578125, -0.04311943054199219, -0.037212371826171875, -0.03130531311035156, -0.02539825439453125, -0.019491195678710938, -0.013584136962890625, -0.0076770782470703125, -0.00177001953125, 0.0041370391845703125, 0.010044097900390625, 0.015951156616210938, 0.02185821533203125, 0.027765274047851562, 0.033672332763671875, 0.03957939147949219, 0.0454864501953125, 0.05139350891113281, 0.057300567626953125, 0.06320762634277344, 0.06911468505859375, 0.07502174377441406, 0.08092880249023438, 0.08683586120605469, 0.092742919921875, 0.09864997863769531, 0.10455703735351562, 0.11046409606933594, 0.11637115478515625, 0.12227821350097656, 0.12818527221679688, 0.1340923309326172, 0.1399993896484375, 0.1459064483642578, 0.15181350708007812, 0.15772056579589844, 0.16362762451171875, 0.16953468322753906, 0.17544174194335938, 0.1813488006591797, 0.187255859375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 1.0, 7.0, 7.0, 8.0, 8.0, 12.0, 7.0, 9.0, 21.0, 12.0, 26.0, 24.0, 25.0, 34.0, 28.0, 43.0, 37.0, 44.0, 36.0, 51.0, 41.0, 1071.0, 45.0, 41.0, 44.0, 39.0, 35.0, 39.0, 43.0, 20.0, 21.0, 18.0, 17.0, 11.0, 13.0, 17.0, 21.0, 10.0, 9.0, 11.0, 2.0, 2.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0], "bins": [-1.705078125, -1.6590423583984375, -1.613006591796875, -1.5669708251953125, -1.52093505859375, -1.4748992919921875, -1.428863525390625, -1.3828277587890625, -1.3367919921875, -1.2907562255859375, -1.244720458984375, -1.1986846923828125, -1.15264892578125, -1.1066131591796875, -1.060577392578125, -1.0145416259765625, -0.968505859375, -0.9224700927734375, -0.876434326171875, -0.8303985595703125, -0.78436279296875, -0.7383270263671875, -0.692291259765625, -0.6462554931640625, -0.6002197265625, -0.5541839599609375, -0.508148193359375, -0.4621124267578125, -0.41607666015625, -0.3700408935546875, -0.324005126953125, -0.2779693603515625, -0.23193359375, -0.1858978271484375, -0.139862060546875, -0.0938262939453125, -0.04779052734375, -0.0017547607421875, 0.044281005859375, 0.0903167724609375, 0.1363525390625, 0.1823883056640625, 0.228424072265625, 0.2744598388671875, 0.32049560546875, 0.3665313720703125, 0.412567138671875, 0.4586029052734375, 0.504638671875, 0.5506744384765625, 0.596710205078125, 0.6427459716796875, 0.68878173828125, 0.7348175048828125, 0.780853271484375, 0.8268890380859375, 0.8729248046875, 0.9189605712890625, 0.964996337890625, 1.0110321044921875, 1.05706787109375, 1.1031036376953125, 1.149139404296875, 1.1951751708984375, 1.2412109375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 4.0, 6.0, 15.0, 23.0, 36.0, 63.0, 77.0, 157.0, 258.0, 463.0, 725.0, 1355.0, 2339.0, 4050.0, 7419.0, 13520.0, 24887.0, 43629.0, 75350.0, 121922.0, 195773.0, 1219874.0, 153440.0, 98042.0, 58384.0, 33396.0, 18734.0, 10296.0, 5570.0, 3251.0, 1769.0, 970.0, 528.0, 303.0, 199.0, 119.0, 72.0, 37.0, 22.0, 14.0, 8.0, 14.0, 5.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1339111328125, -0.1293354034423828, -0.12475967407226562, -0.12018394470214844, -0.11560821533203125, -0.11103248596191406, -0.10645675659179688, -0.10188102722167969, -0.0973052978515625, -0.09272956848144531, -0.08815383911132812, -0.08357810974121094, -0.07900238037109375, -0.07442665100097656, -0.06985092163085938, -0.06527519226074219, -0.060699462890625, -0.05612373352050781, -0.051548004150390625, -0.04697227478027344, -0.04239654541015625, -0.03782081604003906, -0.033245086669921875, -0.028669357299804688, -0.0240936279296875, -0.019517898559570312, -0.014942169189453125, -0.010366439819335938, -0.00579071044921875, -0.0012149810791015625, 0.003360748291015625, 0.007936477661132812, 0.01251220703125, 0.017087936401367188, 0.021663665771484375, 0.026239395141601562, 0.03081512451171875, 0.03539085388183594, 0.039966583251953125, 0.04454231262207031, 0.0491180419921875, 0.05369377136230469, 0.058269500732421875, 0.06284523010253906, 0.06742095947265625, 0.07199668884277344, 0.07657241821289062, 0.08114814758300781, 0.085723876953125, 0.09029960632324219, 0.09487533569335938, 0.09945106506347656, 0.10402679443359375, 0.10860252380371094, 0.11317825317382812, 0.11775398254394531, 0.1223297119140625, 0.1269054412841797, 0.13148117065429688, 0.13605690002441406, 0.14063262939453125, 0.14520835876464844, 0.14978408813476562, 0.1543598175048828, 0.158935546875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 8.0, 8.0, 10.0, 11.0, 14.0, 20.0, 19.0, 32.0, 46.0, 30.0, 39.0, 56.0, 73.0, 88.0, 80.0, 78.0, 71.0, 61.0, 44.0, 45.0, 34.0, 20.0, 10.0, 19.0, 15.0, 8.0, 10.0, 7.0, 7.0, 7.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00803375244140625, -0.007800281047821045, -0.00756680965423584, -0.007333338260650635, -0.00709986686706543, -0.006866395473480225, -0.0066329240798950195, -0.0063994526863098145, -0.006165981292724609, -0.005932509899139404, -0.005699038505554199, -0.005465567111968994, -0.005232095718383789, -0.004998624324798584, -0.004765152931213379, -0.004531681537628174, -0.004298210144042969, -0.004064738750457764, -0.0038312673568725586, -0.0035977959632873535, -0.0033643245697021484, -0.0031308531761169434, -0.0028973817825317383, -0.002663910388946533, -0.002430438995361328, -0.002196967601776123, -0.001963496208190918, -0.0017300248146057129, -0.0014965534210205078, -0.0012630820274353027, -0.0010296106338500977, -0.0007961392402648926, -0.0005626678466796875, -0.0003291964530944824, -9.572505950927734e-05, 0.00013774633407592773, 0.0003712177276611328, 0.0006046891212463379, 0.000838160514831543, 0.001071631908416748, 0.0013051033020019531, 0.0015385746955871582, 0.0017720460891723633, 0.0020055174827575684, 0.0022389888763427734, 0.0024724602699279785, 0.0027059316635131836, 0.0029394030570983887, 0.0031728744506835938, 0.003406345844268799, 0.003639817237854004, 0.003873288631439209, 0.004106760025024414, 0.004340231418609619, 0.004573702812194824, 0.004807174205780029, 0.005040645599365234, 0.0052741169929504395, 0.0055075883865356445, 0.00574105978012085, 0.005974531173706055, 0.00620800256729126, 0.006441473960876465, 0.00667494535446167, 0.006908416748046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 8.0, 5.0, 6.0, 10.0, 11.0, 12.0, 22.0, 17.0, 31.0, 34.0, 33.0, 63.0, 63.0, 97.0, 126.0, 216.0, 560.0, 8035.0, 1004614.0, 32927.0, 789.0, 291.0, 126.0, 77.0, 68.0, 54.0, 38.0, 31.0, 32.0, 25.0, 27.0, 18.0, 12.0, 18.0, 4.0, 6.0, 4.0, 5.0, 6.0, 1.0, 2.0, 4.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1312255859375, -0.12679672241210938, -0.12236785888671875, -0.11793899536132812, -0.1135101318359375, -0.10908126831054688, -0.10465240478515625, -0.10022354125976562, -0.095794677734375, -0.09136581420898438, -0.08693695068359375, -0.08250808715820312, -0.0780792236328125, -0.07365036010742188, -0.06922149658203125, -0.06479263305664062, -0.06036376953125, -0.055934906005859375, -0.05150604248046875, -0.047077178955078125, -0.0426483154296875, -0.038219451904296875, -0.03379058837890625, -0.029361724853515625, -0.024932861328125, -0.020503997802734375, -0.01607513427734375, -0.011646270751953125, -0.0072174072265625, -0.002788543701171875, 0.00164031982421875, 0.006069183349609375, 0.010498046875, 0.014926910400390625, 0.01935577392578125, 0.023784637451171875, 0.0282135009765625, 0.032642364501953125, 0.03707122802734375, 0.041500091552734375, 0.045928955078125, 0.050357818603515625, 0.05478668212890625, 0.059215545654296875, 0.0636444091796875, 0.06807327270507812, 0.07250213623046875, 0.07693099975585938, 0.08135986328125, 0.08578872680664062, 0.09021759033203125, 0.09464645385742188, 0.0990753173828125, 0.10350418090820312, 0.10793304443359375, 0.11236190795898438, 0.116790771484375, 0.12121963500976562, 0.12564849853515625, 0.13007736206054688, 0.1345062255859375, 0.13893508911132812, 0.14336395263671875, 0.14779281616210938, 0.1522216796875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 895.0, 97.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.22215846180915833, -0.21793340146541595, -0.21370834112167358, -0.20948326587677002, -0.20525820553302765, -0.20103314518928528, -0.1968080699443817, -0.19258300960063934, -0.18835794925689697, -0.1841328889131546, -0.17990782856941223, -0.17568275332450867, -0.1714576929807663, -0.16723263263702393, -0.16300755739212036, -0.158782497048378, -0.15455743670463562, -0.15033237636089325, -0.14610731601715088, -0.14188224077224731, -0.13765718042850494, -0.13343212008476257, -0.129207044839859, -0.12498198449611664, -0.12075692415237427, -0.1165318638086319, -0.11230679601430893, -0.10808172821998596, -0.10385666787624359, -0.09963160753250122, -0.09540653973817825, -0.09118147194385529, -0.08695642650127411, -0.08273136615753174, -0.07850629836320877, -0.0742812305688858, -0.07005617022514343, -0.06583110988140106, -0.061606042087078094, -0.057380978018045425, -0.053155913949012756, -0.04893084987998009, -0.04470578581094742, -0.04048072174191475, -0.03625565767288208, -0.03203059360384941, -0.027805529534816742, -0.023580465465784073, -0.019355401396751404, -0.015130337327718735, -0.010905273258686066, -0.006680209189653397, -0.0024551451206207275, 0.0017699189484119415, 0.005994983017444611, 0.01022004708647728, 0.014445111155509949, 0.018670175224542618, 0.022895239293575287, 0.027120303362607956, 0.031345367431640625, 0.035570431500673294, 0.03979549556970596, 0.04402055963873863, 0.0482456237077713]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 2.0, 4.0, 5.0, 5.0, 8.0, 11.0, 17.0, 21.0, 18.0, 21.0, 17.0, 38.0, 28.0, 36.0, 36.0, 45.0, 42.0, 47.0, 38.0, 65.0, 38.0, 43.0, 38.0, 40.0, 39.0, 25.0, 38.0, 28.0, 29.0, 33.0, 29.0, 20.0, 21.0, 14.0, 20.0, 9.0, 6.0, 7.0, 7.0, 5.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.010283708572387695, -0.009949051775038242, -0.00961439497768879, -0.009279738180339336, -0.008945081382989883, -0.00861042458564043, -0.008275767788290977, -0.007941110990941525, -0.0076064541935920715, -0.0072717973962426186, -0.006937140598893166, -0.006602483801543713, -0.00626782700419426, -0.005933170206844807, -0.005598513409495354, -0.005263856612145901, -0.004929199814796448, -0.004594543017446995, -0.004259886220097542, -0.003925229422748089, -0.003590572625398636, -0.003255915828049183, -0.00292125903069973, -0.002586602233350277, -0.002251945436000824, -0.001917288638651371, -0.001582631841301918, -0.001247975043952465, -0.0009133182466030121, -0.0005786614492535591, -0.00024400465190410614, 9.065214544534683e-05, 0.0004253089427947998, 0.0007599657401442528, 0.0010946225374937057, 0.0014292793348431587, 0.0017639361321926117, 0.0020985929295420647, 0.0024332497268915176, 0.0027679065242409706, 0.0031025633215904236, 0.0034372201189398766, 0.0037718769162893295, 0.0041065337136387825, 0.0044411905109882355, 0.0047758473083376884, 0.005110504105687141, 0.005445160903036594, 0.005779817700386047, 0.0061144744977355, 0.006449131295084953, 0.006783788092434406, 0.007118444889783859, 0.007453101687133312, 0.007787758484482765, 0.008122415281832218, 0.008457072079181671, 0.008791728876531124, 0.009126385673880577, 0.00946104247123003, 0.009795699268579483, 0.010130356065928936, 0.010465012863278389, 0.010799669660627842, 0.011134326457977295]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 5.0, 8.0, 6.0, 7.0, 9.0, 9.0, 13.0, 12.0, 10.0, 22.0, 24.0, 28.0, 16.0, 25.0, 25.0, 24.0, 38.0, 34.0, 36.0, 32.0, 32.0, 42.0, 43.0, 39.0, 36.0, 38.0, 42.0, 42.0, 39.0, 38.0, 30.0, 36.0, 21.0, 20.0, 19.0, 8.0, 21.0, 12.0, 10.0, 15.0, 8.0, 6.0, 8.0, 3.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0546875, -1.98779296875, -1.9208984375, -1.85400390625, -1.787109375, -1.72021484375, -1.6533203125, -1.58642578125, -1.51953125, -1.45263671875, -1.3857421875, -1.31884765625, -1.251953125, -1.18505859375, -1.1181640625, -1.05126953125, -0.984375, -0.91748046875, -0.8505859375, -0.78369140625, -0.716796875, -0.64990234375, -0.5830078125, -0.51611328125, -0.44921875, -0.38232421875, -0.3154296875, -0.24853515625, -0.181640625, -0.11474609375, -0.0478515625, 0.01904296875, 0.0859375, 0.15283203125, 0.2197265625, 0.28662109375, 0.353515625, 0.42041015625, 0.4873046875, 0.55419921875, 0.62109375, 0.68798828125, 0.7548828125, 0.82177734375, 0.888671875, 0.95556640625, 1.0224609375, 1.08935546875, 1.15625, 1.22314453125, 1.2900390625, 1.35693359375, 1.423828125, 1.49072265625, 1.5576171875, 1.62451171875, 1.69140625, 1.75830078125, 1.8251953125, 1.89208984375, 1.958984375, 2.02587890625, 2.0927734375, 2.15966796875, 2.2265625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 8.0, 6.0, 8.0, 10.0, 14.0, 16.0, 33.0, 40.0, 58.0, 58.0, 103.0, 137.0, 196.0, 301.0, 478.0, 822.0, 1469.0, 2666.0, 5342.0, 11377.0, 25467.0, 63730.0, 167096.0, 347237.0, 251767.0, 99508.0, 38343.0, 16237.0, 7622.0, 3749.0, 1890.0, 1034.0, 586.0, 379.0, 241.0, 158.0, 102.0, 59.0, 59.0, 40.0, 34.0, 20.0, 17.0, 11.0, 11.0, 9.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.119140625, -2.045379638671875, -1.97161865234375, -1.897857666015625, -1.8240966796875, -1.750335693359375, -1.67657470703125, -1.602813720703125, -1.529052734375, -1.455291748046875, -1.38153076171875, -1.307769775390625, -1.2340087890625, -1.160247802734375, -1.08648681640625, -1.012725830078125, -0.93896484375, -0.865203857421875, -0.79144287109375, -0.717681884765625, -0.6439208984375, -0.570159912109375, -0.49639892578125, -0.422637939453125, -0.348876953125, -0.275115966796875, -0.20135498046875, -0.127593994140625, -0.0538330078125, 0.019927978515625, 0.09368896484375, 0.167449951171875, 0.2412109375, 0.314971923828125, 0.38873291015625, 0.462493896484375, 0.5362548828125, 0.610015869140625, 0.68377685546875, 0.757537841796875, 0.831298828125, 0.905059814453125, 0.97882080078125, 1.052581787109375, 1.1263427734375, 1.200103759765625, 1.27386474609375, 1.347625732421875, 1.42138671875, 1.495147705078125, 1.56890869140625, 1.642669677734375, 1.7164306640625, 1.790191650390625, 1.86395263671875, 1.937713623046875, 2.011474609375, 2.085235595703125, 2.15899658203125, 2.232757568359375, 2.3065185546875, 2.380279541015625, 2.45404052734375, 2.527801513671875, 2.6015625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 6.0, 6.0, 14.0, 12.0, 11.0, 13.0, 29.0, 24.0, 30.0, 36.0, 34.0, 43.0, 35.0, 56.0, 69.0, 98.0, 195.0, 1553.0, 229.0, 100.0, 72.0, 44.0, 45.0, 43.0, 38.0, 30.0, 31.0, 24.0, 24.0, 16.0, 13.0, 15.0, 11.0, 10.0, 9.0, 5.0, 8.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7109375, -8.4439697265625, -8.177001953125, -7.9100341796875, -7.64306640625, -7.3760986328125, -7.109130859375, -6.8421630859375, -6.5751953125, -6.3082275390625, -6.041259765625, -5.7742919921875, -5.50732421875, -5.2403564453125, -4.973388671875, -4.7064208984375, -4.439453125, -4.1724853515625, -3.905517578125, -3.6385498046875, -3.37158203125, -3.1046142578125, -2.837646484375, -2.5706787109375, -2.3037109375, -2.0367431640625, -1.769775390625, -1.5028076171875, -1.23583984375, -0.9688720703125, -0.701904296875, -0.4349365234375, -0.16796875, 0.0989990234375, 0.365966796875, 0.6329345703125, 0.89990234375, 1.1668701171875, 1.433837890625, 1.7008056640625, 1.9677734375, 2.2347412109375, 2.501708984375, 2.7686767578125, 3.03564453125, 3.3026123046875, 3.569580078125, 3.8365478515625, 4.103515625, 4.3704833984375, 4.637451171875, 4.9044189453125, 5.17138671875, 5.4383544921875, 5.705322265625, 5.9722900390625, 6.2392578125, 6.5062255859375, 6.773193359375, 7.0401611328125, 7.30712890625, 7.5740966796875, 7.841064453125, 8.1080322265625, 8.375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 8.0, 9.0, 12.0, 13.0, 14.0, 20.0, 24.0, 32.0, 32.0, 43.0, 56.0, 72.0, 121.0, 178.0, 316.0, 682.0, 1975.0, 13238.0, 404542.0, 2673631.0, 44383.0, 4003.0, 1127.0, 430.0, 205.0, 133.0, 93.0, 60.0, 51.0, 43.0, 29.0, 28.0, 12.0, 18.0, 18.0, 11.0, 8.0, 6.0, 4.0, 9.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.6796875, -11.293212890625, -10.90673828125, -10.520263671875, -10.1337890625, -9.747314453125, -9.36083984375, -8.974365234375, -8.587890625, -8.201416015625, -7.81494140625, -7.428466796875, -7.0419921875, -6.655517578125, -6.26904296875, -5.882568359375, -5.49609375, -5.109619140625, -4.72314453125, -4.336669921875, -3.9501953125, -3.563720703125, -3.17724609375, -2.790771484375, -2.404296875, -2.017822265625, -1.63134765625, -1.244873046875, -0.8583984375, -0.471923828125, -0.08544921875, 0.301025390625, 0.6875, 1.073974609375, 1.46044921875, 1.846923828125, 2.2333984375, 2.619873046875, 3.00634765625, 3.392822265625, 3.779296875, 4.165771484375, 4.55224609375, 4.938720703125, 5.3251953125, 5.711669921875, 6.09814453125, 6.484619140625, 6.87109375, 7.257568359375, 7.64404296875, 8.030517578125, 8.4169921875, 8.803466796875, 9.18994140625, 9.576416015625, 9.962890625, 10.349365234375, 10.73583984375, 11.122314453125, 11.5087890625, 11.895263671875, 12.28173828125, 12.668212890625, 13.0546875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [2.0, 19.0, 634.0, 362.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.162151336669922, -6.605534076690674, -3.048916816711426, 0.5076999664306641, 4.06431770324707, 7.620935440063477, 11.17755126953125, 14.734169006347656, 18.290786743164062, 21.84740447998047, 25.404022216796875, 28.96063804626465, 32.51725769042969, 36.073875427246094, 39.630489349365234, 43.18710708618164, 46.74372482299805, 50.30034255981445, 53.85696029663086, 57.41357421875, 60.970191955566406, 64.52680969238281, 68.08342742919922, 71.64004516601562, 75.19666290283203, 78.75328063964844, 82.30989837646484, 85.86651611328125, 89.42313385009766, 92.97975158691406, 96.53636169433594, 100.09298706054688, 103.64959716796875, 107.20621490478516, 110.76283264160156, 114.31945037841797, 117.87606811523438, 121.43268585205078, 124.98930358886719, 128.54591369628906, 132.1025390625, 135.65914916992188, 139.2157745361328, 142.7723846435547, 146.32901000976562, 149.8856201171875, 153.44224548339844, 156.9988555908203, 160.55548095703125, 164.11209106445312, 167.66871643066406, 171.22532653808594, 174.78195190429688, 178.33856201171875, 181.8951873779297, 185.45179748535156, 189.00840759277344, 192.5650177001953, 196.12164306640625, 199.67825317382812, 203.23487854003906, 206.79148864746094, 210.34811401367188, 213.90472412109375, 217.4613494873047]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 8.0, 7.0, 18.0, 13.0, 7.0, 13.0, 18.0, 22.0, 23.0, 24.0, 23.0, 29.0, 33.0, 39.0, 33.0, 39.0, 39.0, 33.0, 51.0, 43.0, 40.0, 42.0, 37.0, 43.0, 31.0, 47.0, 43.0, 24.0, 27.0, 20.0, 16.0, 32.0, 12.0, 12.0, 14.0, 10.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.91610336303711, -24.085018157958984, -23.253931045532227, -22.4228458404541, -21.591760635375977, -20.76067352294922, -19.929588317871094, -19.09850311279297, -18.267417907714844, -17.43633270263672, -16.60524559020996, -15.774160385131836, -14.943075180053711, -14.11198902130127, -13.280902862548828, -12.449817657470703, -11.618730545043945, -10.787644386291504, -9.956559181213379, -9.125473022460938, -8.294387817382812, -7.463301658630371, -6.63221549987793, -5.8011298179626465, -4.970044136047363, -4.13895845413208, -3.3078725337982178, -2.4767866134643555, -1.6457009315490723, -0.8146152496337891, 0.016470909118652344, 0.8475565910339355, 1.6786422729492188, 2.509727954864502, 3.3408138751983643, 4.171899795532227, 5.00298547744751, 5.834071159362793, 6.665157318115234, 7.496243000030518, 8.3273286819458, 9.158414840698242, 9.989500045776367, 10.820586204528809, 11.65167236328125, 12.482757568359375, 13.313843727111816, 14.144929885864258, 14.976015090942383, 15.807101249694824, 16.638187408447266, 17.46927261352539, 18.300357818603516, 19.13144302368164, 19.9625301361084, 20.793615341186523, 21.62470245361328, 22.455787658691406, 23.286874771118164, 24.11795997619629, 24.949045181274414, 25.780132293701172, 26.611217498779297, 27.442302703857422, 28.273387908935547]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 7.0, 5.0, 5.0, 8.0, 8.0, 12.0, 14.0, 17.0, 23.0, 18.0, 23.0, 24.0, 23.0, 27.0, 27.0, 32.0, 33.0, 33.0, 35.0, 37.0, 28.0, 44.0, 40.0, 47.0, 42.0, 46.0, 37.0, 39.0, 38.0, 27.0, 35.0, 24.0, 23.0, 14.0, 19.0, 13.0, 8.0, 7.0, 14.0, 12.0, 7.0, 3.0, 6.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.22265625, -2.152618408203125, -2.08258056640625, -2.012542724609375, -1.9425048828125, -1.872467041015625, -1.80242919921875, -1.732391357421875, -1.662353515625, -1.592315673828125, -1.52227783203125, -1.452239990234375, -1.3822021484375, -1.312164306640625, -1.24212646484375, -1.172088623046875, -1.10205078125, -1.032012939453125, -0.96197509765625, -0.891937255859375, -0.8218994140625, -0.751861572265625, -0.68182373046875, -0.611785888671875, -0.541748046875, -0.471710205078125, -0.40167236328125, -0.331634521484375, -0.2615966796875, -0.191558837890625, -0.12152099609375, -0.051483154296875, 0.0185546875, 0.088592529296875, 0.15863037109375, 0.228668212890625, 0.2987060546875, 0.368743896484375, 0.43878173828125, 0.508819580078125, 0.578857421875, 0.648895263671875, 0.71893310546875, 0.788970947265625, 0.8590087890625, 0.929046630859375, 0.99908447265625, 1.069122314453125, 1.13916015625, 1.209197998046875, 1.27923583984375, 1.349273681640625, 1.4193115234375, 1.489349365234375, 1.55938720703125, 1.629425048828125, 1.699462890625, 1.769500732421875, 1.83953857421875, 1.909576416015625, 1.9796142578125, 2.049652099609375, 2.11968994140625, 2.189727783203125, 2.259765625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 5.0, 6.0, 15.0, 12.0, 16.0, 19.0, 31.0, 40.0, 50.0, 78.0, 107.0, 193.0, 448.0, 1152.0, 3319.0, 11078.0, 39039.0, 172611.0, 953324.0, 2172041.0, 673412.0, 124226.0, 29815.0, 8660.0, 2716.0, 959.0, 350.0, 203.0, 82.0, 77.0, 37.0, 32.0, 26.0, 11.0, 25.0, 14.0, 6.0, 8.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03515625, -4.8695068359375, -4.703857421875, -4.5382080078125, -4.37255859375, -4.2069091796875, -4.041259765625, -3.8756103515625, -3.7099609375, -3.5443115234375, -3.378662109375, -3.2130126953125, -3.04736328125, -2.8817138671875, -2.716064453125, -2.5504150390625, -2.384765625, -2.2191162109375, -2.053466796875, -1.8878173828125, -1.72216796875, -1.5565185546875, -1.390869140625, -1.2252197265625, -1.0595703125, -0.8939208984375, -0.728271484375, -0.5626220703125, -0.39697265625, -0.2313232421875, -0.065673828125, 0.0999755859375, 0.265625, 0.4312744140625, 0.596923828125, 0.7625732421875, 0.92822265625, 1.0938720703125, 1.259521484375, 1.4251708984375, 1.5908203125, 1.7564697265625, 1.922119140625, 2.0877685546875, 2.25341796875, 2.4190673828125, 2.584716796875, 2.7503662109375, 2.916015625, 3.0816650390625, 3.247314453125, 3.4129638671875, 3.57861328125, 3.7442626953125, 3.909912109375, 4.0755615234375, 4.2412109375, 4.4068603515625, 4.572509765625, 4.7381591796875, 4.90380859375, 5.0694580078125, 5.235107421875, 5.4007568359375, 5.56640625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 12.0, 16.0, 16.0, 31.0, 47.0, 53.0, 58.0, 124.0, 131.0, 179.0, 256.0, 351.0, 414.0, 454.0, 451.0, 364.0, 282.0, 232.0, 155.0, 125.0, 86.0, 68.0, 43.0, 31.0, 24.0, 13.0, 12.0, 10.0, 5.0, 7.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.08203125, -6.87188720703125, -6.6617431640625, -6.45159912109375, -6.241455078125, -6.03131103515625, -5.8211669921875, -5.61102294921875, -5.40087890625, -5.19073486328125, -4.9805908203125, -4.77044677734375, -4.560302734375, -4.35015869140625, -4.1400146484375, -3.92987060546875, -3.7197265625, -3.50958251953125, -3.2994384765625, -3.08929443359375, -2.879150390625, -2.66900634765625, -2.4588623046875, -2.24871826171875, -2.03857421875, -1.82843017578125, -1.6182861328125, -1.40814208984375, -1.197998046875, -0.98785400390625, -0.7777099609375, -0.56756591796875, -0.357421875, -0.14727783203125, 0.0628662109375, 0.27301025390625, 0.483154296875, 0.69329833984375, 0.9034423828125, 1.11358642578125, 1.32373046875, 1.53387451171875, 1.7440185546875, 1.95416259765625, 2.164306640625, 2.37445068359375, 2.5845947265625, 2.79473876953125, 3.0048828125, 3.21502685546875, 3.4251708984375, 3.63531494140625, 3.845458984375, 4.05560302734375, 4.2657470703125, 4.47589111328125, 4.68603515625, 4.89617919921875, 5.1063232421875, 5.31646728515625, 5.526611328125, 5.73675537109375, 5.9468994140625, 6.15704345703125, 6.3671875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 5.0, 10.0, 18.0, 31.0, 50.0, 84.0, 119.0, 254.0, 446.0, 995.0, 2723.0, 9769.0, 52805.0, 363705.0, 2209649.0, 1333006.0, 182813.0, 28296.0, 5994.0, 1896.0, 779.0, 364.0, 176.0, 114.0, 62.0, 40.0, 24.0, 21.0, 11.0, 3.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.2578125, -12.9249267578125, -12.592041015625, -12.2591552734375, -11.92626953125, -11.5933837890625, -11.260498046875, -10.9276123046875, -10.5947265625, -10.2618408203125, -9.928955078125, -9.5960693359375, -9.26318359375, -8.9302978515625, -8.597412109375, -8.2645263671875, -7.931640625, -7.5987548828125, -7.265869140625, -6.9329833984375, -6.60009765625, -6.2672119140625, -5.934326171875, -5.6014404296875, -5.2685546875, -4.9356689453125, -4.602783203125, -4.2698974609375, -3.93701171875, -3.6041259765625, -3.271240234375, -2.9383544921875, -2.60546875, -2.2725830078125, -1.939697265625, -1.6068115234375, -1.27392578125, -0.9410400390625, -0.608154296875, -0.2752685546875, 0.0576171875, 0.3905029296875, 0.723388671875, 1.0562744140625, 1.38916015625, 1.7220458984375, 2.054931640625, 2.3878173828125, 2.720703125, 3.0535888671875, 3.386474609375, 3.7193603515625, 4.05224609375, 4.3851318359375, 4.718017578125, 5.0509033203125, 5.3837890625, 5.7166748046875, 6.049560546875, 6.3824462890625, 6.71533203125, 7.0482177734375, 7.381103515625, 7.7139892578125, 8.046875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 24.0, 62.0, 144.0, 214.0, 227.0, 182.0, 104.0, 33.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.97291564941406, -92.60398864746094, -90.23506164550781, -87.86613464355469, -85.4972152709961, -83.12828826904297, -80.75936126708984, -78.39043426513672, -76.0215072631836, -73.65258026123047, -71.28365325927734, -68.91473388671875, -66.54580688476562, -64.1768798828125, -61.807952880859375, -59.43902587890625, -57.07010269165039, -54.701175689697266, -52.332252502441406, -49.96332550048828, -47.594398498535156, -45.22547149658203, -42.85654830932617, -40.48762130737305, -38.11869812011719, -35.74977111816406, -33.3808479309082, -31.011920928955078, -28.642993927001953, -26.27406883239746, -23.90514373779297, -21.536216735839844, -19.167293548583984, -16.798368453979492, -14.429441452026367, -12.060516357421875, -9.691590309143066, -7.322664260864258, -4.953739166259766, -2.5848121643066406, -0.21588706970214844, 2.153038740158081, 4.5219645500183105, 6.890890121459961, 9.25981616973877, 11.628742218017578, 13.99766731262207, 16.366594314575195, 18.735519409179688, 21.10444450378418, 23.473371505737305, 25.842296600341797, 28.211223602294922, 30.580148696899414, 32.949073791503906, 35.31800079345703, 37.686927795410156, 40.05585479736328, 42.42477798461914, 44.793704986572266, 47.16263198852539, 49.53155517578125, 51.900482177734375, 54.2694091796875, 56.63833236694336]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 7.0, 9.0, 9.0, 6.0, 15.0, 12.0, 19.0, 19.0, 11.0, 22.0, 27.0, 25.0, 31.0, 29.0, 38.0, 38.0, 39.0, 43.0, 36.0, 43.0, 52.0, 39.0, 37.0, 46.0, 36.0, 28.0, 32.0, 43.0, 31.0, 23.0, 24.0, 24.0, 17.0, 24.0, 21.0, 15.0, 4.0, 10.0, 5.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.37346839904785, -19.657672882080078, -18.941877365112305, -18.22608184814453, -17.510286331176758, -16.794490814208984, -16.07869529724121, -15.362899780273438, -14.647104263305664, -13.93130874633789, -13.215513229370117, -12.499717712402344, -11.78392219543457, -11.068126678466797, -10.352331161499023, -9.63653564453125, -8.920741081237793, -8.20494556427002, -7.489150047302246, -6.773354530334473, -6.057559013366699, -5.341763496398926, -4.6259684562683105, -3.910172939300537, -3.1943774223327637, -2.4785819053649902, -1.7627865076065063, -1.0469911098480225, -0.331195592880249, 0.3845999240875244, 1.1003952026367188, 1.8161907196044922, 2.5319862365722656, 3.247781753540039, 3.9635772705078125, 4.679372787475586, 5.395168304443359, 6.110963821411133, 6.826758861541748, 7.5425543785095215, 8.258350372314453, 8.974145889282227, 9.68994140625, 10.405736923217773, 11.121532440185547, 11.83732795715332, 12.553123474121094, 13.268918991088867, 13.984713554382324, 14.700509071350098, 15.416304588317871, 16.132099151611328, 16.8478946685791, 17.563690185546875, 18.27948570251465, 18.995281219482422, 19.711076736450195, 20.42687225341797, 21.142667770385742, 21.858463287353516, 22.57425880432129, 23.290054321289062, 24.005849838256836, 24.72164535522461, 25.437440872192383]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 7.0, 4.0, 9.0, 10.0, 14.0, 16.0, 10.0, 11.0, 27.0, 19.0, 15.0, 29.0, 34.0, 30.0, 21.0, 37.0, 40.0, 33.0, 30.0, 46.0, 33.0, 51.0, 51.0, 40.0, 30.0, 42.0, 33.0, 37.0, 33.0, 25.0, 26.0, 18.0, 22.0, 26.0, 21.0, 12.0, 10.0, 6.0, 7.0, 4.0, 7.0, 10.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.2578125, -2.184661865234375, -2.11151123046875, -2.038360595703125, -1.9652099609375, -1.892059326171875, -1.81890869140625, -1.745758056640625, -1.672607421875, -1.599456787109375, -1.52630615234375, -1.453155517578125, -1.3800048828125, -1.306854248046875, -1.23370361328125, -1.160552978515625, -1.08740234375, -1.014251708984375, -0.94110107421875, -0.867950439453125, -0.7947998046875, -0.721649169921875, -0.64849853515625, -0.575347900390625, -0.502197265625, -0.429046630859375, -0.35589599609375, -0.282745361328125, -0.2095947265625, -0.136444091796875, -0.06329345703125, 0.009857177734375, 0.0830078125, 0.156158447265625, 0.22930908203125, 0.302459716796875, 0.3756103515625, 0.448760986328125, 0.52191162109375, 0.595062255859375, 0.668212890625, 0.741363525390625, 0.81451416015625, 0.887664794921875, 0.9608154296875, 1.033966064453125, 1.10711669921875, 1.180267333984375, 1.25341796875, 1.326568603515625, 1.39971923828125, 1.472869873046875, 1.5460205078125, 1.619171142578125, 1.69232177734375, 1.765472412109375, 1.838623046875, 1.911773681640625, 1.98492431640625, 2.058074951171875, 2.1312255859375, 2.204376220703125, 2.27752685546875, 2.350677490234375, 2.423828125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 8.0, 9.0, 13.0, 27.0, 19.0, 27.0, 71.0, 105.0, 144.0, 192.0, 332.0, 466.0, 741.0, 1089.0, 1574.0, 2535.0, 3819.0, 5804.0, 9192.0, 14680.0, 23061.0, 37495.0, 60412.0, 95226.0, 140454.0, 177090.0, 159786.0, 114495.0, 74387.0, 46912.0, 28758.0, 17873.0, 11198.0, 7166.0, 4613.0, 2928.0, 2007.0, 1259.0, 875.0, 546.0, 394.0, 246.0, 161.0, 124.0, 78.0, 59.0, 53.0, 25.0, 13.0, 12.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1962890625, -0.19010162353515625, -0.1839141845703125, -0.17772674560546875, -0.171539306640625, -0.16535186767578125, -0.1591644287109375, -0.15297698974609375, -0.14678955078125, -0.14060211181640625, -0.1344146728515625, -0.12822723388671875, -0.122039794921875, -0.11585235595703125, -0.1096649169921875, -0.10347747802734375, -0.0972900390625, -0.09110260009765625, -0.0849151611328125, -0.07872772216796875, -0.072540283203125, -0.06635284423828125, -0.0601654052734375, -0.05397796630859375, -0.04779052734375, -0.04160308837890625, -0.0354156494140625, -0.02922821044921875, -0.023040771484375, -0.01685333251953125, -0.0106658935546875, -0.00447845458984375, 0.001708984375, 0.00789642333984375, 0.0140838623046875, 0.02027130126953125, 0.026458740234375, 0.03264617919921875, 0.0388336181640625, 0.04502105712890625, 0.05120849609375, 0.05739593505859375, 0.0635833740234375, 0.06977081298828125, 0.075958251953125, 0.08214569091796875, 0.0883331298828125, 0.09452056884765625, 0.1007080078125, 0.10689544677734375, 0.1130828857421875, 0.11927032470703125, 0.125457763671875, 0.13164520263671875, 0.1378326416015625, 0.14402008056640625, 0.15020751953125, 0.15639495849609375, 0.1625823974609375, 0.16876983642578125, 0.174957275390625, 0.18114471435546875, 0.1873321533203125, 0.19351959228515625, 0.19970703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 8.0, 8.0, 9.0, 6.0, 5.0, 4.0, 6.0, 13.0, 8.0, 14.0, 21.0, 26.0, 23.0, 33.0, 34.0, 30.0, 27.0, 43.0, 44.0, 37.0, 42.0, 36.0, 1071.0, 39.0, 40.0, 44.0, 30.0, 37.0, 34.0, 32.0, 32.0, 24.0, 19.0, 30.0, 15.0, 22.0, 18.0, 8.0, 9.0, 6.0, 10.0, 3.0, 8.0, 7.0, 0.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4228515625, -1.3766937255859375, -1.330535888671875, -1.2843780517578125, -1.23822021484375, -1.1920623779296875, -1.145904541015625, -1.0997467041015625, -1.0535888671875, -1.0074310302734375, -0.961273193359375, -0.9151153564453125, -0.86895751953125, -0.8227996826171875, -0.776641845703125, -0.7304840087890625, -0.684326171875, -0.6381683349609375, -0.592010498046875, -0.5458526611328125, -0.49969482421875, -0.4535369873046875, -0.407379150390625, -0.3612213134765625, -0.3150634765625, -0.2689056396484375, -0.222747802734375, -0.1765899658203125, -0.13043212890625, -0.0842742919921875, -0.038116455078125, 0.0080413818359375, 0.05419921875, 0.1003570556640625, 0.146514892578125, 0.1926727294921875, 0.23883056640625, 0.2849884033203125, 0.331146240234375, 0.3773040771484375, 0.4234619140625, 0.4696197509765625, 0.515777587890625, 0.5619354248046875, 0.60809326171875, 0.6542510986328125, 0.700408935546875, 0.7465667724609375, 0.792724609375, 0.8388824462890625, 0.885040283203125, 0.9311981201171875, 0.97735595703125, 1.0235137939453125, 1.069671630859375, 1.1158294677734375, 1.1619873046875, 1.2081451416015625, 1.254302978515625, 1.3004608154296875, 1.34661865234375, 1.3927764892578125, 1.438934326171875, 1.4850921630859375, 1.53125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 15.0, 29.0, 32.0, 63.0, 74.0, 118.0, 183.0, 259.0, 373.0, 577.0, 972.0, 1470.0, 2260.0, 3711.0, 5808.0, 8985.0, 14200.0, 23203.0, 37282.0, 57715.0, 87216.0, 124018.0, 505971.0, 845924.0, 125516.0, 89557.0, 59511.0, 38154.0, 23803.0, 15025.0, 9376.0, 5675.0, 3587.0, 2273.0, 1441.0, 963.0, 604.0, 413.0, 247.0, 174.0, 81.0, 85.0, 68.0, 42.0, 19.0, 17.0, 14.0, 13.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1163330078125, -0.11245918273925781, -0.10858535766601562, -0.10471153259277344, -0.10083770751953125, -0.09696388244628906, -0.09309005737304688, -0.08921623229980469, -0.0853424072265625, -0.08146858215332031, -0.07759475708007812, -0.07372093200683594, -0.06984710693359375, -0.06597328186035156, -0.062099456787109375, -0.05822563171386719, -0.054351806640625, -0.05047798156738281, -0.046604156494140625, -0.04273033142089844, -0.03885650634765625, -0.03498268127441406, -0.031108856201171875, -0.027235031127929688, -0.0233612060546875, -0.019487380981445312, -0.015613555908203125, -0.011739730834960938, -0.00786590576171875, -0.0039920806884765625, -0.000118255615234375, 0.0037555694580078125, 0.00762939453125, 0.011503219604492188, 0.015377044677734375, 0.019250869750976562, 0.02312469482421875, 0.026998519897460938, 0.030872344970703125, 0.03474617004394531, 0.0386199951171875, 0.04249382019042969, 0.046367645263671875, 0.05024147033691406, 0.05411529541015625, 0.05798912048339844, 0.061862945556640625, 0.06573677062988281, 0.069610595703125, 0.07348442077636719, 0.07735824584960938, 0.08123207092285156, 0.08510589599609375, 0.08897972106933594, 0.09285354614257812, 0.09672737121582031, 0.1006011962890625, 0.10447502136230469, 0.10834884643554688, 0.11222267150878906, 0.11609649658203125, 0.11997032165527344, 0.12384414672851562, 0.1277179718017578, 0.131591796875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 10.0, 6.0, 8.0, 9.0, 17.0, 20.0, 17.0, 39.0, 30.0, 64.0, 85.0, 135.0, 125.0, 95.0, 77.0, 52.0, 40.0, 32.0, 18.0, 16.0, 18.0, 13.0, 11.0, 6.0, 7.0, 1.0, 2.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0074920654296875, -0.007260143756866455, -0.00702822208404541, -0.006796300411224365, -0.00656437873840332, -0.006332457065582275, -0.0061005353927612305, -0.0058686137199401855, -0.005636692047119141, -0.005404770374298096, -0.005172848701477051, -0.004940927028656006, -0.004709005355834961, -0.004477083683013916, -0.004245162010192871, -0.004013240337371826, -0.0037813186645507812, -0.0035493969917297363, -0.0033174753189086914, -0.0030855536460876465, -0.0028536319732666016, -0.0026217103004455566, -0.0023897886276245117, -0.002157866954803467, -0.0019259452819824219, -0.001694023609161377, -0.001462101936340332, -0.0012301802635192871, -0.0009982585906982422, -0.0007663369178771973, -0.0005344152450561523, -0.0003024935722351074, -7.05718994140625e-05, 0.00016134977340698242, 0.00039327144622802734, 0.0006251931190490723, 0.0008571147918701172, 0.0010890364646911621, 0.001320958137512207, 0.001552879810333252, 0.0017848014831542969, 0.002016723155975342, 0.0022486448287963867, 0.0024805665016174316, 0.0027124881744384766, 0.0029444098472595215, 0.0031763315200805664, 0.0034082531929016113, 0.0036401748657226562, 0.003872096538543701, 0.004104018211364746, 0.004335939884185791, 0.004567861557006836, 0.004799783229827881, 0.005031704902648926, 0.005263626575469971, 0.005495548248291016, 0.0057274699211120605, 0.0059593915939331055, 0.00619131326675415, 0.006423234939575195, 0.00665515661239624, 0.006887078285217285, 0.00711899995803833, 0.007350921630859375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 3.0, 1.0, 4.0, 9.0, 12.0, 8.0, 12.0, 27.0, 27.0, 51.0, 97.0, 163.0, 287.0, 962.0, 92947.0, 949834.0, 3199.0, 391.0, 173.0, 104.0, 69.0, 47.0, 26.0, 18.0, 11.0, 14.0, 6.0, 4.0, 12.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1748046875, -0.16920089721679688, -0.16359710693359375, -0.15799331665039062, -0.1523895263671875, -0.14678573608398438, -0.14118194580078125, -0.13557815551757812, -0.129974365234375, -0.12437057495117188, -0.11876678466796875, -0.11316299438476562, -0.1075592041015625, -0.10195541381835938, -0.09635162353515625, -0.09074783325195312, -0.08514404296875, -0.07954025268554688, -0.07393646240234375, -0.06833267211914062, -0.0627288818359375, -0.057125091552734375, -0.05152130126953125, -0.045917510986328125, -0.040313720703125, -0.034709930419921875, -0.02910614013671875, -0.023502349853515625, -0.0178985595703125, -0.012294769287109375, -0.00669097900390625, -0.001087188720703125, 0.0045166015625, 0.010120391845703125, 0.01572418212890625, 0.021327972412109375, 0.0269317626953125, 0.032535552978515625, 0.03813934326171875, 0.043743133544921875, 0.049346923828125, 0.054950714111328125, 0.06055450439453125, 0.06615829467773438, 0.0717620849609375, 0.07736587524414062, 0.08296966552734375, 0.08857345581054688, 0.09417724609375, 0.09978103637695312, 0.10538482666015625, 0.11098861694335938, 0.1165924072265625, 0.12219619750976562, 0.12779998779296875, 0.13340377807617188, 0.139007568359375, 0.14461135864257812, 0.15021514892578125, 0.15581893920898438, 0.1614227294921875, 0.16702651977539062, 0.17263031005859375, 0.17823410034179688, 0.183837890625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 12.0, 123.0, 734.0, 127.0, 16.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13747811317443848, -0.1349993646144867, -0.1325206160545349, -0.13004186749458313, -0.12756311893463135, -0.12508437037467957, -0.12260562181472778, -0.120126873254776, -0.11764812469482422, -0.11516937613487244, -0.11269062757492065, -0.11021187901496887, -0.10773313045501709, -0.10525438189506531, -0.10277563333511353, -0.10029688477516174, -0.09781814366579056, -0.09533939510583878, -0.092860646545887, -0.09038189798593521, -0.08790314942598343, -0.08542440086603165, -0.08294565230607986, -0.08046691119670868, -0.0779881626367569, -0.07550941407680511, -0.07303066551685333, -0.07055191695690155, -0.06807316839694977, -0.06559441983699799, -0.0631156712770462, -0.06063692644238472, -0.05815816670656204, -0.05567941814661026, -0.05320066958665848, -0.050721921026706696, -0.04824317246675491, -0.04576442390680313, -0.04328567907214165, -0.040806930512189865, -0.03832818567752838, -0.0358494371175766, -0.03337068855762482, -0.030891941860318184, -0.0284131933003664, -0.02593444474041462, -0.023455698043107986, -0.020976949483156204, -0.018498199060559273, -0.01601945050060749, -0.013540702871978283, -0.011061955243349075, -0.008583206683397293, -0.006104458123445511, -0.0036257104948163033, -0.0011469628661870956, 0.0013317856937646866, 0.0038105337880551815, 0.006289281882345676, 0.008768029510974884, 0.011246778070926666, 0.013725526630878448, 0.01620427519083023, 0.018683021888136864, 0.021161770448088646]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 13.0, 14.0, 9.0, 7.0, 19.0, 17.0, 23.0, 22.0, 31.0, 27.0, 29.0, 32.0, 43.0, 41.0, 43.0, 47.0, 46.0, 39.0, 38.0, 41.0, 43.0, 42.0, 39.0, 33.0, 34.0, 45.0, 22.0, 24.0, 15.0, 31.0, 18.0, 13.0, 9.0, 13.0, 6.0, 5.0, 6.0, 5.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.006684482097625732, -0.00648366566747427, -0.006282849237322807, -0.006082032807171345, -0.005881216377019882, -0.00568039994686842, -0.005479583516716957, -0.0052787670865654945, -0.005077950656414032, -0.004877134226262569, -0.004676317796111107, -0.004475501365959644, -0.004274684935808182, -0.004073868505656719, -0.0038730520755052567, -0.003672235645353794, -0.0034714192152023315, -0.003270602785050869, -0.0030697863548994064, -0.002868969924747944, -0.0026681534945964813, -0.0024673370644450188, -0.002266520634293556, -0.0020657042041420937, -0.001864887773990631, -0.0016640713438391685, -0.001463254913687706, -0.0012624384835362434, -0.0010616220533847809, -0.0008608056232333183, -0.0006599891930818558, -0.0004591727629303932, -0.00025835633277893066, -5.753990262746811e-05, 0.00014327652752399445, 0.000344092957675457, 0.0005449093878269196, 0.0007457258179783821, 0.0009465422481298447, 0.0011473586782813072, 0.0013481751084327698, 0.0015489915385842323, 0.0017498079687356949, 0.0019506243988871574, 0.00215144082903862, 0.0023522572591900826, 0.002553073689341545, 0.0027538901194930077, 0.00295470654964447, 0.0031555229797959328, 0.0033563394099473953, 0.003557155840098858, 0.0037579722702503204, 0.003958788700401783, 0.0041596051305532455, 0.004360421560704708, 0.004561237990856171, 0.004762054421007633, 0.004962870851159096, 0.005163687281310558, 0.005364503711462021, 0.005565320141613483, 0.005766136571764946, 0.0059669530019164085, 0.006167769432067871]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 7.0, 4.0, 9.0, 10.0, 15.0, 15.0, 10.0, 12.0, 26.0, 19.0, 16.0, 29.0, 34.0, 30.0, 20.0, 38.0, 40.0, 32.0, 31.0, 45.0, 33.0, 52.0, 50.0, 41.0, 29.0, 42.0, 33.0, 37.0, 33.0, 26.0, 25.0, 18.0, 23.0, 25.0, 21.0, 12.0, 10.0, 6.0, 7.0, 4.0, 7.0, 10.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.255859375, -2.1827392578125, -2.109619140625, -2.0364990234375, -1.96337890625, -1.8902587890625, -1.817138671875, -1.7440185546875, -1.6708984375, -1.5977783203125, -1.524658203125, -1.4515380859375, -1.37841796875, -1.3052978515625, -1.232177734375, -1.1590576171875, -1.0859375, -1.0128173828125, -0.939697265625, -0.8665771484375, -0.79345703125, -0.7203369140625, -0.647216796875, -0.5740966796875, -0.5009765625, -0.4278564453125, -0.354736328125, -0.2816162109375, -0.20849609375, -0.1353759765625, -0.062255859375, 0.0108642578125, 0.083984375, 0.1571044921875, 0.230224609375, 0.3033447265625, 0.37646484375, 0.4495849609375, 0.522705078125, 0.5958251953125, 0.6689453125, 0.7420654296875, 0.815185546875, 0.8883056640625, 0.96142578125, 1.0345458984375, 1.107666015625, 1.1807861328125, 1.25390625, 1.3270263671875, 1.400146484375, 1.4732666015625, 1.54638671875, 1.6195068359375, 1.692626953125, 1.7657470703125, 1.8388671875, 1.9119873046875, 1.985107421875, 2.0582275390625, 2.13134765625, 2.2044677734375, 2.277587890625, 2.3507080078125, 2.423828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 10.0, 17.0, 23.0, 36.0, 52.0, 92.0, 118.0, 201.0, 234.0, 403.0, 678.0, 956.0, 1668.0, 2774.0, 4763.0, 8594.0, 16666.0, 32820.0, 65263.0, 125342.0, 210439.0, 237904.0, 160783.0, 86517.0, 43749.0, 22184.0, 11279.0, 6123.0, 3301.0, 2043.0, 1213.0, 831.0, 495.0, 319.0, 230.0, 135.0, 101.0, 59.0, 39.0, 25.0, 30.0, 11.0, 6.0, 6.0, 5.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8544921875, -1.7931060791015625, -1.731719970703125, -1.6703338623046875, -1.60894775390625, -1.5475616455078125, -1.486175537109375, -1.4247894287109375, -1.3634033203125, -1.3020172119140625, -1.240631103515625, -1.1792449951171875, -1.11785888671875, -1.0564727783203125, -0.995086669921875, -0.9337005615234375, -0.872314453125, -0.8109283447265625, -0.749542236328125, -0.6881561279296875, -0.62677001953125, -0.5653839111328125, -0.503997802734375, -0.4426116943359375, -0.3812255859375, -0.3198394775390625, -0.258453369140625, -0.1970672607421875, -0.13568115234375, -0.0742950439453125, -0.012908935546875, 0.0484771728515625, 0.10986328125, 0.1712493896484375, 0.232635498046875, 0.2940216064453125, 0.35540771484375, 0.4167938232421875, 0.478179931640625, 0.5395660400390625, 0.6009521484375, 0.6623382568359375, 0.723724365234375, 0.7851104736328125, 0.84649658203125, 0.9078826904296875, 0.969268798828125, 1.0306549072265625, 1.092041015625, 1.1534271240234375, 1.214813232421875, 1.2761993408203125, 1.33758544921875, 1.3989715576171875, 1.460357666015625, 1.5217437744140625, 1.5831298828125, 1.6445159912109375, 1.705902099609375, 1.7672882080078125, 1.82867431640625, 1.8900604248046875, 1.951446533203125, 2.0128326416015625, 2.07421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 7.0, 17.0, 14.0, 10.0, 23.0, 33.0, 30.0, 32.0, 32.0, 37.0, 46.0, 35.0, 71.0, 125.0, 222.0, 1413.0, 294.0, 125.0, 69.0, 60.0, 50.0, 46.0, 35.0, 39.0, 33.0, 23.0, 21.0, 18.0, 19.0, 7.0, 14.0, 12.0, 3.0, 7.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.3726806640625, -8.081298828125, -7.7899169921875, -7.49853515625, -7.2071533203125, -6.915771484375, -6.6243896484375, -6.3330078125, -6.0416259765625, -5.750244140625, -5.4588623046875, -5.16748046875, -4.8760986328125, -4.584716796875, -4.2933349609375, -4.001953125, -3.7105712890625, -3.419189453125, -3.1278076171875, -2.83642578125, -2.5450439453125, -2.253662109375, -1.9622802734375, -1.6708984375, -1.3795166015625, -1.088134765625, -0.7967529296875, -0.50537109375, -0.2139892578125, 0.077392578125, 0.3687744140625, 0.66015625, 0.9515380859375, 1.242919921875, 1.5343017578125, 1.82568359375, 2.1170654296875, 2.408447265625, 2.6998291015625, 2.9912109375, 3.2825927734375, 3.573974609375, 3.8653564453125, 4.15673828125, 4.4481201171875, 4.739501953125, 5.0308837890625, 5.322265625, 5.6136474609375, 5.905029296875, 6.1964111328125, 6.48779296875, 6.7791748046875, 7.070556640625, 7.3619384765625, 7.6533203125, 7.9447021484375, 8.236083984375, 8.5274658203125, 8.81884765625, 9.1102294921875, 9.401611328125, 9.6929931640625, 9.984375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 9.0, 5.0, 11.0, 12.0, 18.0, 20.0, 25.0, 20.0, 49.0, 58.0, 78.0, 78.0, 137.0, 226.0, 407.0, 1128.0, 6031.0, 101640.0, 2803999.0, 219760.0, 9261.0, 1369.0, 515.0, 239.0, 173.0, 105.0, 71.0, 57.0, 50.0, 31.0, 30.0, 20.0, 14.0, 13.0, 13.0, 7.0, 6.0, 6.0, 5.0, 1.0, 3.0, 6.0, 0.0, 1.0, 1.0, 3.0], "bins": [-16.171875, -15.72998046875, -15.2880859375, -14.84619140625, -14.404296875, -13.96240234375, -13.5205078125, -13.07861328125, -12.63671875, -12.19482421875, -11.7529296875, -11.31103515625, -10.869140625, -10.42724609375, -9.9853515625, -9.54345703125, -9.1015625, -8.65966796875, -8.2177734375, -7.77587890625, -7.333984375, -6.89208984375, -6.4501953125, -6.00830078125, -5.56640625, -5.12451171875, -4.6826171875, -4.24072265625, -3.798828125, -3.35693359375, -2.9150390625, -2.47314453125, -2.03125, -1.58935546875, -1.1474609375, -0.70556640625, -0.263671875, 0.17822265625, 0.6201171875, 1.06201171875, 1.50390625, 1.94580078125, 2.3876953125, 2.82958984375, 3.271484375, 3.71337890625, 4.1552734375, 4.59716796875, 5.0390625, 5.48095703125, 5.9228515625, 6.36474609375, 6.806640625, 7.24853515625, 7.6904296875, 8.13232421875, 8.57421875, 9.01611328125, 9.4580078125, 9.89990234375, 10.341796875, 10.78369140625, 11.2255859375, 11.66748046875, 12.109375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 89.0, 562.0, 339.0, 27.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.015636444091797, -17.07900619506836, -14.142375946044922, -11.205745697021484, -8.269115447998047, -5.332485198974609, -2.395854949951172, 0.5407752990722656, 3.477405548095703, 6.414035797119141, 9.350666046142578, 12.287296295166016, 15.223926544189453, 18.16055679321289, 21.097187042236328, 24.033817291259766, 26.970447540283203, 29.90707778930664, 32.84370803833008, 35.780338287353516, 38.71696853637695, 41.65359878540039, 44.59022903442383, 47.526859283447266, 50.4634895324707, 53.40011978149414, 56.33675003051758, 59.273380279541016, 62.21001052856445, 65.14663696289062, 68.08326721191406, 71.0198974609375, 73.95652770996094, 76.89315795898438, 79.82978820800781, 82.76641845703125, 85.70304870605469, 88.63967895507812, 91.57630920410156, 94.512939453125, 97.44956970214844, 100.38619995117188, 103.32283020019531, 106.25946044921875, 109.19609069824219, 112.13272094726562, 115.06935119628906, 118.0059814453125, 120.94261169433594, 123.87924194335938, 126.81587219238281, 129.75250244140625, 132.6891326904297, 135.62576293945312, 138.56239318847656, 141.4990234375, 144.43565368652344, 147.37228393554688, 150.3089141845703, 153.24554443359375, 156.1821746826172, 159.11880493164062, 162.05543518066406, 164.9920654296875, 167.92869567871094]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 2.0, 5.0, 7.0, 5.0, 6.0, 10.0, 15.0, 23.0, 13.0, 17.0, 36.0, 26.0, 31.0, 30.0, 31.0, 31.0, 37.0, 40.0, 42.0, 42.0, 44.0, 43.0, 37.0, 47.0, 35.0, 33.0, 34.0, 37.0, 31.0, 34.0, 29.0, 20.0, 26.0, 17.0, 13.0, 8.0, 10.0, 10.0, 8.0, 3.0, 6.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.738584518432617, -24.90179443359375, -24.06500244140625, -23.228212356567383, -22.391422271728516, -21.554630279541016, -20.71784019470215, -19.88105010986328, -19.04425811767578, -18.207468032836914, -17.370676040649414, -16.533885955810547, -15.69709587097168, -14.860304832458496, -14.023513793945312, -13.186723709106445, -12.349933624267578, -11.513142585754395, -10.676352500915527, -9.839561462402344, -9.002771377563477, -8.165980339050293, -7.329189300537109, -6.492398738861084, -5.655608177185059, -4.818817615509033, -3.9820268154144287, -3.145236015319824, -2.308445453643799, -1.4716548919677734, -0.6348638534545898, 0.20192670822143555, 1.038717269897461, 1.8755079507827759, 2.712298631668091, 3.5490894317626953, 4.385879993438721, 5.222670555114746, 6.05946159362793, 6.896252155303955, 7.7330427169799805, 8.569833755493164, 9.406623840332031, 10.243414878845215, 11.080205917358398, 11.916996002197266, 12.75378704071045, 13.590578079223633, 14.4273681640625, 15.264159202575684, 16.100950241088867, 16.937740325927734, 17.7745304107666, 18.61132049560547, 19.44811248779297, 20.284902572631836, 21.121692657470703, 21.95848274230957, 22.79527473449707, 23.632064819335938, 24.468854904174805, 25.305644989013672, 26.142436981201172, 26.97922706604004, 27.81601905822754]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 6.0, 5.0, 19.0, 20.0, 14.0, 16.0, 14.0, 18.0, 26.0, 32.0, 25.0, 30.0, 31.0, 31.0, 35.0, 38.0, 44.0, 37.0, 43.0, 41.0, 45.0, 33.0, 55.0, 36.0, 28.0, 39.0, 32.0, 31.0, 24.0, 23.0, 22.0, 18.0, 19.0, 11.0, 3.0, 12.0, 9.0, 5.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.578125, -2.499237060546875, -2.42034912109375, -2.341461181640625, -2.2625732421875, -2.183685302734375, -2.10479736328125, -2.025909423828125, -1.947021484375, -1.868133544921875, -1.78924560546875, -1.710357666015625, -1.6314697265625, -1.552581787109375, -1.47369384765625, -1.394805908203125, -1.31591796875, -1.237030029296875, -1.15814208984375, -1.079254150390625, -1.0003662109375, -0.921478271484375, -0.84259033203125, -0.763702392578125, -0.684814453125, -0.605926513671875, -0.52703857421875, -0.448150634765625, -0.3692626953125, -0.290374755859375, -0.21148681640625, -0.132598876953125, -0.0537109375, 0.025177001953125, 0.10406494140625, 0.182952880859375, 0.2618408203125, 0.340728759765625, 0.41961669921875, 0.498504638671875, 0.577392578125, 0.656280517578125, 0.73516845703125, 0.814056396484375, 0.8929443359375, 0.971832275390625, 1.05072021484375, 1.129608154296875, 1.20849609375, 1.287384033203125, 1.36627197265625, 1.445159912109375, 1.5240478515625, 1.602935791015625, 1.68182373046875, 1.760711669921875, 1.839599609375, 1.918487548828125, 1.99737548828125, 2.076263427734375, 2.1551513671875, 2.234039306640625, 2.31292724609375, 2.391815185546875, 2.470703125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 6.0, 9.0, 6.0, 7.0, 9.0, 13.0, 14.0, 19.0, 24.0, 29.0, 37.0, 53.0, 52.0, 105.0, 192.0, 403.0, 998.0, 3154.0, 11117.0, 47003.0, 245104.0, 1357564.0, 1968413.0, 453878.0, 80718.0, 17799.0, 4777.0, 1497.0, 588.0, 230.0, 144.0, 78.0, 70.0, 39.0, 25.0, 16.0, 18.0, 19.0, 7.0, 4.0, 11.0, 8.0, 5.0, 8.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.02734375, -5.84564208984375, -5.6639404296875, -5.48223876953125, -5.300537109375, -5.11883544921875, -4.9371337890625, -4.75543212890625, -4.57373046875, -4.39202880859375, -4.2103271484375, -4.02862548828125, -3.846923828125, -3.66522216796875, -3.4835205078125, -3.30181884765625, -3.1201171875, -2.93841552734375, -2.7567138671875, -2.57501220703125, -2.393310546875, -2.21160888671875, -2.0299072265625, -1.84820556640625, -1.66650390625, -1.48480224609375, -1.3031005859375, -1.12139892578125, -0.939697265625, -0.75799560546875, -0.5762939453125, -0.39459228515625, -0.212890625, -0.03118896484375, 0.1505126953125, 0.33221435546875, 0.513916015625, 0.69561767578125, 0.8773193359375, 1.05902099609375, 1.24072265625, 1.42242431640625, 1.6041259765625, 1.78582763671875, 1.967529296875, 2.14923095703125, 2.3309326171875, 2.51263427734375, 2.6943359375, 2.87603759765625, 3.0577392578125, 3.23944091796875, 3.421142578125, 3.60284423828125, 3.7845458984375, 3.96624755859375, 4.14794921875, 4.32965087890625, 4.5113525390625, 4.69305419921875, 4.874755859375, 5.05645751953125, 5.2381591796875, 5.41986083984375, 5.6015625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 4.0, 7.0, 15.0, 9.0, 8.0, 11.0, 19.0, 31.0, 34.0, 50.0, 70.0, 83.0, 90.0, 148.0, 187.0, 241.0, 285.0, 380.0, 377.0, 395.0, 346.0, 300.0, 235.0, 181.0, 123.0, 108.0, 76.0, 69.0, 47.0, 38.0, 22.0, 26.0, 11.0, 14.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.515625, -6.31732177734375, -6.1190185546875, -5.92071533203125, -5.722412109375, -5.52410888671875, -5.3258056640625, -5.12750244140625, -4.92919921875, -4.73089599609375, -4.5325927734375, -4.33428955078125, -4.135986328125, -3.93768310546875, -3.7393798828125, -3.54107666015625, -3.3427734375, -3.14447021484375, -2.9461669921875, -2.74786376953125, -2.549560546875, -2.35125732421875, -2.1529541015625, -1.95465087890625, -1.75634765625, -1.55804443359375, -1.3597412109375, -1.16143798828125, -0.963134765625, -0.76483154296875, -0.5665283203125, -0.36822509765625, -0.169921875, 0.02838134765625, 0.2266845703125, 0.42498779296875, 0.623291015625, 0.82159423828125, 1.0198974609375, 1.21820068359375, 1.41650390625, 1.61480712890625, 1.8131103515625, 2.01141357421875, 2.209716796875, 2.40802001953125, 2.6063232421875, 2.80462646484375, 3.0029296875, 3.20123291015625, 3.3995361328125, 3.59783935546875, 3.796142578125, 3.99444580078125, 4.1927490234375, 4.39105224609375, 4.58935546875, 4.78765869140625, 4.9859619140625, 5.18426513671875, 5.382568359375, 5.58087158203125, 5.7791748046875, 5.97747802734375, 6.17578125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 7.0, 14.0, 10.0, 27.0, 36.0, 54.0, 104.0, 118.0, 203.0, 343.0, 611.0, 1309.0, 3211.0, 9470.0, 37117.0, 183433.0, 967620.0, 2176440.0, 653187.0, 123001.0, 25862.0, 7111.0, 2478.0, 1090.0, 562.0, 293.0, 212.0, 121.0, 66.0, 45.0, 25.0, 17.0, 29.0, 10.0, 9.0, 6.0, 3.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.40625, -8.1201171875, -7.833984375, -7.5478515625, -7.26171875, -6.9755859375, -6.689453125, -6.4033203125, -6.1171875, -5.8310546875, -5.544921875, -5.2587890625, -4.97265625, -4.6865234375, -4.400390625, -4.1142578125, -3.828125, -3.5419921875, -3.255859375, -2.9697265625, -2.68359375, -2.3974609375, -2.111328125, -1.8251953125, -1.5390625, -1.2529296875, -0.966796875, -0.6806640625, -0.39453125, -0.1083984375, 0.177734375, 0.4638671875, 0.75, 1.0361328125, 1.322265625, 1.6083984375, 1.89453125, 2.1806640625, 2.466796875, 2.7529296875, 3.0390625, 3.3251953125, 3.611328125, 3.8974609375, 4.18359375, 4.4697265625, 4.755859375, 5.0419921875, 5.328125, 5.6142578125, 5.900390625, 6.1865234375, 6.47265625, 6.7587890625, 7.044921875, 7.3310546875, 7.6171875, 7.9033203125, 8.189453125, 8.4755859375, 8.76171875, 9.0478515625, 9.333984375, 9.6201171875, 9.90625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 5.0, 32.0, 68.0, 119.0, 181.0, 218.0, 177.0, 123.0, 53.0, 20.0, 14.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.094093322753906, -18.868501663208008, -16.64291000366211, -14.417318344116211, -12.191726684570312, -9.966135025024414, -7.740543365478516, -5.514951705932617, -3.2893600463867188, -1.0637683868408203, 1.1618232727050781, 3.3874149322509766, 5.613006591796875, 7.838598251342773, 10.064189910888672, 12.28978157043457, 14.515373229980469, 16.740964889526367, 18.966556549072266, 21.192148208618164, 23.417739868164062, 25.64333152770996, 27.86892318725586, 30.094514846801758, 32.320106506347656, 34.54570007324219, 36.77128982543945, 38.99687957763672, 41.22247314453125, 43.44806671142578, 45.67365646362305, 47.89924621582031, 50.124847412109375, 52.350440979003906, 54.57603073120117, 56.80162048339844, 59.02721405029297, 61.2528076171875, 63.478397369384766, 65.70398712158203, 67.92958068847656, 70.1551742553711, 72.38076782226562, 74.60635375976562, 76.83194732666016, 79.05754089355469, 81.28312683105469, 83.50872039794922, 85.73431396484375, 87.95990753173828, 90.18550109863281, 92.41108703613281, 94.63668060302734, 96.86227416992188, 99.08786010742188, 101.3134536743164, 103.53904724121094, 105.76464080810547, 107.990234375, 110.2158203125, 112.44141387939453, 114.66700744628906, 116.89259338378906, 119.1181869506836, 121.34378051757812]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 7.0, 4.0, 4.0, 9.0, 4.0, 7.0, 9.0, 9.0, 20.0, 7.0, 9.0, 17.0, 17.0, 18.0, 19.0, 19.0, 19.0, 32.0, 25.0, 22.0, 32.0, 27.0, 33.0, 42.0, 34.0, 38.0, 46.0, 41.0, 36.0, 36.0, 35.0, 30.0, 32.0, 26.0, 31.0, 20.0, 16.0, 18.0, 20.0, 16.0, 18.0, 19.0, 8.0, 11.0, 8.0, 15.0, 5.0, 6.0, 5.0, 3.0, 7.0, 7.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-17.83978271484375, -17.23238754272461, -16.624990463256836, -16.017595291137695, -15.410199165344238, -14.802803039550781, -14.195406913757324, -13.588010787963867, -12.980615615844727, -12.37321949005127, -11.765823364257812, -11.158428192138672, -10.551032066345215, -9.943635940551758, -9.3362398147583, -8.728843688964844, -8.121447563171387, -7.51405143737793, -6.906655788421631, -6.299259662628174, -5.691864013671875, -5.084467887878418, -4.477071762084961, -3.869676113128662, -3.262279987335205, -2.654884099960327, -2.047488212585449, -1.4400920867919922, -0.8326961994171143, -0.22530031204223633, 0.3820958137512207, 0.9894914627075195, 1.5968875885009766, 2.2042834758758545, 2.8116793632507324, 3.4190754890441895, 4.026471138000488, 4.633867263793945, 5.241263389587402, 5.848659038543701, 6.456055164337158, 7.063451290130615, 7.670846939086914, 8.278243064880371, 8.885639190673828, 9.493034362792969, 10.100431442260742, 10.707826614379883, 11.31522274017334, 11.922618865966797, 12.530014991760254, 13.137411117553711, 13.744806289672852, 14.352202415466309, 14.959598541259766, 15.566993713378906, 16.17439079284668, 16.78178596496582, 17.389183044433594, 17.996578216552734, 18.603975296020508, 19.21137046813965, 19.818767547607422, 20.426162719726562, 21.033557891845703]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 5.0, 11.0, 10.0, 11.0, 13.0, 16.0, 19.0, 21.0, 24.0, 20.0, 16.0, 45.0, 24.0, 30.0, 38.0, 33.0, 37.0, 31.0, 52.0, 50.0, 44.0, 43.0, 47.0, 44.0, 37.0, 46.0, 26.0, 24.0, 28.0, 29.0, 15.0, 14.0, 11.0, 16.0, 12.0, 12.0, 14.0, 10.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.76171875, -2.67889404296875, -2.5960693359375, -2.51324462890625, -2.430419921875, -2.34759521484375, -2.2647705078125, -2.18194580078125, -2.09912109375, -2.01629638671875, -1.9334716796875, -1.85064697265625, -1.767822265625, -1.68499755859375, -1.6021728515625, -1.51934814453125, -1.4365234375, -1.35369873046875, -1.2708740234375, -1.18804931640625, -1.105224609375, -1.02239990234375, -0.9395751953125, -0.85675048828125, -0.77392578125, -0.69110107421875, -0.6082763671875, -0.52545166015625, -0.442626953125, -0.35980224609375, -0.2769775390625, -0.19415283203125, -0.111328125, -0.02850341796875, 0.0543212890625, 0.13714599609375, 0.219970703125, 0.30279541015625, 0.3856201171875, 0.46844482421875, 0.55126953125, 0.63409423828125, 0.7169189453125, 0.79974365234375, 0.882568359375, 0.96539306640625, 1.0482177734375, 1.13104248046875, 1.2138671875, 1.29669189453125, 1.3795166015625, 1.46234130859375, 1.545166015625, 1.62799072265625, 1.7108154296875, 1.79364013671875, 1.87646484375, 1.95928955078125, 2.0421142578125, 2.12493896484375, 2.207763671875, 2.29058837890625, 2.3734130859375, 2.45623779296875, 2.5390625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 19.0, 34.0, 37.0, 71.0, 81.0, 138.0, 173.0, 261.0, 430.0, 589.0, 915.0, 1306.0, 1954.0, 3041.0, 4488.0, 6735.0, 10650.0, 16347.0, 24982.0, 38282.0, 59527.0, 90353.0, 131444.0, 170961.0, 156703.0, 112210.0, 75622.0, 49315.0, 31810.0, 20720.0, 13498.0, 8779.0, 5732.0, 3858.0, 2553.0, 1602.0, 1098.0, 714.0, 485.0, 352.0, 222.0, 147.0, 79.0, 70.0, 49.0, 36.0, 14.0, 17.0, 8.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.222412109375, -0.21541404724121094, -0.20841598510742188, -0.2014179229736328, -0.19441986083984375, -0.1874217987060547, -0.18042373657226562, -0.17342567443847656, -0.1664276123046875, -0.15942955017089844, -0.15243148803710938, -0.1454334259033203, -0.13843536376953125, -0.1314373016357422, -0.12443923950195312, -0.11744117736816406, -0.110443115234375, -0.10344505310058594, -0.09644699096679688, -0.08944892883300781, -0.08245086669921875, -0.07545280456542969, -0.06845474243164062, -0.06145668029785156, -0.0544586181640625, -0.04746055603027344, -0.040462493896484375, -0.03346443176269531, -0.02646636962890625, -0.019468307495117188, -0.012470245361328125, -0.0054721832275390625, 0.00152587890625, 0.008523941040039062, 0.015522003173828125, 0.022520065307617188, 0.02951812744140625, 0.03651618957519531, 0.043514251708984375, 0.05051231384277344, 0.0575103759765625, 0.06450843811035156, 0.07150650024414062, 0.07850456237792969, 0.08550262451171875, 0.09250068664550781, 0.09949874877929688, 0.10649681091308594, 0.113494873046875, 0.12049293518066406, 0.12749099731445312, 0.1344890594482422, 0.14148712158203125, 0.1484851837158203, 0.15548324584960938, 0.16248130798339844, 0.1694793701171875, 0.17647743225097656, 0.18347549438476562, 0.1904735565185547, 0.19747161865234375, 0.2044696807861328, 0.21146774291992188, 0.21846580505371094, 0.2254638671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 4.0, 6.0, 8.0, 4.0, 10.0, 11.0, 12.0, 15.0, 19.0, 17.0, 26.0, 31.0, 21.0, 19.0, 40.0, 35.0, 44.0, 42.0, 32.0, 43.0, 35.0, 1073.0, 41.0, 43.0, 33.0, 25.0, 47.0, 32.0, 33.0, 36.0, 27.0, 27.0, 21.0, 15.0, 14.0, 18.0, 8.0, 8.0, 8.0, 7.0, 9.0, 8.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.640625, -1.588775634765625, -1.53692626953125, -1.485076904296875, -1.4332275390625, -1.381378173828125, -1.32952880859375, -1.277679443359375, -1.225830078125, -1.173980712890625, -1.12213134765625, -1.070281982421875, -1.0184326171875, -0.966583251953125, -0.91473388671875, -0.862884521484375, -0.81103515625, -0.759185791015625, -0.70733642578125, -0.655487060546875, -0.6036376953125, -0.551788330078125, -0.49993896484375, -0.448089599609375, -0.396240234375, -0.344390869140625, -0.29254150390625, -0.240692138671875, -0.1888427734375, -0.136993408203125, -0.08514404296875, -0.033294677734375, 0.0185546875, 0.070404052734375, 0.12225341796875, 0.174102783203125, 0.2259521484375, 0.277801513671875, 0.32965087890625, 0.381500244140625, 0.433349609375, 0.485198974609375, 0.53704833984375, 0.588897705078125, 0.6407470703125, 0.692596435546875, 0.74444580078125, 0.796295166015625, 0.84814453125, 0.899993896484375, 0.95184326171875, 1.003692626953125, 1.0555419921875, 1.107391357421875, 1.15924072265625, 1.211090087890625, 1.262939453125, 1.314788818359375, 1.36663818359375, 1.418487548828125, 1.4703369140625, 1.522186279296875, 1.57403564453125, 1.625885009765625, 1.677734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 7.0, 15.0, 17.0, 38.0, 48.0, 77.0, 82.0, 161.0, 260.0, 344.0, 530.0, 880.0, 1328.0, 2085.0, 3224.0, 5209.0, 8292.0, 13242.0, 20746.0, 32162.0, 49002.0, 72762.0, 102600.0, 138708.0, 1171127.0, 147560.0, 105952.0, 75965.0, 51445.0, 33910.0, 21752.0, 13734.0, 8825.0, 5437.0, 3492.0, 2196.0, 1386.0, 848.0, 620.0, 353.0, 244.0, 164.0, 97.0, 81.0, 47.0, 25.0, 20.0, 15.0, 4.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0], "bins": [-0.1328125, -0.1286029815673828, -0.12439346313476562, -0.12018394470214844, -0.11597442626953125, -0.11176490783691406, -0.10755538940429688, -0.10334587097167969, -0.0991363525390625, -0.09492683410644531, -0.09071731567382812, -0.08650779724121094, -0.08229827880859375, -0.07808876037597656, -0.07387924194335938, -0.06966972351074219, -0.065460205078125, -0.06125068664550781, -0.057041168212890625, -0.05283164978027344, -0.04862213134765625, -0.04441261291503906, -0.040203094482421875, -0.03599357604980469, -0.0317840576171875, -0.027574539184570312, -0.023365020751953125, -0.019155502319335938, -0.01494598388671875, -0.010736465454101562, -0.006526947021484375, -0.0023174285888671875, 0.00189208984375, 0.0061016082763671875, 0.010311126708984375, 0.014520645141601562, 0.01873016357421875, 0.022939682006835938, 0.027149200439453125, 0.03135871887207031, 0.0355682373046875, 0.03977775573730469, 0.043987274169921875, 0.04819679260253906, 0.05240631103515625, 0.05661582946777344, 0.060825347900390625, 0.06503486633300781, 0.069244384765625, 0.07345390319824219, 0.07766342163085938, 0.08187294006347656, 0.08608245849609375, 0.09029197692871094, 0.09450149536132812, 0.09871101379394531, 0.1029205322265625, 0.10713005065917969, 0.11133956909179688, 0.11554908752441406, 0.11975860595703125, 0.12396812438964844, 0.12817764282226562, 0.1323871612548828, 0.1365966796875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 8.0, 8.0, 4.0, 9.0, 26.0, 21.0, 13.0, 34.0, 49.0, 36.0, 64.0, 76.0, 79.0, 89.0, 88.0, 83.0, 72.0, 49.0, 36.0, 34.0, 22.0, 20.0, 14.0, 11.0, 6.0, 9.0, 2.0, 6.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00914764404296875, -0.008875608444213867, -0.008603572845458984, -0.008331537246704102, -0.008059501647949219, -0.007787466049194336, -0.007515430450439453, -0.00724339485168457, -0.0069713592529296875, -0.006699323654174805, -0.006427288055419922, -0.006155252456665039, -0.005883216857910156, -0.0056111812591552734, -0.005339145660400391, -0.005067110061645508, -0.004795074462890625, -0.004523038864135742, -0.004251003265380859, -0.0039789676666259766, -0.0037069320678710938, -0.003434896469116211, -0.003162860870361328, -0.0028908252716064453, -0.0026187896728515625, -0.0023467540740966797, -0.002074718475341797, -0.001802682876586914, -0.0015306472778320312, -0.0012586116790771484, -0.0009865760803222656, -0.0007145404815673828, -0.0004425048828125, -0.0001704692840576172, 0.00010156631469726562, 0.00037360191345214844, 0.0006456375122070312, 0.0009176731109619141, 0.0011897087097167969, 0.0014617443084716797, 0.0017337799072265625, 0.0020058155059814453, 0.002277851104736328, 0.002549886703491211, 0.0028219223022460938, 0.0030939579010009766, 0.0033659934997558594, 0.003638029098510742, 0.003910064697265625, 0.004182100296020508, 0.004454135894775391, 0.0047261714935302734, 0.004998207092285156, 0.005270242691040039, 0.005542278289794922, 0.005814313888549805, 0.0060863494873046875, 0.00635838508605957, 0.006630420684814453, 0.006902456283569336, 0.007174491882324219, 0.0074465274810791016, 0.007718563079833984, 0.007990598678588867, 0.00826263427734375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 7.0, 13.0, 10.0, 10.0, 9.0, 13.0, 21.0, 26.0, 29.0, 54.0, 58.0, 75.0, 147.0, 246.0, 762.0, 10159.0, 921639.0, 111874.0, 2407.0, 424.0, 153.0, 102.0, 79.0, 56.0, 32.0, 31.0, 23.0, 17.0, 20.0, 15.0, 3.0, 5.0, 6.0, 3.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.1581401824951172, -0.15282821655273438, -0.14751625061035156, -0.14220428466796875, -0.13689231872558594, -0.13158035278320312, -0.1262683868408203, -0.1209564208984375, -0.11564445495605469, -0.11033248901367188, -0.10502052307128906, -0.09970855712890625, -0.09439659118652344, -0.08908462524414062, -0.08377265930175781, -0.078460693359375, -0.07314872741699219, -0.06783676147460938, -0.06252479553222656, -0.05721282958984375, -0.05190086364746094, -0.046588897705078125, -0.04127693176269531, -0.0359649658203125, -0.030652999877929688, -0.025341033935546875, -0.020029067993164062, -0.01471710205078125, -0.009405136108398438, -0.004093170166015625, 0.0012187957763671875, 0.00653076171875, 0.011842727661132812, 0.017154693603515625, 0.022466659545898438, 0.02777862548828125, 0.03309059143066406, 0.038402557373046875, 0.04371452331542969, 0.0490264892578125, 0.05433845520019531, 0.059650421142578125, 0.06496238708496094, 0.07027435302734375, 0.07558631896972656, 0.08089828491210938, 0.08621025085449219, 0.091522216796875, 0.09683418273925781, 0.10214614868164062, 0.10745811462402344, 0.11277008056640625, 0.11808204650878906, 0.12339401245117188, 0.1287059783935547, 0.1340179443359375, 0.1393299102783203, 0.14464187622070312, 0.14995384216308594, 0.15526580810546875, 0.16057777404785156, 0.16588973999023438, 0.1712017059326172, 0.176513671875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 14.0, 160.0, 642.0, 152.0, 40.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13771268725395203, -0.13492564857006073, -0.13213860988616943, -0.12935155630111694, -0.12656451761722565, -0.12377747893333435, -0.12099044024944305, -0.11820340156555176, -0.11541636288166046, -0.11262932419776917, -0.10984227806329727, -0.10705523937940598, -0.10426820069551468, -0.10148115456104279, -0.09869411587715149, -0.09590707719326019, -0.0931200310587883, -0.090332992374897, -0.08754594624042511, -0.08475890755653381, -0.08197186887264252, -0.07918483018875122, -0.07639778405427933, -0.07361074537038803, -0.07082369923591614, -0.06803666055202484, -0.06524961441755295, -0.06246257573366165, -0.059675537049770355, -0.05688849464058876, -0.054101452231407166, -0.05131441354751587, -0.048527367413043976, -0.04574032500386238, -0.042953286319971085, -0.04016624391078949, -0.03737920522689819, -0.0345921628177166, -0.031805120408535004, -0.029018079861998558, -0.026231039315462112, -0.023443998768925667, -0.02065695822238922, -0.017869915813207626, -0.01508287526667118, -0.012295834720134735, -0.00950879231095314, -0.006721751764416695, -0.003934711217880249, -0.001147670205682516, 0.0016393708065152168, 0.004426412284374237, 0.007213452830910683, 0.010000493377447128, 0.012787535786628723, 0.015574576333165169, 0.018361616879701614, 0.02114865742623806, 0.023935697972774506, 0.0267227403819561, 0.029509780928492546, 0.03229682147502899, 0.03508386388421059, 0.03787090629339218, 0.04065794497728348]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 6.0, 9.0, 13.0, 8.0, 16.0, 22.0, 17.0, 19.0, 21.0, 24.0, 35.0, 30.0, 28.0, 30.0, 30.0, 36.0, 39.0, 35.0, 35.0, 40.0, 46.0, 43.0, 34.0, 40.0, 36.0, 33.0, 32.0, 23.0, 28.0, 31.0, 21.0, 21.0, 22.0, 16.0, 16.0, 8.0, 9.0, 9.0, 6.0, 3.0, 6.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.008411288261413574, -0.008155453018844128, -0.007899617776274681, -0.0076437825337052345, -0.007387947291135788, -0.007132112048566341, -0.006876276805996895, -0.006620441563427448, -0.006364606320858002, -0.006108771078288555, -0.005852935835719109, -0.005597100593149662, -0.0053412653505802155, -0.005085430108010769, -0.004829594865441322, -0.004573759622871876, -0.004317924380302429, -0.004062089137732983, -0.003806253895163536, -0.0035504186525940895, -0.003294583410024643, -0.0030387481674551964, -0.00278291292488575, -0.0025270776823163033, -0.0022712424397468567, -0.00201540719717741, -0.0017595719546079636, -0.001503736712038517, -0.0012479014694690704, -0.0009920662268996239, -0.0007362309843301773, -0.00048039574176073074, -0.00022456049919128418, 3.1274743378162384e-05, 0.00028710998594760895, 0.0005429452285170555, 0.0007987804710865021, 0.0010546157136559486, 0.0013104509562253952, 0.0015662861987948418, 0.0018221214413642883, 0.002077956683933735, 0.0023337919265031815, 0.002589627169072628, 0.0028454624116420746, 0.003101297654211521, 0.0033571328967809677, 0.0036129681393504143, 0.003868803381919861, 0.004124638624489307, 0.004380473867058754, 0.0046363091096282005, 0.004892144352197647, 0.005147979594767094, 0.00540381483733654, 0.005659650079905987, 0.005915485322475433, 0.00617132056504488, 0.0064271558076143265, 0.006682991050183773, 0.00693882629275322, 0.007194661535322666, 0.007450496777892113, 0.007706332020461559, 0.007962167263031006]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 5.0, 11.0, 10.0, 11.0, 13.0, 16.0, 19.0, 21.0, 24.0, 20.0, 16.0, 45.0, 24.0, 30.0, 38.0, 33.0, 37.0, 31.0, 52.0, 50.0, 44.0, 43.0, 47.0, 44.0, 37.0, 46.0, 26.0, 24.0, 28.0, 29.0, 15.0, 14.0, 11.0, 16.0, 12.0, 12.0, 14.0, 10.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.76171875, -2.67889404296875, -2.5960693359375, -2.51324462890625, -2.430419921875, -2.34759521484375, -2.2647705078125, -2.18194580078125, -2.09912109375, -2.01629638671875, -1.9334716796875, -1.85064697265625, -1.767822265625, -1.68499755859375, -1.6021728515625, -1.51934814453125, -1.4365234375, -1.35369873046875, -1.2708740234375, -1.18804931640625, -1.105224609375, -1.02239990234375, -0.9395751953125, -0.85675048828125, -0.77392578125, -0.69110107421875, -0.6082763671875, -0.52545166015625, -0.442626953125, -0.35980224609375, -0.2769775390625, -0.19415283203125, -0.111328125, -0.02850341796875, 0.0543212890625, 0.13714599609375, 0.219970703125, 0.30279541015625, 0.3856201171875, 0.46844482421875, 0.55126953125, 0.63409423828125, 0.7169189453125, 0.79974365234375, 0.882568359375, 0.96539306640625, 1.0482177734375, 1.13104248046875, 1.2138671875, 1.29669189453125, 1.3795166015625, 1.46234130859375, 1.545166015625, 1.62799072265625, 1.7108154296875, 1.79364013671875, 1.87646484375, 1.95928955078125, 2.0421142578125, 2.12493896484375, 2.207763671875, 2.29058837890625, 2.3734130859375, 2.45623779296875, 2.5390625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 8.0, 9.0, 11.0, 31.0, 38.0, 49.0, 75.0, 104.0, 160.0, 224.0, 459.0, 714.0, 1261.0, 2391.0, 4287.0, 8488.0, 19145.0, 48207.0, 140689.0, 405684.0, 269722.0, 87865.0, 31830.0, 13232.0, 6200.0, 3331.0, 1715.0, 1041.0, 592.0, 373.0, 196.0, 126.0, 96.0, 50.0, 35.0, 27.0, 24.0, 14.0, 14.0, 12.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.046875, -3.9195556640625, -3.792236328125, -3.6649169921875, -3.53759765625, -3.4102783203125, -3.282958984375, -3.1556396484375, -3.0283203125, -2.9010009765625, -2.773681640625, -2.6463623046875, -2.51904296875, -2.3917236328125, -2.264404296875, -2.1370849609375, -2.009765625, -1.8824462890625, -1.755126953125, -1.6278076171875, -1.50048828125, -1.3731689453125, -1.245849609375, -1.1185302734375, -0.9912109375, -0.8638916015625, -0.736572265625, -0.6092529296875, -0.48193359375, -0.3546142578125, -0.227294921875, -0.0999755859375, 0.02734375, 0.1546630859375, 0.281982421875, 0.4093017578125, 0.53662109375, 0.6639404296875, 0.791259765625, 0.9185791015625, 1.0458984375, 1.1732177734375, 1.300537109375, 1.4278564453125, 1.55517578125, 1.6824951171875, 1.809814453125, 1.9371337890625, 2.064453125, 2.1917724609375, 2.319091796875, 2.4464111328125, 2.57373046875, 2.7010498046875, 2.828369140625, 2.9556884765625, 3.0830078125, 3.2103271484375, 3.337646484375, 3.4649658203125, 3.59228515625, 3.7196044921875, 3.846923828125, 3.9742431640625, 4.1015625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 11.0, 10.0, 11.0, 11.0, 10.0, 20.0, 19.0, 18.0, 22.0, 27.0, 35.0, 51.0, 61.0, 68.0, 91.0, 152.0, 284.0, 1391.0, 235.0, 113.0, 75.0, 50.0, 41.0, 42.0, 31.0, 33.0, 23.0, 21.0, 17.0, 16.0, 11.0, 11.0, 16.0, 8.0, 4.0, 0.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.625, -10.285400390625, -9.94580078125, -9.606201171875, -9.2666015625, -8.927001953125, -8.58740234375, -8.247802734375, -7.908203125, -7.568603515625, -7.22900390625, -6.889404296875, -6.5498046875, -6.210205078125, -5.87060546875, -5.531005859375, -5.19140625, -4.851806640625, -4.51220703125, -4.172607421875, -3.8330078125, -3.493408203125, -3.15380859375, -2.814208984375, -2.474609375, -2.135009765625, -1.79541015625, -1.455810546875, -1.1162109375, -0.776611328125, -0.43701171875, -0.097412109375, 0.2421875, 0.581787109375, 0.92138671875, 1.260986328125, 1.6005859375, 1.940185546875, 2.27978515625, 2.619384765625, 2.958984375, 3.298583984375, 3.63818359375, 3.977783203125, 4.3173828125, 4.656982421875, 4.99658203125, 5.336181640625, 5.67578125, 6.015380859375, 6.35498046875, 6.694580078125, 7.0341796875, 7.373779296875, 7.71337890625, 8.052978515625, 8.392578125, 8.732177734375, 9.07177734375, 9.411376953125, 9.7509765625, 10.090576171875, 10.43017578125, 10.769775390625, 11.109375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 4.0, 11.0, 13.0, 14.0, 24.0, 23.0, 43.0, 49.0, 77.0, 123.0, 183.0, 356.0, 978.0, 7536.0, 1139258.0, 1985471.0, 9472.0, 1061.0, 397.0, 211.0, 112.0, 84.0, 52.0, 47.0, 29.0, 25.0, 17.0, 7.0, 8.0, 8.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.640625, -28.769775390625, -27.89892578125, -27.028076171875, -26.1572265625, -25.286376953125, -24.41552734375, -23.544677734375, -22.673828125, -21.802978515625, -20.93212890625, -20.061279296875, -19.1904296875, -18.319580078125, -17.44873046875, -16.577880859375, -15.70703125, -14.836181640625, -13.96533203125, -13.094482421875, -12.2236328125, -11.352783203125, -10.48193359375, -9.611083984375, -8.740234375, -7.869384765625, -6.99853515625, -6.127685546875, -5.2568359375, -4.385986328125, -3.51513671875, -2.644287109375, -1.7734375, -0.902587890625, -0.03173828125, 0.839111328125, 1.7099609375, 2.580810546875, 3.45166015625, 4.322509765625, 5.193359375, 6.064208984375, 6.93505859375, 7.805908203125, 8.6767578125, 9.547607421875, 10.41845703125, 11.289306640625, 12.16015625, 13.031005859375, 13.90185546875, 14.772705078125, 15.6435546875, 16.514404296875, 17.38525390625, 18.256103515625, 19.126953125, 19.997802734375, 20.86865234375, 21.739501953125, 22.6103515625, 23.481201171875, 24.35205078125, 25.222900390625, 26.09375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 20.0, 62.0, 105.0, 190.0, 232.0, 173.0, 119.0, 62.0, 29.0, 9.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.874847412109375, -47.75250244140625, -46.63016128540039, -45.507816314697266, -44.385475158691406, -43.26313018798828, -42.14078903198242, -41.0184440612793, -39.89610290527344, -38.77375793457031, -37.65141677856445, -36.52907180786133, -35.40673065185547, -34.284385681152344, -33.162044525146484, -32.03969955444336, -30.917354583740234, -29.795011520385742, -28.67266845703125, -27.550325393676758, -26.427982330322266, -25.30563735961914, -24.18329429626465, -23.060951232910156, -21.938608169555664, -20.816265106201172, -19.69392204284668, -18.571578979492188, -17.449234008789062, -16.326892852783203, -15.204547882080078, -14.082204818725586, -12.95986557006836, -11.837522506713867, -10.715179443359375, -9.592835426330566, -8.470492362976074, -7.348149299621582, -6.225805759429932, -5.103462219238281, -3.981119155883789, -2.8587758541107178, -1.7364325523376465, -0.6140892505645752, 0.5082540512084961, 1.6305971145629883, 2.7529406547546387, 3.875284194946289, 4.997627258300781, 6.119970321655273, 7.242313861846924, 8.364657402038574, 9.487000465393066, 10.609343528747559, 11.731687545776367, 12.85403060913086, 13.976373672485352, 15.098716735839844, 16.221059799194336, 17.343402862548828, 18.465747833251953, 19.588088989257812, 20.710433959960938, 21.83277702331543, 22.955120086669922]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 8.0, 6.0, 7.0, 2.0, 5.0, 18.0, 10.0, 18.0, 12.0, 16.0, 20.0, 23.0, 20.0, 22.0, 29.0, 25.0, 27.0, 25.0, 37.0, 29.0, 43.0, 37.0, 42.0, 40.0, 23.0, 32.0, 29.0, 28.0, 32.0, 40.0, 36.0, 42.0, 29.0, 24.0, 24.0, 18.0, 22.0, 12.0, 18.0, 14.0, 7.0, 6.0, 9.0, 5.0, 6.0, 10.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.633089065551758, -23.84441375732422, -23.055740356445312, -22.267065048217773, -21.478389739990234, -20.689716339111328, -19.90104103088379, -19.11236572265625, -18.323692321777344, -17.535017013549805, -16.7463436126709, -15.95766830444336, -15.168993949890137, -14.380319595336914, -13.591644287109375, -12.802969932556152, -12.01429557800293, -11.225621223449707, -10.436946868896484, -9.648271560668945, -8.859597206115723, -8.0709228515625, -7.282248020172119, -6.493573188781738, -5.704898834228516, -4.916224479675293, -4.127549648284912, -3.3388750553131104, -2.5502004623413086, -1.7615258693695068, -0.9728512763977051, -0.18417644500732422, 0.6044998168945312, 1.393174409866333, 2.1818490028381348, 2.9705235958099365, 3.7591981887817383, 4.547872543334961, 5.336547374725342, 6.125222206115723, 6.913896560668945, 7.702570915222168, 8.49124526977539, 9.27992057800293, 10.068594932556152, 10.857269287109375, 11.645944595336914, 12.434618949890137, 13.22329330444336, 14.011967658996582, 14.800642013549805, 15.589317321777344, 16.37799072265625, 17.16666603088379, 17.955341339111328, 18.744014739990234, 19.532690048217773, 20.321365356445312, 21.11003875732422, 21.898714065551758, 22.687389373779297, 23.476062774658203, 24.264738082885742, 25.05341339111328, 25.842086791992188]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 9.0, 11.0, 12.0, 5.0, 11.0, 15.0, 15.0, 16.0, 20.0, 28.0, 24.0, 21.0, 44.0, 27.0, 31.0, 31.0, 45.0, 34.0, 37.0, 51.0, 43.0, 44.0, 44.0, 43.0, 26.0, 41.0, 34.0, 33.0, 28.0, 26.0, 30.0, 21.0, 8.0, 15.0, 9.0, 18.0, 9.0, 13.0, 5.0, 7.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.939453125, -2.852752685546875, -2.76605224609375, -2.679351806640625, -2.5926513671875, -2.505950927734375, -2.41925048828125, -2.332550048828125, -2.245849609375, -2.159149169921875, -2.07244873046875, -1.985748291015625, -1.8990478515625, -1.812347412109375, -1.72564697265625, -1.638946533203125, -1.55224609375, -1.465545654296875, -1.37884521484375, -1.292144775390625, -1.2054443359375, -1.118743896484375, -1.03204345703125, -0.945343017578125, -0.858642578125, -0.771942138671875, -0.68524169921875, -0.598541259765625, -0.5118408203125, -0.425140380859375, -0.33843994140625, -0.251739501953125, -0.1650390625, -0.078338623046875, 0.00836181640625, 0.095062255859375, 0.1817626953125, 0.268463134765625, 0.35516357421875, 0.441864013671875, 0.528564453125, 0.615264892578125, 0.70196533203125, 0.788665771484375, 0.8753662109375, 0.962066650390625, 1.04876708984375, 1.135467529296875, 1.22216796875, 1.308868408203125, 1.39556884765625, 1.482269287109375, 1.5689697265625, 1.655670166015625, 1.74237060546875, 1.829071044921875, 1.915771484375, 2.002471923828125, 2.08917236328125, 2.175872802734375, 2.2625732421875, 2.349273681640625, 2.43597412109375, 2.522674560546875, 2.609375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 9.0, 17.0, 18.0, 20.0, 30.0, 29.0, 46.0, 74.0, 97.0, 153.0, 261.0, 487.0, 745.0, 1460.0, 2856.0, 6003.0, 12776.0, 30041.0, 72836.0, 186324.0, 480845.0, 1034169.0, 1222286.0, 681906.0, 277017.0, 106658.0, 42627.0, 17995.0, 8032.0, 3839.0, 1979.0, 1040.0, 603.0, 339.0, 225.0, 127.0, 94.0, 60.0, 41.0, 30.0, 19.0, 17.0, 18.0, 5.0, 5.0, 10.0, 2.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.074005126953125, -2.97222900390625, -2.870452880859375, -2.7686767578125, -2.666900634765625, -2.56512451171875, -2.463348388671875, -2.361572265625, -2.259796142578125, -2.15802001953125, -2.056243896484375, -1.9544677734375, -1.852691650390625, -1.75091552734375, -1.649139404296875, -1.54736328125, -1.445587158203125, -1.34381103515625, -1.242034912109375, -1.1402587890625, -1.038482666015625, -0.93670654296875, -0.834930419921875, -0.733154296875, -0.631378173828125, -0.52960205078125, -0.427825927734375, -0.3260498046875, -0.224273681640625, -0.12249755859375, -0.020721435546875, 0.0810546875, 0.182830810546875, 0.28460693359375, 0.386383056640625, 0.4881591796875, 0.589935302734375, 0.69171142578125, 0.793487548828125, 0.895263671875, 0.997039794921875, 1.09881591796875, 1.200592041015625, 1.3023681640625, 1.404144287109375, 1.50592041015625, 1.607696533203125, 1.70947265625, 1.811248779296875, 1.91302490234375, 2.014801025390625, 2.1165771484375, 2.218353271484375, 2.32012939453125, 2.421905517578125, 2.523681640625, 2.625457763671875, 2.72723388671875, 2.829010009765625, 2.9307861328125, 3.032562255859375, 3.13433837890625, 3.236114501953125, 3.337890625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 13.0, 11.0, 16.0, 35.0, 39.0, 56.0, 69.0, 91.0, 132.0, 181.0, 236.0, 298.0, 393.0, 436.0, 447.0, 372.0, 310.0, 215.0, 189.0, 137.0, 120.0, 73.0, 57.0, 41.0, 28.0, 18.0, 14.0, 12.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.92578125, -5.69842529296875, -5.4710693359375, -5.24371337890625, -5.016357421875, -4.78900146484375, -4.5616455078125, -4.33428955078125, -4.10693359375, -3.87957763671875, -3.6522216796875, -3.42486572265625, -3.197509765625, -2.97015380859375, -2.7427978515625, -2.51544189453125, -2.2880859375, -2.06072998046875, -1.8333740234375, -1.60601806640625, -1.378662109375, -1.15130615234375, -0.9239501953125, -0.69659423828125, -0.46923828125, -0.24188232421875, -0.0145263671875, 0.21282958984375, 0.440185546875, 0.66754150390625, 0.8948974609375, 1.12225341796875, 1.349609375, 1.57696533203125, 1.8043212890625, 2.03167724609375, 2.259033203125, 2.48638916015625, 2.7137451171875, 2.94110107421875, 3.16845703125, 3.39581298828125, 3.6231689453125, 3.85052490234375, 4.077880859375, 4.30523681640625, 4.5325927734375, 4.75994873046875, 4.9873046875, 5.21466064453125, 5.4420166015625, 5.66937255859375, 5.896728515625, 6.12408447265625, 6.3514404296875, 6.57879638671875, 6.80615234375, 7.03350830078125, 7.2608642578125, 7.48822021484375, 7.715576171875, 7.94293212890625, 8.1702880859375, 8.39764404296875, 8.625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 12.0, 12.0, 19.0, 32.0, 39.0, 58.0, 132.0, 219.0, 440.0, 897.0, 2352.0, 7944.0, 36588.0, 197951.0, 1084186.0, 2145648.0, 585874.0, 104005.0, 19941.0, 4949.0, 1529.0, 638.0, 330.0, 192.0, 109.0, 58.0, 42.0, 22.0, 23.0, 12.0, 7.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.8203125, -10.5223388671875, -10.224365234375, -9.9263916015625, -9.62841796875, -9.3304443359375, -9.032470703125, -8.7344970703125, -8.4365234375, -8.1385498046875, -7.840576171875, -7.5426025390625, -7.24462890625, -6.9466552734375, -6.648681640625, -6.3507080078125, -6.052734375, -5.7547607421875, -5.456787109375, -5.1588134765625, -4.86083984375, -4.5628662109375, -4.264892578125, -3.9669189453125, -3.6689453125, -3.3709716796875, -3.072998046875, -2.7750244140625, -2.47705078125, -2.1790771484375, -1.881103515625, -1.5831298828125, -1.28515625, -0.9871826171875, -0.689208984375, -0.3912353515625, -0.09326171875, 0.2047119140625, 0.502685546875, 0.8006591796875, 1.0986328125, 1.3966064453125, 1.694580078125, 1.9925537109375, 2.29052734375, 2.5885009765625, 2.886474609375, 3.1844482421875, 3.482421875, 3.7803955078125, 4.078369140625, 4.3763427734375, 4.67431640625, 4.9722900390625, 5.270263671875, 5.5682373046875, 5.8662109375, 6.1641845703125, 6.462158203125, 6.7601318359375, 7.05810546875, 7.3560791015625, 7.654052734375, 7.9520263671875, 8.25]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 11.0, 32.0, 55.0, 78.0, 118.0, 135.0, 153.0, 163.0, 121.0, 66.0, 43.0, 23.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.18747901916504, -24.4775390625, -22.76759910583496, -21.057659149169922, -19.347719192504883, -17.637779235839844, -15.927839279174805, -14.217899322509766, -12.507959365844727, -10.798019409179688, -9.088079452514648, -7.378139495849609, -5.66819953918457, -3.9582595825195312, -2.248319625854492, -0.5383796691894531, 1.171560287475586, 2.881500244140625, 4.591440200805664, 6.301380157470703, 8.011320114135742, 9.721260070800781, 11.43120002746582, 13.14113998413086, 14.851079940795898, 16.561019897460938, 18.270959854125977, 19.980899810791016, 21.690839767456055, 23.400779724121094, 25.110719680786133, 26.820659637451172, 28.530601501464844, 30.240541458129883, 31.950481414794922, 33.660423278808594, 35.370361328125, 37.080299377441406, 38.79024124145508, 40.50018310546875, 42.210121154785156, 43.92005920410156, 45.630001068115234, 47.339942932128906, 49.04988098144531, 50.75981903076172, 52.46976089477539, 54.17970275878906, 55.88964080810547, 57.599578857421875, 59.30952072143555, 61.01946258544922, 62.729400634765625, 64.43933868408203, 66.14927673339844, 67.85922241210938, 69.56916046142578, 71.27909851074219, 72.98904418945312, 74.69898223876953, 76.40892028808594, 78.11885833740234, 79.82879638671875, 81.53874206542969, 83.2486801147461]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 9.0, 5.0, 6.0, 6.0, 12.0, 7.0, 12.0, 16.0, 12.0, 24.0, 18.0, 32.0, 33.0, 32.0, 28.0, 28.0, 27.0, 42.0, 44.0, 39.0, 30.0, 37.0, 43.0, 39.0, 40.0, 31.0, 39.0, 48.0, 33.0, 35.0, 20.0, 29.0, 19.0, 16.0, 20.0, 15.0, 22.0, 11.0, 8.0, 6.0, 12.0, 4.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-24.491764068603516, -23.77920150756836, -23.06663703918457, -22.354074478149414, -21.641511917114258, -20.9289493560791, -20.216384887695312, -19.503822326660156, -18.791259765625, -18.078697204589844, -17.366132736206055, -16.6535701751709, -15.941007614135742, -15.22844409942627, -14.515880584716797, -13.80331802368164, -13.090754508972168, -12.378190994262695, -11.665628433227539, -10.953064918518066, -10.24050235748291, -9.527938842773438, -8.815376281738281, -8.102812767028809, -7.390249729156494, -6.67768669128418, -5.965123653411865, -5.252560615539551, -4.539997100830078, -3.8274343013763428, -3.114871025085449, -2.4023079872131348, -1.6897449493408203, -0.9771818518638611, -0.26461875438690186, 0.44794440269470215, 1.1605074405670166, 1.873070478439331, 2.5856337547302246, 3.298196792602539, 4.0107598304748535, 4.723322868347168, 5.435885906219482, 6.148448944091797, 6.8610124588012695, 7.573575019836426, 8.286138534545898, 8.998701095581055, 9.711264610290527, 10.423828125, 11.136390686035156, 11.848954200744629, 12.561516761779785, 13.274080276489258, 13.986642837524414, 14.699206352233887, 15.41176986694336, 16.124332427978516, 16.836896896362305, 17.54945945739746, 18.262022018432617, 18.974584579467773, 19.687149047851562, 20.39971160888672, 21.112274169921875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 12.0, 12.0, 9.0, 10.0, 17.0, 18.0, 19.0, 19.0, 24.0, 22.0, 41.0, 25.0, 41.0, 37.0, 42.0, 52.0, 30.0, 52.0, 43.0, 46.0, 43.0, 45.0, 44.0, 39.0, 37.0, 31.0, 25.0, 20.0, 12.0, 19.0, 26.0, 16.0, 20.0, 12.0, 7.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.142578125, -3.04754638671875, -2.9525146484375, -2.85748291015625, -2.762451171875, -2.66741943359375, -2.5723876953125, -2.47735595703125, -2.38232421875, -2.28729248046875, -2.1922607421875, -2.09722900390625, -2.002197265625, -1.90716552734375, -1.8121337890625, -1.71710205078125, -1.6220703125, -1.52703857421875, -1.4320068359375, -1.33697509765625, -1.241943359375, -1.14691162109375, -1.0518798828125, -0.95684814453125, -0.86181640625, -0.76678466796875, -0.6717529296875, -0.57672119140625, -0.481689453125, -0.38665771484375, -0.2916259765625, -0.19659423828125, -0.1015625, -0.00653076171875, 0.0885009765625, 0.18353271484375, 0.278564453125, 0.37359619140625, 0.4686279296875, 0.56365966796875, 0.65869140625, 0.75372314453125, 0.8487548828125, 0.94378662109375, 1.038818359375, 1.13385009765625, 1.2288818359375, 1.32391357421875, 1.4189453125, 1.51397705078125, 1.6090087890625, 1.70404052734375, 1.799072265625, 1.89410400390625, 1.9891357421875, 2.08416748046875, 2.17919921875, 2.27423095703125, 2.3692626953125, 2.46429443359375, 2.559326171875, 2.65435791015625, 2.7493896484375, 2.84442138671875, 2.939453125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 9.0, 25.0, 28.0, 41.0, 53.0, 95.0, 118.0, 182.0, 298.0, 455.0, 695.0, 1027.0, 1477.0, 2335.0, 3669.0, 5671.0, 8913.0, 13946.0, 21861.0, 35462.0, 57322.0, 91814.0, 142676.0, 190265.0, 167866.0, 112792.0, 70951.0, 43667.0, 27396.0, 17117.0, 10762.0, 6853.0, 4486.0, 2833.0, 1829.0, 1149.0, 826.0, 483.0, 344.0, 264.0, 171.0, 113.0, 76.0, 52.0, 40.0, 22.0, 13.0, 3.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29345703125, -0.2842063903808594, -0.27495574951171875, -0.2657051086425781, -0.2564544677734375, -0.24720382690429688, -0.23795318603515625, -0.22870254516601562, -0.219451904296875, -0.21020126342773438, -0.20095062255859375, -0.19169998168945312, -0.1824493408203125, -0.17319869995117188, -0.16394805908203125, -0.15469741821289062, -0.14544677734375, -0.13619613647460938, -0.12694549560546875, -0.11769485473632812, -0.1084442138671875, -0.09919357299804688, -0.08994293212890625, -0.08069229125976562, -0.071441650390625, -0.062191009521484375, -0.05294036865234375, -0.043689727783203125, -0.0344390869140625, -0.025188446044921875, -0.01593780517578125, -0.006687164306640625, 0.0025634765625, 0.011814117431640625, 0.02106475830078125, 0.030315399169921875, 0.0395660400390625, 0.048816680908203125, 0.05806732177734375, 0.06731796264648438, 0.076568603515625, 0.08581924438476562, 0.09506988525390625, 0.10432052612304688, 0.1135711669921875, 0.12282180786132812, 0.13207244873046875, 0.14132308959960938, 0.15057373046875, 0.15982437133789062, 0.16907501220703125, 0.17832565307617188, 0.1875762939453125, 0.19682693481445312, 0.20607757568359375, 0.21532821655273438, 0.224578857421875, 0.23382949829101562, 0.24308013916015625, 0.2523307800292969, 0.2615814208984375, 0.2708320617675781, 0.28008270263671875, 0.2893333435058594, 0.298583984375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 10.0, 7.0, 8.0, 8.0, 10.0, 14.0, 19.0, 24.0, 23.0, 21.0, 25.0, 36.0, 37.0, 38.0, 34.0, 55.0, 46.0, 48.0, 1057.0, 47.0, 56.0, 35.0, 37.0, 39.0, 31.0, 36.0, 37.0, 25.0, 29.0, 19.0, 23.0, 15.0, 12.0, 13.0, 14.0, 12.0, 5.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0], "bins": [-2.341796875, -2.278778076171875, -2.21575927734375, -2.152740478515625, -2.0897216796875, -2.026702880859375, -1.96368408203125, -1.900665283203125, -1.837646484375, -1.774627685546875, -1.71160888671875, -1.648590087890625, -1.5855712890625, -1.522552490234375, -1.45953369140625, -1.396514892578125, -1.33349609375, -1.270477294921875, -1.20745849609375, -1.144439697265625, -1.0814208984375, -1.018402099609375, -0.95538330078125, -0.892364501953125, -0.829345703125, -0.766326904296875, -0.70330810546875, -0.640289306640625, -0.5772705078125, -0.514251708984375, -0.45123291015625, -0.388214111328125, -0.3251953125, -0.262176513671875, -0.19915771484375, -0.136138916015625, -0.0731201171875, -0.010101318359375, 0.05291748046875, 0.115936279296875, 0.178955078125, 0.241973876953125, 0.30499267578125, 0.368011474609375, 0.4310302734375, 0.494049072265625, 0.55706787109375, 0.620086669921875, 0.68310546875, 0.746124267578125, 0.80914306640625, 0.872161865234375, 0.9351806640625, 0.998199462890625, 1.06121826171875, 1.124237060546875, 1.187255859375, 1.250274658203125, 1.31329345703125, 1.376312255859375, 1.4393310546875, 1.502349853515625, 1.56536865234375, 1.628387451171875, 1.69140625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 10.0, 11.0, 15.0, 20.0, 47.0, 61.0, 61.0, 86.0, 155.0, 167.0, 306.0, 474.0, 699.0, 1163.0, 1865.0, 2961.0, 4606.0, 7471.0, 12099.0, 19806.0, 31854.0, 49365.0, 75284.0, 108892.0, 166523.0, 1171016.0, 147207.0, 102344.0, 70202.0, 45524.0, 28907.0, 18049.0, 11200.0, 6888.0, 4259.0, 2619.0, 1643.0, 1100.0, 743.0, 448.0, 324.0, 241.0, 136.0, 78.0, 72.0, 51.0, 27.0, 15.0, 18.0, 4.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.1578369140625, -0.15281295776367188, -0.14778900146484375, -0.14276504516601562, -0.1377410888671875, -0.13271713256835938, -0.12769317626953125, -0.12266921997070312, -0.117645263671875, -0.11262130737304688, -0.10759735107421875, -0.10257339477539062, -0.0975494384765625, -0.09252548217773438, -0.08750152587890625, -0.08247756958007812, -0.07745361328125, -0.07242965698242188, -0.06740570068359375, -0.062381744384765625, -0.0573577880859375, -0.052333831787109375, -0.04730987548828125, -0.042285919189453125, -0.037261962890625, -0.032238006591796875, -0.02721405029296875, -0.022190093994140625, -0.0171661376953125, -0.012142181396484375, -0.00711822509765625, -0.002094268798828125, 0.0029296875, 0.007953643798828125, 0.01297760009765625, 0.018001556396484375, 0.0230255126953125, 0.028049468994140625, 0.03307342529296875, 0.038097381591796875, 0.043121337890625, 0.048145294189453125, 0.05316925048828125, 0.058193206787109375, 0.0632171630859375, 0.06824111938476562, 0.07326507568359375, 0.07828903198242188, 0.08331298828125, 0.08833694458007812, 0.09336090087890625, 0.09838485717773438, 0.1034088134765625, 0.10843276977539062, 0.11345672607421875, 0.11848068237304688, 0.123504638671875, 0.12852859497070312, 0.13355255126953125, 0.13857650756835938, 0.1436004638671875, 0.14862442016601562, 0.15364837646484375, 0.15867233276367188, 0.1636962890625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 6.0, 9.0, 7.0, 14.0, 2.0, 11.0, 10.0, 14.0, 19.0, 18.0, 30.0, 39.0, 27.0, 56.0, 87.0, 123.0, 122.0, 94.0, 62.0, 36.0, 33.0, 28.0, 20.0, 13.0, 18.0, 13.0, 10.0, 11.0, 6.0, 9.0, 5.0, 10.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0130462646484375, -0.012595653533935547, -0.012145042419433594, -0.01169443130493164, -0.011243820190429688, -0.010793209075927734, -0.010342597961425781, -0.009891986846923828, -0.009441375732421875, -0.008990764617919922, -0.008540153503417969, -0.008089542388916016, -0.0076389312744140625, -0.007188320159912109, -0.006737709045410156, -0.006287097930908203, -0.00583648681640625, -0.005385875701904297, -0.004935264587402344, -0.004484653472900391, -0.0040340423583984375, -0.0035834312438964844, -0.0031328201293945312, -0.002682209014892578, -0.002231597900390625, -0.0017809867858886719, -0.0013303756713867188, -0.0008797645568847656, -0.0004291534423828125, 2.1457672119140625e-05, 0.00047206878662109375, 0.0009226799011230469, 0.001373291015625, 0.0018239021301269531, 0.0022745132446289062, 0.0027251243591308594, 0.0031757354736328125, 0.0036263465881347656, 0.004076957702636719, 0.004527568817138672, 0.004978179931640625, 0.005428791046142578, 0.005879402160644531, 0.006330013275146484, 0.0067806243896484375, 0.007231235504150391, 0.007681846618652344, 0.008132457733154297, 0.00858306884765625, 0.009033679962158203, 0.009484291076660156, 0.00993490219116211, 0.010385513305664062, 0.010836124420166016, 0.011286735534667969, 0.011737346649169922, 0.012187957763671875, 0.012638568878173828, 0.013089179992675781, 0.013539791107177734, 0.013990402221679688, 0.01444101333618164, 0.014891624450683594, 0.015342235565185547, 0.0157928466796875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 10.0, 13.0, 6.0, 7.0, 8.0, 8.0, 11.0, 14.0, 22.0, 26.0, 41.0, 64.0, 93.0, 148.0, 257.0, 783.0, 26223.0, 1002965.0, 16487.0, 680.0, 245.0, 109.0, 90.0, 69.0, 45.0, 19.0, 18.0, 20.0, 6.0, 7.0, 8.0, 13.0, 6.0, 6.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.351806640625, -0.34215545654296875, -0.3325042724609375, -0.32285308837890625, -0.313201904296875, -0.30355072021484375, -0.2938995361328125, -0.28424835205078125, -0.27459716796875, -0.26494598388671875, -0.2552947998046875, -0.24564361572265625, -0.235992431640625, -0.22634124755859375, -0.2166900634765625, -0.20703887939453125, -0.1973876953125, -0.18773651123046875, -0.1780853271484375, -0.16843414306640625, -0.158782958984375, -0.14913177490234375, -0.1394805908203125, -0.12982940673828125, -0.12017822265625, -0.11052703857421875, -0.1008758544921875, -0.09122467041015625, -0.081573486328125, -0.07192230224609375, -0.0622711181640625, -0.05261993408203125, -0.04296875, -0.03331756591796875, -0.0236663818359375, -0.01401519775390625, -0.004364013671875, 0.00528717041015625, 0.0149383544921875, 0.02458953857421875, 0.03424072265625, 0.04389190673828125, 0.0535430908203125, 0.06319427490234375, 0.072845458984375, 0.08249664306640625, 0.0921478271484375, 0.10179901123046875, 0.1114501953125, 0.12110137939453125, 0.1307525634765625, 0.14040374755859375, 0.150054931640625, 0.15970611572265625, 0.1693572998046875, 0.17900848388671875, 0.18865966796875, 0.19831085205078125, 0.2079620361328125, 0.21761322021484375, 0.227264404296875, 0.23691558837890625, 0.2465667724609375, 0.25621795654296875, 0.265869140625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 17.0, 426.0, 535.0, 34.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.4404247999191284, -0.4326992332935333, -0.42497366666793823, -0.41724810004234314, -0.40952253341674805, -0.40179696679115295, -0.39407140016555786, -0.38634583353996277, -0.3786202669143677, -0.3708947002887726, -0.3631691336631775, -0.3554435670375824, -0.3477180004119873, -0.3399924337863922, -0.3322668671607971, -0.324541300535202, -0.31681573390960693, -0.30909016728401184, -0.30136460065841675, -0.29363903403282166, -0.28591346740722656, -0.27818790078163147, -0.2704623341560364, -0.2627367675304413, -0.2550112009048462, -0.2472856342792511, -0.239560067653656, -0.2318345010280609, -0.22410893440246582, -0.21638336777687073, -0.20865780115127563, -0.20093223452568054, -0.19320665299892426, -0.18548108637332916, -0.17775551974773407, -0.17002995312213898, -0.16230438649654388, -0.1545788198709488, -0.1468532532453537, -0.1391276866197586, -0.1314021199941635, -0.12367655336856842, -0.11595098674297333, -0.10822542011737823, -0.10049985349178314, -0.09277428686618805, -0.08504872024059296, -0.07732315361499786, -0.06959757953882217, -0.06187201291322708, -0.05414644628763199, -0.046420879662036896, -0.0386953130364418, -0.030969742685556412, -0.02324417605996132, -0.015518609434366226, -0.007793042808771133, -6.747571751475334e-05, 0.007658091373741627, 0.015383658930659294, 0.023109225556254387, 0.03083479404449463, 0.03856036067008972, 0.046285927295684814, 0.05401149392127991]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 2.0, 7.0, 5.0, 5.0, 4.0, 10.0, 8.0, 12.0, 23.0, 20.0, 18.0, 23.0, 21.0, 20.0, 24.0, 33.0, 37.0, 36.0, 33.0, 35.0, 41.0, 41.0, 46.0, 48.0, 46.0, 30.0, 40.0, 33.0, 31.0, 36.0, 29.0, 21.0, 26.0, 27.0, 23.0, 15.0, 18.0, 10.0, 15.0, 15.0, 8.0, 3.0, 6.0, 4.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01959174871444702, -0.018993398174643517, -0.01839504763484001, -0.017796697095036507, -0.017198346555233, -0.016599996015429497, -0.016001645475625992, -0.015403294935822487, -0.014804944396018982, -0.014206593856215477, -0.013608243316411972, -0.013009892776608467, -0.012411542236804962, -0.011813191697001457, -0.011214841157197952, -0.010616490617394447, -0.010018140077590942, -0.009419789537787437, -0.008821438997983932, -0.008223088458180428, -0.007624737918376923, -0.007026387378573418, -0.006428036838769913, -0.005829686298966408, -0.005231335759162903, -0.004632985219359398, -0.004034634679555893, -0.003436284139752388, -0.002837933599948883, -0.002239583060145378, -0.0016412325203418732, -0.0010428819805383682, -0.0004445314407348633, 0.00015381909906864166, 0.0007521696388721466, 0.0013505201786756516, 0.0019488707184791565, 0.0025472212582826614, 0.0031455717980861664, 0.0037439223378896713, 0.004342272877693176, 0.004940623417496681, 0.005538973957300186, 0.006137324497103691, 0.006735675036907196, 0.007334025576710701, 0.007932376116514206, 0.008530726656317711, 0.009129077196121216, 0.00972742773592472, 0.010325778275728226, 0.01092412881553173, 0.011522479355335236, 0.01212082989513874, 0.012719180434942245, 0.01331753097474575, 0.013915881514549255, 0.01451423205435276, 0.015112582594156265, 0.01571093313395977, 0.016309283673763275, 0.01690763421356678, 0.017505984753370285, 0.01810433529317379, 0.018702685832977295]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 12.0, 12.0, 9.0, 10.0, 17.0, 18.0, 19.0, 19.0, 24.0, 22.0, 41.0, 25.0, 40.0, 38.0, 42.0, 52.0, 30.0, 52.0, 43.0, 46.0, 43.0, 45.0, 44.0, 39.0, 37.0, 31.0, 26.0, 19.0, 12.0, 19.0, 26.0, 16.0, 20.0, 12.0, 7.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.142578125, -3.04754638671875, -2.9525146484375, -2.85748291015625, -2.762451171875, -2.66741943359375, -2.5723876953125, -2.47735595703125, -2.38232421875, -2.28729248046875, -2.1922607421875, -2.09722900390625, -2.002197265625, -1.90716552734375, -1.8121337890625, -1.71710205078125, -1.6220703125, -1.52703857421875, -1.4320068359375, -1.33697509765625, -1.241943359375, -1.14691162109375, -1.0518798828125, -0.95684814453125, -0.86181640625, -0.76678466796875, -0.6717529296875, -0.57672119140625, -0.481689453125, -0.38665771484375, -0.2916259765625, -0.19659423828125, -0.1015625, -0.00653076171875, 0.0885009765625, 0.18353271484375, 0.278564453125, 0.37359619140625, 0.4686279296875, 0.56365966796875, 0.65869140625, 0.75372314453125, 0.8487548828125, 0.94378662109375, 1.038818359375, 1.13385009765625, 1.2288818359375, 1.32391357421875, 1.4189453125, 1.51397705078125, 1.6090087890625, 1.70404052734375, 1.799072265625, 1.89410400390625, 1.9891357421875, 2.08416748046875, 2.17919921875, 2.27423095703125, 2.3692626953125, 2.46429443359375, 2.559326171875, 2.65435791015625, 2.7493896484375, 2.84442138671875, 2.939453125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 7.0, 7.0, 7.0, 16.0, 18.0, 21.0, 44.0, 54.0, 71.0, 123.0, 158.0, 241.0, 372.0, 570.0, 831.0, 1329.0, 2152.0, 3603.0, 5785.0, 9907.0, 18679.0, 41085.0, 103932.0, 268324.0, 337706.0, 143822.0, 55215.0, 24046.0, 12325.0, 7010.0, 4109.0, 2412.0, 1629.0, 1009.0, 663.0, 400.0, 281.0, 170.0, 119.0, 99.0, 61.0, 42.0, 36.0, 16.0, 22.0, 9.0, 4.0, 3.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.291015625, -3.1854248046875, -3.079833984375, -2.9742431640625, -2.86865234375, -2.7630615234375, -2.657470703125, -2.5518798828125, -2.4462890625, -2.3406982421875, -2.235107421875, -2.1295166015625, -2.02392578125, -1.9183349609375, -1.812744140625, -1.7071533203125, -1.6015625, -1.4959716796875, -1.390380859375, -1.2847900390625, -1.17919921875, -1.0736083984375, -0.968017578125, -0.8624267578125, -0.7568359375, -0.6512451171875, -0.545654296875, -0.4400634765625, -0.33447265625, -0.2288818359375, -0.123291015625, -0.0177001953125, 0.087890625, 0.1934814453125, 0.299072265625, 0.4046630859375, 0.51025390625, 0.6158447265625, 0.721435546875, 0.8270263671875, 0.9326171875, 1.0382080078125, 1.143798828125, 1.2493896484375, 1.35498046875, 1.4605712890625, 1.566162109375, 1.6717529296875, 1.77734375, 1.8829345703125, 1.988525390625, 2.0941162109375, 2.19970703125, 2.3052978515625, 2.410888671875, 2.5164794921875, 2.6220703125, 2.7276611328125, 2.833251953125, 2.9388427734375, 3.04443359375, 3.1500244140625, 3.255615234375, 3.3612060546875, 3.466796875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 5.0, 6.0, 4.0, 6.0, 9.0, 8.0, 6.0, 9.0, 17.0, 18.0, 20.0, 22.0, 37.0, 31.0, 39.0, 51.0, 59.0, 76.0, 98.0, 166.0, 1372.0, 329.0, 157.0, 73.0, 74.0, 65.0, 45.0, 27.0, 37.0, 34.0, 37.0, 25.0, 13.0, 13.0, 11.0, 11.0, 9.0, 7.0, 8.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.1171875, -10.745849609375, -10.37451171875, -10.003173828125, -9.6318359375, -9.260498046875, -8.88916015625, -8.517822265625, -8.146484375, -7.775146484375, -7.40380859375, -7.032470703125, -6.6611328125, -6.289794921875, -5.91845703125, -5.547119140625, -5.17578125, -4.804443359375, -4.43310546875, -4.061767578125, -3.6904296875, -3.319091796875, -2.94775390625, -2.576416015625, -2.205078125, -1.833740234375, -1.46240234375, -1.091064453125, -0.7197265625, -0.348388671875, 0.02294921875, 0.394287109375, 0.765625, 1.136962890625, 1.50830078125, 1.879638671875, 2.2509765625, 2.622314453125, 2.99365234375, 3.364990234375, 3.736328125, 4.107666015625, 4.47900390625, 4.850341796875, 5.2216796875, 5.593017578125, 5.96435546875, 6.335693359375, 6.70703125, 7.078369140625, 7.44970703125, 7.821044921875, 8.1923828125, 8.563720703125, 8.93505859375, 9.306396484375, 9.677734375, 10.049072265625, 10.42041015625, 10.791748046875, 11.1630859375, 11.534423828125, 11.90576171875, 12.277099609375, 12.6484375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 7.0, 7.0, 15.0, 19.0, 37.0, 34.0, 62.0, 111.0, 156.0, 317.0, 836.0, 7056.0, 3028174.0, 106306.0, 1499.0, 479.0, 226.0, 127.0, 79.0, 51.0, 29.0, 19.0, 18.0, 10.0, 5.0, 10.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-55.65625, -54.322998046875, -52.98974609375, -51.656494140625, -50.3232421875, -48.989990234375, -47.65673828125, -46.323486328125, -44.990234375, -43.656982421875, -42.32373046875, -40.990478515625, -39.6572265625, -38.323974609375, -36.99072265625, -35.657470703125, -34.32421875, -32.990966796875, -31.65771484375, -30.324462890625, -28.9912109375, -27.657958984375, -26.32470703125, -24.991455078125, -23.658203125, -22.324951171875, -20.99169921875, -19.658447265625, -18.3251953125, -16.991943359375, -15.65869140625, -14.325439453125, -12.9921875, -11.658935546875, -10.32568359375, -8.992431640625, -7.6591796875, -6.325927734375, -4.99267578125, -3.659423828125, -2.326171875, -0.992919921875, 0.34033203125, 1.673583984375, 3.0068359375, 4.340087890625, 5.67333984375, 7.006591796875, 8.33984375, 9.673095703125, 11.00634765625, 12.339599609375, 13.6728515625, 15.006103515625, 16.33935546875, 17.672607421875, 19.005859375, 20.339111328125, 21.67236328125, 23.005615234375, 24.3388671875, 25.672119140625, 27.00537109375, 28.338623046875, 29.671875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [967.0, 49.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.791018486022949, 3.4811325073242188, 14.753283500671387, 26.025432586669922, 37.297584533691406, 48.56973648071289, 59.84188461303711, 71.11404418945312, 82.38619232177734, 93.65834045410156, 104.93049621582031, 116.20264434814453, 127.47479248046875, 138.7469482421875, 150.01910400390625, 161.291259765625, 172.5634002685547, 183.83555603027344, 195.10769653320312, 206.37985229492188, 217.65200805664062, 228.92416381835938, 240.19630432128906, 251.4684600830078, 262.7406005859375, 274.01275634765625, 285.284912109375, 296.55706787109375, 307.8291931152344, 319.1013488769531, 330.3735046386719, 341.6456604003906, 352.9178161621094, 364.1899719238281, 375.4621276855469, 386.7342529296875, 398.00640869140625, 409.278564453125, 420.55072021484375, 431.8228759765625, 443.09503173828125, 454.3671875, 465.63934326171875, 476.9114990234375, 488.1836242675781, 499.4557800292969, 510.7279357910156, 522.0001220703125, 533.272216796875, 544.5443725585938, 555.8165283203125, 567.0886840820312, 578.36083984375, 589.6329956054688, 600.9051513671875, 612.17724609375, 623.449462890625, 634.7216186523438, 645.9937744140625, 657.2659301757812, 668.5380859375, 679.8102416992188, 691.0823974609375, 702.3544921875, 713.6266479492188]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 8.0, 9.0, 15.0, 12.0, 16.0, 17.0, 20.0, 25.0, 18.0, 24.0, 22.0, 34.0, 33.0, 40.0, 32.0, 36.0, 39.0, 50.0, 48.0, 49.0, 38.0, 30.0, 38.0, 34.0, 33.0, 40.0, 28.0, 17.0, 29.0, 30.0, 19.0, 16.0, 20.0, 12.0, 7.0, 10.0, 11.0, 9.0, 7.0, 6.0, 8.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-27.962600708007812, -27.07193374633789, -26.18126678466797, -25.290599822998047, -24.399932861328125, -23.509265899658203, -22.61859703063965, -21.727930068969727, -20.837263107299805, -19.946596145629883, -19.05592918395996, -18.16526222229004, -17.274593353271484, -16.383926391601562, -15.49325942993164, -14.602592468261719, -13.711925506591797, -12.821258544921875, -11.930591583251953, -11.039923667907715, -10.149256706237793, -9.258589744567871, -8.367921829223633, -7.477254867553711, -6.586587905883789, -5.695920944213867, -4.805253505706787, -3.914586305618286, -3.023919105529785, -2.1332521438598633, -1.2425847053527832, -0.3519172668457031, 0.5387516021728516, 1.4294188022613525, 2.3200860023498535, 3.2107532024383545, 4.1014204025268555, 4.992087364196777, 5.882754802703857, 6.7734222412109375, 7.664089202880859, 8.554756164550781, 9.445423126220703, 10.336091041564941, 11.226758003234863, 12.117424964904785, 13.008092880249023, 13.898759841918945, 14.789426803588867, 15.680093765258789, 16.57076072692871, 17.461427688598633, 18.352096557617188, 19.24276351928711, 20.13343048095703, 21.024097442626953, 21.914764404296875, 22.805431365966797, 23.69609832763672, 24.58676528930664, 25.477432250976562, 26.368099212646484, 27.25876808166504, 28.14943504333496, 29.040102005004883]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 10.0, 11.0, 7.0, 11.0, 17.0, 21.0, 16.0, 20.0, 27.0, 19.0, 25.0, 34.0, 33.0, 41.0, 29.0, 32.0, 44.0, 46.0, 43.0, 38.0, 37.0, 38.0, 42.0, 45.0, 41.0, 32.0, 29.0, 23.0, 31.0, 22.0, 16.0, 15.0, 16.0, 8.0, 20.0, 16.0, 4.0, 3.0, 11.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.1875, -3.0914306640625, -2.995361328125, -2.8992919921875, -2.80322265625, -2.7071533203125, -2.611083984375, -2.5150146484375, -2.4189453125, -2.3228759765625, -2.226806640625, -2.1307373046875, -2.03466796875, -1.9385986328125, -1.842529296875, -1.7464599609375, -1.650390625, -1.5543212890625, -1.458251953125, -1.3621826171875, -1.26611328125, -1.1700439453125, -1.073974609375, -0.9779052734375, -0.8818359375, -0.7857666015625, -0.689697265625, -0.5936279296875, -0.49755859375, -0.4014892578125, -0.305419921875, -0.2093505859375, -0.11328125, -0.0172119140625, 0.078857421875, 0.1749267578125, 0.27099609375, 0.3670654296875, 0.463134765625, 0.5592041015625, 0.6552734375, 0.7513427734375, 0.847412109375, 0.9434814453125, 1.03955078125, 1.1356201171875, 1.231689453125, 1.3277587890625, 1.423828125, 1.5198974609375, 1.615966796875, 1.7120361328125, 1.80810546875, 1.9041748046875, 2.000244140625, 2.0963134765625, 2.1923828125, 2.2884521484375, 2.384521484375, 2.4805908203125, 2.57666015625, 2.6727294921875, 2.768798828125, 2.8648681640625, 2.9609375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 9.0, 11.0, 19.0, 11.0, 18.0, 21.0, 38.0, 30.0, 43.0, 46.0, 55.0, 61.0, 80.0, 105.0, 164.0, 451.0, 1588.0, 9920.0, 122013.0, 1906478.0, 2007818.0, 131806.0, 10558.0, 1664.0, 494.0, 216.0, 98.0, 76.0, 67.0, 52.0, 30.0, 35.0, 41.0, 23.0, 25.0, 24.0, 14.0, 17.0, 5.0, 10.0, 8.0, 10.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.1953125, -10.856201171875, -10.51708984375, -10.177978515625, -9.8388671875, -9.499755859375, -9.16064453125, -8.821533203125, -8.482421875, -8.143310546875, -7.80419921875, -7.465087890625, -7.1259765625, -6.786865234375, -6.44775390625, -6.108642578125, -5.76953125, -5.430419921875, -5.09130859375, -4.752197265625, -4.4130859375, -4.073974609375, -3.73486328125, -3.395751953125, -3.056640625, -2.717529296875, -2.37841796875, -2.039306640625, -1.7001953125, -1.361083984375, -1.02197265625, -0.682861328125, -0.34375, -0.004638671875, 0.33447265625, 0.673583984375, 1.0126953125, 1.351806640625, 1.69091796875, 2.030029296875, 2.369140625, 2.708251953125, 3.04736328125, 3.386474609375, 3.7255859375, 4.064697265625, 4.40380859375, 4.742919921875, 5.08203125, 5.421142578125, 5.76025390625, 6.099365234375, 6.4384765625, 6.777587890625, 7.11669921875, 7.455810546875, 7.794921875, 8.134033203125, 8.47314453125, 8.812255859375, 9.1513671875, 9.490478515625, 9.82958984375, 10.168701171875, 10.5078125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 17.0, 19.0, 30.0, 64.0, 86.0, 127.0, 218.0, 356.0, 474.0, 630.0, 633.0, 508.0, 342.0, 206.0, 133.0, 96.0, 51.0, 37.0, 19.0, 11.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5390625, -11.1658935546875, -10.792724609375, -10.4195556640625, -10.04638671875, -9.6732177734375, -9.300048828125, -8.9268798828125, -8.5537109375, -8.1805419921875, -7.807373046875, -7.4342041015625, -7.06103515625, -6.6878662109375, -6.314697265625, -5.9415283203125, -5.568359375, -5.1951904296875, -4.822021484375, -4.4488525390625, -4.07568359375, -3.7025146484375, -3.329345703125, -2.9561767578125, -2.5830078125, -2.2098388671875, -1.836669921875, -1.4635009765625, -1.09033203125, -0.7171630859375, -0.343994140625, 0.0291748046875, 0.40234375, 0.7755126953125, 1.148681640625, 1.5218505859375, 1.89501953125, 2.2681884765625, 2.641357421875, 3.0145263671875, 3.3876953125, 3.7608642578125, 4.134033203125, 4.5072021484375, 4.88037109375, 5.2535400390625, 5.626708984375, 5.9998779296875, 6.373046875, 6.7462158203125, 7.119384765625, 7.4925537109375, 7.86572265625, 8.2388916015625, 8.612060546875, 8.9852294921875, 9.3583984375, 9.7315673828125, 10.104736328125, 10.4779052734375, 10.85107421875, 11.2242431640625, 11.597412109375, 11.9705810546875, 12.34375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 10.0, 17.0, 34.0, 44.0, 83.0, 133.0, 231.0, 555.0, 2354.0, 107401.0, 3842528.0, 236330.0, 3361.0, 622.0, 252.0, 114.0, 85.0, 55.0, 31.0, 18.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.5, -31.531982421875, -30.56396484375, -29.595947265625, -28.6279296875, -27.659912109375, -26.69189453125, -25.723876953125, -24.755859375, -23.787841796875, -22.81982421875, -21.851806640625, -20.8837890625, -19.915771484375, -18.94775390625, -17.979736328125, -17.01171875, -16.043701171875, -15.07568359375, -14.107666015625, -13.1396484375, -12.171630859375, -11.20361328125, -10.235595703125, -9.267578125, -8.299560546875, -7.33154296875, -6.363525390625, -5.3955078125, -4.427490234375, -3.45947265625, -2.491455078125, -1.5234375, -0.555419921875, 0.41259765625, 1.380615234375, 2.3486328125, 3.316650390625, 4.28466796875, 5.252685546875, 6.220703125, 7.188720703125, 8.15673828125, 9.124755859375, 10.0927734375, 11.060791015625, 12.02880859375, 12.996826171875, 13.96484375, 14.932861328125, 15.90087890625, 16.868896484375, 17.8369140625, 18.804931640625, 19.77294921875, 20.740966796875, 21.708984375, 22.677001953125, 23.64501953125, 24.613037109375, 25.5810546875, 26.549072265625, 27.51708984375, 28.485107421875, 29.453125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 55.0, 397.0, 493.0, 69.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-305.763671875, -298.3138122558594, -290.86395263671875, -283.4140930175781, -275.9642333984375, -268.5143737792969, -261.06451416015625, -253.61463928222656, -246.16477966308594, -238.7149200439453, -231.2650604248047, -223.81520080566406, -216.36532592773438, -208.91546630859375, -201.46560668945312, -194.0157470703125, -186.56588745117188, -179.11602783203125, -171.66616821289062, -164.21630859375, -156.76644897460938, -149.31658935546875, -141.86671447753906, -134.41685485839844, -126.96699523925781, -119.51713562011719, -112.06727600097656, -104.6174087524414, -97.16754913330078, -89.71768951416016, -82.267822265625, -74.81796264648438, -67.36810302734375, -59.918243408203125, -52.468379974365234, -45.018516540527344, -37.56865692138672, -30.118797302246094, -22.668933868408203, -15.219070434570312, -7.7692108154296875, -0.3193492889404297, 7.130512237548828, 14.580373764038086, 22.030235290527344, 29.48009490966797, 36.92995834350586, 44.37982177734375, 51.829681396484375, 59.279541015625, 66.72940063476562, 74.17926788330078, 81.6291275024414, 89.07898712158203, 96.52885437011719, 103.97871398925781, 111.42857360839844, 118.87843322753906, 126.32829284667969, 133.7781524658203, 141.22802734375, 148.67788696289062, 156.12774658203125, 163.57760620117188, 171.0274658203125]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 12.0, 16.0, 13.0, 25.0, 20.0, 22.0, 25.0, 31.0, 34.0, 33.0, 32.0, 47.0, 42.0, 50.0, 45.0, 58.0, 43.0, 35.0, 53.0, 43.0, 41.0, 36.0, 36.0, 37.0, 27.0, 24.0, 24.0, 17.0, 17.0, 9.0, 16.0, 7.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.787200927734375, -25.8486328125, -24.910062789916992, -23.971494674682617, -23.03292465209961, -22.094356536865234, -21.15578842163086, -20.21721839904785, -19.278648376464844, -18.34008026123047, -17.40151023864746, -16.462942123413086, -15.524372100830078, -14.585803985595703, -13.647234916687012, -12.70866584777832, -11.770097732543945, -10.831528663635254, -9.892959594726562, -8.954391479492188, -8.01582145690918, -7.0772528648376465, -6.138684272766113, -5.200115203857422, -4.2615461349487305, -3.322977066040039, -2.3844082355499268, -1.4458394050598145, -0.507270336151123, 0.43129873275756836, 1.3698673248291016, 2.308436393737793, 3.2470054626464844, 4.185574531555176, 5.124143600463867, 6.0627121925354, 7.001281261444092, 7.939850330352783, 8.878418922424316, 9.816987991333008, 10.7555570602417, 11.69412612915039, 12.632695198059082, 13.571264266967773, 14.509832382202148, 15.448402404785156, 16.38697052001953, 17.325538635253906, 18.264108657836914, 19.20267677307129, 20.141246795654297, 21.079814910888672, 22.01838493347168, 22.956953048706055, 23.895523071289062, 24.834091186523438, 25.772659301757812, 26.711227416992188, 27.649797439575195, 28.58836555480957, 29.526935577392578, 30.465503692626953, 31.404071807861328, 32.34264373779297, 33.281211853027344]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 9.0, 9.0, 13.0, 15.0, 8.0, 11.0, 21.0, 10.0, 25.0, 14.0, 21.0, 36.0, 34.0, 27.0, 27.0, 36.0, 43.0, 39.0, 35.0, 36.0, 57.0, 43.0, 37.0, 46.0, 36.0, 32.0, 32.0, 34.0, 24.0, 27.0, 16.0, 27.0, 20.0, 21.0, 8.0, 14.0, 4.0, 7.0, 8.0, 5.0, 10.0, 6.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.744140625, -2.650238037109375, -2.55633544921875, -2.462432861328125, -2.3685302734375, -2.274627685546875, -2.18072509765625, -2.086822509765625, -1.992919921875, -1.899017333984375, -1.80511474609375, -1.711212158203125, -1.6173095703125, -1.523406982421875, -1.42950439453125, -1.335601806640625, -1.24169921875, -1.147796630859375, -1.05389404296875, -0.959991455078125, -0.8660888671875, -0.772186279296875, -0.67828369140625, -0.584381103515625, -0.490478515625, -0.396575927734375, -0.30267333984375, -0.208770751953125, -0.1148681640625, -0.020965576171875, 0.07293701171875, 0.166839599609375, 0.2607421875, 0.354644775390625, 0.44854736328125, 0.542449951171875, 0.6363525390625, 0.730255126953125, 0.82415771484375, 0.918060302734375, 1.011962890625, 1.105865478515625, 1.19976806640625, 1.293670654296875, 1.3875732421875, 1.481475830078125, 1.57537841796875, 1.669281005859375, 1.76318359375, 1.857086181640625, 1.95098876953125, 2.044891357421875, 2.1387939453125, 2.232696533203125, 2.32659912109375, 2.420501708984375, 2.514404296875, 2.608306884765625, 2.70220947265625, 2.796112060546875, 2.8900146484375, 2.983917236328125, 3.07781982421875, 3.171722412109375, 3.265625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 7.0, 8.0, 19.0, 17.0, 25.0, 53.0, 61.0, 89.0, 141.0, 200.0, 269.0, 401.0, 557.0, 854.0, 1230.0, 1799.0, 2672.0, 3996.0, 5767.0, 8602.0, 12779.0, 18826.0, 28506.0, 41834.0, 62466.0, 90332.0, 122976.0, 149078.0, 141687.0, 110418.0, 79138.0, 53766.0, 35862.0, 24284.0, 16209.0, 10857.0, 7182.0, 4901.0, 3378.0, 2279.0, 1585.0, 1093.0, 757.0, 504.0, 340.0, 223.0, 163.0, 107.0, 96.0, 62.0, 39.0, 28.0, 21.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.2344970703125, -0.2268848419189453, -0.21927261352539062, -0.21166038513183594, -0.20404815673828125, -0.19643592834472656, -0.18882369995117188, -0.1812114715576172, -0.1735992431640625, -0.1659870147705078, -0.15837478637695312, -0.15076255798339844, -0.14315032958984375, -0.13553810119628906, -0.12792587280273438, -0.12031364440917969, -0.112701416015625, -0.10508918762207031, -0.09747695922851562, -0.08986473083496094, -0.08225250244140625, -0.07464027404785156, -0.06702804565429688, -0.05941581726074219, -0.0518035888671875, -0.04419136047363281, -0.036579132080078125, -0.028966903686523438, -0.02135467529296875, -0.013742446899414062, -0.006130218505859375, 0.0014820098876953125, 0.00909423828125, 0.016706466674804688, 0.024318695068359375, 0.03193092346191406, 0.03954315185546875, 0.04715538024902344, 0.054767608642578125, 0.06237983703613281, 0.0699920654296875, 0.07760429382324219, 0.08521652221679688, 0.09282875061035156, 0.10044097900390625, 0.10805320739746094, 0.11566543579101562, 0.12327766418457031, 0.130889892578125, 0.1385021209716797, 0.14611434936523438, 0.15372657775878906, 0.16133880615234375, 0.16895103454589844, 0.17656326293945312, 0.1841754913330078, 0.1917877197265625, 0.1993999481201172, 0.20701217651367188, 0.21462440490722656, 0.22223663330078125, 0.22984886169433594, 0.23746109008789062, 0.2450733184814453, 0.252685546875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 1.0, 9.0, 6.0, 6.0, 12.0, 13.0, 14.0, 16.0, 16.0, 15.0, 22.0, 27.0, 23.0, 26.0, 30.0, 37.0, 46.0, 42.0, 40.0, 39.0, 35.0, 41.0, 1060.0, 40.0, 40.0, 35.0, 33.0, 35.0, 31.0, 34.0, 30.0, 18.0, 26.0, 24.0, 17.0, 12.0, 20.0, 11.0, 9.0, 9.0, 7.0, 8.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.142578125, -2.079803466796875, -2.01702880859375, -1.954254150390625, -1.8914794921875, -1.828704833984375, -1.76593017578125, -1.703155517578125, -1.640380859375, -1.577606201171875, -1.51483154296875, -1.452056884765625, -1.3892822265625, -1.326507568359375, -1.26373291015625, -1.200958251953125, -1.13818359375, -1.075408935546875, -1.01263427734375, -0.949859619140625, -0.8870849609375, -0.824310302734375, -0.76153564453125, -0.698760986328125, -0.635986328125, -0.573211669921875, -0.51043701171875, -0.447662353515625, -0.3848876953125, -0.322113037109375, -0.25933837890625, -0.196563720703125, -0.1337890625, -0.071014404296875, -0.00823974609375, 0.054534912109375, 0.1173095703125, 0.180084228515625, 0.24285888671875, 0.305633544921875, 0.368408203125, 0.431182861328125, 0.49395751953125, 0.556732177734375, 0.6195068359375, 0.682281494140625, 0.74505615234375, 0.807830810546875, 0.87060546875, 0.933380126953125, 0.99615478515625, 1.058929443359375, 1.1217041015625, 1.184478759765625, 1.24725341796875, 1.310028076171875, 1.372802734375, 1.435577392578125, 1.49835205078125, 1.561126708984375, 1.6239013671875, 1.686676025390625, 1.74945068359375, 1.812225341796875, 1.875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 11.0, 12.0, 19.0, 29.0, 35.0, 63.0, 82.0, 137.0, 217.0, 316.0, 511.0, 740.0, 1220.0, 1866.0, 3008.0, 4823.0, 7652.0, 12497.0, 20283.0, 31912.0, 50730.0, 77055.0, 111848.0, 167424.0, 1181083.0, 138485.0, 100136.0, 67785.0, 43622.0, 27685.0, 17437.0, 10592.0, 6673.0, 4196.0, 2502.0, 1570.0, 1007.0, 663.0, 404.0, 294.0, 173.0, 118.0, 75.0, 52.0, 37.0, 21.0, 12.0, 13.0, 7.0, 3.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.1842041015625, -0.17883872985839844, -0.17347335815429688, -0.1681079864501953, -0.16274261474609375, -0.1573772430419922, -0.15201187133789062, -0.14664649963378906, -0.1412811279296875, -0.13591575622558594, -0.13055038452148438, -0.1251850128173828, -0.11981964111328125, -0.11445426940917969, -0.10908889770507812, -0.10372352600097656, -0.098358154296875, -0.09299278259277344, -0.08762741088867188, -0.08226203918457031, -0.07689666748046875, -0.07153129577636719, -0.06616592407226562, -0.06080055236816406, -0.0554351806640625, -0.05006980895996094, -0.044704437255859375, -0.03933906555175781, -0.03397369384765625, -0.028608322143554688, -0.023242950439453125, -0.017877578735351562, -0.01251220703125, -0.0071468353271484375, -0.001781463623046875, 0.0035839080810546875, 0.00894927978515625, 0.014314651489257812, 0.019680023193359375, 0.025045394897460938, 0.0304107666015625, 0.03577613830566406, 0.041141510009765625, 0.04650688171386719, 0.05187225341796875, 0.05723762512207031, 0.06260299682617188, 0.06796836853027344, 0.073333740234375, 0.07869911193847656, 0.08406448364257812, 0.08942985534667969, 0.09479522705078125, 0.10016059875488281, 0.10552597045898438, 0.11089134216308594, 0.1162567138671875, 0.12162208557128906, 0.12698745727539062, 0.1323528289794922, 0.13771820068359375, 0.1430835723876953, 0.14844894409179688, 0.15381431579589844, 0.1591796875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 8.0, 11.0, 9.0, 9.0, 20.0, 19.0, 31.0, 43.0, 46.0, 45.0, 56.0, 54.0, 61.0, 85.0, 70.0, 61.0, 54.0, 67.0, 43.0, 51.0, 30.0, 32.0, 24.0, 18.0, 13.0, 9.0, 8.0, 7.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0127105712890625, -0.01234745979309082, -0.01198434829711914, -0.011621236801147461, -0.011258125305175781, -0.010895013809204102, -0.010531902313232422, -0.010168790817260742, -0.009805679321289062, -0.009442567825317383, -0.009079456329345703, -0.008716344833374023, -0.008353233337402344, -0.007990121841430664, -0.007627010345458984, -0.007263898849487305, -0.006900787353515625, -0.006537675857543945, -0.006174564361572266, -0.005811452865600586, -0.005448341369628906, -0.0050852298736572266, -0.004722118377685547, -0.004359006881713867, -0.0039958953857421875, -0.003632783889770508, -0.003269672393798828, -0.0029065608978271484, -0.0025434494018554688, -0.002180337905883789, -0.0018172264099121094, -0.0014541149139404297, -0.00109100341796875, -0.0007278919219970703, -0.0003647804260253906, -1.6689300537109375e-06, 0.00036144256591796875, 0.0007245540618896484, 0.0010876655578613281, 0.0014507770538330078, 0.0018138885498046875, 0.002177000045776367, 0.002540111541748047, 0.0029032230377197266, 0.0032663345336914062, 0.003629446029663086, 0.003992557525634766, 0.004355669021606445, 0.004718780517578125, 0.005081892013549805, 0.005445003509521484, 0.005808115005493164, 0.006171226501464844, 0.0065343379974365234, 0.006897449493408203, 0.007260560989379883, 0.0076236724853515625, 0.007986783981323242, 0.008349895477294922, 0.008713006973266602, 0.009076118469238281, 0.009439229965209961, 0.00980234146118164, 0.01016545295715332, 0.010528564453125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 19.0, 15.0, 24.0, 32.0, 40.0, 52.0, 58.0, 84.0, 140.0, 382.0, 2731.0, 851488.0, 191134.0, 1597.0, 278.0, 128.0, 79.0, 58.0, 60.0, 31.0, 22.0, 26.0, 12.0, 12.0, 13.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.232177734375, -0.22414398193359375, -0.2161102294921875, -0.20807647705078125, -0.200042724609375, -0.19200897216796875, -0.1839752197265625, -0.17594146728515625, -0.16790771484375, -0.15987396240234375, -0.1518402099609375, -0.14380645751953125, -0.135772705078125, -0.12773895263671875, -0.1197052001953125, -0.11167144775390625, -0.1036376953125, -0.09560394287109375, -0.0875701904296875, -0.07953643798828125, -0.071502685546875, -0.06346893310546875, -0.0554351806640625, -0.04740142822265625, -0.03936767578125, -0.03133392333984375, -0.0233001708984375, -0.01526641845703125, -0.007232666015625, 0.00080108642578125, 0.0088348388671875, 0.01686859130859375, 0.02490234375, 0.03293609619140625, 0.0409698486328125, 0.04900360107421875, 0.057037353515625, 0.06507110595703125, 0.0731048583984375, 0.08113861083984375, 0.08917236328125, 0.09720611572265625, 0.1052398681640625, 0.11327362060546875, 0.121307373046875, 0.12934112548828125, 0.1373748779296875, 0.14540863037109375, 0.1534423828125, 0.16147613525390625, 0.1695098876953125, 0.17754364013671875, 0.185577392578125, 0.19361114501953125, 0.2016448974609375, 0.20967864990234375, 0.21771240234375, 0.22574615478515625, 0.2337799072265625, 0.24181365966796875, 0.249847412109375, 0.25788116455078125, 0.2659149169921875, 0.27394866943359375, 0.281982421875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 22.0, 98.0, 463.0, 300.0, 76.0, 26.0, 14.0, 11.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02557823807001114, -0.023577380925416946, -0.021576521918177605, -0.019575662910938263, -0.01757480576634407, -0.015573947690427303, -0.013573089614510536, -0.011572231538593769, -0.009571373462677002, -0.007570515386760235, -0.005569657310843468, -0.0035687992349267006, -0.0015679411590099335, 0.00043291691690683365, 0.0024337749928236008, 0.004434633068740368, 0.006435491144657135, 0.008436349220573902, 0.01043720729649067, 0.012438065372407436, 0.014438923448324203, 0.016439780592918396, 0.018440639600157738, 0.02044149860739708, 0.022442355751991272, 0.024443212896585464, 0.026444071903824806, 0.028444930911064148, 0.03044578805565834, 0.03244664520025253, 0.034447506070137024, 0.036448363214731216, 0.038449227809906006, 0.0404500849545002, 0.04245094209909439, 0.04445180296897888, 0.046452660113573074, 0.04845351725816727, 0.05045437812805176, 0.05245523527264595, 0.05445609241724014, 0.056456949561834335, 0.05845780670642853, 0.06045866757631302, 0.06245952472090721, 0.0644603818655014, 0.0664612427353859, 0.06846209615468979, 0.07046295702457428, 0.07246381789445877, 0.07446467131376266, 0.07646553218364716, 0.07846638560295105, 0.08046724647283554, 0.08246810734272003, 0.08446896076202393, 0.08646982163190842, 0.08847068250179291, 0.0904715359210968, 0.09247239679098129, 0.09447325766086578, 0.09647411108016968, 0.09847497195005417, 0.10047582536935806, 0.10247668623924255]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 9.0, 7.0, 6.0, 7.0, 16.0, 11.0, 17.0, 30.0, 35.0, 40.0, 29.0, 22.0, 27.0, 34.0, 47.0, 35.0, 61.0, 48.0, 45.0, 57.0, 47.0, 45.0, 41.0, 36.0, 26.0, 36.0, 28.0, 24.0, 22.0, 21.0, 23.0, 13.0, 17.0, 10.0, 12.0, 4.0, 7.0, 3.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01805245876312256, -0.017528370022773743, -0.017004279419779778, -0.016480188816785812, -0.015956100076436996, -0.015432010404765606, -0.014907920733094215, -0.014383831061422825, -0.013859741389751434, -0.013335651718080044, -0.012811562046408653, -0.012287472374737263, -0.011763382703065872, -0.011239293031394482, -0.010715203359723091, -0.0101911136880517, -0.00966702401638031, -0.00914293434470892, -0.008618844673037529, -0.008094755001366138, -0.007570665329694748, -0.007046575658023357, -0.006522485986351967, -0.005998396314680576, -0.005474306643009186, -0.004950216971337795, -0.004426127299666405, -0.003902037627995014, -0.0033779479563236237, -0.002853858284652233, -0.0023297686129808426, -0.001805678941309452, -0.0012815892696380615, -0.000757499597966671, -0.00023340992629528046, 0.0002906797453761101, 0.0008147694170475006, 0.0013388590887188911, 0.0018629487603902817, 0.002387038432061672, 0.0029111281037330627, 0.0034352177754044533, 0.003959307447075844, 0.004483397118747234, 0.005007486790418625, 0.005531576462090015, 0.006055666133761406, 0.0065797558054327965, 0.007103845477104187, 0.0076279351487755775, 0.008152024820446968, 0.008676114492118359, 0.00920020416378975, 0.00972429383546114, 0.01024838350713253, 0.01077247317880392, 0.011296562850475311, 0.011820652522146702, 0.012344742193818092, 0.012868831865489483, 0.013392921537160873, 0.013917011208832264, 0.014441100880503654, 0.014965190552175045, 0.015489280223846436]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 9.0, 9.0, 13.0, 16.0, 7.0, 11.0, 21.0, 10.0, 25.0, 14.0, 21.0, 36.0, 34.0, 27.0, 27.0, 35.0, 43.0, 40.0, 35.0, 36.0, 57.0, 43.0, 36.0, 47.0, 36.0, 32.0, 32.0, 34.0, 24.0, 27.0, 16.0, 27.0, 22.0, 19.0, 8.0, 14.0, 4.0, 7.0, 8.0, 5.0, 10.0, 6.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.744140625, -2.650238037109375, -2.55633544921875, -2.462432861328125, -2.3685302734375, -2.274627685546875, -2.18072509765625, -2.086822509765625, -1.992919921875, -1.899017333984375, -1.80511474609375, -1.711212158203125, -1.6173095703125, -1.523406982421875, -1.42950439453125, -1.335601806640625, -1.24169921875, -1.147796630859375, -1.05389404296875, -0.959991455078125, -0.8660888671875, -0.772186279296875, -0.67828369140625, -0.584381103515625, -0.490478515625, -0.396575927734375, -0.30267333984375, -0.208770751953125, -0.1148681640625, -0.020965576171875, 0.07293701171875, 0.166839599609375, 0.2607421875, 0.354644775390625, 0.44854736328125, 0.542449951171875, 0.6363525390625, 0.730255126953125, 0.82415771484375, 0.918060302734375, 1.011962890625, 1.105865478515625, 1.19976806640625, 1.293670654296875, 1.3875732421875, 1.481475830078125, 1.57537841796875, 1.669281005859375, 1.76318359375, 1.857086181640625, 1.95098876953125, 2.044891357421875, 2.1387939453125, 2.232696533203125, 2.32659912109375, 2.420501708984375, 2.514404296875, 2.608306884765625, 2.70220947265625, 2.796112060546875, 2.8900146484375, 2.983917236328125, 3.07781982421875, 3.171722412109375, 3.265625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 15.0, 18.0, 33.0, 53.0, 81.0, 140.0, 291.0, 545.0, 1094.0, 2312.0, 4734.0, 9793.0, 19101.0, 36927.0, 78115.0, 218287.0, 369967.0, 175555.0, 65885.0, 32360.0, 16681.0, 8465.0, 4207.0, 1980.0, 878.0, 478.0, 204.0, 124.0, 80.0, 44.0, 29.0, 20.0, 22.0, 13.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.494140625, -3.38629150390625, -3.2784423828125, -3.17059326171875, -3.062744140625, -2.95489501953125, -2.8470458984375, -2.73919677734375, -2.63134765625, -2.52349853515625, -2.4156494140625, -2.30780029296875, -2.199951171875, -2.09210205078125, -1.9842529296875, -1.87640380859375, -1.7685546875, -1.66070556640625, -1.5528564453125, -1.44500732421875, -1.337158203125, -1.22930908203125, -1.1214599609375, -1.01361083984375, -0.90576171875, -0.79791259765625, -0.6900634765625, -0.58221435546875, -0.474365234375, -0.36651611328125, -0.2586669921875, -0.15081787109375, -0.04296875, 0.06488037109375, 0.1727294921875, 0.28057861328125, 0.388427734375, 0.49627685546875, 0.6041259765625, 0.71197509765625, 0.81982421875, 0.92767333984375, 1.0355224609375, 1.14337158203125, 1.251220703125, 1.35906982421875, 1.4669189453125, 1.57476806640625, 1.6826171875, 1.79046630859375, 1.8983154296875, 2.00616455078125, 2.114013671875, 2.22186279296875, 2.3297119140625, 2.43756103515625, 2.54541015625, 2.65325927734375, 2.7611083984375, 2.86895751953125, 2.976806640625, 3.08465576171875, 3.1925048828125, 3.30035400390625, 3.408203125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 4.0, 8.0, 6.0, 9.0, 14.0, 11.0, 16.0, 20.0, 27.0, 31.0, 33.0, 35.0, 35.0, 36.0, 40.0, 57.0, 68.0, 92.0, 159.0, 1387.0, 299.0, 140.0, 90.0, 62.0, 47.0, 37.0, 28.0, 42.0, 27.0, 25.0, 28.0, 18.0, 13.0, 11.0, 9.0, 12.0, 11.0, 11.0, 5.0, 8.0, 4.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.5546875, -11.2022705078125, -10.849853515625, -10.4974365234375, -10.14501953125, -9.7926025390625, -9.440185546875, -9.0877685546875, -8.7353515625, -8.3829345703125, -8.030517578125, -7.6781005859375, -7.32568359375, -6.9732666015625, -6.620849609375, -6.2684326171875, -5.916015625, -5.5635986328125, -5.211181640625, -4.8587646484375, -4.50634765625, -4.1539306640625, -3.801513671875, -3.4490966796875, -3.0966796875, -2.7442626953125, -2.391845703125, -2.0394287109375, -1.68701171875, -1.3345947265625, -0.982177734375, -0.6297607421875, -0.27734375, 0.0750732421875, 0.427490234375, 0.7799072265625, 1.13232421875, 1.4847412109375, 1.837158203125, 2.1895751953125, 2.5419921875, 2.8944091796875, 3.246826171875, 3.5992431640625, 3.95166015625, 4.3040771484375, 4.656494140625, 5.0089111328125, 5.361328125, 5.7137451171875, 6.066162109375, 6.4185791015625, 6.77099609375, 7.1234130859375, 7.475830078125, 7.8282470703125, 8.1806640625, 8.5330810546875, 8.885498046875, 9.2379150390625, 9.59033203125, 9.9427490234375, 10.295166015625, 10.6475830078125, 11.0]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 1.0, 4.0, 2.0, 7.0, 13.0, 6.0, 10.0, 19.0, 18.0, 25.0, 35.0, 37.0, 59.0, 76.0, 116.0, 180.0, 316.0, 579.0, 2127.0, 69516.0, 3049432.0, 20369.0, 1415.0, 488.0, 258.0, 172.0, 113.0, 81.0, 51.0, 44.0, 20.0, 26.0, 10.0, 17.0, 10.0, 13.0, 8.0, 7.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.09375, -31.96728515625, -30.8408203125, -29.71435546875, -28.587890625, -27.46142578125, -26.3349609375, -25.20849609375, -24.08203125, -22.95556640625, -21.8291015625, -20.70263671875, -19.576171875, -18.44970703125, -17.3232421875, -16.19677734375, -15.0703125, -13.94384765625, -12.8173828125, -11.69091796875, -10.564453125, -9.43798828125, -8.3115234375, -7.18505859375, -6.05859375, -4.93212890625, -3.8056640625, -2.67919921875, -1.552734375, -0.42626953125, 0.7001953125, 1.82666015625, 2.953125, 4.07958984375, 5.2060546875, 6.33251953125, 7.458984375, 8.58544921875, 9.7119140625, 10.83837890625, 11.96484375, 13.09130859375, 14.2177734375, 15.34423828125, 16.470703125, 17.59716796875, 18.7236328125, 19.85009765625, 20.9765625, 22.10302734375, 23.2294921875, 24.35595703125, 25.482421875, 26.60888671875, 27.7353515625, 28.86181640625, 29.98828125, 31.11474609375, 32.2412109375, 33.36767578125, 34.494140625, 35.62060546875, 36.7470703125, 37.87353515625, 39.0]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 10.0, 273.0, 652.0, 80.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.60725784301758, -38.02503967285156, -33.44282150268555, -28.86060333251953, -24.278385162353516, -19.6961669921875, -15.113948822021484, -10.531730651855469, -5.949512481689453, -1.3672943115234375, 3.214923858642578, 7.797142028808594, 12.37936019897461, 16.961578369140625, 21.54379653930664, 26.126014709472656, 30.708232879638672, 35.29045104980469, 39.8726692199707, 44.45488739013672, 49.037105560302734, 53.61932373046875, 58.201541900634766, 62.78376007080078, 67.36598205566406, 71.94819641113281, 76.5304183959961, 81.11264038085938, 85.69485473632812, 90.27706909179688, 94.85929107666016, 99.44151306152344, 104.02372741699219, 108.60594177246094, 113.18816375732422, 117.7703857421875, 122.35260009765625, 126.934814453125, 131.51702880859375, 136.09925842285156, 140.6814727783203, 145.26368713378906, 149.84591674804688, 154.42813110351562, 159.01034545898438, 163.59255981445312, 168.17477416992188, 172.7570037841797, 177.33921813964844, 181.9214324951172, 186.503662109375, 191.08587646484375, 195.6680908203125, 200.25030517578125, 204.83251953125, 209.4147491455078, 213.99696350097656, 218.5791778564453, 223.16140747070312, 227.74362182617188, 232.32583618164062, 236.90805053710938, 241.49026489257812, 246.07249450683594, 250.6547088623047]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 9.0, 11.0, 13.0, 19.0, 20.0, 21.0, 18.0, 26.0, 31.0, 28.0, 25.0, 23.0, 33.0, 34.0, 30.0, 48.0, 55.0, 34.0, 36.0, 33.0, 43.0, 33.0, 39.0, 34.0, 40.0, 27.0, 32.0, 37.0, 26.0, 26.0, 17.0, 22.0, 13.0, 14.0, 9.0, 8.0, 3.0, 6.0, 7.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.59071350097656, -33.52473831176758, -32.458763122558594, -31.392789840698242, -30.326814651489258, -29.260839462280273, -28.194866180419922, -27.128890991210938, -26.062915802001953, -24.99694061279297, -23.930965423583984, -22.864992141723633, -21.79901695251465, -20.733041763305664, -19.667068481445312, -18.601093292236328, -17.535118103027344, -16.46914291381836, -15.403168678283691, -14.337194442749023, -13.271219253540039, -12.205244064331055, -11.139269828796387, -10.073295593261719, -9.007320404052734, -7.941345691680908, -6.875370979309082, -5.809396266937256, -4.74342155456543, -3.6774468421936035, -2.6114721298217773, -1.5454974174499512, -0.4795188903808594, 0.5864558219909668, 1.652430534362793, 2.718405246734619, 3.7843799591064453, 4.8503546714782715, 5.916329383850098, 6.982304096221924, 8.04827880859375, 9.114253997802734, 10.180228233337402, 11.24620246887207, 12.312177658081055, 13.378152847290039, 14.444127082824707, 15.510101318359375, 16.57607650756836, 17.642051696777344, 18.708026885986328, 19.77400016784668, 20.839975357055664, 21.90595054626465, 22.971923828125, 24.037899017333984, 25.10387420654297, 26.169849395751953, 27.235824584960938, 28.30179786682129, 29.367773056030273, 30.433748245239258, 31.49972152709961, 32.565696716308594, 33.63167190551758]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 7.0, 6.0, 4.0, 8.0, 11.0, 12.0, 19.0, 9.0, 14.0, 15.0, 29.0, 24.0, 28.0, 38.0, 28.0, 45.0, 17.0, 34.0, 37.0, 37.0, 47.0, 39.0, 58.0, 42.0, 46.0, 34.0, 34.0, 28.0, 27.0, 28.0, 23.0, 24.0, 27.0, 22.0, 12.0, 16.0, 10.0, 9.0, 5.0, 7.0, 5.0, 6.0, 9.0, 5.0, 5.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.12109375, -3.0181884765625, -2.915283203125, -2.8123779296875, -2.70947265625, -2.6065673828125, -2.503662109375, -2.4007568359375, -2.2978515625, -2.1949462890625, -2.092041015625, -1.9891357421875, -1.88623046875, -1.7833251953125, -1.680419921875, -1.5775146484375, -1.474609375, -1.3717041015625, -1.268798828125, -1.1658935546875, -1.06298828125, -0.9600830078125, -0.857177734375, -0.7542724609375, -0.6513671875, -0.5484619140625, -0.445556640625, -0.3426513671875, -0.23974609375, -0.1368408203125, -0.033935546875, 0.0689697265625, 0.171875, 0.2747802734375, 0.377685546875, 0.4805908203125, 0.58349609375, 0.6864013671875, 0.789306640625, 0.8922119140625, 0.9951171875, 1.0980224609375, 1.200927734375, 1.3038330078125, 1.40673828125, 1.5096435546875, 1.612548828125, 1.7154541015625, 1.818359375, 1.9212646484375, 2.024169921875, 2.1270751953125, 2.22998046875, 2.3328857421875, 2.435791015625, 2.5386962890625, 2.6416015625, 2.7445068359375, 2.847412109375, 2.9503173828125, 3.05322265625, 3.1561279296875, 3.259033203125, 3.3619384765625, 3.46484375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 9.0, 6.0, 5.0, 9.0, 11.0, 14.0, 8.0, 17.0, 32.0, 37.0, 48.0, 104.0, 155.0, 346.0, 767.0, 2102.0, 7504.0, 33472.0, 175655.0, 877574.0, 1964520.0, 904873.0, 180829.0, 34418.0, 7845.0, 2157.0, 857.0, 393.0, 170.0, 115.0, 81.0, 30.0, 25.0, 31.0, 12.0, 15.0, 5.0, 13.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.19921875, -5.99603271484375, -5.7928466796875, -5.58966064453125, -5.386474609375, -5.18328857421875, -4.9801025390625, -4.77691650390625, -4.57373046875, -4.37054443359375, -4.1673583984375, -3.96417236328125, -3.760986328125, -3.55780029296875, -3.3546142578125, -3.15142822265625, -2.9482421875, -2.74505615234375, -2.5418701171875, -2.33868408203125, -2.135498046875, -1.93231201171875, -1.7291259765625, -1.52593994140625, -1.32275390625, -1.11956787109375, -0.9163818359375, -0.71319580078125, -0.510009765625, -0.30682373046875, -0.1036376953125, 0.09954833984375, 0.302734375, 0.50592041015625, 0.7091064453125, 0.91229248046875, 1.115478515625, 1.31866455078125, 1.5218505859375, 1.72503662109375, 1.92822265625, 2.13140869140625, 2.3345947265625, 2.53778076171875, 2.740966796875, 2.94415283203125, 3.1473388671875, 3.35052490234375, 3.5537109375, 3.75689697265625, 3.9600830078125, 4.16326904296875, 4.366455078125, 4.56964111328125, 4.7728271484375, 4.97601318359375, 5.17919921875, 5.38238525390625, 5.5855712890625, 5.78875732421875, 5.991943359375, 6.19512939453125, 6.3983154296875, 6.60150146484375, 6.8046875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 15.0, 25.0, 22.0, 37.0, 73.0, 94.0, 139.0, 220.0, 296.0, 404.0, 495.0, 547.0, 478.0, 355.0, 292.0, 169.0, 157.0, 85.0, 59.0, 42.0, 25.0, 14.0, 11.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.609375, -9.269775390625, -8.93017578125, -8.590576171875, -8.2509765625, -7.911376953125, -7.57177734375, -7.232177734375, -6.892578125, -6.552978515625, -6.21337890625, -5.873779296875, -5.5341796875, -5.194580078125, -4.85498046875, -4.515380859375, -4.17578125, -3.836181640625, -3.49658203125, -3.156982421875, -2.8173828125, -2.477783203125, -2.13818359375, -1.798583984375, -1.458984375, -1.119384765625, -0.77978515625, -0.440185546875, -0.1005859375, 0.239013671875, 0.57861328125, 0.918212890625, 1.2578125, 1.597412109375, 1.93701171875, 2.276611328125, 2.6162109375, 2.955810546875, 3.29541015625, 3.635009765625, 3.974609375, 4.314208984375, 4.65380859375, 4.993408203125, 5.3330078125, 5.672607421875, 6.01220703125, 6.351806640625, 6.69140625, 7.031005859375, 7.37060546875, 7.710205078125, 8.0498046875, 8.389404296875, 8.72900390625, 9.068603515625, 9.408203125, 9.747802734375, 10.08740234375, 10.427001953125, 10.7666015625, 11.106201171875, 11.44580078125, 11.785400390625, 12.125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 16.0, 16.0, 18.0, 44.0, 57.0, 107.0, 184.0, 291.0, 611.0, 1855.0, 18550.0, 479145.0, 3256708.0, 417382.0, 16421.0, 1623.0, 555.0, 273.0, 181.0, 88.0, 58.0, 38.0, 22.0, 16.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.890625, -21.29052734375, -20.6904296875, -20.09033203125, -19.490234375, -18.89013671875, -18.2900390625, -17.68994140625, -17.08984375, -16.48974609375, -15.8896484375, -15.28955078125, -14.689453125, -14.08935546875, -13.4892578125, -12.88916015625, -12.2890625, -11.68896484375, -11.0888671875, -10.48876953125, -9.888671875, -9.28857421875, -8.6884765625, -8.08837890625, -7.48828125, -6.88818359375, -6.2880859375, -5.68798828125, -5.087890625, -4.48779296875, -3.8876953125, -3.28759765625, -2.6875, -2.08740234375, -1.4873046875, -0.88720703125, -0.287109375, 0.31298828125, 0.9130859375, 1.51318359375, 2.11328125, 2.71337890625, 3.3134765625, 3.91357421875, 4.513671875, 5.11376953125, 5.7138671875, 6.31396484375, 6.9140625, 7.51416015625, 8.1142578125, 8.71435546875, 9.314453125, 9.91455078125, 10.5146484375, 11.11474609375, 11.71484375, 12.31494140625, 12.9150390625, 13.51513671875, 14.115234375, 14.71533203125, 15.3154296875, 15.91552734375, 16.515625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 9.0, 41.0, 93.0, 188.0, 217.0, 211.0, 151.0, 62.0, 29.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.044071197509766, -57.2835807800293, -54.523094177246094, -51.762603759765625, -49.002113342285156, -46.24162292480469, -43.481136322021484, -40.720645904541016, -37.96015930175781, -35.199668884277344, -32.43918228149414, -29.678691864013672, -26.918201446533203, -24.157712936401367, -21.39722442626953, -18.636734008789062, -15.876243591308594, -13.115754127502441, -10.355264663696289, -7.594776153564453, -4.834286689758301, -2.0737972259521484, 0.6866912841796875, 3.4471817016601562, 6.207670211791992, 8.968159675598145, 11.728649139404297, 14.489137649536133, 17.24962615966797, 20.010116577148438, 22.770605087280273, 25.531095504760742, 28.291587829589844, 31.05207633972168, 33.812564849853516, 36.573055267333984, 39.33354568481445, 42.094032287597656, 44.854522705078125, 47.615013122558594, 50.37550354003906, 53.13599395751953, 55.896480560302734, 58.6569709777832, 61.41746139526367, 64.17794799804688, 66.93843841552734, 69.69892883300781, 72.45941162109375, 75.21990203857422, 77.98039245605469, 80.74087524414062, 83.5013656616211, 86.26185607910156, 89.02234649658203, 91.7828369140625, 94.54332733154297, 97.30381774902344, 100.0643081665039, 102.82479858398438, 105.58528137207031, 108.34577178955078, 111.10626220703125, 113.86675262451172, 116.62724304199219]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 2.0, 2.0, 13.0, 6.0, 12.0, 15.0, 21.0, 25.0, 19.0, 30.0, 24.0, 32.0, 30.0, 37.0, 36.0, 58.0, 59.0, 48.0, 45.0, 36.0, 41.0, 41.0, 32.0, 30.0, 37.0, 30.0, 32.0, 33.0, 25.0, 27.0, 23.0, 22.0, 10.0, 13.0, 12.0, 9.0, 10.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.402509689331055, -29.45628547668457, -28.51006317138672, -27.563838958740234, -26.617616653442383, -25.6713924407959, -24.725170135498047, -23.778945922851562, -22.83272361755371, -21.886499404907227, -20.940277099609375, -19.99405288696289, -19.04783058166504, -18.101606369018555, -17.155384063720703, -16.20915985107422, -15.26293659210205, -14.316713333129883, -13.370490074157715, -12.424266815185547, -11.478043556213379, -10.531820297241211, -9.585596084594727, -8.639373779296875, -7.693150043487549, -6.746926784515381, -5.800703525543213, -4.854479789733887, -3.908256769180298, -2.962033271789551, -2.015810012817383, -1.0695867538452148, -0.12336349487304688, 0.8228598237037659, 1.7690831422805786, 2.715306520462036, 3.661529779434204, 4.607753276824951, 5.553976535797119, 6.500199794769287, 7.446423053741455, 8.392646789550781, 9.33887004852295, 10.285093307495117, 11.231316566467285, 12.177539825439453, 13.123763084411621, 14.069986343383789, 15.016209602355957, 15.962432861328125, 16.90865707397461, 17.85487937927246, 18.801103591918945, 19.747325897216797, 20.69355010986328, 21.639772415161133, 22.585996627807617, 23.5322208404541, 24.478443145751953, 25.424667358398438, 26.37088966369629, 27.317113876342773, 28.263336181640625, 29.20956039428711, 30.15578269958496]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 10.0, 6.0, 7.0, 10.0, 11.0, 16.0, 23.0, 23.0, 29.0, 25.0, 33.0, 27.0, 20.0, 28.0, 34.0, 31.0, 33.0, 45.0, 53.0, 37.0, 59.0, 40.0, 43.0, 34.0, 35.0, 33.0, 26.0, 32.0, 23.0, 24.0, 22.0, 13.0, 19.0, 15.0, 16.0, 17.0, 7.0, 8.0, 13.0, 9.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.359375, -3.25341796875, -3.1474609375, -3.04150390625, -2.935546875, -2.82958984375, -2.7236328125, -2.61767578125, -2.51171875, -2.40576171875, -2.2998046875, -2.19384765625, -2.087890625, -1.98193359375, -1.8759765625, -1.77001953125, -1.6640625, -1.55810546875, -1.4521484375, -1.34619140625, -1.240234375, -1.13427734375, -1.0283203125, -0.92236328125, -0.81640625, -0.71044921875, -0.6044921875, -0.49853515625, -0.392578125, -0.28662109375, -0.1806640625, -0.07470703125, 0.03125, 0.13720703125, 0.2431640625, 0.34912109375, 0.455078125, 0.56103515625, 0.6669921875, 0.77294921875, 0.87890625, 0.98486328125, 1.0908203125, 1.19677734375, 1.302734375, 1.40869140625, 1.5146484375, 1.62060546875, 1.7265625, 1.83251953125, 1.9384765625, 2.04443359375, 2.150390625, 2.25634765625, 2.3623046875, 2.46826171875, 2.57421875, 2.68017578125, 2.7861328125, 2.89208984375, 2.998046875, 3.10400390625, 3.2099609375, 3.31591796875, 3.421875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 7.0, 3.0, 7.0, 11.0, 11.0, 8.0, 16.0, 27.0, 54.0, 68.0, 93.0, 184.0, 303.0, 427.0, 688.0, 1003.0, 1597.0, 2472.0, 3911.0, 6070.0, 9863.0, 15873.0, 26030.0, 40967.0, 66148.0, 105822.0, 157698.0, 187558.0, 152367.0, 101001.0, 63406.0, 39354.0, 24681.0, 15097.0, 9594.0, 5874.0, 3676.0, 2421.0, 1523.0, 943.0, 634.0, 368.0, 269.0, 159.0, 105.0, 72.0, 30.0, 23.0, 17.0, 8.0, 7.0, 5.0, 1.0, 2.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3095703125, -0.2994041442871094, -0.28923797607421875, -0.2790718078613281, -0.2689056396484375, -0.2587394714355469, -0.24857330322265625, -0.23840713500976562, -0.228240966796875, -0.21807479858398438, -0.20790863037109375, -0.19774246215820312, -0.1875762939453125, -0.17741012573242188, -0.16724395751953125, -0.15707778930664062, -0.14691162109375, -0.13674545288085938, -0.12657928466796875, -0.11641311645507812, -0.1062469482421875, -0.09608078002929688, -0.08591461181640625, -0.07574844360351562, -0.065582275390625, -0.055416107177734375, -0.04524993896484375, -0.035083770751953125, -0.0249176025390625, -0.014751434326171875, -0.00458526611328125, 0.005580902099609375, 0.0157470703125, 0.025913238525390625, 0.03607940673828125, 0.046245574951171875, 0.0564117431640625, 0.06657791137695312, 0.07674407958984375, 0.08691024780273438, 0.097076416015625, 0.10724258422851562, 0.11740875244140625, 0.12757492065429688, 0.1377410888671875, 0.14790725708007812, 0.15807342529296875, 0.16823959350585938, 0.17840576171875, 0.18857192993164062, 0.19873809814453125, 0.20890426635742188, 0.2190704345703125, 0.22923660278320312, 0.23940277099609375, 0.24956893920898438, 0.259735107421875, 0.2699012756347656, 0.28006744384765625, 0.2902336120605469, 0.3003997802734375, 0.3105659484863281, 0.32073211669921875, 0.3308982849121094, 0.341064453125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 8.0, 12.0, 20.0, 14.0, 18.0, 18.0, 23.0, 24.0, 23.0, 30.0, 36.0, 36.0, 47.0, 41.0, 48.0, 39.0, 1066.0, 45.0, 52.0, 48.0, 37.0, 31.0, 34.0, 23.0, 35.0, 35.0, 36.0, 22.0, 12.0, 16.0, 18.0, 10.0, 16.0, 2.0, 5.0, 12.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.115234375, -2.044219970703125, -1.97320556640625, -1.902191162109375, -1.8311767578125, -1.760162353515625, -1.68914794921875, -1.618133544921875, -1.547119140625, -1.476104736328125, -1.40509033203125, -1.334075927734375, -1.2630615234375, -1.192047119140625, -1.12103271484375, -1.050018310546875, -0.97900390625, -0.907989501953125, -0.83697509765625, -0.765960693359375, -0.6949462890625, -0.623931884765625, -0.55291748046875, -0.481903076171875, -0.410888671875, -0.339874267578125, -0.26885986328125, -0.197845458984375, -0.1268310546875, -0.055816650390625, 0.01519775390625, 0.086212158203125, 0.1572265625, 0.228240966796875, 0.29925537109375, 0.370269775390625, 0.4412841796875, 0.512298583984375, 0.58331298828125, 0.654327392578125, 0.725341796875, 0.796356201171875, 0.86737060546875, 0.938385009765625, 1.0093994140625, 1.080413818359375, 1.15142822265625, 1.222442626953125, 1.29345703125, 1.364471435546875, 1.43548583984375, 1.506500244140625, 1.5775146484375, 1.648529052734375, 1.71954345703125, 1.790557861328125, 1.861572265625, 1.932586669921875, 2.00360107421875, 2.074615478515625, 2.1456298828125, 2.216644287109375, 2.28765869140625, 2.358673095703125, 2.4296875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 7.0, 14.0, 18.0, 44.0, 63.0, 89.0, 119.0, 191.0, 245.0, 439.0, 597.0, 904.0, 1522.0, 2322.0, 3593.0, 5687.0, 9153.0, 14845.0, 23644.0, 37588.0, 58439.0, 86845.0, 120606.0, 376570.0, 971600.0, 124973.0, 89739.0, 60798.0, 39509.0, 25103.0, 15639.0, 9737.0, 5973.0, 3764.0, 2359.0, 1517.0, 958.0, 651.0, 429.0, 272.0, 190.0, 123.0, 88.0, 58.0, 35.0, 21.0, 18.0, 12.0, 10.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1851806640625, -0.1795787811279297, -0.17397689819335938, -0.16837501525878906, -0.16277313232421875, -0.15717124938964844, -0.15156936645507812, -0.1459674835205078, -0.1403656005859375, -0.1347637176513672, -0.12916183471679688, -0.12355995178222656, -0.11795806884765625, -0.11235618591308594, -0.10675430297851562, -0.10115242004394531, -0.095550537109375, -0.08994865417480469, -0.08434677124023438, -0.07874488830566406, -0.07314300537109375, -0.06754112243652344, -0.061939239501953125, -0.05633735656738281, -0.0507354736328125, -0.04513359069824219, -0.039531707763671875, -0.03392982482910156, -0.02832794189453125, -0.022726058959960938, -0.017124176025390625, -0.011522293090820312, -0.00592041015625, -0.0003185272216796875, 0.005283355712890625, 0.010885238647460938, 0.01648712158203125, 0.022089004516601562, 0.027690887451171875, 0.03329277038574219, 0.0388946533203125, 0.04449653625488281, 0.050098419189453125, 0.05570030212402344, 0.06130218505859375, 0.06690406799316406, 0.07250595092773438, 0.07810783386230469, 0.083709716796875, 0.08931159973144531, 0.09491348266601562, 0.10051536560058594, 0.10611724853515625, 0.11171913146972656, 0.11732101440429688, 0.12292289733886719, 0.1285247802734375, 0.1341266632080078, 0.13972854614257812, 0.14533042907714844, 0.15093231201171875, 0.15653419494628906, 0.16213607788085938, 0.1677379608154297, 0.17333984375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 8.0, 10.0, 16.0, 14.0, 15.0, 16.0, 20.0, 21.0, 32.0, 32.0, 47.0, 37.0, 51.0, 73.0, 113.0, 98.0, 88.0, 45.0, 26.0, 35.0, 37.0, 24.0, 19.0, 20.0, 17.0, 16.0, 24.0, 10.0, 5.0, 6.0, 6.0, 1.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.007534027099609375, -0.007284224033355713, -0.007034420967102051, -0.006784617900848389, -0.0065348148345947266, -0.0062850117683410645, -0.006035208702087402, -0.00578540563583374, -0.005535602569580078, -0.005285799503326416, -0.005035996437072754, -0.004786193370819092, -0.00453639030456543, -0.004286587238311768, -0.0040367841720581055, -0.0037869811058044434, -0.0035371780395507812, -0.003287374973297119, -0.003037571907043457, -0.002787768840789795, -0.002537965774536133, -0.0022881627082824707, -0.0020383596420288086, -0.0017885565757751465, -0.0015387535095214844, -0.0012889504432678223, -0.0010391473770141602, -0.000789344310760498, -0.0005395412445068359, -0.00028973817825317383, -3.993511199951172e-05, 0.0002098679542541504, 0.0004596710205078125, 0.0007094740867614746, 0.0009592771530151367, 0.0012090802192687988, 0.001458883285522461, 0.001708686351776123, 0.001958489418029785, 0.0022082924842834473, 0.0024580955505371094, 0.0027078986167907715, 0.0029577016830444336, 0.0032075047492980957, 0.003457307815551758, 0.00370711088180542, 0.003956913948059082, 0.004206717014312744, 0.004456520080566406, 0.004706323146820068, 0.0049561262130737305, 0.005205929279327393, 0.005455732345581055, 0.005705535411834717, 0.005955338478088379, 0.006205141544342041, 0.006454944610595703, 0.006704747676849365, 0.006954550743103027, 0.0072043538093566895, 0.0074541568756103516, 0.007703959941864014, 0.007953763008117676, 0.008203566074371338, 0.008453369140625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 1.0, 4.0, 7.0, 3.0, 8.0, 18.0, 18.0, 23.0, 15.0, 28.0, 26.0, 45.0, 63.0, 88.0, 269.0, 1329.0, 43504.0, 987592.0, 14111.0, 823.0, 216.0, 101.0, 56.0, 45.0, 26.0, 30.0, 19.0, 16.0, 12.0, 11.0, 10.0, 17.0, 2.0, 3.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1876220703125, -0.1816425323486328, -0.17566299438476562, -0.16968345642089844, -0.16370391845703125, -0.15772438049316406, -0.15174484252929688, -0.1457653045654297, -0.1397857666015625, -0.1338062286376953, -0.12782669067382812, -0.12184715270996094, -0.11586761474609375, -0.10988807678222656, -0.10390853881835938, -0.09792900085449219, -0.091949462890625, -0.08596992492675781, -0.07999038696289062, -0.07401084899902344, -0.06803131103515625, -0.06205177307128906, -0.056072235107421875, -0.05009269714355469, -0.0441131591796875, -0.03813362121582031, -0.032154083251953125, -0.026174545288085938, -0.02019500732421875, -0.014215469360351562, -0.008235931396484375, -0.0022563934326171875, 0.00372314453125, 0.009702682495117188, 0.015682220458984375, 0.021661758422851562, 0.02764129638671875, 0.03362083435058594, 0.039600372314453125, 0.04557991027832031, 0.0515594482421875, 0.05753898620605469, 0.06351852416992188, 0.06949806213378906, 0.07547760009765625, 0.08145713806152344, 0.08743667602539062, 0.09341621398925781, 0.099395751953125, 0.10537528991699219, 0.11135482788085938, 0.11733436584472656, 0.12331390380859375, 0.12929344177246094, 0.13527297973632812, 0.1412525177001953, 0.1472320556640625, 0.1532115936279297, 0.15919113159179688, 0.16517066955566406, 0.17115020751953125, 0.17712974548339844, 0.18310928344726562, 0.1890888214111328, 0.195068359375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 22.0, 55.0, 180.0, 443.0, 193.0, 62.0, 30.0, 7.0, 9.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047456078231334686, -0.04594796150922775, -0.04443984851241112, -0.04293173551559448, -0.04142361879348755, -0.039915502071380615, -0.03840738907456398, -0.036899276077747345, -0.03539115935564041, -0.03388304263353348, -0.03237492963671684, -0.03086681477725506, -0.029358699917793274, -0.02785058505833149, -0.026342470198869705, -0.02483435533940792, -0.023326240479946136, -0.021818125620484352, -0.020310010761022568, -0.018801895901560783, -0.017293781042099, -0.015785666182637215, -0.01427755132317543, -0.012769436463713646, -0.011261321604251862, -0.009753206744790077, -0.008245091885328293, -0.0067369770258665085, -0.005228862166404724, -0.0037207473069429398, -0.0022126324474811554, -0.000704517588019371, 0.0008035972714424133, 0.0023117121309041977, 0.003819826990365982, 0.005327941849827766, 0.006836056709289551, 0.008344171568751335, 0.00985228642821312, 0.011360401287674904, 0.012868516147136688, 0.014376631006598473, 0.015884745866060257, 0.01739286072552204, 0.018900975584983826, 0.02040909044444561, 0.021917205303907394, 0.02342532016336918, 0.024933435022830963, 0.026441549882292747, 0.027949664741754532, 0.029457779601216316, 0.0309658944606781, 0.032474011182785034, 0.03398212417960167, 0.035490237176418304, 0.03699835389852524, 0.03850647062063217, 0.04001458361744881, 0.04152269661426544, 0.043030813336372375, 0.04453893005847931, 0.046047043055295944, 0.04755515605211258, 0.04906327277421951]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 7.0, 5.0, 10.0, 8.0, 8.0, 13.0, 20.0, 13.0, 14.0, 23.0, 20.0, 21.0, 37.0, 29.0, 31.0, 35.0, 25.0, 27.0, 46.0, 52.0, 38.0, 37.0, 37.0, 41.0, 31.0, 31.0, 44.0, 27.0, 33.0, 30.0, 23.0, 22.0, 19.0, 26.0, 19.0, 15.0, 14.0, 15.0, 13.0, 6.0, 8.0, 3.0, 5.0, 3.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.009925782680511475, -0.00963624007999897, -0.009346697479486465, -0.009057154878973961, -0.008767612278461456, -0.008478069677948952, -0.008188527077436447, -0.007898984476923943, -0.007609441876411438, -0.007319899275898933, -0.007030356675386429, -0.006740814074873924, -0.00645127147436142, -0.006161728873848915, -0.0058721862733364105, -0.005582643672823906, -0.005293101072311401, -0.005003558471798897, -0.004714015871286392, -0.004424473270773888, -0.004134930670261383, -0.0038453880697488785, -0.003555845469236374, -0.0032663028687238693, -0.0029767602682113647, -0.00268721766769886, -0.0023976750671863556, -0.002108132466673851, -0.0018185898661613464, -0.0015290472656488419, -0.0012395046651363373, -0.0009499620646238327, -0.0006604194641113281, -0.00037087686359882355, -8.133426308631897e-05, 0.0002082083374261856, 0.0004977509379386902, 0.0007872935384511948, 0.0010768361389636993, 0.001366378739476204, 0.0016559213399887085, 0.001945463940501213, 0.0022350065410137177, 0.0025245491415262222, 0.002814091742038727, 0.0031036343425512314, 0.003393176943063736, 0.0036827195435762405, 0.003972262144088745, 0.00426180474460125, 0.004551347345113754, 0.004840889945626259, 0.005130432546138763, 0.005419975146651268, 0.005709517747163773, 0.005999060347676277, 0.006288602948188782, 0.006578145548701286, 0.006867688149213791, 0.0071572307497262955, 0.0074467733502388, 0.007736315950751305, 0.00802585855126381, 0.008315401151776314, 0.008604943752288818]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 10.0, 6.0, 8.0, 9.0, 10.0, 17.0, 23.0, 24.0, 28.0, 25.0, 33.0, 27.0, 20.0, 28.0, 34.0, 31.0, 33.0, 45.0, 53.0, 37.0, 59.0, 40.0, 43.0, 34.0, 35.0, 33.0, 26.0, 32.0, 23.0, 24.0, 22.0, 13.0, 19.0, 15.0, 16.0, 17.0, 7.0, 8.0, 13.0, 9.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.359375, -3.25341796875, -3.1474609375, -3.04150390625, -2.935546875, -2.82958984375, -2.7236328125, -2.61767578125, -2.51171875, -2.40576171875, -2.2998046875, -2.19384765625, -2.087890625, -1.98193359375, -1.8759765625, -1.77001953125, -1.6640625, -1.55810546875, -1.4521484375, -1.34619140625, -1.240234375, -1.13427734375, -1.0283203125, -0.92236328125, -0.81640625, -0.71044921875, -0.6044921875, -0.49853515625, -0.392578125, -0.28662109375, -0.1806640625, -0.07470703125, 0.03125, 0.13720703125, 0.2431640625, 0.34912109375, 0.455078125, 0.56103515625, 0.6669921875, 0.77294921875, 0.87890625, 0.98486328125, 1.0908203125, 1.19677734375, 1.302734375, 1.40869140625, 1.5146484375, 1.62060546875, 1.7265625, 1.83251953125, 1.9384765625, 2.04443359375, 2.150390625, 2.25634765625, 2.3623046875, 2.46826171875, 2.57421875, 2.68017578125, 2.7861328125, 2.89208984375, 2.998046875, 3.10400390625, 3.2099609375, 3.31591796875, 3.421875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 8.0, 9.0, 16.0, 19.0, 33.0, 44.0, 47.0, 85.0, 139.0, 257.0, 442.0, 689.0, 1307.0, 2382.0, 4517.0, 8227.0, 15233.0, 27502.0, 49429.0, 90121.0, 161495.0, 243694.0, 195244.0, 111222.0, 60923.0, 33876.0, 18864.0, 10300.0, 5620.0, 3009.0, 1660.0, 886.0, 466.0, 310.0, 172.0, 99.0, 67.0, 39.0, 27.0, 22.0, 12.0, 11.0, 11.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.78125, -2.68426513671875, -2.5872802734375, -2.49029541015625, -2.393310546875, -2.29632568359375, -2.1993408203125, -2.10235595703125, -2.00537109375, -1.90838623046875, -1.8114013671875, -1.71441650390625, -1.617431640625, -1.52044677734375, -1.4234619140625, -1.32647705078125, -1.2294921875, -1.13250732421875, -1.0355224609375, -0.93853759765625, -0.841552734375, -0.74456787109375, -0.6475830078125, -0.55059814453125, -0.45361328125, -0.35662841796875, -0.2596435546875, -0.16265869140625, -0.065673828125, 0.03131103515625, 0.1282958984375, 0.22528076171875, 0.322265625, 0.41925048828125, 0.5162353515625, 0.61322021484375, 0.710205078125, 0.80718994140625, 0.9041748046875, 1.00115966796875, 1.09814453125, 1.19512939453125, 1.2921142578125, 1.38909912109375, 1.486083984375, 1.58306884765625, 1.6800537109375, 1.77703857421875, 1.8740234375, 1.97100830078125, 2.0679931640625, 2.16497802734375, 2.261962890625, 2.35894775390625, 2.4559326171875, 2.55291748046875, 2.64990234375, 2.74688720703125, 2.8438720703125, 2.94085693359375, 3.037841796875, 3.13482666015625, 3.2318115234375, 3.32879638671875, 3.42578125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 7.0, 6.0, 11.0, 10.0, 19.0, 16.0, 24.0, 36.0, 39.0, 35.0, 53.0, 51.0, 75.0, 128.0, 247.0, 1461.0, 291.0, 141.0, 82.0, 56.0, 55.0, 36.0, 42.0, 30.0, 17.0, 26.0, 19.0, 9.0, 9.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.921875, -22.3431396484375, -21.764404296875, -21.1856689453125, -20.60693359375, -20.0281982421875, -19.449462890625, -18.8707275390625, -18.2919921875, -17.7132568359375, -17.134521484375, -16.5557861328125, -15.97705078125, -15.3983154296875, -14.819580078125, -14.2408447265625, -13.662109375, -13.0833740234375, -12.504638671875, -11.9259033203125, -11.34716796875, -10.7684326171875, -10.189697265625, -9.6109619140625, -9.0322265625, -8.4534912109375, -7.874755859375, -7.2960205078125, -6.71728515625, -6.1385498046875, -5.559814453125, -4.9810791015625, -4.40234375, -3.8236083984375, -3.244873046875, -2.6661376953125, -2.08740234375, -1.5086669921875, -0.929931640625, -0.3511962890625, 0.2275390625, 0.8062744140625, 1.385009765625, 1.9637451171875, 2.54248046875, 3.1212158203125, 3.699951171875, 4.2786865234375, 4.857421875, 5.4361572265625, 6.014892578125, 6.5936279296875, 7.17236328125, 7.7510986328125, 8.329833984375, 8.9085693359375, 9.4873046875, 10.0660400390625, 10.644775390625, 11.2235107421875, 11.80224609375, 12.3809814453125, 12.959716796875, 13.5384521484375, 14.1171875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 17.0, 22.0, 18.0, 23.0, 46.0, 43.0, 60.0, 113.0, 142.0, 207.0, 317.0, 656.0, 3198.0, 500977.0, 2631152.0, 6611.0, 902.0, 381.0, 238.0, 151.0, 103.0, 79.0, 70.0, 48.0, 22.0, 23.0, 24.0, 7.0, 18.0, 12.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.484375, -29.220947265625, -27.95751953125, -26.694091796875, -25.4306640625, -24.167236328125, -22.90380859375, -21.640380859375, -20.376953125, -19.113525390625, -17.85009765625, -16.586669921875, -15.3232421875, -14.059814453125, -12.79638671875, -11.532958984375, -10.26953125, -9.006103515625, -7.74267578125, -6.479248046875, -5.2158203125, -3.952392578125, -2.68896484375, -1.425537109375, -0.162109375, 1.101318359375, 2.36474609375, 3.628173828125, 4.8916015625, 6.155029296875, 7.41845703125, 8.681884765625, 9.9453125, 11.208740234375, 12.47216796875, 13.735595703125, 14.9990234375, 16.262451171875, 17.52587890625, 18.789306640625, 20.052734375, 21.316162109375, 22.57958984375, 23.843017578125, 25.1064453125, 26.369873046875, 27.63330078125, 28.896728515625, 30.16015625, 31.423583984375, 32.68701171875, 33.950439453125, 35.2138671875, 36.477294921875, 37.74072265625, 39.004150390625, 40.267578125, 41.531005859375, 42.79443359375, 44.057861328125, 45.3212890625, 46.584716796875, 47.84814453125, 49.111572265625, 50.375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 81.0, 297.0, 405.0, 171.0, 43.0, 9.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.115962982177734, -55.38356399536133, -52.65116500854492, -49.91876983642578, -47.186370849609375, -44.45397186279297, -41.72157287597656, -38.989173889160156, -36.25677490234375, -33.524375915527344, -30.791976928710938, -28.059579849243164, -25.327180862426758, -22.59478187561035, -19.862384796142578, -17.129985809326172, -14.397586822509766, -11.66518783569336, -8.93278980255127, -6.20039176940918, -3.4679927825927734, -0.7355937957763672, 1.9968032836914062, 4.7292022705078125, 7.461601257324219, 10.194000244140625, 12.926398277282715, 15.658796310424805, 18.39119529724121, 21.123594284057617, 23.85599136352539, 26.588390350341797, 29.320785522460938, 32.053184509277344, 34.78558349609375, 37.517982482910156, 40.25038146972656, 42.98278045654297, 45.71517562866211, 48.447574615478516, 51.17997360229492, 53.91237258911133, 56.644771575927734, 59.377166748046875, 62.10956573486328, 64.84196472167969, 67.5743637084961, 70.3067626953125, 73.0391616821289, 75.77156066894531, 78.50395965576172, 81.23635864257812, 83.96875762939453, 86.70115661621094, 89.43354797363281, 92.16595458984375, 94.89834594726562, 97.63074493408203, 100.36314392089844, 103.09554290771484, 105.82794189453125, 108.56034088134766, 111.29273986816406, 114.02513122558594, 116.75753784179688]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 9.0, 7.0, 10.0, 9.0, 13.0, 15.0, 16.0, 22.0, 28.0, 16.0, 26.0, 10.0, 34.0, 34.0, 33.0, 37.0, 45.0, 39.0, 43.0, 19.0, 42.0, 40.0, 41.0, 38.0, 50.0, 48.0, 28.0, 32.0, 30.0, 20.0, 25.0, 14.0, 23.0, 12.0, 16.0, 12.0, 10.0, 13.0, 10.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-33.09831619262695, -32.14722442626953, -31.196136474609375, -30.245046615600586, -29.293956756591797, -28.342866897583008, -27.39177703857422, -26.440685272216797, -25.48959732055664, -24.53850746154785, -23.587417602539062, -22.636327743530273, -21.685237884521484, -20.734148025512695, -19.783058166503906, -18.831966400146484, -17.880876541137695, -16.929786682128906, -15.978696823120117, -15.027606964111328, -14.076517105102539, -13.12542724609375, -12.174336433410645, -11.223246574401855, -10.272156715393066, -9.321066856384277, -8.369976997375488, -7.418886661529541, -6.467796802520752, -5.516706943511963, -4.565616607666016, -3.6145267486572266, -2.6634349822998047, -1.712345004081726, -0.7612550258636475, 0.1898350715637207, 1.1409249305725098, 2.092014789581299, 3.043105125427246, 3.994194984436035, 4.945284843444824, 5.896374702453613, 6.847464561462402, 7.79855489730835, 8.749645233154297, 9.700735092163086, 10.651824951171875, 11.602914810180664, 12.554004669189453, 13.505094528198242, 14.456184387207031, 15.40727424621582, 16.35836410522461, 17.3094539642334, 18.260543823242188, 19.21163558959961, 20.162723541259766, 21.113813400268555, 22.064903259277344, 23.015993118286133, 23.967082977294922, 24.91817283630371, 25.8692626953125, 26.820354461669922, 27.77144432067871]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 7.0, 13.0, 13.0, 12.0, 21.0, 18.0, 20.0, 24.0, 19.0, 29.0, 23.0, 28.0, 30.0, 28.0, 32.0, 40.0, 44.0, 42.0, 36.0, 40.0, 36.0, 29.0, 43.0, 36.0, 44.0, 31.0, 20.0, 23.0, 26.0, 26.0, 19.0, 16.0, 15.0, 16.0, 17.0, 21.0, 12.0, 5.0, 6.0, 7.0, 3.0, 8.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.546875, -3.4373779296875, -3.327880859375, -3.2183837890625, -3.10888671875, -2.9993896484375, -2.889892578125, -2.7803955078125, -2.6708984375, -2.5614013671875, -2.451904296875, -2.3424072265625, -2.23291015625, -2.1234130859375, -2.013916015625, -1.9044189453125, -1.794921875, -1.6854248046875, -1.575927734375, -1.4664306640625, -1.35693359375, -1.2474365234375, -1.137939453125, -1.0284423828125, -0.9189453125, -0.8094482421875, -0.699951171875, -0.5904541015625, -0.48095703125, -0.3714599609375, -0.261962890625, -0.1524658203125, -0.04296875, 0.0665283203125, 0.176025390625, 0.2855224609375, 0.39501953125, 0.5045166015625, 0.614013671875, 0.7235107421875, 0.8330078125, 0.9425048828125, 1.052001953125, 1.1614990234375, 1.27099609375, 1.3804931640625, 1.489990234375, 1.5994873046875, 1.708984375, 1.8184814453125, 1.927978515625, 2.0374755859375, 2.14697265625, 2.2564697265625, 2.365966796875, 2.4754638671875, 2.5849609375, 2.6944580078125, 2.803955078125, 2.9134521484375, 3.02294921875, 3.1324462890625, 3.241943359375, 3.3514404296875, 3.4609375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 10.0, 13.0, 5.0, 19.0, 11.0, 15.0, 21.0, 17.0, 20.0, 22.0, 22.0, 36.0, 42.0, 75.0, 155.0, 314.0, 938.0, 4448.0, 42489.0, 592229.0, 2635442.0, 845775.0, 63887.0, 6104.0, 1219.0, 406.0, 158.0, 104.0, 50.0, 34.0, 27.0, 35.0, 24.0, 13.0, 20.0, 11.0, 11.0, 7.0, 13.0, 8.0, 4.0, 9.0, 4.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.8203125, -10.4881591796875, -10.156005859375, -9.8238525390625, -9.49169921875, -9.1595458984375, -8.827392578125, -8.4952392578125, -8.1630859375, -7.8309326171875, -7.498779296875, -7.1666259765625, -6.83447265625, -6.5023193359375, -6.170166015625, -5.8380126953125, -5.505859375, -5.1737060546875, -4.841552734375, -4.5093994140625, -4.17724609375, -3.8450927734375, -3.512939453125, -3.1807861328125, -2.8486328125, -2.5164794921875, -2.184326171875, -1.8521728515625, -1.52001953125, -1.1878662109375, -0.855712890625, -0.5235595703125, -0.19140625, 0.1407470703125, 0.472900390625, 0.8050537109375, 1.13720703125, 1.4693603515625, 1.801513671875, 2.1336669921875, 2.4658203125, 2.7979736328125, 3.130126953125, 3.4622802734375, 3.79443359375, 4.1265869140625, 4.458740234375, 4.7908935546875, 5.123046875, 5.4552001953125, 5.787353515625, 6.1195068359375, 6.45166015625, 6.7838134765625, 7.115966796875, 7.4481201171875, 7.7802734375, 8.1124267578125, 8.444580078125, 8.7767333984375, 9.10888671875, 9.4410400390625, 9.773193359375, 10.1053466796875, 10.4375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 9.0, 7.0, 7.0, 21.0, 25.0, 28.0, 22.0, 18.0, 38.0, 37.0, 49.0, 66.0, 69.0, 99.0, 125.0, 167.0, 148.0, 175.0, 232.0, 258.0, 268.0, 279.0, 272.0, 260.0, 226.0, 192.0, 178.0, 153.0, 129.0, 89.0, 76.0, 68.0, 54.0, 37.0, 37.0, 25.0, 26.0, 19.0, 20.0, 9.0, 15.0, 6.0, 10.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-5.6484375, -5.46844482421875, -5.2884521484375, -5.10845947265625, -4.928466796875, -4.74847412109375, -4.5684814453125, -4.38848876953125, -4.20849609375, -4.02850341796875, -3.8485107421875, -3.66851806640625, -3.488525390625, -3.30853271484375, -3.1285400390625, -2.94854736328125, -2.7685546875, -2.58856201171875, -2.4085693359375, -2.22857666015625, -2.048583984375, -1.86859130859375, -1.6885986328125, -1.50860595703125, -1.32861328125, -1.14862060546875, -0.9686279296875, -0.78863525390625, -0.608642578125, -0.42864990234375, -0.2486572265625, -0.06866455078125, 0.111328125, 0.29132080078125, 0.4713134765625, 0.65130615234375, 0.831298828125, 1.01129150390625, 1.1912841796875, 1.37127685546875, 1.55126953125, 1.73126220703125, 1.9112548828125, 2.09124755859375, 2.271240234375, 2.45123291015625, 2.6312255859375, 2.81121826171875, 2.9912109375, 3.17120361328125, 3.3511962890625, 3.53118896484375, 3.711181640625, 3.89117431640625, 4.0711669921875, 4.25115966796875, 4.43115234375, 4.61114501953125, 4.7911376953125, 4.97113037109375, 5.151123046875, 5.33111572265625, 5.5111083984375, 5.69110107421875, 5.87109375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 7.0, 5.0, 10.0, 10.0, 17.0, 10.0, 23.0, 23.0, 22.0, 33.0, 50.0, 54.0, 62.0, 80.0, 116.0, 135.0, 178.0, 266.0, 443.0, 1009.0, 3406.0, 19918.0, 159823.0, 1230331.0, 2267990.0, 446284.0, 52937.0, 7508.0, 1685.0, 615.0, 346.0, 205.0, 164.0, 109.0, 72.0, 70.0, 53.0, 33.0, 35.0, 26.0, 31.0, 31.0, 15.0, 7.0, 9.0, 5.0, 7.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-12.7734375, -12.38916015625, -12.0048828125, -11.62060546875, -11.236328125, -10.85205078125, -10.4677734375, -10.08349609375, -9.69921875, -9.31494140625, -8.9306640625, -8.54638671875, -8.162109375, -7.77783203125, -7.3935546875, -7.00927734375, -6.625, -6.24072265625, -5.8564453125, -5.47216796875, -5.087890625, -4.70361328125, -4.3193359375, -3.93505859375, -3.55078125, -3.16650390625, -2.7822265625, -2.39794921875, -2.013671875, -1.62939453125, -1.2451171875, -0.86083984375, -0.4765625, -0.09228515625, 0.2919921875, 0.67626953125, 1.060546875, 1.44482421875, 1.8291015625, 2.21337890625, 2.59765625, 2.98193359375, 3.3662109375, 3.75048828125, 4.134765625, 4.51904296875, 4.9033203125, 5.28759765625, 5.671875, 6.05615234375, 6.4404296875, 6.82470703125, 7.208984375, 7.59326171875, 7.9775390625, 8.36181640625, 8.74609375, 9.13037109375, 9.5146484375, 9.89892578125, 10.283203125, 10.66748046875, 11.0517578125, 11.43603515625, 11.8203125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 16.0, 50.0, 87.0, 153.0, 200.0, 215.0, 152.0, 74.0, 42.0, 16.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.947265625, -97.4390869140625, -94.93091583251953, -92.42273712158203, -89.91455841064453, -87.40638732910156, -84.89820861816406, -82.39002990722656, -79.88185119628906, -77.37367248535156, -74.8655014038086, -72.3573226928711, -69.8491439819336, -67.34097290039062, -64.83279418945312, -62.324615478515625, -59.816444396972656, -57.30826950073242, -54.80009078979492, -52.29191589355469, -49.78373718261719, -47.27556228637695, -44.76738739013672, -42.25920867919922, -39.751033782958984, -37.24285888671875, -34.73468017578125, -32.226505279541016, -29.71832847595215, -27.21015167236328, -24.701976776123047, -22.19379997253418, -19.685630798339844, -17.177453994750977, -14.669278144836426, -12.161102294921875, -9.652925491333008, -7.144748687744141, -4.63657283782959, -2.128396987915039, 0.3797798156738281, 2.887956142425537, 5.396132469177246, 7.904308795928955, 10.412485122680664, 12.920661926269531, 15.428837776184082, 17.937013626098633, 20.4451904296875, 22.953367233276367, 25.461544036865234, 27.96971893310547, 30.477895736694336, 32.9860725402832, 35.49424743652344, 38.00242614746094, 40.51060104370117, 43.018775939941406, 45.526954650878906, 48.03512954711914, 50.543304443359375, 53.051483154296875, 55.55965805053711, 58.067832946777344, 60.576011657714844]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 10.0, 9.0, 20.0, 19.0, 23.0, 23.0, 27.0, 26.0, 26.0, 39.0, 41.0, 48.0, 44.0, 46.0, 43.0, 42.0, 43.0, 56.0, 44.0, 34.0, 32.0, 35.0, 37.0, 39.0, 30.0, 33.0, 25.0, 19.0, 20.0, 5.0, 6.0, 8.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-34.479705810546875, -33.51327133178711, -32.54683303833008, -31.580398559570312, -30.613964080810547, -29.64752769470215, -28.68109130859375, -27.714656829833984, -26.748220443725586, -25.781784057617188, -24.815349578857422, -23.848913192749023, -22.882476806640625, -21.91604232788086, -20.94960594177246, -19.983169555664062, -19.016735076904297, -18.0502986907959, -17.083864212036133, -16.117427825927734, -15.150992393493652, -14.18455696105957, -13.218120574951172, -12.25168514251709, -11.285249710083008, -10.318814277648926, -9.352378845214844, -8.385942459106445, -7.419507026672363, -6.453071594238281, -5.486635684967041, -4.520199775695801, -3.5537643432617188, -2.5873286724090576, -1.6208930015563965, -0.6544573307037354, 0.3119783401489258, 1.2784137725830078, 2.244849681854248, 3.2112855911254883, 4.17772102355957, 5.144156455993652, 6.110592365264893, 7.077028274536133, 8.043463706970215, 9.009899139404297, 9.976335525512695, 10.942770957946777, 11.90920639038086, 12.875641822814941, 13.842077255249023, 14.808513641357422, 15.774949073791504, 16.741384506225586, 17.707820892333984, 18.67425537109375, 19.64069175720215, 20.607128143310547, 21.573562622070312, 22.53999900817871, 23.50643539428711, 24.472869873046875, 25.439306259155273, 26.405742645263672, 27.372177124023438]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 10.0, 9.0, 12.0, 16.0, 7.0, 15.0, 16.0, 22.0, 23.0, 35.0, 22.0, 35.0, 26.0, 28.0, 26.0, 46.0, 26.0, 41.0, 42.0, 44.0, 39.0, 40.0, 43.0, 38.0, 31.0, 20.0, 22.0, 41.0, 21.0, 26.0, 21.0, 21.0, 21.0, 18.0, 16.0, 12.0, 12.0, 7.0, 12.0, 9.0, 5.0, 6.0, 7.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.376953125, -3.271209716796875, -3.16546630859375, -3.059722900390625, -2.9539794921875, -2.848236083984375, -2.74249267578125, -2.636749267578125, -2.531005859375, -2.425262451171875, -2.31951904296875, -2.213775634765625, -2.1080322265625, -2.002288818359375, -1.89654541015625, -1.790802001953125, -1.68505859375, -1.579315185546875, -1.47357177734375, -1.367828369140625, -1.2620849609375, -1.156341552734375, -1.05059814453125, -0.944854736328125, -0.839111328125, -0.733367919921875, -0.62762451171875, -0.521881103515625, -0.4161376953125, -0.310394287109375, -0.20465087890625, -0.098907470703125, 0.0068359375, 0.112579345703125, 0.21832275390625, 0.324066162109375, 0.4298095703125, 0.535552978515625, 0.64129638671875, 0.747039794921875, 0.852783203125, 0.958526611328125, 1.06427001953125, 1.170013427734375, 1.2757568359375, 1.381500244140625, 1.48724365234375, 1.592987060546875, 1.69873046875, 1.804473876953125, 1.91021728515625, 2.015960693359375, 2.1217041015625, 2.227447509765625, 2.33319091796875, 2.438934326171875, 2.544677734375, 2.650421142578125, 2.75616455078125, 2.861907958984375, 2.9676513671875, 3.073394775390625, 3.17913818359375, 3.284881591796875, 3.390625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 5.0, 10.0, 30.0, 31.0, 41.0, 77.0, 103.0, 180.0, 251.0, 422.0, 631.0, 919.0, 1343.0, 2145.0, 3277.0, 4815.0, 7259.0, 11364.0, 17617.0, 27314.0, 42119.0, 65554.0, 98692.0, 141280.0, 171963.0, 147998.0, 105428.0, 69745.0, 45107.0, 29119.0, 18849.0, 11865.0, 7784.0, 5169.0, 3402.0, 2306.0, 1431.0, 986.0, 680.0, 450.0, 285.0, 168.0, 119.0, 71.0, 63.0, 28.0, 23.0, 14.0, 9.0, 5.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.3662109375, -0.3549690246582031, -0.34372711181640625, -0.3324851989746094, -0.3212432861328125, -0.3100013732910156, -0.29875946044921875, -0.2875175476074219, -0.276275634765625, -0.2650337219238281, -0.25379180908203125, -0.24254989624023438, -0.2313079833984375, -0.22006607055664062, -0.20882415771484375, -0.19758224487304688, -0.18634033203125, -0.17509841918945312, -0.16385650634765625, -0.15261459350585938, -0.1413726806640625, -0.13013076782226562, -0.11888885498046875, -0.10764694213867188, -0.096405029296875, -0.08516311645507812, -0.07392120361328125, -0.06267929077148438, -0.0514373779296875, -0.040195465087890625, -0.02895355224609375, -0.017711639404296875, -0.0064697265625, 0.004772186279296875, 0.01601409912109375, 0.027256011962890625, 0.0384979248046875, 0.049739837646484375, 0.06098175048828125, 0.07222366333007812, 0.083465576171875, 0.09470748901367188, 0.10594940185546875, 0.11719131469726562, 0.1284332275390625, 0.13967514038085938, 0.15091705322265625, 0.16215896606445312, 0.17340087890625, 0.18464279174804688, 0.19588470458984375, 0.20712661743164062, 0.2183685302734375, 0.22961044311523438, 0.24085235595703125, 0.2520942687988281, 0.263336181640625, 0.2745780944824219, 0.28582000732421875, 0.2970619201660156, 0.3083038330078125, 0.3195457458496094, 0.33078765869140625, 0.3420295715332031, 0.353271484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 16.0, 14.0, 13.0, 14.0, 26.0, 14.0, 33.0, 21.0, 26.0, 23.0, 33.0, 31.0, 50.0, 37.0, 42.0, 37.0, 34.0, 1053.0, 45.0, 43.0, 32.0, 34.0, 34.0, 37.0, 28.0, 39.0, 29.0, 18.0, 17.0, 12.0, 16.0, 20.0, 11.0, 15.0, 14.0, 5.0, 17.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.3359375, -2.265380859375, -2.19482421875, -2.124267578125, -2.0537109375, -1.983154296875, -1.91259765625, -1.842041015625, -1.771484375, -1.700927734375, -1.63037109375, -1.559814453125, -1.4892578125, -1.418701171875, -1.34814453125, -1.277587890625, -1.20703125, -1.136474609375, -1.06591796875, -0.995361328125, -0.9248046875, -0.854248046875, -0.78369140625, -0.713134765625, -0.642578125, -0.572021484375, -0.50146484375, -0.430908203125, -0.3603515625, -0.289794921875, -0.21923828125, -0.148681640625, -0.078125, -0.007568359375, 0.06298828125, 0.133544921875, 0.2041015625, 0.274658203125, 0.34521484375, 0.415771484375, 0.486328125, 0.556884765625, 0.62744140625, 0.697998046875, 0.7685546875, 0.839111328125, 0.90966796875, 0.980224609375, 1.05078125, 1.121337890625, 1.19189453125, 1.262451171875, 1.3330078125, 1.403564453125, 1.47412109375, 1.544677734375, 1.615234375, 1.685791015625, 1.75634765625, 1.826904296875, 1.8974609375, 1.968017578125, 2.03857421875, 2.109130859375, 2.1796875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 11.0, 6.0, 14.0, 18.0, 41.0, 39.0, 63.0, 95.0, 154.0, 255.0, 410.0, 658.0, 1033.0, 1905.0, 2970.0, 5019.0, 8814.0, 15213.0, 26286.0, 45429.0, 75048.0, 118595.0, 177557.0, 1218396.0, 149561.0, 100593.0, 61387.0, 36268.0, 21392.0, 12319.0, 7110.0, 4181.0, 2407.0, 1452.0, 882.0, 559.0, 363.0, 216.0, 161.0, 94.0, 60.0, 39.0, 26.0, 13.0, 12.0, 3.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.249267578125, -0.24155044555664062, -0.23383331298828125, -0.22611618041992188, -0.2183990478515625, -0.21068191528320312, -0.20296478271484375, -0.19524765014648438, -0.187530517578125, -0.17981338500976562, -0.17209625244140625, -0.16437911987304688, -0.1566619873046875, -0.14894485473632812, -0.14122772216796875, -0.13351058959960938, -0.12579345703125, -0.11807632446289062, -0.11035919189453125, -0.10264205932617188, -0.0949249267578125, -0.08720779418945312, -0.07949066162109375, -0.07177352905273438, -0.064056396484375, -0.056339263916015625, -0.04862213134765625, -0.040904998779296875, -0.0331878662109375, -0.025470733642578125, -0.01775360107421875, -0.010036468505859375, -0.0023193359375, 0.005397796630859375, 0.01311492919921875, 0.020832061767578125, 0.0285491943359375, 0.036266326904296875, 0.04398345947265625, 0.051700592041015625, 0.059417724609375, 0.06713485717773438, 0.07485198974609375, 0.08256912231445312, 0.0902862548828125, 0.09800338745117188, 0.10572052001953125, 0.11343765258789062, 0.12115478515625, 0.12887191772460938, 0.13658905029296875, 0.14430618286132812, 0.1520233154296875, 0.15974044799804688, 0.16745758056640625, 0.17517471313476562, 0.182891845703125, 0.19060897827148438, 0.19832611083984375, 0.20604324340820312, 0.2137603759765625, 0.22147750854492188, 0.22919464111328125, 0.23691177368164062, 0.24462890625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 6.0, 12.0, 15.0, 15.0, 13.0, 21.0, 29.0, 28.0, 38.0, 48.0, 69.0, 93.0, 171.0, 103.0, 59.0, 52.0, 35.0, 32.0, 26.0, 23.0, 20.0, 13.0, 10.0, 9.0, 5.0, 5.0, 9.0, 5.0, 8.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00934600830078125, -0.009039878845214844, -0.008733749389648438, -0.008427619934082031, -0.008121490478515625, -0.007815361022949219, -0.0075092315673828125, -0.007203102111816406, -0.00689697265625, -0.006590843200683594, -0.0062847137451171875, -0.005978584289550781, -0.005672454833984375, -0.005366325378417969, -0.0050601959228515625, -0.004754066467285156, -0.00444793701171875, -0.004141807556152344, -0.0038356781005859375, -0.0035295486450195312, -0.003223419189453125, -0.0029172897338867188, -0.0026111602783203125, -0.0023050308227539062, -0.0019989013671875, -0.0016927719116210938, -0.0013866424560546875, -0.0010805130004882812, -0.000774383544921875, -0.00046825408935546875, -0.0001621246337890625, 0.00014400482177734375, 0.00045013427734375, 0.0007562637329101562, 0.0010623931884765625, 0.0013685226440429688, 0.001674652099609375, 0.0019807815551757812, 0.0022869110107421875, 0.0025930404663085938, 0.002899169921875, 0.0032052993774414062, 0.0035114288330078125, 0.0038175582885742188, 0.004123687744140625, 0.004429817199707031, 0.0047359466552734375, 0.005042076110839844, 0.00534820556640625, 0.005654335021972656, 0.0059604644775390625, 0.006266593933105469, 0.006572723388671875, 0.006878852844238281, 0.0071849822998046875, 0.007491111755371094, 0.0077972412109375, 0.008103370666503906, 0.008409500122070312, 0.008715629577636719, 0.009021759033203125, 0.009327888488769531, 0.009634017944335938, 0.009940147399902344, 0.01024627685546875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 7.0, 4.0, 8.0, 9.0, 7.0, 12.0, 11.0, 15.0, 16.0, 30.0, 35.0, 59.0, 87.0, 160.0, 678.0, 11216.0, 964486.0, 69470.0, 1597.0, 275.0, 129.0, 63.0, 47.0, 27.0, 26.0, 17.0, 16.0, 9.0, 11.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.249267578125, -0.24187088012695312, -0.23447418212890625, -0.22707748413085938, -0.2196807861328125, -0.21228408813476562, -0.20488739013671875, -0.19749069213867188, -0.190093994140625, -0.18269729614257812, -0.17530059814453125, -0.16790390014648438, -0.1605072021484375, -0.15311050415039062, -0.14571380615234375, -0.13831710815429688, -0.13092041015625, -0.12352371215820312, -0.11612701416015625, -0.10873031616210938, -0.1013336181640625, -0.09393692016601562, -0.08654022216796875, -0.07914352416992188, -0.071746826171875, -0.06435012817382812, -0.05695343017578125, -0.049556732177734375, -0.0421600341796875, -0.034763336181640625, -0.02736663818359375, -0.019969940185546875, -0.0125732421875, -0.005176544189453125, 0.00222015380859375, 0.009616851806640625, 0.0170135498046875, 0.024410247802734375, 0.03180694580078125, 0.039203643798828125, 0.046600341796875, 0.053997039794921875, 0.06139373779296875, 0.06879043579101562, 0.0761871337890625, 0.08358383178710938, 0.09098052978515625, 0.09837722778320312, 0.10577392578125, 0.11317062377929688, 0.12056732177734375, 0.12796401977539062, 0.1353607177734375, 0.14275741577148438, 0.15015411376953125, 0.15755081176757812, 0.164947509765625, 0.17234420776367188, 0.17974090576171875, 0.18713760375976562, 0.1945343017578125, 0.20193099975585938, 0.20932769775390625, 0.21672439575195312, 0.22412109375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 13.0, 46.0, 231.0, 540.0, 125.0, 31.0, 16.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1253189593553543, -0.12267021834850311, -0.12002148479223251, -0.11737275123596191, -0.11472401022911072, -0.11207526922225952, -0.10942653566598892, -0.10677780210971832, -0.10412906110286713, -0.10148032009601593, -0.09883158653974533, -0.09618285298347473, -0.09353411197662354, -0.09088537096977234, -0.08823663741350174, -0.08558790385723114, -0.08293916285037994, -0.08029042184352875, -0.07764168828725815, -0.07499295473098755, -0.07234421372413635, -0.06969547271728516, -0.06704673916101456, -0.06439800560474396, -0.06174926459789276, -0.05910052731633186, -0.056451790034770966, -0.05380305275321007, -0.05115431547164917, -0.04850557819008827, -0.045856840908527374, -0.043208103626966476, -0.04055936262011528, -0.03791062533855438, -0.035261888056993484, -0.03261315077543259, -0.02996441349387169, -0.02731567621231079, -0.024666938930749893, -0.022018201649188995, -0.019369464367628098, -0.0167207270860672, -0.014071989804506302, -0.011423252522945404, -0.008774515241384506, -0.006125777959823608, -0.0034770406782627106, -0.0008283033967018127, 0.001820433884859085, 0.004469171166419983, 0.007117908447980881, 0.009766645729541779, 0.012415383011102676, 0.015064120292663574, 0.017712857574224472, 0.02036159485578537, 0.023010332137346268, 0.025659069418907166, 0.028307806700468063, 0.03095654398202896, 0.03360528126358986, 0.03625401854515076, 0.038902755826711655, 0.04155149310827255, 0.04420023038983345]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 2.0, 5.0, 5.0, 1.0, 6.0, 7.0, 14.0, 6.0, 10.0, 10.0, 13.0, 13.0, 18.0, 14.0, 29.0, 17.0, 20.0, 30.0, 26.0, 32.0, 33.0, 33.0, 32.0, 31.0, 50.0, 39.0, 45.0, 36.0, 36.0, 36.0, 33.0, 24.0, 33.0, 24.0, 32.0, 24.0, 26.0, 16.0, 22.0, 16.0, 23.0, 17.0, 13.0, 15.0, 11.0, 6.0, 8.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.008710920810699463, -0.008412553928792477, -0.00811418704688549, -0.007815820164978504, -0.007517453283071518, -0.007219086401164532, -0.0069207195192575455, -0.006622352637350559, -0.006323985755443573, -0.006025618873536587, -0.0057272519916296005, -0.005428885109722614, -0.005130518227815628, -0.004832151345908642, -0.004533784464001656, -0.004235417582094669, -0.003937050700187683, -0.003638683818280697, -0.0033403169363737106, -0.0030419500544667244, -0.002743583172559738, -0.002445216290652752, -0.0021468494087457657, -0.0018484825268387794, -0.0015501156449317932, -0.001251748763024807, -0.0009533818811178207, -0.0006550149992108345, -0.00035664811730384827, -5.828123539686203e-05, 0.0002400856465101242, 0.0005384525284171104, 0.0008368194103240967, 0.001135186292231083, 0.0014335531741380692, 0.0017319200560450554, 0.0020302869379520416, 0.002328653819859028, 0.002627020701766014, 0.0029253875836730003, 0.0032237544655799866, 0.003522121347486973, 0.003820488229393959, 0.004118855111300945, 0.0044172219932079315, 0.004715588875114918, 0.005013955757021904, 0.00531232263892889, 0.0056106895208358765, 0.005909056402742863, 0.006207423284649849, 0.006505790166556835, 0.006804157048463821, 0.007102523930370808, 0.007400890812277794, 0.00769925769418478, 0.007997624576091766, 0.008295991457998753, 0.008594358339905739, 0.008892725221812725, 0.009191092103719711, 0.009489458985626698, 0.009787825867533684, 0.01008619274944067, 0.010384559631347656]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 10.0, 9.0, 12.0, 16.0, 6.0, 16.0, 16.0, 22.0, 23.0, 35.0, 21.0, 36.0, 26.0, 28.0, 26.0, 46.0, 26.0, 41.0, 42.0, 44.0, 39.0, 40.0, 43.0, 38.0, 31.0, 20.0, 22.0, 40.0, 22.0, 27.0, 20.0, 21.0, 21.0, 18.0, 16.0, 12.0, 12.0, 7.0, 12.0, 9.0, 5.0, 6.0, 7.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.376953125, -3.271209716796875, -3.16546630859375, -3.059722900390625, -2.9539794921875, -2.848236083984375, -2.74249267578125, -2.636749267578125, -2.531005859375, -2.425262451171875, -2.31951904296875, -2.213775634765625, -2.1080322265625, -2.002288818359375, -1.89654541015625, -1.790802001953125, -1.68505859375, -1.579315185546875, -1.47357177734375, -1.367828369140625, -1.2620849609375, -1.156341552734375, -1.05059814453125, -0.944854736328125, -0.839111328125, -0.733367919921875, -0.62762451171875, -0.521881103515625, -0.4161376953125, -0.310394287109375, -0.20465087890625, -0.098907470703125, 0.0068359375, 0.112579345703125, 0.21832275390625, 0.324066162109375, 0.4298095703125, 0.535552978515625, 0.64129638671875, 0.747039794921875, 0.852783203125, 0.958526611328125, 1.06427001953125, 1.170013427734375, 1.2757568359375, 1.381500244140625, 1.48724365234375, 1.592987060546875, 1.69873046875, 1.804473876953125, 1.91021728515625, 2.015960693359375, 2.1217041015625, 2.227447509765625, 2.33319091796875, 2.438934326171875, 2.544677734375, 2.650421142578125, 2.75616455078125, 2.861907958984375, 2.9676513671875, 3.073394775390625, 3.17913818359375, 3.284881591796875, 3.390625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 12.0, 10.0, 17.0, 25.0, 37.0, 67.0, 104.0, 193.0, 320.0, 745.0, 1554.0, 3298.0, 6957.0, 14573.0, 30199.0, 60095.0, 120589.0, 240368.0, 282330.0, 144856.0, 71974.0, 36281.0, 17643.0, 8617.0, 4010.0, 1814.0, 908.0, 442.0, 214.0, 108.0, 76.0, 37.0, 20.0, 20.0, 7.0, 6.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.0546875, -3.9244384765625, -3.794189453125, -3.6639404296875, -3.53369140625, -3.4034423828125, -3.273193359375, -3.1429443359375, -3.0126953125, -2.8824462890625, -2.752197265625, -2.6219482421875, -2.49169921875, -2.3614501953125, -2.231201171875, -2.1009521484375, -1.970703125, -1.8404541015625, -1.710205078125, -1.5799560546875, -1.44970703125, -1.3194580078125, -1.189208984375, -1.0589599609375, -0.9287109375, -0.7984619140625, -0.668212890625, -0.5379638671875, -0.40771484375, -0.2774658203125, -0.147216796875, -0.0169677734375, 0.11328125, 0.2435302734375, 0.373779296875, 0.5040283203125, 0.63427734375, 0.7645263671875, 0.894775390625, 1.0250244140625, 1.1552734375, 1.2855224609375, 1.415771484375, 1.5460205078125, 1.67626953125, 1.8065185546875, 1.936767578125, 2.0670166015625, 2.197265625, 2.3275146484375, 2.457763671875, 2.5880126953125, 2.71826171875, 2.8485107421875, 2.978759765625, 3.1090087890625, 3.2392578125, 3.3695068359375, 3.499755859375, 3.6300048828125, 3.76025390625, 3.8905029296875, 4.020751953125, 4.1510009765625, 4.28125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 5.0, 7.0, 14.0, 16.0, 14.0, 15.0, 22.0, 23.0, 30.0, 30.0, 39.0, 34.0, 39.0, 53.0, 103.0, 152.0, 276.0, 1400.0, 180.0, 119.0, 76.0, 47.0, 54.0, 31.0, 31.0, 34.0, 34.0, 19.0, 21.0, 18.0, 16.0, 13.0, 15.0, 11.0, 10.0, 7.0, 5.0, 7.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.515625, -12.126953125, -11.73828125, -11.349609375, -10.9609375, -10.572265625, -10.18359375, -9.794921875, -9.40625, -9.017578125, -8.62890625, -8.240234375, -7.8515625, -7.462890625, -7.07421875, -6.685546875, -6.296875, -5.908203125, -5.51953125, -5.130859375, -4.7421875, -4.353515625, -3.96484375, -3.576171875, -3.1875, -2.798828125, -2.41015625, -2.021484375, -1.6328125, -1.244140625, -0.85546875, -0.466796875, -0.078125, 0.310546875, 0.69921875, 1.087890625, 1.4765625, 1.865234375, 2.25390625, 2.642578125, 3.03125, 3.419921875, 3.80859375, 4.197265625, 4.5859375, 4.974609375, 5.36328125, 5.751953125, 6.140625, 6.529296875, 6.91796875, 7.306640625, 7.6953125, 8.083984375, 8.47265625, 8.861328125, 9.25, 9.638671875, 10.02734375, 10.416015625, 10.8046875, 11.193359375, 11.58203125, 11.970703125, 12.359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 11.0, 5.0, 12.0, 25.0, 20.0, 29.0, 47.0, 55.0, 69.0, 108.0, 179.0, 244.0, 427.0, 1236.0, 30311.0, 3074775.0, 35718.0, 1194.0, 461.0, 244.0, 147.0, 115.0, 60.0, 54.0, 34.0, 28.0, 14.0, 13.0, 19.0, 12.0, 8.0, 2.0, 7.0, 4.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.40625, -29.0556640625, -27.705078125, -26.3544921875, -25.00390625, -23.6533203125, -22.302734375, -20.9521484375, -19.6015625, -18.2509765625, -16.900390625, -15.5498046875, -14.19921875, -12.8486328125, -11.498046875, -10.1474609375, -8.796875, -7.4462890625, -6.095703125, -4.7451171875, -3.39453125, -2.0439453125, -0.693359375, 0.6572265625, 2.0078125, 3.3583984375, 4.708984375, 6.0595703125, 7.41015625, 8.7607421875, 10.111328125, 11.4619140625, 12.8125, 14.1630859375, 15.513671875, 16.8642578125, 18.21484375, 19.5654296875, 20.916015625, 22.2666015625, 23.6171875, 24.9677734375, 26.318359375, 27.6689453125, 29.01953125, 30.3701171875, 31.720703125, 33.0712890625, 34.421875, 35.7724609375, 37.123046875, 38.4736328125, 39.82421875, 41.1748046875, 42.525390625, 43.8759765625, 45.2265625, 46.5771484375, 47.927734375, 49.2783203125, 50.62890625, 51.9794921875, 53.330078125, 54.6806640625, 56.03125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 52.0, 870.0, 97.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.582706451416016, -37.38191223144531, -29.181121826171875, -20.980329513549805, -12.779537200927734, -4.578746795654297, 3.6220474243164062, 11.82284164428711, 20.023632049560547, 28.224424362182617, 36.42521667480469, 44.626007080078125, 52.82680130004883, 61.027591705322266, 69.22838592529297, 77.42918395996094, 85.62997436523438, 93.83076477050781, 102.03155517578125, 110.23235321044922, 118.43314361572266, 126.6339340209961, 134.83473205566406, 143.0355224609375, 151.23631286621094, 159.43710327148438, 167.6378936767578, 175.83868408203125, 184.03948974609375, 192.24026489257812, 200.44107055664062, 208.64186096191406, 216.8426513671875, 225.04344177246094, 233.24423217773438, 241.4450225830078, 249.64581298828125, 257.84661865234375, 266.0473937988281, 274.2481994628906, 282.448974609375, 290.6497802734375, 298.8505554199219, 307.0513610839844, 315.25213623046875, 323.45294189453125, 331.6537170410156, 339.8545227050781, 348.0553283691406, 356.2561340332031, 364.4569091796875, 372.65771484375, 380.8584899902344, 389.0592956542969, 397.26007080078125, 405.46087646484375, 413.66168212890625, 421.86248779296875, 430.0632629394531, 438.2640686035156, 446.46484375, 454.6656494140625, 462.8664245605469, 471.0672302246094, 479.26800537109375]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 9.0, 6.0, 8.0, 7.0, 11.0, 5.0, 18.0, 17.0, 16.0, 23.0, 17.0, 28.0, 24.0, 39.0, 33.0, 37.0, 45.0, 44.0, 42.0, 39.0, 49.0, 56.0, 45.0, 35.0, 38.0, 33.0, 42.0, 38.0, 34.0, 25.0, 18.0, 22.0, 17.0, 14.0, 15.0, 14.0, 16.0, 4.0, 4.0, 1.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.8189697265625, -37.6719856262207, -36.52499771118164, -35.378013610839844, -34.23102569580078, -33.084041595458984, -31.937055587768555, -30.790069580078125, -29.643083572387695, -28.496097564697266, -27.349111557006836, -26.202125549316406, -25.05514144897461, -23.908153533935547, -22.76116943359375, -21.61418342590332, -20.46719741821289, -19.32021141052246, -18.17322540283203, -17.0262393951416, -15.879254341125488, -14.732268333435059, -13.585283279418945, -12.438297271728516, -11.291311264038086, -10.144325256347656, -8.997339248657227, -7.850354194641113, -6.703368186950684, -5.556382179260254, -4.409396648406982, -3.262411117553711, -2.1154212951660156, -0.968435525894165, 0.17855024337768555, 1.3255360126495361, 2.4725217819213867, 3.6195077896118164, 4.766493320465088, 5.913478851318359, 7.060464859008789, 8.207450866699219, 9.354436874389648, 10.501421928405762, 11.648407936096191, 12.795393943786621, 13.942378997802734, 15.089365005493164, 16.236351013183594, 17.383337020874023, 18.530323028564453, 19.677309036254883, 20.824295043945312, 21.97127914428711, 23.11826515197754, 24.26525115966797, 25.4122371673584, 26.559223175048828, 27.706209182739258, 28.853195190429688, 30.000179290771484, 31.147167205810547, 32.294151306152344, 33.441139221191406, 34.5881233215332]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 4.0, 3.0, 2.0, 4.0, 7.0, 7.0, 6.0, 15.0, 10.0, 10.0, 19.0, 20.0, 17.0, 20.0, 30.0, 38.0, 36.0, 24.0, 50.0, 25.0, 31.0, 29.0, 30.0, 51.0, 51.0, 46.0, 42.0, 37.0, 30.0, 25.0, 28.0, 24.0, 19.0, 24.0, 34.0, 18.0, 19.0, 22.0, 17.0, 14.0, 9.0, 10.0, 12.0, 7.0, 6.0, 6.0, 7.0, 6.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.7421875, -3.6229248046875, -3.503662109375, -3.3843994140625, -3.26513671875, -3.1458740234375, -3.026611328125, -2.9073486328125, -2.7880859375, -2.6688232421875, -2.549560546875, -2.4302978515625, -2.31103515625, -2.1917724609375, -2.072509765625, -1.9532470703125, -1.833984375, -1.7147216796875, -1.595458984375, -1.4761962890625, -1.35693359375, -1.2376708984375, -1.118408203125, -0.9991455078125, -0.8798828125, -0.7606201171875, -0.641357421875, -0.5220947265625, -0.40283203125, -0.2835693359375, -0.164306640625, -0.0450439453125, 0.07421875, 0.1934814453125, 0.312744140625, 0.4320068359375, 0.55126953125, 0.6705322265625, 0.789794921875, 0.9090576171875, 1.0283203125, 1.1475830078125, 1.266845703125, 1.3861083984375, 1.50537109375, 1.6246337890625, 1.743896484375, 1.8631591796875, 1.982421875, 2.1016845703125, 2.220947265625, 2.3402099609375, 2.45947265625, 2.5787353515625, 2.697998046875, 2.8172607421875, 2.9365234375, 3.0557861328125, 3.175048828125, 3.2943115234375, 3.41357421875, 3.5328369140625, 3.652099609375, 3.7713623046875, 3.890625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 6.0, 3.0, 12.0, 15.0, 19.0, 21.0, 22.0, 18.0, 29.0, 40.0, 41.0, 79.0, 96.0, 186.0, 457.0, 1479.0, 8457.0, 91907.0, 997403.0, 2451751.0, 585548.0, 49206.0, 5227.0, 1190.0, 434.0, 191.0, 102.0, 77.0, 49.0, 38.0, 35.0, 21.0, 20.0, 18.0, 16.0, 8.0, 9.0, 13.0, 12.0, 5.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.078125, -9.746337890625, -9.41455078125, -9.082763671875, -8.7509765625, -8.419189453125, -8.08740234375, -7.755615234375, -7.423828125, -7.092041015625, -6.76025390625, -6.428466796875, -6.0966796875, -5.764892578125, -5.43310546875, -5.101318359375, -4.76953125, -4.437744140625, -4.10595703125, -3.774169921875, -3.4423828125, -3.110595703125, -2.77880859375, -2.447021484375, -2.115234375, -1.783447265625, -1.45166015625, -1.119873046875, -0.7880859375, -0.456298828125, -0.12451171875, 0.207275390625, 0.5390625, 0.870849609375, 1.20263671875, 1.534423828125, 1.8662109375, 2.197998046875, 2.52978515625, 2.861572265625, 3.193359375, 3.525146484375, 3.85693359375, 4.188720703125, 4.5205078125, 4.852294921875, 5.18408203125, 5.515869140625, 5.84765625, 6.179443359375, 6.51123046875, 6.843017578125, 7.1748046875, 7.506591796875, 7.83837890625, 8.170166015625, 8.501953125, 8.833740234375, 9.16552734375, 9.497314453125, 9.8291015625, 10.160888671875, 10.49267578125, 10.824462890625, 11.15625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 13.0, 18.0, 18.0, 31.0, 50.0, 71.0, 87.0, 134.0, 206.0, 271.0, 369.0, 444.0, 476.0, 439.0, 407.0, 310.0, 232.0, 164.0, 116.0, 62.0, 43.0, 41.0, 18.0, 19.0, 10.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.796875, -12.4564208984375, -12.115966796875, -11.7755126953125, -11.43505859375, -11.0946044921875, -10.754150390625, -10.4136962890625, -10.0732421875, -9.7327880859375, -9.392333984375, -9.0518798828125, -8.71142578125, -8.3709716796875, -8.030517578125, -7.6900634765625, -7.349609375, -7.0091552734375, -6.668701171875, -6.3282470703125, -5.98779296875, -5.6473388671875, -5.306884765625, -4.9664306640625, -4.6259765625, -4.2855224609375, -3.945068359375, -3.6046142578125, -3.26416015625, -2.9237060546875, -2.583251953125, -2.2427978515625, -1.90234375, -1.5618896484375, -1.221435546875, -0.8809814453125, -0.54052734375, -0.2000732421875, 0.140380859375, 0.4808349609375, 0.8212890625, 1.1617431640625, 1.502197265625, 1.8426513671875, 2.18310546875, 2.5235595703125, 2.864013671875, 3.2044677734375, 3.544921875, 3.8853759765625, 4.225830078125, 4.5662841796875, 4.90673828125, 5.2471923828125, 5.587646484375, 5.9281005859375, 6.2685546875, 6.6090087890625, 6.949462890625, 7.2899169921875, 7.63037109375, 7.9708251953125, 8.311279296875, 8.6517333984375, 8.9921875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 9.0, 15.0, 21.0, 39.0, 39.0, 72.0, 122.0, 199.0, 330.0, 671.0, 3511.0, 769427.0, 3401456.0, 16445.0, 945.0, 381.0, 215.0, 123.0, 82.0, 58.0, 45.0, 18.0, 20.0, 14.0, 9.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.609375, -30.402099609375, -29.19482421875, -27.987548828125, -26.7802734375, -25.572998046875, -24.36572265625, -23.158447265625, -21.951171875, -20.743896484375, -19.53662109375, -18.329345703125, -17.1220703125, -15.914794921875, -14.70751953125, -13.500244140625, -12.29296875, -11.085693359375, -9.87841796875, -8.671142578125, -7.4638671875, -6.256591796875, -5.04931640625, -3.842041015625, -2.634765625, -1.427490234375, -0.22021484375, 0.987060546875, 2.1943359375, 3.401611328125, 4.60888671875, 5.816162109375, 7.0234375, 8.230712890625, 9.43798828125, 10.645263671875, 11.8525390625, 13.059814453125, 14.26708984375, 15.474365234375, 16.681640625, 17.888916015625, 19.09619140625, 20.303466796875, 21.5107421875, 22.718017578125, 23.92529296875, 25.132568359375, 26.33984375, 27.547119140625, 28.75439453125, 29.961669921875, 31.1689453125, 32.376220703125, 33.58349609375, 34.790771484375, 35.998046875, 37.205322265625, 38.41259765625, 39.619873046875, 40.8271484375, 42.034423828125, 43.24169921875, 44.448974609375, 45.65625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 31.0, 82.0, 172.0, 213.0, 233.0, 173.0, 60.0, 37.0, 8.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.04817199707031, -72.03520965576172, -69.02224731445312, -66.00929260253906, -62.99633026123047, -59.983367919921875, -56.97040939331055, -53.95745086669922, -50.944488525390625, -47.93152618408203, -44.9185676574707, -41.905609130859375, -38.89264678955078, -35.87968444824219, -32.86672592163086, -29.8537654876709, -26.840805053710938, -23.827844619750977, -20.814884185791016, -17.801923751831055, -14.788963317871094, -11.776002883911133, -8.763042449951172, -5.750082015991211, -2.73712158203125, 0.27583885192871094, 3.288799285888672, 6.301759719848633, 9.314720153808594, 12.327680587768555, 15.340641021728516, 18.353601455688477, 21.366561889648438, 24.3795223236084, 27.39248275756836, 30.40544319152832, 33.41840362548828, 36.431365966796875, 39.4443244934082, 42.45728302001953, 45.470245361328125, 48.48320770263672, 51.49616622924805, 54.509124755859375, 57.52208709716797, 60.53504943847656, 63.54800796508789, 66.56096649169922, 69.57392883300781, 72.5868911743164, 75.599853515625, 78.61280822753906, 81.62577056884766, 84.63873291015625, 87.65168762207031, 90.6646499633789, 93.6776123046875, 96.6905746459961, 99.70353698730469, 102.71649169921875, 105.72945404052734, 108.74241638183594, 111.75537109375, 114.7683334350586, 117.78129577636719]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 3.0, 9.0, 3.0, 7.0, 4.0, 16.0, 10.0, 15.0, 22.0, 16.0, 14.0, 32.0, 26.0, 24.0, 37.0, 36.0, 25.0, 47.0, 43.0, 39.0, 39.0, 39.0, 38.0, 46.0, 45.0, 36.0, 44.0, 34.0, 29.0, 34.0, 22.0, 25.0, 19.0, 24.0, 17.0, 13.0, 13.0, 10.0, 9.0, 9.0, 7.0, 7.0, 6.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0], "bins": [-32.24060821533203, -31.361865997314453, -30.483123779296875, -29.604381561279297, -28.72563934326172, -27.84689712524414, -26.968154907226562, -26.089412689208984, -25.210670471191406, -24.331928253173828, -23.45318603515625, -22.574443817138672, -21.695701599121094, -20.816959381103516, -19.938217163085938, -19.05947494506836, -18.18073272705078, -17.301990509033203, -16.423248291015625, -15.544506072998047, -14.665763854980469, -13.78702163696289, -12.908279418945312, -12.029537200927734, -11.150793075561523, -10.272050857543945, -9.393308639526367, -8.514566421508789, -7.635824203491211, -6.757081508636475, -5.8783392906188965, -4.999597072601318, -4.120855331420898, -3.2421131134033203, -2.363370895385742, -1.484628438949585, -0.6058862209320068, 0.2728562355041504, 1.1515984535217285, 2.0303406715393066, 2.9090828895568848, 3.787825107574463, 4.666567325592041, 5.545310020446777, 6.4240522384643555, 7.302794456481934, 8.181536674499512, 9.06027889251709, 9.939021110534668, 10.817763328552246, 11.696505546569824, 12.575247764587402, 13.45398998260498, 14.332733154296875, 15.211475372314453, 16.09021759033203, 16.96895980834961, 17.847702026367188, 18.726444244384766, 19.605186462402344, 20.483928680419922, 21.3626708984375, 22.241413116455078, 23.120155334472656, 23.998897552490234]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 10.0, 10.0, 7.0, 15.0, 14.0, 18.0, 16.0, 24.0, 31.0, 24.0, 44.0, 28.0, 42.0, 44.0, 39.0, 48.0, 43.0, 34.0, 41.0, 35.0, 39.0, 50.0, 34.0, 32.0, 25.0, 31.0, 13.0, 29.0, 24.0, 24.0, 15.0, 29.0, 14.0, 17.0, 13.0, 6.0, 6.0, 7.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.94921875, -3.82672119140625, -3.7042236328125, -3.58172607421875, -3.459228515625, -3.33673095703125, -3.2142333984375, -3.09173583984375, -2.96923828125, -2.84674072265625, -2.7242431640625, -2.60174560546875, -2.479248046875, -2.35675048828125, -2.2342529296875, -2.11175537109375, -1.9892578125, -1.86676025390625, -1.7442626953125, -1.62176513671875, -1.499267578125, -1.37677001953125, -1.2542724609375, -1.13177490234375, -1.00927734375, -0.88677978515625, -0.7642822265625, -0.64178466796875, -0.519287109375, -0.39678955078125, -0.2742919921875, -0.15179443359375, -0.029296875, 0.09320068359375, 0.2156982421875, 0.33819580078125, 0.460693359375, 0.58319091796875, 0.7056884765625, 0.82818603515625, 0.95068359375, 1.07318115234375, 1.1956787109375, 1.31817626953125, 1.440673828125, 1.56317138671875, 1.6856689453125, 1.80816650390625, 1.9306640625, 2.05316162109375, 2.1756591796875, 2.29815673828125, 2.420654296875, 2.54315185546875, 2.6656494140625, 2.78814697265625, 2.91064453125, 3.03314208984375, 3.1556396484375, 3.27813720703125, 3.400634765625, 3.52313232421875, 3.6456298828125, 3.76812744140625, 3.890625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 15.0, 24.0, 18.0, 44.0, 54.0, 73.0, 132.0, 176.0, 260.0, 359.0, 535.0, 786.0, 1143.0, 1663.0, 2554.0, 3757.0, 5528.0, 8461.0, 12293.0, 18805.0, 28378.0, 42128.0, 62796.0, 91167.0, 127541.0, 154931.0, 144681.0, 108207.0, 76185.0, 51986.0, 34642.0, 23214.0, 15071.0, 10027.0, 6859.0, 4564.0, 3046.0, 2051.0, 1376.0, 961.0, 663.0, 468.0, 272.0, 194.0, 140.0, 115.0, 69.0, 39.0, 34.0, 18.0, 21.0, 13.0, 3.0, 9.0, 0.0, 6.0], "bins": [-0.360107421875, -0.3494377136230469, -0.33876800537109375, -0.3280982971191406, -0.3174285888671875, -0.3067588806152344, -0.29608917236328125, -0.2854194641113281, -0.274749755859375, -0.2640800476074219, -0.25341033935546875, -0.24274063110351562, -0.2320709228515625, -0.22140121459960938, -0.21073150634765625, -0.20006179809570312, -0.18939208984375, -0.17872238159179688, -0.16805267333984375, -0.15738296508789062, -0.1467132568359375, -0.13604354858398438, -0.12537384033203125, -0.11470413208007812, -0.104034423828125, -0.09336471557617188, -0.08269500732421875, -0.07202529907226562, -0.0613555908203125, -0.050685882568359375, -0.04001617431640625, -0.029346466064453125, -0.0186767578125, -0.008007049560546875, 0.00266265869140625, 0.013332366943359375, 0.0240020751953125, 0.034671783447265625, 0.04534149169921875, 0.056011199951171875, 0.066680908203125, 0.07735061645507812, 0.08802032470703125, 0.09869003295898438, 0.1093597412109375, 0.12002944946289062, 0.13069915771484375, 0.14136886596679688, 0.15203857421875, 0.16270828247070312, 0.17337799072265625, 0.18404769897460938, 0.1947174072265625, 0.20538711547851562, 0.21605682373046875, 0.22672653198242188, 0.237396240234375, 0.24806594848632812, 0.25873565673828125, 0.2694053649902344, 0.2800750732421875, 0.2907447814941406, 0.30141448974609375, 0.3120841979980469, 0.32275390625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 1.0, 8.0, 3.0, 4.0, 8.0, 9.0, 14.0, 18.0, 14.0, 14.0, 16.0, 25.0, 19.0, 17.0, 15.0, 31.0, 27.0, 41.0, 44.0, 38.0, 36.0, 40.0, 42.0, 1060.0, 39.0, 36.0, 40.0, 39.0, 42.0, 33.0, 37.0, 27.0, 24.0, 22.0, 15.0, 21.0, 25.0, 17.0, 15.0, 7.0, 16.0, 7.0, 6.0, 7.0, 0.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.978515625, -1.9027099609375, -1.826904296875, -1.7510986328125, -1.67529296875, -1.5994873046875, -1.523681640625, -1.4478759765625, -1.3720703125, -1.2962646484375, -1.220458984375, -1.1446533203125, -1.06884765625, -0.9930419921875, -0.917236328125, -0.8414306640625, -0.765625, -0.6898193359375, -0.614013671875, -0.5382080078125, -0.46240234375, -0.3865966796875, -0.310791015625, -0.2349853515625, -0.1591796875, -0.0833740234375, -0.007568359375, 0.0682373046875, 0.14404296875, 0.2198486328125, 0.295654296875, 0.3714599609375, 0.447265625, 0.5230712890625, 0.598876953125, 0.6746826171875, 0.75048828125, 0.8262939453125, 0.902099609375, 0.9779052734375, 1.0537109375, 1.1295166015625, 1.205322265625, 1.2811279296875, 1.35693359375, 1.4327392578125, 1.508544921875, 1.5843505859375, 1.66015625, 1.7359619140625, 1.811767578125, 1.8875732421875, 1.96337890625, 2.0391845703125, 2.114990234375, 2.1907958984375, 2.2666015625, 2.3424072265625, 2.418212890625, 2.4940185546875, 2.56982421875, 2.6456298828125, 2.721435546875, 2.7972412109375, 2.873046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 7.0, 14.0, 25.0, 32.0, 35.0, 75.0, 135.0, 183.0, 303.0, 445.0, 697.0, 1065.0, 1776.0, 2855.0, 4743.0, 7954.0, 13001.0, 21668.0, 35199.0, 55958.0, 85331.0, 123698.0, 359274.0, 1006528.0, 129924.0, 90547.0, 59422.0, 37176.0, 23279.0, 13860.0, 8401.0, 5216.0, 3151.0, 1896.0, 1186.0, 740.0, 492.0, 300.0, 175.0, 121.0, 100.0, 47.0, 44.0, 16.0, 12.0, 13.0, 7.0, 6.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.2568645477294922, -0.24932479858398438, -0.24178504943847656, -0.23424530029296875, -0.22670555114746094, -0.21916580200195312, -0.2116260528564453, -0.2040863037109375, -0.1965465545654297, -0.18900680541992188, -0.18146705627441406, -0.17392730712890625, -0.16638755798339844, -0.15884780883789062, -0.1513080596923828, -0.143768310546875, -0.1362285614013672, -0.12868881225585938, -0.12114906311035156, -0.11360931396484375, -0.10606956481933594, -0.09852981567382812, -0.09099006652832031, -0.0834503173828125, -0.07591056823730469, -0.06837081909179688, -0.06083106994628906, -0.05329132080078125, -0.04575157165527344, -0.038211822509765625, -0.030672073364257812, -0.02313232421875, -0.015592575073242188, -0.008052825927734375, -0.0005130767822265625, 0.00702667236328125, 0.014566421508789062, 0.022106170654296875, 0.029645919799804688, 0.0371856689453125, 0.04472541809082031, 0.052265167236328125, 0.05980491638183594, 0.06734466552734375, 0.07488441467285156, 0.08242416381835938, 0.08996391296386719, 0.097503662109375, 0.10504341125488281, 0.11258316040039062, 0.12012290954589844, 0.12766265869140625, 0.13520240783691406, 0.14274215698242188, 0.1502819061279297, 0.1578216552734375, 0.1653614044189453, 0.17290115356445312, 0.18044090270996094, 0.18798065185546875, 0.19552040100097656, 0.20306015014648438, 0.2105998992919922, 0.2181396484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 7.0, 12.0, 16.0, 15.0, 15.0, 32.0, 28.0, 34.0, 38.0, 71.0, 63.0, 70.0, 75.0, 97.0, 84.0, 69.0, 41.0, 48.0, 39.0, 24.0, 29.0, 21.0, 12.0, 8.0, 7.0, 8.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0176849365234375, -0.01710367202758789, -0.01652240753173828, -0.015941143035888672, -0.015359878540039062, -0.014778614044189453, -0.014197349548339844, -0.013616085052490234, -0.013034820556640625, -0.012453556060791016, -0.011872291564941406, -0.011291027069091797, -0.010709762573242188, -0.010128498077392578, -0.009547233581542969, -0.00896596908569336, -0.00838470458984375, -0.007803440093994141, -0.007222175598144531, -0.006640911102294922, -0.0060596466064453125, -0.005478382110595703, -0.004897117614746094, -0.004315853118896484, -0.003734588623046875, -0.0031533241271972656, -0.0025720596313476562, -0.001990795135498047, -0.0014095306396484375, -0.0008282661437988281, -0.00024700164794921875, 0.0003342628479003906, 0.00091552734375, 0.0014967918395996094, 0.0020780563354492188, 0.002659320831298828, 0.0032405853271484375, 0.003821849822998047, 0.004403114318847656, 0.004984378814697266, 0.005565643310546875, 0.006146907806396484, 0.006728172302246094, 0.007309436798095703, 0.007890701293945312, 0.008471965789794922, 0.009053230285644531, 0.00963449478149414, 0.01021575927734375, 0.01079702377319336, 0.011378288269042969, 0.011959552764892578, 0.012540817260742188, 0.013122081756591797, 0.013703346252441406, 0.014284610748291016, 0.014865875244140625, 0.015447139739990234, 0.016028404235839844, 0.016609668731689453, 0.017190933227539062, 0.017772197723388672, 0.01835346221923828, 0.01893472671508789, 0.0195159912109375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 7.0, 7.0, 4.0, 12.0, 9.0, 10.0, 22.0, 21.0, 37.0, 45.0, 58.0, 104.0, 182.0, 417.0, 3580.0, 1008538.0, 33971.0, 790.0, 249.0, 151.0, 83.0, 63.0, 43.0, 40.0, 29.0, 22.0, 16.0, 11.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.417236328125, -0.4052162170410156, -0.39319610595703125, -0.3811759948730469, -0.3691558837890625, -0.3571357727050781, -0.34511566162109375, -0.3330955505371094, -0.321075439453125, -0.3090553283691406, -0.29703521728515625, -0.2850151062011719, -0.2729949951171875, -0.2609748840332031, -0.24895477294921875, -0.23693466186523438, -0.22491455078125, -0.21289443969726562, -0.20087432861328125, -0.18885421752929688, -0.1768341064453125, -0.16481399536132812, -0.15279388427734375, -0.14077377319335938, -0.128753662109375, -0.11673355102539062, -0.10471343994140625, -0.09269332885742188, -0.0806732177734375, -0.06865310668945312, -0.05663299560546875, -0.044612884521484375, -0.0325927734375, -0.020572662353515625, -0.00855255126953125, 0.003467559814453125, 0.0154876708984375, 0.027507781982421875, 0.03952789306640625, 0.051548004150390625, 0.063568115234375, 0.07558822631835938, 0.08760833740234375, 0.09962844848632812, 0.1116485595703125, 0.12366867065429688, 0.13568878173828125, 0.14770889282226562, 0.15972900390625, 0.17174911499023438, 0.18376922607421875, 0.19578933715820312, 0.2078094482421875, 0.21982955932617188, 0.23184967041015625, 0.24386978149414062, 0.255889892578125, 0.2679100036621094, 0.27993011474609375, 0.2919502258300781, 0.3039703369140625, 0.3159904479980469, 0.32801055908203125, 0.3400306701660156, 0.35205078125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 461.0, 519.0, 24.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3614063858985901, -0.3529999256134033, -0.34459346532821655, -0.3361870050430298, -0.327780544757843, -0.31937405467033386, -0.3109675943851471, -0.3025611340999603, -0.29415467381477356, -0.2857482135295868, -0.2773417532444, -0.26893529295921326, -0.2605288028717041, -0.25212234258651733, -0.24371588230133057, -0.2353094220161438, -0.22690296173095703, -0.21849650144577026, -0.2100900411605835, -0.20168356597423553, -0.19327710568904877, -0.184870645403862, -0.17646417021751404, -0.16805770993232727, -0.1596512496471405, -0.15124478936195374, -0.14283832907676697, -0.134431853890419, -0.12602539360523224, -0.11761893332004547, -0.1092124655842781, -0.10080599784851074, -0.09239950776100159, -0.08399304747581482, -0.07558657974004745, -0.06718011200428009, -0.05877365171909332, -0.05036718770861626, -0.04196072369813919, -0.033554259687662125, -0.02514779567718506, -0.016741331666707993, -0.008334867656230927, 7.159635424613953e-05, 0.008478060364723206, 0.01688452437520027, 0.025290988385677338, 0.033697452396154404, 0.04210391640663147, 0.050510380417108536, 0.0589168444275856, 0.06732331216335297, 0.07572977244853973, 0.0841362327337265, 0.09254270046949387, 0.10094916820526123, 0.109355628490448, 0.11776208877563477, 0.12616854906082153, 0.1345750242471695, 0.14298148453235626, 0.15138794481754303, 0.159794420003891, 0.16820088028907776, 0.17660734057426453]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 8.0, 9.0, 10.0, 14.0, 11.0, 11.0, 17.0, 18.0, 26.0, 21.0, 28.0, 28.0, 28.0, 23.0, 25.0, 28.0, 36.0, 36.0, 47.0, 36.0, 29.0, 45.0, 40.0, 44.0, 38.0, 37.0, 29.0, 30.0, 24.0, 18.0, 24.0, 26.0, 24.0, 16.0, 13.0, 19.0, 14.0, 11.0, 13.0, 5.0, 3.0, 7.0, 9.0, 0.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.023770511150360107, -0.023075811564922333, -0.022381113842129707, -0.021686416119337082, -0.020991716533899307, -0.020297016948461533, -0.019602319225668907, -0.018907621502876282, -0.018212921917438507, -0.017518222332000732, -0.016823524609208107, -0.01612882688641548, -0.015434127300977707, -0.014739428646862507, -0.014044729992747307, -0.013350031338632107, -0.012655332684516907, -0.011960634030401707, -0.011265935376286507, -0.010571236722171307, -0.009876538068056107, -0.009181839413940907, -0.008487140759825706, -0.0077924421057105064, -0.007097743451595306, -0.006403044797480106, -0.005708346143364906, -0.005013647489249706, -0.004318948835134506, -0.003624250181019306, -0.002929551526904106, -0.002234852872788906, -0.001540154218673706, -0.000845455564558506, -0.00015075691044330597, 0.0005439417436718941, 0.0012386403977870941, 0.0019333390519022942, 0.002628037706017494, 0.0033227363601326942, 0.004017435014247894, 0.004712133668363094, 0.005406832322478294, 0.006101530976593494, 0.0067962296307086945, 0.0074909282848238945, 0.008185626938939095, 0.008880325593054295, 0.009575024247169495, 0.010269722901284695, 0.010964421555399895, 0.011659120209515095, 0.012353818863630295, 0.013048517517745495, 0.013743216171860695, 0.014437914825975895, 0.015132613480091095, 0.01582731306552887, 0.016522010788321495, 0.01721670851111412, 0.017911408096551895, 0.01860610768198967, 0.019300805404782295, 0.01999550312757492, 0.020690202713012695]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 11.0, 9.0, 7.0, 15.0, 14.0, 18.0, 16.0, 24.0, 31.0, 24.0, 44.0, 28.0, 42.0, 43.0, 40.0, 48.0, 40.0, 37.0, 40.0, 36.0, 39.0, 49.0, 35.0, 32.0, 25.0, 31.0, 13.0, 29.0, 24.0, 24.0, 15.0, 29.0, 14.0, 17.0, 13.0, 6.0, 6.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.951171875, -3.828643798828125, -3.70611572265625, -3.583587646484375, -3.4610595703125, -3.338531494140625, -3.21600341796875, -3.093475341796875, -2.970947265625, -2.848419189453125, -2.72589111328125, -2.603363037109375, -2.4808349609375, -2.358306884765625, -2.23577880859375, -2.113250732421875, -1.99072265625, -1.868194580078125, -1.74566650390625, -1.623138427734375, -1.5006103515625, -1.378082275390625, -1.25555419921875, -1.133026123046875, -1.010498046875, -0.887969970703125, -0.76544189453125, -0.642913818359375, -0.5203857421875, -0.397857666015625, -0.27532958984375, -0.152801513671875, -0.0302734375, 0.092254638671875, 0.21478271484375, 0.337310791015625, 0.4598388671875, 0.582366943359375, 0.70489501953125, 0.827423095703125, 0.949951171875, 1.072479248046875, 1.19500732421875, 1.317535400390625, 1.4400634765625, 1.562591552734375, 1.68511962890625, 1.807647705078125, 1.93017578125, 2.052703857421875, 2.17523193359375, 2.297760009765625, 2.4202880859375, 2.542816162109375, 2.66534423828125, 2.787872314453125, 2.910400390625, 3.032928466796875, 3.15545654296875, 3.277984619140625, 3.4005126953125, 3.523040771484375, 3.64556884765625, 3.768096923828125, 3.890625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 1.0, 6.0, 4.0, 5.0, 9.0, 12.0, 19.0, 14.0, 21.0, 40.0, 50.0, 85.0, 121.0, 160.0, 250.0, 506.0, 882.0, 1649.0, 3173.0, 6326.0, 12526.0, 25750.0, 54542.0, 115293.0, 244502.0, 302771.0, 146730.0, 68705.0, 32236.0, 15839.0, 7691.0, 3978.0, 2060.0, 1084.0, 593.0, 327.0, 202.0, 117.0, 70.0, 41.0, 46.0, 30.0, 18.0, 23.0, 10.0, 12.0, 13.0, 4.0, 1.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.39453125, -4.25787353515625, -4.1212158203125, -3.98455810546875, -3.847900390625, -3.71124267578125, -3.5745849609375, -3.43792724609375, -3.30126953125, -3.16461181640625, -3.0279541015625, -2.89129638671875, -2.754638671875, -2.61798095703125, -2.4813232421875, -2.34466552734375, -2.2080078125, -2.07135009765625, -1.9346923828125, -1.79803466796875, -1.661376953125, -1.52471923828125, -1.3880615234375, -1.25140380859375, -1.11474609375, -0.97808837890625, -0.8414306640625, -0.70477294921875, -0.568115234375, -0.43145751953125, -0.2947998046875, -0.15814208984375, -0.021484375, 0.11517333984375, 0.2518310546875, 0.38848876953125, 0.525146484375, 0.66180419921875, 0.7984619140625, 0.93511962890625, 1.07177734375, 1.20843505859375, 1.3450927734375, 1.48175048828125, 1.618408203125, 1.75506591796875, 1.8917236328125, 2.02838134765625, 2.1650390625, 2.30169677734375, 2.4383544921875, 2.57501220703125, 2.711669921875, 2.84832763671875, 2.9849853515625, 3.12164306640625, 3.25830078125, 3.39495849609375, 3.5316162109375, 3.66827392578125, 3.804931640625, 3.94158935546875, 4.0782470703125, 4.21490478515625, 4.3515625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 8.0, 5.0, 10.0, 15.0, 11.0, 11.0, 20.0, 18.0, 24.0, 21.0, 30.0, 39.0, 50.0, 46.0, 68.0, 58.0, 93.0, 173.0, 837.0, 811.0, 173.0, 81.0, 66.0, 60.0, 48.0, 33.0, 29.0, 33.0, 26.0, 22.0, 28.0, 19.0, 11.0, 8.0, 6.0, 15.0, 7.0, 3.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-13.5078125, -13.085693359375, -12.66357421875, -12.241455078125, -11.8193359375, -11.397216796875, -10.97509765625, -10.552978515625, -10.130859375, -9.708740234375, -9.28662109375, -8.864501953125, -8.4423828125, -8.020263671875, -7.59814453125, -7.176025390625, -6.75390625, -6.331787109375, -5.90966796875, -5.487548828125, -5.0654296875, -4.643310546875, -4.22119140625, -3.799072265625, -3.376953125, -2.954833984375, -2.53271484375, -2.110595703125, -1.6884765625, -1.266357421875, -0.84423828125, -0.422119140625, 0.0, 0.422119140625, 0.84423828125, 1.266357421875, 1.6884765625, 2.110595703125, 2.53271484375, 2.954833984375, 3.376953125, 3.799072265625, 4.22119140625, 4.643310546875, 5.0654296875, 5.487548828125, 5.90966796875, 6.331787109375, 6.75390625, 7.176025390625, 7.59814453125, 8.020263671875, 8.4423828125, 8.864501953125, 9.28662109375, 9.708740234375, 10.130859375, 10.552978515625, 10.97509765625, 11.397216796875, 11.8193359375, 12.241455078125, 12.66357421875, 13.085693359375, 13.5078125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 3.0, 11.0, 25.0, 24.0, 32.0, 60.0, 78.0, 128.0, 222.0, 389.0, 777.0, 16195.0, 3119626.0, 6459.0, 739.0, 364.0, 196.0, 107.0, 90.0, 48.0, 32.0, 21.0, 23.0, 11.0, 5.0, 6.0, 5.0, 6.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.1875, -80.96435546875, -78.7412109375, -76.51806640625, -74.294921875, -72.07177734375, -69.8486328125, -67.62548828125, -65.40234375, -63.17919921875, -60.9560546875, -58.73291015625, -56.509765625, -54.28662109375, -52.0634765625, -49.84033203125, -47.6171875, -45.39404296875, -43.1708984375, -40.94775390625, -38.724609375, -36.50146484375, -34.2783203125, -32.05517578125, -29.83203125, -27.60888671875, -25.3857421875, -23.16259765625, -20.939453125, -18.71630859375, -16.4931640625, -14.27001953125, -12.046875, -9.82373046875, -7.6005859375, -5.37744140625, -3.154296875, -0.93115234375, 1.2919921875, 3.51513671875, 5.73828125, 7.96142578125, 10.1845703125, 12.40771484375, 14.630859375, 16.85400390625, 19.0771484375, 21.30029296875, 23.5234375, 25.74658203125, 27.9697265625, 30.19287109375, 32.416015625, 34.63916015625, 36.8623046875, 39.08544921875, 41.30859375, 43.53173828125, 45.7548828125, 47.97802734375, 50.201171875, 52.42431640625, 54.6474609375, 56.87060546875, 59.09375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 98.0, 576.0, 319.0, 22.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-233.8211669921875, -229.3029327392578, -224.78469848632812, -220.2664794921875, -215.7482452392578, -211.23001098632812, -206.71177673339844, -202.19354248046875, -197.67530822753906, -193.15707397460938, -188.6388397216797, -184.12060546875, -179.60238647460938, -175.0841522216797, -170.56591796875, -166.0476837158203, -161.52944946289062, -157.01121520996094, -152.49298095703125, -147.97476196289062, -143.45652770996094, -138.93829345703125, -134.42005920410156, -129.90182495117188, -125.38360595703125, -120.86537170410156, -116.3471450805664, -111.82891082763672, -107.31067657470703, -102.79244995117188, -98.27421569824219, -93.7559814453125, -89.23773956298828, -84.7195053100586, -80.20127868652344, -75.68304443359375, -71.16481018066406, -66.64657592773438, -62.12834930419922, -57.61011505126953, -53.09188461303711, -48.57365417480469, -44.055419921875, -39.53718948364258, -35.018959045410156, -30.50072479248047, -25.982494354248047, -21.464262008666992, -16.946029663085938, -12.427797317504883, -7.9095659255981445, -3.3913345336914062, 1.1268978118896484, 5.645130157470703, 10.163360595703125, 14.68159294128418, 19.199825286865234, 23.71805763244629, 28.236289978027344, 32.754520416259766, 37.27275085449219, 41.790985107421875, 46.3092155456543, 50.82744598388672, 55.345680236816406]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 10.0, 2.0, 8.0, 7.0, 8.0, 13.0, 14.0, 18.0, 24.0, 19.0, 17.0, 29.0, 23.0, 32.0, 47.0, 31.0, 39.0, 33.0, 53.0, 48.0, 39.0, 43.0, 38.0, 40.0, 44.0, 44.0, 44.0, 38.0, 35.0, 28.0, 27.0, 18.0, 12.0, 21.0, 10.0, 12.0, 7.0, 14.0, 3.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.29620361328125, -32.120670318603516, -30.945138931274414, -29.769607543945312, -28.594074249267578, -27.418542861938477, -26.243011474609375, -25.06747817993164, -23.89194679260254, -22.716415405273438, -21.540882110595703, -20.3653507232666, -19.1898193359375, -18.014286041259766, -16.838754653930664, -15.663222312927246, -14.487689971923828, -13.31215763092041, -12.136625289916992, -10.96109390258789, -9.785561561584473, -8.610029220581055, -7.434497356414795, -6.258965492248535, -5.083433151245117, -3.9079010486602783, -2.7323689460754395, -1.5568368434906006, -0.3813047409057617, 0.7942276000976562, 1.969759464263916, 3.145291328430176, 4.320823669433594, 5.496356010437012, 6.6718878746032715, 7.847419738769531, 9.02295207977295, 10.198484420776367, 11.374015808105469, 12.549548149108887, 13.725080490112305, 14.900612831115723, 16.07614517211914, 17.251676559448242, 18.427207946777344, 19.602741241455078, 20.77827262878418, 21.95380401611328, 23.129337310791016, 24.304868698120117, 25.48040199279785, 26.655933380126953, 27.831466674804688, 29.00699806213379, 30.18252944946289, 31.358062744140625, 32.533592224121094, 33.70912551879883, 34.8846549987793, 36.06018829345703, 37.235721588134766, 38.4112548828125, 39.58678436279297, 40.7623176574707, 41.93785095214844]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 11.0, 2.0, 10.0, 11.0, 9.0, 11.0, 8.0, 20.0, 30.0, 26.0, 24.0, 34.0, 38.0, 33.0, 40.0, 38.0, 41.0, 49.0, 51.0, 46.0, 35.0, 43.0, 42.0, 32.0, 26.0, 33.0, 30.0, 26.0, 29.0, 29.0, 20.0, 22.0, 13.0, 18.0, 16.0, 16.0, 10.0, 7.0, 6.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8046875, -4.661865234375, -4.51904296875, -4.376220703125, -4.2333984375, -4.090576171875, -3.94775390625, -3.804931640625, -3.662109375, -3.519287109375, -3.37646484375, -3.233642578125, -3.0908203125, -2.947998046875, -2.80517578125, -2.662353515625, -2.51953125, -2.376708984375, -2.23388671875, -2.091064453125, -1.9482421875, -1.805419921875, -1.66259765625, -1.519775390625, -1.376953125, -1.234130859375, -1.09130859375, -0.948486328125, -0.8056640625, -0.662841796875, -0.52001953125, -0.377197265625, -0.234375, -0.091552734375, 0.05126953125, 0.194091796875, 0.3369140625, 0.479736328125, 0.62255859375, 0.765380859375, 0.908203125, 1.051025390625, 1.19384765625, 1.336669921875, 1.4794921875, 1.622314453125, 1.76513671875, 1.907958984375, 2.05078125, 2.193603515625, 2.33642578125, 2.479248046875, 2.6220703125, 2.764892578125, 2.90771484375, 3.050537109375, 3.193359375, 3.336181640625, 3.47900390625, 3.621826171875, 3.7646484375, 3.907470703125, 4.05029296875, 4.193115234375, 4.3359375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 7.0, 3.0, 9.0, 14.0, 20.0, 16.0, 35.0, 43.0, 64.0, 109.0, 175.0, 301.0, 739.0, 2781.0, 19060.0, 191538.0, 1447748.0, 2085247.0, 399385.0, 39148.0, 5240.0, 1359.0, 468.0, 280.0, 159.0, 99.0, 67.0, 55.0, 39.0, 30.0, 12.0, 12.0, 9.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.453125, -12.1351318359375, -11.817138671875, -11.4991455078125, -11.18115234375, -10.8631591796875, -10.545166015625, -10.2271728515625, -9.9091796875, -9.5911865234375, -9.273193359375, -8.9552001953125, -8.63720703125, -8.3192138671875, -8.001220703125, -7.6832275390625, -7.365234375, -7.0472412109375, -6.729248046875, -6.4112548828125, -6.09326171875, -5.7752685546875, -5.457275390625, -5.1392822265625, -4.8212890625, -4.5032958984375, -4.185302734375, -3.8673095703125, -3.54931640625, -3.2313232421875, -2.913330078125, -2.5953369140625, -2.27734375, -1.9593505859375, -1.641357421875, -1.3233642578125, -1.00537109375, -0.6873779296875, -0.369384765625, -0.0513916015625, 0.2666015625, 0.5845947265625, 0.902587890625, 1.2205810546875, 1.53857421875, 1.8565673828125, 2.174560546875, 2.4925537109375, 2.810546875, 3.1285400390625, 3.446533203125, 3.7645263671875, 4.08251953125, 4.4005126953125, 4.718505859375, 5.0364990234375, 5.3544921875, 5.6724853515625, 5.990478515625, 6.3084716796875, 6.62646484375, 6.9444580078125, 7.262451171875, 7.5804443359375, 7.8984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 14.0, 21.0, 20.0, 36.0, 36.0, 47.0, 72.0, 90.0, 118.0, 168.0, 239.0, 259.0, 349.0, 343.0, 386.0, 386.0, 358.0, 268.0, 203.0, 136.0, 123.0, 104.0, 74.0, 55.0, 36.0, 26.0, 27.0, 12.0, 17.0, 12.0, 9.0, 5.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3203125, -8.0377197265625, -7.755126953125, -7.4725341796875, -7.18994140625, -6.9073486328125, -6.624755859375, -6.3421630859375, -6.0595703125, -5.7769775390625, -5.494384765625, -5.2117919921875, -4.92919921875, -4.6466064453125, -4.364013671875, -4.0814208984375, -3.798828125, -3.5162353515625, -3.233642578125, -2.9510498046875, -2.66845703125, -2.3858642578125, -2.103271484375, -1.8206787109375, -1.5380859375, -1.2554931640625, -0.972900390625, -0.6903076171875, -0.40771484375, -0.1251220703125, 0.157470703125, 0.4400634765625, 0.72265625, 1.0052490234375, 1.287841796875, 1.5704345703125, 1.85302734375, 2.1356201171875, 2.418212890625, 2.7008056640625, 2.9833984375, 3.2659912109375, 3.548583984375, 3.8311767578125, 4.11376953125, 4.3963623046875, 4.678955078125, 4.9615478515625, 5.244140625, 5.5267333984375, 5.809326171875, 6.0919189453125, 6.37451171875, 6.6571044921875, 6.939697265625, 7.2222900390625, 7.5048828125, 7.7874755859375, 8.070068359375, 8.3526611328125, 8.63525390625, 8.9178466796875, 9.200439453125, 9.4830322265625, 9.765625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 5.0, 5.0, 14.0, 13.0, 18.0, 18.0, 27.0, 33.0, 56.0, 78.0, 114.0, 160.0, 199.0, 345.0, 573.0, 3316.0, 277976.0, 3772297.0, 135372.0, 2200.0, 494.0, 326.0, 177.0, 137.0, 102.0, 60.0, 43.0, 34.0, 26.0, 25.0, 16.0, 7.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.46875, -32.467529296875, -31.46630859375, -30.465087890625, -29.4638671875, -28.462646484375, -27.46142578125, -26.460205078125, -25.458984375, -24.457763671875, -23.45654296875, -22.455322265625, -21.4541015625, -20.452880859375, -19.45166015625, -18.450439453125, -17.44921875, -16.447998046875, -15.44677734375, -14.445556640625, -13.4443359375, -12.443115234375, -11.44189453125, -10.440673828125, -9.439453125, -8.438232421875, -7.43701171875, -6.435791015625, -5.4345703125, -4.433349609375, -3.43212890625, -2.430908203125, -1.4296875, -0.428466796875, 0.57275390625, 1.573974609375, 2.5751953125, 3.576416015625, 4.57763671875, 5.578857421875, 6.580078125, 7.581298828125, 8.58251953125, 9.583740234375, 10.5849609375, 11.586181640625, 12.58740234375, 13.588623046875, 14.58984375, 15.591064453125, 16.59228515625, 17.593505859375, 18.5947265625, 19.595947265625, 20.59716796875, 21.598388671875, 22.599609375, 23.600830078125, 24.60205078125, 25.603271484375, 26.6044921875, 27.605712890625, 28.60693359375, 29.608154296875, 30.609375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 11.0, 10.0, 26.0, 60.0, 92.0, 127.0, 141.0, 161.0, 140.0, 104.0, 70.0, 34.0, 25.0, 4.0, 5.0, 4.0, 2.0], "bins": [-110.89139556884766, -108.84294128417969, -106.79449462890625, -104.74604034423828, -102.69759368896484, -100.64913940429688, -98.60069274902344, -96.55223846435547, -94.5037841796875, -92.45532989501953, -90.4068832397461, -88.35842895507812, -86.30998229980469, -84.26152801513672, -82.21308135986328, -80.16462707519531, -78.11618041992188, -76.0677261352539, -74.01927947998047, -71.9708251953125, -69.92237854003906, -67.8739242553711, -65.82547760009766, -63.77702331542969, -61.728572845458984, -59.68012237548828, -57.63167190551758, -55.583221435546875, -53.534767150878906, -51.48632049560547, -49.4378662109375, -47.3894157409668, -45.34095764160156, -43.29250717163086, -41.244056701660156, -39.19560623168945, -37.14715576171875, -35.09870147705078, -33.05025100708008, -31.001800537109375, -28.953350067138672, -26.90489959716797, -24.856449127197266, -22.80799674987793, -20.759546279907227, -18.711095809936523, -16.662643432617188, -14.614192962646484, -12.565742492675781, -10.517292022705078, -8.468840599060059, -6.420389652252197, -4.371938705444336, -2.323488235473633, -0.2750368118286133, 1.7734146118164062, 3.8218650817871094, 5.870316028594971, 7.918766975402832, 9.967218399047852, 12.015668869018555, 14.064119338989258, 16.112571716308594, 18.161022186279297, 20.20947265625]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 7.0, 7.0, 6.0, 8.0, 19.0, 13.0, 19.0, 31.0, 15.0, 18.0, 10.0, 19.0, 30.0, 39.0, 27.0, 35.0, 43.0, 39.0, 52.0, 50.0, 53.0, 39.0, 37.0, 33.0, 40.0, 38.0, 42.0, 27.0, 20.0, 35.0, 31.0, 18.0, 21.0, 14.0, 13.0, 9.0, 5.0, 10.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-30.64522933959961, -29.68155288696289, -28.717876434326172, -27.754199981689453, -26.790525436401367, -25.82684898376465, -24.86317253112793, -23.89949607849121, -22.935819625854492, -21.972143173217773, -21.008466720581055, -20.04479217529297, -19.08111572265625, -18.11743927001953, -17.153762817382812, -16.190086364746094, -15.226410865783691, -14.262734413146973, -13.29905891418457, -12.335382461547852, -11.371706008911133, -10.408029556274414, -9.444354057312012, -8.480677604675293, -7.517001628875732, -6.553325653076172, -5.589649200439453, -4.625973224639893, -3.662297010421753, -2.6986207962036133, -1.7349448204040527, -0.771268367767334, 0.19240760803222656, 1.1560838222503662, 2.119760036468506, 3.0834360122680664, 4.047112464904785, 5.010788440704346, 5.974464416503906, 6.938140869140625, 7.9018168449401855, 8.865492820739746, 9.829169273376465, 10.792844772338867, 11.756521224975586, 12.720197677612305, 13.683874130249023, 14.647550582885742, 15.611226081848145, 16.574901580810547, 17.538578033447266, 18.502254486083984, 19.465930938720703, 20.429607391357422, 21.39328384399414, 22.35696029663086, 23.320634841918945, 24.284311294555664, 25.247987747192383, 26.21166229248047, 27.175338745117188, 28.139015197753906, 29.102691650390625, 30.066368103027344, 31.030044555664062]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 3.0, 6.0, 11.0, 9.0, 14.0, 20.0, 20.0, 18.0, 25.0, 32.0, 30.0, 48.0, 35.0, 35.0, 34.0, 34.0, 36.0, 41.0, 37.0, 45.0, 31.0, 44.0, 34.0, 42.0, 37.0, 34.0, 25.0, 23.0, 18.0, 28.0, 24.0, 19.0, 12.0, 12.0, 12.0, 13.0, 10.0, 12.0, 6.0, 6.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.27734375, -4.1483154296875, -4.019287109375, -3.8902587890625, -3.76123046875, -3.6322021484375, -3.503173828125, -3.3741455078125, -3.2451171875, -3.1160888671875, -2.987060546875, -2.8580322265625, -2.72900390625, -2.5999755859375, -2.470947265625, -2.3419189453125, -2.212890625, -2.0838623046875, -1.954833984375, -1.8258056640625, -1.69677734375, -1.5677490234375, -1.438720703125, -1.3096923828125, -1.1806640625, -1.0516357421875, -0.922607421875, -0.7935791015625, -0.66455078125, -0.5355224609375, -0.406494140625, -0.2774658203125, -0.1484375, -0.0194091796875, 0.109619140625, 0.2386474609375, 0.36767578125, 0.4967041015625, 0.625732421875, 0.7547607421875, 0.8837890625, 1.0128173828125, 1.141845703125, 1.2708740234375, 1.39990234375, 1.5289306640625, 1.657958984375, 1.7869873046875, 1.916015625, 2.0450439453125, 2.174072265625, 2.3031005859375, 2.43212890625, 2.5611572265625, 2.690185546875, 2.8192138671875, 2.9482421875, 3.0772705078125, 3.206298828125, 3.3353271484375, 3.46435546875, 3.5933837890625, 3.722412109375, 3.8514404296875, 3.98046875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 10.0, 25.0, 27.0, 29.0, 69.0, 81.0, 143.0, 208.0, 303.0, 442.0, 605.0, 881.0, 1247.0, 1860.0, 2701.0, 4018.0, 5545.0, 8368.0, 12369.0, 18147.0, 27198.0, 40173.0, 58645.0, 83028.0, 113279.0, 139424.0, 140288.0, 114685.0, 85366.0, 60304.0, 41954.0, 28176.0, 18863.0, 12852.0, 8744.0, 5838.0, 3872.0, 2715.0, 1889.0, 1269.0, 898.0, 648.0, 438.0, 289.0, 209.0, 150.0, 104.0, 72.0, 42.0, 34.0, 17.0, 8.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.279815673828125, -0.26983642578125, -0.259857177734375, -0.2498779296875, -0.239898681640625, -0.22991943359375, -0.219940185546875, -0.2099609375, -0.199981689453125, -0.19000244140625, -0.180023193359375, -0.1700439453125, -0.160064697265625, -0.15008544921875, -0.140106201171875, -0.130126953125, -0.120147705078125, -0.11016845703125, -0.100189208984375, -0.0902099609375, -0.080230712890625, -0.07025146484375, -0.060272216796875, -0.05029296875, -0.040313720703125, -0.03033447265625, -0.020355224609375, -0.0103759765625, -0.000396728515625, 0.00958251953125, 0.019561767578125, 0.029541015625, 0.039520263671875, 0.04949951171875, 0.059478759765625, 0.0694580078125, 0.079437255859375, 0.08941650390625, 0.099395751953125, 0.109375, 0.119354248046875, 0.12933349609375, 0.139312744140625, 0.1492919921875, 0.159271240234375, 0.16925048828125, 0.179229736328125, 0.189208984375, 0.199188232421875, 0.20916748046875, 0.219146728515625, 0.2291259765625, 0.239105224609375, 0.24908447265625, 0.259063720703125, 0.26904296875, 0.279022216796875, 0.28900146484375, 0.298980712890625, 0.3089599609375, 0.318939208984375, 0.32891845703125, 0.338897705078125, 0.348876953125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 0.0, 4.0, 6.0, 5.0, 3.0, 11.0, 18.0, 12.0, 20.0, 22.0, 21.0, 30.0, 25.0, 24.0, 22.0, 44.0, 42.0, 54.0, 38.0, 42.0, 34.0, 1071.0, 46.0, 43.0, 47.0, 30.0, 26.0, 44.0, 31.0, 29.0, 26.0, 24.0, 25.0, 16.0, 16.0, 10.0, 14.0, 9.0, 7.0, 7.0, 6.0, 4.0, 10.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.021484375, -2.931488037109375, -2.84149169921875, -2.751495361328125, -2.6614990234375, -2.571502685546875, -2.48150634765625, -2.391510009765625, -2.301513671875, -2.211517333984375, -2.12152099609375, -2.031524658203125, -1.9415283203125, -1.851531982421875, -1.76153564453125, -1.671539306640625, -1.58154296875, -1.491546630859375, -1.40155029296875, -1.311553955078125, -1.2215576171875, -1.131561279296875, -1.04156494140625, -0.951568603515625, -0.861572265625, -0.771575927734375, -0.68157958984375, -0.591583251953125, -0.5015869140625, -0.411590576171875, -0.32159423828125, -0.231597900390625, -0.1416015625, -0.051605224609375, 0.03839111328125, 0.128387451171875, 0.2183837890625, 0.308380126953125, 0.39837646484375, 0.488372802734375, 0.578369140625, 0.668365478515625, 0.75836181640625, 0.848358154296875, 0.9383544921875, 1.028350830078125, 1.11834716796875, 1.208343505859375, 1.29833984375, 1.388336181640625, 1.47833251953125, 1.568328857421875, 1.6583251953125, 1.748321533203125, 1.83831787109375, 1.928314208984375, 2.018310546875, 2.108306884765625, 2.19830322265625, 2.288299560546875, 2.3782958984375, 2.468292236328125, 2.55828857421875, 2.648284912109375, 2.73828125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 7.0, 7.0, 8.0, 13.0, 14.0, 25.0, 47.0, 52.0, 85.0, 121.0, 191.0, 276.0, 442.0, 643.0, 1032.0, 1615.0, 2449.0, 3797.0, 5863.0, 9368.0, 14698.0, 22579.0, 34061.0, 50936.0, 74713.0, 104396.0, 139234.0, 1189462.0, 131708.0, 100064.0, 71112.0, 47819.0, 31770.0, 20821.0, 13343.0, 8632.0, 5503.0, 3542.0, 2306.0, 1545.0, 930.0, 617.0, 450.0, 279.0, 190.0, 127.0, 78.0, 56.0, 44.0, 27.0, 15.0, 9.0, 5.0, 9.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2130126953125, -0.20623397827148438, -0.19945526123046875, -0.19267654418945312, -0.1858978271484375, -0.17911911010742188, -0.17234039306640625, -0.16556167602539062, -0.158782958984375, -0.15200424194335938, -0.14522552490234375, -0.13844680786132812, -0.1316680908203125, -0.12488937377929688, -0.11811065673828125, -0.11133193969726562, -0.10455322265625, -0.09777450561523438, -0.09099578857421875, -0.08421707153320312, -0.0774383544921875, -0.07065963745117188, -0.06388092041015625, -0.057102203369140625, -0.050323486328125, -0.043544769287109375, -0.03676605224609375, -0.029987335205078125, -0.0232086181640625, -0.016429901123046875, -0.00965118408203125, -0.002872467041015625, 0.00390625, 0.010684967041015625, 0.01746368408203125, 0.024242401123046875, 0.0310211181640625, 0.037799835205078125, 0.04457855224609375, 0.051357269287109375, 0.058135986328125, 0.06491470336914062, 0.07169342041015625, 0.07847213745117188, 0.0852508544921875, 0.09202957153320312, 0.09880828857421875, 0.10558700561523438, 0.11236572265625, 0.11914443969726562, 0.12592315673828125, 0.13270187377929688, 0.1394805908203125, 0.14625930786132812, 0.15303802490234375, 0.15981674194335938, 0.166595458984375, 0.17337417602539062, 0.18015289306640625, 0.18693161010742188, 0.1937103271484375, 0.20048904418945312, 0.20726776123046875, 0.21404647827148438, 0.2208251953125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 7.0, 6.0, 4.0, 13.0, 8.0, 8.0, 14.0, 15.0, 20.0, 20.0, 39.0, 45.0, 55.0, 50.0, 85.0, 107.0, 90.0, 96.0, 64.0, 48.0, 41.0, 39.0, 19.0, 21.0, 16.0, 12.0, 12.0, 11.0, 6.0, 6.0, 7.0, 5.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01111602783203125, -0.010759234428405762, -0.010402441024780273, -0.010045647621154785, -0.009688854217529297, -0.009332060813903809, -0.00897526741027832, -0.008618474006652832, -0.008261680603027344, -0.007904887199401855, -0.007548093795776367, -0.007191300392150879, -0.006834506988525391, -0.006477713584899902, -0.006120920181274414, -0.005764126777648926, -0.0054073333740234375, -0.005050539970397949, -0.004693746566772461, -0.004336953163146973, -0.003980159759521484, -0.003623366355895996, -0.003266572952270508, -0.0029097795486450195, -0.0025529861450195312, -0.002196192741394043, -0.0018393993377685547, -0.0014826059341430664, -0.0011258125305175781, -0.0007690191268920898, -0.00041222572326660156, -5.543231964111328e-05, 0.000301361083984375, 0.0006581544876098633, 0.0010149478912353516, 0.0013717412948608398, 0.0017285346984863281, 0.0020853281021118164, 0.0024421215057373047, 0.002798914909362793, 0.0031557083129882812, 0.0035125017166137695, 0.003869295120239258, 0.004226088523864746, 0.004582881927490234, 0.004939675331115723, 0.005296468734741211, 0.005653262138366699, 0.0060100555419921875, 0.006366848945617676, 0.006723642349243164, 0.007080435752868652, 0.007437229156494141, 0.007794022560119629, 0.008150815963745117, 0.008507609367370605, 0.008864402770996094, 0.009221196174621582, 0.00957798957824707, 0.009934782981872559, 0.010291576385498047, 0.010648369789123535, 0.011005163192749023, 0.011361956596374512, 0.01171875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 10.0, 5.0, 13.0, 13.0, 16.0, 21.0, 26.0, 32.0, 44.0, 58.0, 105.0, 162.0, 477.0, 7244.0, 959456.0, 78625.0, 1525.0, 262.0, 121.0, 91.0, 71.0, 33.0, 32.0, 18.0, 18.0, 15.0, 6.0, 9.0, 12.0, 7.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.2548828125, -0.24754905700683594, -0.24021530151367188, -0.2328815460205078, -0.22554779052734375, -0.2182140350341797, -0.21088027954101562, -0.20354652404785156, -0.1962127685546875, -0.18887901306152344, -0.18154525756835938, -0.1742115020751953, -0.16687774658203125, -0.1595439910888672, -0.15221023559570312, -0.14487648010253906, -0.137542724609375, -0.13020896911621094, -0.12287521362304688, -0.11554145812988281, -0.10820770263671875, -0.10087394714355469, -0.09354019165039062, -0.08620643615722656, -0.0788726806640625, -0.07153892517089844, -0.06420516967773438, -0.05687141418457031, -0.04953765869140625, -0.04220390319824219, -0.034870147705078125, -0.027536392211914062, -0.02020263671875, -0.012868881225585938, -0.005535125732421875, 0.0017986297607421875, 0.00913238525390625, 0.016466140747070312, 0.023799896240234375, 0.031133651733398438, 0.0384674072265625, 0.04580116271972656, 0.053134918212890625, 0.06046867370605469, 0.06780242919921875, 0.07513618469238281, 0.08246994018554688, 0.08980369567871094, 0.097137451171875, 0.10447120666503906, 0.11180496215820312, 0.11913871765136719, 0.12647247314453125, 0.1338062286376953, 0.14113998413085938, 0.14847373962402344, 0.1558074951171875, 0.16314125061035156, 0.17047500610351562, 0.1778087615966797, 0.18514251708984375, 0.1924762725830078, 0.19981002807617188, 0.20714378356933594, 0.2144775390625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 10.0, 13.0, 29.0, 81.0, 202.0, 343.0, 175.0, 73.0, 39.0, 20.0, 8.0, 8.0, 3.0, 0.0, 0.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016347967088222504, -0.015122907236218452, -0.013897846452891827, -0.0126727856695652, -0.01144772581756115, -0.010222665965557098, -0.008997605182230473, -0.007772544398903847, -0.0065474845468997955, -0.005322424229234457, -0.0040973639115691185, -0.00287230359390378, -0.0016472432762384415, -0.00042218295857310295, 0.0008028773590922356, 0.0020279381424188614, 0.0032529979944229126, 0.004478058312088251, 0.00570311862975359, 0.006928178947418928, 0.008153239265084267, 0.009378299117088318, 0.010603359900414944, 0.01182842068374157, 0.01305348053574562, 0.014278540387749672, 0.015503601171076298, 0.016728661954402924, 0.017953721806406975, 0.019178781658411026, 0.020403843373060226, 0.021628903225064278, 0.02285396307706833, 0.02407902292907238, 0.02530408278107643, 0.02652914449572563, 0.027754204347729683, 0.028979264199733734, 0.030204325914382935, 0.031429387629032135, 0.03265444561839104, 0.03387950733304024, 0.03510456532239914, 0.03632962703704834, 0.03755468875169754, 0.03877974674105644, 0.04000480845570564, 0.041229866445064545, 0.042454928159713745, 0.043679989874362946, 0.04490504786372185, 0.04613010957837105, 0.04735516756772995, 0.04858022928237915, 0.04980529099702835, 0.05103035271167755, 0.05225541070103645, 0.053480472415685654, 0.054705530405044556, 0.055930592119693756, 0.05715565383434296, 0.05838071182370186, 0.05960577353835106, 0.06083083152770996, 0.06205589324235916]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 1.0, 8.0, 8.0, 7.0, 9.0, 6.0, 7.0, 13.0, 11.0, 22.0, 14.0, 19.0, 18.0, 14.0, 22.0, 23.0, 18.0, 33.0, 20.0, 37.0, 35.0, 37.0, 42.0, 33.0, 34.0, 28.0, 33.0, 38.0, 30.0, 36.0, 17.0, 29.0, 27.0, 32.0, 25.0, 24.0, 24.0, 24.0, 20.0, 16.0, 14.0, 14.0, 11.0, 11.0, 8.0, 17.0, 12.0, 1.0, 5.0, 3.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.010185658931732178, -0.009859631769359112, -0.009533604606986046, -0.00920757744461298, -0.008881550282239914, -0.008555523119866848, -0.008229495957493782, -0.007903468795120716, -0.00757744163274765, -0.007251414470374584, -0.006925387308001518, -0.006599360145628452, -0.006273332983255386, -0.00594730582088232, -0.0056212786585092545, -0.0052952514961361885, -0.0049692243337631226, -0.004643197171390057, -0.004317170009016991, -0.003991142846643925, -0.0036651156842708588, -0.003339088521897793, -0.003013061359524727, -0.002687034197151661, -0.002361007034778595, -0.002034979872405529, -0.001708952710032463, -0.0013829255476593971, -0.0010568983852863312, -0.0007308712229132652, -0.0004048440605401993, -7.881689816713333e-05, 0.0002472102642059326, 0.0005732374265789986, 0.0008992645889520645, 0.0012252917513251305, 0.0015513189136981964, 0.0018773460760712624, 0.0022033732384443283, 0.0025294004008173943, 0.00285542756319046, 0.003181454725563526, 0.003507481887936592, 0.003833509050309658, 0.004159536212682724, 0.00448556337505579, 0.004811590537428856, 0.005137617699801922, 0.005463644862174988, 0.005789672024548054, 0.00611569918692112, 0.006441726349294186, 0.006767753511667252, 0.0070937806740403175, 0.0074198078364133835, 0.007745834998786449, 0.008071862161159515, 0.008397889323532581, 0.008723916485905647, 0.009049943648278713, 0.00937597081065178, 0.009701997973024845, 0.010028025135397911, 0.010354052297770977, 0.010680079460144043]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 3.0, 6.0, 11.0, 9.0, 14.0, 20.0, 20.0, 18.0, 25.0, 32.0, 30.0, 48.0, 35.0, 35.0, 34.0, 34.0, 36.0, 41.0, 38.0, 44.0, 31.0, 44.0, 33.0, 43.0, 37.0, 34.0, 25.0, 23.0, 18.0, 28.0, 24.0, 19.0, 12.0, 12.0, 12.0, 13.0, 11.0, 11.0, 6.0, 6.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.27734375, -4.1483154296875, -4.019287109375, -3.8902587890625, -3.76123046875, -3.6322021484375, -3.503173828125, -3.3741455078125, -3.2451171875, -3.1160888671875, -2.987060546875, -2.8580322265625, -2.72900390625, -2.5999755859375, -2.470947265625, -2.3419189453125, -2.212890625, -2.0838623046875, -1.954833984375, -1.8258056640625, -1.69677734375, -1.5677490234375, -1.438720703125, -1.3096923828125, -1.1806640625, -1.0516357421875, -0.922607421875, -0.7935791015625, -0.66455078125, -0.5355224609375, -0.406494140625, -0.2774658203125, -0.1484375, -0.0194091796875, 0.109619140625, 0.2386474609375, 0.36767578125, 0.4967041015625, 0.625732421875, 0.7547607421875, 0.8837890625, 1.0128173828125, 1.141845703125, 1.2708740234375, 1.39990234375, 1.5289306640625, 1.657958984375, 1.7869873046875, 1.916015625, 2.0450439453125, 2.174072265625, 2.3031005859375, 2.43212890625, 2.5611572265625, 2.690185546875, 2.8192138671875, 2.9482421875, 3.0772705078125, 3.206298828125, 3.3353271484375, 3.46435546875, 3.5933837890625, 3.722412109375, 3.8514404296875, 3.98046875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 7.0, 5.0, 14.0, 21.0, 27.0, 43.0, 49.0, 72.0, 132.0, 196.0, 274.0, 496.0, 843.0, 1428.0, 2670.0, 5430.0, 11892.0, 28221.0, 66969.0, 150508.0, 335358.0, 246802.0, 110602.0, 48514.0, 20340.0, 8663.0, 4022.0, 2029.0, 1130.0, 649.0, 404.0, 233.0, 137.0, 105.0, 80.0, 53.0, 41.0, 19.0, 22.0, 17.0, 12.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3515625, -4.20556640625, -4.0595703125, -3.91357421875, -3.767578125, -3.62158203125, -3.4755859375, -3.32958984375, -3.18359375, -3.03759765625, -2.8916015625, -2.74560546875, -2.599609375, -2.45361328125, -2.3076171875, -2.16162109375, -2.015625, -1.86962890625, -1.7236328125, -1.57763671875, -1.431640625, -1.28564453125, -1.1396484375, -0.99365234375, -0.84765625, -0.70166015625, -0.5556640625, -0.40966796875, -0.263671875, -0.11767578125, 0.0283203125, 0.17431640625, 0.3203125, 0.46630859375, 0.6123046875, 0.75830078125, 0.904296875, 1.05029296875, 1.1962890625, 1.34228515625, 1.48828125, 1.63427734375, 1.7802734375, 1.92626953125, 2.072265625, 2.21826171875, 2.3642578125, 2.51025390625, 2.65625, 2.80224609375, 2.9482421875, 3.09423828125, 3.240234375, 3.38623046875, 3.5322265625, 3.67822265625, 3.82421875, 3.97021484375, 4.1162109375, 4.26220703125, 4.408203125, 4.55419921875, 4.7001953125, 4.84619140625, 4.9921875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 9.0, 5.0, 6.0, 11.0, 13.0, 16.0, 20.0, 14.0, 23.0, 28.0, 22.0, 30.0, 41.0, 51.0, 46.0, 67.0, 107.0, 197.0, 1466.0, 294.0, 124.0, 68.0, 63.0, 57.0, 51.0, 35.0, 29.0, 30.0, 29.0, 17.0, 18.0, 17.0, 12.0, 10.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8125, -14.2783203125, -13.744140625, -13.2099609375, -12.67578125, -12.1416015625, -11.607421875, -11.0732421875, -10.5390625, -10.0048828125, -9.470703125, -8.9365234375, -8.40234375, -7.8681640625, -7.333984375, -6.7998046875, -6.265625, -5.7314453125, -5.197265625, -4.6630859375, -4.12890625, -3.5947265625, -3.060546875, -2.5263671875, -1.9921875, -1.4580078125, -0.923828125, -0.3896484375, 0.14453125, 0.6787109375, 1.212890625, 1.7470703125, 2.28125, 2.8154296875, 3.349609375, 3.8837890625, 4.41796875, 4.9521484375, 5.486328125, 6.0205078125, 6.5546875, 7.0888671875, 7.623046875, 8.1572265625, 8.69140625, 9.2255859375, 9.759765625, 10.2939453125, 10.828125, 11.3623046875, 11.896484375, 12.4306640625, 12.96484375, 13.4990234375, 14.033203125, 14.5673828125, 15.1015625, 15.6357421875, 16.169921875, 16.7041015625, 17.23828125, 17.7724609375, 18.306640625, 18.8408203125, 19.375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 11.0, 10.0, 17.0, 17.0, 21.0, 25.0, 58.0, 84.0, 111.0, 205.0, 431.0, 1257.0, 16556.0, 3119202.0, 5844.0, 945.0, 368.0, 178.0, 128.0, 76.0, 49.0, 33.0, 16.0, 15.0, 16.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.1875, -85.82861328125, -83.4697265625, -81.11083984375, -78.751953125, -76.39306640625, -74.0341796875, -71.67529296875, -69.31640625, -66.95751953125, -64.5986328125, -62.23974609375, -59.880859375, -57.52197265625, -55.1630859375, -52.80419921875, -50.4453125, -48.08642578125, -45.7275390625, -43.36865234375, -41.009765625, -38.65087890625, -36.2919921875, -33.93310546875, -31.57421875, -29.21533203125, -26.8564453125, -24.49755859375, -22.138671875, -19.77978515625, -17.4208984375, -15.06201171875, -12.703125, -10.34423828125, -7.9853515625, -5.62646484375, -3.267578125, -0.90869140625, 1.4501953125, 3.80908203125, 6.16796875, 8.52685546875, 10.8857421875, 13.24462890625, 15.603515625, 17.96240234375, 20.3212890625, 22.68017578125, 25.0390625, 27.39794921875, 29.7568359375, 32.11572265625, 34.474609375, 36.83349609375, 39.1923828125, 41.55126953125, 43.91015625, 46.26904296875, 48.6279296875, 50.98681640625, 53.345703125, 55.70458984375, 58.0634765625, 60.42236328125, 62.78125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 11.0, 110.0, 389.0, 395.0, 101.0, 9.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.951934814453125, -11.977840423583984, -9.003745079040527, -6.02964973449707, -3.0555553436279297, -0.08146095275878906, 2.8926353454589844, 5.866729736328125, 8.840824127197266, 11.814918518066406, 14.789013862609863, 17.76310920715332, 20.73720359802246, 23.7112979888916, 26.685394287109375, 29.659488677978516, 32.633583068847656, 35.6076774597168, 38.58177185058594, 41.555870056152344, 44.52996063232422, 47.504058837890625, 50.478153228759766, 53.452247619628906, 56.42634201049805, 59.40043640136719, 62.37453079223633, 65.34862518310547, 68.32272338867188, 71.29681396484375, 74.27091217041016, 77.24501037597656, 80.21910095214844, 83.19319915771484, 86.16728973388672, 89.14138793945312, 92.115478515625, 95.0895767211914, 98.06367492675781, 101.03776550292969, 104.01185607910156, 106.98595428466797, 109.96004486083984, 112.93414306640625, 115.90823364257812, 118.88233184814453, 121.85643005371094, 124.83052062988281, 127.80461883544922, 130.77871704101562, 133.7528076171875, 136.72689819335938, 139.7010040283203, 142.6750946044922, 145.64918518066406, 148.623291015625, 151.59738159179688, 154.57147216796875, 157.5455780029297, 160.51966857910156, 163.49375915527344, 166.4678497314453, 169.44195556640625, 172.41604614257812, 175.39013671875]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 10.0, 11.0, 10.0, 12.0, 20.0, 18.0, 16.0, 22.0, 26.0, 37.0, 38.0, 37.0, 48.0, 29.0, 40.0, 29.0, 60.0, 45.0, 44.0, 41.0, 46.0, 31.0, 33.0, 24.0, 42.0, 36.0, 24.0, 23.0, 22.0, 26.0, 19.0, 14.0, 17.0, 7.0, 7.0, 8.0, 5.0, 3.0, 4.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.861671447753906, -36.64950180053711, -35.43733215332031, -34.22516632080078, -33.012996673583984, -31.800827026367188, -30.58865737915039, -29.376487731933594, -28.164318084716797, -26.9521484375, -25.739980697631836, -24.52781105041504, -23.315641403198242, -22.103473663330078, -20.89130401611328, -19.679134368896484, -18.46696662902832, -17.254796981811523, -16.04262924194336, -14.830459594726562, -13.618289947509766, -12.406121253967285, -11.193952560424805, -9.981782913208008, -8.769614219665527, -7.557445049285889, -6.34527587890625, -5.1331071853637695, -3.920938014984131, -2.708768844604492, -1.4966001510620117, -0.28443050384521484, 0.9277381896972656, 2.1399073600769043, 3.352076292037964, 4.564245223999023, 5.776414394378662, 6.988583564758301, 8.200752258300781, 9.412921905517578, 10.625090599060059, 11.837259292602539, 13.049428939819336, 14.261597633361816, 15.473766326904297, 16.685935974121094, 17.89810562133789, 19.110275268554688, 20.32244300842285, 21.53461265563965, 22.746780395507812, 23.95895004272461, 25.171119689941406, 26.383289337158203, 27.595457077026367, 28.807626724243164, 30.019794464111328, 31.231964111328125, 32.44413375854492, 33.65630340576172, 34.86846923828125, 36.08063888549805, 37.292808532714844, 38.50497817993164, 39.71714782714844]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 6.0, 9.0, 8.0, 4.0, 10.0, 7.0, 13.0, 13.0, 30.0, 24.0, 30.0, 27.0, 27.0, 34.0, 36.0, 28.0, 42.0, 53.0, 35.0, 45.0, 31.0, 36.0, 32.0, 34.0, 38.0, 40.0, 36.0, 33.0, 23.0, 22.0, 23.0, 25.0, 16.0, 18.0, 17.0, 20.0, 14.0, 13.0, 3.0, 5.0, 8.0, 8.0, 10.0, 3.0, 6.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5546875, -4.41680908203125, -4.2789306640625, -4.14105224609375, -4.003173828125, -3.86529541015625, -3.7274169921875, -3.58953857421875, -3.45166015625, -3.31378173828125, -3.1759033203125, -3.03802490234375, -2.900146484375, -2.76226806640625, -2.6243896484375, -2.48651123046875, -2.3486328125, -2.21075439453125, -2.0728759765625, -1.93499755859375, -1.797119140625, -1.65924072265625, -1.5213623046875, -1.38348388671875, -1.24560546875, -1.10772705078125, -0.9698486328125, -0.83197021484375, -0.694091796875, -0.55621337890625, -0.4183349609375, -0.28045654296875, -0.142578125, -0.00469970703125, 0.1331787109375, 0.27105712890625, 0.408935546875, 0.54681396484375, 0.6846923828125, 0.82257080078125, 0.96044921875, 1.09832763671875, 1.2362060546875, 1.37408447265625, 1.511962890625, 1.64984130859375, 1.7877197265625, 1.92559814453125, 2.0634765625, 2.20135498046875, 2.3392333984375, 2.47711181640625, 2.614990234375, 2.75286865234375, 2.8907470703125, 3.02862548828125, 3.16650390625, 3.30438232421875, 3.4422607421875, 3.58013916015625, 3.718017578125, 3.85589599609375, 3.9937744140625, 4.13165283203125, 4.26953125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 9.0, 15.0, 20.0, 18.0, 24.0, 34.0, 39.0, 45.0, 66.0, 61.0, 101.0, 166.0, 246.0, 463.0, 1235.0, 3965.0, 16964.0, 87073.0, 456102.0, 1490283.0, 1542397.0, 476715.0, 92908.0, 18325.0, 4209.0, 1309.0, 545.0, 297.0, 150.0, 99.0, 77.0, 54.0, 48.0, 32.0, 31.0, 19.0, 23.0, 24.0, 13.0, 8.0, 17.0, 14.0, 5.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0], "bins": [-8.40625, -8.16619873046875, -7.9261474609375, -7.68609619140625, -7.446044921875, -7.20599365234375, -6.9659423828125, -6.72589111328125, -6.48583984375, -6.24578857421875, -6.0057373046875, -5.76568603515625, -5.525634765625, -5.28558349609375, -5.0455322265625, -4.80548095703125, -4.5654296875, -4.32537841796875, -4.0853271484375, -3.84527587890625, -3.605224609375, -3.36517333984375, -3.1251220703125, -2.88507080078125, -2.64501953125, -2.40496826171875, -2.1649169921875, -1.92486572265625, -1.684814453125, -1.44476318359375, -1.2047119140625, -0.96466064453125, -0.724609375, -0.48455810546875, -0.2445068359375, -0.00445556640625, 0.235595703125, 0.47564697265625, 0.7156982421875, 0.95574951171875, 1.19580078125, 1.43585205078125, 1.6759033203125, 1.91595458984375, 2.156005859375, 2.39605712890625, 2.6361083984375, 2.87615966796875, 3.1162109375, 3.35626220703125, 3.5963134765625, 3.83636474609375, 4.076416015625, 4.31646728515625, 4.5565185546875, 4.79656982421875, 5.03662109375, 5.27667236328125, 5.5167236328125, 5.75677490234375, 5.996826171875, 6.23687744140625, 6.4769287109375, 6.71697998046875, 6.95703125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 6.0, 8.0, 7.0, 9.0, 17.0, 42.0, 45.0, 53.0, 82.0, 97.0, 170.0, 204.0, 286.0, 352.0, 430.0, 455.0, 421.0, 354.0, 263.0, 193.0, 141.0, 116.0, 94.0, 61.0, 48.0, 32.0, 25.0, 20.0, 19.0, 9.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.6732177734375, -8.346435546875, -8.0196533203125, -7.69287109375, -7.3660888671875, -7.039306640625, -6.7125244140625, -6.3857421875, -6.0589599609375, -5.732177734375, -5.4053955078125, -5.07861328125, -4.7518310546875, -4.425048828125, -4.0982666015625, -3.771484375, -3.4447021484375, -3.117919921875, -2.7911376953125, -2.46435546875, -2.1375732421875, -1.810791015625, -1.4840087890625, -1.1572265625, -0.8304443359375, -0.503662109375, -0.1768798828125, 0.14990234375, 0.4766845703125, 0.803466796875, 1.1302490234375, 1.45703125, 1.7838134765625, 2.110595703125, 2.4373779296875, 2.76416015625, 3.0909423828125, 3.417724609375, 3.7445068359375, 4.0712890625, 4.3980712890625, 4.724853515625, 5.0516357421875, 5.37841796875, 5.7052001953125, 6.031982421875, 6.3587646484375, 6.685546875, 7.0123291015625, 7.339111328125, 7.6658935546875, 7.99267578125, 8.3194580078125, 8.646240234375, 8.9730224609375, 9.2998046875, 9.6265869140625, 9.953369140625, 10.2801513671875, 10.60693359375, 10.9337158203125, 11.260498046875, 11.5872802734375, 11.9140625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 1.0, 8.0, 11.0, 13.0, 20.0, 25.0, 33.0, 54.0, 67.0, 91.0, 135.0, 155.0, 266.0, 482.0, 2109.0, 728974.0, 3452449.0, 7716.0, 653.0, 323.0, 202.0, 169.0, 88.0, 65.0, 53.0, 39.0, 33.0, 12.0, 14.0, 8.0, 5.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.6875, -54.18896484375, -52.6904296875, -51.19189453125, -49.693359375, -48.19482421875, -46.6962890625, -45.19775390625, -43.69921875, -42.20068359375, -40.7021484375, -39.20361328125, -37.705078125, -36.20654296875, -34.7080078125, -33.20947265625, -31.7109375, -30.21240234375, -28.7138671875, -27.21533203125, -25.716796875, -24.21826171875, -22.7197265625, -21.22119140625, -19.72265625, -18.22412109375, -16.7255859375, -15.22705078125, -13.728515625, -12.22998046875, -10.7314453125, -9.23291015625, -7.734375, -6.23583984375, -4.7373046875, -3.23876953125, -1.740234375, -0.24169921875, 1.2568359375, 2.75537109375, 4.25390625, 5.75244140625, 7.2509765625, 8.74951171875, 10.248046875, 11.74658203125, 13.2451171875, 14.74365234375, 16.2421875, 17.74072265625, 19.2392578125, 20.73779296875, 22.236328125, 23.73486328125, 25.2333984375, 26.73193359375, 28.23046875, 29.72900390625, 31.2275390625, 32.72607421875, 34.224609375, 35.72314453125, 37.2216796875, 38.72021484375, 40.21875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 2.0, 23.0, 68.0, 176.0, 226.0, 272.0, 157.0, 71.0, 15.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.012392044067383, -27.58333969116211, -24.154285430908203, -20.725231170654297, -17.296178817749023, -13.867124557495117, -10.438072204589844, -7.00901985168457, -3.579965591430664, -0.15091228485107422, 3.2781410217285156, 6.7071943283081055, 10.136247634887695, 13.565301895141602, 16.994354248046875, 20.42340660095215, 23.852460861206055, 27.281513214111328, 30.710567474365234, 34.13962173461914, 37.56867218017578, 40.99772644042969, 44.426780700683594, 47.8558349609375, 51.284889221191406, 54.71394348144531, 58.14299774169922, 61.57204818725586, 65.0010986328125, 68.43016052246094, 71.85920715332031, 75.28826141357422, 78.71731567382812, 82.14636993408203, 85.57542419433594, 89.00447845458984, 92.43353271484375, 95.86257934570312, 99.29163360595703, 102.72068786621094, 106.14974212646484, 109.57879638671875, 113.00785064697266, 116.43690490722656, 119.86595153808594, 123.29501342773438, 126.72406005859375, 130.15310668945312, 133.58216857910156, 137.01121520996094, 140.44027709960938, 143.86932373046875, 147.2983856201172, 150.72743225097656, 154.156494140625, 157.58554077148438, 161.01458740234375, 164.44363403320312, 167.87269592285156, 171.30174255371094, 174.73080444335938, 178.15985107421875, 181.5889129638672, 185.01795959472656, 188.447021484375]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 7.0, 7.0, 9.0, 14.0, 20.0, 27.0, 28.0, 24.0, 30.0, 42.0, 34.0, 37.0, 46.0, 35.0, 36.0, 44.0, 38.0, 43.0, 36.0, 44.0, 42.0, 40.0, 43.0, 29.0, 27.0, 31.0, 27.0, 21.0, 22.0, 16.0, 9.0, 14.0, 11.0, 11.0, 10.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-31.871028900146484, -30.838356018066406, -29.805683135986328, -28.773008346557617, -27.74033546447754, -26.70766258239746, -25.67498779296875, -24.642314910888672, -23.609642028808594, -22.576969146728516, -21.544296264648438, -20.511621475219727, -19.47894859313965, -18.44627571105957, -17.41360092163086, -16.38092803955078, -15.348255157470703, -14.315582275390625, -13.28290843963623, -12.250234603881836, -11.217561721801758, -10.18488883972168, -9.152215003967285, -8.11954116821289, -7.0868682861328125, -6.054194927215576, -5.02152156829834, -3.9888482093811035, -2.956174850463867, -1.9235014915466309, -0.8908281326293945, 0.1418452262878418, 1.1745147705078125, 2.207188129425049, 3.239861488342285, 4.2725348472595215, 5.305208206176758, 6.337881565093994, 7.3705549240112305, 8.403228759765625, 9.435901641845703, 10.468574523925781, 11.501248359680176, 12.53392219543457, 13.566595077514648, 14.599267959594727, 15.631941795349121, 16.664615631103516, 17.697288513183594, 18.729961395263672, 19.76263427734375, 20.79530906677246, 21.82798194885254, 22.860654830932617, 23.893329620361328, 24.926002502441406, 25.958675384521484, 26.991348266601562, 28.02402114868164, 29.05669593811035, 30.08936882019043, 31.122041702270508, 32.15471649169922, 33.1873893737793, 34.220062255859375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 14.0, 7.0, 6.0, 13.0, 8.0, 10.0, 18.0, 33.0, 19.0, 33.0, 34.0, 30.0, 36.0, 28.0, 40.0, 37.0, 33.0, 39.0, 46.0, 42.0, 34.0, 36.0, 34.0, 39.0, 35.0, 32.0, 26.0, 26.0, 29.0, 12.0, 22.0, 24.0, 17.0, 18.0, 17.0, 11.0, 5.0, 10.0, 8.0, 6.0, 9.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.1953125, -4.0614013671875, -3.927490234375, -3.7935791015625, -3.65966796875, -3.5257568359375, -3.391845703125, -3.2579345703125, -3.1240234375, -2.9901123046875, -2.856201171875, -2.7222900390625, -2.58837890625, -2.4544677734375, -2.320556640625, -2.1866455078125, -2.052734375, -1.9188232421875, -1.784912109375, -1.6510009765625, -1.51708984375, -1.3831787109375, -1.249267578125, -1.1153564453125, -0.9814453125, -0.8475341796875, -0.713623046875, -0.5797119140625, -0.44580078125, -0.3118896484375, -0.177978515625, -0.0440673828125, 0.08984375, 0.2237548828125, 0.357666015625, 0.4915771484375, 0.62548828125, 0.7593994140625, 0.893310546875, 1.0272216796875, 1.1611328125, 1.2950439453125, 1.428955078125, 1.5628662109375, 1.69677734375, 1.8306884765625, 1.964599609375, 2.0985107421875, 2.232421875, 2.3663330078125, 2.500244140625, 2.6341552734375, 2.76806640625, 2.9019775390625, 3.035888671875, 3.1697998046875, 3.3037109375, 3.4376220703125, 3.571533203125, 3.7054443359375, 3.83935546875, 3.9732666015625, 4.107177734375, 4.2410888671875, 4.375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 8.0, 14.0, 30.0, 39.0, 54.0, 92.0, 145.0, 277.0, 449.0, 785.0, 1285.0, 2350.0, 4147.0, 7665.0, 14107.0, 25844.0, 46984.0, 83674.0, 142252.0, 206321.0, 201103.0, 134555.0, 78822.0, 44074.0, 24191.0, 13046.0, 7267.0, 3863.0, 2166.0, 1223.0, 728.0, 449.0, 224.0, 120.0, 81.0, 51.0, 24.0, 21.0, 15.0, 7.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423095703125, -0.4079551696777344, -0.39281463623046875, -0.3776741027832031, -0.3625335693359375, -0.3473930358886719, -0.33225250244140625, -0.3171119689941406, -0.301971435546875, -0.2868309020996094, -0.27169036865234375, -0.2565498352050781, -0.2414093017578125, -0.22626876831054688, -0.21112823486328125, -0.19598770141601562, -0.18084716796875, -0.16570663452148438, -0.15056610107421875, -0.13542556762695312, -0.1202850341796875, -0.10514450073242188, -0.09000396728515625, -0.07486343383789062, -0.059722900390625, -0.044582366943359375, -0.02944183349609375, -0.014301300048828125, 0.0008392333984375, 0.015979766845703125, 0.03112030029296875, 0.046260833740234375, 0.0614013671875, 0.07654190063476562, 0.09168243408203125, 0.10682296752929688, 0.1219635009765625, 0.13710403442382812, 0.15224456787109375, 0.16738510131835938, 0.182525634765625, 0.19766616821289062, 0.21280670166015625, 0.22794723510742188, 0.2430877685546875, 0.2582283020019531, 0.27336883544921875, 0.2885093688964844, 0.30364990234375, 0.3187904357910156, 0.33393096923828125, 0.3490715026855469, 0.3642120361328125, 0.3793525695800781, 0.39449310302734375, 0.4096336364746094, 0.424774169921875, 0.4399147033691406, 0.45505523681640625, 0.4701957702636719, 0.4853363037109375, 0.5004768371582031, 0.5156173706054688, 0.5307579040527344, 0.5458984375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 7.0, 5.0, 12.0, 13.0, 21.0, 16.0, 19.0, 26.0, 28.0, 33.0, 26.0, 26.0, 33.0, 25.0, 38.0, 35.0, 31.0, 45.0, 1067.0, 46.0, 35.0, 47.0, 26.0, 35.0, 28.0, 38.0, 35.0, 36.0, 26.0, 27.0, 14.0, 17.0, 15.0, 12.0, 15.0, 12.0, 7.0, 5.0, 5.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-2.802734375, -2.717987060546875, -2.63323974609375, -2.548492431640625, -2.4637451171875, -2.378997802734375, -2.29425048828125, -2.209503173828125, -2.124755859375, -2.040008544921875, -1.95526123046875, -1.870513916015625, -1.7857666015625, -1.701019287109375, -1.61627197265625, -1.531524658203125, -1.44677734375, -1.362030029296875, -1.27728271484375, -1.192535400390625, -1.1077880859375, -1.023040771484375, -0.93829345703125, -0.853546142578125, -0.768798828125, -0.684051513671875, -0.59930419921875, -0.514556884765625, -0.4298095703125, -0.345062255859375, -0.26031494140625, -0.175567626953125, -0.0908203125, -0.006072998046875, 0.07867431640625, 0.163421630859375, 0.2481689453125, 0.332916259765625, 0.41766357421875, 0.502410888671875, 0.587158203125, 0.671905517578125, 0.75665283203125, 0.841400146484375, 0.9261474609375, 1.010894775390625, 1.09564208984375, 1.180389404296875, 1.26513671875, 1.349884033203125, 1.43463134765625, 1.519378662109375, 1.6041259765625, 1.688873291015625, 1.77362060546875, 1.858367919921875, 1.943115234375, 2.027862548828125, 2.11260986328125, 2.197357177734375, 2.2821044921875, 2.366851806640625, 2.45159912109375, 2.536346435546875, 2.62109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 14.0, 20.0, 24.0, 30.0, 52.0, 81.0, 107.0, 172.0, 261.0, 406.0, 611.0, 924.0, 1556.0, 2582.0, 3837.0, 6195.0, 9693.0, 15166.0, 23795.0, 36420.0, 55390.0, 80799.0, 111520.0, 158696.0, 1166933.0, 128113.0, 96285.0, 68311.0, 45907.0, 29906.0, 19248.0, 12317.0, 7908.0, 5040.0, 3154.0, 1988.0, 1302.0, 857.0, 528.0, 339.0, 246.0, 156.0, 96.0, 61.0, 31.0, 19.0, 14.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2174072265625, -0.21045494079589844, -0.20350265502929688, -0.1965503692626953, -0.18959808349609375, -0.1826457977294922, -0.17569351196289062, -0.16874122619628906, -0.1617889404296875, -0.15483665466308594, -0.14788436889648438, -0.1409320831298828, -0.13397979736328125, -0.1270275115966797, -0.12007522583007812, -0.11312294006347656, -0.106170654296875, -0.09921836853027344, -0.09226608276367188, -0.08531379699707031, -0.07836151123046875, -0.07140922546386719, -0.06445693969726562, -0.05750465393066406, -0.0505523681640625, -0.04360008239746094, -0.036647796630859375, -0.029695510864257812, -0.02274322509765625, -0.015790939331054688, -0.008838653564453125, -0.0018863677978515625, 0.00506591796875, 0.012018203735351562, 0.018970489501953125, 0.025922775268554688, 0.03287506103515625, 0.03982734680175781, 0.046779632568359375, 0.05373191833496094, 0.0606842041015625, 0.06763648986816406, 0.07458877563476562, 0.08154106140136719, 0.08849334716796875, 0.09544563293457031, 0.10239791870117188, 0.10935020446777344, 0.116302490234375, 0.12325477600097656, 0.13020706176757812, 0.1371593475341797, 0.14411163330078125, 0.1510639190673828, 0.15801620483398438, 0.16496849060058594, 0.1719207763671875, 0.17887306213378906, 0.18582534790039062, 0.1927776336669922, 0.19972991943359375, 0.2066822052001953, 0.21363449096679688, 0.22058677673339844, 0.2275390625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 6.0, 10.0, 6.0, 15.0, 29.0, 16.0, 49.0, 80.0, 95.0, 191.0, 147.0, 100.0, 74.0, 46.0, 30.0, 26.0, 20.0, 13.0, 7.0, 5.0, 3.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.02484130859375, -0.024167537689208984, -0.02349376678466797, -0.022819995880126953, -0.022146224975585938, -0.021472454071044922, -0.020798683166503906, -0.02012491226196289, -0.019451141357421875, -0.01877737045288086, -0.018103599548339844, -0.017429828643798828, -0.016756057739257812, -0.016082286834716797, -0.015408515930175781, -0.014734745025634766, -0.01406097412109375, -0.013387203216552734, -0.012713432312011719, -0.012039661407470703, -0.011365890502929688, -0.010692119598388672, -0.010018348693847656, -0.00934457778930664, -0.008670806884765625, -0.00799703598022461, -0.007323265075683594, -0.006649494171142578, -0.0059757232666015625, -0.005301952362060547, -0.004628181457519531, -0.003954410552978516, -0.0032806396484375, -0.0026068687438964844, -0.0019330978393554688, -0.0012593269348144531, -0.0005855560302734375, 8.821487426757812e-05, 0.0007619857788085938, 0.0014357566833496094, 0.002109527587890625, 0.0027832984924316406, 0.0034570693969726562, 0.004130840301513672, 0.0048046112060546875, 0.005478382110595703, 0.006152153015136719, 0.006825923919677734, 0.00749969482421875, 0.008173465728759766, 0.008847236633300781, 0.009521007537841797, 0.010194778442382812, 0.010868549346923828, 0.011542320251464844, 0.01221609115600586, 0.012889862060546875, 0.01356363296508789, 0.014237403869628906, 0.014911174774169922, 0.015584945678710938, 0.016258716583251953, 0.01693248748779297, 0.017606258392333984, 0.018280029296875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 9.0, 7.0, 12.0, 15.0, 33.0, 31.0, 47.0, 94.0, 181.0, 414.0, 16598.0, 1029443.0, 1129.0, 240.0, 105.0, 50.0, 36.0, 35.0, 9.0, 14.0, 8.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385986328125, -0.3718299865722656, -0.35767364501953125, -0.3435173034667969, -0.3293609619140625, -0.3152046203613281, -0.30104827880859375, -0.2868919372558594, -0.272735595703125, -0.2585792541503906, -0.24442291259765625, -0.23026657104492188, -0.2161102294921875, -0.20195388793945312, -0.18779754638671875, -0.17364120483398438, -0.15948486328125, -0.14532852172851562, -0.13117218017578125, -0.11701583862304688, -0.1028594970703125, -0.08870315551757812, -0.07454681396484375, -0.060390472412109375, -0.046234130859375, -0.032077789306640625, -0.01792144775390625, -0.003765106201171875, 0.0103912353515625, 0.024547576904296875, 0.03870391845703125, 0.052860260009765625, 0.0670166015625, 0.08117294311523438, 0.09532928466796875, 0.10948562622070312, 0.1236419677734375, 0.13779830932617188, 0.15195465087890625, 0.16611099243164062, 0.180267333984375, 0.19442367553710938, 0.20858001708984375, 0.22273635864257812, 0.2368927001953125, 0.2510490417480469, 0.26520538330078125, 0.2793617248535156, 0.29351806640625, 0.3076744079589844, 0.32183074951171875, 0.3359870910644531, 0.3501434326171875, 0.3642997741699219, 0.37845611572265625, 0.3926124572753906, 0.406768798828125, 0.4209251403808594, 0.43508148193359375, 0.4492378234863281, 0.4633941650390625, 0.4775505065917969, 0.49170684814453125, 0.5058631896972656, 0.52001953125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 148.0, 767.0, 84.0, 9.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13448819518089294, -0.12989123165607452, -0.1252942681312561, -0.12069730460643768, -0.11610034853219986, -0.11150338500738144, -0.10690642148256302, -0.1023094654083252, -0.09771250188350677, -0.09311553835868835, -0.08851857483386993, -0.08392161130905151, -0.07932465523481369, -0.07472769170999527, -0.07013072818517685, -0.06553377211093903, -0.06093680113554001, -0.05633983761072159, -0.051742877811193466, -0.047145914286375046, -0.042548954486846924, -0.0379519909620285, -0.03335502743721008, -0.02875806763768196, -0.02416110411286354, -0.01956414245069027, -0.014967179857194424, -0.010370217263698578, -0.005773255601525307, -0.0011762939393520355, 0.003420669585466385, 0.008017629384994507, 0.012614592909812927, 0.0172115545719862, 0.02180851623415947, 0.02640547975897789, 0.03100244142115116, 0.03559940308332443, 0.04019636660814285, 0.044793326407670975, 0.049390289932489395, 0.053987253457307816, 0.05858421325683594, 0.06318117678165436, 0.06777814030647278, 0.0723751038312912, 0.07697206735610962, 0.08156902343034744, 0.08616598695516586, 0.09076295047998428, 0.0953599140048027, 0.09995687007904053, 0.10455383360385895, 0.10915079712867737, 0.11374776065349579, 0.11834472417831421, 0.12294168770313263, 0.12753865122795105, 0.13213561475276947, 0.1367325782775879, 0.1413295418024063, 0.14592650532722473, 0.15052345395088196, 0.15512041747570038, 0.1597173810005188]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 7.0, 8.0, 10.0, 13.0, 18.0, 18.0, 18.0, 19.0, 22.0, 36.0, 29.0, 43.0, 41.0, 44.0, 37.0, 33.0, 35.0, 25.0, 46.0, 39.0, 52.0, 27.0, 41.0, 28.0, 37.0, 28.0, 30.0, 23.0, 25.0, 28.0, 21.0, 24.0, 16.0, 11.0, 11.0, 12.0, 10.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.018322348594665527, -0.017755262553691864, -0.0171881765127182, -0.016621090471744537, -0.016054004430770874, -0.01548691838979721, -0.014919832348823547, -0.014352746307849884, -0.01378566026687622, -0.013218574225902557, -0.012651488184928894, -0.01208440214395523, -0.011517316102981567, -0.010950230062007904, -0.01038314402103424, -0.009816057980060577, -0.009248971939086914, -0.00868188589811325, -0.008114799857139587, -0.007547713816165924, -0.006980627775192261, -0.006413541734218597, -0.005846455693244934, -0.005279369652271271, -0.004712283611297607, -0.004145197570323944, -0.0035781115293502808, -0.0030110254883766174, -0.002443939447402954, -0.0018768534064292908, -0.0013097673654556274, -0.0007426813244819641, -0.00017559528350830078, 0.00039149075746536255, 0.0009585767984390259, 0.0015256628394126892, 0.0020927488803863525, 0.002659834921360016, 0.003226920962333679, 0.0037940070033073425, 0.004361093044281006, 0.004928179085254669, 0.0054952651262283325, 0.006062351167201996, 0.006629437208175659, 0.0071965232491493225, 0.007763609290122986, 0.00833069533109665, 0.008897781372070312, 0.009464867413043976, 0.01003195345401764, 0.010599039494991302, 0.011166125535964966, 0.01173321157693863, 0.012300297617912292, 0.012867383658885956, 0.01343446969985962, 0.014001555740833282, 0.014568641781806946, 0.015135727822780609, 0.015702813863754272, 0.016269899904727936, 0.0168369859457016, 0.017404071986675262, 0.017971158027648926]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 14.0, 7.0, 6.0, 13.0, 8.0, 10.0, 18.0, 33.0, 19.0, 33.0, 34.0, 30.0, 36.0, 28.0, 40.0, 37.0, 33.0, 39.0, 46.0, 42.0, 34.0, 36.0, 34.0, 39.0, 34.0, 33.0, 26.0, 26.0, 29.0, 12.0, 22.0, 24.0, 17.0, 19.0, 16.0, 11.0, 5.0, 10.0, 8.0, 6.0, 9.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.1953125, -4.0614013671875, -3.927490234375, -3.7935791015625, -3.65966796875, -3.5257568359375, -3.391845703125, -3.2579345703125, -3.1240234375, -2.9901123046875, -2.856201171875, -2.7222900390625, -2.58837890625, -2.4544677734375, -2.320556640625, -2.1866455078125, -2.052734375, -1.9188232421875, -1.784912109375, -1.6510009765625, -1.51708984375, -1.3831787109375, -1.249267578125, -1.1153564453125, -0.9814453125, -0.8475341796875, -0.713623046875, -0.5797119140625, -0.44580078125, -0.3118896484375, -0.177978515625, -0.0440673828125, 0.08984375, 0.2237548828125, 0.357666015625, 0.4915771484375, 0.62548828125, 0.7593994140625, 0.893310546875, 1.0272216796875, 1.1611328125, 1.2950439453125, 1.428955078125, 1.5628662109375, 1.69677734375, 1.8306884765625, 1.964599609375, 2.0985107421875, 2.232421875, 2.3663330078125, 2.500244140625, 2.6341552734375, 2.76806640625, 2.9019775390625, 3.035888671875, 3.1697998046875, 3.3037109375, 3.4376220703125, 3.571533203125, 3.7054443359375, 3.83935546875, 3.9732666015625, 4.107177734375, 4.2410888671875, 4.375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 1.0, 6.0, 5.0, 3.0, 9.0, 11.0, 4.0, 16.0, 18.0, 25.0, 22.0, 42.0, 56.0, 112.0, 150.0, 276.0, 536.0, 993.0, 1945.0, 3637.0, 6929.0, 13291.0, 26094.0, 54982.0, 129452.0, 321754.0, 280590.0, 111304.0, 48075.0, 22947.0, 11870.0, 6181.0, 3355.0, 1789.0, 856.0, 508.0, 277.0, 152.0, 89.0, 45.0, 43.0, 25.0, 14.0, 14.0, 11.0, 12.0, 9.0, 5.0, 4.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.625, -4.47039794921875, -4.3157958984375, -4.16119384765625, -4.006591796875, -3.85198974609375, -3.6973876953125, -3.54278564453125, -3.38818359375, -3.23358154296875, -3.0789794921875, -2.92437744140625, -2.769775390625, -2.61517333984375, -2.4605712890625, -2.30596923828125, -2.1513671875, -1.99676513671875, -1.8421630859375, -1.68756103515625, -1.532958984375, -1.37835693359375, -1.2237548828125, -1.06915283203125, -0.91455078125, -0.75994873046875, -0.6053466796875, -0.45074462890625, -0.296142578125, -0.14154052734375, 0.0130615234375, 0.16766357421875, 0.322265625, 0.47686767578125, 0.6314697265625, 0.78607177734375, 0.940673828125, 1.09527587890625, 1.2498779296875, 1.40447998046875, 1.55908203125, 1.71368408203125, 1.8682861328125, 2.02288818359375, 2.177490234375, 2.33209228515625, 2.4866943359375, 2.64129638671875, 2.7958984375, 2.95050048828125, 3.1051025390625, 3.25970458984375, 3.414306640625, 3.56890869140625, 3.7235107421875, 3.87811279296875, 4.03271484375, 4.18731689453125, 4.3419189453125, 4.49652099609375, 4.651123046875, 4.80572509765625, 4.9603271484375, 5.11492919921875, 5.26953125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 2.0, 5.0, 5.0, 6.0, 9.0, 12.0, 12.0, 25.0, 21.0, 23.0, 34.0, 22.0, 30.0, 36.0, 34.0, 46.0, 47.0, 70.0, 108.0, 180.0, 1365.0, 328.0, 150.0, 74.0, 57.0, 37.0, 36.0, 40.0, 37.0, 32.0, 22.0, 15.0, 14.0, 23.0, 9.0, 13.0, 14.0, 8.0, 9.0, 9.0, 6.0, 4.0, 4.0, 2.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0], "bins": [-17.78125, -17.257568359375, -16.73388671875, -16.210205078125, -15.6865234375, -15.162841796875, -14.63916015625, -14.115478515625, -13.591796875, -13.068115234375, -12.54443359375, -12.020751953125, -11.4970703125, -10.973388671875, -10.44970703125, -9.926025390625, -9.40234375, -8.878662109375, -8.35498046875, -7.831298828125, -7.3076171875, -6.783935546875, -6.26025390625, -5.736572265625, -5.212890625, -4.689208984375, -4.16552734375, -3.641845703125, -3.1181640625, -2.594482421875, -2.07080078125, -1.547119140625, -1.0234375, -0.499755859375, 0.02392578125, 0.547607421875, 1.0712890625, 1.594970703125, 2.11865234375, 2.642333984375, 3.166015625, 3.689697265625, 4.21337890625, 4.737060546875, 5.2607421875, 5.784423828125, 6.30810546875, 6.831787109375, 7.35546875, 7.879150390625, 8.40283203125, 8.926513671875, 9.4501953125, 9.973876953125, 10.49755859375, 11.021240234375, 11.544921875, 12.068603515625, 12.59228515625, 13.115966796875, 13.6396484375, 14.163330078125, 14.68701171875, 15.210693359375, 15.734375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 11.0, 11.0, 13.0, 9.0, 18.0, 23.0, 25.0, 25.0, 36.0, 53.0, 58.0, 70.0, 104.0, 178.0, 206.0, 285.0, 641.0, 2216.0, 67227.0, 3038876.0, 32137.0, 1681.0, 548.0, 339.0, 217.0, 153.0, 109.0, 99.0, 58.0, 63.0, 40.0, 27.0, 28.0, 23.0, 15.0, 16.0, 9.0, 9.0, 9.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-42.84375, -41.5224609375, -40.201171875, -38.8798828125, -37.55859375, -36.2373046875, -34.916015625, -33.5947265625, -32.2734375, -30.9521484375, -29.630859375, -28.3095703125, -26.98828125, -25.6669921875, -24.345703125, -23.0244140625, -21.703125, -20.3818359375, -19.060546875, -17.7392578125, -16.41796875, -15.0966796875, -13.775390625, -12.4541015625, -11.1328125, -9.8115234375, -8.490234375, -7.1689453125, -5.84765625, -4.5263671875, -3.205078125, -1.8837890625, -0.5625, 0.7587890625, 2.080078125, 3.4013671875, 4.72265625, 6.0439453125, 7.365234375, 8.6865234375, 10.0078125, 11.3291015625, 12.650390625, 13.9716796875, 15.29296875, 16.6142578125, 17.935546875, 19.2568359375, 20.578125, 21.8994140625, 23.220703125, 24.5419921875, 25.86328125, 27.1845703125, 28.505859375, 29.8271484375, 31.1484375, 32.4697265625, 33.791015625, 35.1123046875, 36.43359375, 37.7548828125, 39.076171875, 40.3974609375, 41.71875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 73.0, 237.0, 401.0, 234.0, 53.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-138.49945068359375, -135.95594787597656, -133.4124298095703, -130.86892700195312, -128.32542419433594, -125.78190612792969, -123.2384033203125, -120.69489288330078, -118.15138244628906, -115.60787200927734, -113.06436920166016, -110.52085876464844, -107.97734832763672, -105.433837890625, -102.89033508300781, -100.3468246459961, -97.80331420898438, -95.25980377197266, -92.71630096435547, -90.17279052734375, -87.62928009033203, -85.08576965332031, -82.54226684570312, -79.9987564086914, -77.45525360107422, -74.9117431640625, -72.36824035644531, -69.8247299194336, -67.28121948242188, -64.73770904541016, -62.19420623779297, -59.65069580078125, -57.10718536376953, -54.56367874145508, -52.02016830444336, -49.476661682128906, -46.93315124511719, -44.389644622802734, -41.84613800048828, -39.30262756347656, -36.759117126464844, -34.21561050415039, -31.672100067138672, -29.12859344482422, -26.5850830078125, -24.041576385498047, -21.49806785583496, -18.954559326171875, -16.411052703857422, -13.867544174194336, -11.32403564453125, -8.78052806854248, -6.2370195388793945, -3.6935110092163086, -1.150003433227539, 1.3935050964355469, 3.937013626098633, 6.480522155761719, 9.024030685424805, 11.567538261413574, 14.11104679107666, 16.654556274414062, 19.198062896728516, 21.7415714263916, 24.285079956054688]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 11.0, 8.0, 6.0, 8.0, 12.0, 15.0, 9.0, 17.0, 16.0, 18.0, 20.0, 22.0, 32.0, 21.0, 29.0, 29.0, 35.0, 38.0, 36.0, 38.0, 39.0, 47.0, 42.0, 44.0, 39.0, 49.0, 36.0, 34.0, 28.0, 27.0, 26.0, 25.0, 22.0, 24.0, 19.0, 23.0, 12.0, 8.0, 6.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-42.71039581298828, -41.401756286621094, -40.09312057495117, -38.784481048583984, -37.4758415222168, -36.167205810546875, -34.85856628417969, -33.5499267578125, -32.24128723144531, -30.932649612426758, -29.62401008605957, -28.315372467041016, -27.006732940673828, -25.698095321655273, -24.38945770263672, -23.08081817626953, -21.77218246459961, -20.463544845581055, -19.154905319213867, -17.846267700195312, -16.537628173828125, -15.22899055480957, -13.920352935791016, -12.611714363098145, -11.303075790405273, -9.994437217712402, -8.685798645019531, -7.377161026000977, -6.0685224533081055, -4.759883880615234, -3.4512457847595215, -2.1426076889038086, -0.8339653015136719, 0.4746730327606201, 1.783311367034912, 3.091949701309204, 4.400588035583496, 5.709226608276367, 7.01786470413208, 8.326502799987793, 9.635141372680664, 10.943779945373535, 12.252418518066406, 13.561056137084961, 14.869694709777832, 16.178333282470703, 17.486970901489258, 18.795608520507812, 20.104248046875, 21.412885665893555, 22.721525192260742, 24.030162811279297, 25.338802337646484, 26.64743995666504, 27.956077575683594, 29.26471710205078, 30.573354721069336, 31.88199234008789, 33.19063186645508, 34.499271392822266, 35.80790710449219, 37.116546630859375, 38.42518615722656, 39.733821868896484, 41.04246139526367]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 7.0, 4.0, 4.0, 5.0, 2.0, 7.0, 6.0, 11.0, 9.0, 11.0, 18.0, 18.0, 23.0, 22.0, 24.0, 35.0, 35.0, 28.0, 22.0, 37.0, 37.0, 46.0, 32.0, 49.0, 34.0, 39.0, 40.0, 33.0, 36.0, 35.0, 42.0, 36.0, 23.0, 23.0, 25.0, 23.0, 20.0, 17.0, 5.0, 20.0, 9.0, 10.0, 13.0, 10.0, 8.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.51953125, -4.37078857421875, -4.2220458984375, -4.07330322265625, -3.924560546875, -3.77581787109375, -3.6270751953125, -3.47833251953125, -3.32958984375, -3.18084716796875, -3.0321044921875, -2.88336181640625, -2.734619140625, -2.58587646484375, -2.4371337890625, -2.28839111328125, -2.1396484375, -1.99090576171875, -1.8421630859375, -1.69342041015625, -1.544677734375, -1.39593505859375, -1.2471923828125, -1.09844970703125, -0.94970703125, -0.80096435546875, -0.6522216796875, -0.50347900390625, -0.354736328125, -0.20599365234375, -0.0572509765625, 0.09149169921875, 0.240234375, 0.38897705078125, 0.5377197265625, 0.68646240234375, 0.835205078125, 0.98394775390625, 1.1326904296875, 1.28143310546875, 1.43017578125, 1.57891845703125, 1.7276611328125, 1.87640380859375, 2.025146484375, 2.17388916015625, 2.3226318359375, 2.47137451171875, 2.6201171875, 2.76885986328125, 2.9176025390625, 3.06634521484375, 3.215087890625, 3.36383056640625, 3.5125732421875, 3.66131591796875, 3.81005859375, 3.95880126953125, 4.1075439453125, 4.25628662109375, 4.405029296875, 4.55377197265625, 4.7025146484375, 4.85125732421875, 5.0]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 8.0, 4.0, 2.0, 5.0, 6.0, 9.0, 12.0, 6.0, 18.0, 21.0, 29.0, 35.0, 41.0, 58.0, 71.0, 96.0, 147.0, 213.0, 461.0, 1121.0, 5107.0, 33516.0, 280062.0, 1642308.0, 1834850.0, 345809.0, 41326.0, 6208.0, 1327.0, 548.0, 241.0, 166.0, 111.0, 79.0, 55.0, 44.0, 42.0, 34.0, 27.0, 9.0, 16.0, 8.0, 11.0, 4.0, 7.0, 4.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.54638671875, -9.2177734375, -8.88916015625, -8.560546875, -8.23193359375, -7.9033203125, -7.57470703125, -7.24609375, -6.91748046875, -6.5888671875, -6.26025390625, -5.931640625, -5.60302734375, -5.2744140625, -4.94580078125, -4.6171875, -4.28857421875, -3.9599609375, -3.63134765625, -3.302734375, -2.97412109375, -2.6455078125, -2.31689453125, -1.98828125, -1.65966796875, -1.3310546875, -1.00244140625, -0.673828125, -0.34521484375, -0.0166015625, 0.31201171875, 0.640625, 0.96923828125, 1.2978515625, 1.62646484375, 1.955078125, 2.28369140625, 2.6123046875, 2.94091796875, 3.26953125, 3.59814453125, 3.9267578125, 4.25537109375, 4.583984375, 4.91259765625, 5.2412109375, 5.56982421875, 5.8984375, 6.22705078125, 6.5556640625, 6.88427734375, 7.212890625, 7.54150390625, 7.8701171875, 8.19873046875, 8.52734375, 8.85595703125, 9.1845703125, 9.51318359375, 9.841796875, 10.17041015625, 10.4990234375, 10.82763671875, 11.15625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 11.0, 12.0, 22.0, 27.0, 31.0, 44.0, 55.0, 83.0, 118.0, 152.0, 201.0, 287.0, 359.0, 394.0, 421.0, 415.0, 316.0, 254.0, 220.0, 148.0, 119.0, 86.0, 85.0, 60.0, 42.0, 19.0, 20.0, 18.0, 13.0, 8.0, 4.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.7265625, -8.420654296875, -8.11474609375, -7.808837890625, -7.5029296875, -7.197021484375, -6.89111328125, -6.585205078125, -6.279296875, -5.973388671875, -5.66748046875, -5.361572265625, -5.0556640625, -4.749755859375, -4.44384765625, -4.137939453125, -3.83203125, -3.526123046875, -3.22021484375, -2.914306640625, -2.6083984375, -2.302490234375, -1.99658203125, -1.690673828125, -1.384765625, -1.078857421875, -0.77294921875, -0.467041015625, -0.1611328125, 0.144775390625, 0.45068359375, 0.756591796875, 1.0625, 1.368408203125, 1.67431640625, 1.980224609375, 2.2861328125, 2.592041015625, 2.89794921875, 3.203857421875, 3.509765625, 3.815673828125, 4.12158203125, 4.427490234375, 4.7333984375, 5.039306640625, 5.34521484375, 5.651123046875, 5.95703125, 6.262939453125, 6.56884765625, 6.874755859375, 7.1806640625, 7.486572265625, 7.79248046875, 8.098388671875, 8.404296875, 8.710205078125, 9.01611328125, 9.322021484375, 9.6279296875, 9.933837890625, 10.23974609375, 10.545654296875, 10.8515625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 10.0, 6.0, 9.0, 7.0, 24.0, 18.0, 28.0, 41.0, 61.0, 87.0, 103.0, 124.0, 191.0, 312.0, 427.0, 1999.0, 291717.0, 3863411.0, 33586.0, 894.0, 402.0, 252.0, 173.0, 114.0, 75.0, 54.0, 40.0, 29.0, 27.0, 20.0, 12.0, 5.0, 11.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.03125, -48.65380859375, -47.2763671875, -45.89892578125, -44.521484375, -43.14404296875, -41.7666015625, -40.38916015625, -39.01171875, -37.63427734375, -36.2568359375, -34.87939453125, -33.501953125, -32.12451171875, -30.7470703125, -29.36962890625, -27.9921875, -26.61474609375, -25.2373046875, -23.85986328125, -22.482421875, -21.10498046875, -19.7275390625, -18.35009765625, -16.97265625, -15.59521484375, -14.2177734375, -12.84033203125, -11.462890625, -10.08544921875, -8.7080078125, -7.33056640625, -5.953125, -4.57568359375, -3.1982421875, -1.82080078125, -0.443359375, 0.93408203125, 2.3115234375, 3.68896484375, 5.06640625, 6.44384765625, 7.8212890625, 9.19873046875, 10.576171875, 11.95361328125, 13.3310546875, 14.70849609375, 16.0859375, 17.46337890625, 18.8408203125, 20.21826171875, 21.595703125, 22.97314453125, 24.3505859375, 25.72802734375, 27.10546875, 28.48291015625, 29.8603515625, 31.23779296875, 32.615234375, 33.99267578125, 35.3701171875, 36.74755859375, 38.125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 15.0, 48.0, 219.0, 342.0, 255.0, 109.0, 23.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.34267044067383, -35.22692108154297, -31.11117172241211, -26.99542236328125, -22.87967300415039, -18.76392364501953, -14.648174285888672, -10.532424926757812, -6.416675567626953, -2.3009262084960938, 1.8148231506347656, 5.930572509765625, 10.046321868896484, 14.162071228027344, 18.277820587158203, 22.393569946289062, 26.509319305419922, 30.62506866455078, 34.74081802368164, 38.8565673828125, 42.97231674194336, 47.08806610107422, 51.20381546020508, 55.31956481933594, 59.4353141784668, 63.551063537597656, 67.66680908203125, 71.78256225585938, 75.8983154296875, 80.0140609741211, 84.12980651855469, 88.24555969238281, 92.36129760742188, 96.47705078125, 100.5927963256836, 104.70854187011719, 108.82429504394531, 112.94004821777344, 117.05579376220703, 121.17153930664062, 125.28729248046875, 129.40304565429688, 133.518798828125, 137.63453674316406, 141.7502899169922, 145.8660430908203, 149.98178100585938, 154.0975341796875, 158.21328735351562, 162.32904052734375, 166.44479370117188, 170.56053161621094, 174.67628479003906, 178.7920379638672, 182.90777587890625, 187.02352905273438, 191.1392822265625, 195.25503540039062, 199.37078857421875, 203.4865264892578, 207.60227966308594, 211.71803283691406, 215.83377075195312, 219.94952392578125, 224.06527709960938]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 7.0, 6.0, 8.0, 11.0, 13.0, 6.0, 16.0, 16.0, 28.0, 18.0, 30.0, 34.0, 34.0, 41.0, 45.0, 47.0, 46.0, 44.0, 44.0, 45.0, 36.0, 39.0, 56.0, 34.0, 52.0, 38.0, 29.0, 25.0, 25.0, 22.0, 12.0, 9.0, 17.0, 13.0, 14.0, 8.0, 6.0, 5.0, 3.0, 4.0, 1.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-39.37056350708008, -38.268489837646484, -37.166419982910156, -36.06434631347656, -34.962276458740234, -33.86020278930664, -32.75813293457031, -31.65605926513672, -30.55398941040039, -29.45191764831543, -28.34984588623047, -27.247774124145508, -26.145702362060547, -25.043630599975586, -23.941558837890625, -22.83948516845703, -21.73741340637207, -20.63534164428711, -19.53326988220215, -18.431198120117188, -17.329126358032227, -16.227054595947266, -15.124981880187988, -14.022910118103027, -12.920838356018066, -11.818766593933105, -10.716694831848145, -9.614622116088867, -8.512550354003906, -7.4104790687561035, -6.308406829833984, -5.206335067749023, -4.104265213012695, -3.0021934509277344, -1.9001214504241943, -0.7980494499206543, 0.30402231216430664, 1.4060940742492676, 2.5081663131713867, 3.6102380752563477, 4.712309837341309, 5.8143815994262695, 6.9164533615112305, 8.018526077270508, 9.120597839355469, 10.22266960144043, 11.32474136352539, 12.426813125610352, 13.528884887695312, 14.630956649780273, 15.733028411865234, 16.835100173950195, 17.937171936035156, 19.039243698120117, 20.141315460205078, 21.243389129638672, 22.345458984375, 23.44753074645996, 24.549602508544922, 25.651674270629883, 26.753746032714844, 27.855817794799805, 28.957889556884766, 30.05996322631836, 31.16203498840332]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 11.0, 7.0, 14.0, 9.0, 13.0, 12.0, 21.0, 19.0, 27.0, 30.0, 17.0, 34.0, 31.0, 41.0, 51.0, 35.0, 38.0, 32.0, 38.0, 40.0, 38.0, 34.0, 33.0, 39.0, 35.0, 30.0, 35.0, 18.0, 22.0, 29.0, 16.0, 16.0, 20.0, 17.0, 17.0, 14.0, 14.0, 8.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.5234375, -4.38616943359375, -4.2489013671875, -4.11163330078125, -3.974365234375, -3.83709716796875, -3.6998291015625, -3.56256103515625, -3.42529296875, -3.28802490234375, -3.1507568359375, -3.01348876953125, -2.876220703125, -2.73895263671875, -2.6016845703125, -2.46441650390625, -2.3271484375, -2.18988037109375, -2.0526123046875, -1.91534423828125, -1.778076171875, -1.64080810546875, -1.5035400390625, -1.36627197265625, -1.22900390625, -1.09173583984375, -0.9544677734375, -0.81719970703125, -0.679931640625, -0.54266357421875, -0.4053955078125, -0.26812744140625, -0.130859375, 0.00640869140625, 0.1436767578125, 0.28094482421875, 0.418212890625, 0.55548095703125, 0.6927490234375, 0.83001708984375, 0.96728515625, 1.10455322265625, 1.2418212890625, 1.37908935546875, 1.516357421875, 1.65362548828125, 1.7908935546875, 1.92816162109375, 2.0654296875, 2.20269775390625, 2.3399658203125, 2.47723388671875, 2.614501953125, 2.75177001953125, 2.8890380859375, 3.02630615234375, 3.16357421875, 3.30084228515625, 3.4381103515625, 3.57537841796875, 3.712646484375, 3.84991455078125, 3.9871826171875, 4.12445068359375, 4.26171875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 11.0, 21.0, 36.0, 45.0, 65.0, 99.0, 158.0, 217.0, 351.0, 518.0, 720.0, 1110.0, 1687.0, 2569.0, 3788.0, 5757.0, 8482.0, 13247.0, 19846.0, 29773.0, 43902.0, 64292.0, 90019.0, 118933.0, 141856.0, 136766.0, 110005.0, 81061.0, 56303.0, 39087.0, 26132.0, 17449.0, 11571.0, 7580.0, 5007.0, 3358.0, 2209.0, 1485.0, 979.0, 646.0, 455.0, 340.0, 182.0, 140.0, 94.0, 65.0, 54.0, 31.0, 23.0, 14.0, 11.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.317626953125, -0.3076515197753906, -0.29767608642578125, -0.2877006530761719, -0.2777252197265625, -0.2677497863769531, -0.25777435302734375, -0.24779891967773438, -0.237823486328125, -0.22784805297851562, -0.21787261962890625, -0.20789718627929688, -0.1979217529296875, -0.18794631958007812, -0.17797088623046875, -0.16799545288085938, -0.15802001953125, -0.14804458618164062, -0.13806915283203125, -0.12809371948242188, -0.1181182861328125, -0.10814285278320312, -0.09816741943359375, -0.08819198608398438, -0.078216552734375, -0.06824111938476562, -0.05826568603515625, -0.048290252685546875, -0.0383148193359375, -0.028339385986328125, -0.01836395263671875, -0.008388519287109375, 0.0015869140625, 0.011562347412109375, 0.02153778076171875, 0.031513214111328125, 0.0414886474609375, 0.051464080810546875, 0.06143951416015625, 0.07141494750976562, 0.081390380859375, 0.09136581420898438, 0.10134124755859375, 0.11131668090820312, 0.1212921142578125, 0.13126754760742188, 0.14124298095703125, 0.15121841430664062, 0.16119384765625, 0.17116928100585938, 0.18114471435546875, 0.19112014770507812, 0.2010955810546875, 0.21107101440429688, 0.22104644775390625, 0.23102188110351562, 0.240997314453125, 0.2509727478027344, 0.26094818115234375, 0.2709236145019531, 0.2808990478515625, 0.2908744812011719, 0.30084991455078125, 0.3108253479003906, 0.32080078125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 3.0, 2.0, 5.0, 8.0, 11.0, 10.0, 14.0, 21.0, 21.0, 15.0, 29.0, 25.0, 32.0, 37.0, 27.0, 51.0, 36.0, 30.0, 49.0, 36.0, 1073.0, 36.0, 37.0, 40.0, 52.0, 33.0, 40.0, 34.0, 37.0, 37.0, 20.0, 27.0, 20.0, 12.0, 10.0, 18.0, 10.0, 8.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.375, -3.27471923828125, -3.1744384765625, -3.07415771484375, -2.973876953125, -2.87359619140625, -2.7733154296875, -2.67303466796875, -2.57275390625, -2.47247314453125, -2.3721923828125, -2.27191162109375, -2.171630859375, -2.07135009765625, -1.9710693359375, -1.87078857421875, -1.7705078125, -1.67022705078125, -1.5699462890625, -1.46966552734375, -1.369384765625, -1.26910400390625, -1.1688232421875, -1.06854248046875, -0.96826171875, -0.86798095703125, -0.7677001953125, -0.66741943359375, -0.567138671875, -0.46685791015625, -0.3665771484375, -0.26629638671875, -0.166015625, -0.06573486328125, 0.0345458984375, 0.13482666015625, 0.235107421875, 0.33538818359375, 0.4356689453125, 0.53594970703125, 0.63623046875, 0.73651123046875, 0.8367919921875, 0.93707275390625, 1.037353515625, 1.13763427734375, 1.2379150390625, 1.33819580078125, 1.4384765625, 1.53875732421875, 1.6390380859375, 1.73931884765625, 1.839599609375, 1.93988037109375, 2.0401611328125, 2.14044189453125, 2.24072265625, 2.34100341796875, 2.4412841796875, 2.54156494140625, 2.641845703125, 2.74212646484375, 2.8424072265625, 2.94268798828125, 3.04296875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 13.0, 17.0, 30.0, 44.0, 77.0, 105.0, 147.0, 250.0, 356.0, 557.0, 862.0, 1378.0, 2347.0, 3566.0, 6102.0, 9971.0, 16446.0, 27133.0, 43556.0, 68035.0, 100949.0, 137262.0, 1197059.0, 154237.0, 113740.0, 78207.0, 51573.0, 32146.0, 19779.0, 12027.0, 7403.0, 4446.0, 2697.0, 1691.0, 1080.0, 631.0, 428.0, 268.0, 175.0, 123.0, 65.0, 54.0, 29.0, 22.0, 18.0, 10.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.27392578125, -0.26602745056152344, -0.2581291198730469, -0.2502307891845703, -0.24233245849609375, -0.2344341278076172, -0.22653579711914062, -0.21863746643066406, -0.2107391357421875, -0.20284080505371094, -0.19494247436523438, -0.1870441436767578, -0.17914581298828125, -0.1712474822998047, -0.16334915161132812, -0.15545082092285156, -0.147552490234375, -0.13965415954589844, -0.13175582885742188, -0.12385749816894531, -0.11595916748046875, -0.10806083679199219, -0.10016250610351562, -0.09226417541503906, -0.0843658447265625, -0.07646751403808594, -0.06856918334960938, -0.06067085266113281, -0.05277252197265625, -0.04487419128417969, -0.036975860595703125, -0.029077529907226562, -0.02117919921875, -0.013280868530273438, -0.005382537841796875, 0.0025157928466796875, 0.01041412353515625, 0.018312454223632812, 0.026210784912109375, 0.03410911560058594, 0.0420074462890625, 0.04990577697753906, 0.057804107666015625, 0.06570243835449219, 0.07360076904296875, 0.08149909973144531, 0.08939743041992188, 0.09729576110839844, 0.105194091796875, 0.11309242248535156, 0.12099075317382812, 0.1288890838623047, 0.13678741455078125, 0.1446857452392578, 0.15258407592773438, 0.16048240661621094, 0.1683807373046875, 0.17627906799316406, 0.18417739868164062, 0.1920757293701172, 0.19997406005859375, 0.2078723907470703, 0.21577072143554688, 0.22366905212402344, 0.2315673828125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 3.0, 6.0, 5.0, 8.0, 10.0, 10.0, 14.0, 22.0, 40.0, 58.0, 82.0, 137.0, 204.0, 153.0, 68.0, 46.0, 34.0, 15.0, 16.0, 16.0, 14.0, 11.0, 5.0, 4.0, 2.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.0160980224609375, -0.015568971633911133, -0.015039920806884766, -0.014510869979858398, -0.013981819152832031, -0.013452768325805664, -0.012923717498779297, -0.01239466667175293, -0.011865615844726562, -0.011336565017700195, -0.010807514190673828, -0.010278463363647461, -0.009749412536621094, -0.009220361709594727, -0.00869131088256836, -0.008162260055541992, -0.007633209228515625, -0.007104158401489258, -0.006575107574462891, -0.0060460567474365234, -0.005517005920410156, -0.004987955093383789, -0.004458904266357422, -0.003929853439331055, -0.0034008026123046875, -0.0028717517852783203, -0.002342700958251953, -0.001813650131225586, -0.0012845993041992188, -0.0007555484771728516, -0.00022649765014648438, 0.0003025531768798828, 0.00083160400390625, 0.0013606548309326172, 0.0018897056579589844, 0.0024187564849853516, 0.0029478073120117188, 0.003476858139038086, 0.004005908966064453, 0.00453495979309082, 0.0050640106201171875, 0.005593061447143555, 0.006122112274169922, 0.006651163101196289, 0.007180213928222656, 0.0077092647552490234, 0.00823831558227539, 0.008767366409301758, 0.009296417236328125, 0.009825468063354492, 0.01035451889038086, 0.010883569717407227, 0.011412620544433594, 0.011941671371459961, 0.012470722198486328, 0.012999773025512695, 0.013528823852539062, 0.01405787467956543, 0.014586925506591797, 0.015115976333618164, 0.01564502716064453, 0.0161740779876709, 0.016703128814697266, 0.017232179641723633, 0.01776123046875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 9.0, 3.0, 5.0, 9.0, 12.0, 14.0, 20.0, 33.0, 42.0, 72.0, 126.0, 235.0, 2259.0, 1038911.0, 6124.0, 314.0, 138.0, 81.0, 44.0, 29.0, 13.0, 15.0, 14.0, 7.0, 7.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388916015625, -0.3773345947265625, -0.365753173828125, -0.3541717529296875, -0.34259033203125, -0.3310089111328125, -0.319427490234375, -0.3078460693359375, -0.2962646484375, -0.2846832275390625, -0.273101806640625, -0.2615203857421875, -0.24993896484375, -0.2383575439453125, -0.226776123046875, -0.2151947021484375, -0.20361328125, -0.1920318603515625, -0.180450439453125, -0.1688690185546875, -0.15728759765625, -0.1457061767578125, -0.134124755859375, -0.1225433349609375, -0.1109619140625, -0.0993804931640625, -0.087799072265625, -0.0762176513671875, -0.06463623046875, -0.0530548095703125, -0.041473388671875, -0.0298919677734375, -0.018310546875, -0.0067291259765625, 0.004852294921875, 0.0164337158203125, 0.02801513671875, 0.0395965576171875, 0.051177978515625, 0.0627593994140625, 0.0743408203125, 0.0859222412109375, 0.097503662109375, 0.1090850830078125, 0.12066650390625, 0.1322479248046875, 0.143829345703125, 0.1554107666015625, 0.1669921875, 0.1785736083984375, 0.190155029296875, 0.2017364501953125, 0.21331787109375, 0.2248992919921875, 0.236480712890625, 0.2480621337890625, 0.2596435546875, 0.2712249755859375, 0.282806396484375, 0.2943878173828125, 0.30596923828125, 0.3175506591796875, 0.329132080078125, 0.3407135009765625, 0.352294921875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 23.0, 53.0, 147.0, 287.0, 263.0, 106.0, 58.0, 28.0, 12.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013879046775400639, -0.013049098663032055, -0.012219149619340897, -0.011389201506972313, -0.01055925339460373, -0.009729305282235146, -0.008899357169866562, -0.008069408126175404, -0.00723946001380682, -0.006409511901438236, -0.005579563323408365, -0.004749614745378494, -0.003919666633009911, -0.003089718520641327, -0.002259769942611456, -0.001429821364581585, -0.0005998732522130013, 0.00023007509298622608, 0.0010600234381854534, 0.0018899717833846807, 0.002719920128583908, 0.0035498682409524918, 0.004379816818982363, 0.005209765397012234, 0.006039713509380817, 0.006869661621749401, 0.007699610199779272, 0.008529558777809143, 0.009359506890177727, 0.01018945500254631, 0.011019403114914894, 0.011849352158606052, 0.01267930120229721, 0.013509249314665794, 0.014339197427034378, 0.015169146470725536, 0.015999093651771545, 0.01682904362678528, 0.017658991739153862, 0.018488939851522446, 0.01931888796389103, 0.020148836076259613, 0.020978784188628197, 0.02180873230099678, 0.022638682276010513, 0.023468628525733948, 0.02429857850074768, 0.025128526613116264, 0.025958474725484848, 0.02678842283785343, 0.027618370950222015, 0.0284483190625906, 0.029278267174959183, 0.030108217149972916, 0.0309381652623415, 0.03176811337471008, 0.032598063349723816, 0.03342801332473755, 0.03425795957446098, 0.035087909549474716, 0.03591785579919815, 0.036747805774211884, 0.03757775202393532, 0.03840770199894905, 0.039237648248672485]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 7.0, 12.0, 9.0, 4.0, 12.0, 10.0, 18.0, 21.0, 19.0, 29.0, 25.0, 32.0, 27.0, 41.0, 34.0, 41.0, 40.0, 47.0, 49.0, 38.0, 41.0, 38.0, 50.0, 44.0, 40.0, 32.0, 32.0, 26.0, 31.0, 23.0, 22.0, 15.0, 21.0, 15.0, 15.0, 12.0, 5.0, 5.0, 4.0, 8.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0110853910446167, -0.010772244073450565, -0.010459097102284431, -0.010145950131118298, -0.009832803159952164, -0.00951965618878603, -0.009206509217619896, -0.008893362246453762, -0.008580215275287628, -0.008267068304121494, -0.00795392133295536, -0.0076407743617892265, -0.007327627390623093, -0.007014480419456959, -0.006701333448290825, -0.006388186477124691, -0.006075039505958557, -0.005761892534792423, -0.005448745563626289, -0.0051355985924601555, -0.004822451621294022, -0.004509304650127888, -0.004196157678961754, -0.00388301070779562, -0.003569863736629486, -0.003256716765463352, -0.0029435697942972183, -0.0026304228231310844, -0.0023172758519649506, -0.0020041288807988167, -0.0016909819096326828, -0.001377834938466549, -0.001064687967300415, -0.0007515409961342812, -0.0004383940249681473, -0.0001252470538020134, 0.00018789991736412048, 0.0005010468885302544, 0.0008141938596963882, 0.0011273408308625221, 0.001440487802028656, 0.0017536347731947899, 0.0020667817443609238, 0.0023799287155270576, 0.0026930756866931915, 0.0030062226578593254, 0.0033193696290254593, 0.003632516600191593, 0.003945663571357727, 0.004258810542523861, 0.004571957513689995, 0.004885104484856129, 0.005198251456022263, 0.0055113984271883965, 0.00582454539835453, 0.006137692369520664, 0.006450839340686798, 0.006763986311852932, 0.007077133283019066, 0.0073902802541852, 0.007703427225351334, 0.008016574196517467, 0.008329721167683601, 0.008642868138849735, 0.00895601511001587]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 3.0, 4.0, 3.0, 7.0, 6.0, 11.0, 7.0, 14.0, 9.0, 13.0, 12.0, 21.0, 19.0, 27.0, 30.0, 17.0, 34.0, 31.0, 41.0, 51.0, 35.0, 38.0, 32.0, 38.0, 40.0, 38.0, 34.0, 33.0, 39.0, 35.0, 30.0, 35.0, 18.0, 23.0, 28.0, 16.0, 16.0, 20.0, 17.0, 17.0, 14.0, 14.0, 8.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.5234375, -4.38616943359375, -4.2489013671875, -4.11163330078125, -3.974365234375, -3.83709716796875, -3.6998291015625, -3.56256103515625, -3.42529296875, -3.28802490234375, -3.1507568359375, -3.01348876953125, -2.876220703125, -2.73895263671875, -2.6016845703125, -2.46441650390625, -2.3271484375, -2.18988037109375, -2.0526123046875, -1.91534423828125, -1.778076171875, -1.64080810546875, -1.5035400390625, -1.36627197265625, -1.22900390625, -1.09173583984375, -0.9544677734375, -0.81719970703125, -0.679931640625, -0.54266357421875, -0.4053955078125, -0.26812744140625, -0.130859375, 0.00640869140625, 0.1436767578125, 0.28094482421875, 0.418212890625, 0.55548095703125, 0.6927490234375, 0.83001708984375, 0.96728515625, 1.10455322265625, 1.2418212890625, 1.37908935546875, 1.516357421875, 1.65362548828125, 1.7908935546875, 1.92816162109375, 2.0654296875, 2.20269775390625, 2.3399658203125, 2.47723388671875, 2.614501953125, 2.75177001953125, 2.8890380859375, 3.02630615234375, 3.16357421875, 3.30084228515625, 3.4381103515625, 3.57537841796875, 3.712646484375, 3.84991455078125, 3.9871826171875, 4.12445068359375, 4.26171875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 8.0, 13.0, 9.0, 15.0, 20.0, 22.0, 27.0, 37.0, 35.0, 57.0, 96.0, 101.0, 208.0, 356.0, 708.0, 1402.0, 2826.0, 5679.0, 11365.0, 22525.0, 44231.0, 88072.0, 181195.0, 313182.0, 190361.0, 92132.0, 46044.0, 23736.0, 12092.0, 5854.0, 2962.0, 1390.0, 703.0, 364.0, 217.0, 121.0, 94.0, 48.0, 50.0, 35.0, 39.0, 25.0, 19.0, 19.0, 13.0, 9.0, 7.0, 6.0, 3.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.73828125, -4.5880126953125, -4.437744140625, -4.2874755859375, -4.13720703125, -3.9869384765625, -3.836669921875, -3.6864013671875, -3.5361328125, -3.3858642578125, -3.235595703125, -3.0853271484375, -2.93505859375, -2.7847900390625, -2.634521484375, -2.4842529296875, -2.333984375, -2.1837158203125, -2.033447265625, -1.8831787109375, -1.73291015625, -1.5826416015625, -1.432373046875, -1.2821044921875, -1.1318359375, -0.9815673828125, -0.831298828125, -0.6810302734375, -0.53076171875, -0.3804931640625, -0.230224609375, -0.0799560546875, 0.0703125, 0.2205810546875, 0.370849609375, 0.5211181640625, 0.67138671875, 0.8216552734375, 0.971923828125, 1.1221923828125, 1.2724609375, 1.4227294921875, 1.572998046875, 1.7232666015625, 1.87353515625, 2.0238037109375, 2.174072265625, 2.3243408203125, 2.474609375, 2.6248779296875, 2.775146484375, 2.9254150390625, 3.07568359375, 3.2259521484375, 3.376220703125, 3.5264892578125, 3.6767578125, 3.8270263671875, 3.977294921875, 4.1275634765625, 4.27783203125, 4.4281005859375, 4.578369140625, 4.7286376953125, 4.87890625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 9.0, 16.0, 14.0, 13.0, 21.0, 26.0, 35.0, 42.0, 36.0, 43.0, 61.0, 62.0, 59.0, 126.0, 322.0, 1443.0, 221.0, 110.0, 51.0, 43.0, 43.0, 30.0, 27.0, 36.0, 28.0, 20.0, 23.0, 11.0, 17.0, 8.0, 12.0, 11.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.25, -18.688720703125, -18.12744140625, -17.566162109375, -17.0048828125, -16.443603515625, -15.88232421875, -15.321044921875, -14.759765625, -14.198486328125, -13.63720703125, -13.075927734375, -12.5146484375, -11.953369140625, -11.39208984375, -10.830810546875, -10.26953125, -9.708251953125, -9.14697265625, -8.585693359375, -8.0244140625, -7.463134765625, -6.90185546875, -6.340576171875, -5.779296875, -5.218017578125, -4.65673828125, -4.095458984375, -3.5341796875, -2.972900390625, -2.41162109375, -1.850341796875, -1.2890625, -0.727783203125, -0.16650390625, 0.394775390625, 0.9560546875, 1.517333984375, 2.07861328125, 2.639892578125, 3.201171875, 3.762451171875, 4.32373046875, 4.885009765625, 5.4462890625, 6.007568359375, 6.56884765625, 7.130126953125, 7.69140625, 8.252685546875, 8.81396484375, 9.375244140625, 9.9365234375, 10.497802734375, 11.05908203125, 11.620361328125, 12.181640625, 12.742919921875, 13.30419921875, 13.865478515625, 14.4267578125, 14.988037109375, 15.54931640625, 16.110595703125, 16.671875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 6.0, 5.0, 9.0, 7.0, 12.0, 6.0, 9.0, 18.0, 13.0, 20.0, 33.0, 31.0, 46.0, 75.0, 88.0, 127.0, 216.0, 332.0, 660.0, 1555.0, 21384.0, 3084204.0, 33225.0, 1816.0, 706.0, 343.0, 221.0, 125.0, 94.0, 76.0, 53.0, 42.0, 32.0, 23.0, 13.0, 15.0, 11.0, 13.0, 9.0, 9.0, 4.0, 3.0, 6.0, 5.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-53.59375, -51.94677734375, -50.2998046875, -48.65283203125, -47.005859375, -45.35888671875, -43.7119140625, -42.06494140625, -40.41796875, -38.77099609375, -37.1240234375, -35.47705078125, -33.830078125, -32.18310546875, -30.5361328125, -28.88916015625, -27.2421875, -25.59521484375, -23.9482421875, -22.30126953125, -20.654296875, -19.00732421875, -17.3603515625, -15.71337890625, -14.06640625, -12.41943359375, -10.7724609375, -9.12548828125, -7.478515625, -5.83154296875, -4.1845703125, -2.53759765625, -0.890625, 0.75634765625, 2.4033203125, 4.05029296875, 5.697265625, 7.34423828125, 8.9912109375, 10.63818359375, 12.28515625, 13.93212890625, 15.5791015625, 17.22607421875, 18.873046875, 20.52001953125, 22.1669921875, 23.81396484375, 25.4609375, 27.10791015625, 28.7548828125, 30.40185546875, 32.048828125, 33.69580078125, 35.3427734375, 36.98974609375, 38.63671875, 40.28369140625, 41.9306640625, 43.57763671875, 45.224609375, 46.87158203125, 48.5185546875, 50.16552734375, 51.8125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 194.0, 659.0, 156.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.0184631347656, -262.2860107421875, -257.5535888671875, -252.82115173339844, -248.08871459960938, -243.3562774658203, -238.62384033203125, -233.89138793945312, -229.15896606445312, -224.42652893066406, -219.694091796875, -214.96165466308594, -210.22921752929688, -205.4967803955078, -200.76434326171875, -196.03189086914062, -191.29945373535156, -186.5670166015625, -181.83457946777344, -177.10214233398438, -172.3697052001953, -167.63726806640625, -162.9048309326172, -158.17239379882812, -153.43994140625, -148.70750427246094, -143.97506713867188, -139.2426300048828, -134.51019287109375, -129.7777557373047, -125.0453109741211, -120.31287384033203, -115.58045196533203, -110.84801483154297, -106.1155776977539, -101.38314056396484, -96.65069580078125, -91.91825866699219, -87.18582153320312, -82.45338439941406, -77.720947265625, -72.98851013183594, -68.25607299804688, -63.52363204956055, -58.791194915771484, -54.05875778198242, -49.326316833496094, -44.59387969970703, -39.86144256591797, -35.129005432128906, -30.39656639099121, -25.664127349853516, -20.931690216064453, -16.19925308227539, -11.466814041137695, -6.734375, -2.0019378662109375, 2.7305002212524414, 7.46293830871582, 12.1953763961792, 16.927814483642578, 21.66025161743164, 26.392690658569336, 31.12512969970703, 35.857566833496094]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 11.0, 7.0, 7.0, 14.0, 17.0, 17.0, 27.0, 18.0, 14.0, 29.0, 25.0, 26.0, 29.0, 39.0, 36.0, 29.0, 30.0, 47.0, 38.0, 33.0, 45.0, 32.0, 38.0, 38.0, 37.0, 39.0, 38.0, 32.0, 31.0, 26.0, 23.0, 24.0, 17.0, 13.0, 11.0, 13.0, 6.0, 9.0, 9.0, 3.0, 2.0, 5.0, 4.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.434974670410156, -35.29469680786133, -34.154422760009766, -33.01414489746094, -31.873868942260742, -30.733592987060547, -29.59331512451172, -28.453039169311523, -27.312763214111328, -26.172487258911133, -25.032211303710938, -23.89193344116211, -22.751657485961914, -21.61138153076172, -20.47110366821289, -19.330827713012695, -18.1905517578125, -17.050275802612305, -15.909998893737793, -14.769721984863281, -13.629446029663086, -12.48917007446289, -11.348893165588379, -10.208616256713867, -9.068340301513672, -7.928063869476318, -6.787787437438965, -5.647511005401611, -4.507234573364258, -3.3669581413269043, -2.226681709289551, -1.0864052772521973, 0.053867340087890625, 1.1941437721252441, 2.3344202041625977, 3.474696636199951, 4.614973068237305, 5.755249500274658, 6.895525932312012, 8.035802841186523, 9.176078796386719, 10.316354751586914, 11.456631660461426, 12.596908569335938, 13.737184524536133, 14.877460479736328, 16.017738342285156, 17.15801429748535, 18.298290252685547, 19.438566207885742, 20.578842163085938, 21.719120025634766, 22.85939598083496, 23.999671936035156, 25.139949798583984, 26.28022575378418, 27.420501708984375, 28.56077766418457, 29.701053619384766, 30.841331481933594, 31.98160743713379, 33.121883392333984, 34.26216125488281, 35.402435302734375, 36.5427131652832]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 8.0, 7.0, 14.0, 20.0, 14.0, 16.0, 26.0, 18.0, 24.0, 19.0, 22.0, 33.0, 36.0, 39.0, 43.0, 41.0, 38.0, 35.0, 44.0, 38.0, 37.0, 36.0, 30.0, 28.0, 31.0, 32.0, 37.0, 25.0, 16.0, 22.0, 16.0, 21.0, 18.0, 26.0, 14.0, 14.0, 6.0, 8.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.6571044921875, -4.505615234375, -4.3541259765625, -4.20263671875, -4.0511474609375, -3.899658203125, -3.7481689453125, -3.5966796875, -3.4451904296875, -3.293701171875, -3.1422119140625, -2.99072265625, -2.8392333984375, -2.687744140625, -2.5362548828125, -2.384765625, -2.2332763671875, -2.081787109375, -1.9302978515625, -1.77880859375, -1.6273193359375, -1.475830078125, -1.3243408203125, -1.1728515625, -1.0213623046875, -0.869873046875, -0.7183837890625, -0.56689453125, -0.4154052734375, -0.263916015625, -0.1124267578125, 0.0390625, 0.1905517578125, 0.342041015625, 0.4935302734375, 0.64501953125, 0.7965087890625, 0.947998046875, 1.0994873046875, 1.2509765625, 1.4024658203125, 1.553955078125, 1.7054443359375, 1.85693359375, 2.0084228515625, 2.159912109375, 2.3114013671875, 2.462890625, 2.6143798828125, 2.765869140625, 2.9173583984375, 3.06884765625, 3.2203369140625, 3.371826171875, 3.5233154296875, 3.6748046875, 3.8262939453125, 3.977783203125, 4.1292724609375, 4.28076171875, 4.4322509765625, 4.583740234375, 4.7352294921875, 4.88671875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 4.0, 4.0, 2.0, 3.0, 3.0, 5.0, 12.0, 14.0, 13.0, 21.0, 34.0, 26.0, 34.0, 46.0, 56.0, 77.0, 118.0, 223.0, 430.0, 1611.0, 10394.0, 107764.0, 1132988.0, 2448448.0, 446867.0, 38781.0, 4509.0, 880.0, 346.0, 149.0, 94.0, 59.0, 48.0, 46.0, 33.0, 26.0, 23.0, 31.0, 14.0, 11.0, 7.0, 6.0, 4.0, 4.0, 7.0, 1.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.2415771484375, -11.850341796875, -11.4591064453125, -11.06787109375, -10.6766357421875, -10.285400390625, -9.8941650390625, -9.5029296875, -9.1116943359375, -8.720458984375, -8.3292236328125, -7.93798828125, -7.5467529296875, -7.155517578125, -6.7642822265625, -6.373046875, -5.9818115234375, -5.590576171875, -5.1993408203125, -4.80810546875, -4.4168701171875, -4.025634765625, -3.6343994140625, -3.2431640625, -2.8519287109375, -2.460693359375, -2.0694580078125, -1.67822265625, -1.2869873046875, -0.895751953125, -0.5045166015625, -0.11328125, 0.2779541015625, 0.669189453125, 1.0604248046875, 1.45166015625, 1.8428955078125, 2.234130859375, 2.6253662109375, 3.0166015625, 3.4078369140625, 3.799072265625, 4.1903076171875, 4.58154296875, 4.9727783203125, 5.364013671875, 5.7552490234375, 6.146484375, 6.5377197265625, 6.928955078125, 7.3201904296875, 7.71142578125, 8.1026611328125, 8.493896484375, 8.8851318359375, 9.2763671875, 9.6676025390625, 10.058837890625, 10.4500732421875, 10.84130859375, 11.2325439453125, 11.623779296875, 12.0150146484375, 12.40625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 7.0, 8.0, 15.0, 18.0, 32.0, 33.0, 42.0, 51.0, 95.0, 125.0, 191.0, 269.0, 369.0, 453.0, 520.0, 475.0, 408.0, 295.0, 208.0, 150.0, 100.0, 56.0, 41.0, 36.0, 25.0, 9.0, 8.0, 11.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.703125, -8.3359375, -7.96875, -7.6015625, -7.234375, -6.8671875, -6.5, -6.1328125, -5.765625, -5.3984375, -5.03125, -4.6640625, -4.296875, -3.9296875, -3.5625, -3.1953125, -2.828125, -2.4609375, -2.09375, -1.7265625, -1.359375, -0.9921875, -0.625, -0.2578125, 0.109375, 0.4765625, 0.84375, 1.2109375, 1.578125, 1.9453125, 2.3125, 2.6796875, 3.046875, 3.4140625, 3.78125, 4.1484375, 4.515625, 4.8828125, 5.25, 5.6171875, 5.984375, 6.3515625, 6.71875, 7.0859375, 7.453125, 7.8203125, 8.1875, 8.5546875, 8.921875, 9.2890625, 9.65625, 10.0234375, 10.390625, 10.7578125, 11.125, 11.4921875, 11.859375, 12.2265625, 12.59375, 12.9609375, 13.328125, 13.6953125, 14.0625, 14.4296875, 14.796875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 0.0, 7.0, 9.0, 10.0, 12.0, 17.0, 31.0, 40.0, 53.0, 81.0, 140.0, 207.0, 385.0, 765.0, 16533.0, 4120184.0, 53708.0, 929.0, 440.0, 251.0, 147.0, 108.0, 50.0, 40.0, 49.0, 22.0, 18.0, 18.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-81.8125, -79.8447265625, -77.876953125, -75.9091796875, -73.94140625, -71.9736328125, -70.005859375, -68.0380859375, -66.0703125, -64.1025390625, -62.134765625, -60.1669921875, -58.19921875, -56.2314453125, -54.263671875, -52.2958984375, -50.328125, -48.3603515625, -46.392578125, -44.4248046875, -42.45703125, -40.4892578125, -38.521484375, -36.5537109375, -34.5859375, -32.6181640625, -30.650390625, -28.6826171875, -26.71484375, -24.7470703125, -22.779296875, -20.8115234375, -18.84375, -16.8759765625, -14.908203125, -12.9404296875, -10.97265625, -9.0048828125, -7.037109375, -5.0693359375, -3.1015625, -1.1337890625, 0.833984375, 2.8017578125, 4.76953125, 6.7373046875, 8.705078125, 10.6728515625, 12.640625, 14.6083984375, 16.576171875, 18.5439453125, 20.51171875, 22.4794921875, 24.447265625, 26.4150390625, 28.3828125, 30.3505859375, 32.318359375, 34.2861328125, 36.25390625, 38.2216796875, 40.189453125, 42.1572265625, 44.125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 19.0, 155.0, 367.0, 343.0, 117.0, 12.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.86396026611328, -34.873046875, -29.882137298583984, -24.891225814819336, -19.900314331054688, -14.909402847290039, -9.91849136352539, -4.927581787109375, 0.06333160400390625, 5.054243087768555, 10.045154571533203, 15.036066055297852, 20.0269775390625, 25.01788902282715, 30.008800506591797, 34.99971008300781, 39.990623474121094, 44.981536865234375, 49.97244644165039, 54.963356018066406, 59.95426940917969, 64.94518280029297, 69.93609619140625, 74.927001953125, 79.91791534423828, 84.90882873535156, 89.89973449707031, 94.8906478881836, 99.88156127929688, 104.87247467041016, 109.86338806152344, 114.85429382324219, 119.84521484375, 124.83612823486328, 129.82704162597656, 134.8179473876953, 139.80886840820312, 144.79977416992188, 149.79067993164062, 154.78158569335938, 159.7725067138672, 164.76341247558594, 169.75433349609375, 174.7452392578125, 179.73614501953125, 184.72706604003906, 189.7179718017578, 194.70889282226562, 199.69979858398438, 204.69070434570312, 209.68162536621094, 214.6725311279297, 219.6634521484375, 224.65435791015625, 229.645263671875, 234.63616943359375, 239.62709045410156, 244.6179962158203, 249.60891723632812, 254.59982299804688, 259.5907287597656, 264.5816345214844, 269.57257080078125, 274.5634765625, 279.55438232421875]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 6.0, 7.0, 10.0, 15.0, 19.0, 12.0, 22.0, 17.0, 27.0, 24.0, 32.0, 20.0, 39.0, 35.0, 41.0, 61.0, 35.0, 43.0, 45.0, 38.0, 29.0, 38.0, 43.0, 50.0, 36.0, 33.0, 40.0, 25.0, 25.0, 17.0, 19.0, 19.0, 18.0, 9.0, 10.0, 11.0, 8.0, 4.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.388992309570312, -30.321237564086914, -29.253482818603516, -28.18572998046875, -27.11797523498535, -26.050220489501953, -24.982465744018555, -23.914710998535156, -22.84695816040039, -21.779203414916992, -20.711448669433594, -19.643695831298828, -18.57594108581543, -17.50818634033203, -16.440431594848633, -15.372676849365234, -14.304922103881836, -13.237167358398438, -12.169413566589355, -11.101658821105957, -10.033905029296875, -8.966150283813477, -7.898395538330078, -6.830641269683838, -5.762887001037598, -4.695132732391357, -3.627378225326538, -2.5596237182617188, -1.4918694496154785, -0.4241151809692383, 0.6436395645141602, 1.7113938331604004, 2.7791481018066406, 3.846902370452881, 4.914656639099121, 5.9824113845825195, 7.05016565322876, 8.117919921875, 9.185674667358398, 10.253429412841797, 11.321183204650879, 12.388937950134277, 13.45669174194336, 14.524446487426758, 15.592201232910156, 16.659954071044922, 17.727710723876953, 18.79546356201172, 19.863218307495117, 20.930973052978516, 21.998727798461914, 23.066482543945312, 24.134235382080078, 25.201990127563477, 26.269744873046875, 27.337499618530273, 28.405254364013672, 29.47300910949707, 30.54076385498047, 31.608516693115234, 32.676273345947266, 33.74402618408203, 34.81178283691406, 35.87953567504883, 36.947288513183594]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 6.0, 14.0, 16.0, 11.0, 16.0, 11.0, 13.0, 20.0, 20.0, 22.0, 23.0, 27.0, 28.0, 32.0, 22.0, 32.0, 49.0, 39.0, 38.0, 37.0, 45.0, 40.0, 45.0, 41.0, 47.0, 25.0, 29.0, 24.0, 16.0, 24.0, 29.0, 20.0, 16.0, 22.0, 11.0, 9.0, 15.0, 12.0, 9.0, 7.0, 7.0, 2.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.8359375, -4.68865966796875, -4.5413818359375, -4.39410400390625, -4.246826171875, -4.09954833984375, -3.9522705078125, -3.80499267578125, -3.65771484375, -3.51043701171875, -3.3631591796875, -3.21588134765625, -3.068603515625, -2.92132568359375, -2.7740478515625, -2.62677001953125, -2.4794921875, -2.33221435546875, -2.1849365234375, -2.03765869140625, -1.890380859375, -1.74310302734375, -1.5958251953125, -1.44854736328125, -1.30126953125, -1.15399169921875, -1.0067138671875, -0.85943603515625, -0.712158203125, -0.56488037109375, -0.4176025390625, -0.27032470703125, -0.123046875, 0.02423095703125, 0.1715087890625, 0.31878662109375, 0.466064453125, 0.61334228515625, 0.7606201171875, 0.90789794921875, 1.05517578125, 1.20245361328125, 1.3497314453125, 1.49700927734375, 1.644287109375, 1.79156494140625, 1.9388427734375, 2.08612060546875, 2.2333984375, 2.38067626953125, 2.5279541015625, 2.67523193359375, 2.822509765625, 2.96978759765625, 3.1170654296875, 3.26434326171875, 3.41162109375, 3.55889892578125, 3.7061767578125, 3.85345458984375, 4.000732421875, 4.14801025390625, 4.2952880859375, 4.44256591796875, 4.58984375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 15.0, 22.0, 26.0, 39.0, 51.0, 67.0, 118.0, 185.0, 256.0, 299.0, 497.0, 718.0, 1100.0, 1573.0, 2317.0, 3372.0, 5015.0, 7128.0, 10706.0, 16244.0, 23594.0, 34790.0, 50744.0, 72624.0, 101667.0, 132968.0, 148450.0, 126208.0, 95017.0, 67091.0, 46727.0, 31612.0, 21486.0, 14796.0, 10002.0, 6747.0, 4478.0, 3127.0, 2144.0, 1443.0, 1001.0, 660.0, 417.0, 316.0, 205.0, 159.0, 95.0, 81.0, 50.0, 29.0, 27.0, 19.0, 11.0, 9.0, 6.0, 2.0, 2.0, 2.0], "bins": [-0.347412109375, -0.3366851806640625, -0.325958251953125, -0.3152313232421875, -0.30450439453125, -0.2937774658203125, -0.283050537109375, -0.2723236083984375, -0.2615966796875, -0.2508697509765625, -0.240142822265625, -0.2294158935546875, -0.21868896484375, -0.2079620361328125, -0.197235107421875, -0.1865081787109375, -0.17578125, -0.1650543212890625, -0.154327392578125, -0.1436004638671875, -0.13287353515625, -0.1221466064453125, -0.111419677734375, -0.1006927490234375, -0.0899658203125, -0.0792388916015625, -0.068511962890625, -0.0577850341796875, -0.04705810546875, -0.0363311767578125, -0.025604248046875, -0.0148773193359375, -0.004150390625, 0.0065765380859375, 0.017303466796875, 0.0280303955078125, 0.03875732421875, 0.0494842529296875, 0.060211181640625, 0.0709381103515625, 0.0816650390625, 0.0923919677734375, 0.103118896484375, 0.1138458251953125, 0.12457275390625, 0.1352996826171875, 0.146026611328125, 0.1567535400390625, 0.16748046875, 0.1782073974609375, 0.188934326171875, 0.1996612548828125, 0.21038818359375, 0.2211151123046875, 0.231842041015625, 0.2425689697265625, 0.2532958984375, 0.2640228271484375, 0.274749755859375, 0.2854766845703125, 0.29620361328125, 0.3069305419921875, 0.317657470703125, 0.3283843994140625, 0.339111328125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 3.0, 4.0, 2.0, 9.0, 7.0, 13.0, 10.0, 11.0, 12.0, 12.0, 9.0, 22.0, 15.0, 15.0, 32.0, 24.0, 26.0, 32.0, 33.0, 38.0, 34.0, 30.0, 28.0, 36.0, 42.0, 1055.0, 34.0, 34.0, 35.0, 36.0, 33.0, 35.0, 31.0, 27.0, 26.0, 19.0, 20.0, 22.0, 14.0, 17.0, 15.0, 6.0, 10.0, 10.0, 8.0, 8.0, 9.0, 10.0, 7.0, 3.0, 6.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.453125, -2.36700439453125, -2.2808837890625, -2.19476318359375, -2.108642578125, -2.02252197265625, -1.9364013671875, -1.85028076171875, -1.76416015625, -1.67803955078125, -1.5919189453125, -1.50579833984375, -1.419677734375, -1.33355712890625, -1.2474365234375, -1.16131591796875, -1.0751953125, -0.98907470703125, -0.9029541015625, -0.81683349609375, -0.730712890625, -0.64459228515625, -0.5584716796875, -0.47235107421875, -0.38623046875, -0.30010986328125, -0.2139892578125, -0.12786865234375, -0.041748046875, 0.04437255859375, 0.1304931640625, 0.21661376953125, 0.302734375, 0.38885498046875, 0.4749755859375, 0.56109619140625, 0.647216796875, 0.73333740234375, 0.8194580078125, 0.90557861328125, 0.99169921875, 1.07781982421875, 1.1639404296875, 1.25006103515625, 1.336181640625, 1.42230224609375, 1.5084228515625, 1.59454345703125, 1.6806640625, 1.76678466796875, 1.8529052734375, 1.93902587890625, 2.025146484375, 2.11126708984375, 2.1973876953125, 2.28350830078125, 2.36962890625, 2.45574951171875, 2.5418701171875, 2.62799072265625, 2.714111328125, 2.80023193359375, 2.8863525390625, 2.97247314453125, 3.05859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 13.0, 17.0, 34.0, 38.0, 63.0, 85.0, 142.0, 184.0, 281.0, 415.0, 585.0, 865.0, 1390.0, 2061.0, 3161.0, 4739.0, 7445.0, 11199.0, 16694.0, 25251.0, 37355.0, 53612.0, 75041.0, 100445.0, 131180.0, 1168123.0, 125866.0, 98017.0, 73247.0, 51856.0, 35979.0, 24444.0, 16279.0, 10905.0, 6905.0, 4549.0, 2886.0, 1869.0, 1323.0, 794.0, 559.0, 405.0, 266.0, 162.0, 112.0, 77.0, 75.0, 47.0, 29.0, 17.0, 13.0, 15.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.237060546875, -0.22975540161132812, -0.22245025634765625, -0.21514511108398438, -0.2078399658203125, -0.20053482055664062, -0.19322967529296875, -0.18592453002929688, -0.178619384765625, -0.17131423950195312, -0.16400909423828125, -0.15670394897460938, -0.1493988037109375, -0.14209365844726562, -0.13478851318359375, -0.12748336791992188, -0.12017822265625, -0.11287307739257812, -0.10556793212890625, -0.09826278686523438, -0.0909576416015625, -0.08365249633789062, -0.07634735107421875, -0.06904220581054688, -0.061737060546875, -0.054431915283203125, -0.04712677001953125, -0.039821624755859375, -0.0325164794921875, -0.025211334228515625, -0.01790618896484375, -0.010601043701171875, -0.0032958984375, 0.004009246826171875, 0.01131439208984375, 0.018619537353515625, 0.0259246826171875, 0.033229827880859375, 0.04053497314453125, 0.047840118408203125, 0.055145263671875, 0.062450408935546875, 0.06975555419921875, 0.07706069946289062, 0.0843658447265625, 0.09167098999023438, 0.09897613525390625, 0.10628128051757812, 0.11358642578125, 0.12089157104492188, 0.12819671630859375, 0.13550186157226562, 0.1428070068359375, 0.15011215209960938, 0.15741729736328125, 0.16472244262695312, 0.172027587890625, 0.17933273315429688, 0.18663787841796875, 0.19394302368164062, 0.2012481689453125, 0.20855331420898438, 0.21585845947265625, 0.22316360473632812, 0.23046875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 5.0, 7.0, 6.0, 8.0, 10.0, 13.0, 20.0, 26.0, 30.0, 30.0, 40.0, 40.0, 63.0, 94.0, 96.0, 112.0, 83.0, 53.0, 47.0, 43.0, 32.0, 23.0, 24.0, 21.0, 9.0, 5.0, 7.0, 10.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01488494873046875, -0.01440417766571045, -0.013923406600952148, -0.013442635536193848, -0.012961864471435547, -0.012481093406677246, -0.012000322341918945, -0.011519551277160645, -0.011038780212402344, -0.010558009147644043, -0.010077238082885742, -0.009596467018127441, -0.00911569595336914, -0.00863492488861084, -0.008154153823852539, -0.007673382759094238, -0.0071926116943359375, -0.006711840629577637, -0.006231069564819336, -0.005750298500061035, -0.005269527435302734, -0.004788756370544434, -0.004307985305786133, -0.003827214241027832, -0.0033464431762695312, -0.0028656721115112305, -0.0023849010467529297, -0.001904129981994629, -0.0014233589172363281, -0.0009425878524780273, -0.00046181678771972656, 1.895427703857422e-05, 0.000499725341796875, 0.0009804964065551758, 0.0014612674713134766, 0.0019420385360717773, 0.002422809600830078, 0.002903580665588379, 0.0033843517303466797, 0.0038651227951049805, 0.004345893859863281, 0.004826664924621582, 0.005307435989379883, 0.005788207054138184, 0.006268978118896484, 0.006749749183654785, 0.007230520248413086, 0.007711291313171387, 0.008192062377929688, 0.008672833442687988, 0.009153604507446289, 0.00963437557220459, 0.01011514663696289, 0.010595917701721191, 0.011076688766479492, 0.011557459831237793, 0.012038230895996094, 0.012519001960754395, 0.012999773025512695, 0.013480544090270996, 0.013961315155029297, 0.014442086219787598, 0.014922857284545898, 0.0154036283493042, 0.0158843994140625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 10.0, 11.0, 11.0, 13.0, 32.0, 30.0, 47.0, 60.0, 125.0, 181.0, 385.0, 1997.0, 161849.0, 877894.0, 4736.0, 507.0, 207.0, 115.0, 75.0, 54.0, 42.0, 43.0, 17.0, 17.0, 14.0, 7.0, 8.0, 7.0, 6.0, 6.0, 7.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.329833984375, -0.31987762451171875, -0.3099212646484375, -0.29996490478515625, -0.290008544921875, -0.28005218505859375, -0.2700958251953125, -0.26013946533203125, -0.25018310546875, -0.24022674560546875, -0.2302703857421875, -0.22031402587890625, -0.210357666015625, -0.20040130615234375, -0.1904449462890625, -0.18048858642578125, -0.1705322265625, -0.16057586669921875, -0.1506195068359375, -0.14066314697265625, -0.130706787109375, -0.12075042724609375, -0.1107940673828125, -0.10083770751953125, -0.09088134765625, -0.08092498779296875, -0.0709686279296875, -0.06101226806640625, -0.051055908203125, -0.04109954833984375, -0.0311431884765625, -0.02118682861328125, -0.01123046875, -0.00127410888671875, 0.0086822509765625, 0.01863861083984375, 0.028594970703125, 0.03855133056640625, 0.0485076904296875, 0.05846405029296875, 0.06842041015625, 0.07837677001953125, 0.0883331298828125, 0.09828948974609375, 0.108245849609375, 0.11820220947265625, 0.1281585693359375, 0.13811492919921875, 0.1480712890625, 0.15802764892578125, 0.1679840087890625, 0.17794036865234375, 0.187896728515625, 0.19785308837890625, 0.2078094482421875, 0.21776580810546875, 0.22772216796875, 0.23767852783203125, 0.2476348876953125, 0.25759124755859375, 0.267547607421875, 0.27750396728515625, 0.2874603271484375, 0.29741668701171875, 0.307373046875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 29.0, 260.0, 607.0, 83.0, 26.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19324229657649994, -0.1885472536087036, -0.1838522106409073, -0.17915716767311096, -0.17446212470531464, -0.1697670817375183, -0.16507203876972198, -0.16037699580192566, -0.15568193793296814, -0.15098689496517181, -0.1462918519973755, -0.14159680902957916, -0.13690176606178284, -0.1322067230939865, -0.12751168012619019, -0.12281662970781326, -0.11812159419059753, -0.11342655122280121, -0.10873150825500488, -0.10403646528720856, -0.09934142231941223, -0.0946463793516159, -0.08995132893323898, -0.08525628596544266, -0.08056124299764633, -0.07586620002985, -0.07117115706205368, -0.06647611409425735, -0.06178106740117073, -0.057086024433374405, -0.05239097774028778, -0.047695934772491455, -0.043000876903533936, -0.03830583393573761, -0.033610790967941284, -0.02891574427485466, -0.024220701307058334, -0.01952565833926201, -0.014830613508820534, -0.010135568678379059, -0.005440525710582733, -0.0007454818114638329, 0.0039495620876550674, 0.008644605986773968, 0.013339649885892868, 0.018034692853689194, 0.02272973768413067, 0.027424782514572144, 0.03211982548236847, 0.036814868450164795, 0.04150991141796112, 0.046204958111047745, 0.05090000107884407, 0.055595044046640396, 0.06029009073972702, 0.06498513370752335, 0.06968017667531967, 0.074375219643116, 0.07907026261091232, 0.08376530557870865, 0.08846035599708557, 0.0931553989648819, 0.09785044193267822, 0.10254548490047455, 0.10724052786827087]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 3.0, 3.0, 6.0, 5.0, 2.0, 9.0, 8.0, 14.0, 10.0, 19.0, 12.0, 25.0, 25.0, 31.0, 31.0, 26.0, 30.0, 34.0, 19.0, 39.0, 45.0, 35.0, 34.0, 47.0, 37.0, 44.0, 35.0, 32.0, 36.0, 25.0, 26.0, 27.0, 27.0, 27.0, 22.0, 32.0, 19.0, 12.0, 17.0, 13.0, 12.0, 20.0, 2.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.019198596477508545, -0.018639346584677696, -0.018080096691846848, -0.017520846799016, -0.01696159690618515, -0.0164023470133543, -0.015843097120523453, -0.015283847227692604, -0.014724597334861755, -0.014165347442030907, -0.013606097549200058, -0.01304684765636921, -0.01248759776353836, -0.011928347870707512, -0.011369097977876663, -0.010809848085045815, -0.010250598192214966, -0.009691348299384117, -0.009132098406553268, -0.00857284851372242, -0.008013598620891571, -0.007454348728060722, -0.006895098835229874, -0.006335848942399025, -0.005776599049568176, -0.005217349156737328, -0.004658099263906479, -0.00409884937107563, -0.0035395994782447815, -0.002980349585413933, -0.002421099692583084, -0.0018618497997522354, -0.0013025999069213867, -0.000743350014090538, -0.00018410012125968933, 0.00037514977157115936, 0.0009343996644020081, 0.0014936495572328568, 0.0020528994500637054, 0.002612149342894554, 0.003171399235725403, 0.0037306491285562515, 0.0042898990213871, 0.004849148914217949, 0.005408398807048798, 0.005967648699879646, 0.006526898592710495, 0.007086148485541344, 0.007645398378372192, 0.008204648271203041, 0.00876389816403389, 0.009323148056864738, 0.009882397949695587, 0.010441647842526436, 0.011000897735357285, 0.011560147628188133, 0.012119397521018982, 0.01267864741384983, 0.01323789730668068, 0.013797147199511528, 0.014356397092342377, 0.014915646985173225, 0.015474896878004074, 0.016034146770834923, 0.01659339666366577]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 6.0, 14.0, 15.0, 12.0, 16.0, 11.0, 13.0, 19.0, 21.0, 22.0, 22.0, 26.0, 30.0, 30.0, 24.0, 31.0, 50.0, 38.0, 39.0, 37.0, 45.0, 40.0, 45.0, 41.0, 46.0, 26.0, 28.0, 25.0, 16.0, 24.0, 29.0, 20.0, 16.0, 22.0, 11.0, 9.0, 15.0, 12.0, 9.0, 7.0, 7.0, 2.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.83984375, -4.6925048828125, -4.545166015625, -4.3978271484375, -4.25048828125, -4.1031494140625, -3.955810546875, -3.8084716796875, -3.6611328125, -3.5137939453125, -3.366455078125, -3.2191162109375, -3.07177734375, -2.9244384765625, -2.777099609375, -2.6297607421875, -2.482421875, -2.3350830078125, -2.187744140625, -2.0404052734375, -1.89306640625, -1.7457275390625, -1.598388671875, -1.4510498046875, -1.3037109375, -1.1563720703125, -1.009033203125, -0.8616943359375, -0.71435546875, -0.5670166015625, -0.419677734375, -0.2723388671875, -0.125, 0.0223388671875, 0.169677734375, 0.3170166015625, 0.46435546875, 0.6116943359375, 0.759033203125, 0.9063720703125, 1.0537109375, 1.2010498046875, 1.348388671875, 1.4957275390625, 1.64306640625, 1.7904052734375, 1.937744140625, 2.0850830078125, 2.232421875, 2.3797607421875, 2.527099609375, 2.6744384765625, 2.82177734375, 2.9691162109375, 3.116455078125, 3.2637939453125, 3.4111328125, 3.5584716796875, 3.705810546875, 3.8531494140625, 4.00048828125, 4.1478271484375, 4.295166015625, 4.4425048828125, 4.58984375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 19.0, 21.0, 20.0, 22.0, 34.0, 36.0, 59.0, 64.0, 114.0, 156.0, 340.0, 712.0, 1736.0, 5184.0, 16146.0, 51309.0, 196516.0, 561880.0, 151657.0, 42035.0, 13334.0, 4235.0, 1429.0, 610.0, 292.0, 162.0, 116.0, 67.0, 53.0, 31.0, 21.0, 23.0, 20.0, 20.0, 15.0, 11.0, 6.0, 4.0, 11.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-10.421875, -10.1099853515625, -9.798095703125, -9.4862060546875, -9.17431640625, -8.8624267578125, -8.550537109375, -8.2386474609375, -7.9267578125, -7.6148681640625, -7.302978515625, -6.9910888671875, -6.67919921875, -6.3673095703125, -6.055419921875, -5.7435302734375, -5.431640625, -5.1197509765625, -4.807861328125, -4.4959716796875, -4.18408203125, -3.8721923828125, -3.560302734375, -3.2484130859375, -2.9365234375, -2.6246337890625, -2.312744140625, -2.0008544921875, -1.68896484375, -1.3770751953125, -1.065185546875, -0.7532958984375, -0.44140625, -0.1295166015625, 0.182373046875, 0.4942626953125, 0.80615234375, 1.1180419921875, 1.429931640625, 1.7418212890625, 2.0537109375, 2.3656005859375, 2.677490234375, 2.9893798828125, 3.30126953125, 3.6131591796875, 3.925048828125, 4.2369384765625, 4.548828125, 4.8607177734375, 5.172607421875, 5.4844970703125, 5.79638671875, 6.1082763671875, 6.420166015625, 6.7320556640625, 7.0439453125, 7.3558349609375, 7.667724609375, 7.9796142578125, 8.29150390625, 8.6033935546875, 8.915283203125, 9.2271728515625, 9.5390625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 3.0, 6.0, 10.0, 13.0, 15.0, 16.0, 20.0, 27.0, 37.0, 26.0, 36.0, 38.0, 44.0, 61.0, 107.0, 195.0, 1464.0, 323.0, 141.0, 83.0, 50.0, 55.0, 50.0, 36.0, 32.0, 29.0, 17.0, 17.0, 23.0, 20.0, 8.0, 7.0, 4.0, 7.0, 7.0, 2.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.328857421875, -15.72021484375, -15.111572265625, -14.5029296875, -13.894287109375, -13.28564453125, -12.677001953125, -12.068359375, -11.459716796875, -10.85107421875, -10.242431640625, -9.6337890625, -9.025146484375, -8.41650390625, -7.807861328125, -7.19921875, -6.590576171875, -5.98193359375, -5.373291015625, -4.7646484375, -4.156005859375, -3.54736328125, -2.938720703125, -2.330078125, -1.721435546875, -1.11279296875, -0.504150390625, 0.1044921875, 0.713134765625, 1.32177734375, 1.930419921875, 2.5390625, 3.147705078125, 3.75634765625, 4.364990234375, 4.9736328125, 5.582275390625, 6.19091796875, 6.799560546875, 7.408203125, 8.016845703125, 8.62548828125, 9.234130859375, 9.8427734375, 10.451416015625, 11.06005859375, 11.668701171875, 12.27734375, 12.885986328125, 13.49462890625, 14.103271484375, 14.7119140625, 15.320556640625, 15.92919921875, 16.537841796875, 17.146484375, 17.755126953125, 18.36376953125, 18.972412109375, 19.5810546875, 20.189697265625, 20.79833984375, 21.406982421875, 22.015625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 3.0, 7.0, 5.0, 18.0, 12.0, 21.0, 26.0, 28.0, 30.0, 39.0, 59.0, 69.0, 101.0, 126.0, 228.0, 408.0, 1085.0, 14575.0, 3045523.0, 80184.0, 1743.0, 540.0, 282.0, 149.0, 111.0, 71.0, 51.0, 52.0, 30.0, 28.0, 20.0, 18.0, 11.0, 10.0, 6.0, 11.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.6875, -58.9853515625, -57.283203125, -55.5810546875, -53.87890625, -52.1767578125, -50.474609375, -48.7724609375, -47.0703125, -45.3681640625, -43.666015625, -41.9638671875, -40.26171875, -38.5595703125, -36.857421875, -35.1552734375, -33.453125, -31.7509765625, -30.048828125, -28.3466796875, -26.64453125, -24.9423828125, -23.240234375, -21.5380859375, -19.8359375, -18.1337890625, -16.431640625, -14.7294921875, -13.02734375, -11.3251953125, -9.623046875, -7.9208984375, -6.21875, -4.5166015625, -2.814453125, -1.1123046875, 0.58984375, 2.2919921875, 3.994140625, 5.6962890625, 7.3984375, 9.1005859375, 10.802734375, 12.5048828125, 14.20703125, 15.9091796875, 17.611328125, 19.3134765625, 21.015625, 22.7177734375, 24.419921875, 26.1220703125, 27.82421875, 29.5263671875, 31.228515625, 32.9306640625, 34.6328125, 36.3349609375, 38.037109375, 39.7392578125, 41.44140625, 43.1435546875, 44.845703125, 46.5478515625, 48.25]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 2.0, 6.0, 12.0, 12.0, 31.0, 41.0, 47.0, 80.0, 84.0, 105.0, 107.0, 98.0, 79.0, 92.0, 52.0, 49.0, 46.0, 25.0, 15.0, 13.0, 2.0, 8.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.501716613769531, -10.852889060974121, -10.204061508178711, -9.555233001708984, -8.906405448913574, -8.257577896118164, -7.608749866485596, -6.959921836853027, -6.311094284057617, -5.662266731262207, -5.013438701629639, -4.36461067199707, -3.71578311920166, -3.066955327987671, -2.4181275367736816, -1.7692995071411133, -1.1204719543457031, -0.47164416313171387, 0.1771836280822754, 0.8260114192962646, 1.474839210510254, 2.123667001724243, 2.7724947929382324, 3.421322822570801, 4.070150375366211, 4.718977928161621, 5.3678059577941895, 6.016633987426758, 6.665461540222168, 7.314289093017578, 7.9631171226501465, 8.611945152282715, 9.260772705078125, 9.909600257873535, 10.558427810668945, 11.207256317138672, 11.856083869934082, 12.504911422729492, 13.153739929199219, 13.802567481994629, 14.451395034790039, 15.10022258758545, 15.74905014038086, 16.397878646850586, 17.046707153320312, 17.695533752441406, 18.344362258911133, 18.99319076538086, 19.642017364501953, 20.29084587097168, 20.939672470092773, 21.5885009765625, 22.237327575683594, 22.88615608215332, 23.534984588623047, 24.18381118774414, 24.832639694213867, 25.481468200683594, 26.130294799804688, 26.779123306274414, 27.42795181274414, 28.076778411865234, 28.72560691833496, 29.374435424804688, 30.02326202392578]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 8.0, 11.0, 13.0, 12.0, 19.0, 12.0, 23.0, 25.0, 28.0, 44.0, 36.0, 40.0, 44.0, 44.0, 48.0, 47.0, 44.0, 55.0, 39.0, 50.0, 45.0, 37.0, 34.0, 31.0, 34.0, 30.0, 25.0, 31.0, 17.0, 20.0, 15.0, 8.0, 8.0, 6.0, 2.0, 10.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-67.97822570800781, -66.26310729980469, -64.54798889160156, -62.83287048339844, -61.11775207519531, -59.40263366699219, -57.68751525878906, -55.97239685058594, -54.25727844238281, -52.54216003417969, -50.82704162597656, -49.11192321777344, -47.39680480957031, -45.68168640136719, -43.96656799316406, -42.25144958496094, -40.53633499145508, -38.82121658325195, -37.10609817504883, -35.3909797668457, -33.67586135864258, -31.960742950439453, -30.24562644958496, -28.530508041381836, -26.81538963317871, -25.100271224975586, -23.38515281677246, -21.67003631591797, -19.954917907714844, -18.23979949951172, -16.524681091308594, -14.809562683105469, -13.09444808959961, -11.379329681396484, -9.66421127319336, -7.949093818664551, -6.233975410461426, -4.518857002258301, -2.803739547729492, -1.0886211395263672, 0.6264972686767578, 2.3416154384613037, 4.05673360824585, 5.771851539611816, 7.486969947814941, 9.202088356018066, 10.917205810546875, 12.63232421875, 14.347442626953125, 16.06256103515625, 17.777679443359375, 19.4927978515625, 21.207916259765625, 22.92303466796875, 24.638151168823242, 26.353269577026367, 28.068387985229492, 29.783506393432617, 31.498624801635742, 33.213741302490234, 34.92885971069336, 36.643978118896484, 38.35909652709961, 40.074214935302734, 41.78933334350586]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 8.0, 6.0, 8.0, 9.0, 13.0, 17.0, 10.0, 25.0, 13.0, 23.0, 25.0, 34.0, 25.0, 26.0, 23.0, 35.0, 42.0, 35.0, 41.0, 35.0, 48.0, 48.0, 41.0, 43.0, 41.0, 30.0, 33.0, 29.0, 29.0, 28.0, 21.0, 22.0, 23.0, 15.0, 9.0, 15.0, 12.0, 19.0, 6.0, 3.0, 4.0, 6.0, 7.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0], "bins": [-6.09765625, -5.92572021484375, -5.7537841796875, -5.58184814453125, -5.409912109375, -5.23797607421875, -5.0660400390625, -4.89410400390625, -4.72216796875, -4.55023193359375, -4.3782958984375, -4.20635986328125, -4.034423828125, -3.86248779296875, -3.6905517578125, -3.51861572265625, -3.3466796875, -3.17474365234375, -3.0028076171875, -2.83087158203125, -2.658935546875, -2.48699951171875, -2.3150634765625, -2.14312744140625, -1.97119140625, -1.79925537109375, -1.6273193359375, -1.45538330078125, -1.283447265625, -1.11151123046875, -0.9395751953125, -0.76763916015625, -0.595703125, -0.42376708984375, -0.2518310546875, -0.07989501953125, 0.092041015625, 0.26397705078125, 0.4359130859375, 0.60784912109375, 0.77978515625, 0.95172119140625, 1.1236572265625, 1.29559326171875, 1.467529296875, 1.63946533203125, 1.8114013671875, 1.98333740234375, 2.1552734375, 2.32720947265625, 2.4991455078125, 2.67108154296875, 2.843017578125, 3.01495361328125, 3.1868896484375, 3.35882568359375, 3.53076171875, 3.70269775390625, 3.8746337890625, 4.04656982421875, 4.218505859375, 4.39044189453125, 4.5623779296875, 4.73431396484375, 4.90625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 1.0, 6.0, 18.0, 17.0, 15.0, 19.0, 27.0, 33.0, 28.0, 57.0, 74.0, 134.0, 226.0, 373.0, 633.0, 1340.0, 3124.0, 8186.0, 21722.0, 64698.0, 184682.0, 472464.0, 942443.0, 1167925.0, 771449.0, 350720.0, 131464.0, 45842.0, 15674.0, 5961.0, 2436.0, 1062.0, 558.0, 304.0, 166.0, 113.0, 78.0, 54.0, 27.0, 22.0, 22.0, 12.0, 14.0, 10.0, 14.0, 5.0, 3.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0], "bins": [-5.89453125, -5.72283935546875, -5.5511474609375, -5.37945556640625, -5.207763671875, -5.03607177734375, -4.8643798828125, -4.69268798828125, -4.52099609375, -4.34930419921875, -4.1776123046875, -4.00592041015625, -3.834228515625, -3.66253662109375, -3.4908447265625, -3.31915283203125, -3.1474609375, -2.97576904296875, -2.8040771484375, -2.63238525390625, -2.460693359375, -2.28900146484375, -2.1173095703125, -1.94561767578125, -1.77392578125, -1.60223388671875, -1.4305419921875, -1.25885009765625, -1.087158203125, -0.91546630859375, -0.7437744140625, -0.57208251953125, -0.400390625, -0.22869873046875, -0.0570068359375, 0.11468505859375, 0.286376953125, 0.45806884765625, 0.6297607421875, 0.80145263671875, 0.97314453125, 1.14483642578125, 1.3165283203125, 1.48822021484375, 1.659912109375, 1.83160400390625, 2.0032958984375, 2.17498779296875, 2.3466796875, 2.51837158203125, 2.6900634765625, 2.86175537109375, 3.033447265625, 3.20513916015625, 3.3768310546875, 3.54852294921875, 3.72021484375, 3.89190673828125, 4.0635986328125, 4.23529052734375, 4.406982421875, 4.57867431640625, 4.7503662109375, 4.92205810546875, 5.09375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 6.0, 4.0, 7.0, 13.0, 11.0, 20.0, 30.0, 26.0, 40.0, 54.0, 63.0, 85.0, 103.0, 145.0, 194.0, 239.0, 308.0, 354.0, 374.0, 383.0, 327.0, 299.0, 243.0, 184.0, 138.0, 98.0, 77.0, 64.0, 40.0, 36.0, 15.0, 19.0, 18.0, 12.0, 11.0, 7.0, 7.0, 8.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0078125, -8.7161865234375, -8.424560546875, -8.1329345703125, -7.84130859375, -7.5496826171875, -7.258056640625, -6.9664306640625, -6.6748046875, -6.3831787109375, -6.091552734375, -5.7999267578125, -5.50830078125, -5.2166748046875, -4.925048828125, -4.6334228515625, -4.341796875, -4.0501708984375, -3.758544921875, -3.4669189453125, -3.17529296875, -2.8836669921875, -2.592041015625, -2.3004150390625, -2.0087890625, -1.7171630859375, -1.425537109375, -1.1339111328125, -0.84228515625, -0.5506591796875, -0.259033203125, 0.0325927734375, 0.32421875, 0.6158447265625, 0.907470703125, 1.1990966796875, 1.49072265625, 1.7823486328125, 2.073974609375, 2.3656005859375, 2.6572265625, 2.9488525390625, 3.240478515625, 3.5321044921875, 3.82373046875, 4.1153564453125, 4.406982421875, 4.6986083984375, 4.990234375, 5.2818603515625, 5.573486328125, 5.8651123046875, 6.15673828125, 6.4483642578125, 6.739990234375, 7.0316162109375, 7.3232421875, 7.6148681640625, 7.906494140625, 8.1981201171875, 8.48974609375, 8.7813720703125, 9.072998046875, 9.3646240234375, 9.65625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 11.0, 10.0, 12.0, 10.0, 16.0, 16.0, 27.0, 39.0, 47.0, 67.0, 116.0, 147.0, 238.0, 427.0, 697.0, 1644.0, 12261.0, 1077884.0, 3056639.0, 39374.0, 2367.0, 879.0, 481.0, 245.0, 177.0, 123.0, 74.0, 65.0, 44.0, 37.0, 24.0, 18.0, 16.0, 13.0, 7.0, 8.0, 7.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.15625, -34.095703125, -33.03515625, -31.974609375, -30.9140625, -29.853515625, -28.79296875, -27.732421875, -26.671875, -25.611328125, -24.55078125, -23.490234375, -22.4296875, -21.369140625, -20.30859375, -19.248046875, -18.1875, -17.126953125, -16.06640625, -15.005859375, -13.9453125, -12.884765625, -11.82421875, -10.763671875, -9.703125, -8.642578125, -7.58203125, -6.521484375, -5.4609375, -4.400390625, -3.33984375, -2.279296875, -1.21875, -0.158203125, 0.90234375, 1.962890625, 3.0234375, 4.083984375, 5.14453125, 6.205078125, 7.265625, 8.326171875, 9.38671875, 10.447265625, 11.5078125, 12.568359375, 13.62890625, 14.689453125, 15.75, 16.810546875, 17.87109375, 18.931640625, 19.9921875, 21.052734375, 22.11328125, 23.173828125, 24.234375, 25.294921875, 26.35546875, 27.416015625, 28.4765625, 29.537109375, 30.59765625, 31.658203125, 32.71875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 34.0, 691.0, 287.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-493.4949035644531, -481.6839904785156, -469.8730773925781, -458.0621337890625, -446.251220703125, -434.4403076171875, -422.62939453125, -410.8184814453125, -399.007568359375, -387.1966552734375, -375.3857421875, -363.5748291015625, -351.7638854980469, -339.9529724121094, -328.1420593261719, -316.3311462402344, -304.52020263671875, -292.70928955078125, -280.89837646484375, -269.08746337890625, -257.2765197753906, -245.46560668945312, -233.65469360351562, -221.84378051757812, -210.03286743164062, -198.22195434570312, -186.41102600097656, -174.60011291503906, -162.78919982910156, -150.978271484375, -139.1673583984375, -127.3564453125, -115.5455322265625, -103.73461151123047, -91.92369842529297, -80.11277770996094, -68.30186462402344, -56.490943908691406, -44.680023193359375, -32.869110107421875, -21.058189392089844, -9.247271537780762, 2.5636463165283203, 14.374565124511719, 26.185482025146484, 37.99639892578125, 49.80731964111328, 61.61823272705078, 73.42915344238281, 85.24007415771484, 97.05098724365234, 108.86190795898438, 120.67282104492188, 132.48373413085938, 144.29466247558594, 156.10557556152344, 167.91650390625, 179.7274169921875, 191.53834533691406, 203.34925842285156, 215.16017150878906, 226.97109985351562, 238.78201293945312, 250.59292602539062, 262.4038391113281]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 3.0, 10.0, 9.0, 10.0, 15.0, 10.0, 25.0, 17.0, 24.0, 28.0, 35.0, 35.0, 38.0, 42.0, 42.0, 36.0, 33.0, 39.0, 37.0, 38.0, 42.0, 44.0, 48.0, 35.0, 44.0, 30.0, 33.0, 26.0, 15.0, 23.0, 19.0, 19.0, 21.0, 8.0, 8.0, 8.0, 7.0, 2.0, 8.0, 6.0, 8.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.747676849365234, -31.709997177124023, -30.672317504882812, -29.6346378326416, -28.59695816040039, -27.55927848815918, -26.52159881591797, -25.483919143676758, -24.446239471435547, -23.408559799194336, -22.370880126953125, -21.333200454711914, -20.295520782470703, -19.257841110229492, -18.22016143798828, -17.18248176574707, -16.14480209350586, -15.107122421264648, -14.069442749023438, -13.031763076782227, -11.994083404541016, -10.956403732299805, -9.918724060058594, -8.881044387817383, -7.843364715576172, -6.805685043334961, -5.76800537109375, -4.730325698852539, -3.692646026611328, -2.654966354370117, -1.6172866821289062, -0.5796070098876953, 0.45807647705078125, 1.4957561492919922, 2.533435821533203, 3.571115493774414, 4.608795166015625, 5.646474838256836, 6.684154510498047, 7.721834182739258, 8.759513854980469, 9.79719352722168, 10.83487319946289, 11.872552871704102, 12.910232543945312, 13.947912216186523, 14.985591888427734, 16.023271560668945, 17.060951232910156, 18.098630905151367, 19.136310577392578, 20.17399024963379, 21.211669921875, 22.24934959411621, 23.287029266357422, 24.324708938598633, 25.362388610839844, 26.400068283081055, 27.437747955322266, 28.475427627563477, 29.513107299804688, 30.5507869720459, 31.58846664428711, 32.62614440917969, 33.66382598876953]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 8.0, 9.0, 6.0, 15.0, 17.0, 21.0, 17.0, 23.0, 25.0, 23.0, 26.0, 27.0, 37.0, 27.0, 40.0, 45.0, 37.0, 38.0, 43.0, 47.0, 44.0, 37.0, 51.0, 35.0, 29.0, 46.0, 25.0, 24.0, 22.0, 33.0, 24.0, 13.0, 15.0, 10.0, 15.0, 12.0, 6.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.63433837890625, -5.4639892578125, -5.29364013671875, -5.123291015625, -4.95294189453125, -4.7825927734375, -4.61224365234375, -4.44189453125, -4.27154541015625, -4.1011962890625, -3.93084716796875, -3.760498046875, -3.59014892578125, -3.4197998046875, -3.24945068359375, -3.0791015625, -2.90875244140625, -2.7384033203125, -2.56805419921875, -2.397705078125, -2.22735595703125, -2.0570068359375, -1.88665771484375, -1.71630859375, -1.54595947265625, -1.3756103515625, -1.20526123046875, -1.034912109375, -0.86456298828125, -0.6942138671875, -0.52386474609375, -0.353515625, -0.18316650390625, -0.0128173828125, 0.15753173828125, 0.327880859375, 0.49822998046875, 0.6685791015625, 0.83892822265625, 1.00927734375, 1.17962646484375, 1.3499755859375, 1.52032470703125, 1.690673828125, 1.86102294921875, 2.0313720703125, 2.20172119140625, 2.3720703125, 2.54241943359375, 2.7127685546875, 2.88311767578125, 3.053466796875, 3.22381591796875, 3.3941650390625, 3.56451416015625, 3.73486328125, 3.90521240234375, 4.0755615234375, 4.24591064453125, 4.416259765625, 4.58660888671875, 4.7569580078125, 4.92730712890625, 5.09765625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 10.0, 8.0, 9.0, 21.0, 23.0, 31.0, 65.0, 100.0, 161.0, 271.0, 407.0, 603.0, 1037.0, 1737.0, 2673.0, 4297.0, 6885.0, 11104.0, 17972.0, 28434.0, 46676.0, 74661.0, 118180.0, 170854.0, 186311.0, 138370.0, 90113.0, 56117.0, 34543.0, 21634.0, 13200.0, 8315.0, 5151.0, 3194.0, 2000.0, 1264.0, 772.0, 498.0, 337.0, 158.0, 133.0, 93.0, 50.0, 33.0, 20.0, 16.0, 3.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.483642578125, -0.46862030029296875, -0.4535980224609375, -0.43857574462890625, -0.423553466796875, -0.40853118896484375, -0.3935089111328125, -0.37848663330078125, -0.36346435546875, -0.34844207763671875, -0.3334197998046875, -0.31839752197265625, -0.303375244140625, -0.28835296630859375, -0.2733306884765625, -0.25830841064453125, -0.2432861328125, -0.22826385498046875, -0.2132415771484375, -0.19821929931640625, -0.183197021484375, -0.16817474365234375, -0.1531524658203125, -0.13813018798828125, -0.12310791015625, -0.10808563232421875, -0.0930633544921875, -0.07804107666015625, -0.063018798828125, -0.04799652099609375, -0.0329742431640625, -0.01795196533203125, -0.0029296875, 0.01209259033203125, 0.0271148681640625, 0.04213714599609375, 0.057159423828125, 0.07218170166015625, 0.0872039794921875, 0.10222625732421875, 0.11724853515625, 0.13227081298828125, 0.1472930908203125, 0.16231536865234375, 0.177337646484375, 0.19235992431640625, 0.2073822021484375, 0.22240447998046875, 0.2374267578125, 0.25244903564453125, 0.2674713134765625, 0.28249359130859375, 0.297515869140625, 0.31253814697265625, 0.3275604248046875, 0.34258270263671875, 0.35760498046875, 0.37262725830078125, 0.3876495361328125, 0.40267181396484375, 0.417694091796875, 0.43271636962890625, 0.4477386474609375, 0.46276092529296875, 0.477783203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 8.0, 4.0, 8.0, 13.0, 16.0, 13.0, 14.0, 19.0, 23.0, 32.0, 16.0, 31.0, 38.0, 27.0, 30.0, 38.0, 33.0, 52.0, 43.0, 1062.0, 37.0, 45.0, 42.0, 38.0, 41.0, 35.0, 32.0, 32.0, 23.0, 30.0, 26.0, 14.0, 29.0, 17.0, 9.0, 9.0, 11.0, 14.0, 3.0, 11.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.873046875, -3.76544189453125, -3.6578369140625, -3.55023193359375, -3.442626953125, -3.33502197265625, -3.2274169921875, -3.11981201171875, -3.01220703125, -2.90460205078125, -2.7969970703125, -2.68939208984375, -2.581787109375, -2.47418212890625, -2.3665771484375, -2.25897216796875, -2.1513671875, -2.04376220703125, -1.9361572265625, -1.82855224609375, -1.720947265625, -1.61334228515625, -1.5057373046875, -1.39813232421875, -1.29052734375, -1.18292236328125, -1.0753173828125, -0.96771240234375, -0.860107421875, -0.75250244140625, -0.6448974609375, -0.53729248046875, -0.4296875, -0.32208251953125, -0.2144775390625, -0.10687255859375, 0.000732421875, 0.10833740234375, 0.2159423828125, 0.32354736328125, 0.43115234375, 0.53875732421875, 0.6463623046875, 0.75396728515625, 0.861572265625, 0.96917724609375, 1.0767822265625, 1.18438720703125, 1.2919921875, 1.39959716796875, 1.5072021484375, 1.61480712890625, 1.722412109375, 1.83001708984375, 1.9376220703125, 2.04522705078125, 2.15283203125, 2.26043701171875, 2.3680419921875, 2.47564697265625, 2.583251953125, 2.69085693359375, 2.7984619140625, 2.90606689453125, 3.013671875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 15.0, 22.0, 27.0, 52.0, 64.0, 91.0, 140.0, 183.0, 276.0, 427.0, 602.0, 908.0, 1383.0, 2013.0, 3098.0, 4907.0, 7527.0, 11958.0, 18395.0, 28077.0, 42936.0, 64047.0, 91550.0, 123007.0, 1125160.0, 209301.0, 113728.0, 82350.0, 56755.0, 37625.0, 24912.0, 16066.0, 10300.0, 6656.0, 4341.0, 2734.0, 1786.0, 1194.0, 812.0, 533.0, 331.0, 263.0, 175.0, 128.0, 90.0, 56.0, 46.0, 27.0, 14.0, 9.0, 7.0, 7.0, 5.0, 4.0, 1.0, 4.0, 2.0], "bins": [-0.267578125, -0.25917816162109375, -0.2507781982421875, -0.24237823486328125, -0.233978271484375, -0.22557830810546875, -0.2171783447265625, -0.20877838134765625, -0.20037841796875, -0.19197845458984375, -0.1835784912109375, -0.17517852783203125, -0.166778564453125, -0.15837860107421875, -0.1499786376953125, -0.14157867431640625, -0.1331787109375, -0.12477874755859375, -0.1163787841796875, -0.10797882080078125, -0.099578857421875, -0.09117889404296875, -0.0827789306640625, -0.07437896728515625, -0.06597900390625, -0.05757904052734375, -0.0491790771484375, -0.04077911376953125, -0.032379150390625, -0.02397918701171875, -0.0155792236328125, -0.00717926025390625, 0.001220703125, 0.00962066650390625, 0.0180206298828125, 0.02642059326171875, 0.034820556640625, 0.04322052001953125, 0.0516204833984375, 0.06002044677734375, 0.06842041015625, 0.07682037353515625, 0.0852203369140625, 0.09362030029296875, 0.102020263671875, 0.11042022705078125, 0.1188201904296875, 0.12722015380859375, 0.1356201171875, 0.14402008056640625, 0.1524200439453125, 0.16082000732421875, 0.169219970703125, 0.17761993408203125, 0.1860198974609375, 0.19441986083984375, 0.20281982421875, 0.21121978759765625, 0.2196197509765625, 0.22801971435546875, 0.236419677734375, 0.24481964111328125, 0.2532196044921875, 0.26161956787109375, 0.27001953125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 16.0, 7.0, 16.0, 18.0, 21.0, 24.0, 24.0, 28.0, 33.0, 60.0, 75.0, 82.0, 94.0, 84.0, 75.0, 50.0, 55.0, 27.0, 26.0, 20.0, 19.0, 20.0, 17.0, 12.0, 5.0, 11.0, 14.0, 8.0, 6.0, 1.0, 5.0, 3.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0101470947265625, -0.009816169738769531, -0.009485244750976562, -0.009154319763183594, -0.008823394775390625, -0.008492469787597656, -0.008161544799804688, -0.007830619812011719, -0.00749969482421875, -0.007168769836425781, -0.0068378448486328125, -0.006506919860839844, -0.006175994873046875, -0.005845069885253906, -0.0055141448974609375, -0.005183219909667969, -0.004852294921875, -0.004521369934082031, -0.0041904449462890625, -0.0038595199584960938, -0.003528594970703125, -0.0031976699829101562, -0.0028667449951171875, -0.0025358200073242188, -0.00220489501953125, -0.0018739700317382812, -0.0015430450439453125, -0.0012121200561523438, -0.000881195068359375, -0.0005502700805664062, -0.0002193450927734375, 0.00011157989501953125, 0.0004425048828125, 0.0007734298706054688, 0.0011043548583984375, 0.0014352798461914062, 0.001766204833984375, 0.0020971298217773438, 0.0024280548095703125, 0.0027589797973632812, 0.00308990478515625, 0.0034208297729492188, 0.0037517547607421875, 0.004082679748535156, 0.004413604736328125, 0.004744529724121094, 0.0050754547119140625, 0.005406379699707031, 0.0057373046875, 0.006068229675292969, 0.0063991546630859375, 0.006730079650878906, 0.007061004638671875, 0.007391929626464844, 0.0077228546142578125, 0.008053779602050781, 0.00838470458984375, 0.008715629577636719, 0.009046554565429688, 0.009377479553222656, 0.009708404541015625, 0.010039329528808594, 0.010370254516601562, 0.010701179504394531, 0.0110321044921875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 6.0, 7.0, 11.0, 10.0, 15.0, 15.0, 17.0, 24.0, 26.0, 41.0, 45.0, 85.0, 107.0, 188.0, 402.0, 2282.0, 83044.0, 945187.0, 15224.0, 1019.0, 297.0, 135.0, 83.0, 61.0, 52.0, 44.0, 27.0, 25.0, 16.0, 15.0, 6.0, 8.0, 8.0, 8.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.24951171875, -0.2420177459716797, -0.23452377319335938, -0.22702980041503906, -0.21953582763671875, -0.21204185485839844, -0.20454788208007812, -0.1970539093017578, -0.1895599365234375, -0.1820659637451172, -0.17457199096679688, -0.16707801818847656, -0.15958404541015625, -0.15209007263183594, -0.14459609985351562, -0.1371021270751953, -0.129608154296875, -0.12211418151855469, -0.11462020874023438, -0.10712623596191406, -0.09963226318359375, -0.09213829040527344, -0.08464431762695312, -0.07715034484863281, -0.0696563720703125, -0.06216239929199219, -0.054668426513671875, -0.04717445373535156, -0.03968048095703125, -0.03218650817871094, -0.024692535400390625, -0.017198562622070312, -0.00970458984375, -0.0022106170654296875, 0.005283355712890625, 0.012777328491210938, 0.02027130126953125, 0.027765274047851562, 0.035259246826171875, 0.04275321960449219, 0.0502471923828125, 0.05774116516113281, 0.06523513793945312, 0.07272911071777344, 0.08022308349609375, 0.08771705627441406, 0.09521102905273438, 0.10270500183105469, 0.110198974609375, 0.11769294738769531, 0.12518692016601562, 0.13268089294433594, 0.14017486572265625, 0.14766883850097656, 0.15516281127929688, 0.1626567840576172, 0.1701507568359375, 0.1776447296142578, 0.18513870239257812, 0.19263267517089844, 0.20012664794921875, 0.20762062072753906, 0.21511459350585938, 0.2226085662841797, 0.2301025390625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 20.0, 37.0, 45.0, 116.0, 246.0, 197.0, 147.0, 67.0, 47.0, 17.0, 21.0, 14.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03400374948978424, -0.03282804414629936, -0.031652338802814484, -0.030476629734039307, -0.029300924390554428, -0.02812521904706955, -0.026949511840939522, -0.025773804634809494, -0.024598099291324615, -0.023422393947839737, -0.02224668674170971, -0.02107097953557968, -0.019895274192094803, -0.018719568848609924, -0.017543861642479897, -0.01636815443634987, -0.01519244909286499, -0.014016742818057537, -0.012841036543250084, -0.01166533026844263, -0.010489623993635178, -0.009313917718827724, -0.008138211444020271, -0.006962505169212818, -0.005786798894405365, -0.004611092619597912, -0.0034353863447904587, -0.0022596800699830055, -0.0010839737951755524, 9.173247963190079e-05, 0.001267438754439354, 0.002443145029246807, 0.0036188513040542603, 0.004794557578861713, 0.0059702638536691666, 0.00714597012847662, 0.008321676403284073, 0.009497382678091526, 0.01067308895289898, 0.011848795227706432, 0.013024501502513885, 0.014200207777321339, 0.015375914052128792, 0.01655162125825882, 0.017727326601743698, 0.018903031945228577, 0.020078739151358604, 0.021254446357488632, 0.02243015170097351, 0.02360585704445839, 0.024781564250588417, 0.025957271456718445, 0.027132976800203323, 0.028308682143688202, 0.02948438934981823, 0.030660096555948257, 0.031835801899433136, 0.033011507242918015, 0.03418721258640289, 0.03536292165517807, 0.03653862699866295, 0.03771433234214783, 0.038890041410923004, 0.04006574675440788, 0.04124145209789276]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 6.0, 6.0, 9.0, 7.0, 13.0, 15.0, 13.0, 28.0, 14.0, 29.0, 24.0, 29.0, 27.0, 32.0, 33.0, 32.0, 42.0, 34.0, 35.0, 46.0, 42.0, 37.0, 31.0, 43.0, 35.0, 36.0, 42.0, 34.0, 28.0, 23.0, 25.0, 33.0, 19.0, 13.0, 22.0, 8.0, 14.0, 10.0, 8.0, 6.0, 1.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.006516158580780029, -0.0063246507197618484, -0.006133142858743668, -0.005941634997725487, -0.005750127136707306, -0.005558619275689125, -0.005367111414670944, -0.005175603553652763, -0.0049840956926345825, -0.004792587831616402, -0.004601079970598221, -0.00440957210958004, -0.004218064248561859, -0.004026556387543678, -0.0038350485265254974, -0.0036435406655073166, -0.0034520328044891357, -0.003260524943470955, -0.003069017082452774, -0.002877509221434593, -0.0026860013604164124, -0.0024944934993982315, -0.0023029856383800507, -0.00211147777736187, -0.001919969916343689, -0.0017284620553255081, -0.0015369541943073273, -0.0013454463332891464, -0.0011539384722709656, -0.0009624306112527847, -0.0007709227502346039, -0.000579414889216423, -0.0003879070281982422, -0.00019639916718006134, -4.891306161880493e-06, 0.00018661655485630035, 0.0003781244158744812, 0.000569632276892662, 0.0007611401379108429, 0.0009526479989290237, 0.0011441558599472046, 0.0013356637209653854, 0.0015271715819835663, 0.0017186794430017471, 0.001910187304019928, 0.002101695165038109, 0.0022932030260562897, 0.0024847108870744705, 0.0026762187480926514, 0.002867726609110832, 0.003059234470129013, 0.003250742331147194, 0.0034422501921653748, 0.0036337580531835556, 0.0038252659142017365, 0.004016773775219917, 0.004208281636238098, 0.004399789497256279, 0.00459129735827446, 0.004782805219292641, 0.0049743130803108215, 0.005165820941329002, 0.005357328802347183, 0.005548836663365364, 0.005740344524383545]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 8.0, 9.0, 6.0, 15.0, 17.0, 21.0, 17.0, 23.0, 25.0, 23.0, 26.0, 27.0, 37.0, 27.0, 40.0, 45.0, 37.0, 38.0, 43.0, 47.0, 44.0, 37.0, 51.0, 36.0, 28.0, 47.0, 24.0, 24.0, 22.0, 33.0, 24.0, 13.0, 15.0, 10.0, 15.0, 12.0, 6.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.8046875, -5.63433837890625, -5.4639892578125, -5.29364013671875, -5.123291015625, -4.95294189453125, -4.7825927734375, -4.61224365234375, -4.44189453125, -4.27154541015625, -4.1011962890625, -3.93084716796875, -3.760498046875, -3.59014892578125, -3.4197998046875, -3.24945068359375, -3.0791015625, -2.90875244140625, -2.7384033203125, -2.56805419921875, -2.397705078125, -2.22735595703125, -2.0570068359375, -1.88665771484375, -1.71630859375, -1.54595947265625, -1.3756103515625, -1.20526123046875, -1.034912109375, -0.86456298828125, -0.6942138671875, -0.52386474609375, -0.353515625, -0.18316650390625, -0.0128173828125, 0.15753173828125, 0.327880859375, 0.49822998046875, 0.6685791015625, 0.83892822265625, 1.00927734375, 1.17962646484375, 1.3499755859375, 1.52032470703125, 1.690673828125, 1.86102294921875, 2.0313720703125, 2.20172119140625, 2.3720703125, 2.54241943359375, 2.7127685546875, 2.88311767578125, 3.053466796875, 3.22381591796875, 3.3941650390625, 3.56451416015625, 3.73486328125, 3.90521240234375, 4.0755615234375, 4.24591064453125, 4.416259765625, 4.58660888671875, 4.7569580078125, 4.92730712890625, 5.09765625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 5.0, 4.0, 6.0, 15.0, 15.0, 22.0, 31.0, 53.0, 75.0, 106.0, 158.0, 287.0, 532.0, 981.0, 1867.0, 3634.0, 6995.0, 13840.0, 26527.0, 52014.0, 111177.0, 256417.0, 300641.0, 142946.0, 63591.0, 32034.0, 16688.0, 8543.0, 4320.0, 2288.0, 1178.0, 621.0, 370.0, 207.0, 126.0, 68.0, 38.0, 39.0, 28.0, 20.0, 8.0, 10.0, 7.0, 7.0, 6.0, 5.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.9190673828125, -5.740478515625, -5.5618896484375, -5.38330078125, -5.2047119140625, -5.026123046875, -4.8475341796875, -4.6689453125, -4.4903564453125, -4.311767578125, -4.1331787109375, -3.95458984375, -3.7760009765625, -3.597412109375, -3.4188232421875, -3.240234375, -3.0616455078125, -2.883056640625, -2.7044677734375, -2.52587890625, -2.3472900390625, -2.168701171875, -1.9901123046875, -1.8115234375, -1.6329345703125, -1.454345703125, -1.2757568359375, -1.09716796875, -0.9185791015625, -0.739990234375, -0.5614013671875, -0.3828125, -0.2042236328125, -0.025634765625, 0.1529541015625, 0.33154296875, 0.5101318359375, 0.688720703125, 0.8673095703125, 1.0458984375, 1.2244873046875, 1.403076171875, 1.5816650390625, 1.76025390625, 1.9388427734375, 2.117431640625, 2.2960205078125, 2.474609375, 2.6531982421875, 2.831787109375, 3.0103759765625, 3.18896484375, 3.3675537109375, 3.546142578125, 3.7247314453125, 3.9033203125, 4.0819091796875, 4.260498046875, 4.4390869140625, 4.61767578125, 4.7962646484375, 4.974853515625, 5.1534423828125, 5.33203125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 3.0, 5.0, 9.0, 7.0, 5.0, 7.0, 13.0, 10.0, 22.0, 24.0, 26.0, 18.0, 24.0, 28.0, 37.0, 45.0, 48.0, 49.0, 69.0, 112.0, 212.0, 1385.0, 285.0, 117.0, 73.0, 67.0, 47.0, 39.0, 38.0, 39.0, 25.0, 20.0, 23.0, 16.0, 17.0, 15.0, 9.0, 9.0, 17.0, 6.0, 10.0, 3.0, 8.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.32666015625, -15.7939453125, -15.26123046875, -14.728515625, -14.19580078125, -13.6630859375, -13.13037109375, -12.59765625, -12.06494140625, -11.5322265625, -10.99951171875, -10.466796875, -9.93408203125, -9.4013671875, -8.86865234375, -8.3359375, -7.80322265625, -7.2705078125, -6.73779296875, -6.205078125, -5.67236328125, -5.1396484375, -4.60693359375, -4.07421875, -3.54150390625, -3.0087890625, -2.47607421875, -1.943359375, -1.41064453125, -0.8779296875, -0.34521484375, 0.1875, 0.72021484375, 1.2529296875, 1.78564453125, 2.318359375, 2.85107421875, 3.3837890625, 3.91650390625, 4.44921875, 4.98193359375, 5.5146484375, 6.04736328125, 6.580078125, 7.11279296875, 7.6455078125, 8.17822265625, 8.7109375, 9.24365234375, 9.7763671875, 10.30908203125, 10.841796875, 11.37451171875, 11.9072265625, 12.43994140625, 12.97265625, 13.50537109375, 14.0380859375, 14.57080078125, 15.103515625, 15.63623046875, 16.1689453125, 16.70166015625, 17.234375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 4.0, 4.0, 8.0, 6.0, 6.0, 14.0, 21.0, 22.0, 32.0, 46.0, 43.0, 71.0, 103.0, 135.0, 238.0, 369.0, 700.0, 2378.0, 72954.0, 3006013.0, 58616.0, 2166.0, 618.0, 370.0, 215.0, 145.0, 99.0, 74.0, 63.0, 41.0, 24.0, 17.0, 21.0, 15.0, 13.0, 7.0, 10.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.65625, -40.37353515625, -39.0908203125, -37.80810546875, -36.525390625, -35.24267578125, -33.9599609375, -32.67724609375, -31.39453125, -30.11181640625, -28.8291015625, -27.54638671875, -26.263671875, -24.98095703125, -23.6982421875, -22.41552734375, -21.1328125, -19.85009765625, -18.5673828125, -17.28466796875, -16.001953125, -14.71923828125, -13.4365234375, -12.15380859375, -10.87109375, -9.58837890625, -8.3056640625, -7.02294921875, -5.740234375, -4.45751953125, -3.1748046875, -1.89208984375, -0.609375, 0.67333984375, 1.9560546875, 3.23876953125, 4.521484375, 5.80419921875, 7.0869140625, 8.36962890625, 9.65234375, 10.93505859375, 12.2177734375, 13.50048828125, 14.783203125, 16.06591796875, 17.3486328125, 18.63134765625, 19.9140625, 21.19677734375, 22.4794921875, 23.76220703125, 25.044921875, 26.32763671875, 27.6103515625, 28.89306640625, 30.17578125, 31.45849609375, 32.7412109375, 34.02392578125, 35.306640625, 36.58935546875, 37.8720703125, 39.15478515625, 40.4375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 40.0, 964.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-681.158935546875, -669.08349609375, -657.008056640625, -644.9326171875, -632.857177734375, -620.78173828125, -608.706298828125, -596.630859375, -584.555419921875, -572.47998046875, -560.404541015625, -548.3291015625, -536.253662109375, -524.17822265625, -512.102783203125, -500.02734375, -487.9518737792969, -475.8764343261719, -463.8009948730469, -451.7255554199219, -439.6501159667969, -427.5746765136719, -415.49920654296875, -403.42376708984375, -391.34832763671875, -379.27288818359375, -367.19744873046875, -355.12200927734375, -343.04656982421875, -330.97113037109375, -318.89569091796875, -306.82025146484375, -294.74481201171875, -282.66937255859375, -270.59393310546875, -258.51849365234375, -246.44305419921875, -234.36761474609375, -222.2921600341797, -210.2167205810547, -198.14129638671875, -186.06585693359375, -173.99041748046875, -161.91497802734375, -149.83953857421875, -137.76409912109375, -125.68864440917969, -113.61320495605469, -101.53776550292969, -89.46232604980469, -77.38688659667969, -65.31143951416016, -53.236000061035156, -41.160560607910156, -29.085113525390625, -17.009674072265625, -4.934234619140625, 7.141206741333008, 19.21664810180664, 31.292091369628906, 43.367530822753906, 55.442970275878906, 67.51841735839844, 79.59385681152344, 91.66929626464844]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 11.0, 9.0, 18.0, 18.0, 23.0, 23.0, 34.0, 37.0, 51.0, 48.0, 53.0, 54.0, 56.0, 56.0, 56.0, 61.0, 65.0, 45.0, 37.0, 42.0, 24.0, 34.0, 17.0, 32.0, 25.0, 16.0, 18.0, 12.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.01895523071289, -61.288143157958984, -59.557334899902344, -57.82652282714844, -56.09571075439453, -54.364898681640625, -52.634090423583984, -50.90327835083008, -49.17247009277344, -47.44165802001953, -45.71084976196289, -43.980037689208984, -42.24922561645508, -40.51841735839844, -38.78760528564453, -37.056793212890625, -35.32598114013672, -33.59516906738281, -31.86435890197754, -30.133548736572266, -28.40273666381836, -26.671926498413086, -24.941116333007812, -23.210304260253906, -21.479494094848633, -19.74868392944336, -18.017871856689453, -16.28706169128418, -14.55625057220459, -12.825439453125, -11.094629287719727, -9.363818168640137, -7.633003234863281, -5.902192115783691, -4.17138147354126, -2.440570831298828, -0.7097597122192383, 1.0210514068603516, 2.751861572265625, 4.482672691345215, 6.213483810424805, 7.9442949295043945, 9.675106048583984, 11.405916213989258, 13.136727333068848, 14.867538452148438, 16.59834861755371, 18.329158782958984, 20.05997085571289, 21.790781021118164, 23.52159309387207, 25.252403259277344, 26.98321533203125, 28.714025497436523, 30.444835662841797, 32.1756477355957, 33.906455993652344, 35.63726806640625, 37.36807632446289, 39.0988883972168, 40.8297004699707, 42.560508728027344, 44.29132080078125, 46.022132873535156, 47.75294494628906]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 3.0, 7.0, 2.0, 6.0, 13.0, 10.0, 15.0, 18.0, 19.0, 20.0, 25.0, 23.0, 20.0, 28.0, 42.0, 34.0, 32.0, 32.0, 39.0, 36.0, 37.0, 44.0, 45.0, 39.0, 37.0, 35.0, 31.0, 29.0, 29.0, 28.0, 26.0, 29.0, 33.0, 20.0, 18.0, 14.0, 15.0, 12.0, 4.0, 12.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0], "bins": [-6.0078125, -5.833251953125, -5.65869140625, -5.484130859375, -5.3095703125, -5.135009765625, -4.96044921875, -4.785888671875, -4.611328125, -4.436767578125, -4.26220703125, -4.087646484375, -3.9130859375, -3.738525390625, -3.56396484375, -3.389404296875, -3.21484375, -3.040283203125, -2.86572265625, -2.691162109375, -2.5166015625, -2.342041015625, -2.16748046875, -1.992919921875, -1.818359375, -1.643798828125, -1.46923828125, -1.294677734375, -1.1201171875, -0.945556640625, -0.77099609375, -0.596435546875, -0.421875, -0.247314453125, -0.07275390625, 0.101806640625, 0.2763671875, 0.450927734375, 0.62548828125, 0.800048828125, 0.974609375, 1.149169921875, 1.32373046875, 1.498291015625, 1.6728515625, 1.847412109375, 2.02197265625, 2.196533203125, 2.37109375, 2.545654296875, 2.72021484375, 2.894775390625, 3.0693359375, 3.243896484375, 3.41845703125, 3.593017578125, 3.767578125, 3.942138671875, 4.11669921875, 4.291259765625, 4.4658203125, 4.640380859375, 4.81494140625, 4.989501953125, 5.1640625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 6.0, 4.0, 5.0, 4.0, 4.0, 16.0, 8.0, 23.0, 10.0, 13.0, 25.0, 33.0, 26.0, 42.0, 46.0, 76.0, 102.0, 182.0, 560.0, 2763.0, 20910.0, 230263.0, 1875420.0, 1816799.0, 222714.0, 20472.0, 2652.0, 502.0, 157.0, 87.0, 64.0, 52.0, 49.0, 34.0, 29.0, 24.0, 16.0, 16.0, 14.0, 14.0, 7.0, 7.0, 1.0, 8.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0], "bins": [-13.5390625, -13.1407470703125, -12.742431640625, -12.3441162109375, -11.94580078125, -11.5474853515625, -11.149169921875, -10.7508544921875, -10.3525390625, -9.9542236328125, -9.555908203125, -9.1575927734375, -8.75927734375, -8.3609619140625, -7.962646484375, -7.5643310546875, -7.166015625, -6.7677001953125, -6.369384765625, -5.9710693359375, -5.57275390625, -5.1744384765625, -4.776123046875, -4.3778076171875, -3.9794921875, -3.5811767578125, -3.182861328125, -2.7845458984375, -2.38623046875, -1.9879150390625, -1.589599609375, -1.1912841796875, -0.79296875, -0.3946533203125, 0.003662109375, 0.4019775390625, 0.80029296875, 1.1986083984375, 1.596923828125, 1.9952392578125, 2.3935546875, 2.7918701171875, 3.190185546875, 3.5885009765625, 3.98681640625, 4.3851318359375, 4.783447265625, 5.1817626953125, 5.580078125, 5.9783935546875, 6.376708984375, 6.7750244140625, 7.17333984375, 7.5716552734375, 7.969970703125, 8.3682861328125, 8.7666015625, 9.1649169921875, 9.563232421875, 9.9615478515625, 10.35986328125, 10.7581787109375, 11.156494140625, 11.5548095703125, 11.953125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 14.0, 21.0, 23.0, 35.0, 45.0, 65.0, 88.0, 151.0, 199.0, 302.0, 432.0, 506.0, 537.0, 494.0, 372.0, 240.0, 156.0, 110.0, 85.0, 58.0, 46.0, 23.0, 18.0, 8.0, 13.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.046875, -15.667236328125, -15.28759765625, -14.907958984375, -14.5283203125, -14.148681640625, -13.76904296875, -13.389404296875, -13.009765625, -12.630126953125, -12.25048828125, -11.870849609375, -11.4912109375, -11.111572265625, -10.73193359375, -10.352294921875, -9.97265625, -9.593017578125, -9.21337890625, -8.833740234375, -8.4541015625, -8.074462890625, -7.69482421875, -7.315185546875, -6.935546875, -6.555908203125, -6.17626953125, -5.796630859375, -5.4169921875, -5.037353515625, -4.65771484375, -4.278076171875, -3.8984375, -3.518798828125, -3.13916015625, -2.759521484375, -2.3798828125, -2.000244140625, -1.62060546875, -1.240966796875, -0.861328125, -0.481689453125, -0.10205078125, 0.277587890625, 0.6572265625, 1.036865234375, 1.41650390625, 1.796142578125, 2.17578125, 2.555419921875, 2.93505859375, 3.314697265625, 3.6943359375, 4.073974609375, 4.45361328125, 4.833251953125, 5.212890625, 5.592529296875, 5.97216796875, 6.351806640625, 6.7314453125, 7.111083984375, 7.49072265625, 7.870361328125, 8.25]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 10.0, 9.0, 15.0, 18.0, 40.0, 47.0, 86.0, 104.0, 133.0, 268.0, 457.0, 951.0, 6485.0, 509116.0, 3615351.0, 57540.0, 1998.0, 674.0, 335.0, 217.0, 137.0, 79.0, 69.0, 44.0, 27.0, 14.0, 20.0, 11.0, 5.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.53125, -26.3486328125, -25.166015625, -23.9833984375, -22.80078125, -21.6181640625, -20.435546875, -19.2529296875, -18.0703125, -16.8876953125, -15.705078125, -14.5224609375, -13.33984375, -12.1572265625, -10.974609375, -9.7919921875, -8.609375, -7.4267578125, -6.244140625, -5.0615234375, -3.87890625, -2.6962890625, -1.513671875, -0.3310546875, 0.8515625, 2.0341796875, 3.216796875, 4.3994140625, 5.58203125, 6.7646484375, 7.947265625, 9.1298828125, 10.3125, 11.4951171875, 12.677734375, 13.8603515625, 15.04296875, 16.2255859375, 17.408203125, 18.5908203125, 19.7734375, 20.9560546875, 22.138671875, 23.3212890625, 24.50390625, 25.6865234375, 26.869140625, 28.0517578125, 29.234375, 30.4169921875, 31.599609375, 32.7822265625, 33.96484375, 35.1474609375, 36.330078125, 37.5126953125, 38.6953125, 39.8779296875, 41.060546875, 42.2431640625, 43.42578125, 44.6083984375, 45.791015625, 46.9736328125, 48.15625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 13.0, 69.0, 311.0, 419.0, 171.0, 32.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.78282165527344, -182.75057983398438, -177.71835327148438, -172.6861114501953, -167.65386962890625, -162.62164306640625, -157.5894012451172, -152.55715942382812, -147.52493286132812, -142.49269104003906, -137.46046447753906, -132.42822265625, -127.39598083496094, -122.3637466430664, -117.33151245117188, -112.29927062988281, -107.26702880859375, -102.23479461669922, -97.20255279541016, -92.17031860351562, -87.13807678222656, -82.10584259033203, -77.0736083984375, -72.04136657714844, -67.0091323852539, -61.97689437866211, -56.94465637207031, -51.91242218017578, -46.880184173583984, -41.84794616699219, -36.815711975097656, -31.78347396850586, -26.751220703125, -21.718982696533203, -16.68674659729004, -11.654509544372559, -6.622272491455078, -1.5900344848632812, 3.442201614379883, 8.474437713623047, 13.506675720214844, 18.53891372680664, 23.571149826049805, 28.60338592529297, 33.635623931884766, 38.66786193847656, 43.700096130371094, 48.73233413696289, 53.76457214355469, 58.796810150146484, 63.82904815673828, 68.86128234863281, 73.89352416992188, 78.9257583618164, 83.95799255371094, 88.990234375, 94.02246856689453, 99.05470275878906, 104.08694458007812, 109.11917877197266, 114.15141296386719, 119.18365478515625, 124.21588897705078, 129.2481231689453, 134.28036499023438]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 2.0, 7.0, 6.0, 7.0, 9.0, 11.0, 10.0, 16.0, 14.0, 15.0, 18.0, 19.0, 22.0, 41.0, 26.0, 25.0, 38.0, 31.0, 37.0, 28.0, 34.0, 39.0, 43.0, 38.0, 29.0, 39.0, 35.0, 42.0, 30.0, 24.0, 33.0, 30.0, 19.0, 28.0, 19.0, 18.0, 18.0, 15.0, 18.0, 17.0, 14.0, 8.0, 11.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.55781555175781, -32.573326110839844, -31.588838577270508, -30.60434913635254, -29.61985969543457, -28.635372161865234, -27.650882720947266, -26.666393280029297, -25.681903839111328, -24.69741439819336, -23.712926864624023, -22.728437423706055, -21.743947982788086, -20.75946044921875, -19.77497100830078, -18.790481567382812, -17.805994033813477, -16.821504592895508, -15.837016105651855, -14.852527618408203, -13.868038177490234, -12.883549690246582, -11.89906120300293, -10.914571762084961, -9.930083274841309, -8.945594787597656, -7.9611053466796875, -6.976616859436035, -5.992127895355225, -5.007638931274414, -4.023150444030762, -3.038661479949951, -2.0541725158691406, -1.0696836709976196, -0.08519482612609863, 0.8992938995361328, 1.8837828636169434, 2.868271827697754, 3.8527603149414062, 4.837249279022217, 5.821738243103027, 6.806227207183838, 7.790716171264648, 8.7752046585083, 9.759693145751953, 10.744182586669922, 11.728671073913574, 12.713159561157227, 13.697649002075195, 14.682137489318848, 15.666626930236816, 16.65111541748047, 17.635604858398438, 18.620094299316406, 19.604581832885742, 20.58907127380371, 21.573558807373047, 22.558048248291016, 23.54253578186035, 24.52702522277832, 25.51151466369629, 26.496002197265625, 27.480491638183594, 28.464981079101562, 29.44947052001953]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 3.0, 4.0, 6.0, 5.0, 12.0, 12.0, 13.0, 9.0, 14.0, 24.0, 33.0, 34.0, 32.0, 35.0, 41.0, 37.0, 40.0, 40.0, 41.0, 53.0, 37.0, 44.0, 38.0, 43.0, 42.0, 38.0, 31.0, 25.0, 34.0, 38.0, 29.0, 17.0, 18.0, 12.0, 20.0, 11.0, 6.0, 10.0, 1.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.556884765625, -6.36376953125, -6.170654296875, -5.9775390625, -5.784423828125, -5.59130859375, -5.398193359375, -5.205078125, -5.011962890625, -4.81884765625, -4.625732421875, -4.4326171875, -4.239501953125, -4.04638671875, -3.853271484375, -3.66015625, -3.467041015625, -3.27392578125, -3.080810546875, -2.8876953125, -2.694580078125, -2.50146484375, -2.308349609375, -2.115234375, -1.922119140625, -1.72900390625, -1.535888671875, -1.3427734375, -1.149658203125, -0.95654296875, -0.763427734375, -0.5703125, -0.377197265625, -0.18408203125, 0.009033203125, 0.2021484375, 0.395263671875, 0.58837890625, 0.781494140625, 0.974609375, 1.167724609375, 1.36083984375, 1.553955078125, 1.7470703125, 1.940185546875, 2.13330078125, 2.326416015625, 2.51953125, 2.712646484375, 2.90576171875, 3.098876953125, 3.2919921875, 3.485107421875, 3.67822265625, 3.871337890625, 4.064453125, 4.257568359375, 4.45068359375, 4.643798828125, 4.8369140625, 5.030029296875, 5.22314453125, 5.416259765625, 5.609375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 6.0, 3.0, 4.0, 16.0, 15.0, 32.0, 38.0, 61.0, 99.0, 129.0, 213.0, 310.0, 412.0, 551.0, 860.0, 1176.0, 1629.0, 2470.0, 3548.0, 5186.0, 7425.0, 10640.0, 15664.0, 22558.0, 33032.0, 47607.0, 68788.0, 94663.0, 121602.0, 138803.0, 127879.0, 101207.0, 74268.0, 52335.0, 36157.0, 24609.0, 16737.0, 11753.0, 8069.0, 5497.0, 3771.0, 2746.0, 1864.0, 1229.0, 899.0, 606.0, 437.0, 322.0, 225.0, 144.0, 88.0, 66.0, 38.0, 26.0, 28.0, 14.0, 10.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.350341796875, -0.3392601013183594, -0.32817840576171875, -0.3170967102050781, -0.3060150146484375, -0.2949333190917969, -0.28385162353515625, -0.2727699279785156, -0.261688232421875, -0.2506065368652344, -0.23952484130859375, -0.22844314575195312, -0.2173614501953125, -0.20627975463867188, -0.19519805908203125, -0.18411636352539062, -0.17303466796875, -0.16195297241210938, -0.15087127685546875, -0.13978958129882812, -0.1287078857421875, -0.11762619018554688, -0.10654449462890625, -0.09546279907226562, -0.084381103515625, -0.07329940795898438, -0.06221771240234375, -0.051136016845703125, -0.0400543212890625, -0.028972625732421875, -0.01789093017578125, -0.006809234619140625, 0.0042724609375, 0.015354156494140625, 0.02643585205078125, 0.037517547607421875, 0.0485992431640625, 0.059680938720703125, 0.07076263427734375, 0.08184432983398438, 0.092926025390625, 0.10400772094726562, 0.11508941650390625, 0.12617111206054688, 0.1372528076171875, 0.14833450317382812, 0.15941619873046875, 0.17049789428710938, 0.18157958984375, 0.19266128540039062, 0.20374298095703125, 0.21482467651367188, 0.2259063720703125, 0.23698806762695312, 0.24806976318359375, 0.2591514587402344, 0.270233154296875, 0.2813148498535156, 0.29239654541015625, 0.3034782409667969, 0.3145599365234375, 0.3256416320800781, 0.33672332763671875, 0.3478050231933594, 0.35888671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 6.0, 12.0, 3.0, 5.0, 12.0, 13.0, 15.0, 13.0, 18.0, 21.0, 23.0, 20.0, 23.0, 25.0, 26.0, 17.0, 34.0, 30.0, 39.0, 31.0, 38.0, 45.0, 1069.0, 30.0, 35.0, 37.0, 28.0, 32.0, 31.0, 33.0, 26.0, 32.0, 26.0, 24.0, 26.0, 23.0, 15.0, 14.0, 12.0, 15.0, 8.0, 7.0, 4.0, 7.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05859375, -2.956634521484375, -2.85467529296875, -2.752716064453125, -2.6507568359375, -2.548797607421875, -2.44683837890625, -2.344879150390625, -2.242919921875, -2.140960693359375, -2.03900146484375, -1.937042236328125, -1.8350830078125, -1.733123779296875, -1.63116455078125, -1.529205322265625, -1.42724609375, -1.325286865234375, -1.22332763671875, -1.121368408203125, -1.0194091796875, -0.917449951171875, -0.81549072265625, -0.713531494140625, -0.611572265625, -0.509613037109375, -0.40765380859375, -0.305694580078125, -0.2037353515625, -0.101776123046875, 0.00018310546875, 0.102142333984375, 0.2041015625, 0.306060791015625, 0.40802001953125, 0.509979248046875, 0.6119384765625, 0.713897705078125, 0.81585693359375, 0.917816162109375, 1.019775390625, 1.121734619140625, 1.22369384765625, 1.325653076171875, 1.4276123046875, 1.529571533203125, 1.63153076171875, 1.733489990234375, 1.83544921875, 1.937408447265625, 2.03936767578125, 2.141326904296875, 2.2432861328125, 2.345245361328125, 2.44720458984375, 2.549163818359375, 2.651123046875, 2.753082275390625, 2.85504150390625, 2.957000732421875, 3.0589599609375, 3.160919189453125, 3.26287841796875, 3.364837646484375, 3.466796875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 10.0, 30.0, 39.0, 62.0, 108.0, 171.0, 209.0, 370.0, 554.0, 914.0, 1514.0, 2469.0, 4297.0, 7191.0, 12087.0, 20107.0, 33980.0, 55968.0, 89235.0, 133033.0, 1019812.0, 364362.0, 129748.0, 86011.0, 54051.0, 32731.0, 19624.0, 11415.0, 6886.0, 4021.0, 2379.0, 1408.0, 892.0, 532.0, 318.0, 213.0, 144.0, 89.0, 51.0, 30.0, 20.0, 10.0, 15.0, 5.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.297607421875, -0.28733062744140625, -0.2770538330078125, -0.26677703857421875, -0.256500244140625, -0.24622344970703125, -0.2359466552734375, -0.22566986083984375, -0.21539306640625, -0.20511627197265625, -0.1948394775390625, -0.18456268310546875, -0.174285888671875, -0.16400909423828125, -0.1537322998046875, -0.14345550537109375, -0.1331787109375, -0.12290191650390625, -0.1126251220703125, -0.10234832763671875, -0.092071533203125, -0.08179473876953125, -0.0715179443359375, -0.06124114990234375, -0.05096435546875, -0.04068756103515625, -0.0304107666015625, -0.02013397216796875, -0.009857177734375, 0.00041961669921875, 0.0106964111328125, 0.02097320556640625, 0.03125, 0.04152679443359375, 0.0518035888671875, 0.06208038330078125, 0.072357177734375, 0.08263397216796875, 0.0929107666015625, 0.10318756103515625, 0.11346435546875, 0.12374114990234375, 0.1340179443359375, 0.14429473876953125, 0.154571533203125, 0.16484832763671875, 0.1751251220703125, 0.18540191650390625, 0.1956787109375, 0.20595550537109375, 0.2162322998046875, 0.22650909423828125, 0.236785888671875, 0.24706268310546875, 0.2573394775390625, 0.26761627197265625, 0.27789306640625, 0.28816986083984375, 0.2984466552734375, 0.30872344970703125, 0.319000244140625, 0.32927703857421875, 0.3395538330078125, 0.34983062744140625, 0.360107421875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 12.0, 15.0, 35.0, 41.0, 54.0, 64.0, 116.0, 226.0, 158.0, 96.0, 61.0, 42.0, 24.0, 13.0, 11.0, 9.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01398468017578125, -0.013581275939941406, -0.013177871704101562, -0.012774467468261719, -0.012371063232421875, -0.011967658996582031, -0.011564254760742188, -0.011160850524902344, -0.0107574462890625, -0.010354042053222656, -0.009950637817382812, -0.009547233581542969, -0.009143829345703125, -0.008740425109863281, -0.008337020874023438, -0.007933616638183594, -0.00753021240234375, -0.007126808166503906, -0.0067234039306640625, -0.006319999694824219, -0.005916595458984375, -0.005513191223144531, -0.0051097869873046875, -0.004706382751464844, -0.004302978515625, -0.0038995742797851562, -0.0034961700439453125, -0.0030927658081054688, -0.002689361572265625, -0.0022859573364257812, -0.0018825531005859375, -0.0014791488647460938, -0.00107574462890625, -0.0006723403930664062, -0.0002689361572265625, 0.00013446807861328125, 0.000537872314453125, 0.0009412765502929688, 0.0013446807861328125, 0.0017480850219726562, 0.0021514892578125, 0.0025548934936523438, 0.0029582977294921875, 0.0033617019653320312, 0.003765106201171875, 0.004168510437011719, 0.0045719146728515625, 0.004975318908691406, 0.00537872314453125, 0.005782127380371094, 0.0061855316162109375, 0.006588935852050781, 0.006992340087890625, 0.007395744323730469, 0.0077991485595703125, 0.008202552795410156, 0.00860595703125, 0.009009361267089844, 0.009412765502929688, 0.009816169738769531, 0.010219573974609375, 0.010622978210449219, 0.011026382446289062, 0.011429786682128906, 0.01183319091796875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 10.0, 16.0, 20.0, 19.0, 46.0, 73.0, 167.0, 601.0, 25136.0, 1015061.0, 6689.0, 366.0, 141.0, 75.0, 45.0, 28.0, 22.0, 11.0, 6.0, 4.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25146484375, -0.2429046630859375, -0.234344482421875, -0.2257843017578125, -0.21722412109375, -0.2086639404296875, -0.200103759765625, -0.1915435791015625, -0.1829833984375, -0.1744232177734375, -0.165863037109375, -0.1573028564453125, -0.14874267578125, -0.1401824951171875, -0.131622314453125, -0.1230621337890625, -0.114501953125, -0.1059417724609375, -0.097381591796875, -0.0888214111328125, -0.08026123046875, -0.0717010498046875, -0.063140869140625, -0.0545806884765625, -0.0460205078125, -0.0374603271484375, -0.028900146484375, -0.0203399658203125, -0.01177978515625, -0.0032196044921875, 0.005340576171875, 0.0139007568359375, 0.0224609375, 0.0310211181640625, 0.039581298828125, 0.0481414794921875, 0.05670166015625, 0.0652618408203125, 0.073822021484375, 0.0823822021484375, 0.0909423828125, 0.0995025634765625, 0.108062744140625, 0.1166229248046875, 0.12518310546875, 0.1337432861328125, 0.142303466796875, 0.1508636474609375, 0.159423828125, 0.1679840087890625, 0.176544189453125, 0.1851043701171875, 0.19366455078125, 0.2022247314453125, 0.210784912109375, 0.2193450927734375, 0.2279052734375, 0.2364654541015625, 0.245025634765625, 0.2535858154296875, 0.26214599609375, 0.2707061767578125, 0.279266357421875, 0.2878265380859375, 0.29638671875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 12.0, 79.0, 468.0, 347.0, 69.0, 26.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.10467356443405151, -0.10253288596868515, -0.10039220750331879, -0.09825153648853302, -0.09611085802316666, -0.09397017955780029, -0.09182950109243393, -0.08968882262706757, -0.0875481441617012, -0.08540746569633484, -0.08326678723096848, -0.08112610876560211, -0.07898543775081635, -0.07684475928544998, -0.07470408082008362, -0.07256340235471725, -0.07042272388935089, -0.06828204542398453, -0.06614136695861816, -0.0640006959438324, -0.061860013753175735, -0.05971933901309967, -0.05757866054773331, -0.05543798208236694, -0.05329731106758118, -0.05115663260221481, -0.04901595786213875, -0.046875279396772385, -0.04473460093140602, -0.042593926191329956, -0.04045324772596359, -0.03831256926059723, -0.036171890795230865, -0.0340312123298645, -0.03189053758978844, -0.029749859124422073, -0.02760918065905571, -0.025468504056334496, -0.02332782745361328, -0.021187148988246918, -0.019046472385525703, -0.01690579578280449, -0.014765117317438126, -0.012624440714716911, -0.010483763180673122, -0.008343085646629333, -0.006202409043908119, -0.00406173150986433, -0.0019210539758205414, 0.00021962332539260387, 0.002360300626605749, 0.004500977694988251, 0.00664165522903204, 0.008782332763075829, 0.010923009365797043, 0.013063686899840832, 0.01520436443388462, 0.017345041036605835, 0.0194857195019722, 0.021626396104693413, 0.023767072707414627, 0.02590775117278099, 0.028048427775502205, 0.03018910437822342, 0.03232978284358978]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 10.0, 11.0, 10.0, 8.0, 10.0, 15.0, 17.0, 26.0, 24.0, 25.0, 29.0, 31.0, 25.0, 38.0, 30.0, 49.0, 45.0, 39.0, 36.0, 51.0, 34.0, 47.0, 44.0, 37.0, 35.0, 29.0, 27.0, 38.0, 27.0, 25.0, 22.0, 19.0, 14.0, 10.0, 10.0, 4.0, 14.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006221175193786621, -0.006025002337992191, -0.0058288294821977615, -0.005632656626403332, -0.005436483770608902, -0.005240310914814472, -0.005044138059020042, -0.004847965203225613, -0.004651792347431183, -0.004455619491636753, -0.004259446635842323, -0.0040632737800478935, -0.0038671009242534637, -0.003670928068459034, -0.003474755212664604, -0.0032785823568701744, -0.0030824095010757446, -0.002886236645281315, -0.002690063789486885, -0.0024938909336924553, -0.0022977180778980255, -0.0021015452221035957, -0.001905372366309166, -0.0017091995105147362, -0.0015130266547203064, -0.0013168537989258766, -0.0011206809431314468, -0.0009245080873370171, -0.0007283352315425873, -0.0005321623757481575, -0.0003359895199537277, -0.00013981666415929794, 5.6356191635131836e-05, 0.0002525290474295616, 0.0004487019032239914, 0.0006448747590184212, 0.000841047614812851, 0.0010372204706072807, 0.0012333933264017105, 0.0014295661821961403, 0.00162573903799057, 0.0018219118937849998, 0.0020180847495794296, 0.0022142576053738594, 0.002410430461168289, 0.002606603316962719, 0.0028027761727571487, 0.0029989490285515785, 0.0031951218843460083, 0.003391294740140438, 0.003587467595934868, 0.0037836404517292976, 0.003979813307523727, 0.004175986163318157, 0.004372159019112587, 0.004568331874907017, 0.0047645047307014465, 0.004960677586495876, 0.005156850442290306, 0.005353023298084736, 0.005549196153879166, 0.005745369009673595, 0.005941541865468025, 0.006137714721262455, 0.006333887577056885]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 7.0, 3.0, 4.0, 6.0, 5.0, 12.0, 12.0, 13.0, 9.0, 14.0, 24.0, 32.0, 35.0, 32.0, 35.0, 40.0, 38.0, 40.0, 39.0, 42.0, 53.0, 37.0, 44.0, 38.0, 42.0, 42.0, 39.0, 28.0, 28.0, 33.0, 38.0, 29.0, 18.0, 17.0, 13.0, 20.0, 11.0, 5.0, 11.0, 1.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.55694580078125, -6.3638916015625, -6.17083740234375, -5.977783203125, -5.78472900390625, -5.5916748046875, -5.39862060546875, -5.20556640625, -5.01251220703125, -4.8194580078125, -4.62640380859375, -4.433349609375, -4.24029541015625, -4.0472412109375, -3.85418701171875, -3.6611328125, -3.46807861328125, -3.2750244140625, -3.08197021484375, -2.888916015625, -2.69586181640625, -2.5028076171875, -2.30975341796875, -2.11669921875, -1.92364501953125, -1.7305908203125, -1.53753662109375, -1.344482421875, -1.15142822265625, -0.9583740234375, -0.76531982421875, -0.572265625, -0.37921142578125, -0.1861572265625, 0.00689697265625, 0.199951171875, 0.39300537109375, 0.5860595703125, 0.77911376953125, 0.97216796875, 1.16522216796875, 1.3582763671875, 1.55133056640625, 1.744384765625, 1.93743896484375, 2.1304931640625, 2.32354736328125, 2.5166015625, 2.70965576171875, 2.9027099609375, 3.09576416015625, 3.288818359375, 3.48187255859375, 3.6749267578125, 3.86798095703125, 4.06103515625, 4.25408935546875, 4.4471435546875, 4.64019775390625, 4.833251953125, 5.02630615234375, 5.2193603515625, 5.41241455078125, 5.60546875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 3.0, 7.0, 2.0, 7.0, 6.0, 12.0, 10.0, 10.0, 15.0, 26.0, 42.0, 43.0, 60.0, 80.0, 132.0, 148.0, 240.0, 471.0, 1131.0, 3507.0, 10924.0, 36700.0, 196149.0, 607123.0, 146590.0, 30787.0, 9304.0, 2824.0, 1009.0, 409.0, 219.0, 153.0, 92.0, 67.0, 53.0, 50.0, 36.0, 42.0, 21.0, 12.0, 11.0, 9.0, 9.0, 6.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.640625, -12.2838134765625, -11.927001953125, -11.5701904296875, -11.21337890625, -10.8565673828125, -10.499755859375, -10.1429443359375, -9.7861328125, -9.4293212890625, -9.072509765625, -8.7156982421875, -8.35888671875, -8.0020751953125, -7.645263671875, -7.2884521484375, -6.931640625, -6.5748291015625, -6.218017578125, -5.8612060546875, -5.50439453125, -5.1475830078125, -4.790771484375, -4.4339599609375, -4.0771484375, -3.7203369140625, -3.363525390625, -3.0067138671875, -2.64990234375, -2.2930908203125, -1.936279296875, -1.5794677734375, -1.22265625, -0.8658447265625, -0.509033203125, -0.1522216796875, 0.20458984375, 0.5614013671875, 0.918212890625, 1.2750244140625, 1.6318359375, 1.9886474609375, 2.345458984375, 2.7022705078125, 3.05908203125, 3.4158935546875, 3.772705078125, 4.1295166015625, 4.486328125, 4.8431396484375, 5.199951171875, 5.5567626953125, 5.91357421875, 6.2703857421875, 6.627197265625, 6.9840087890625, 7.3408203125, 7.6976318359375, 8.054443359375, 8.4112548828125, 8.76806640625, 9.1248779296875, 9.481689453125, 9.8385009765625, 10.1953125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 8.0, 15.0, 7.0, 20.0, 16.0, 19.0, 20.0, 21.0, 23.0, 31.0, 32.0, 35.0, 39.0, 51.0, 63.0, 80.0, 131.0, 1472.0, 402.0, 134.0, 66.0, 43.0, 37.0, 38.0, 33.0, 32.0, 27.0, 31.0, 19.0, 13.0, 18.0, 13.0, 12.0, 12.0, 11.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -19.101806640625, -18.48486328125, -17.867919921875, -17.2509765625, -16.634033203125, -16.01708984375, -15.400146484375, -14.783203125, -14.166259765625, -13.54931640625, -12.932373046875, -12.3154296875, -11.698486328125, -11.08154296875, -10.464599609375, -9.84765625, -9.230712890625, -8.61376953125, -7.996826171875, -7.3798828125, -6.762939453125, -6.14599609375, -5.529052734375, -4.912109375, -4.295166015625, -3.67822265625, -3.061279296875, -2.4443359375, -1.827392578125, -1.21044921875, -0.593505859375, 0.0234375, 0.640380859375, 1.25732421875, 1.874267578125, 2.4912109375, 3.108154296875, 3.72509765625, 4.342041015625, 4.958984375, 5.575927734375, 6.19287109375, 6.809814453125, 7.4267578125, 8.043701171875, 8.66064453125, 9.277587890625, 9.89453125, 10.511474609375, 11.12841796875, 11.745361328125, 12.3623046875, 12.979248046875, 13.59619140625, 14.213134765625, 14.830078125, 15.447021484375, 16.06396484375, 16.680908203125, 17.2978515625, 17.914794921875, 18.53173828125, 19.148681640625, 19.765625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 10.0, 7.0, 7.0, 8.0, 13.0, 13.0, 25.0, 18.0, 37.0, 42.0, 60.0, 81.0, 101.0, 168.0, 334.0, 847.0, 6501.0, 2807089.0, 326142.0, 2727.0, 622.0, 275.0, 171.0, 101.0, 70.0, 53.0, 36.0, 31.0, 32.0, 26.0, 14.0, 11.0, 12.0, 6.0, 3.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.5, -38.87060546875, -37.2412109375, -35.61181640625, -33.982421875, -32.35302734375, -30.7236328125, -29.09423828125, -27.46484375, -25.83544921875, -24.2060546875, -22.57666015625, -20.947265625, -19.31787109375, -17.6884765625, -16.05908203125, -14.4296875, -12.80029296875, -11.1708984375, -9.54150390625, -7.912109375, -6.28271484375, -4.6533203125, -3.02392578125, -1.39453125, 0.23486328125, 1.8642578125, 3.49365234375, 5.123046875, 6.75244140625, 8.3818359375, 10.01123046875, 11.640625, 13.27001953125, 14.8994140625, 16.52880859375, 18.158203125, 19.78759765625, 21.4169921875, 23.04638671875, 24.67578125, 26.30517578125, 27.9345703125, 29.56396484375, 31.193359375, 32.82275390625, 34.4521484375, 36.08154296875, 37.7109375, 39.34033203125, 40.9697265625, 42.59912109375, 44.228515625, 45.85791015625, 47.4873046875, 49.11669921875, 50.74609375, 52.37548828125, 54.0048828125, 55.63427734375, 57.263671875, 58.89306640625, 60.5224609375, 62.15185546875, 63.78125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 15.0, 68.0, 130.0, 226.0, 277.0, 194.0, 63.0, 32.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.018024444580078, -24.410335540771484, -22.80264663696289, -21.194957733154297, -19.587268829345703, -17.97957992553711, -16.371889114379883, -14.764200210571289, -13.156511306762695, -11.548822402954102, -9.941133499145508, -8.333443641662598, -6.725754737854004, -5.11806583404541, -3.5103759765625, -1.9026870727539062, -0.2949981689453125, 1.3126909732818604, 2.920380115509033, 4.528069496154785, 6.135758399963379, 7.743447303771973, 9.351137161254883, 10.958826065063477, 12.56651496887207, 14.174203872680664, 15.781892776489258, 17.389583587646484, 18.997272491455078, 20.604961395263672, 22.212650299072266, 23.82033920288086, 25.428024291992188, 27.03571319580078, 28.643402099609375, 30.25109100341797, 31.858779907226562, 33.466468811035156, 35.07415771484375, 36.681846618652344, 38.28953552246094, 39.89722442626953, 41.504913330078125, 43.11260223388672, 44.72029113769531, 46.327980041503906, 47.9356689453125, 49.543357849121094, 51.15105056762695, 52.75873947143555, 54.36642837524414, 55.974117279052734, 57.58180618286133, 59.18949508666992, 60.79718780517578, 62.404876708984375, 64.01256561279297, 65.62025451660156, 67.22794342041016, 68.83563232421875, 70.44332122802734, 72.05101013183594, 73.65869903564453, 75.26638793945312, 76.87407684326172]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 11.0, 5.0, 11.0, 4.0, 12.0, 13.0, 21.0, 21.0, 22.0, 27.0, 27.0, 29.0, 31.0, 23.0, 43.0, 32.0, 47.0, 44.0, 31.0, 43.0, 41.0, 44.0, 52.0, 45.0, 37.0, 30.0, 24.0, 36.0, 24.0, 31.0, 23.0, 20.0, 19.0, 13.0, 15.0, 8.0, 10.0, 7.0, 8.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.94161605834961, -42.57663345336914, -41.21165084838867, -39.8466682434082, -38.481685638427734, -37.116703033447266, -35.7517204284668, -34.38673782348633, -33.02175521850586, -31.65677261352539, -30.291790008544922, -28.926807403564453, -27.561824798583984, -26.196842193603516, -24.831859588623047, -23.466876983642578, -22.10189437866211, -20.73691177368164, -19.371929168701172, -18.006946563720703, -16.641963958740234, -15.276981353759766, -13.911998748779297, -12.547016143798828, -11.18203353881836, -9.81705093383789, -8.452068328857422, -7.087085723876953, -5.722103118896484, -4.357120513916016, -2.992137908935547, -1.6271553039550781, -0.26216888427734375, 1.102813720703125, 2.4677963256835938, 3.8327789306640625, 5.197761535644531, 6.562744140625, 7.927726745605469, 9.292709350585938, 10.657691955566406, 12.022674560546875, 13.387657165527344, 14.752639770507812, 16.11762237548828, 17.48260498046875, 18.84758758544922, 20.212570190429688, 21.577552795410156, 22.942535400390625, 24.307518005371094, 25.672500610351562, 27.03748321533203, 28.4024658203125, 29.76744842529297, 31.132431030273438, 32.497413635253906, 33.862396240234375, 35.227378845214844, 36.59236145019531, 37.95734405517578, 39.32232666015625, 40.68730926513672, 42.05229187011719, 43.417274475097656]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 8.0, 8.0, 3.0, 6.0, 5.0, 11.0, 16.0, 15.0, 14.0, 28.0, 22.0, 34.0, 30.0, 47.0, 31.0, 37.0, 51.0, 32.0, 45.0, 52.0, 36.0, 47.0, 46.0, 43.0, 32.0, 39.0, 39.0, 37.0, 30.0, 27.0, 20.0, 18.0, 19.0, 13.0, 11.0, 9.0, 12.0, 8.0, 8.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.93359375, -7.7236328125, -7.513671875, -7.3037109375, -7.09375, -6.8837890625, -6.673828125, -6.4638671875, -6.25390625, -6.0439453125, -5.833984375, -5.6240234375, -5.4140625, -5.2041015625, -4.994140625, -4.7841796875, -4.57421875, -4.3642578125, -4.154296875, -3.9443359375, -3.734375, -3.5244140625, -3.314453125, -3.1044921875, -2.89453125, -2.6845703125, -2.474609375, -2.2646484375, -2.0546875, -1.8447265625, -1.634765625, -1.4248046875, -1.21484375, -1.0048828125, -0.794921875, -0.5849609375, -0.375, -0.1650390625, 0.044921875, 0.2548828125, 0.46484375, 0.6748046875, 0.884765625, 1.0947265625, 1.3046875, 1.5146484375, 1.724609375, 1.9345703125, 2.14453125, 2.3544921875, 2.564453125, 2.7744140625, 2.984375, 3.1943359375, 3.404296875, 3.6142578125, 3.82421875, 4.0341796875, 4.244140625, 4.4541015625, 4.6640625, 4.8740234375, 5.083984375, 5.2939453125, 5.50390625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 6.0, 4.0, 10.0, 7.0, 11.0, 16.0, 18.0, 23.0, 35.0, 36.0, 43.0, 60.0, 97.0, 151.0, 312.0, 888.0, 3680.0, 23242.0, 196040.0, 1353378.0, 2081504.0, 467982.0, 56670.0, 7599.0, 1452.0, 410.0, 172.0, 106.0, 67.0, 63.0, 46.0, 30.0, 25.0, 18.0, 14.0, 17.0, 6.0, 9.0, 7.0, 6.0, 4.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-12.8515625, -12.49658203125, -12.1416015625, -11.78662109375, -11.431640625, -11.07666015625, -10.7216796875, -10.36669921875, -10.01171875, -9.65673828125, -9.3017578125, -8.94677734375, -8.591796875, -8.23681640625, -7.8818359375, -7.52685546875, -7.171875, -6.81689453125, -6.4619140625, -6.10693359375, -5.751953125, -5.39697265625, -5.0419921875, -4.68701171875, -4.33203125, -3.97705078125, -3.6220703125, -3.26708984375, -2.912109375, -2.55712890625, -2.2021484375, -1.84716796875, -1.4921875, -1.13720703125, -0.7822265625, -0.42724609375, -0.072265625, 0.28271484375, 0.6376953125, 0.99267578125, 1.34765625, 1.70263671875, 2.0576171875, 2.41259765625, 2.767578125, 3.12255859375, 3.4775390625, 3.83251953125, 4.1875, 4.54248046875, 4.8974609375, 5.25244140625, 5.607421875, 5.96240234375, 6.3173828125, 6.67236328125, 7.02734375, 7.38232421875, 7.7373046875, 8.09228515625, 8.447265625, 8.80224609375, 9.1572265625, 9.51220703125, 9.8671875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 7.0, 5.0, 17.0, 11.0, 20.0, 28.0, 34.0, 44.0, 49.0, 77.0, 76.0, 115.0, 182.0, 191.0, 246.0, 329.0, 374.0, 364.0, 353.0, 315.0, 270.0, 218.0, 187.0, 125.0, 94.0, 76.0, 75.0, 36.0, 28.0, 25.0, 23.0, 18.0, 12.0, 9.0, 7.0, 4.0, 9.0, 1.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.515625, -8.255126953125, -7.99462890625, -7.734130859375, -7.4736328125, -7.213134765625, -6.95263671875, -6.692138671875, -6.431640625, -6.171142578125, -5.91064453125, -5.650146484375, -5.3896484375, -5.129150390625, -4.86865234375, -4.608154296875, -4.34765625, -4.087158203125, -3.82666015625, -3.566162109375, -3.3056640625, -3.045166015625, -2.78466796875, -2.524169921875, -2.263671875, -2.003173828125, -1.74267578125, -1.482177734375, -1.2216796875, -0.961181640625, -0.70068359375, -0.440185546875, -0.1796875, 0.080810546875, 0.34130859375, 0.601806640625, 0.8623046875, 1.122802734375, 1.38330078125, 1.643798828125, 1.904296875, 2.164794921875, 2.42529296875, 2.685791015625, 2.9462890625, 3.206787109375, 3.46728515625, 3.727783203125, 3.98828125, 4.248779296875, 4.50927734375, 4.769775390625, 5.0302734375, 5.290771484375, 5.55126953125, 5.811767578125, 6.072265625, 6.332763671875, 6.59326171875, 6.853759765625, 7.1142578125, 7.374755859375, 7.63525390625, 7.895751953125, 8.15625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 8.0, 9.0, 10.0, 9.0, 21.0, 28.0, 28.0, 39.0, 62.0, 92.0, 117.0, 162.0, 222.0, 320.0, 521.0, 1055.0, 3358.0, 20417.0, 244476.0, 2729965.0, 1108651.0, 72642.0, 8095.0, 1827.0, 736.0, 424.0, 267.0, 180.0, 155.0, 90.0, 69.0, 65.0, 29.0, 35.0, 23.0, 20.0, 15.0, 5.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.75, -18.140625, -17.53125, -16.921875, -16.3125, -15.703125, -15.09375, -14.484375, -13.875, -13.265625, -12.65625, -12.046875, -11.4375, -10.828125, -10.21875, -9.609375, -9.0, -8.390625, -7.78125, -7.171875, -6.5625, -5.953125, -5.34375, -4.734375, -4.125, -3.515625, -2.90625, -2.296875, -1.6875, -1.078125, -0.46875, 0.140625, 0.75, 1.359375, 1.96875, 2.578125, 3.1875, 3.796875, 4.40625, 5.015625, 5.625, 6.234375, 6.84375, 7.453125, 8.0625, 8.671875, 9.28125, 9.890625, 10.5, 11.109375, 11.71875, 12.328125, 12.9375, 13.546875, 14.15625, 14.765625, 15.375, 15.984375, 16.59375, 17.203125, 17.8125, 18.421875, 19.03125, 19.640625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 12.0, 44.0, 80.0, 160.0, 195.0, 200.0, 180.0, 78.0, 41.0, 16.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0794677734375, -30.730344772338867, -28.381221771240234, -26.032100677490234, -23.6829776763916, -21.33385467529297, -18.98473358154297, -16.635610580444336, -14.286487579345703, -11.93736457824707, -9.588242530822754, -7.239120006561279, -4.889997482299805, -2.540874481201172, -0.19175243377685547, 2.157369613647461, 4.506492614746094, 6.855615139007568, 9.204737663269043, 11.55385971069336, 13.902982711791992, 16.252105712890625, 18.601226806640625, 20.950349807739258, 23.29947280883789, 25.648595809936523, 27.997718811035156, 30.346839904785156, 32.695960998535156, 35.04508590698242, 37.39420700073242, 39.74333190917969, 42.09245300292969, 44.44157409667969, 46.79069900512695, 49.13982009887695, 51.48894500732422, 53.83806610107422, 56.18718719482422, 58.53630828857422, 60.885433197021484, 63.234554290771484, 65.58367919921875, 67.93280029296875, 70.28192138671875, 72.63104248046875, 74.98017120361328, 77.32929229736328, 79.67841339111328, 82.02753448486328, 84.37665557861328, 86.72578430175781, 89.07490539550781, 91.42402648925781, 93.77314758300781, 96.12226867675781, 98.47138977050781, 100.82051086425781, 103.16963195800781, 105.51876068115234, 107.86788177490234, 110.21700286865234, 112.56612396240234, 114.91524505615234, 117.26437377929688]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 5.0, 7.0, 10.0, 6.0, 12.0, 14.0, 18.0, 12.0, 21.0, 22.0, 26.0, 17.0, 26.0, 28.0, 26.0, 24.0, 29.0, 32.0, 40.0, 49.0, 28.0, 32.0, 36.0, 34.0, 33.0, 30.0, 42.0, 36.0, 21.0, 23.0, 35.0, 21.0, 24.0, 17.0, 23.0, 22.0, 19.0, 17.0, 20.0, 13.0, 12.0, 8.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-29.119922637939453, -28.207233428955078, -27.29454231262207, -26.381851196289062, -25.469161987304688, -24.556472778320312, -23.643781661987305, -22.731090545654297, -21.818401336669922, -20.905712127685547, -19.99302101135254, -19.08032989501953, -18.167640686035156, -17.25495147705078, -16.342260360717773, -15.429570198059082, -14.51688003540039, -13.6041898727417, -12.691499710083008, -11.778809547424316, -10.866119384765625, -9.953429222106934, -9.040739059448242, -8.12804889678955, -7.215358734130859, -6.302668571472168, -5.389978408813477, -4.477288246154785, -3.5645980834960938, -2.6519079208374023, -1.739217758178711, -0.8265275955200195, 0.08616065979003906, 0.9988508224487305, 1.9115409851074219, 2.8242311477661133, 3.7369213104248047, 4.649611473083496, 5.5623016357421875, 6.474991798400879, 7.38768196105957, 8.300372123718262, 9.213062286376953, 10.125752449035645, 11.038442611694336, 11.951132774353027, 12.863822937011719, 13.77651309967041, 14.689203262329102, 15.601893424987793, 16.514583587646484, 17.42727279663086, 18.339963912963867, 19.252655029296875, 20.16534423828125, 21.078033447265625, 21.990724563598633, 22.90341567993164, 23.816104888916016, 24.72879409790039, 25.6414852142334, 26.554176330566406, 27.46686553955078, 28.379554748535156, 29.292245864868164]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 11.0, 10.0, 9.0, 19.0, 15.0, 11.0, 15.0, 23.0, 24.0, 25.0, 25.0, 32.0, 28.0, 34.0, 43.0, 44.0, 40.0, 38.0, 41.0, 42.0, 49.0, 39.0, 38.0, 29.0, 26.0, 30.0, 24.0, 23.0, 23.0, 32.0, 21.0, 21.0, 18.0, 13.0, 18.0, 8.0, 10.0, 9.0, 9.0, 8.0, 7.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5, -6.313720703125, -6.12744140625, -5.941162109375, -5.7548828125, -5.568603515625, -5.38232421875, -5.196044921875, -5.009765625, -4.823486328125, -4.63720703125, -4.450927734375, -4.2646484375, -4.078369140625, -3.89208984375, -3.705810546875, -3.51953125, -3.333251953125, -3.14697265625, -2.960693359375, -2.7744140625, -2.588134765625, -2.40185546875, -2.215576171875, -2.029296875, -1.843017578125, -1.65673828125, -1.470458984375, -1.2841796875, -1.097900390625, -0.91162109375, -0.725341796875, -0.5390625, -0.352783203125, -0.16650390625, 0.019775390625, 0.2060546875, 0.392333984375, 0.57861328125, 0.764892578125, 0.951171875, 1.137451171875, 1.32373046875, 1.510009765625, 1.6962890625, 1.882568359375, 2.06884765625, 2.255126953125, 2.44140625, 2.627685546875, 2.81396484375, 3.000244140625, 3.1865234375, 3.372802734375, 3.55908203125, 3.745361328125, 3.931640625, 4.117919921875, 4.30419921875, 4.490478515625, 4.6767578125, 4.863037109375, 5.04931640625, 5.235595703125, 5.421875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 8.0, 9.0, 14.0, 16.0, 24.0, 35.0, 54.0, 76.0, 124.0, 184.0, 298.0, 398.0, 692.0, 963.0, 1402.0, 2160.0, 3130.0, 4624.0, 7021.0, 10314.0, 15558.0, 23145.0, 34103.0, 51143.0, 74476.0, 105516.0, 139366.0, 153037.0, 127278.0, 93777.0, 64709.0, 44224.0, 29730.0, 20073.0, 13595.0, 9045.0, 6008.0, 4055.0, 2658.0, 1831.0, 1242.0, 823.0, 556.0, 340.0, 259.0, 161.0, 123.0, 69.0, 45.0, 30.0, 22.0, 9.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.376220703125, -0.3642082214355469, -0.35219573974609375, -0.3401832580566406, -0.3281707763671875, -0.3161582946777344, -0.30414581298828125, -0.2921333312988281, -0.280120849609375, -0.2681083679199219, -0.25609588623046875, -0.24408340454101562, -0.2320709228515625, -0.22005844116210938, -0.20804595947265625, -0.19603347778320312, -0.18402099609375, -0.17200851440429688, -0.15999603271484375, -0.14798355102539062, -0.1359710693359375, -0.12395858764648438, -0.11194610595703125, -0.09993362426757812, -0.087921142578125, -0.07590866088867188, -0.06389617919921875, -0.051883697509765625, -0.0398712158203125, -0.027858734130859375, -0.01584625244140625, -0.003833770751953125, 0.0081787109375, 0.020191192626953125, 0.03220367431640625, 0.044216156005859375, 0.0562286376953125, 0.06824111938476562, 0.08025360107421875, 0.09226608276367188, 0.104278564453125, 0.11629104614257812, 0.12830352783203125, 0.14031600952148438, 0.1523284912109375, 0.16434097290039062, 0.17635345458984375, 0.18836593627929688, 0.20037841796875, 0.21239089965820312, 0.22440338134765625, 0.23641586303710938, 0.2484283447265625, 0.2604408264160156, 0.27245330810546875, 0.2844657897949219, 0.296478271484375, 0.3084907531738281, 0.32050323486328125, 0.3325157165527344, 0.3445281982421875, 0.3565406799316406, 0.36855316162109375, 0.3805656433105469, 0.392578125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 9.0, 4.0, 7.0, 7.0, 12.0, 10.0, 17.0, 19.0, 19.0, 19.0, 31.0, 35.0, 29.0, 31.0, 49.0, 27.0, 50.0, 38.0, 41.0, 1053.0, 40.0, 49.0, 49.0, 48.0, 46.0, 36.0, 41.0, 22.0, 25.0, 29.0, 25.0, 26.0, 18.0, 10.0, 17.0, 14.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.02423095703125, -3.8883056640625, -3.75238037109375, -3.616455078125, -3.48052978515625, -3.3446044921875, -3.20867919921875, -3.07275390625, -2.93682861328125, -2.8009033203125, -2.66497802734375, -2.529052734375, -2.39312744140625, -2.2572021484375, -2.12127685546875, -1.9853515625, -1.84942626953125, -1.7135009765625, -1.57757568359375, -1.441650390625, -1.30572509765625, -1.1697998046875, -1.03387451171875, -0.89794921875, -0.76202392578125, -0.6260986328125, -0.49017333984375, -0.354248046875, -0.21832275390625, -0.0823974609375, 0.05352783203125, 0.189453125, 0.32537841796875, 0.4613037109375, 0.59722900390625, 0.733154296875, 0.86907958984375, 1.0050048828125, 1.14093017578125, 1.27685546875, 1.41278076171875, 1.5487060546875, 1.68463134765625, 1.820556640625, 1.95648193359375, 2.0924072265625, 2.22833251953125, 2.3642578125, 2.50018310546875, 2.6361083984375, 2.77203369140625, 2.907958984375, 3.04388427734375, 3.1798095703125, 3.31573486328125, 3.45166015625, 3.58758544921875, 3.7235107421875, 3.85943603515625, 3.995361328125, 4.13128662109375, 4.2672119140625, 4.40313720703125, 4.5390625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 9.0, 3.0, 12.0, 5.0, 11.0, 17.0, 25.0, 24.0, 51.0, 75.0, 111.0, 155.0, 234.0, 281.0, 447.0, 700.0, 1055.0, 1622.0, 2471.0, 3853.0, 6211.0, 9549.0, 15309.0, 23697.0, 37101.0, 56307.0, 83133.0, 115602.0, 172737.0, 1165837.0, 125188.0, 92908.0, 63975.0, 42371.0, 27482.0, 17498.0, 11131.0, 7116.0, 4496.0, 2853.0, 1844.0, 1244.0, 802.0, 533.0, 332.0, 230.0, 161.0, 96.0, 77.0, 40.0, 29.0, 23.0, 15.0, 13.0, 12.0, 8.0, 12.0, 5.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.28857421875, -0.2793121337890625, -0.270050048828125, -0.2607879638671875, -0.25152587890625, -0.2422637939453125, -0.233001708984375, -0.2237396240234375, -0.2144775390625, -0.2052154541015625, -0.195953369140625, -0.1866912841796875, -0.17742919921875, -0.1681671142578125, -0.158905029296875, -0.1496429443359375, -0.140380859375, -0.1311187744140625, -0.121856689453125, -0.1125946044921875, -0.10333251953125, -0.0940704345703125, -0.084808349609375, -0.0755462646484375, -0.0662841796875, -0.0570220947265625, -0.047760009765625, -0.0384979248046875, -0.02923583984375, -0.0199737548828125, -0.010711669921875, -0.0014495849609375, 0.0078125, 0.0170745849609375, 0.026336669921875, 0.0355987548828125, 0.04486083984375, 0.0541229248046875, 0.063385009765625, 0.0726470947265625, 0.0819091796875, 0.0911712646484375, 0.100433349609375, 0.1096954345703125, 0.11895751953125, 0.1282196044921875, 0.137481689453125, 0.1467437744140625, 0.156005859375, 0.1652679443359375, 0.174530029296875, 0.1837921142578125, 0.19305419921875, 0.2023162841796875, 0.211578369140625, 0.2208404541015625, 0.2301025390625, 0.2393646240234375, 0.248626708984375, 0.2578887939453125, 0.26715087890625, 0.2764129638671875, 0.285675048828125, 0.2949371337890625, 0.30419921875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 2.0, 6.0, 6.0, 5.0, 4.0, 7.0, 9.0, 13.0, 15.0, 17.0, 15.0, 30.0, 43.0, 44.0, 58.0, 89.0, 99.0, 107.0, 97.0, 64.0, 51.0, 39.0, 30.0, 25.0, 24.0, 12.0, 16.0, 10.0, 6.0, 10.0, 6.0, 3.0, 7.0, 6.0, 3.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00766754150390625, -0.007431149482727051, -0.0071947574615478516, -0.006958365440368652, -0.006721973419189453, -0.006485581398010254, -0.006249189376831055, -0.0060127973556518555, -0.005776405334472656, -0.005540013313293457, -0.005303621292114258, -0.005067229270935059, -0.004830837249755859, -0.00459444522857666, -0.004358053207397461, -0.004121661186218262, -0.0038852691650390625, -0.0036488771438598633, -0.003412485122680664, -0.003176093101501465, -0.0029397010803222656, -0.0027033090591430664, -0.002466917037963867, -0.002230525016784668, -0.0019941329956054688, -0.0017577409744262695, -0.0015213489532470703, -0.001284956932067871, -0.0010485649108886719, -0.0008121728897094727, -0.0005757808685302734, -0.0003393888473510742, -0.000102996826171875, 0.00013339519500732422, 0.00036978721618652344, 0.0006061792373657227, 0.0008425712585449219, 0.001078963279724121, 0.0013153553009033203, 0.0015517473220825195, 0.0017881393432617188, 0.002024531364440918, 0.002260923385620117, 0.0024973154067993164, 0.0027337074279785156, 0.002970099449157715, 0.003206491470336914, 0.0034428834915161133, 0.0036792755126953125, 0.003915667533874512, 0.004152059555053711, 0.00438845157623291, 0.004624843597412109, 0.004861235618591309, 0.005097627639770508, 0.005334019660949707, 0.005570411682128906, 0.0058068037033081055, 0.006043195724487305, 0.006279587745666504, 0.006515979766845703, 0.006752371788024902, 0.0069887638092041016, 0.007225155830383301, 0.0074615478515625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 8.0, 6.0, 7.0, 10.0, 9.0, 6.0, 13.0, 15.0, 14.0, 27.0, 26.0, 37.0, 44.0, 85.0, 127.0, 256.0, 718.0, 4646.0, 170367.0, 858652.0, 11389.0, 1217.0, 367.0, 146.0, 99.0, 62.0, 45.0, 31.0, 24.0, 20.0, 19.0, 12.0, 9.0, 5.0, 8.0, 5.0, 5.0, 4.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15478515625, -0.14981842041015625, -0.1448516845703125, -0.13988494873046875, -0.134918212890625, -0.12995147705078125, -0.1249847412109375, -0.12001800537109375, -0.11505126953125, -0.11008453369140625, -0.1051177978515625, -0.10015106201171875, -0.095184326171875, -0.09021759033203125, -0.0852508544921875, -0.08028411865234375, -0.0753173828125, -0.07035064697265625, -0.0653839111328125, -0.06041717529296875, -0.055450439453125, -0.05048370361328125, -0.0455169677734375, -0.04055023193359375, -0.03558349609375, -0.03061676025390625, -0.0256500244140625, -0.02068328857421875, -0.015716552734375, -0.01074981689453125, -0.0057830810546875, -0.00081634521484375, 0.004150390625, 0.00911712646484375, 0.0140838623046875, 0.01905059814453125, 0.024017333984375, 0.02898406982421875, 0.0339508056640625, 0.03891754150390625, 0.04388427734375, 0.04885101318359375, 0.0538177490234375, 0.05878448486328125, 0.063751220703125, 0.06871795654296875, 0.0736846923828125, 0.07865142822265625, 0.0836181640625, 0.08858489990234375, 0.0935516357421875, 0.09851837158203125, 0.103485107421875, 0.10845184326171875, 0.1134185791015625, 0.11838531494140625, 0.12335205078125, 0.12831878662109375, 0.1332855224609375, 0.13825225830078125, 0.143218994140625, 0.14818572998046875, 0.1531524658203125, 0.15811920166015625, 0.1630859375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 7.0, 25.0, 72.0, 235.0, 398.0, 168.0, 66.0, 21.0, 11.0, 10.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00669793039560318, -0.005446131341159344, -0.0041943322867155075, -0.0029425336979329586, -0.0016907346434891224, -0.0004389355890452862, 0.0008128629997372627, 0.002064662054181099, 0.003316461108624935, 0.004568260163068771, 0.005820059217512608, 0.0070718578062951565, 0.008323656395077705, 0.009575456380844116, 0.010827254503965378, 0.012079053558409214, 0.01333085261285305, 0.014582651667296886, 0.015834450721740723, 0.017086248844861984, 0.018338048830628395, 0.019589846953749657, 0.020841646939516068, 0.02209344506263733, 0.02334524318575859, 0.024597041308879852, 0.025848841294646263, 0.027100639417767525, 0.028352439403533936, 0.029604237526655197, 0.03085603564977646, 0.03210783749818802, 0.03335963562130928, 0.03461143374443054, 0.035863231867551804, 0.037115033715963364, 0.038366831839084625, 0.03961862996220589, 0.04087042808532715, 0.04212222993373871, 0.04337402805685997, 0.04462582617998123, 0.04587762430310249, 0.04712942615151405, 0.048381224274635315, 0.04963302239775658, 0.05088482052087784, 0.0521366223692894, 0.05338841676712036, 0.05464021489024162, 0.055892013013362885, 0.057143814861774445, 0.058395612984895706, 0.05964741110801697, 0.06089920923113823, 0.06215100735425949, 0.06340280920267105, 0.06465461105108261, 0.06590640544891357, 0.06715820729732513, 0.0684100016951561, 0.06966180354356766, 0.07091360539197922, 0.07216539978981018, 0.07341720163822174]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 7.0, 9.0, 11.0, 24.0, 31.0, 34.0, 31.0, 42.0, 46.0, 45.0, 67.0, 69.0, 88.0, 60.0, 43.0, 62.0, 56.0, 59.0, 47.0, 33.0, 30.0, 27.0, 19.0, 12.0, 13.0, 7.0, 9.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007668793201446533, -0.007420984096825123, -0.0071731749922037125, -0.006925365887582302, -0.006677556782960892, -0.006429747678339481, -0.006181938573718071, -0.005934129469096661, -0.00568632036447525, -0.00543851125985384, -0.0051907021552324295, -0.004942893050611019, -0.004695083945989609, -0.004447274841368198, -0.004199465736746788, -0.003951656632125378, -0.0037038475275039673, -0.003456038422882557, -0.0032082293182611465, -0.002960420213639736, -0.002712611109018326, -0.0024648020043969154, -0.002216992899775505, -0.0019691837951540947, -0.0017213746905326843, -0.001473565585911274, -0.0012257564812898636, -0.0009779473766684532, -0.0007301382720470428, -0.0004823291674256325, -0.0002345200628042221, 1.3289041817188263e-05, 0.00026109814643859863, 0.000508907251060009, 0.0007567163556814194, 0.0010045254603028297, 0.0012523345649242401, 0.0015001436695456505, 0.0017479527741670609, 0.0019957618787884712, 0.0022435709834098816, 0.002491380088031292, 0.0027391891926527023, 0.0029869982972741127, 0.003234807401895523, 0.0034826165065169334, 0.003730425611138344, 0.003978234715759754, 0.0042260438203811646, 0.004473852925002575, 0.004721662029623985, 0.004969471134245396, 0.005217280238866806, 0.005465089343488216, 0.005712898448109627, 0.005960707552731037, 0.0062085166573524475, 0.006456325761973858, 0.006704134866595268, 0.006951943971216679, 0.007199753075838089, 0.007447562180459499, 0.00769537128508091, 0.00794318038970232, 0.00819098949432373]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 11.0, 10.0, 9.0, 19.0, 15.0, 11.0, 15.0, 23.0, 24.0, 25.0, 25.0, 32.0, 28.0, 34.0, 43.0, 45.0, 39.0, 38.0, 41.0, 42.0, 49.0, 39.0, 38.0, 29.0, 26.0, 30.0, 24.0, 23.0, 23.0, 32.0, 21.0, 21.0, 18.0, 13.0, 17.0, 9.0, 10.0, 9.0, 9.0, 8.0, 7.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5, -6.313720703125, -6.12744140625, -5.941162109375, -5.7548828125, -5.568603515625, -5.38232421875, -5.196044921875, -5.009765625, -4.823486328125, -4.63720703125, -4.450927734375, -4.2646484375, -4.078369140625, -3.89208984375, -3.705810546875, -3.51953125, -3.333251953125, -3.14697265625, -2.960693359375, -2.7744140625, -2.588134765625, -2.40185546875, -2.215576171875, -2.029296875, -1.843017578125, -1.65673828125, -1.470458984375, -1.2841796875, -1.097900390625, -0.91162109375, -0.725341796875, -0.5390625, -0.352783203125, -0.16650390625, 0.019775390625, 0.2060546875, 0.392333984375, 0.57861328125, 0.764892578125, 0.951171875, 1.137451171875, 1.32373046875, 1.510009765625, 1.6962890625, 1.882568359375, 2.06884765625, 2.255126953125, 2.44140625, 2.627685546875, 2.81396484375, 3.000244140625, 3.1865234375, 3.372802734375, 3.55908203125, 3.745361328125, 3.931640625, 4.117919921875, 4.30419921875, 4.490478515625, 4.6767578125, 4.863037109375, 5.04931640625, 5.235595703125, 5.421875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 6.0, 6.0, 8.0, 9.0, 15.0, 23.0, 24.0, 20.0, 47.0, 54.0, 61.0, 84.0, 119.0, 176.0, 210.0, 312.0, 415.0, 676.0, 1206.0, 2967.0, 10404.0, 41301.0, 292434.0, 608940.0, 65514.0, 15233.0, 4260.0, 1537.0, 774.0, 437.0, 302.0, 205.0, 176.0, 148.0, 107.0, 97.0, 71.0, 45.0, 42.0, 23.0, 20.0, 14.0, 11.0, 12.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.359375, -15.8939208984375, -15.428466796875, -14.9630126953125, -14.49755859375, -14.0321044921875, -13.566650390625, -13.1011962890625, -12.6357421875, -12.1702880859375, -11.704833984375, -11.2393798828125, -10.77392578125, -10.3084716796875, -9.843017578125, -9.3775634765625, -8.912109375, -8.4466552734375, -7.981201171875, -7.5157470703125, -7.05029296875, -6.5848388671875, -6.119384765625, -5.6539306640625, -5.1884765625, -4.7230224609375, -4.257568359375, -3.7921142578125, -3.32666015625, -2.8612060546875, -2.395751953125, -1.9302978515625, -1.46484375, -0.9993896484375, -0.533935546875, -0.0684814453125, 0.39697265625, 0.8624267578125, 1.327880859375, 1.7933349609375, 2.2587890625, 2.7242431640625, 3.189697265625, 3.6551513671875, 4.12060546875, 4.5860595703125, 5.051513671875, 5.5169677734375, 5.982421875, 6.4478759765625, 6.913330078125, 7.3787841796875, 7.84423828125, 8.3096923828125, 8.775146484375, 9.2406005859375, 9.7060546875, 10.1715087890625, 10.636962890625, 11.1024169921875, 11.56787109375, 12.0333251953125, 12.498779296875, 12.9642333984375, 13.4296875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 2.0, 7.0, 11.0, 5.0, 14.0, 9.0, 8.0, 17.0, 25.0, 26.0, 27.0, 35.0, 45.0, 36.0, 49.0, 54.0, 67.0, 95.0, 169.0, 1474.0, 327.0, 110.0, 64.0, 54.0, 51.0, 45.0, 27.0, 32.0, 31.0, 24.0, 26.0, 12.0, 13.0, 11.0, 13.0, 7.0, 10.0, 2.0, 4.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-22.859375, -22.219970703125, -21.58056640625, -20.941162109375, -20.3017578125, -19.662353515625, -19.02294921875, -18.383544921875, -17.744140625, -17.104736328125, -16.46533203125, -15.825927734375, -15.1865234375, -14.547119140625, -13.90771484375, -13.268310546875, -12.62890625, -11.989501953125, -11.35009765625, -10.710693359375, -10.0712890625, -9.431884765625, -8.79248046875, -8.153076171875, -7.513671875, -6.874267578125, -6.23486328125, -5.595458984375, -4.9560546875, -4.316650390625, -3.67724609375, -3.037841796875, -2.3984375, -1.759033203125, -1.11962890625, -0.480224609375, 0.1591796875, 0.798583984375, 1.43798828125, 2.077392578125, 2.716796875, 3.356201171875, 3.99560546875, 4.635009765625, 5.2744140625, 5.913818359375, 6.55322265625, 7.192626953125, 7.83203125, 8.471435546875, 9.11083984375, 9.750244140625, 10.3896484375, 11.029052734375, 11.66845703125, 12.307861328125, 12.947265625, 13.586669921875, 14.22607421875, 14.865478515625, 15.5048828125, 16.144287109375, 16.78369140625, 17.423095703125, 18.0625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 9.0, 8.0, 16.0, 12.0, 18.0, 17.0, 22.0, 40.0, 44.0, 37.0, 63.0, 79.0, 121.0, 246.0, 439.0, 1258.0, 9873.0, 2861951.0, 265418.0, 4144.0, 781.0, 358.0, 189.0, 136.0, 89.0, 84.0, 49.0, 33.0, 33.0, 22.0, 19.0, 16.0, 16.0, 15.0, 6.0, 5.0, 8.0, 5.0, 7.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.71875, -47.029296875, -45.33984375, -43.650390625, -41.9609375, -40.271484375, -38.58203125, -36.892578125, -35.203125, -33.513671875, -31.82421875, -30.134765625, -28.4453125, -26.755859375, -25.06640625, -23.376953125, -21.6875, -19.998046875, -18.30859375, -16.619140625, -14.9296875, -13.240234375, -11.55078125, -9.861328125, -8.171875, -6.482421875, -4.79296875, -3.103515625, -1.4140625, 0.275390625, 1.96484375, 3.654296875, 5.34375, 7.033203125, 8.72265625, 10.412109375, 12.1015625, 13.791015625, 15.48046875, 17.169921875, 18.859375, 20.548828125, 22.23828125, 23.927734375, 25.6171875, 27.306640625, 28.99609375, 30.685546875, 32.375, 34.064453125, 35.75390625, 37.443359375, 39.1328125, 40.822265625, 42.51171875, 44.201171875, 45.890625, 47.580078125, 49.26953125, 50.958984375, 52.6484375, 54.337890625, 56.02734375, 57.716796875, 59.40625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 14.0, 286.0, 595.0, 116.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.23345947265625, -217.005859375, -212.77825927734375, -208.5506591796875, -204.3230438232422, -200.09544372558594, -195.8678436279297, -191.64024353027344, -187.4126434326172, -183.18504333496094, -178.9574432373047, -174.72982788085938, -170.50222778320312, -166.27462768554688, -162.04702758789062, -157.81942749023438, -153.59182739257812, -149.36422729492188, -145.13662719726562, -140.90902709960938, -136.68141174316406, -132.4538116455078, -128.22621154785156, -123.99861145019531, -119.77099609375, -115.54339599609375, -111.31578826904297, -107.08818817138672, -102.86058807373047, -98.63298034667969, -94.40538024902344, -90.17778015136719, -85.9501953125, -81.72259521484375, -77.49498748779297, -73.26738739013672, -69.03978729248047, -64.81217956542969, -60.58457946777344, -56.35697937011719, -52.129371643066406, -47.90176773071289, -43.67416763305664, -39.446563720703125, -35.218963623046875, -30.99135971069336, -26.763755798339844, -22.53615379333496, -18.308551788330078, -14.080949783325195, -9.853346824645996, -5.625743865966797, -1.398141860961914, 2.8294601440429688, 7.057064056396484, 11.284666061401367, 15.51226806640625, 19.739870071411133, 23.967472076416016, 28.19507598876953, 32.42267608642578, 36.6502799987793, 40.87788391113281, 45.10548400878906, 49.33308792114258]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 9.0, 11.0, 14.0, 12.0, 11.0, 25.0, 19.0, 35.0, 19.0, 37.0, 43.0, 63.0, 43.0, 41.0, 37.0, 44.0, 55.0, 49.0, 43.0, 44.0, 41.0, 51.0, 46.0, 42.0, 28.0, 30.0, 18.0, 19.0, 18.0, 15.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.21122360229492, -50.403079986572266, -48.594940185546875, -46.78679656982422, -44.97865295410156, -43.17051315307617, -41.362369537353516, -39.554229736328125, -37.74608612060547, -35.93794250488281, -34.12980270385742, -32.321659088134766, -30.513517379760742, -28.70537567138672, -26.897232055664062, -25.08909034729004, -23.280948638916016, -21.472806930541992, -19.66466522216797, -17.856521606445312, -16.04837989807129, -14.240238189697266, -12.432095527648926, -10.623952865600586, -8.815811157226562, -7.007668972015381, -5.199526786804199, -3.3913846015930176, -1.583242416381836, 0.2248992919921875, 2.0330419540405273, 3.841184616088867, 5.649322509765625, 7.457464694976807, 9.265606880187988, 11.073749542236328, 12.881891250610352, 14.690032958984375, 16.49817657470703, 18.306318283081055, 20.114459991455078, 21.9226016998291, 23.730743408203125, 25.53888702392578, 27.347028732299805, 29.155170440673828, 30.963314056396484, 32.771453857421875, 34.57959747314453, 36.38774108886719, 38.19588088989258, 40.004024505615234, 41.812164306640625, 43.62030792236328, 45.42845153808594, 47.236595153808594, 49.044734954833984, 50.85287857055664, 52.66101837158203, 54.46916198730469, 56.277305603027344, 58.085445404052734, 59.89358901977539, 61.70172882080078, 63.50987243652344]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 5.0, 8.0, 6.0, 9.0, 9.0, 10.0, 16.0, 15.0, 18.0, 29.0, 22.0, 16.0, 18.0, 34.0, 21.0, 24.0, 33.0, 38.0, 42.0, 42.0, 47.0, 62.0, 36.0, 47.0, 44.0, 41.0, 29.0, 39.0, 30.0, 17.0, 25.0, 25.0, 21.0, 18.0, 17.0, 23.0, 10.0, 13.0, 11.0, 9.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.58984375, -6.3924560546875, -6.195068359375, -5.9976806640625, -5.80029296875, -5.6029052734375, -5.405517578125, -5.2081298828125, -5.0107421875, -4.8133544921875, -4.615966796875, -4.4185791015625, -4.22119140625, -4.0238037109375, -3.826416015625, -3.6290283203125, -3.431640625, -3.2342529296875, -3.036865234375, -2.8394775390625, -2.64208984375, -2.4447021484375, -2.247314453125, -2.0499267578125, -1.8525390625, -1.6551513671875, -1.457763671875, -1.2603759765625, -1.06298828125, -0.8656005859375, -0.668212890625, -0.4708251953125, -0.2734375, -0.0760498046875, 0.121337890625, 0.3187255859375, 0.51611328125, 0.7135009765625, 0.910888671875, 1.1082763671875, 1.3056640625, 1.5030517578125, 1.700439453125, 1.8978271484375, 2.09521484375, 2.2926025390625, 2.489990234375, 2.6873779296875, 2.884765625, 3.0821533203125, 3.279541015625, 3.4769287109375, 3.67431640625, 3.8717041015625, 4.069091796875, 4.2664794921875, 4.4638671875, 4.6612548828125, 4.858642578125, 5.0560302734375, 5.25341796875, 5.4508056640625, 5.648193359375, 5.8455810546875, 6.04296875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 10.0, 8.0, 12.0, 14.0, 19.0, 18.0, 42.0, 40.0, 48.0, 59.0, 76.0, 93.0, 147.0, 224.0, 409.0, 776.0, 2276.0, 9103.0, 46540.0, 267588.0, 1178495.0, 1839140.0, 682570.0, 135108.0, 23542.0, 4980.0, 1373.0, 587.0, 290.0, 164.0, 134.0, 84.0, 70.0, 44.0, 42.0, 35.0, 31.0, 27.0, 16.0, 11.0, 8.0, 11.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6015625, -8.317626953125, -8.03369140625, -7.749755859375, -7.4658203125, -7.181884765625, -6.89794921875, -6.614013671875, -6.330078125, -6.046142578125, -5.76220703125, -5.478271484375, -5.1943359375, -4.910400390625, -4.62646484375, -4.342529296875, -4.05859375, -3.774658203125, -3.49072265625, -3.206787109375, -2.9228515625, -2.638916015625, -2.35498046875, -2.071044921875, -1.787109375, -1.503173828125, -1.21923828125, -0.935302734375, -0.6513671875, -0.367431640625, -0.08349609375, 0.200439453125, 0.484375, 0.768310546875, 1.05224609375, 1.336181640625, 1.6201171875, 1.904052734375, 2.18798828125, 2.471923828125, 2.755859375, 3.039794921875, 3.32373046875, 3.607666015625, 3.8916015625, 4.175537109375, 4.45947265625, 4.743408203125, 5.02734375, 5.311279296875, 5.59521484375, 5.879150390625, 6.1630859375, 6.447021484375, 6.73095703125, 7.014892578125, 7.298828125, 7.582763671875, 7.86669921875, 8.150634765625, 8.4345703125, 8.718505859375, 9.00244140625, 9.286376953125, 9.5703125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 8.0, 4.0, 5.0, 9.0, 13.0, 12.0, 22.0, 21.0, 32.0, 74.0, 84.0, 126.0, 140.0, 205.0, 257.0, 375.0, 410.0, 459.0, 410.0, 365.0, 290.0, 214.0, 151.0, 112.0, 80.0, 55.0, 34.0, 26.0, 24.0, 17.0, 13.0, 11.0, 5.0, 1.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.3436279296875, -7.031005859375, -6.7183837890625, -6.40576171875, -6.0931396484375, -5.780517578125, -5.4678955078125, -5.1552734375, -4.8426513671875, -4.530029296875, -4.2174072265625, -3.90478515625, -3.5921630859375, -3.279541015625, -2.9669189453125, -2.654296875, -2.3416748046875, -2.029052734375, -1.7164306640625, -1.40380859375, -1.0911865234375, -0.778564453125, -0.4659423828125, -0.1533203125, 0.1593017578125, 0.471923828125, 0.7845458984375, 1.09716796875, 1.4097900390625, 1.722412109375, 2.0350341796875, 2.34765625, 2.6602783203125, 2.972900390625, 3.2855224609375, 3.59814453125, 3.9107666015625, 4.223388671875, 4.5360107421875, 4.8486328125, 5.1612548828125, 5.473876953125, 5.7864990234375, 6.09912109375, 6.4117431640625, 6.724365234375, 7.0369873046875, 7.349609375, 7.6622314453125, 7.974853515625, 8.2874755859375, 8.60009765625, 8.9127197265625, 9.225341796875, 9.5379638671875, 9.8505859375, 10.1632080078125, 10.475830078125, 10.7884521484375, 11.10107421875, 11.4136962890625, 11.726318359375, 12.0389404296875, 12.3515625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 14.0, 10.0, 16.0, 35.0, 46.0, 58.0, 89.0, 139.0, 198.0, 423.0, 770.0, 2319.0, 20513.0, 719004.0, 3310294.0, 130855.0, 6820.0, 1290.0, 550.0, 319.0, 167.0, 125.0, 66.0, 48.0, 39.0, 19.0, 15.0, 13.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-35.0, -34.131103515625, -33.26220703125, -32.393310546875, -31.5244140625, -30.655517578125, -29.78662109375, -28.917724609375, -28.048828125, -27.179931640625, -26.31103515625, -25.442138671875, -24.5732421875, -23.704345703125, -22.83544921875, -21.966552734375, -21.09765625, -20.228759765625, -19.35986328125, -18.490966796875, -17.6220703125, -16.753173828125, -15.88427734375, -15.015380859375, -14.146484375, -13.277587890625, -12.40869140625, -11.539794921875, -10.6708984375, -9.802001953125, -8.93310546875, -8.064208984375, -7.1953125, -6.326416015625, -5.45751953125, -4.588623046875, -3.7197265625, -2.850830078125, -1.98193359375, -1.113037109375, -0.244140625, 0.624755859375, 1.49365234375, 2.362548828125, 3.2314453125, 4.100341796875, 4.96923828125, 5.838134765625, 6.70703125, 7.575927734375, 8.44482421875, 9.313720703125, 10.1826171875, 11.051513671875, 11.92041015625, 12.789306640625, 13.658203125, 14.527099609375, 15.39599609375, 16.264892578125, 17.1337890625, 18.002685546875, 18.87158203125, 19.740478515625, 20.609375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 329.0, 684.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-605.7996826171875, -591.0722045898438, -576.3446655273438, -561.6171875, -546.8897094726562, -532.1622314453125, -517.4346923828125, -502.70721435546875, -487.9797058105469, -473.252197265625, -458.52471923828125, -443.7972106933594, -429.0697021484375, -414.34222412109375, -399.6147155761719, -384.88720703125, -370.15972900390625, -355.4322204589844, -340.7047424316406, -325.97723388671875, -311.249755859375, -296.5222473144531, -281.79473876953125, -267.0672607421875, -252.33975219726562, -237.6122589111328, -222.884765625, -208.15725708007812, -193.4297637939453, -178.7022705078125, -163.97476196289062, -149.2472686767578, -134.519775390625, -119.79228210449219, -105.06478118896484, -90.3372802734375, -75.60978698730469, -60.882293701171875, -46.15479278564453, -31.427291870117188, -16.699798583984375, -1.9723014831542969, 12.755195617675781, 27.48269271850586, 42.21018981933594, 56.93768310546875, 71.6651840209961, 86.39268493652344, 101.12017822265625, 115.84767150878906, 130.57516479492188, 145.30267333984375, 160.03016662597656, 174.75765991210938, 189.48516845703125, 204.21266174316406, 218.94015502929688, 233.6676483154297, 248.3951416015625, 263.1226501464844, 277.85015869140625, 292.57763671875, 307.3051452636719, 322.03265380859375, 336.7601318359375]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 9.0, 12.0, 7.0, 12.0, 14.0, 16.0, 25.0, 22.0, 22.0, 25.0, 29.0, 30.0, 40.0, 34.0, 30.0, 34.0, 34.0, 48.0, 45.0, 37.0, 45.0, 43.0, 35.0, 38.0, 50.0, 32.0, 33.0, 31.0, 16.0, 24.0, 20.0, 17.0, 18.0, 14.0, 11.0, 10.0, 11.0, 10.0, 10.0, 3.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.876346588134766, -27.870195388793945, -26.864046096801758, -25.857894897460938, -24.85174560546875, -23.84559440612793, -22.83944320678711, -21.833293914794922, -20.8271427154541, -19.82099151611328, -18.814842224121094, -17.808691024780273, -16.802539825439453, -15.796390533447266, -14.790239334106445, -13.784089088439941, -12.777938842773438, -11.771788597106934, -10.76563835144043, -9.75948715209961, -8.753336906433105, -7.747186660766602, -6.7410359382629395, -5.734885215759277, -4.728734970092773, -3.7225844860076904, -2.7164340019226074, -1.7102835178375244, -0.7041330337524414, 0.3020172119140625, 1.3081679344177246, 2.3143186569213867, 3.320465087890625, 4.326615333557129, 5.332766056060791, 6.338916778564453, 7.345067024230957, 8.351217269897461, 9.357368469238281, 10.363518714904785, 11.369668960571289, 12.375819206237793, 13.381969451904297, 14.388120651245117, 15.394270896911621, 16.400421142578125, 17.406572341918945, 18.412723541259766, 19.418872833251953, 20.425024032592773, 21.43117332458496, 22.43732452392578, 23.44347381591797, 24.44962501525879, 25.45577621459961, 26.461925506591797, 27.468076705932617, 28.474227905273438, 29.480377197265625, 30.486528396606445, 31.492679595947266, 32.49882888793945, 33.50497817993164, 34.511131286621094, 35.51728057861328]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 11.0, 8.0, 8.0, 18.0, 20.0, 13.0, 26.0, 25.0, 28.0, 42.0, 34.0, 35.0, 40.0, 40.0, 38.0, 55.0, 50.0, 40.0, 53.0, 44.0, 36.0, 45.0, 28.0, 45.0, 29.0, 38.0, 24.0, 29.0, 15.0, 19.0, 7.0, 11.0, 9.0, 6.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.71875, -6.49993896484375, -6.2811279296875, -6.06231689453125, -5.843505859375, -5.62469482421875, -5.4058837890625, -5.18707275390625, -4.96826171875, -4.74945068359375, -4.5306396484375, -4.31182861328125, -4.093017578125, -3.87420654296875, -3.6553955078125, -3.43658447265625, -3.2177734375, -2.99896240234375, -2.7801513671875, -2.56134033203125, -2.342529296875, -2.12371826171875, -1.9049072265625, -1.68609619140625, -1.46728515625, -1.24847412109375, -1.0296630859375, -0.81085205078125, -0.592041015625, -0.37322998046875, -0.1544189453125, 0.06439208984375, 0.283203125, 0.50201416015625, 0.7208251953125, 0.93963623046875, 1.158447265625, 1.37725830078125, 1.5960693359375, 1.81488037109375, 2.03369140625, 2.25250244140625, 2.4713134765625, 2.69012451171875, 2.908935546875, 3.12774658203125, 3.3465576171875, 3.56536865234375, 3.7841796875, 4.00299072265625, 4.2218017578125, 4.44061279296875, 4.659423828125, 4.87823486328125, 5.0970458984375, 5.31585693359375, 5.53466796875, 5.75347900390625, 5.9722900390625, 6.19110107421875, 6.409912109375, 6.62872314453125, 6.8475341796875, 7.06634521484375, 7.28515625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 9.0, 15.0, 22.0, 28.0, 49.0, 68.0, 113.0, 174.0, 286.0, 464.0, 746.0, 1229.0, 1850.0, 2913.0, 4627.0, 7404.0, 11850.0, 19040.0, 29898.0, 46491.0, 71525.0, 106126.0, 146748.0, 167317.0, 141422.0, 101117.0, 67736.0, 44067.0, 27799.0, 17298.0, 11134.0, 7100.0, 4392.0, 2749.0, 1758.0, 1083.0, 685.0, 444.0, 275.0, 171.0, 124.0, 76.0, 47.0, 30.0, 21.0, 11.0, 9.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.473876953125, -0.460113525390625, -0.44635009765625, -0.432586669921875, -0.4188232421875, -0.405059814453125, -0.39129638671875, -0.377532958984375, -0.36376953125, -0.350006103515625, -0.33624267578125, -0.322479248046875, -0.3087158203125, -0.294952392578125, -0.28118896484375, -0.267425537109375, -0.253662109375, -0.239898681640625, -0.22613525390625, -0.212371826171875, -0.1986083984375, -0.184844970703125, -0.17108154296875, -0.157318115234375, -0.1435546875, -0.129791259765625, -0.11602783203125, -0.102264404296875, -0.0885009765625, -0.074737548828125, -0.06097412109375, -0.047210693359375, -0.033447265625, -0.019683837890625, -0.00592041015625, 0.007843017578125, 0.0216064453125, 0.035369873046875, 0.04913330078125, 0.062896728515625, 0.07666015625, 0.090423583984375, 0.10418701171875, 0.117950439453125, 0.1317138671875, 0.145477294921875, 0.15924072265625, 0.173004150390625, 0.186767578125, 0.200531005859375, 0.21429443359375, 0.228057861328125, 0.2418212890625, 0.255584716796875, 0.26934814453125, 0.283111572265625, 0.296875, 0.310638427734375, 0.32440185546875, 0.338165283203125, 0.3519287109375, 0.365692138671875, 0.37945556640625, 0.393218994140625, 0.406982421875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 5.0, 9.0, 3.0, 13.0, 11.0, 8.0, 15.0, 15.0, 16.0, 30.0, 28.0, 27.0, 27.0, 30.0, 31.0, 48.0, 45.0, 39.0, 39.0, 30.0, 1056.0, 38.0, 33.0, 37.0, 33.0, 35.0, 30.0, 38.0, 28.0, 33.0, 31.0, 23.0, 19.0, 25.0, 22.0, 15.0, 13.0, 10.0, 7.0, 6.0, 3.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-4.04296875, -3.921783447265625, -3.80059814453125, -3.679412841796875, -3.5582275390625, -3.437042236328125, -3.31585693359375, -3.194671630859375, -3.073486328125, -2.952301025390625, -2.83111572265625, -2.709930419921875, -2.5887451171875, -2.467559814453125, -2.34637451171875, -2.225189208984375, -2.10400390625, -1.982818603515625, -1.86163330078125, -1.740447998046875, -1.6192626953125, -1.498077392578125, -1.37689208984375, -1.255706787109375, -1.134521484375, -1.013336181640625, -0.89215087890625, -0.770965576171875, -0.6497802734375, -0.528594970703125, -0.40740966796875, -0.286224365234375, -0.1650390625, -0.043853759765625, 0.07733154296875, 0.198516845703125, 0.3197021484375, 0.440887451171875, 0.56207275390625, 0.683258056640625, 0.804443359375, 0.925628662109375, 1.04681396484375, 1.167999267578125, 1.2891845703125, 1.410369873046875, 1.53155517578125, 1.652740478515625, 1.77392578125, 1.895111083984375, 2.01629638671875, 2.137481689453125, 2.2586669921875, 2.379852294921875, 2.50103759765625, 2.622222900390625, 2.743408203125, 2.864593505859375, 2.98577880859375, 3.106964111328125, 3.2281494140625, 3.349334716796875, 3.47052001953125, 3.591705322265625, 3.712890625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 13.0, 18.0, 30.0, 41.0, 51.0, 79.0, 123.0, 196.0, 270.0, 368.0, 559.0, 833.0, 1285.0, 1907.0, 2931.0, 4464.0, 7107.0, 11147.0, 16985.0, 26391.0, 40390.0, 60532.0, 86290.0, 117769.0, 372354.0, 957161.0, 119350.0, 88278.0, 61316.0, 41393.0, 27288.0, 17607.0, 11420.0, 7306.0, 4767.0, 3086.0, 2016.0, 1379.0, 831.0, 564.0, 370.0, 255.0, 189.0, 127.0, 86.0, 58.0, 47.0, 32.0, 22.0, 16.0, 13.0, 14.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.301513671875, -0.2921028137207031, -0.28269195556640625, -0.2732810974121094, -0.2638702392578125, -0.2544593811035156, -0.24504852294921875, -0.23563766479492188, -0.226226806640625, -0.21681594848632812, -0.20740509033203125, -0.19799423217773438, -0.1885833740234375, -0.17917251586914062, -0.16976165771484375, -0.16035079956054688, -0.15093994140625, -0.14152908325195312, -0.13211822509765625, -0.12270736694335938, -0.1132965087890625, -0.10388565063476562, -0.09447479248046875, -0.08506393432617188, -0.075653076171875, -0.06624221801757812, -0.05683135986328125, -0.047420501708984375, -0.0380096435546875, -0.028598785400390625, -0.01918792724609375, -0.009777069091796875, -0.0003662109375, 0.009044647216796875, 0.01845550537109375, 0.027866363525390625, 0.0372772216796875, 0.046688079833984375, 0.05609893798828125, 0.06550979614257812, 0.074920654296875, 0.08433151245117188, 0.09374237060546875, 0.10315322875976562, 0.1125640869140625, 0.12197494506835938, 0.13138580322265625, 0.14079666137695312, 0.15020751953125, 0.15961837768554688, 0.16902923583984375, 0.17844009399414062, 0.1878509521484375, 0.19726181030273438, 0.20667266845703125, 0.21608352661132812, 0.225494384765625, 0.23490524291992188, 0.24431610107421875, 0.2537269592285156, 0.2631378173828125, 0.2725486755371094, 0.28195953369140625, 0.2913703918457031, 0.30078125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 5.0, 7.0, 7.0, 14.0, 10.0, 7.0, 18.0, 32.0, 45.0, 49.0, 66.0, 115.0, 117.0, 136.0, 96.0, 74.0, 51.0, 37.0, 30.0, 26.0, 8.0, 22.0, 10.0, 9.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014404296875, -0.013982295989990234, -0.013560295104980469, -0.013138294219970703, -0.012716293334960938, -0.012294292449951172, -0.011872291564941406, -0.01145029067993164, -0.011028289794921875, -0.01060628890991211, -0.010184288024902344, -0.009762287139892578, -0.009340286254882812, -0.008918285369873047, -0.008496284484863281, -0.008074283599853516, -0.00765228271484375, -0.007230281829833984, -0.006808280944824219, -0.006386280059814453, -0.0059642791748046875, -0.005542278289794922, -0.005120277404785156, -0.004698276519775391, -0.004276275634765625, -0.0038542747497558594, -0.0034322738647460938, -0.003010272979736328, -0.0025882720947265625, -0.002166271209716797, -0.0017442703247070312, -0.0013222694396972656, -0.0009002685546875, -0.0004782676696777344, -5.626678466796875e-05, 0.0003657341003417969, 0.0007877349853515625, 0.0012097358703613281, 0.0016317367553710938, 0.0020537376403808594, 0.002475738525390625, 0.0028977394104003906, 0.0033197402954101562, 0.003741741180419922, 0.0041637420654296875, 0.004585742950439453, 0.005007743835449219, 0.005429744720458984, 0.00585174560546875, 0.006273746490478516, 0.006695747375488281, 0.007117748260498047, 0.0075397491455078125, 0.007961750030517578, 0.008383750915527344, 0.00880575180053711, 0.009227752685546875, 0.00964975357055664, 0.010071754455566406, 0.010493755340576172, 0.010915756225585938, 0.011337757110595703, 0.011759757995605469, 0.012181758880615234, 0.012603759765625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 12.0, 15.0, 14.0, 21.0, 54.0, 57.0, 109.0, 145.0, 367.0, 1920.0, 984249.0, 60214.0, 708.0, 280.0, 141.0, 85.0, 55.0, 25.0, 26.0, 17.0, 14.0, 9.0, 6.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2685546875, -0.25954437255859375, -0.2505340576171875, -0.24152374267578125, -0.232513427734375, -0.22350311279296875, -0.2144927978515625, -0.20548248291015625, -0.19647216796875, -0.18746185302734375, -0.1784515380859375, -0.16944122314453125, -0.160430908203125, -0.15142059326171875, -0.1424102783203125, -0.13339996337890625, -0.1243896484375, -0.11537933349609375, -0.1063690185546875, -0.09735870361328125, -0.088348388671875, -0.07933807373046875, -0.0703277587890625, -0.06131744384765625, -0.05230712890625, -0.04329681396484375, -0.0342864990234375, -0.02527618408203125, -0.016265869140625, -0.00725555419921875, 0.0017547607421875, 0.01076507568359375, 0.019775390625, 0.02878570556640625, 0.0377960205078125, 0.04680633544921875, 0.055816650390625, 0.06482696533203125, 0.0738372802734375, 0.08284759521484375, 0.09185791015625, 0.10086822509765625, 0.1098785400390625, 0.11888885498046875, 0.127899169921875, 0.13690948486328125, 0.1459197998046875, 0.15493011474609375, 0.1639404296875, 0.17295074462890625, 0.1819610595703125, 0.19097137451171875, 0.199981689453125, 0.20899200439453125, 0.2180023193359375, 0.22701263427734375, 0.23602294921875, 0.24503326416015625, 0.2540435791015625, 0.26305389404296875, 0.272064208984375, 0.28107452392578125, 0.2900848388671875, 0.29909515380859375, 0.30810546875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 8.0, 35.0, 115.0, 400.0, 310.0, 104.0, 27.0, 10.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007931796833872795, -0.006773454137146473, -0.0056151109747588634, -0.004456767812371254, -0.003298425115644932, -0.0021400824189186096, -0.0009817392565310001, 0.00017660390585660934, 0.0013349466025829315, 0.0024932895321398973, 0.003651632461696863, 0.004809975624084473, 0.005968318320810795, 0.007126661017537117, 0.008285004645586014, 0.009443347342312336, 0.010601690039038658, 0.01176003273576498, 0.012918375432491302, 0.0140767190605402, 0.015235061757266521, 0.016393404453992844, 0.01755174808204174, 0.018710091710090637, 0.019868433475494385, 0.02102677710354328, 0.02218511886894703, 0.023343462496995926, 0.024501804262399673, 0.02566014789044857, 0.026818491518497467, 0.027976833283901215, 0.029135175049304962, 0.03029351867735386, 0.031451862305402756, 0.0326102040708065, 0.03376854583621025, 0.0349268913269043, 0.036085233092308044, 0.03724357485771179, 0.03840191662311554, 0.03956025838851929, 0.04071860387921333, 0.04187694564461708, 0.04303528741002083, 0.044193632900714874, 0.04535197466611862, 0.04651031643152237, 0.047668661922216415, 0.04882700368762016, 0.04998534917831421, 0.05114369094371796, 0.052302032709121704, 0.05346037447452545, 0.0546187199652195, 0.055777061730623245, 0.05693540722131729, 0.05809374898672104, 0.059252094477415085, 0.06041043624281883, 0.06156877800822258, 0.06272712349891663, 0.06388546526432037, 0.06504380702972412, 0.06620214879512787]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 1.0, 10.0, 15.0, 12.0, 15.0, 22.0, 25.0, 32.0, 48.0, 45.0, 47.0, 54.0, 57.0, 49.0, 62.0, 36.0, 76.0, 50.0, 42.0, 48.0, 39.0, 45.0, 39.0, 19.0, 28.0, 20.0, 16.0, 14.0, 17.0, 4.0, 4.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008097052574157715, -0.007872756570577621, -0.007648460566997528, -0.007424164563417435, -0.007199868559837341, -0.006975572556257248, -0.0067512765526771545, -0.006526980549097061, -0.006302684545516968, -0.006078388541936874, -0.005854092538356781, -0.005629796534776688, -0.005405500531196594, -0.005181204527616501, -0.0049569085240364075, -0.004732612520456314, -0.004508316516876221, -0.004284020513296127, -0.004059724509716034, -0.0038354285061359406, -0.003611132502555847, -0.003386836498975754, -0.0031625404953956604, -0.002938244491815567, -0.0027139484882354736, -0.0024896524846553802, -0.002265356481075287, -0.0020410604774951935, -0.0018167644739151, -0.0015924684703350067, -0.0013681724667549133, -0.00114387646317482, -0.0009195804595947266, -0.0006952844560146332, -0.0004709884524345398, -0.0002466924488544464, -2.2396445274353027e-05, 0.00020189955830574036, 0.00042619556188583374, 0.0006504915654659271, 0.0008747875690460205, 0.001099083572626114, 0.0013233795762062073, 0.0015476755797863007, 0.001771971583366394, 0.0019962675869464874, 0.002220563590526581, 0.002444859594106674, 0.0026691555976867676, 0.002893451601266861, 0.0031177476048469543, 0.0033420436084270477, 0.003566339612007141, 0.0037906356155872345, 0.004014931619167328, 0.004239227622747421, 0.004463523626327515, 0.004687819629907608, 0.004912115633487701, 0.005136411637067795, 0.005360707640647888, 0.005585003644227982, 0.005809299647808075, 0.006033595651388168, 0.006257891654968262]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 11.0, 8.0, 8.0, 18.0, 20.0, 13.0, 26.0, 26.0, 27.0, 42.0, 34.0, 35.0, 40.0, 40.0, 37.0, 56.0, 50.0, 40.0, 53.0, 44.0, 36.0, 45.0, 28.0, 45.0, 29.0, 38.0, 24.0, 29.0, 15.0, 19.0, 7.0, 11.0, 9.0, 6.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.71875, -6.49993896484375, -6.2811279296875, -6.06231689453125, -5.843505859375, -5.62469482421875, -5.4058837890625, -5.18707275390625, -4.96826171875, -4.74945068359375, -4.5306396484375, -4.31182861328125, -4.093017578125, -3.87420654296875, -3.6553955078125, -3.43658447265625, -3.2177734375, -2.99896240234375, -2.7801513671875, -2.56134033203125, -2.342529296875, -2.12371826171875, -1.9049072265625, -1.68609619140625, -1.46728515625, -1.24847412109375, -1.0296630859375, -0.81085205078125, -0.592041015625, -0.37322998046875, -0.1544189453125, 0.06439208984375, 0.283203125, 0.50201416015625, 0.7208251953125, 0.93963623046875, 1.158447265625, 1.37725830078125, 1.5960693359375, 1.81488037109375, 2.03369140625, 2.25250244140625, 2.4713134765625, 2.69012451171875, 2.908935546875, 3.12774658203125, 3.3465576171875, 3.56536865234375, 3.7841796875, 4.00299072265625, 4.2218017578125, 4.44061279296875, 4.659423828125, 4.87823486328125, 5.0970458984375, 5.31585693359375, 5.53466796875, 5.75347900390625, 5.9722900390625, 6.19110107421875, 6.409912109375, 6.62872314453125, 6.8475341796875, 7.06634521484375, 7.28515625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 6.0, 16.0, 9.0, 15.0, 16.0, 22.0, 32.0, 40.0, 64.0, 57.0, 97.0, 135.0, 188.0, 330.0, 521.0, 985.0, 1830.0, 3897.0, 8801.0, 20368.0, 46377.0, 108496.0, 263245.0, 332166.0, 148972.0, 61813.0, 27604.0, 11605.0, 5236.0, 2497.0, 1181.0, 711.0, 416.0, 261.0, 174.0, 105.0, 80.0, 49.0, 39.0, 22.0, 19.0, 18.0, 13.0, 5.0, 8.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1484375, -6.9034423828125, -6.658447265625, -6.4134521484375, -6.16845703125, -5.9234619140625, -5.678466796875, -5.4334716796875, -5.1884765625, -4.9434814453125, -4.698486328125, -4.4534912109375, -4.20849609375, -3.9635009765625, -3.718505859375, -3.4735107421875, -3.228515625, -2.9835205078125, -2.738525390625, -2.4935302734375, -2.24853515625, -2.0035400390625, -1.758544921875, -1.5135498046875, -1.2685546875, -1.0235595703125, -0.778564453125, -0.5335693359375, -0.28857421875, -0.0435791015625, 0.201416015625, 0.4464111328125, 0.69140625, 0.9364013671875, 1.181396484375, 1.4263916015625, 1.67138671875, 1.9163818359375, 2.161376953125, 2.4063720703125, 2.6513671875, 2.8963623046875, 3.141357421875, 3.3863525390625, 3.63134765625, 3.8763427734375, 4.121337890625, 4.3663330078125, 4.611328125, 4.8563232421875, 5.101318359375, 5.3463134765625, 5.59130859375, 5.8363037109375, 6.081298828125, 6.3262939453125, 6.5712890625, 6.8162841796875, 7.061279296875, 7.3062744140625, 7.55126953125, 7.7962646484375, 8.041259765625, 8.2862548828125, 8.53125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 6.0, 12.0, 11.0, 14.0, 13.0, 13.0, 18.0, 18.0, 26.0, 35.0, 31.0, 31.0, 53.0, 48.0, 58.0, 65.0, 141.0, 261.0, 1418.0, 216.0, 112.0, 65.0, 49.0, 41.0, 40.0, 43.0, 35.0, 23.0, 32.0, 22.0, 23.0, 15.0, 9.0, 9.0, 4.0, 9.0, 9.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.21875, -18.62353515625, -18.0283203125, -17.43310546875, -16.837890625, -16.24267578125, -15.6474609375, -15.05224609375, -14.45703125, -13.86181640625, -13.2666015625, -12.67138671875, -12.076171875, -11.48095703125, -10.8857421875, -10.29052734375, -9.6953125, -9.10009765625, -8.5048828125, -7.90966796875, -7.314453125, -6.71923828125, -6.1240234375, -5.52880859375, -4.93359375, -4.33837890625, -3.7431640625, -3.14794921875, -2.552734375, -1.95751953125, -1.3623046875, -0.76708984375, -0.171875, 0.42333984375, 1.0185546875, 1.61376953125, 2.208984375, 2.80419921875, 3.3994140625, 3.99462890625, 4.58984375, 5.18505859375, 5.7802734375, 6.37548828125, 6.970703125, 7.56591796875, 8.1611328125, 8.75634765625, 9.3515625, 9.94677734375, 10.5419921875, 11.13720703125, 11.732421875, 12.32763671875, 12.9228515625, 13.51806640625, 14.11328125, 14.70849609375, 15.3037109375, 15.89892578125, 16.494140625, 17.08935546875, 17.6845703125, 18.27978515625, 18.875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 12.0, 13.0, 20.0, 24.0, 22.0, 42.0, 74.0, 73.0, 120.0, 211.0, 348.0, 499.0, 1018.0, 6615.0, 249525.0, 2828794.0, 53685.0, 2560.0, 777.0, 451.0, 252.0, 157.0, 99.0, 85.0, 51.0, 38.0, 31.0, 22.0, 15.0, 9.0, 6.0, 9.0, 8.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-35.375, -34.2802734375, -33.185546875, -32.0908203125, -30.99609375, -29.9013671875, -28.806640625, -27.7119140625, -26.6171875, -25.5224609375, -24.427734375, -23.3330078125, -22.23828125, -21.1435546875, -20.048828125, -18.9541015625, -17.859375, -16.7646484375, -15.669921875, -14.5751953125, -13.48046875, -12.3857421875, -11.291015625, -10.1962890625, -9.1015625, -8.0068359375, -6.912109375, -5.8173828125, -4.72265625, -3.6279296875, -2.533203125, -1.4384765625, -0.34375, 0.7509765625, 1.845703125, 2.9404296875, 4.03515625, 5.1298828125, 6.224609375, 7.3193359375, 8.4140625, 9.5087890625, 10.603515625, 11.6982421875, 12.79296875, 13.8876953125, 14.982421875, 16.0771484375, 17.171875, 18.2666015625, 19.361328125, 20.4560546875, 21.55078125, 22.6455078125, 23.740234375, 24.8349609375, 25.9296875, 27.0244140625, 28.119140625, 29.2138671875, 30.30859375, 31.4033203125, 32.498046875, 33.5927734375, 34.6875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 89.0, 913.0, 16.0, 1.0], "bins": [-675.0516357421875, -664.0450439453125, -653.0384521484375, -642.0318603515625, -631.0252685546875, -620.0186767578125, -609.0120849609375, -598.0054931640625, -586.9988403320312, -575.9922485351562, -564.9856567382812, -553.9790649414062, -542.9724731445312, -531.9658813476562, -520.959228515625, -509.9526672363281, -498.94610595703125, -487.93951416015625, -476.93292236328125, -465.92633056640625, -454.9197082519531, -443.9131164550781, -432.9065246582031, -421.8999328613281, -410.893310546875, -399.88671875, -388.880126953125, -377.87353515625, -366.8669128417969, -355.8603210449219, -344.8537292480469, -333.8471374511719, -322.8405456542969, -311.8339538574219, -300.8273620605469, -289.82073974609375, -278.81414794921875, -267.80755615234375, -256.80096435546875, -245.79437255859375, -234.78778076171875, -223.78118896484375, -212.7745819091797, -201.7679901123047, -190.7613983154297, -179.75479125976562, -168.74819946289062, -157.74160766601562, -146.73500061035156, -135.72840881347656, -124.72180938720703, -113.7152099609375, -102.7086181640625, -91.70201873779297, -80.69541931152344, -69.68882751464844, -58.682228088378906, -47.67563247680664, -36.669036865234375, -25.662437438964844, -14.655841827392578, -3.6492462158203125, 7.357353210449219, 18.36394500732422, 29.37054443359375]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 8.0, 2.0, 6.0, 10.0, 8.0, 8.0, 8.0, 10.0, 15.0, 15.0, 12.0, 15.0, 23.0, 19.0, 24.0, 30.0, 29.0, 35.0, 36.0, 35.0, 39.0, 36.0, 43.0, 47.0, 37.0, 42.0, 39.0, 44.0, 24.0, 31.0, 21.0, 24.0, 21.0, 32.0, 27.0, 23.0, 25.0, 23.0, 6.0, 11.0, 10.0, 10.0, 11.0, 12.0, 3.0, 5.0, 1.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.55262756347656, -36.398128509521484, -35.243629455566406, -34.089134216308594, -32.934635162353516, -31.780136108398438, -30.62563705444336, -29.47113800048828, -28.316640853881836, -27.162141799926758, -26.007644653320312, -24.853145599365234, -23.698646545410156, -22.54414939880371, -21.389650344848633, -20.235153198242188, -19.08065414428711, -17.92615509033203, -16.771657943725586, -15.617158889770508, -14.462660789489746, -13.308162689208984, -12.153663635253906, -10.999165534973145, -9.844667434692383, -8.690169334411621, -7.535670757293701, -6.381172180175781, -5.2266740798950195, -4.072175979614258, -2.917677402496338, -1.763178825378418, -0.6086807250976562, 0.5458176136016846, 1.7003159523010254, 2.854814291000366, 4.009312629699707, 5.163810729980469, 6.318309307098389, 7.472807884216309, 8.62730598449707, 9.781804084777832, 10.936302185058594, 12.090801239013672, 13.245299339294434, 14.399797439575195, 15.554296493530273, 16.70879364013672, 17.863292694091797, 19.017791748046875, 20.17228889465332, 21.3267879486084, 22.481285095214844, 23.635784149169922, 24.790283203125, 25.944782257080078, 27.099279403686523, 28.2537784576416, 29.408275604248047, 30.562774658203125, 31.717273712158203, 32.87177276611328, 34.026268005371094, 35.18076705932617, 36.33526611328125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0, 3.0, 4.0, 11.0, 12.0, 12.0, 24.0, 17.0, 16.0, 13.0, 33.0, 26.0, 41.0, 42.0, 31.0, 39.0, 57.0, 35.0, 48.0, 45.0, 58.0, 55.0, 40.0, 36.0, 43.0, 34.0, 39.0, 37.0, 24.0, 28.0, 15.0, 16.0, 16.0, 14.0, 10.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.04296875, -6.818359375, -6.59375, -6.369140625, -6.14453125, -5.919921875, -5.6953125, -5.470703125, -5.24609375, -5.021484375, -4.796875, -4.572265625, -4.34765625, -4.123046875, -3.8984375, -3.673828125, -3.44921875, -3.224609375, -3.0, -2.775390625, -2.55078125, -2.326171875, -2.1015625, -1.876953125, -1.65234375, -1.427734375, -1.203125, -0.978515625, -0.75390625, -0.529296875, -0.3046875, -0.080078125, 0.14453125, 0.369140625, 0.59375, 0.818359375, 1.04296875, 1.267578125, 1.4921875, 1.716796875, 1.94140625, 2.166015625, 2.390625, 2.615234375, 2.83984375, 3.064453125, 3.2890625, 3.513671875, 3.73828125, 3.962890625, 4.1875, 4.412109375, 4.63671875, 4.861328125, 5.0859375, 5.310546875, 5.53515625, 5.759765625, 5.984375, 6.208984375, 6.43359375, 6.658203125, 6.8828125, 7.107421875, 7.33203125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 12.0, 17.0, 26.0, 33.0, 46.0, 69.0, 118.0, 179.0, 301.0, 535.0, 924.0, 1949.0, 4692.0, 13532.0, 44970.0, 163864.0, 575764.0, 1429234.0, 1282797.0, 481655.0, 136660.0, 37866.0, 11351.0, 4000.0, 1709.0, 815.0, 420.0, 266.0, 151.0, 120.0, 70.0, 49.0, 27.0, 13.0, 15.0, 13.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.42578125, -6.20361328125, -5.9814453125, -5.75927734375, -5.537109375, -5.31494140625, -5.0927734375, -4.87060546875, -4.6484375, -4.42626953125, -4.2041015625, -3.98193359375, -3.759765625, -3.53759765625, -3.3154296875, -3.09326171875, -2.87109375, -2.64892578125, -2.4267578125, -2.20458984375, -1.982421875, -1.76025390625, -1.5380859375, -1.31591796875, -1.09375, -0.87158203125, -0.6494140625, -0.42724609375, -0.205078125, 0.01708984375, 0.2392578125, 0.46142578125, 0.68359375, 0.90576171875, 1.1279296875, 1.35009765625, 1.572265625, 1.79443359375, 2.0166015625, 2.23876953125, 2.4609375, 2.68310546875, 2.9052734375, 3.12744140625, 3.349609375, 3.57177734375, 3.7939453125, 4.01611328125, 4.23828125, 4.46044921875, 4.6826171875, 4.90478515625, 5.126953125, 5.34912109375, 5.5712890625, 5.79345703125, 6.015625, 6.23779296875, 6.4599609375, 6.68212890625, 6.904296875, 7.12646484375, 7.3486328125, 7.57080078125, 7.79296875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 4.0, 8.0, 14.0, 13.0, 19.0, 24.0, 43.0, 38.0, 50.0, 74.0, 94.0, 122.0, 196.0, 265.0, 298.0, 369.0, 375.0, 375.0, 332.0, 314.0, 237.0, 190.0, 139.0, 99.0, 96.0, 59.0, 41.0, 32.0, 30.0, 23.0, 14.0, 9.0, 11.0, 10.0, 9.0, 7.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0], "bins": [-7.71484375, -7.46588134765625, -7.2169189453125, -6.96795654296875, -6.718994140625, -6.47003173828125, -6.2210693359375, -5.97210693359375, -5.72314453125, -5.47418212890625, -5.2252197265625, -4.97625732421875, -4.727294921875, -4.47833251953125, -4.2293701171875, -3.98040771484375, -3.7314453125, -3.48248291015625, -3.2335205078125, -2.98455810546875, -2.735595703125, -2.48663330078125, -2.2376708984375, -1.98870849609375, -1.73974609375, -1.49078369140625, -1.2418212890625, -0.99285888671875, -0.743896484375, -0.49493408203125, -0.2459716796875, 0.00299072265625, 0.251953125, 0.50091552734375, 0.7498779296875, 0.99884033203125, 1.247802734375, 1.49676513671875, 1.7457275390625, 1.99468994140625, 2.24365234375, 2.49261474609375, 2.7415771484375, 2.99053955078125, 3.239501953125, 3.48846435546875, 3.7374267578125, 3.98638916015625, 4.2353515625, 4.48431396484375, 4.7332763671875, 4.98223876953125, 5.231201171875, 5.48016357421875, 5.7291259765625, 5.97808837890625, 6.22705078125, 6.47601318359375, 6.7249755859375, 6.97393798828125, 7.222900390625, 7.47186279296875, 7.7208251953125, 7.96978759765625, 8.21875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 1.0, 11.0, 11.0, 4.0, 17.0, 16.0, 19.0, 13.0, 27.0, 40.0, 58.0, 68.0, 93.0, 124.0, 229.0, 380.0, 685.0, 1363.0, 3162.0, 8377.0, 25775.0, 100474.0, 505938.0, 2125541.0, 1139479.0, 209888.0, 48563.0, 14597.0, 4994.0, 2020.0, 969.0, 484.0, 281.0, 174.0, 118.0, 80.0, 45.0, 42.0, 36.0, 15.0, 19.0, 6.0, 10.0, 7.0, 4.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.444091796875, -11.08349609375, -10.722900390625, -10.3623046875, -10.001708984375, -9.64111328125, -9.280517578125, -8.919921875, -8.559326171875, -8.19873046875, -7.838134765625, -7.4775390625, -7.116943359375, -6.75634765625, -6.395751953125, -6.03515625, -5.674560546875, -5.31396484375, -4.953369140625, -4.5927734375, -4.232177734375, -3.87158203125, -3.510986328125, -3.150390625, -2.789794921875, -2.42919921875, -2.068603515625, -1.7080078125, -1.347412109375, -0.98681640625, -0.626220703125, -0.265625, 0.094970703125, 0.45556640625, 0.816162109375, 1.1767578125, 1.537353515625, 1.89794921875, 2.258544921875, 2.619140625, 2.979736328125, 3.34033203125, 3.700927734375, 4.0615234375, 4.422119140625, 4.78271484375, 5.143310546875, 5.50390625, 5.864501953125, 6.22509765625, 6.585693359375, 6.9462890625, 7.306884765625, 7.66748046875, 8.028076171875, 8.388671875, 8.749267578125, 9.10986328125, 9.470458984375, 9.8310546875, 10.191650390625, 10.55224609375, 10.912841796875, 11.2734375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 93.0, 452.0, 400.0, 63.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.30988311767578, -67.13794708251953, -60.96601104736328, -54.7940788269043, -48.62214279174805, -42.4502067565918, -36.27827453613281, -30.106338500976562, -23.934402465820312, -17.762466430664062, -11.590532302856445, -5.418598175048828, 0.7533378601074219, 6.925273895263672, 13.097206115722656, 19.269142150878906, 25.441078186035156, 31.613014221191406, 37.784950256347656, 43.95688247680664, 50.12881851196289, 56.30075454711914, 62.472686767578125, 68.64462280273438, 74.81655883789062, 80.98849487304688, 87.16043090820312, 93.33236694335938, 99.50430297851562, 105.67623901367188, 111.8481674194336, 118.02010345458984, 124.19204711914062, 130.36398315429688, 136.53591918945312, 142.70785522460938, 148.87979125976562, 155.05172729492188, 161.22366333007812, 167.39559936523438, 173.56753540039062, 179.73947143554688, 185.91140747070312, 192.08334350585938, 198.25527954101562, 204.42721557617188, 210.59915161132812, 216.77108764648438, 222.94300842285156, 229.1149444580078, 235.28688049316406, 241.4588165283203, 247.63075256347656, 253.8026885986328, 259.974609375, 266.14654541015625, 272.3184814453125, 278.49041748046875, 284.662353515625, 290.83428955078125, 297.0062255859375, 303.17816162109375, 309.35009765625, 315.52203369140625, 321.6939697265625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 4.0, 8.0, 3.0, 12.0, 17.0, 13.0, 15.0, 24.0, 28.0, 31.0, 22.0, 40.0, 35.0, 50.0, 41.0, 47.0, 38.0, 42.0, 37.0, 28.0, 44.0, 48.0, 34.0, 39.0, 35.0, 42.0, 23.0, 32.0, 20.0, 22.0, 17.0, 17.0, 11.0, 17.0, 12.0, 10.0, 6.0, 6.0, 3.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.025562286376953, -30.02846336364746, -29.03136444091797, -28.034263610839844, -27.03716468811035, -26.04006576538086, -25.042966842651367, -24.045867919921875, -23.04876708984375, -22.051668167114258, -21.054569244384766, -20.05746841430664, -19.06036949157715, -18.063270568847656, -17.066171646118164, -16.069072723388672, -15.071972846984863, -14.074873924255371, -13.077774047851562, -12.08067512512207, -11.083575248718262, -10.08647632598877, -9.089376449584961, -8.092277526855469, -7.095178127288818, -6.098078727722168, -5.100979328155518, -4.103879928588867, -3.106780767440796, -2.1096816062927246, -1.1125822067260742, -0.11548280715942383, 0.8816165924072266, 1.878715991973877, 2.8758153915405273, 3.8729145526885986, 4.870014190673828, 5.86711311340332, 6.864212512969971, 7.861311912536621, 8.85841178894043, 9.855510711669922, 10.85261058807373, 11.849709510803223, 12.846809387207031, 13.843908309936523, 14.841007232666016, 15.838107109069824, 16.835205078125, 17.832304000854492, 18.829402923583984, 19.82650375366211, 20.8236026763916, 21.820701599121094, 22.817800521850586, 23.814899444580078, 24.812000274658203, 25.809099197387695, 26.806198120117188, 27.803298950195312, 28.800397872924805, 29.797496795654297, 30.79459571838379, 31.79169464111328, 32.788795471191406]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 8.0, 7.0, 13.0, 7.0, 15.0, 16.0, 24.0, 10.0, 15.0, 27.0, 17.0, 35.0, 27.0, 33.0, 41.0, 44.0, 47.0, 41.0, 31.0, 48.0, 50.0, 38.0, 35.0, 47.0, 47.0, 34.0, 34.0, 22.0, 20.0, 30.0, 22.0, 21.0, 22.0, 17.0, 7.0, 5.0, 9.0, 9.0, 7.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.97265625, -6.7708740234375, -6.569091796875, -6.3673095703125, -6.16552734375, -5.9637451171875, -5.761962890625, -5.5601806640625, -5.3583984375, -5.1566162109375, -4.954833984375, -4.7530517578125, -4.55126953125, -4.3494873046875, -4.147705078125, -3.9459228515625, -3.744140625, -3.5423583984375, -3.340576171875, -3.1387939453125, -2.93701171875, -2.7352294921875, -2.533447265625, -2.3316650390625, -2.1298828125, -1.9281005859375, -1.726318359375, -1.5245361328125, -1.32275390625, -1.1209716796875, -0.919189453125, -0.7174072265625, -0.515625, -0.3138427734375, -0.112060546875, 0.0897216796875, 0.29150390625, 0.4932861328125, 0.695068359375, 0.8968505859375, 1.0986328125, 1.3004150390625, 1.502197265625, 1.7039794921875, 1.90576171875, 2.1075439453125, 2.309326171875, 2.5111083984375, 2.712890625, 2.9146728515625, 3.116455078125, 3.3182373046875, 3.52001953125, 3.7218017578125, 3.923583984375, 4.1253662109375, 4.3271484375, 4.5289306640625, 4.730712890625, 4.9324951171875, 5.13427734375, 5.3360595703125, 5.537841796875, 5.7396240234375, 5.94140625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 13.0, 8.0, 18.0, 30.0, 39.0, 48.0, 83.0, 150.0, 225.0, 276.0, 509.0, 781.0, 1143.0, 1996.0, 3146.0, 5337.0, 8862.0, 15539.0, 26050.0, 45374.0, 78734.0, 132832.0, 197858.0, 200118.0, 136516.0, 80502.0, 46545.0, 26836.0, 15694.0, 9122.0, 5510.0, 3254.0, 1947.0, 1291.0, 750.0, 521.0, 313.0, 197.0, 135.0, 68.0, 64.0, 42.0, 27.0, 20.0, 13.0, 6.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61181640625, -0.5914382934570312, -0.5710601806640625, -0.5506820678710938, -0.530303955078125, -0.5099258422851562, -0.4895477294921875, -0.46916961669921875, -0.44879150390625, -0.42841339111328125, -0.4080352783203125, -0.38765716552734375, -0.367279052734375, -0.34690093994140625, -0.3265228271484375, -0.30614471435546875, -0.2857666015625, -0.26538848876953125, -0.2450103759765625, -0.22463226318359375, -0.204254150390625, -0.18387603759765625, -0.1634979248046875, -0.14311981201171875, -0.12274169921875, -0.10236358642578125, -0.0819854736328125, -0.06160736083984375, -0.041229248046875, -0.02085113525390625, -0.0004730224609375, 0.01990509033203125, 0.040283203125, 0.06066131591796875, 0.0810394287109375, 0.10141754150390625, 0.121795654296875, 0.14217376708984375, 0.1625518798828125, 0.18292999267578125, 0.20330810546875, 0.22368621826171875, 0.2440643310546875, 0.26444244384765625, 0.284820556640625, 0.30519866943359375, 0.3255767822265625, 0.34595489501953125, 0.3663330078125, 0.38671112060546875, 0.4070892333984375, 0.42746734619140625, 0.447845458984375, 0.46822357177734375, 0.4886016845703125, 0.5089797973632812, 0.52935791015625, 0.5497360229492188, 0.5701141357421875, 0.5904922485351562, 0.610870361328125, 0.6312484741210938, 0.6516265869140625, 0.6720046997070312, 0.6923828125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 5.0, 12.0, 10.0, 9.0, 21.0, 16.0, 29.0, 13.0, 19.0, 14.0, 24.0, 25.0, 23.0, 34.0, 34.0, 41.0, 33.0, 51.0, 32.0, 1063.0, 29.0, 42.0, 48.0, 39.0, 33.0, 37.0, 24.0, 34.0, 22.0, 27.0, 32.0, 20.0, 16.0, 14.0, 24.0, 23.0, 7.0, 12.0, 8.0, 11.0, 6.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.62890625, -3.50250244140625, -3.3760986328125, -3.24969482421875, -3.123291015625, -2.99688720703125, -2.8704833984375, -2.74407958984375, -2.61767578125, -2.49127197265625, -2.3648681640625, -2.23846435546875, -2.112060546875, -1.98565673828125, -1.8592529296875, -1.73284912109375, -1.6064453125, -1.48004150390625, -1.3536376953125, -1.22723388671875, -1.100830078125, -0.97442626953125, -0.8480224609375, -0.72161865234375, -0.59521484375, -0.46881103515625, -0.3424072265625, -0.21600341796875, -0.089599609375, 0.03680419921875, 0.1632080078125, 0.28961181640625, 0.416015625, 0.54241943359375, 0.6688232421875, 0.79522705078125, 0.921630859375, 1.04803466796875, 1.1744384765625, 1.30084228515625, 1.42724609375, 1.55364990234375, 1.6800537109375, 1.80645751953125, 1.932861328125, 2.05926513671875, 2.1856689453125, 2.31207275390625, 2.4384765625, 2.56488037109375, 2.6912841796875, 2.81768798828125, 2.944091796875, 3.07049560546875, 3.1968994140625, 3.32330322265625, 3.44970703125, 3.57611083984375, 3.7025146484375, 3.82891845703125, 3.955322265625, 4.08172607421875, 4.2081298828125, 4.33453369140625, 4.4609375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 10.0, 19.0, 24.0, 39.0, 58.0, 79.0, 141.0, 198.0, 338.0, 581.0, 957.0, 1710.0, 3211.0, 5826.0, 11436.0, 21989.0, 43405.0, 81401.0, 143960.0, 937950.0, 535517.0, 141475.0, 79137.0, 42027.0, 21575.0, 10917.0, 5721.0, 3122.0, 1757.0, 974.0, 626.0, 363.0, 213.0, 132.0, 87.0, 55.0, 27.0, 21.0, 16.0, 11.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.49658203125, -0.48055267333984375, -0.4645233154296875, -0.44849395751953125, -0.432464599609375, -0.41643524169921875, -0.4004058837890625, -0.38437652587890625, -0.36834716796875, -0.35231781005859375, -0.3362884521484375, -0.32025909423828125, -0.304229736328125, -0.28820037841796875, -0.2721710205078125, -0.25614166259765625, -0.2401123046875, -0.22408294677734375, -0.2080535888671875, -0.19202423095703125, -0.175994873046875, -0.15996551513671875, -0.1439361572265625, -0.12790679931640625, -0.11187744140625, -0.09584808349609375, -0.0798187255859375, -0.06378936767578125, -0.047760009765625, -0.03173065185546875, -0.0157012939453125, 0.00032806396484375, 0.016357421875, 0.03238677978515625, 0.0484161376953125, 0.06444549560546875, 0.080474853515625, 0.09650421142578125, 0.1125335693359375, 0.12856292724609375, 0.14459228515625, 0.16062164306640625, 0.1766510009765625, 0.19268035888671875, 0.208709716796875, 0.22473907470703125, 0.2407684326171875, 0.25679779052734375, 0.2728271484375, 0.28885650634765625, 0.3048858642578125, 0.32091522216796875, 0.336944580078125, 0.35297393798828125, 0.3690032958984375, 0.38503265380859375, 0.40106201171875, 0.41709136962890625, 0.4331207275390625, 0.44915008544921875, 0.465179443359375, 0.48120880126953125, 0.4972381591796875, 0.5132675170898438, 0.529296875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 5.0, 7.0, 7.0, 10.0, 11.0, 12.0, 14.0, 21.0, 30.0, 24.0, 24.0, 41.0, 36.0, 61.0, 75.0, 88.0, 101.0, 80.0, 53.0, 41.0, 35.0, 41.0, 21.0, 30.0, 13.0, 13.0, 10.0, 12.0, 6.0, 10.0, 12.0, 12.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0152587890625, -0.014785528182983398, -0.014312267303466797, -0.013839006423950195, -0.013365745544433594, -0.012892484664916992, -0.01241922378540039, -0.011945962905883789, -0.011472702026367188, -0.010999441146850586, -0.010526180267333984, -0.010052919387817383, -0.009579658508300781, -0.00910639762878418, -0.008633136749267578, -0.008159875869750977, -0.007686614990234375, -0.0072133541107177734, -0.006740093231201172, -0.00626683235168457, -0.005793571472167969, -0.005320310592651367, -0.004847049713134766, -0.004373788833618164, -0.0039005279541015625, -0.003427267074584961, -0.0029540061950683594, -0.002480745315551758, -0.0020074844360351562, -0.0015342235565185547, -0.0010609626770019531, -0.0005877017974853516, -0.00011444091796875, 0.00035881996154785156, 0.0008320808410644531, 0.0013053417205810547, 0.0017786026000976562, 0.002251863479614258, 0.0027251243591308594, 0.003198385238647461, 0.0036716461181640625, 0.004144906997680664, 0.004618167877197266, 0.005091428756713867, 0.005564689636230469, 0.00603795051574707, 0.006511211395263672, 0.0069844722747802734, 0.007457733154296875, 0.007930994033813477, 0.008404254913330078, 0.00887751579284668, 0.009350776672363281, 0.009824037551879883, 0.010297298431396484, 0.010770559310913086, 0.011243820190429688, 0.011717081069946289, 0.01219034194946289, 0.012663602828979492, 0.013136863708496094, 0.013610124588012695, 0.014083385467529297, 0.014556646347045898, 0.0150299072265625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 4.0, 7.0, 14.0, 8.0, 9.0, 18.0, 23.0, 17.0, 31.0, 31.0, 44.0, 48.0, 88.0, 111.0, 186.0, 260.0, 421.0, 1189.0, 30338.0, 992850.0, 20453.0, 1070.0, 437.0, 229.0, 166.0, 126.0, 80.0, 70.0, 39.0, 36.0, 23.0, 24.0, 18.0, 14.0, 11.0, 8.0, 10.0, 7.0, 5.0, 8.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.305419921875, -0.2962913513183594, -0.28716278076171875, -0.2780342102050781, -0.2689056396484375, -0.2597770690917969, -0.25064849853515625, -0.24151992797851562, -0.232391357421875, -0.22326278686523438, -0.21413421630859375, -0.20500564575195312, -0.1958770751953125, -0.18674850463867188, -0.17761993408203125, -0.16849136352539062, -0.15936279296875, -0.15023422241210938, -0.14110565185546875, -0.13197708129882812, -0.1228485107421875, -0.11371994018554688, -0.10459136962890625, -0.09546279907226562, -0.086334228515625, -0.07720565795898438, -0.06807708740234375, -0.058948516845703125, -0.0498199462890625, -0.040691375732421875, -0.03156280517578125, -0.022434234619140625, -0.0133056640625, -0.004177093505859375, 0.00495147705078125, 0.014080047607421875, 0.0232086181640625, 0.032337188720703125, 0.04146575927734375, 0.050594329833984375, 0.059722900390625, 0.06885147094726562, 0.07798004150390625, 0.08710861206054688, 0.0962371826171875, 0.10536575317382812, 0.11449432373046875, 0.12362289428710938, 0.13275146484375, 0.14188003540039062, 0.15100860595703125, 0.16013717651367188, 0.1692657470703125, 0.17839431762695312, 0.18752288818359375, 0.19665145874023438, 0.205780029296875, 0.21490859985351562, 0.22403717041015625, 0.23316574096679688, 0.2422943115234375, 0.2514228820800781, 0.26055145263671875, 0.2696800231933594, 0.27880859375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 317.0, 680.0, 11.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0902738869190216, -0.08281730860471725, -0.0753607302904129, -0.06790414452552795, -0.0604475662112236, -0.05299098789691925, -0.0455344095826149, -0.03807782754302025, -0.030621249228715897, -0.023164669051766396, -0.015708088874816895, -0.008251510560512543, -0.0007949303835630417, 0.006661649793386459, 0.014118228107690811, 0.02157481014728546, 0.029031388461589813, 0.036487966775894165, 0.043944548815488815, 0.05140112712979317, 0.05885770916938782, 0.06631428748369217, 0.07377086579799652, 0.08122745156288147, 0.08868402242660522, 0.09614060074090958, 0.10359717905521393, 0.11105376482009888, 0.11851034313440323, 0.12596692144870758, 0.13342350721359253, 0.14088007807731628, 0.14833666384220123, 0.15579324960708618, 0.16324982047080994, 0.17070640623569489, 0.17816297709941864, 0.1856195628643036, 0.19307613372802734, 0.2005327194929123, 0.20798930525779724, 0.2154458910226822, 0.22290246188640594, 0.2303590476512909, 0.23781561851501465, 0.2452722042798996, 0.25272879004478455, 0.2601853609085083, 0.26764193177223206, 0.2750985026359558, 0.28255510330200195, 0.2900116741657257, 0.29746824502944946, 0.3049248456954956, 0.31238141655921936, 0.3198379874229431, 0.32729458808898926, 0.334751158952713, 0.34220775961875916, 0.3496643304824829, 0.35712090134620667, 0.3645774722099304, 0.37203407287597656, 0.3794906437397003, 0.3869472146034241]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 9.0, 4.0, 7.0, 6.0, 15.0, 21.0, 26.0, 20.0, 35.0, 28.0, 31.0, 33.0, 39.0, 51.0, 54.0, 54.0, 57.0, 57.0, 52.0, 50.0, 43.0, 41.0, 46.0, 39.0, 37.0, 27.0, 28.0, 24.0, 12.0, 9.0, 18.0, 10.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.024103105068206787, -0.023459849879145622, -0.022816594690084457, -0.022173339501023293, -0.021530084311962128, -0.020886829122900963, -0.020243573933839798, -0.019600318744778633, -0.018957063555717468, -0.018313808366656303, -0.01767055317759514, -0.017027297988533974, -0.01638404279947281, -0.015740787610411644, -0.015097532421350479, -0.014454277232289314, -0.01381102204322815, -0.013167766854166985, -0.01252451166510582, -0.011881256476044655, -0.01123800128698349, -0.010594746097922325, -0.00995149090886116, -0.009308235719799995, -0.00866498053073883, -0.008021725341677666, -0.007378470152616501, -0.006735214963555336, -0.006091959774494171, -0.005448704585433006, -0.004805449396371841, -0.004162194207310677, -0.0035189390182495117, -0.002875683829188347, -0.002232428640127182, -0.0015891734510660172, -0.0009459182620048523, -0.00030266307294368744, 0.0003405921161174774, 0.0009838473051786423, 0.0016271024942398071, 0.002270357683300972, 0.002913612872362137, 0.0035568680614233017, 0.0042001232504844666, 0.004843378439545631, 0.005486633628606796, 0.006129888817667961, 0.006773144006729126, 0.007416399195790291, 0.008059654384851456, 0.00870290957391262, 0.009346164762973785, 0.00998941995203495, 0.010632675141096115, 0.01127593033015728, 0.011919185519218445, 0.01256244070827961, 0.013205695897340775, 0.01384895108640194, 0.014492206275463104, 0.015135461464524269, 0.015778716653585434, 0.0164219718426466, 0.017065227031707764]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 3.0, 1.0, 8.0, 7.0, 13.0, 7.0, 15.0, 15.0, 25.0, 9.0, 16.0, 27.0, 17.0, 35.0, 26.0, 33.0, 42.0, 43.0, 48.0, 41.0, 30.0, 48.0, 51.0, 37.0, 36.0, 45.0, 48.0, 35.0, 34.0, 22.0, 19.0, 31.0, 21.0, 22.0, 22.0, 17.0, 7.0, 4.0, 10.0, 9.0, 7.0, 3.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.97265625, -6.77093505859375, -6.5692138671875, -6.36749267578125, -6.165771484375, -5.96405029296875, -5.7623291015625, -5.56060791015625, -5.35888671875, -5.15716552734375, -4.9554443359375, -4.75372314453125, -4.552001953125, -4.35028076171875, -4.1485595703125, -3.94683837890625, -3.7451171875, -3.54339599609375, -3.3416748046875, -3.13995361328125, -2.938232421875, -2.73651123046875, -2.5347900390625, -2.33306884765625, -2.13134765625, -1.92962646484375, -1.7279052734375, -1.52618408203125, -1.324462890625, -1.12274169921875, -0.9210205078125, -0.71929931640625, -0.517578125, -0.31585693359375, -0.1141357421875, 0.08758544921875, 0.289306640625, 0.49102783203125, 0.6927490234375, 0.89447021484375, 1.09619140625, 1.29791259765625, 1.4996337890625, 1.70135498046875, 1.903076171875, 2.10479736328125, 2.3065185546875, 2.50823974609375, 2.7099609375, 2.91168212890625, 3.1134033203125, 3.31512451171875, 3.516845703125, 3.71856689453125, 3.9202880859375, 4.12200927734375, 4.32373046875, 4.52545166015625, 4.7271728515625, 4.92889404296875, 5.130615234375, 5.33233642578125, 5.5340576171875, 5.73577880859375, 5.9375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 2.0, 3.0, 3.0, 7.0, 12.0, 13.0, 18.0, 23.0, 28.0, 29.0, 50.0, 75.0, 117.0, 148.0, 196.0, 274.0, 440.0, 748.0, 1446.0, 2991.0, 6987.0, 18107.0, 49437.0, 131053.0, 328523.0, 310810.0, 121830.0, 45725.0, 16568.0, 6647.0, 2785.0, 1328.0, 736.0, 440.0, 256.0, 185.0, 128.0, 104.0, 72.0, 53.0, 49.0, 24.0, 19.0, 29.0, 13.0, 9.0, 10.0, 2.0, 5.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2265625, -7.9425048828125, -7.658447265625, -7.3743896484375, -7.09033203125, -6.8062744140625, -6.522216796875, -6.2381591796875, -5.9541015625, -5.6700439453125, -5.385986328125, -5.1019287109375, -4.81787109375, -4.5338134765625, -4.249755859375, -3.9656982421875, -3.681640625, -3.3975830078125, -3.113525390625, -2.8294677734375, -2.54541015625, -2.2613525390625, -1.977294921875, -1.6932373046875, -1.4091796875, -1.1251220703125, -0.841064453125, -0.5570068359375, -0.27294921875, 0.0111083984375, 0.295166015625, 0.5792236328125, 0.86328125, 1.1473388671875, 1.431396484375, 1.7154541015625, 1.99951171875, 2.2835693359375, 2.567626953125, 2.8516845703125, 3.1357421875, 3.4197998046875, 3.703857421875, 3.9879150390625, 4.27197265625, 4.5560302734375, 4.840087890625, 5.1241455078125, 5.408203125, 5.6922607421875, 5.976318359375, 6.2603759765625, 6.54443359375, 6.8284912109375, 7.112548828125, 7.3966064453125, 7.6806640625, 7.9647216796875, 8.248779296875, 8.5328369140625, 8.81689453125, 9.1009521484375, 9.385009765625, 9.6690673828125, 9.953125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 12.0, 16.0, 17.0, 16.0, 20.0, 20.0, 28.0, 42.0, 33.0, 40.0, 57.0, 70.0, 103.0, 160.0, 247.0, 1392.0, 204.0, 119.0, 82.0, 49.0, 57.0, 44.0, 37.0, 30.0, 22.0, 26.0, 20.0, 13.0, 9.0, 11.0, 12.0, 4.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.75, -16.176513671875, -15.60302734375, -15.029541015625, -14.4560546875, -13.882568359375, -13.30908203125, -12.735595703125, -12.162109375, -11.588623046875, -11.01513671875, -10.441650390625, -9.8681640625, -9.294677734375, -8.72119140625, -8.147705078125, -7.57421875, -7.000732421875, -6.42724609375, -5.853759765625, -5.2802734375, -4.706787109375, -4.13330078125, -3.559814453125, -2.986328125, -2.412841796875, -1.83935546875, -1.265869140625, -0.6923828125, -0.118896484375, 0.45458984375, 1.028076171875, 1.6015625, 2.175048828125, 2.74853515625, 3.322021484375, 3.8955078125, 4.468994140625, 5.04248046875, 5.615966796875, 6.189453125, 6.762939453125, 7.33642578125, 7.909912109375, 8.4833984375, 9.056884765625, 9.63037109375, 10.203857421875, 10.77734375, 11.350830078125, 11.92431640625, 12.497802734375, 13.0712890625, 13.644775390625, 14.21826171875, 14.791748046875, 15.365234375, 15.938720703125, 16.51220703125, 17.085693359375, 17.6591796875, 18.232666015625, 18.80615234375, 19.379638671875, 19.953125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 3.0, 8.0, 5.0, 9.0, 16.0, 20.0, 26.0, 38.0, 58.0, 71.0, 121.0, 171.0, 276.0, 416.0, 851.0, 2491.0, 66719.0, 2980839.0, 88633.0, 2784.0, 807.0, 480.0, 259.0, 173.0, 137.0, 73.0, 54.0, 45.0, 32.0, 23.0, 15.0, 14.0, 12.0, 6.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-47.40625, -46.14306640625, -44.8798828125, -43.61669921875, -42.353515625, -41.09033203125, -39.8271484375, -38.56396484375, -37.30078125, -36.03759765625, -34.7744140625, -33.51123046875, -32.248046875, -30.98486328125, -29.7216796875, -28.45849609375, -27.1953125, -25.93212890625, -24.6689453125, -23.40576171875, -22.142578125, -20.87939453125, -19.6162109375, -18.35302734375, -17.08984375, -15.82666015625, -14.5634765625, -13.30029296875, -12.037109375, -10.77392578125, -9.5107421875, -8.24755859375, -6.984375, -5.72119140625, -4.4580078125, -3.19482421875, -1.931640625, -0.66845703125, 0.5947265625, 1.85791015625, 3.12109375, 4.38427734375, 5.6474609375, 6.91064453125, 8.173828125, 9.43701171875, 10.7001953125, 11.96337890625, 13.2265625, 14.48974609375, 15.7529296875, 17.01611328125, 18.279296875, 19.54248046875, 20.8056640625, 22.06884765625, 23.33203125, 24.59521484375, 25.8583984375, 27.12158203125, 28.384765625, 29.64794921875, 30.9111328125, 32.17431640625, 33.4375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 10.0, 13.0, 26.0, 90.0, 144.0, 191.0, 195.0, 167.0, 113.0, 38.0, 20.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.012578964233398, -11.406538009643555, -9.800498008728027, -8.194457054138184, -6.588416576385498, -4.9823760986328125, -3.3763351440429688, -1.7702951431274414, -0.16425418853759766, 1.4417864084243774, 3.0478270053863525, 4.653867721557617, 6.259908199310303, 7.865948677062988, 9.471989631652832, 11.07802963256836, 12.684070587158203, 14.290111541748047, 15.896151542663574, 17.502193450927734, 19.108232498168945, 20.71427345275879, 22.320314407348633, 23.926353454589844, 25.532394409179688, 27.13843536376953, 28.744476318359375, 30.35051727294922, 31.95655632019043, 33.562599182128906, 35.16864013671875, 36.77467727661133, 38.38071823120117, 39.986759185791016, 41.59280014038086, 43.1988410949707, 44.80488204956055, 46.410919189453125, 48.01696014404297, 49.62300109863281, 51.229042053222656, 52.8350830078125, 54.441123962402344, 56.04716491699219, 57.65320587158203, 59.259246826171875, 60.86528778076172, 62.4713249206543, 64.0773696899414, 65.68341064453125, 67.2894515991211, 68.89549255371094, 70.50153350830078, 72.10757446289062, 73.71361541748047, 75.31965637207031, 76.92568969726562, 78.53173065185547, 80.13777160644531, 81.74381256103516, 83.349853515625, 84.95589447021484, 86.56193542480469, 88.16797637939453, 89.77401733398438]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 10.0, 4.0, 8.0, 11.0, 10.0, 8.0, 22.0, 28.0, 16.0, 28.0, 33.0, 33.0, 33.0, 29.0, 38.0, 43.0, 41.0, 40.0, 49.0, 60.0, 39.0, 37.0, 41.0, 47.0, 37.0, 40.0, 35.0, 29.0, 26.0, 23.0, 17.0, 20.0, 15.0, 10.0, 7.0, 9.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.79722595214844, -31.507078170776367, -30.21693229675293, -28.92678451538086, -27.63663673400879, -26.34648895263672, -25.05634307861328, -23.76619529724121, -22.47604751586914, -21.18589973449707, -19.895753860473633, -18.605606079101562, -17.315458297729492, -16.025310516357422, -14.735164642333984, -13.445016860961914, -12.154870986938477, -10.864724159240723, -9.574576377868652, -8.284429550170898, -6.994282245635986, -5.704134941101074, -4.41398811340332, -3.12384033203125, -1.833693504333496, -0.5435463190078735, 0.746600866317749, 2.036747932434082, 3.326895236968994, 4.617042541503906, 5.90718936920166, 7.1973371505737305, 8.487483978271484, 9.777630805969238, 11.067778587341309, 12.357925415039062, 13.648073196411133, 14.938220024108887, 16.22836685180664, 17.51851463317871, 18.80866241455078, 20.09881019592285, 21.38895606994629, 22.67910385131836, 23.96925163269043, 25.2593994140625, 26.549545288085938, 27.839693069458008, 29.129838943481445, 30.419986724853516, 31.710132598876953, 33.000282287597656, 34.290428161621094, 35.58057403564453, 36.87071990966797, 38.16086959838867, 39.45101547241211, 40.74116134643555, 42.03131103515625, 43.32145690917969, 44.611602783203125, 45.90175247192383, 47.191898345947266, 48.48204803466797, 49.772193908691406]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 6.0, 9.0, 10.0, 7.0, 15.0, 12.0, 17.0, 30.0, 22.0, 24.0, 20.0, 39.0, 36.0, 31.0, 42.0, 40.0, 52.0, 60.0, 42.0, 48.0, 35.0, 45.0, 39.0, 48.0, 36.0, 43.0, 31.0, 34.0, 23.0, 15.0, 20.0, 15.0, 8.0, 10.0, 7.0, 8.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.97265625, -7.74774169921875, -7.5228271484375, -7.29791259765625, -7.072998046875, -6.84808349609375, -6.6231689453125, -6.39825439453125, -6.17333984375, -5.94842529296875, -5.7235107421875, -5.49859619140625, -5.273681640625, -5.04876708984375, -4.8238525390625, -4.59893798828125, -4.3740234375, -4.14910888671875, -3.9241943359375, -3.69927978515625, -3.474365234375, -3.24945068359375, -3.0245361328125, -2.79962158203125, -2.57470703125, -2.34979248046875, -2.1248779296875, -1.89996337890625, -1.675048828125, -1.45013427734375, -1.2252197265625, -1.00030517578125, -0.775390625, -0.55047607421875, -0.3255615234375, -0.10064697265625, 0.124267578125, 0.34918212890625, 0.5740966796875, 0.79901123046875, 1.02392578125, 1.24884033203125, 1.4737548828125, 1.69866943359375, 1.923583984375, 2.14849853515625, 2.3734130859375, 2.59832763671875, 2.8232421875, 3.04815673828125, 3.2730712890625, 3.49798583984375, 3.722900390625, 3.94781494140625, 4.1727294921875, 4.39764404296875, 4.62255859375, 4.84747314453125, 5.0723876953125, 5.29730224609375, 5.522216796875, 5.74713134765625, 5.9720458984375, 6.19696044921875, 6.421875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 9.0, 8.0, 14.0, 21.0, 27.0, 22.0, 49.0, 50.0, 72.0, 107.0, 161.0, 210.0, 336.0, 509.0, 4607.0, 3932556.0, 253138.0, 1032.0, 412.0, 286.0, 192.0, 127.0, 83.0, 52.0, 61.0, 28.0, 31.0, 20.0, 14.0, 17.0, 7.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.875, -54.96484375, -53.0546875, -51.14453125, -49.234375, -47.32421875, -45.4140625, -43.50390625, -41.59375, -39.68359375, -37.7734375, -35.86328125, -33.953125, -32.04296875, -30.1328125, -28.22265625, -26.3125, -24.40234375, -22.4921875, -20.58203125, -18.671875, -16.76171875, -14.8515625, -12.94140625, -11.03125, -9.12109375, -7.2109375, -5.30078125, -3.390625, -1.48046875, 0.4296875, 2.33984375, 4.25, 6.16015625, 8.0703125, 9.98046875, 11.890625, 13.80078125, 15.7109375, 17.62109375, 19.53125, 21.44140625, 23.3515625, 25.26171875, 27.171875, 29.08203125, 30.9921875, 32.90234375, 34.8125, 36.72265625, 38.6328125, 40.54296875, 42.453125, 44.36328125, 46.2734375, 48.18359375, 50.09375, 52.00390625, 53.9140625, 55.82421875, 57.734375, 59.64453125, 61.5546875, 63.46484375, 65.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 6.0, 4.0, 5.0, 7.0, 10.0, 9.0, 14.0, 17.0, 27.0, 31.0, 42.0, 59.0, 78.0, 96.0, 126.0, 193.0, 254.0, 361.0, 456.0, 516.0, 483.0, 315.0, 238.0, 179.0, 141.0, 94.0, 77.0, 62.0, 41.0, 29.0, 18.0, 19.0, 15.0, 12.0, 13.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-9.0390625, -8.7425537109375, -8.446044921875, -8.1495361328125, -7.85302734375, -7.5565185546875, -7.260009765625, -6.9635009765625, -6.6669921875, -6.3704833984375, -6.073974609375, -5.7774658203125, -5.48095703125, -5.1844482421875, -4.887939453125, -4.5914306640625, -4.294921875, -3.9984130859375, -3.701904296875, -3.4053955078125, -3.10888671875, -2.8123779296875, -2.515869140625, -2.2193603515625, -1.9228515625, -1.6263427734375, -1.329833984375, -1.0333251953125, -0.73681640625, -0.4403076171875, -0.143798828125, 0.1527099609375, 0.44921875, 0.7457275390625, 1.042236328125, 1.3387451171875, 1.63525390625, 1.9317626953125, 2.228271484375, 2.5247802734375, 2.8212890625, 3.1177978515625, 3.414306640625, 3.7108154296875, 4.00732421875, 4.3038330078125, 4.600341796875, 4.8968505859375, 5.193359375, 5.4898681640625, 5.786376953125, 6.0828857421875, 6.37939453125, 6.6759033203125, 6.972412109375, 7.2689208984375, 7.5654296875, 7.8619384765625, 8.158447265625, 8.4549560546875, 8.75146484375, 9.0479736328125, 9.344482421875, 9.6409912109375, 9.9375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 5.0, 6.0, 13.0, 13.0, 25.0, 24.0, 37.0, 47.0, 58.0, 87.0, 172.0, 301.0, 840.0, 6447.0, 173240.0, 3765867.0, 236979.0, 8299.0, 1053.0, 290.0, 172.0, 102.0, 54.0, 36.0, 28.0, 29.0, 15.0, 11.0, 7.0, 4.0, 7.0, 3.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.5625, -39.53662109375, -38.5107421875, -37.48486328125, -36.458984375, -35.43310546875, -34.4072265625, -33.38134765625, -32.35546875, -31.32958984375, -30.3037109375, -29.27783203125, -28.251953125, -27.22607421875, -26.2001953125, -25.17431640625, -24.1484375, -23.12255859375, -22.0966796875, -21.07080078125, -20.044921875, -19.01904296875, -17.9931640625, -16.96728515625, -15.94140625, -14.91552734375, -13.8896484375, -12.86376953125, -11.837890625, -10.81201171875, -9.7861328125, -8.76025390625, -7.734375, -6.70849609375, -5.6826171875, -4.65673828125, -3.630859375, -2.60498046875, -1.5791015625, -0.55322265625, 0.47265625, 1.49853515625, 2.5244140625, 3.55029296875, 4.576171875, 5.60205078125, 6.6279296875, 7.65380859375, 8.6796875, 9.70556640625, 10.7314453125, 11.75732421875, 12.783203125, 13.80908203125, 14.8349609375, 15.86083984375, 16.88671875, 17.91259765625, 18.9384765625, 19.96435546875, 20.990234375, 22.01611328125, 23.0419921875, 24.06787109375, 25.09375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 44.0, 146.0, 347.0, 342.0, 110.0, 20.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.33321380615234, -96.31324768066406, -92.29328155517578, -88.2733154296875, -84.25335693359375, -80.23339080810547, -76.21342468261719, -72.1934585571289, -68.17349243164062, -64.15352630615234, -60.13356399536133, -56.11359786987305, -52.09363555908203, -48.07366943359375, -44.05370330810547, -40.03373718261719, -36.01377868652344, -31.99381446838379, -27.97385025024414, -23.95388412475586, -19.93391990661621, -15.913955688476562, -11.893989562988281, -7.874025344848633, -3.8540611267089844, 0.16590356826782227, 4.185868263244629, 8.205833435058594, 12.225797653198242, 16.24576187133789, 20.265727996826172, 24.28569221496582, 28.305648803710938, 32.32561492919922, 36.345577239990234, 40.365543365478516, 44.38550567626953, 48.40547180175781, 52.425437927246094, 56.445404052734375, 60.46536636352539, 64.4853286743164, 68.50529479980469, 72.52526092529297, 76.54522705078125, 80.565185546875, 84.58515930175781, 88.60511779785156, 92.62508392333984, 96.64505004882812, 100.6650161743164, 104.68498229980469, 108.70494079589844, 112.72490692138672, 116.744873046875, 120.76483917236328, 124.78480529785156, 128.8047637939453, 132.82473754882812, 136.84469604492188, 140.8646697998047, 144.88462829589844, 148.90460205078125, 152.924560546875, 156.94451904296875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 8.0, 3.0, 6.0, 6.0, 6.0, 11.0, 12.0, 13.0, 11.0, 20.0, 17.0, 17.0, 27.0, 23.0, 37.0, 38.0, 34.0, 39.0, 32.0, 40.0, 51.0, 48.0, 40.0, 46.0, 39.0, 30.0, 37.0, 32.0, 38.0, 22.0, 29.0, 31.0, 29.0, 22.0, 19.0, 15.0, 10.0, 10.0, 15.0, 10.0, 7.0, 4.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-35.067378997802734, -34.06101989746094, -33.054656982421875, -32.04829788208008, -31.04193878173828, -30.03557777404785, -29.029216766357422, -28.022857666015625, -27.016498565673828, -26.0101375579834, -25.0037784576416, -23.997417449951172, -22.991058349609375, -21.984697341918945, -20.978336334228516, -19.97197723388672, -18.96561622619629, -17.95925521850586, -16.952896118164062, -15.946535110473633, -14.940176010131836, -13.933815002441406, -12.927454948425293, -11.92109489440918, -10.914734840393066, -9.908374786376953, -8.90201473236084, -7.895654201507568, -6.889294147491455, -5.882934093475342, -4.87657356262207, -3.870213508605957, -2.863851547241211, -1.857491374015808, -0.8511312007904053, 0.1552290916442871, 1.1615891456604004, 2.1679491996765137, 3.174309730529785, 4.180669784545898, 5.187029838562012, 6.193389892578125, 7.199749946594238, 8.206110000610352, 9.212471008300781, 10.218830108642578, 11.225191116333008, 12.231551170349121, 13.237911224365234, 14.244271278381348, 15.250631332397461, 16.25699234008789, 17.263351440429688, 18.269712448120117, 19.276073455810547, 20.282432556152344, 21.28879165649414, 22.29515266418457, 23.301511764526367, 24.307872772216797, 25.314231872558594, 26.320592880249023, 27.326953887939453, 28.33331298828125, 29.33967399597168]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 2.0, 3.0, 4.0, 7.0, 8.0, 4.0, 11.0, 24.0, 22.0, 18.0, 22.0, 20.0, 28.0, 29.0, 34.0, 40.0, 27.0, 39.0, 39.0, 45.0, 39.0, 39.0, 48.0, 51.0, 27.0, 47.0, 21.0, 40.0, 38.0, 25.0, 25.0, 27.0, 13.0, 15.0, 17.0, 22.0, 15.0, 14.0, 4.0, 8.0, 6.0, 7.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.19140625, -6.00732421875, -5.8232421875, -5.63916015625, -5.455078125, -5.27099609375, -5.0869140625, -4.90283203125, -4.71875, -4.53466796875, -4.3505859375, -4.16650390625, -3.982421875, -3.79833984375, -3.6142578125, -3.43017578125, -3.24609375, -3.06201171875, -2.8779296875, -2.69384765625, -2.509765625, -2.32568359375, -2.1416015625, -1.95751953125, -1.7734375, -1.58935546875, -1.4052734375, -1.22119140625, -1.037109375, -0.85302734375, -0.6689453125, -0.48486328125, -0.30078125, -0.11669921875, 0.0673828125, 0.25146484375, 0.435546875, 0.61962890625, 0.8037109375, 0.98779296875, 1.171875, 1.35595703125, 1.5400390625, 1.72412109375, 1.908203125, 2.09228515625, 2.2763671875, 2.46044921875, 2.64453125, 2.82861328125, 3.0126953125, 3.19677734375, 3.380859375, 3.56494140625, 3.7490234375, 3.93310546875, 4.1171875, 4.30126953125, 4.4853515625, 4.66943359375, 4.853515625, 5.03759765625, 5.2216796875, 5.40576171875, 5.58984375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 11.0, 15.0, 18.0, 19.0, 48.0, 59.0, 111.0, 143.0, 227.0, 322.0, 560.0, 918.0, 1390.0, 2382.0, 4100.0, 7542.0, 13533.0, 25790.0, 52634.0, 106989.0, 205060.0, 265150.0, 178736.0, 89301.0, 44297.0, 21947.0, 11680.0, 6388.0, 3564.0, 2089.0, 1350.0, 768.0, 483.0, 298.0, 222.0, 135.0, 101.0, 56.0, 24.0, 37.0, 17.0, 6.0, 15.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.91650390625, -0.8890457153320312, -0.8615875244140625, -0.8341293334960938, -0.806671142578125, -0.7792129516601562, -0.7517547607421875, -0.7242965698242188, -0.69683837890625, -0.6693801879882812, -0.6419219970703125, -0.6144638061523438, -0.587005615234375, -0.5595474243164062, -0.5320892333984375, -0.5046310424804688, -0.4771728515625, -0.44971466064453125, -0.4222564697265625, -0.39479827880859375, -0.367340087890625, -0.33988189697265625, -0.3124237060546875, -0.28496551513671875, -0.25750732421875, -0.23004913330078125, -0.2025909423828125, -0.17513275146484375, -0.147674560546875, -0.12021636962890625, -0.0927581787109375, -0.06529998779296875, -0.037841796875, -0.01038360595703125, 0.0170745849609375, 0.04453277587890625, 0.071990966796875, 0.09944915771484375, 0.1269073486328125, 0.15436553955078125, 0.18182373046875, 0.20928192138671875, 0.2367401123046875, 0.26419830322265625, 0.291656494140625, 0.31911468505859375, 0.3465728759765625, 0.37403106689453125, 0.4014892578125, 0.42894744873046875, 0.4564056396484375, 0.48386383056640625, 0.511322021484375, 0.5387802124023438, 0.5662384033203125, 0.5936965942382812, 0.62115478515625, 0.6486129760742188, 0.6760711669921875, 0.7035293579101562, 0.730987548828125, 0.7584457397460938, 0.7859039306640625, 0.8133621215820312, 0.8408203125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 3.0, 3.0, 9.0, 7.0, 12.0, 10.0, 10.0, 11.0, 19.0, 20.0, 28.0, 30.0, 27.0, 30.0, 39.0, 27.0, 35.0, 27.0, 30.0, 33.0, 34.0, 1066.0, 41.0, 35.0, 46.0, 32.0, 35.0, 31.0, 26.0, 39.0, 31.0, 27.0, 23.0, 18.0, 23.0, 19.0, 17.0, 10.0, 11.0, 6.0, 7.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0], "bins": [-3.80078125, -3.690673828125, -3.58056640625, -3.470458984375, -3.3603515625, -3.250244140625, -3.14013671875, -3.030029296875, -2.919921875, -2.809814453125, -2.69970703125, -2.589599609375, -2.4794921875, -2.369384765625, -2.25927734375, -2.149169921875, -2.0390625, -1.928955078125, -1.81884765625, -1.708740234375, -1.5986328125, -1.488525390625, -1.37841796875, -1.268310546875, -1.158203125, -1.048095703125, -0.93798828125, -0.827880859375, -0.7177734375, -0.607666015625, -0.49755859375, -0.387451171875, -0.27734375, -0.167236328125, -0.05712890625, 0.052978515625, 0.1630859375, 0.273193359375, 0.38330078125, 0.493408203125, 0.603515625, 0.713623046875, 0.82373046875, 0.933837890625, 1.0439453125, 1.154052734375, 1.26416015625, 1.374267578125, 1.484375, 1.594482421875, 1.70458984375, 1.814697265625, 1.9248046875, 2.034912109375, 2.14501953125, 2.255126953125, 2.365234375, 2.475341796875, 2.58544921875, 2.695556640625, 2.8056640625, 2.915771484375, 3.02587890625, 3.135986328125, 3.24609375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 0.0, 3.0, 4.0, 8.0, 10.0, 13.0, 37.0, 60.0, 66.0, 126.0, 198.0, 324.0, 500.0, 880.0, 1513.0, 2740.0, 5205.0, 9897.0, 19824.0, 39371.0, 78889.0, 151035.0, 1174818.0, 336206.0, 134895.0, 69003.0, 34731.0, 17167.0, 8833.0, 4675.0, 2592.0, 1449.0, 852.0, 493.0, 261.0, 161.0, 104.0, 60.0, 42.0, 28.0, 12.0, 18.0, 9.0, 5.0, 8.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5859375, -0.5681304931640625, -0.550323486328125, -0.5325164794921875, -0.51470947265625, -0.4969024658203125, -0.479095458984375, -0.4612884521484375, -0.4434814453125, -0.4256744384765625, -0.407867431640625, -0.3900604248046875, -0.37225341796875, -0.3544464111328125, -0.336639404296875, -0.3188323974609375, -0.301025390625, -0.2832183837890625, -0.265411376953125, -0.2476043701171875, -0.22979736328125, -0.2119903564453125, -0.194183349609375, -0.1763763427734375, -0.1585693359375, -0.1407623291015625, -0.122955322265625, -0.1051483154296875, -0.08734130859375, -0.0695343017578125, -0.051727294921875, -0.0339202880859375, -0.01611328125, 0.0016937255859375, 0.019500732421875, 0.0373077392578125, 0.05511474609375, 0.0729217529296875, 0.090728759765625, 0.1085357666015625, 0.1263427734375, 0.1441497802734375, 0.161956787109375, 0.1797637939453125, 0.19757080078125, 0.2153778076171875, 0.233184814453125, 0.2509918212890625, 0.268798828125, 0.2866058349609375, 0.304412841796875, 0.3222198486328125, 0.34002685546875, 0.3578338623046875, 0.375640869140625, 0.3934478759765625, 0.4112548828125, 0.4290618896484375, 0.446868896484375, 0.4646759033203125, 0.48248291015625, 0.5002899169921875, 0.518096923828125, 0.5359039306640625, 0.5537109375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 0.0, 5.0, 15.0, 8.0, 12.0, 14.0, 15.0, 18.0, 20.0, 16.0, 35.0, 38.0, 51.0, 50.0, 72.0, 99.0, 139.0, 58.0, 51.0, 48.0, 25.0, 35.0, 28.0, 21.0, 25.0, 19.0, 8.0, 14.0, 11.0, 11.0, 4.0, 7.0, 7.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.041351318359375, -0.04021024703979492, -0.039069175720214844, -0.037928104400634766, -0.03678703308105469, -0.03564596176147461, -0.03450489044189453, -0.03336381912231445, -0.032222747802734375, -0.031081676483154297, -0.02994060516357422, -0.02879953384399414, -0.027658462524414062, -0.026517391204833984, -0.025376319885253906, -0.024235248565673828, -0.02309417724609375, -0.021953105926513672, -0.020812034606933594, -0.019670963287353516, -0.018529891967773438, -0.01738882064819336, -0.01624774932861328, -0.015106678009033203, -0.013965606689453125, -0.012824535369873047, -0.011683464050292969, -0.01054239273071289, -0.009401321411132812, -0.008260250091552734, -0.007119178771972656, -0.005978107452392578, -0.0048370361328125, -0.003695964813232422, -0.0025548934936523438, -0.0014138221740722656, -0.0002727508544921875, 0.0008683204650878906, 0.0020093917846679688, 0.003150463104248047, 0.004291534423828125, 0.005432605743408203, 0.006573677062988281, 0.007714748382568359, 0.008855819702148438, 0.009996891021728516, 0.011137962341308594, 0.012279033660888672, 0.01342010498046875, 0.014561176300048828, 0.015702247619628906, 0.016843318939208984, 0.017984390258789062, 0.01912546157836914, 0.02026653289794922, 0.021407604217529297, 0.022548675537109375, 0.023689746856689453, 0.02483081817626953, 0.02597188949584961, 0.027112960815429688, 0.028254032135009766, 0.029395103454589844, 0.030536174774169922, 0.03167724609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 9.0, 2.0, 11.0, 10.0, 19.0, 16.0, 23.0, 35.0, 33.0, 46.0, 71.0, 80.0, 127.0, 155.0, 234.0, 439.0, 840.0, 12797.0, 1026298.0, 5317.0, 710.0, 392.0, 251.0, 181.0, 98.0, 68.0, 61.0, 40.0, 35.0, 30.0, 29.0, 25.0, 13.0, 10.0, 10.0, 13.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5791015625, -0.5587234497070312, -0.5383453369140625, -0.5179672241210938, -0.497589111328125, -0.47721099853515625, -0.4568328857421875, -0.43645477294921875, -0.41607666015625, -0.39569854736328125, -0.3753204345703125, -0.35494232177734375, -0.334564208984375, -0.31418609619140625, -0.2938079833984375, -0.27342987060546875, -0.2530517578125, -0.23267364501953125, -0.2122955322265625, -0.19191741943359375, -0.171539306640625, -0.15116119384765625, -0.1307830810546875, -0.11040496826171875, -0.09002685546875, -0.06964874267578125, -0.0492706298828125, -0.02889251708984375, -0.008514404296875, 0.01186370849609375, 0.0322418212890625, 0.05261993408203125, 0.072998046875, 0.09337615966796875, 0.1137542724609375, 0.13413238525390625, 0.154510498046875, 0.17488861083984375, 0.1952667236328125, 0.21564483642578125, 0.23602294921875, 0.25640106201171875, 0.2767791748046875, 0.29715728759765625, 0.317535400390625, 0.33791351318359375, 0.3582916259765625, 0.37866973876953125, 0.3990478515625, 0.41942596435546875, 0.4398040771484375, 0.46018218994140625, 0.480560302734375, 0.5009384155273438, 0.5213165283203125, 0.5416946411132812, 0.56207275390625, 0.5824508666992188, 0.6028289794921875, 0.6232070922851562, 0.643585205078125, 0.6639633178710938, 0.6843414306640625, 0.7047195434570312, 0.72509765625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 832.0, 175.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14046236872673035, -0.12001092731952667, -0.0995594784617424, -0.07910802960395813, -0.058656588196754456, -0.03820514678955078, -0.01775369793176651, 0.0026977509260177612, 0.023149192333221436, 0.04360063746571541, 0.06405208259820938, 0.08450353145599365, 0.10495497286319733, 0.125406414270401, 0.14585787057876587, 0.16630931198596954, 0.18676075339317322, 0.2072121948003769, 0.22766363620758057, 0.24811509251594543, 0.2685665488243103, 0.2890179753303528, 0.30946943163871765, 0.3299208879470825, 0.350372314453125, 0.37082377076148987, 0.39127519726753235, 0.4117266535758972, 0.4321780800819397, 0.45262953639030457, 0.47308099269866943, 0.4935324192047119, 0.5139838457107544, 0.5344352722167969, 0.5548867583274841, 0.5753381848335266, 0.5957896113395691, 0.6162410974502563, 0.6366925239562988, 0.6571439504623413, 0.6775953769683838, 0.6980468034744263, 0.7184982895851135, 0.738949716091156, 0.7594011425971985, 0.7798526287078857, 0.8003040552139282, 0.8207554817199707, 0.841206967830658, 0.8616583943367004, 0.8821098804473877, 0.9025613069534302, 0.9230127334594727, 0.9434641599655151, 0.9639156460762024, 0.9843670725822449, 1.0048185586929321, 1.0252699851989746, 1.045721411705017, 1.0661728382110596, 1.0866243839263916, 1.107075810432434, 1.1275272369384766, 1.147978663444519, 1.1684300899505615]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 8.0, 7.0, 10.0, 11.0, 27.0, 18.0, 31.0, 27.0, 30.0, 41.0, 34.0, 40.0, 45.0, 57.0, 61.0, 46.0, 57.0, 40.0, 48.0, 40.0, 38.0, 39.0, 39.0, 31.0, 26.0, 19.0, 29.0, 20.0, 17.0, 10.0, 8.0, 11.0, 8.0, 5.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.07264828681945801, -0.07077066600322723, -0.06889304518699646, -0.06701542437076569, -0.06513780355453491, -0.06326018273830414, -0.061382561922073364, -0.05950494110584259, -0.057627320289611816, -0.05574969947338104, -0.05387207865715027, -0.051994457840919495, -0.05011683702468872, -0.04823921620845795, -0.04636159539222717, -0.0444839745759964, -0.042606353759765625, -0.04072873294353485, -0.03885111212730408, -0.0369734913110733, -0.03509587049484253, -0.033218249678611755, -0.03134062886238098, -0.029463008046150208, -0.027585387229919434, -0.02570776641368866, -0.023830145597457886, -0.021952524781227112, -0.020074903964996338, -0.018197283148765564, -0.01631966233253479, -0.014442041516304016, -0.012564420700073242, -0.010686799883842468, -0.008809179067611694, -0.00693155825138092, -0.0050539374351501465, -0.0031763166189193726, -0.0012986958026885986, 0.0005789250135421753, 0.0024565458297729492, 0.004334166646003723, 0.006211787462234497, 0.008089408278465271, 0.009967029094696045, 0.011844649910926819, 0.013722270727157593, 0.015599891543388367, 0.01747751235961914, 0.019355133175849915, 0.02123275399208069, 0.023110374808311462, 0.024987995624542236, 0.02686561644077301, 0.028743237257003784, 0.030620858073234558, 0.03249847888946533, 0.034376099705696106, 0.03625372052192688, 0.038131341338157654, 0.04000896215438843, 0.0418865829706192, 0.043764203786849976, 0.04564182460308075, 0.04751944541931152]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 3.0, 2.0, 4.0, 7.0, 8.0, 5.0, 11.0, 23.0, 22.0, 19.0, 22.0, 20.0, 28.0, 28.0, 34.0, 40.0, 27.0, 40.0, 41.0, 44.0, 39.0, 38.0, 50.0, 49.0, 28.0, 44.0, 24.0, 38.0, 38.0, 25.0, 25.0, 27.0, 13.0, 15.0, 17.0, 22.0, 15.0, 14.0, 4.0, 8.0, 6.0, 7.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.1875, -6.00341796875, -5.8193359375, -5.63525390625, -5.451171875, -5.26708984375, -5.0830078125, -4.89892578125, -4.71484375, -4.53076171875, -4.3466796875, -4.16259765625, -3.978515625, -3.79443359375, -3.6103515625, -3.42626953125, -3.2421875, -3.05810546875, -2.8740234375, -2.68994140625, -2.505859375, -2.32177734375, -2.1376953125, -1.95361328125, -1.76953125, -1.58544921875, -1.4013671875, -1.21728515625, -1.033203125, -0.84912109375, -0.6650390625, -0.48095703125, -0.296875, -0.11279296875, 0.0712890625, 0.25537109375, 0.439453125, 0.62353515625, 0.8076171875, 0.99169921875, 1.17578125, 1.35986328125, 1.5439453125, 1.72802734375, 1.912109375, 2.09619140625, 2.2802734375, 2.46435546875, 2.6484375, 2.83251953125, 3.0166015625, 3.20068359375, 3.384765625, 3.56884765625, 3.7529296875, 3.93701171875, 4.12109375, 4.30517578125, 4.4892578125, 4.67333984375, 4.857421875, 5.04150390625, 5.2255859375, 5.40966796875, 5.59375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 6.0, 10.0, 14.0, 21.0, 24.0, 20.0, 45.0, 35.0, 55.0, 99.0, 102.0, 152.0, 173.0, 240.0, 327.0, 446.0, 560.0, 808.0, 1095.0, 2009.0, 5726.0, 25448.0, 118999.0, 419681.0, 352773.0, 90406.0, 19044.0, 4507.0, 1722.0, 1059.0, 763.0, 531.0, 411.0, 303.0, 224.0, 156.0, 122.0, 128.0, 81.0, 58.0, 36.0, 28.0, 20.0, 29.0, 16.0, 15.0, 12.0, 7.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-12.4609375, -12.082275390625, -11.70361328125, -11.324951171875, -10.9462890625, -10.567626953125, -10.18896484375, -9.810302734375, -9.431640625, -9.052978515625, -8.67431640625, -8.295654296875, -7.9169921875, -7.538330078125, -7.15966796875, -6.781005859375, -6.40234375, -6.023681640625, -5.64501953125, -5.266357421875, -4.8876953125, -4.509033203125, -4.13037109375, -3.751708984375, -3.373046875, -2.994384765625, -2.61572265625, -2.237060546875, -1.8583984375, -1.479736328125, -1.10107421875, -0.722412109375, -0.34375, 0.034912109375, 0.41357421875, 0.792236328125, 1.1708984375, 1.549560546875, 1.92822265625, 2.306884765625, 2.685546875, 3.064208984375, 3.44287109375, 3.821533203125, 4.2001953125, 4.578857421875, 4.95751953125, 5.336181640625, 5.71484375, 6.093505859375, 6.47216796875, 6.850830078125, 7.2294921875, 7.608154296875, 7.98681640625, 8.365478515625, 8.744140625, 9.122802734375, 9.50146484375, 9.880126953125, 10.2587890625, 10.637451171875, 11.01611328125, 11.394775390625, 11.7734375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 3.0, 8.0, 7.0, 7.0, 11.0, 12.0, 19.0, 21.0, 19.0, 37.0, 29.0, 46.0, 44.0, 51.0, 65.0, 105.0, 216.0, 1420.0, 304.0, 149.0, 72.0, 62.0, 54.0, 36.0, 36.0, 28.0, 24.0, 26.0, 20.0, 21.0, 20.0, 24.0, 9.0, 14.0, 6.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.09375, -17.58740234375, -17.0810546875, -16.57470703125, -16.068359375, -15.56201171875, -15.0556640625, -14.54931640625, -14.04296875, -13.53662109375, -13.0302734375, -12.52392578125, -12.017578125, -11.51123046875, -11.0048828125, -10.49853515625, -9.9921875, -9.48583984375, -8.9794921875, -8.47314453125, -7.966796875, -7.46044921875, -6.9541015625, -6.44775390625, -5.94140625, -5.43505859375, -4.9287109375, -4.42236328125, -3.916015625, -3.40966796875, -2.9033203125, -2.39697265625, -1.890625, -1.38427734375, -0.8779296875, -0.37158203125, 0.134765625, 0.64111328125, 1.1474609375, 1.65380859375, 2.16015625, 2.66650390625, 3.1728515625, 3.67919921875, 4.185546875, 4.69189453125, 5.1982421875, 5.70458984375, 6.2109375, 6.71728515625, 7.2236328125, 7.72998046875, 8.236328125, 8.74267578125, 9.2490234375, 9.75537109375, 10.26171875, 10.76806640625, 11.2744140625, 11.78076171875, 12.287109375, 12.79345703125, 13.2998046875, 13.80615234375, 14.3125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 7.0, 10.0, 12.0, 12.0, 15.0, 20.0, 19.0, 32.0, 47.0, 51.0, 96.0, 150.0, 243.0, 367.0, 708.0, 1602.0, 129147.0, 3009011.0, 2176.0, 785.0, 428.0, 257.0, 162.0, 97.0, 68.0, 53.0, 38.0, 18.0, 15.0, 11.0, 18.0, 9.0, 5.0, 5.0, 5.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.0625, -66.419921875, -63.77734375, -61.134765625, -58.4921875, -55.849609375, -53.20703125, -50.564453125, -47.921875, -45.279296875, -42.63671875, -39.994140625, -37.3515625, -34.708984375, -32.06640625, -29.423828125, -26.78125, -24.138671875, -21.49609375, -18.853515625, -16.2109375, -13.568359375, -10.92578125, -8.283203125, -5.640625, -2.998046875, -0.35546875, 2.287109375, 4.9296875, 7.572265625, 10.21484375, 12.857421875, 15.5, 18.142578125, 20.78515625, 23.427734375, 26.0703125, 28.712890625, 31.35546875, 33.998046875, 36.640625, 39.283203125, 41.92578125, 44.568359375, 47.2109375, 49.853515625, 52.49609375, 55.138671875, 57.78125, 60.423828125, 63.06640625, 65.708984375, 68.3515625, 70.994140625, 73.63671875, 76.279296875, 78.921875, 81.564453125, 84.20703125, 86.849609375, 89.4921875, 92.134765625, 94.77734375, 97.419921875, 100.0625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 7.0, 11.0, 60.0, 195.0, 272.0, 268.0, 143.0, 44.0, 10.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.63715362548828, -94.26972198486328, -91.90229034423828, -89.53485107421875, -87.16741943359375, -84.79998779296875, -82.43255615234375, -80.06512451171875, -77.69768524169922, -75.33025360107422, -72.96282196044922, -70.59538269042969, -68.22795104980469, -65.86051940917969, -63.49308776855469, -61.12565231323242, -58.75822067260742, -56.39078903198242, -54.023353576660156, -51.655921936035156, -49.28848648071289, -46.92105484008789, -44.553619384765625, -42.186187744140625, -39.818756103515625, -37.451324462890625, -35.08388900756836, -32.71645736694336, -30.349021911621094, -27.981590270996094, -25.61415672302246, -23.246723175048828, -20.879287719726562, -18.51185417175293, -16.144420623779297, -13.77698802947998, -11.409554481506348, -9.042120933532715, -6.674688339233398, -4.307254791259766, -1.9398212432861328, 0.4276120662689209, 2.7950453758239746, 5.162478446960449, 7.529911994934082, 9.897345542907715, 12.264778137207031, 14.632211685180664, 16.999645233154297, 19.36707878112793, 21.734512329101562, 24.101943969726562, 26.469379425048828, 28.836811065673828, 31.20424461364746, 33.571678161621094, 35.939109802246094, 38.306541442871094, 40.67397689819336, 43.04140853881836, 45.408843994140625, 47.776275634765625, 50.143707275390625, 52.51114273071289, 54.878578186035156]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 9.0, 6.0, 14.0, 7.0, 14.0, 16.0, 20.0, 21.0, 15.0, 17.0, 34.0, 29.0, 36.0, 35.0, 44.0, 48.0, 31.0, 47.0, 53.0, 39.0, 48.0, 36.0, 33.0, 28.0, 33.0, 29.0, 33.0, 33.0, 26.0, 25.0, 25.0, 22.0, 12.0, 12.0, 17.0, 19.0, 5.0, 8.0, 10.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.62610626220703, -37.34136962890625, -36.056636810302734, -34.77190017700195, -33.48716735839844, -32.202430725097656, -30.917694091796875, -29.632959365844727, -28.348224639892578, -27.06348991394043, -25.77875518798828, -24.4940185546875, -23.20928382873535, -21.924549102783203, -20.639812469482422, -19.355077743530273, -18.070343017578125, -16.785608291625977, -15.500872611999512, -14.216136932373047, -12.931402206420898, -11.64666748046875, -10.361931800842285, -9.07719612121582, -7.792461395263672, -6.507726192474365, -5.222990989685059, -3.938255786895752, -2.6535205841064453, -1.3687853813171387, -0.08405017852783203, 1.2006855010986328, 2.4854202270507812, 3.770155429840088, 5.0548906326293945, 6.339625835418701, 7.624361038208008, 8.909095764160156, 10.193831443786621, 11.478567123413086, 12.763301849365234, 14.048036575317383, 15.332772254943848, 16.617507934570312, 17.90224266052246, 19.18697738647461, 20.47171401977539, 21.75644874572754, 23.041183471679688, 24.325918197631836, 25.610652923583984, 26.895389556884766, 28.180124282836914, 29.464859008789062, 30.749595642089844, 32.034332275390625, 33.31906509399414, 34.60380172729492, 35.88853454589844, 37.17327117919922, 38.4580078125, 39.742740631103516, 41.0274772644043, 42.31221008300781, 43.596946716308594]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 3.0, 4.0, 11.0, 8.0, 6.0, 12.0, 9.0, 12.0, 15.0, 15.0, 25.0, 21.0, 22.0, 27.0, 29.0, 38.0, 37.0, 34.0, 30.0, 41.0, 30.0, 51.0, 36.0, 42.0, 31.0, 32.0, 40.0, 35.0, 37.0, 34.0, 27.0, 30.0, 22.0, 24.0, 24.0, 14.0, 17.0, 11.0, 8.0, 5.0, 7.0, 12.0, 4.0, 5.0, 1.0, 6.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-5.7109375, -5.53570556640625, -5.3604736328125, -5.18524169921875, -5.010009765625, -4.83477783203125, -4.6595458984375, -4.48431396484375, -4.30908203125, -4.13385009765625, -3.9586181640625, -3.78338623046875, -3.608154296875, -3.43292236328125, -3.2576904296875, -3.08245849609375, -2.9072265625, -2.73199462890625, -2.5567626953125, -2.38153076171875, -2.206298828125, -2.03106689453125, -1.8558349609375, -1.68060302734375, -1.50537109375, -1.33013916015625, -1.1549072265625, -0.97967529296875, -0.804443359375, -0.62921142578125, -0.4539794921875, -0.27874755859375, -0.103515625, 0.07171630859375, 0.2469482421875, 0.42218017578125, 0.597412109375, 0.77264404296875, 0.9478759765625, 1.12310791015625, 1.29833984375, 1.47357177734375, 1.6488037109375, 1.82403564453125, 1.999267578125, 2.17449951171875, 2.3497314453125, 2.52496337890625, 2.7001953125, 2.87542724609375, 3.0506591796875, 3.22589111328125, 3.401123046875, 3.57635498046875, 3.7515869140625, 3.92681884765625, 4.10205078125, 4.27728271484375, 4.4525146484375, 4.62774658203125, 4.802978515625, 4.97821044921875, 5.1534423828125, 5.32867431640625, 5.50390625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 5.0, 1.0, 11.0, 15.0, 31.0, 28.0, 69.0, 87.0, 110.0, 148.0, 294.0, 392.0, 702.0, 1252.0, 2370.0, 5380.0, 14083.0, 49288.0, 206141.0, 785142.0, 1802250.0, 969752.0, 264973.0, 61841.0, 17543.0, 6254.0, 2800.0, 1354.0, 755.0, 452.0, 265.0, 167.0, 106.0, 76.0, 41.0, 27.0, 22.0, 14.0, 8.0, 10.0, 8.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8671875, -8.5950927734375, -8.322998046875, -8.0509033203125, -7.77880859375, -7.5067138671875, -7.234619140625, -6.9625244140625, -6.6904296875, -6.4183349609375, -6.146240234375, -5.8741455078125, -5.60205078125, -5.3299560546875, -5.057861328125, -4.7857666015625, -4.513671875, -4.2415771484375, -3.969482421875, -3.6973876953125, -3.42529296875, -3.1531982421875, -2.881103515625, -2.6090087890625, -2.3369140625, -2.0648193359375, -1.792724609375, -1.5206298828125, -1.24853515625, -0.9764404296875, -0.704345703125, -0.4322509765625, -0.16015625, 0.1119384765625, 0.384033203125, 0.6561279296875, 0.92822265625, 1.2003173828125, 1.472412109375, 1.7445068359375, 2.0166015625, 2.2886962890625, 2.560791015625, 2.8328857421875, 3.10498046875, 3.3770751953125, 3.649169921875, 3.9212646484375, 4.193359375, 4.4654541015625, 4.737548828125, 5.0096435546875, 5.28173828125, 5.5538330078125, 5.825927734375, 6.0980224609375, 6.3701171875, 6.6422119140625, 6.914306640625, 7.1864013671875, 7.45849609375, 7.7305908203125, 8.002685546875, 8.2747802734375, 8.546875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 8.0, 3.0, 11.0, 9.0, 12.0, 17.0, 25.0, 29.0, 31.0, 52.0, 53.0, 78.0, 80.0, 129.0, 149.0, 203.0, 319.0, 417.0, 455.0, 446.0, 354.0, 290.0, 186.0, 163.0, 110.0, 90.0, 90.0, 57.0, 61.0, 32.0, 27.0, 21.0, 17.0, 10.0, 9.0, 8.0, 8.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6875, -9.3734130859375, -9.059326171875, -8.7452392578125, -8.43115234375, -8.1170654296875, -7.802978515625, -7.4888916015625, -7.1748046875, -6.8607177734375, -6.546630859375, -6.2325439453125, -5.91845703125, -5.6043701171875, -5.290283203125, -4.9761962890625, -4.662109375, -4.3480224609375, -4.033935546875, -3.7198486328125, -3.40576171875, -3.0916748046875, -2.777587890625, -2.4635009765625, -2.1494140625, -1.8353271484375, -1.521240234375, -1.2071533203125, -0.89306640625, -0.5789794921875, -0.264892578125, 0.0491943359375, 0.36328125, 0.6773681640625, 0.991455078125, 1.3055419921875, 1.61962890625, 1.9337158203125, 2.247802734375, 2.5618896484375, 2.8759765625, 3.1900634765625, 3.504150390625, 3.8182373046875, 4.13232421875, 4.4464111328125, 4.760498046875, 5.0745849609375, 5.388671875, 5.7027587890625, 6.016845703125, 6.3309326171875, 6.64501953125, 6.9591064453125, 7.273193359375, 7.5872802734375, 7.9013671875, 8.2154541015625, 8.529541015625, 8.8436279296875, 9.15771484375, 9.4718017578125, 9.785888671875, 10.0999755859375, 10.4140625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 6.0, 3.0, 8.0, 9.0, 12.0, 12.0, 13.0, 19.0, 27.0, 32.0, 62.0, 67.0, 85.0, 138.0, 204.0, 263.0, 395.0, 725.0, 1312.0, 3029.0, 11084.0, 71258.0, 547662.0, 2825699.0, 631630.0, 81861.0, 12195.0, 3093.0, 1278.0, 708.0, 438.0, 293.0, 171.0, 128.0, 97.0, 67.0, 59.0, 34.0, 30.0, 18.0, 16.0, 8.0, 11.0, 13.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-17.0, -16.53466796875, -16.0693359375, -15.60400390625, -15.138671875, -14.67333984375, -14.2080078125, -13.74267578125, -13.27734375, -12.81201171875, -12.3466796875, -11.88134765625, -11.416015625, -10.95068359375, -10.4853515625, -10.02001953125, -9.5546875, -9.08935546875, -8.6240234375, -8.15869140625, -7.693359375, -7.22802734375, -6.7626953125, -6.29736328125, -5.83203125, -5.36669921875, -4.9013671875, -4.43603515625, -3.970703125, -3.50537109375, -3.0400390625, -2.57470703125, -2.109375, -1.64404296875, -1.1787109375, -0.71337890625, -0.248046875, 0.21728515625, 0.6826171875, 1.14794921875, 1.61328125, 2.07861328125, 2.5439453125, 3.00927734375, 3.474609375, 3.93994140625, 4.4052734375, 4.87060546875, 5.3359375, 5.80126953125, 6.2666015625, 6.73193359375, 7.197265625, 7.66259765625, 8.1279296875, 8.59326171875, 9.05859375, 9.52392578125, 9.9892578125, 10.45458984375, 10.919921875, 11.38525390625, 11.8505859375, 12.31591796875, 12.78125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 27.0, 480.0, 473.0, 33.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-491.4495849609375, -481.9941101074219, -472.53863525390625, -463.0831298828125, -453.6276550292969, -444.17218017578125, -434.7166748046875, -425.2611999511719, -415.80572509765625, -406.3502502441406, -396.894775390625, -387.43927001953125, -377.9837951660156, -368.5283203125, -359.07281494140625, -349.6173400878906, -340.161865234375, -330.7063903808594, -321.25091552734375, -311.79541015625, -302.3399353027344, -292.88446044921875, -283.428955078125, -273.9734802246094, -264.51800537109375, -255.06253051757812, -245.60704040527344, -236.15155029296875, -226.69607543945312, -217.2406005859375, -207.7851104736328, -198.32962036132812, -188.87417602539062, -179.418701171875, -169.9632110595703, -160.50772094726562, -151.05224609375, -141.59677124023438, -132.1412811279297, -122.68579864501953, -113.23031616210938, -103.77483367919922, -94.31935119628906, -84.8638687133789, -75.40838623046875, -65.9529037475586, -56.49742126464844, -47.04193878173828, -37.586456298828125, -28.13097381591797, -18.675491333007812, -9.220008850097656, 0.2354736328125, 9.690956115722656, 19.146438598632812, 28.60192108154297, 38.057403564453125, 47.51288604736328, 56.96836853027344, 66.4238510131836, 75.87933349609375, 85.3348159790039, 94.79029846191406, 104.24578094482422, 113.70126342773438]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 11.0, 9.0, 8.0, 9.0, 14.0, 16.0, 20.0, 24.0, 20.0, 25.0, 26.0, 24.0, 30.0, 38.0, 30.0, 29.0, 35.0, 24.0, 41.0, 43.0, 52.0, 44.0, 38.0, 47.0, 36.0, 30.0, 41.0, 34.0, 19.0, 24.0, 19.0, 17.0, 20.0, 19.0, 15.0, 13.0, 16.0, 7.0, 10.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.23923110961914, -37.9691162109375, -36.699005126953125, -35.428890228271484, -34.158775329589844, -32.8886604309082, -31.618547439575195, -30.348434448242188, -29.078319549560547, -27.808204650878906, -26.5380916595459, -25.26797866821289, -23.99786376953125, -22.72774887084961, -21.4576358795166, -20.187522888183594, -18.917407989501953, -17.647293090820312, -16.377180099487305, -15.10706615447998, -13.836952209472656, -12.566838264465332, -11.296724319458008, -10.026610374450684, -8.75649642944336, -7.486382484436035, -6.216268539428711, -4.946154594421387, -3.6760406494140625, -2.4059267044067383, -1.135812759399414, 0.13430118560791016, 1.4044151306152344, 2.6745290756225586, 3.944643020629883, 5.214756965637207, 6.484870910644531, 7.7549848556518555, 9.02509880065918, 10.295212745666504, 11.565326690673828, 12.835440635681152, 14.105554580688477, 15.3756685256958, 16.645782470703125, 17.915897369384766, 19.186010360717773, 20.45612335205078, 21.726238250732422, 22.996353149414062, 24.26646614074707, 25.536579132080078, 26.80669403076172, 28.07680892944336, 29.346921920776367, 30.617034912109375, 31.887149810791016, 33.157264709472656, 34.42737579345703, 35.69749069213867, 36.96760559082031, 38.23772048950195, 39.507835388183594, 40.77794647216797, 42.04806137084961]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 13.0, 11.0, 10.0, 16.0, 26.0, 22.0, 23.0, 18.0, 26.0, 29.0, 32.0, 33.0, 46.0, 37.0, 38.0, 44.0, 36.0, 40.0, 48.0, 49.0, 42.0, 41.0, 38.0, 37.0, 32.0, 28.0, 24.0, 26.0, 34.0, 15.0, 12.0, 10.0, 9.0, 12.0, 9.0, 9.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.08831787109375, -4.9266357421875, -4.76495361328125, -4.603271484375, -4.44158935546875, -4.2799072265625, -4.11822509765625, -3.95654296875, -3.79486083984375, -3.6331787109375, -3.47149658203125, -3.309814453125, -3.14813232421875, -2.9864501953125, -2.82476806640625, -2.6630859375, -2.50140380859375, -2.3397216796875, -2.17803955078125, -2.016357421875, -1.85467529296875, -1.6929931640625, -1.53131103515625, -1.36962890625, -1.20794677734375, -1.0462646484375, -0.88458251953125, -0.722900390625, -0.56121826171875, -0.3995361328125, -0.23785400390625, -0.076171875, 0.08551025390625, 0.2471923828125, 0.40887451171875, 0.570556640625, 0.73223876953125, 0.8939208984375, 1.05560302734375, 1.21728515625, 1.37896728515625, 1.5406494140625, 1.70233154296875, 1.864013671875, 2.02569580078125, 2.1873779296875, 2.34906005859375, 2.5107421875, 2.67242431640625, 2.8341064453125, 2.99578857421875, 3.157470703125, 3.31915283203125, 3.4808349609375, 3.64251708984375, 3.80419921875, 3.96588134765625, 4.1275634765625, 4.28924560546875, 4.450927734375, 4.61260986328125, 4.7742919921875, 4.93597412109375, 5.09765625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 8.0, 5.0, 15.0, 18.0, 34.0, 45.0, 50.0, 79.0, 135.0, 210.0, 290.0, 446.0, 636.0, 928.0, 1390.0, 2281.0, 3474.0, 5288.0, 8338.0, 13675.0, 22733.0, 38653.0, 65661.0, 109997.0, 171540.0, 202472.0, 156376.0, 97651.0, 57912.0, 34348.0, 20085.0, 12377.0, 7749.0, 4750.0, 2963.0, 1941.0, 1301.0, 870.0, 539.0, 406.0, 264.0, 195.0, 142.0, 90.0, 65.0, 49.0, 37.0, 19.0, 13.0, 9.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.461181640625, -0.4460029602050781, -0.43082427978515625, -0.4156455993652344, -0.4004669189453125, -0.3852882385253906, -0.37010955810546875, -0.3549308776855469, -0.339752197265625, -0.3245735168457031, -0.30939483642578125, -0.2942161560058594, -0.2790374755859375, -0.2638587951660156, -0.24868011474609375, -0.23350143432617188, -0.21832275390625, -0.20314407348632812, -0.18796539306640625, -0.17278671264648438, -0.1576080322265625, -0.14242935180664062, -0.12725067138671875, -0.11207199096679688, -0.096893310546875, -0.08171463012695312, -0.06653594970703125, -0.051357269287109375, -0.0361785888671875, -0.020999908447265625, -0.00582122802734375, 0.009357452392578125, 0.0245361328125, 0.039714813232421875, 0.05489349365234375, 0.07007217407226562, 0.0852508544921875, 0.10042953491210938, 0.11560821533203125, 0.13078689575195312, 0.145965576171875, 0.16114425659179688, 0.17632293701171875, 0.19150161743164062, 0.2066802978515625, 0.22185897827148438, 0.23703765869140625, 0.2522163391113281, 0.26739501953125, 0.2825736999511719, 0.29775238037109375, 0.3129310607910156, 0.3281097412109375, 0.3432884216308594, 0.35846710205078125, 0.3736457824707031, 0.388824462890625, 0.4040031433105469, 0.41918182373046875, 0.4343605041503906, 0.4495391845703125, 0.4647178649902344, 0.47989654541015625, 0.4950752258300781, 0.51025390625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 10.0, 12.0, 11.0, 8.0, 13.0, 17.0, 18.0, 27.0, 25.0, 31.0, 34.0, 27.0, 45.0, 37.0, 48.0, 34.0, 49.0, 48.0, 1059.0, 36.0, 38.0, 46.0, 32.0, 31.0, 27.0, 30.0, 23.0, 31.0, 32.0, 27.0, 15.0, 13.0, 13.0, 18.0, 14.0, 14.0, 8.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.00390625, -2.903411865234375, -2.80291748046875, -2.702423095703125, -2.6019287109375, -2.501434326171875, -2.40093994140625, -2.300445556640625, -2.199951171875, -2.099456787109375, -1.99896240234375, -1.898468017578125, -1.7979736328125, -1.697479248046875, -1.59698486328125, -1.496490478515625, -1.39599609375, -1.295501708984375, -1.19500732421875, -1.094512939453125, -0.9940185546875, -0.893524169921875, -0.79302978515625, -0.692535400390625, -0.592041015625, -0.491546630859375, -0.39105224609375, -0.290557861328125, -0.1900634765625, -0.089569091796875, 0.01092529296875, 0.111419677734375, 0.2119140625, 0.312408447265625, 0.41290283203125, 0.513397216796875, 0.6138916015625, 0.714385986328125, 0.81488037109375, 0.915374755859375, 1.015869140625, 1.116363525390625, 1.21685791015625, 1.317352294921875, 1.4178466796875, 1.518341064453125, 1.61883544921875, 1.719329833984375, 1.81982421875, 1.920318603515625, 2.02081298828125, 2.121307373046875, 2.2218017578125, 2.322296142578125, 2.42279052734375, 2.523284912109375, 2.623779296875, 2.724273681640625, 2.82476806640625, 2.925262451171875, 3.0257568359375, 3.126251220703125, 3.22674560546875, 3.327239990234375, 3.427734375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 6.0, 2.0, 25.0, 24.0, 40.0, 63.0, 94.0, 159.0, 272.0, 540.0, 909.0, 1732.0, 3338.0, 6548.0, 13141.0, 26992.0, 54316.0, 105844.0, 187859.0, 1288564.0, 189407.0, 106903.0, 55536.0, 27429.0, 13442.0, 6525.0, 3478.0, 1654.0, 988.0, 557.0, 301.0, 180.0, 93.0, 51.0, 47.0, 26.0, 10.0, 13.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.44921875, -0.43581390380859375, -0.4224090576171875, -0.40900421142578125, -0.395599365234375, -0.38219451904296875, -0.3687896728515625, -0.35538482666015625, -0.34197998046875, -0.32857513427734375, -0.3151702880859375, -0.30176544189453125, -0.288360595703125, -0.27495574951171875, -0.2615509033203125, -0.24814605712890625, -0.2347412109375, -0.22133636474609375, -0.2079315185546875, -0.19452667236328125, -0.181121826171875, -0.16771697998046875, -0.1543121337890625, -0.14090728759765625, -0.12750244140625, -0.11409759521484375, -0.1006927490234375, -0.08728790283203125, -0.073883056640625, -0.06047821044921875, -0.0470733642578125, -0.03366851806640625, -0.020263671875, -0.00685882568359375, 0.0065460205078125, 0.01995086669921875, 0.033355712890625, 0.04676055908203125, 0.0601654052734375, 0.07357025146484375, 0.08697509765625, 0.10037994384765625, 0.1137847900390625, 0.12718963623046875, 0.140594482421875, 0.15399932861328125, 0.1674041748046875, 0.18080902099609375, 0.1942138671875, 0.20761871337890625, 0.2210235595703125, 0.23442840576171875, 0.247833251953125, 0.26123809814453125, 0.2746429443359375, 0.28804779052734375, 0.30145263671875, 0.31485748291015625, 0.3282623291015625, 0.34166717529296875, 0.355072021484375, 0.36847686767578125, 0.3818817138671875, 0.39528656005859375, 0.40869140625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 3.0, 10.0, 6.0, 11.0, 14.0, 25.0, 31.0, 27.0, 30.0, 43.0, 54.0, 79.0, 96.0, 87.0, 98.0, 79.0, 66.0, 35.0, 31.0, 36.0, 25.0, 20.0, 18.0, 12.0, 8.0, 9.0, 8.0, 12.0, 6.0, 5.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0146026611328125, -0.01419520378112793, -0.01378774642944336, -0.013380289077758789, -0.012972831726074219, -0.012565374374389648, -0.012157917022705078, -0.011750459671020508, -0.011343002319335938, -0.010935544967651367, -0.010528087615966797, -0.010120630264282227, -0.009713172912597656, -0.009305715560913086, -0.008898258209228516, -0.008490800857543945, -0.008083343505859375, -0.007675886154174805, -0.007268428802490234, -0.006860971450805664, -0.006453514099121094, -0.0060460567474365234, -0.005638599395751953, -0.005231142044067383, -0.0048236846923828125, -0.004416227340698242, -0.004008769989013672, -0.0036013126373291016, -0.0031938552856445312, -0.002786397933959961, -0.0023789405822753906, -0.0019714832305908203, -0.00156402587890625, -0.0011565685272216797, -0.0007491111755371094, -0.00034165382385253906, 6.580352783203125e-05, 0.00047326087951660156, 0.0008807182312011719, 0.0012881755828857422, 0.0016956329345703125, 0.002103090286254883, 0.002510547637939453, 0.0029180049896240234, 0.0033254623413085938, 0.003732919692993164, 0.004140377044677734, 0.004547834396362305, 0.004955291748046875, 0.005362749099731445, 0.005770206451416016, 0.006177663803100586, 0.006585121154785156, 0.0069925785064697266, 0.007400035858154297, 0.007807493209838867, 0.008214950561523438, 0.008622407913208008, 0.009029865264892578, 0.009437322616577148, 0.009844779968261719, 0.010252237319946289, 0.01065969467163086, 0.01106715202331543, 0.011474609375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 5.0, 4.0, 9.0, 9.0, 9.0, 9.0, 17.0, 10.0, 27.0, 20.0, 28.0, 34.0, 46.0, 79.0, 101.0, 154.0, 229.0, 440.0, 1386.0, 63451.0, 972325.0, 8453.0, 746.0, 321.0, 185.0, 112.0, 81.0, 79.0, 57.0, 35.0, 26.0, 17.0, 15.0, 16.0, 9.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19873046875, -0.19170379638671875, -0.1846771240234375, -0.17765045166015625, -0.170623779296875, -0.16359710693359375, -0.1565704345703125, -0.14954376220703125, -0.14251708984375, -0.13549041748046875, -0.1284637451171875, -0.12143707275390625, -0.114410400390625, -0.10738372802734375, -0.1003570556640625, -0.09333038330078125, -0.0863037109375, -0.07927703857421875, -0.0722503662109375, -0.06522369384765625, -0.058197021484375, -0.05117034912109375, -0.0441436767578125, -0.03711700439453125, -0.03009033203125, -0.02306365966796875, -0.0160369873046875, -0.00901031494140625, -0.001983642578125, 0.00504302978515625, 0.0120697021484375, 0.01909637451171875, 0.026123046875, 0.03314971923828125, 0.0401763916015625, 0.04720306396484375, 0.054229736328125, 0.06125640869140625, 0.0682830810546875, 0.07530975341796875, 0.08233642578125, 0.08936309814453125, 0.0963897705078125, 0.10341644287109375, 0.110443115234375, 0.11746978759765625, 0.1244964599609375, 0.13152313232421875, 0.1385498046875, 0.14557647705078125, 0.1526031494140625, 0.15962982177734375, 0.166656494140625, 0.17368316650390625, 0.1807098388671875, 0.18773651123046875, 0.19476318359375, 0.20178985595703125, 0.2088165283203125, 0.21584320068359375, 0.222869873046875, 0.22989654541015625, 0.2369232177734375, 0.24394989013671875, 0.2509765625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 15.0, 466.0, 530.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049009084701538086, -0.04289869964122772, -0.03678831085562706, -0.030677923932671547, -0.024567537009716034, -0.01845715008676052, -0.012346763163805008, -0.006236374378204346, -0.00012598931789398193, 0.005984397605061531, 0.012094784528017044, 0.018205171450972557, 0.02431555837392807, 0.030425945296883583, 0.036536332219839096, 0.04264672100543976, 0.04875710606575012, 0.054867491126060486, 0.06097787991166115, 0.06708826869726181, 0.07319865375757217, 0.07930903881788254, 0.0854194313287735, 0.09152981638908386, 0.09764020144939423, 0.10375058650970459, 0.10986097157001495, 0.11597136408090591, 0.12208174914121628, 0.12819214165210724, 0.1343025267124176, 0.14041291177272797, 0.14652329683303833, 0.1526336818933487, 0.15874406695365906, 0.16485445201396942, 0.17096483707427979, 0.17707523703575134, 0.1831856220960617, 0.18929600715637207, 0.19540639221668243, 0.2015167772769928, 0.20762716233730316, 0.21373754739761353, 0.21984794735908508, 0.22595833241939545, 0.2320687174797058, 0.23817910254001617, 0.24428948760032654, 0.2503998875617981, 0.25651025772094727, 0.2626206576824188, 0.268731027841568, 0.27484142780303955, 0.2809517979621887, 0.2870621979236603, 0.29317259788513184, 0.2992829978466034, 0.30539336800575256, 0.3115037679672241, 0.3176141381263733, 0.32372453808784485, 0.329834908246994, 0.3359453082084656, 0.34205567836761475]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 9.0, 13.0, 20.0, 14.0, 18.0, 22.0, 33.0, 40.0, 34.0, 42.0, 47.0, 55.0, 67.0, 64.0, 71.0, 45.0, 56.0, 63.0, 38.0, 44.0, 48.0, 38.0, 27.0, 19.0, 24.0, 16.0, 8.0, 6.0, 9.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01946234703063965, -0.01892559789121151, -0.01838884875178337, -0.017852099612355232, -0.017315350472927094, -0.016778601333498955, -0.016241852194070816, -0.015705103054642677, -0.015168353915214539, -0.0146316047757864, -0.014094855636358261, -0.013558106496930122, -0.013021357357501984, -0.012484608218073845, -0.011947859078645706, -0.011411109939217567, -0.010874360799789429, -0.01033761166036129, -0.009800862520933151, -0.009264113381505013, -0.008727364242076874, -0.008190615102648735, -0.007653865963220596, -0.007117116823792458, -0.006580367684364319, -0.00604361854493618, -0.005506869405508041, -0.004970120266079903, -0.004433371126651764, -0.003896621987223625, -0.0033598728477954865, -0.0028231237083673477, -0.002286374568939209, -0.0017496254295110703, -0.0012128762900829315, -0.0006761271506547928, -0.00013937801122665405, 0.0003973711282014847, 0.0009341202676296234, 0.0014708694070577621, 0.002007618546485901, 0.0025443676859140396, 0.0030811168253421783, 0.003617865964770317, 0.004154615104198456, 0.0046913642436265945, 0.005228113383054733, 0.005764862522482872, 0.006301611661911011, 0.0068383608013391495, 0.007375109940767288, 0.007911859080195427, 0.008448608219623566, 0.008985357359051704, 0.009522106498479843, 0.010058855637907982, 0.01059560477733612, 0.01113235391676426, 0.011669103056192398, 0.012205852195620537, 0.012742601335048676, 0.013279350474476814, 0.013816099613904953, 0.014352848753333092, 0.01488959789276123]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 14.0, 11.0, 10.0, 16.0, 26.0, 22.0, 23.0, 18.0, 26.0, 29.0, 32.0, 33.0, 46.0, 38.0, 36.0, 45.0, 36.0, 40.0, 48.0, 49.0, 43.0, 40.0, 38.0, 37.0, 32.0, 28.0, 24.0, 26.0, 34.0, 15.0, 12.0, 10.0, 9.0, 12.0, 9.0, 9.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.08831787109375, -4.9266357421875, -4.76495361328125, -4.603271484375, -4.44158935546875, -4.2799072265625, -4.11822509765625, -3.95654296875, -3.79486083984375, -3.6331787109375, -3.47149658203125, -3.309814453125, -3.14813232421875, -2.9864501953125, -2.82476806640625, -2.6630859375, -2.50140380859375, -2.3397216796875, -2.17803955078125, -2.016357421875, -1.85467529296875, -1.6929931640625, -1.53131103515625, -1.36962890625, -1.20794677734375, -1.0462646484375, -0.88458251953125, -0.722900390625, -0.56121826171875, -0.3995361328125, -0.23785400390625, -0.076171875, 0.08551025390625, 0.2471923828125, 0.40887451171875, 0.570556640625, 0.73223876953125, 0.8939208984375, 1.05560302734375, 1.21728515625, 1.37896728515625, 1.5406494140625, 1.70233154296875, 1.864013671875, 2.02569580078125, 2.1873779296875, 2.34906005859375, 2.5107421875, 2.67242431640625, 2.8341064453125, 2.99578857421875, 3.157470703125, 3.31915283203125, 3.4808349609375, 3.64251708984375, 3.80419921875, 3.96588134765625, 4.1275634765625, 4.28924560546875, 4.450927734375, 4.61260986328125, 4.7742919921875, 4.93597412109375, 5.09765625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 12.0, 20.0, 21.0, 37.0, 48.0, 52.0, 76.0, 113.0, 131.0, 194.0, 275.0, 351.0, 529.0, 733.0, 1010.0, 1293.0, 1890.0, 3065.0, 6329.0, 25631.0, 190152.0, 648428.0, 134569.0, 18902.0, 5398.0, 2842.0, 1830.0, 1242.0, 858.0, 657.0, 485.0, 359.0, 287.0, 213.0, 150.0, 112.0, 86.0, 52.0, 38.0, 26.0, 15.0, 12.0, 11.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.15625, -11.769287109375, -11.38232421875, -10.995361328125, -10.6083984375, -10.221435546875, -9.83447265625, -9.447509765625, -9.060546875, -8.673583984375, -8.28662109375, -7.899658203125, -7.5126953125, -7.125732421875, -6.73876953125, -6.351806640625, -5.96484375, -5.577880859375, -5.19091796875, -4.803955078125, -4.4169921875, -4.030029296875, -3.64306640625, -3.256103515625, -2.869140625, -2.482177734375, -2.09521484375, -1.708251953125, -1.3212890625, -0.934326171875, -0.54736328125, -0.160400390625, 0.2265625, 0.613525390625, 1.00048828125, 1.387451171875, 1.7744140625, 2.161376953125, 2.54833984375, 2.935302734375, 3.322265625, 3.709228515625, 4.09619140625, 4.483154296875, 4.8701171875, 5.257080078125, 5.64404296875, 6.031005859375, 6.41796875, 6.804931640625, 7.19189453125, 7.578857421875, 7.9658203125, 8.352783203125, 8.73974609375, 9.126708984375, 9.513671875, 9.900634765625, 10.28759765625, 10.674560546875, 11.0615234375, 11.448486328125, 11.83544921875, 12.222412109375, 12.609375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 6.0, 7.0, 11.0, 15.0, 13.0, 24.0, 22.0, 22.0, 31.0, 35.0, 41.0, 44.0, 56.0, 51.0, 131.0, 290.0, 1466.0, 257.0, 106.0, 50.0, 58.0, 43.0, 35.0, 30.0, 29.0, 22.0, 26.0, 12.0, 18.0, 18.0, 12.0, 8.0, 18.0, 3.0, 5.0, 4.0, 1.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.65625, -13.25927734375, -12.8623046875, -12.46533203125, -12.068359375, -11.67138671875, -11.2744140625, -10.87744140625, -10.48046875, -10.08349609375, -9.6865234375, -9.28955078125, -8.892578125, -8.49560546875, -8.0986328125, -7.70166015625, -7.3046875, -6.90771484375, -6.5107421875, -6.11376953125, -5.716796875, -5.31982421875, -4.9228515625, -4.52587890625, -4.12890625, -3.73193359375, -3.3349609375, -2.93798828125, -2.541015625, -2.14404296875, -1.7470703125, -1.35009765625, -0.953125, -0.55615234375, -0.1591796875, 0.23779296875, 0.634765625, 1.03173828125, 1.4287109375, 1.82568359375, 2.22265625, 2.61962890625, 3.0166015625, 3.41357421875, 3.810546875, 4.20751953125, 4.6044921875, 5.00146484375, 5.3984375, 5.79541015625, 6.1923828125, 6.58935546875, 6.986328125, 7.38330078125, 7.7802734375, 8.17724609375, 8.57421875, 8.97119140625, 9.3681640625, 9.76513671875, 10.162109375, 10.55908203125, 10.9560546875, 11.35302734375, 11.75]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 9.0, 15.0, 17.0, 22.0, 28.0, 34.0, 45.0, 67.0, 105.0, 166.0, 328.0, 639.0, 1564.0, 11239.0, 3124802.0, 4263.0, 1099.0, 511.0, 271.0, 147.0, 82.0, 79.0, 43.0, 45.0, 18.0, 13.0, 10.0, 5.0, 4.0, 10.0, 5.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.3818359375, -60.326171875, -58.2705078125, -56.21484375, -54.1591796875, -52.103515625, -50.0478515625, -47.9921875, -45.9365234375, -43.880859375, -41.8251953125, -39.76953125, -37.7138671875, -35.658203125, -33.6025390625, -31.546875, -29.4912109375, -27.435546875, -25.3798828125, -23.32421875, -21.2685546875, -19.212890625, -17.1572265625, -15.1015625, -13.0458984375, -10.990234375, -8.9345703125, -6.87890625, -4.8232421875, -2.767578125, -0.7119140625, 1.34375, 3.3994140625, 5.455078125, 7.5107421875, 9.56640625, 11.6220703125, 13.677734375, 15.7333984375, 17.7890625, 19.8447265625, 21.900390625, 23.9560546875, 26.01171875, 28.0673828125, 30.123046875, 32.1787109375, 34.234375, 36.2900390625, 38.345703125, 40.4013671875, 42.45703125, 44.5126953125, 46.568359375, 48.6240234375, 50.6796875, 52.7353515625, 54.791015625, 56.8466796875, 58.90234375, 60.9580078125, 63.013671875, 65.0693359375, 67.125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 28.0, 242.0, 483.0, 218.0, 34.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-213.78399658203125, -209.54949951171875, -205.31500244140625, -201.08050537109375, -196.84600830078125, -192.61151123046875, -188.37701416015625, -184.14251708984375, -179.90802001953125, -175.67352294921875, -171.43902587890625, -167.20452880859375, -162.97003173828125, -158.73553466796875, -154.50103759765625, -150.26654052734375, -146.03204345703125, -141.79754638671875, -137.56304931640625, -133.32855224609375, -129.09405517578125, -124.85955810546875, -120.62506103515625, -116.39056396484375, -112.15606689453125, -107.92156982421875, -103.68707275390625, -99.45257568359375, -95.21807861328125, -90.98358154296875, -86.74908447265625, -82.51458740234375, -78.28010559082031, -74.04560852050781, -69.81111145019531, -65.57661437988281, -61.34211730957031, -57.10762023925781, -52.87312316894531, -48.63862609863281, -44.40412902832031, -40.16963195800781, -35.93513488769531, -31.700637817382812, -27.466140747070312, -23.231643676757812, -18.997146606445312, -14.762649536132812, -10.528152465820312, -6.2936553955078125, -2.0591583251953125, 2.1753387451171875, 6.4098358154296875, 10.644332885742188, 14.878829956054688, 19.113327026367188, 23.347824096679688, 27.582321166992188, 31.816818237304688, 36.05131530761719, 40.28581237792969, 44.52030944824219, 48.75480651855469, 52.98930358886719, 57.22380065917969]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 5.0, 11.0, 12.0, 17.0, 14.0, 12.0, 16.0, 17.0, 27.0, 24.0, 31.0, 31.0, 33.0, 24.0, 39.0, 41.0, 39.0, 39.0, 45.0, 40.0, 57.0, 42.0, 45.0, 36.0, 35.0, 40.0, 28.0, 32.0, 14.0, 31.0, 14.0, 15.0, 18.0, 18.0, 16.0, 13.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-44.88050079345703, -43.524410247802734, -42.16831970214844, -40.812225341796875, -39.45613479614258, -38.10004425048828, -36.74394989013672, -35.38785934448242, -34.031768798828125, -32.67567825317383, -31.3195858001709, -29.96349334716797, -28.607402801513672, -27.251312255859375, -25.895219802856445, -24.539127349853516, -23.18303680419922, -21.826946258544922, -20.470853805541992, -19.114761352539062, -17.758670806884766, -16.40258026123047, -15.046487808227539, -13.690396308898926, -12.334304809570312, -10.9782133102417, -9.622121810913086, -8.266030311584473, -6.909938812255859, -5.553847312927246, -4.197755813598633, -2.8416643142700195, -1.4855690002441406, -0.12947750091552734, 1.226613998413086, 2.582705497741699, 3.9387969970703125, 5.294888496398926, 6.650979995727539, 8.007071495056152, 9.363162994384766, 10.719254493713379, 12.075345993041992, 13.431437492370605, 14.787528991699219, 16.143619537353516, 17.499711990356445, 18.855804443359375, 20.211894989013672, 21.56798553466797, 22.9240779876709, 24.280170440673828, 25.636260986328125, 26.992351531982422, 28.34844398498535, 29.70453643798828, 31.060626983642578, 32.416717529296875, 33.77281188964844, 35.128902435302734, 36.48499298095703, 37.84108352661133, 39.197174072265625, 40.55326843261719, 41.909358978271484]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 8.0, 3.0, 4.0, 7.0, 10.0, 12.0, 16.0, 19.0, 24.0, 20.0, 21.0, 27.0, 26.0, 25.0, 31.0, 37.0, 37.0, 35.0, 39.0, 36.0, 51.0, 38.0, 41.0, 29.0, 34.0, 39.0, 37.0, 30.0, 39.0, 37.0, 28.0, 44.0, 24.0, 13.0, 17.0, 10.0, 16.0, 17.0, 4.0, 5.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.1680908203125, -4.004150390625, -3.8402099609375, -3.67626953125, -3.5123291015625, -3.348388671875, -3.1844482421875, -3.0205078125, -2.8565673828125, -2.692626953125, -2.5286865234375, -2.36474609375, -2.2008056640625, -2.036865234375, -1.8729248046875, -1.708984375, -1.5450439453125, -1.381103515625, -1.2171630859375, -1.05322265625, -0.8892822265625, -0.725341796875, -0.5614013671875, -0.3974609375, -0.2335205078125, -0.069580078125, 0.0943603515625, 0.25830078125, 0.4222412109375, 0.586181640625, 0.7501220703125, 0.9140625, 1.0780029296875, 1.241943359375, 1.4058837890625, 1.56982421875, 1.7337646484375, 1.897705078125, 2.0616455078125, 2.2255859375, 2.3895263671875, 2.553466796875, 2.7174072265625, 2.88134765625, 3.0452880859375, 3.209228515625, 3.3731689453125, 3.537109375, 3.7010498046875, 3.864990234375, 4.0289306640625, 4.19287109375, 4.3568115234375, 4.520751953125, 4.6846923828125, 4.8486328125, 5.0125732421875, 5.176513671875, 5.3404541015625, 5.50439453125, 5.6683349609375, 5.832275390625, 5.9962158203125, 6.16015625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 8.0, 3.0, 4.0, 5.0, 7.0, 12.0, 23.0, 30.0, 31.0, 32.0, 40.0, 60.0, 116.0, 169.0, 269.0, 422.0, 706.0, 1108.0, 1890.0, 3581.0, 7338.0, 18342.0, 62491.0, 315747.0, 1309386.0, 1780655.0, 542821.0, 103068.0, 26003.0, 9719.0, 4454.0, 2333.0, 1289.0, 760.0, 476.0, 264.0, 186.0, 125.0, 75.0, 66.0, 47.0, 36.0, 16.0, 23.0, 8.0, 15.0, 10.0, 11.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-7.66015625, -7.41436767578125, -7.1685791015625, -6.92279052734375, -6.677001953125, -6.43121337890625, -6.1854248046875, -5.93963623046875, -5.69384765625, -5.44805908203125, -5.2022705078125, -4.95648193359375, -4.710693359375, -4.46490478515625, -4.2191162109375, -3.97332763671875, -3.7275390625, -3.48175048828125, -3.2359619140625, -2.99017333984375, -2.744384765625, -2.49859619140625, -2.2528076171875, -2.00701904296875, -1.76123046875, -1.51544189453125, -1.2696533203125, -1.02386474609375, -0.778076171875, -0.53228759765625, -0.2864990234375, -0.04071044921875, 0.205078125, 0.45086669921875, 0.6966552734375, 0.94244384765625, 1.188232421875, 1.43402099609375, 1.6798095703125, 1.92559814453125, 2.17138671875, 2.41717529296875, 2.6629638671875, 2.90875244140625, 3.154541015625, 3.40032958984375, 3.6461181640625, 3.89190673828125, 4.1376953125, 4.38348388671875, 4.6292724609375, 4.87506103515625, 5.120849609375, 5.36663818359375, 5.6124267578125, 5.85821533203125, 6.10400390625, 6.34979248046875, 6.5955810546875, 6.84136962890625, 7.087158203125, 7.33294677734375, 7.5787353515625, 7.82452392578125, 8.0703125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 6.0, 16.0, 26.0, 34.0, 40.0, 94.0, 185.0, 318.0, 506.0, 791.0, 818.0, 530.0, 304.0, 182.0, 95.0, 58.0, 27.0, 17.0, 15.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -16.045654296875, -15.52880859375, -15.011962890625, -14.4951171875, -13.978271484375, -13.46142578125, -12.944580078125, -12.427734375, -11.910888671875, -11.39404296875, -10.877197265625, -10.3603515625, -9.843505859375, -9.32666015625, -8.809814453125, -8.29296875, -7.776123046875, -7.25927734375, -6.742431640625, -6.2255859375, -5.708740234375, -5.19189453125, -4.675048828125, -4.158203125, -3.641357421875, -3.12451171875, -2.607666015625, -2.0908203125, -1.573974609375, -1.05712890625, -0.540283203125, -0.0234375, 0.493408203125, 1.01025390625, 1.527099609375, 2.0439453125, 2.560791015625, 3.07763671875, 3.594482421875, 4.111328125, 4.628173828125, 5.14501953125, 5.661865234375, 6.1787109375, 6.695556640625, 7.21240234375, 7.729248046875, 8.24609375, 8.762939453125, 9.27978515625, 9.796630859375, 10.3134765625, 10.830322265625, 11.34716796875, 11.864013671875, 12.380859375, 12.897705078125, 13.41455078125, 13.931396484375, 14.4482421875, 14.965087890625, 15.48193359375, 15.998779296875, 16.515625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 16.0, 18.0, 44.0, 67.0, 182.0, 390.0, 1045.0, 4238.0, 471465.0, 3702201.0, 11801.0, 1739.0, 565.0, 258.0, 82.0, 51.0, 51.0, 17.0, 16.0, 4.0, 9.0, 6.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.21875, -35.0576171875, -33.896484375, -32.7353515625, -31.57421875, -30.4130859375, -29.251953125, -28.0908203125, -26.9296875, -25.7685546875, -24.607421875, -23.4462890625, -22.28515625, -21.1240234375, -19.962890625, -18.8017578125, -17.640625, -16.4794921875, -15.318359375, -14.1572265625, -12.99609375, -11.8349609375, -10.673828125, -9.5126953125, -8.3515625, -7.1904296875, -6.029296875, -4.8681640625, -3.70703125, -2.5458984375, -1.384765625, -0.2236328125, 0.9375, 2.0986328125, 3.259765625, 4.4208984375, 5.58203125, 6.7431640625, 7.904296875, 9.0654296875, 10.2265625, 11.3876953125, 12.548828125, 13.7099609375, 14.87109375, 16.0322265625, 17.193359375, 18.3544921875, 19.515625, 20.6767578125, 21.837890625, 22.9990234375, 24.16015625, 25.3212890625, 26.482421875, 27.6435546875, 28.8046875, 29.9658203125, 31.126953125, 32.2880859375, 33.44921875, 34.6103515625, 35.771484375, 36.9326171875, 38.09375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 222.0, 592.0, 182.0, 10.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.44705200195312, -153.61192321777344, -146.77679443359375, -139.94166564941406, -133.10653686523438, -126.27140808105469, -119.436279296875, -112.60115051269531, -105.76602172851562, -98.93089294433594, -92.09576416015625, -85.26063537597656, -78.42550659179688, -71.59037780761719, -64.7552490234375, -57.92012405395508, -51.084999084472656, -44.24987030029297, -37.41474151611328, -30.579614639282227, -23.74448585510254, -16.909358978271484, -10.074230194091797, -3.2391014099121094, 3.596027374267578, 10.431156158447266, 17.266284942626953, 24.101411819458008, 30.936540603637695, 37.77166748046875, 44.60679626464844, 51.441925048828125, 58.27705383300781, 65.1121826171875, 71.94731140136719, 78.78244018554688, 85.61756896972656, 92.45269775390625, 99.28782653808594, 106.12295532226562, 112.95808410644531, 119.793212890625, 126.62834167480469, 133.46347045898438, 140.29859924316406, 147.13372802734375, 153.96885681152344, 160.80398559570312, 167.63909912109375, 174.47422790527344, 181.30935668945312, 188.1444854736328, 194.9796142578125, 201.8147430419922, 208.64987182617188, 215.48500061035156, 222.32012939453125, 229.15525817871094, 235.99038696289062, 242.8255157470703, 249.66064453125, 256.4957580566406, 263.3309020996094, 270.166015625, 277.00115966796875]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 6.0, 5.0, 11.0, 19.0, 21.0, 21.0, 25.0, 25.0, 38.0, 45.0, 29.0, 34.0, 40.0, 39.0, 44.0, 51.0, 48.0, 50.0, 49.0, 50.0, 41.0, 40.0, 38.0, 37.0, 35.0, 26.0, 30.0, 22.0, 14.0, 14.0, 11.0, 6.0, 4.0, 9.0, 6.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.47022247314453, -35.155433654785156, -33.84064483642578, -32.52585983276367, -31.211071014404297, -29.896282196044922, -28.581493377685547, -27.266706466674805, -25.951919555664062, -24.637130737304688, -23.322343826293945, -22.00755500793457, -20.692768096923828, -19.377979278564453, -18.063190460205078, -16.748403549194336, -15.433614730834961, -14.118826866149902, -12.804039001464844, -11.489250183105469, -10.174463272094727, -8.859674453735352, -7.544886589050293, -6.230098724365234, -4.915310859680176, -3.600522994995117, -2.2857348918914795, -0.9709467887878418, 0.3438410758972168, 1.6586289405822754, 2.973417282104492, 4.288205146789551, 5.602993011474609, 6.917780876159668, 8.232568740844727, 9.547357559204102, 10.862144470214844, 12.176933288574219, 13.491721153259277, 14.806509017944336, 16.121295928955078, 17.436084747314453, 18.750871658325195, 20.06566047668457, 21.380447387695312, 22.695236206054688, 24.010025024414062, 25.324811935424805, 26.63960075378418, 27.954389572143555, 29.269176483154297, 30.583965301513672, 31.898752212524414, 33.213539123535156, 34.52832794189453, 35.843116760253906, 37.15790557861328, 38.472694396972656, 39.78748321533203, 41.10226821899414, 42.417057037353516, 43.73184585571289, 45.046634674072266, 46.361419677734375, 47.67620849609375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 7.0, 1.0, 3.0, 2.0, 3.0, 10.0, 6.0, 14.0, 9.0, 11.0, 12.0, 21.0, 11.0, 27.0, 21.0, 31.0, 29.0, 38.0, 26.0, 41.0, 48.0, 35.0, 41.0, 57.0, 40.0, 39.0, 43.0, 37.0, 36.0, 24.0, 28.0, 32.0, 30.0, 35.0, 32.0, 16.0, 21.0, 19.0, 18.0, 17.0, 9.0, 12.0, 6.0, 3.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69140625, -3.56146240234375, -3.4315185546875, -3.30157470703125, -3.171630859375, -3.04168701171875, -2.9117431640625, -2.78179931640625, -2.65185546875, -2.52191162109375, -2.3919677734375, -2.26202392578125, -2.132080078125, -2.00213623046875, -1.8721923828125, -1.74224853515625, -1.6123046875, -1.48236083984375, -1.3524169921875, -1.22247314453125, -1.092529296875, -0.96258544921875, -0.8326416015625, -0.70269775390625, -0.57275390625, -0.44281005859375, -0.3128662109375, -0.18292236328125, -0.052978515625, 0.07696533203125, 0.2069091796875, 0.33685302734375, 0.466796875, 0.59674072265625, 0.7266845703125, 0.85662841796875, 0.986572265625, 1.11651611328125, 1.2464599609375, 1.37640380859375, 1.50634765625, 1.63629150390625, 1.7662353515625, 1.89617919921875, 2.026123046875, 2.15606689453125, 2.2860107421875, 2.41595458984375, 2.5458984375, 2.67584228515625, 2.8057861328125, 2.93572998046875, 3.065673828125, 3.19561767578125, 3.3255615234375, 3.45550537109375, 3.58544921875, 3.71539306640625, 3.8453369140625, 3.97528076171875, 4.105224609375, 4.23516845703125, 4.3651123046875, 4.49505615234375, 4.625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 13.0, 12.0, 23.0, 30.0, 32.0, 61.0, 76.0, 131.0, 169.0, 344.0, 526.0, 864.0, 1484.0, 2523.0, 4145.0, 7120.0, 12542.0, 21545.0, 37100.0, 64034.0, 108306.0, 170550.0, 208818.0, 162724.0, 102207.0, 60141.0, 34770.0, 20097.0, 11676.0, 6736.0, 3912.0, 2308.0, 1323.0, 862.0, 484.0, 294.0, 203.0, 105.0, 78.0, 51.0, 43.0, 27.0, 23.0, 14.0, 5.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3359375, -0.3252525329589844, -0.31456756591796875, -0.3038825988769531, -0.2931976318359375, -0.2825126647949219, -0.27182769775390625, -0.2611427307128906, -0.250457763671875, -0.23977279663085938, -0.22908782958984375, -0.21840286254882812, -0.2077178955078125, -0.19703292846679688, -0.18634796142578125, -0.17566299438476562, -0.16497802734375, -0.15429306030273438, -0.14360809326171875, -0.13292312622070312, -0.1222381591796875, -0.11155319213867188, -0.10086822509765625, -0.09018325805664062, -0.079498291015625, -0.06881332397460938, -0.05812835693359375, -0.047443389892578125, -0.0367584228515625, -0.026073455810546875, -0.01538848876953125, -0.004703521728515625, 0.0059814453125, 0.016666412353515625, 0.02735137939453125, 0.038036346435546875, 0.0487213134765625, 0.059406280517578125, 0.07009124755859375, 0.08077621459960938, 0.091461181640625, 0.10214614868164062, 0.11283111572265625, 0.12351608276367188, 0.1342010498046875, 0.14488601684570312, 0.15557098388671875, 0.16625595092773438, 0.17694091796875, 0.18762588500976562, 0.19831085205078125, 0.20899581909179688, 0.2196807861328125, 0.23036575317382812, 0.24105072021484375, 0.2517356872558594, 0.262420654296875, 0.2731056213378906, 0.28379058837890625, 0.2944755554199219, 0.3051605224609375, 0.3158454895019531, 0.32653045654296875, 0.3372154235839844, 0.347900390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 2.0, 10.0, 11.0, 10.0, 18.0, 16.0, 13.0, 14.0, 16.0, 17.0, 30.0, 21.0, 26.0, 29.0, 42.0, 38.0, 33.0, 34.0, 40.0, 36.0, 34.0, 1055.0, 58.0, 37.0, 42.0, 34.0, 31.0, 27.0, 31.0, 25.0, 28.0, 20.0, 22.0, 20.0, 15.0, 14.0, 9.0, 11.0, 7.0, 7.0, 10.0, 5.0, 12.0, 1.0, 5.0, 1.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.478515625, -2.401397705078125, -2.32427978515625, -2.247161865234375, -2.1700439453125, -2.092926025390625, -2.01580810546875, -1.938690185546875, -1.861572265625, -1.784454345703125, -1.70733642578125, -1.630218505859375, -1.5531005859375, -1.475982666015625, -1.39886474609375, -1.321746826171875, -1.24462890625, -1.167510986328125, -1.09039306640625, -1.013275146484375, -0.9361572265625, -0.859039306640625, -0.78192138671875, -0.704803466796875, -0.627685546875, -0.550567626953125, -0.47344970703125, -0.396331787109375, -0.3192138671875, -0.242095947265625, -0.16497802734375, -0.087860107421875, -0.0107421875, 0.066375732421875, 0.14349365234375, 0.220611572265625, 0.2977294921875, 0.374847412109375, 0.45196533203125, 0.529083251953125, 0.606201171875, 0.683319091796875, 0.76043701171875, 0.837554931640625, 0.9146728515625, 0.991790771484375, 1.06890869140625, 1.146026611328125, 1.22314453125, 1.300262451171875, 1.37738037109375, 1.454498291015625, 1.5316162109375, 1.608734130859375, 1.68585205078125, 1.762969970703125, 1.840087890625, 1.917205810546875, 1.99432373046875, 2.071441650390625, 2.1485595703125, 2.225677490234375, 2.30279541015625, 2.379913330078125, 2.45703125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 9.0, 13.0, 13.0, 29.0, 38.0, 51.0, 76.0, 117.0, 176.0, 262.0, 346.0, 499.0, 770.0, 1115.0, 1756.0, 2686.0, 3919.0, 6103.0, 9100.0, 13717.0, 20464.0, 30231.0, 43933.0, 62985.0, 86739.0, 112985.0, 970444.0, 341673.0, 110859.0, 84500.0, 61108.0, 42674.0, 29265.0, 19536.0, 12996.0, 8801.0, 5741.0, 3853.0, 2558.0, 1659.0, 1034.0, 728.0, 508.0, 364.0, 229.0, 162.0, 109.0, 66.0, 37.0, 39.0, 24.0, 15.0, 6.0, 8.0, 1.0, 3.0, 5.0, 2.0, 3.0, 1.0], "bins": [-0.17138671875, -0.1658496856689453, -0.16031265258789062, -0.15477561950683594, -0.14923858642578125, -0.14370155334472656, -0.13816452026367188, -0.1326274871826172, -0.1270904541015625, -0.12155342102050781, -0.11601638793945312, -0.11047935485839844, -0.10494232177734375, -0.09940528869628906, -0.09386825561523438, -0.08833122253417969, -0.082794189453125, -0.07725715637207031, -0.07172012329101562, -0.06618309020996094, -0.06064605712890625, -0.05510902404785156, -0.049571990966796875, -0.04403495788574219, -0.0384979248046875, -0.03296089172363281, -0.027423858642578125, -0.021886825561523438, -0.01634979248046875, -0.010812759399414062, -0.005275726318359375, 0.0002613067626953125, 0.00579833984375, 0.011335372924804688, 0.016872406005859375, 0.022409439086914062, 0.02794647216796875, 0.03348350524902344, 0.039020538330078125, 0.04455757141113281, 0.0500946044921875, 0.05563163757324219, 0.061168670654296875, 0.06670570373535156, 0.07224273681640625, 0.07777976989746094, 0.08331680297851562, 0.08885383605957031, 0.094390869140625, 0.09992790222167969, 0.10546493530273438, 0.11100196838378906, 0.11653900146484375, 0.12207603454589844, 0.12761306762695312, 0.1331501007080078, 0.1386871337890625, 0.1442241668701172, 0.14976119995117188, 0.15529823303222656, 0.16083526611328125, 0.16637229919433594, 0.17190933227539062, 0.1774463653564453, 0.1829833984375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 6.0, 7.0, 9.0, 16.0, 13.0, 25.0, 19.0, 44.0, 41.0, 49.0, 76.0, 83.0, 108.0, 101.0, 89.0, 66.0, 56.0, 48.0, 30.0, 26.0, 15.0, 17.0, 14.0, 10.0, 9.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00672149658203125, -0.006494998931884766, -0.006268501281738281, -0.006042003631591797, -0.0058155059814453125, -0.005589008331298828, -0.005362510681152344, -0.005136013031005859, -0.004909515380859375, -0.004683017730712891, -0.004456520080566406, -0.004230022430419922, -0.0040035247802734375, -0.003777027130126953, -0.0035505294799804688, -0.0033240318298339844, -0.0030975341796875, -0.0028710365295410156, -0.0026445388793945312, -0.002418041229248047, -0.0021915435791015625, -0.001965045928955078, -0.0017385482788085938, -0.0015120506286621094, -0.001285552978515625, -0.0010590553283691406, -0.0008325576782226562, -0.0006060600280761719, -0.0003795623779296875, -0.00015306472778320312, 7.343292236328125e-05, 0.0002999305725097656, 0.00052642822265625, 0.0007529258728027344, 0.0009794235229492188, 0.0012059211730957031, 0.0014324188232421875, 0.0016589164733886719, 0.0018854141235351562, 0.0021119117736816406, 0.002338409423828125, 0.0025649070739746094, 0.0027914047241210938, 0.003017902374267578, 0.0032444000244140625, 0.003470897674560547, 0.0036973953247070312, 0.003923892974853516, 0.004150390625, 0.004376888275146484, 0.004603385925292969, 0.004829883575439453, 0.0050563812255859375, 0.005282878875732422, 0.005509376525878906, 0.005735874176025391, 0.005962371826171875, 0.006188869476318359, 0.006415367126464844, 0.006641864776611328, 0.0068683624267578125, 0.007094860076904297, 0.007321357727050781, 0.007547855377197266, 0.00777435302734375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 4.0, 12.0, 12.0, 17.0, 22.0, 23.0, 33.0, 30.0, 55.0, 71.0, 118.0, 171.0, 264.0, 458.0, 1132.0, 36174.0, 999684.0, 8465.0, 745.0, 345.0, 228.0, 134.0, 100.0, 67.0, 38.0, 44.0, 19.0, 17.0, 15.0, 12.0, 9.0, 8.0, 5.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1328125, -0.12894725799560547, -0.12508201599121094, -0.1212167739868164, -0.11735153198242188, -0.11348628997802734, -0.10962104797363281, -0.10575580596923828, -0.10189056396484375, -0.09802532196044922, -0.09416007995605469, -0.09029483795166016, -0.08642959594726562, -0.0825643539428711, -0.07869911193847656, -0.07483386993408203, -0.0709686279296875, -0.06710338592529297, -0.06323814392089844, -0.059372901916503906, -0.055507659912109375, -0.051642417907714844, -0.04777717590332031, -0.04391193389892578, -0.04004669189453125, -0.03618144989013672, -0.03231620788574219, -0.028450965881347656, -0.024585723876953125, -0.020720481872558594, -0.016855239868164062, -0.012989997863769531, -0.009124755859375, -0.005259513854980469, -0.0013942718505859375, 0.0024709701538085938, 0.006336212158203125, 0.010201454162597656, 0.014066696166992188, 0.01793193817138672, 0.02179718017578125, 0.02566242218017578, 0.029527664184570312, 0.033392906188964844, 0.037258148193359375, 0.041123390197753906, 0.04498863220214844, 0.04885387420654297, 0.0527191162109375, 0.05658435821533203, 0.06044960021972656, 0.0643148422241211, 0.06818008422851562, 0.07204532623291016, 0.07591056823730469, 0.07977581024169922, 0.08364105224609375, 0.08750629425048828, 0.09137153625488281, 0.09523677825927734, 0.09910202026367188, 0.1029672622680664, 0.10683250427246094, 0.11069774627685547, 0.11456298828125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 450.0, 552.0, 9.0], "bins": [-0.14696530997753143, -0.1445966511964798, -0.14222797751426697, -0.13985931873321533, -0.1374906450510025, -0.13512198626995087, -0.13275332748889923, -0.1303846538066864, -0.12801599502563477, -0.12564733624458313, -0.1232786625623703, -0.12091000378131866, -0.11854133754968643, -0.1161726713180542, -0.11380400508642197, -0.11143533885478973, -0.1090666726231575, -0.10669800639152527, -0.10432934015989304, -0.1019606813788414, -0.09959201514720917, -0.09722334891557693, -0.0948546826839447, -0.09248601645231247, -0.09011735022068024, -0.087748683989048, -0.08538001775741577, -0.08301135897636414, -0.0806426927447319, -0.07827402651309967, -0.07590536028146744, -0.0735366940498352, -0.07116802781820297, -0.06879936158657074, -0.06643069535493851, -0.06406203657388687, -0.06169337034225464, -0.059324704110622406, -0.05695603787899017, -0.05458737164735794, -0.052218709141016006, -0.049850042909383774, -0.04748138040304184, -0.04511271417140961, -0.042744047939777374, -0.04037538543343544, -0.03800671920180321, -0.03563805669546127, -0.03326939046382904, -0.030900726094841957, -0.028532061725854874, -0.02616339549422264, -0.023794731125235558, -0.021426066756248474, -0.01905740052461624, -0.016688736155629158, -0.014320071786642075, -0.011951407417654991, -0.009582742117345333, -0.007214077282696962, -0.004845412448048592, -0.002476748079061508, -0.00010808277875185013, 0.002260582521557808, 0.004629246890544891]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 15.0, 17.0, 26.0, 41.0, 39.0, 61.0, 77.0, 86.0, 86.0, 91.0, 107.0, 77.0, 68.0, 56.0, 47.0, 38.0, 34.0, 21.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012537539005279541, -0.012221626937389374, -0.011905714869499207, -0.01158980280160904, -0.011273890733718872, -0.010957978665828705, -0.010642066597938538, -0.01032615453004837, -0.010010242462158203, -0.009694330394268036, -0.009378418326377869, -0.009062506258487701, -0.008746594190597534, -0.008430682122707367, -0.0081147700548172, -0.0077988579869270325, -0.007482945919036865, -0.007167033851146698, -0.006851121783256531, -0.0065352097153663635, -0.006219297647476196, -0.005903385579586029, -0.005587473511695862, -0.005271561443805695, -0.004955649375915527, -0.00463973730802536, -0.004323825240135193, -0.004007913172245026, -0.0036920011043548584, -0.003376089036464691, -0.003060176968574524, -0.0027442649006843567, -0.0024283528327941895, -0.002112440764904022, -0.001796528697013855, -0.0014806166291236877, -0.0011647045612335205, -0.0008487924933433533, -0.000532880425453186, -0.0002169683575630188, 9.894371032714844e-05, 0.0004148557782173157, 0.0007307678461074829, 0.0010466799139976501, 0.0013625919818878174, 0.0016785040497779846, 0.001994416117668152, 0.002310328185558319, 0.0026262402534484863, 0.0029421523213386536, 0.003258064389228821, 0.003573976457118988, 0.0038898885250091553, 0.0042058005928993225, 0.00452171266078949, 0.004837624728679657, 0.005153536796569824, 0.0054694488644599915, 0.005785360932350159, 0.006101273000240326, 0.006417185068130493, 0.00673309713602066, 0.007049009203910828, 0.007364921271800995, 0.007680833339691162]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 7.0, 1.0, 3.0, 2.0, 3.0, 10.0, 6.0, 14.0, 9.0, 11.0, 12.0, 21.0, 11.0, 27.0, 20.0, 32.0, 29.0, 38.0, 26.0, 41.0, 48.0, 35.0, 41.0, 56.0, 41.0, 39.0, 43.0, 37.0, 36.0, 24.0, 28.0, 32.0, 30.0, 35.0, 32.0, 16.0, 21.0, 19.0, 18.0, 17.0, 9.0, 12.0, 6.0, 3.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69140625, -3.56146240234375, -3.4315185546875, -3.30157470703125, -3.171630859375, -3.04168701171875, -2.9117431640625, -2.78179931640625, -2.65185546875, -2.52191162109375, -2.3919677734375, -2.26202392578125, -2.132080078125, -2.00213623046875, -1.8721923828125, -1.74224853515625, -1.6123046875, -1.48236083984375, -1.3524169921875, -1.22247314453125, -1.092529296875, -0.96258544921875, -0.8326416015625, -0.70269775390625, -0.57275390625, -0.44281005859375, -0.3128662109375, -0.18292236328125, -0.052978515625, 0.07696533203125, 0.2069091796875, 0.33685302734375, 0.466796875, 0.59674072265625, 0.7266845703125, 0.85662841796875, 0.986572265625, 1.11651611328125, 1.2464599609375, 1.37640380859375, 1.50634765625, 1.63629150390625, 1.7662353515625, 1.89617919921875, 2.026123046875, 2.15606689453125, 2.2860107421875, 2.41595458984375, 2.5458984375, 2.67584228515625, 2.8057861328125, 2.93572998046875, 3.065673828125, 3.19561767578125, 3.3255615234375, 3.45550537109375, 3.58544921875, 3.71539306640625, 3.8453369140625, 3.97528076171875, 4.105224609375, 4.23516845703125, 4.3651123046875, 4.49505615234375, 4.625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 5.0, 14.0, 17.0, 9.0, 12.0, 16.0, 25.0, 35.0, 41.0, 58.0, 70.0, 93.0, 109.0, 150.0, 215.0, 281.0, 397.0, 528.0, 864.0, 1283.0, 2306.0, 4886.0, 12003.0, 40957.0, 208818.0, 559782.0, 161393.0, 33528.0, 10302.0, 4286.0, 2081.0, 1202.0, 782.0, 486.0, 369.0, 267.0, 212.0, 156.0, 142.0, 88.0, 74.0, 56.0, 41.0, 23.0, 25.0, 13.0, 21.0, 15.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0078125, -5.80364990234375, -5.5994873046875, -5.39532470703125, -5.191162109375, -4.98699951171875, -4.7828369140625, -4.57867431640625, -4.37451171875, -4.17034912109375, -3.9661865234375, -3.76202392578125, -3.557861328125, -3.35369873046875, -3.1495361328125, -2.94537353515625, -2.7412109375, -2.53704833984375, -2.3328857421875, -2.12872314453125, -1.924560546875, -1.72039794921875, -1.5162353515625, -1.31207275390625, -1.10791015625, -0.90374755859375, -0.6995849609375, -0.49542236328125, -0.291259765625, -0.08709716796875, 0.1170654296875, 0.32122802734375, 0.525390625, 0.72955322265625, 0.9337158203125, 1.13787841796875, 1.342041015625, 1.54620361328125, 1.7503662109375, 1.95452880859375, 2.15869140625, 2.36285400390625, 2.5670166015625, 2.77117919921875, 2.975341796875, 3.17950439453125, 3.3836669921875, 3.58782958984375, 3.7919921875, 3.99615478515625, 4.2003173828125, 4.40447998046875, 4.608642578125, 4.81280517578125, 5.0169677734375, 5.22113037109375, 5.42529296875, 5.62945556640625, 5.8336181640625, 6.03778076171875, 6.241943359375, 6.44610595703125, 6.6502685546875, 6.85443115234375, 7.05859375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 5.0, 6.0, 9.0, 9.0, 7.0, 5.0, 16.0, 15.0, 15.0, 24.0, 36.0, 31.0, 45.0, 48.0, 52.0, 73.0, 114.0, 297.0, 1487.0, 251.0, 122.0, 65.0, 58.0, 57.0, 36.0, 41.0, 26.0, 24.0, 12.0, 8.0, 8.0, 7.0, 8.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-15.0703125, -14.6456298828125, -14.220947265625, -13.7962646484375, -13.37158203125, -12.9468994140625, -12.522216796875, -12.0975341796875, -11.6728515625, -11.2481689453125, -10.823486328125, -10.3988037109375, -9.97412109375, -9.5494384765625, -9.124755859375, -8.7000732421875, -8.275390625, -7.8507080078125, -7.426025390625, -7.0013427734375, -6.57666015625, -6.1519775390625, -5.727294921875, -5.3026123046875, -4.8779296875, -4.4532470703125, -4.028564453125, -3.6038818359375, -3.17919921875, -2.7545166015625, -2.329833984375, -1.9051513671875, -1.48046875, -1.0557861328125, -0.631103515625, -0.2064208984375, 0.21826171875, 0.6429443359375, 1.067626953125, 1.4923095703125, 1.9169921875, 2.3416748046875, 2.766357421875, 3.1910400390625, 3.61572265625, 4.0404052734375, 4.465087890625, 4.8897705078125, 5.314453125, 5.7391357421875, 6.163818359375, 6.5885009765625, 7.01318359375, 7.4378662109375, 7.862548828125, 8.2872314453125, 8.7119140625, 9.1365966796875, 9.561279296875, 9.9859619140625, 10.41064453125, 10.8353271484375, 11.260009765625, 11.6846923828125, 12.109375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 7.0, 5.0, 12.0, 10.0, 16.0, 15.0, 37.0, 41.0, 76.0, 92.0, 142.0, 224.0, 398.0, 1025.0, 5680.0, 3076984.0, 57437.0, 1921.0, 631.0, 320.0, 152.0, 121.0, 101.0, 58.0, 44.0, 40.0, 32.0, 12.0, 20.0, 12.0, 14.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.671875, -26.674072265625, -25.67626953125, -24.678466796875, -23.6806640625, -22.682861328125, -21.68505859375, -20.687255859375, -19.689453125, -18.691650390625, -17.69384765625, -16.696044921875, -15.6982421875, -14.700439453125, -13.70263671875, -12.704833984375, -11.70703125, -10.709228515625, -9.71142578125, -8.713623046875, -7.7158203125, -6.718017578125, -5.72021484375, -4.722412109375, -3.724609375, -2.726806640625, -1.72900390625, -0.731201171875, 0.2666015625, 1.264404296875, 2.26220703125, 3.260009765625, 4.2578125, 5.255615234375, 6.25341796875, 7.251220703125, 8.2490234375, 9.246826171875, 10.24462890625, 11.242431640625, 12.240234375, 13.238037109375, 14.23583984375, 15.233642578125, 16.2314453125, 17.229248046875, 18.22705078125, 19.224853515625, 20.22265625, 21.220458984375, 22.21826171875, 23.216064453125, 24.2138671875, 25.211669921875, 26.20947265625, 27.207275390625, 28.205078125, 29.202880859375, 30.20068359375, 31.198486328125, 32.1962890625, 33.194091796875, 34.19189453125, 35.189697265625, 36.1875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 172.0, 827.0, 12.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-382.6285400390625, -375.70989990234375, -368.7912292480469, -361.8725891113281, -354.95391845703125, -348.0352783203125, -341.1166076660156, -334.1979675292969, -327.279296875, -320.36065673828125, -313.4419860839844, -306.5233459472656, -299.60467529296875, -292.68603515625, -285.7673645019531, -278.8487243652344, -271.9300537109375, -265.01141357421875, -258.0927429199219, -251.17408752441406, -244.25543212890625, -237.33677673339844, -230.41812133789062, -223.4994659423828, -216.58082580566406, -209.66217041015625, -202.74351501464844, -195.82485961914062, -188.9062042236328, -181.987548828125, -175.0688934326172, -168.15023803710938, -161.23159790039062, -154.3129425048828, -147.394287109375, -140.4756317138672, -133.55697631835938, -126.63832092285156, -119.71966552734375, -112.80101013183594, -105.88235473632812, -98.96369934082031, -92.0450439453125, -85.12638854980469, -78.20773315429688, -71.28907775878906, -64.37042236328125, -57.4517707824707, -50.533111572265625, -43.61445617675781, -36.69580078125, -29.77714729309082, -22.858491897583008, -15.939838409423828, -9.021183013916016, -2.102527618408203, 4.816127777099609, 11.734783172607422, 18.653438568115234, 25.572092056274414, 32.490745544433594, 39.409400939941406, 46.32805633544922, 53.24671173095703, 60.165367126464844]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 5.0, 9.0, 7.0, 7.0, 9.0, 9.0, 14.0, 9.0, 19.0, 19.0, 18.0, 27.0, 36.0, 30.0, 27.0, 34.0, 36.0, 48.0, 38.0, 40.0, 38.0, 40.0, 38.0, 49.0, 41.0, 29.0, 31.0, 26.0, 30.0, 34.0, 32.0, 25.0, 25.0, 17.0, 19.0, 15.0, 18.0, 10.0, 11.0, 7.0, 4.0, 11.0, 6.0, 1.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.71405029296875, -25.867168426513672, -25.020286560058594, -24.173404693603516, -23.326522827148438, -22.47964096069336, -21.63275909423828, -20.785877227783203, -19.938995361328125, -19.092113494873047, -18.24523162841797, -17.39834976196289, -16.551467895507812, -15.704586029052734, -14.857704162597656, -14.010822296142578, -13.163941383361816, -12.317059516906738, -11.47017765045166, -10.623295783996582, -9.776413917541504, -8.929533004760742, -8.082651138305664, -7.235768795013428, -6.38888692855835, -5.5420050621032715, -4.695123195648193, -3.8482415676116943, -3.001359701156616, -2.154478073120117, -1.307596206665039, -0.46071434020996094, 0.3861675262451172, 1.2330493927001953, 2.0799312591552734, 2.9268128871917725, 3.7736947536468506, 4.62057638168335, 5.467458248138428, 6.314340114593506, 7.161221981048584, 8.008103370666504, 8.854985237121582, 9.70186710357666, 10.548748970031738, 11.395630836486816, 12.242512702941895, 13.089394569396973, 13.93627643585205, 14.783158302307129, 15.630040168762207, 16.47692108154297, 17.323802947998047, 18.170684814453125, 19.017566680908203, 19.86444854736328, 20.71133041381836, 21.558212280273438, 22.405094146728516, 23.251976013183594, 24.098857879638672, 24.94573974609375, 25.792621612548828, 26.639503479003906, 27.486385345458984]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 5.0, 5.0, 14.0, 13.0, 14.0, 19.0, 19.0, 21.0, 27.0, 33.0, 38.0, 36.0, 49.0, 31.0, 40.0, 28.0, 41.0, 40.0, 51.0, 53.0, 42.0, 42.0, 34.0, 43.0, 25.0, 32.0, 30.0, 24.0, 32.0, 26.0, 20.0, 11.0, 14.0, 11.0, 12.0, 4.0, 9.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0234375, -4.8665771484375, -4.709716796875, -4.5528564453125, -4.39599609375, -4.2391357421875, -4.082275390625, -3.9254150390625, -3.7685546875, -3.6116943359375, -3.454833984375, -3.2979736328125, -3.14111328125, -2.9842529296875, -2.827392578125, -2.6705322265625, -2.513671875, -2.3568115234375, -2.199951171875, -2.0430908203125, -1.88623046875, -1.7293701171875, -1.572509765625, -1.4156494140625, -1.2587890625, -1.1019287109375, -0.945068359375, -0.7882080078125, -0.63134765625, -0.4744873046875, -0.317626953125, -0.1607666015625, -0.00390625, 0.1529541015625, 0.309814453125, 0.4666748046875, 0.62353515625, 0.7803955078125, 0.937255859375, 1.0941162109375, 1.2509765625, 1.4078369140625, 1.564697265625, 1.7215576171875, 1.87841796875, 2.0352783203125, 2.192138671875, 2.3489990234375, 2.505859375, 2.6627197265625, 2.819580078125, 2.9764404296875, 3.13330078125, 3.2901611328125, 3.447021484375, 3.6038818359375, 3.7607421875, 3.9176025390625, 4.074462890625, 4.2313232421875, 4.38818359375, 4.5450439453125, 4.701904296875, 4.8587646484375, 5.015625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 8.0, 21.0, 17.0, 24.0, 36.0, 43.0, 65.0, 105.0, 137.0, 165.0, 239.0, 395.0, 517.0, 902.0, 1908.0, 6513.0, 106965.0, 3402130.0, 653414.0, 14672.0, 2746.0, 1093.0, 669.0, 428.0, 306.0, 205.0, 158.0, 113.0, 79.0, 50.0, 27.0, 27.0, 14.0, 18.0, 14.0, 9.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.953125, -23.1728515625, -22.392578125, -21.6123046875, -20.83203125, -20.0517578125, -19.271484375, -18.4912109375, -17.7109375, -16.9306640625, -16.150390625, -15.3701171875, -14.58984375, -13.8095703125, -13.029296875, -12.2490234375, -11.46875, -10.6884765625, -9.908203125, -9.1279296875, -8.34765625, -7.5673828125, -6.787109375, -6.0068359375, -5.2265625, -4.4462890625, -3.666015625, -2.8857421875, -2.10546875, -1.3251953125, -0.544921875, 0.2353515625, 1.015625, 1.7958984375, 2.576171875, 3.3564453125, 4.13671875, 4.9169921875, 5.697265625, 6.4775390625, 7.2578125, 8.0380859375, 8.818359375, 9.5986328125, 10.37890625, 11.1591796875, 11.939453125, 12.7197265625, 13.5, 14.2802734375, 15.060546875, 15.8408203125, 16.62109375, 17.4013671875, 18.181640625, 18.9619140625, 19.7421875, 20.5224609375, 21.302734375, 22.0830078125, 22.86328125, 23.6435546875, 24.423828125, 25.2041015625, 25.984375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 9.0, 9.0, 9.0, 13.0, 28.0, 36.0, 45.0, 90.0, 151.0, 239.0, 362.0, 512.0, 569.0, 577.0, 470.0, 313.0, 242.0, 156.0, 80.0, 60.0, 30.0, 27.0, 10.0, 10.0, 4.0, 3.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.421875, -10.0753173828125, -9.728759765625, -9.3822021484375, -9.03564453125, -8.6890869140625, -8.342529296875, -7.9959716796875, -7.6494140625, -7.3028564453125, -6.956298828125, -6.6097412109375, -6.26318359375, -5.9166259765625, -5.570068359375, -5.2235107421875, -4.876953125, -4.5303955078125, -4.183837890625, -3.8372802734375, -3.49072265625, -3.1441650390625, -2.797607421875, -2.4510498046875, -2.1044921875, -1.7579345703125, -1.411376953125, -1.0648193359375, -0.71826171875, -0.3717041015625, -0.025146484375, 0.3214111328125, 0.66796875, 1.0145263671875, 1.361083984375, 1.7076416015625, 2.05419921875, 2.4007568359375, 2.747314453125, 3.0938720703125, 3.4404296875, 3.7869873046875, 4.133544921875, 4.4801025390625, 4.82666015625, 5.1732177734375, 5.519775390625, 5.8663330078125, 6.212890625, 6.5594482421875, 6.906005859375, 7.2525634765625, 7.59912109375, 7.9456787109375, 8.292236328125, 8.6387939453125, 8.9853515625, 9.3319091796875, 9.678466796875, 10.0250244140625, 10.37158203125, 10.7181396484375, 11.064697265625, 11.4112548828125, 11.7578125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 1.0, 10.0, 8.0, 14.0, 12.0, 20.0, 40.0, 73.0, 160.0, 271.0, 610.0, 1419.0, 4572.0, 18353.0, 137790.0, 1471751.0, 2262970.0, 257803.0, 28990.0, 5994.0, 1920.0, 791.0, 337.0, 150.0, 85.0, 47.0, 26.0, 24.0, 16.0, 13.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.9921875, -11.6602783203125, -11.328369140625, -10.9964599609375, -10.66455078125, -10.3326416015625, -10.000732421875, -9.6688232421875, -9.3369140625, -9.0050048828125, -8.673095703125, -8.3411865234375, -8.00927734375, -7.6773681640625, -7.345458984375, -7.0135498046875, -6.681640625, -6.3497314453125, -6.017822265625, -5.6859130859375, -5.35400390625, -5.0220947265625, -4.690185546875, -4.3582763671875, -4.0263671875, -3.6944580078125, -3.362548828125, -3.0306396484375, -2.69873046875, -2.3668212890625, -2.034912109375, -1.7030029296875, -1.37109375, -1.0391845703125, -0.707275390625, -0.3753662109375, -0.04345703125, 0.2884521484375, 0.620361328125, 0.9522705078125, 1.2841796875, 1.6160888671875, 1.947998046875, 2.2799072265625, 2.61181640625, 2.9437255859375, 3.275634765625, 3.6075439453125, 3.939453125, 4.2713623046875, 4.603271484375, 4.9351806640625, 5.26708984375, 5.5989990234375, 5.930908203125, 6.2628173828125, 6.5947265625, 6.9266357421875, 7.258544921875, 7.5904541015625, 7.92236328125, 8.2542724609375, 8.586181640625, 8.9180908203125, 9.25]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 11.0, 9.0, 20.0, 29.0, 45.0, 53.0, 72.0, 86.0, 115.0, 107.0, 99.0, 100.0, 68.0, 60.0, 44.0, 25.0, 16.0, 9.0, 14.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.067909240722656, -37.87989807128906, -35.69188690185547, -33.503875732421875, -31.315866470336914, -29.12785530090332, -26.93984603881836, -24.751834869384766, -22.563823699951172, -20.375812530517578, -18.187801361083984, -15.999792098999023, -13.81178092956543, -11.623769760131836, -9.435759544372559, -7.247749328613281, -5.0597381591796875, -2.871727466583252, -0.6837167739868164, 1.5042939186096191, 3.6923046112060547, 5.880315780639648, 8.068325996398926, 10.256336212158203, 12.444347381591797, 14.63235855102539, 16.820369720458984, 19.008378982543945, 21.19639015197754, 23.384401321411133, 25.572410583496094, 27.760421752929688, 29.94842529296875, 32.136436462402344, 34.32444763183594, 36.51245880126953, 38.700469970703125, 40.88848114013672, 43.07648849487305, 45.26449966430664, 47.452510833740234, 49.64052200317383, 51.82853317260742, 54.016544342041016, 56.204551696777344, 58.39256286621094, 60.58057403564453, 62.768585205078125, 64.95659637451172, 67.14460754394531, 69.3326187133789, 71.5206298828125, 73.7086410522461, 75.89665222167969, 78.08466339111328, 80.27267456054688, 82.46067810058594, 84.64868927001953, 86.83670043945312, 89.02471160888672, 91.21272277832031, 93.4007339477539, 95.5887451171875, 97.77674865722656, 99.96476745605469]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 7.0, 3.0, 3.0, 2.0, 5.0, 12.0, 8.0, 8.0, 19.0, 18.0, 19.0, 29.0, 22.0, 25.0, 26.0, 27.0, 45.0, 33.0, 32.0, 31.0, 40.0, 33.0, 42.0, 37.0, 41.0, 39.0, 41.0, 40.0, 34.0, 29.0, 32.0, 24.0, 23.0, 25.0, 22.0, 22.0, 24.0, 16.0, 20.0, 17.0, 9.0, 8.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-37.983272552490234, -36.90467071533203, -35.82606887817383, -34.747467041015625, -33.66886520385742, -32.59026336669922, -31.51166343688965, -30.433061599731445, -29.354459762573242, -28.27585792541504, -27.197256088256836, -26.118654251098633, -25.040054321289062, -23.96145248413086, -22.882850646972656, -21.804248809814453, -20.72564697265625, -19.647045135498047, -18.568443298339844, -17.48984146118164, -16.411239624023438, -15.33263874053955, -14.254037857055664, -13.175436019897461, -12.096834182739258, -11.018232345581055, -9.939630508422852, -8.861029624938965, -7.782427787780762, -6.703825950622559, -5.625224590301514, -4.546623229980469, -3.4680233001708984, -2.3894217014312744, -1.3108201026916504, -0.23221850395202637, 0.8463830947875977, 1.9249849319458008, 3.0035862922668457, 4.082187652587891, 5.160789489746094, 6.239391326904297, 7.317992687225342, 8.396594047546387, 9.47519588470459, 10.553797721862793, 11.63239860534668, 12.711000442504883, 13.789602279663086, 14.868204116821289, 15.946805953979492, 17.025407791137695, 18.104007720947266, 19.18260955810547, 20.261211395263672, 21.339813232421875, 22.418415069580078, 23.49701690673828, 24.575618743896484, 25.654220581054688, 26.73282241821289, 27.811424255371094, 28.890024185180664, 29.968626022338867, 31.04722785949707]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 7.0, 13.0, 10.0, 20.0, 26.0, 24.0, 36.0, 28.0, 28.0, 33.0, 49.0, 41.0, 51.0, 48.0, 47.0, 45.0, 50.0, 46.0, 48.0, 49.0, 42.0, 35.0, 38.0, 28.0, 33.0, 19.0, 24.0, 20.0, 22.0, 10.0, 12.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.3125, -70.7421875, -68.171875, -65.6015625, -63.03125, -60.4609375, -57.890625, -55.3203125, -52.75, -50.1796875, -47.609375, -45.0390625, -42.46875, -39.8984375, -37.328125, -34.7578125, -32.1875, -29.6171875, -27.046875, -24.4765625, -21.90625, -19.3359375, -16.765625, -14.1953125, -11.625, -9.0546875, -6.484375, -3.9140625, -1.34375, 1.2265625, 3.796875, 6.3671875, 8.9375, 11.5078125, 14.078125, 16.6484375, 19.21875, 21.7890625, 24.359375, 26.9296875, 29.5, 32.0703125, 34.640625, 37.2109375, 39.78125, 42.3515625, 44.921875, 47.4921875, 50.0625, 52.6328125, 55.203125, 57.7734375, 60.34375, 62.9140625, 65.484375, 68.0546875, 70.625, 73.1953125, 75.765625, 78.3359375, 80.90625, 83.4765625, 86.046875, 88.6171875, 91.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 12.0, 12.0, 24.0, 27.0, 38.0, 64.0, 118.0, 160.0, 230.0, 392.0, 633.0, 981.0, 1513.0, 2399.0, 3929.0, 6318.0, 10210.0, 16272.0, 26228.0, 42466.0, 68061.0, 105964.0, 149582.0, 173010.0, 151183.0, 106881.0, 69164.0, 42496.0, 26534.0, 16324.0, 10168.0, 6352.0, 3999.0, 2503.0, 1537.0, 1045.0, 603.0, 402.0, 243.0, 170.0, 94.0, 79.0, 46.0, 27.0, 22.0, 11.0, 11.0, 8.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.62109375, -3.502410888671875, -3.38372802734375, -3.265045166015625, -3.1463623046875, -3.027679443359375, -2.90899658203125, -2.790313720703125, -2.671630859375, -2.552947998046875, -2.43426513671875, -2.315582275390625, -2.1968994140625, -2.078216552734375, -1.95953369140625, -1.840850830078125, -1.72216796875, -1.603485107421875, -1.48480224609375, -1.366119384765625, -1.2474365234375, -1.128753662109375, -1.01007080078125, -0.891387939453125, -0.772705078125, -0.654022216796875, -0.53533935546875, -0.416656494140625, -0.2979736328125, -0.179290771484375, -0.06060791015625, 0.058074951171875, 0.1767578125, 0.295440673828125, 0.41412353515625, 0.532806396484375, 0.6514892578125, 0.770172119140625, 0.88885498046875, 1.007537841796875, 1.126220703125, 1.244903564453125, 1.36358642578125, 1.482269287109375, 1.6009521484375, 1.719635009765625, 1.83831787109375, 1.957000732421875, 2.07568359375, 2.194366455078125, 2.31304931640625, 2.431732177734375, 2.5504150390625, 2.669097900390625, 2.78778076171875, 2.906463623046875, 3.025146484375, 3.143829345703125, 3.26251220703125, 3.381195068359375, 3.4998779296875, 3.618560791015625, 3.73724365234375, 3.855926513671875, 3.974609375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 6.0, 8.0, 10.0, 11.0, 16.0, 21.0, 21.0, 30.0, 25.0, 27.0, 34.0, 37.0, 37.0, 41.0, 50.0, 41.0, 52.0, 1073.0, 53.0, 49.0, 32.0, 37.0, 37.0, 31.0, 29.0, 37.0, 35.0, 21.0, 14.0, 16.0, 16.0, 14.0, 13.0, 7.0, 9.0, 8.0, 5.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.5, -40.0810546875, -38.662109375, -37.2431640625, -35.82421875, -34.4052734375, -32.986328125, -31.5673828125, -30.1484375, -28.7294921875, -27.310546875, -25.8916015625, -24.47265625, -23.0537109375, -21.634765625, -20.2158203125, -18.796875, -17.3779296875, -15.958984375, -14.5400390625, -13.12109375, -11.7021484375, -10.283203125, -8.8642578125, -7.4453125, -6.0263671875, -4.607421875, -3.1884765625, -1.76953125, -0.3505859375, 1.068359375, 2.4873046875, 3.90625, 5.3251953125, 6.744140625, 8.1630859375, 9.58203125, 11.0009765625, 12.419921875, 13.8388671875, 15.2578125, 16.6767578125, 18.095703125, 19.5146484375, 20.93359375, 22.3525390625, 23.771484375, 25.1904296875, 26.609375, 28.0283203125, 29.447265625, 30.8662109375, 32.28515625, 33.7041015625, 35.123046875, 36.5419921875, 37.9609375, 39.3798828125, 40.798828125, 42.2177734375, 43.63671875, 45.0556640625, 46.474609375, 47.8935546875, 49.3125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 9.0, 16.0, 17.0, 27.0, 28.0, 52.0, 69.0, 107.0, 166.0, 287.0, 447.0, 646.0, 1021.0, 1643.0, 2606.0, 4094.0, 6468.0, 9820.0, 15428.0, 24587.0, 37857.0, 57877.0, 86268.0, 121275.0, 401902.0, 945763.0, 122721.0, 88371.0, 59516.0, 38924.0, 25076.0, 15838.0, 10165.0, 6360.0, 4177.0, 2664.0, 1670.0, 1124.0, 689.0, 492.0, 309.0, 203.0, 113.0, 85.0, 61.0, 40.0, 20.0, 13.0, 12.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.96484375, -2.872283935546875, -2.77972412109375, -2.687164306640625, -2.5946044921875, -2.502044677734375, -2.40948486328125, -2.316925048828125, -2.224365234375, -2.131805419921875, -2.03924560546875, -1.946685791015625, -1.8541259765625, -1.761566162109375, -1.66900634765625, -1.576446533203125, -1.48388671875, -1.391326904296875, -1.29876708984375, -1.206207275390625, -1.1136474609375, -1.021087646484375, -0.92852783203125, -0.835968017578125, -0.743408203125, -0.650848388671875, -0.55828857421875, -0.465728759765625, -0.3731689453125, -0.280609130859375, -0.18804931640625, -0.095489501953125, -0.0029296875, 0.089630126953125, 0.18218994140625, 0.274749755859375, 0.3673095703125, 0.459869384765625, 0.55242919921875, 0.644989013671875, 0.737548828125, 0.830108642578125, 0.92266845703125, 1.015228271484375, 1.1077880859375, 1.200347900390625, 1.29290771484375, 1.385467529296875, 1.47802734375, 1.570587158203125, 1.66314697265625, 1.755706787109375, 1.8482666015625, 1.940826416015625, 2.03338623046875, 2.125946044921875, 2.218505859375, 2.311065673828125, 2.40362548828125, 2.496185302734375, 2.5887451171875, 2.681304931640625, 2.77386474609375, 2.866424560546875, 2.958984375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 7.0, 3.0, 9.0, 4.0, 9.0, 14.0, 17.0, 25.0, 26.0, 25.0, 26.0, 23.0, 36.0, 38.0, 56.0, 51.0, 47.0, 59.0, 48.0, 61.0, 50.0, 45.0, 48.0, 51.0, 39.0, 33.0, 33.0, 29.0, 18.0, 13.0, 14.0, 9.0, 6.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.033233642578125, -0.03231477737426758, -0.031395912170410156, -0.030477046966552734, -0.029558181762695312, -0.02863931655883789, -0.02772045135498047, -0.026801586151123047, -0.025882720947265625, -0.024963855743408203, -0.02404499053955078, -0.02312612533569336, -0.022207260131835938, -0.021288394927978516, -0.020369529724121094, -0.019450664520263672, -0.01853179931640625, -0.017612934112548828, -0.016694068908691406, -0.015775203704833984, -0.014856338500976562, -0.01393747329711914, -0.013018608093261719, -0.012099742889404297, -0.011180877685546875, -0.010262012481689453, -0.009343147277832031, -0.00842428207397461, -0.0075054168701171875, -0.006586551666259766, -0.005667686462402344, -0.004748821258544922, -0.0038299560546875, -0.002911090850830078, -0.0019922256469726562, -0.0010733604431152344, -0.0001544952392578125, 0.0007643699645996094, 0.0016832351684570312, 0.002602100372314453, 0.003520965576171875, 0.004439830780029297, 0.005358695983886719, 0.006277561187744141, 0.0071964263916015625, 0.008115291595458984, 0.009034156799316406, 0.009953022003173828, 0.01087188720703125, 0.011790752410888672, 0.012709617614746094, 0.013628482818603516, 0.014547348022460938, 0.01546621322631836, 0.01638507843017578, 0.017303943634033203, 0.018222808837890625, 0.019141674041748047, 0.02006053924560547, 0.02097940444946289, 0.021898269653320312, 0.022817134857177734, 0.023736000061035156, 0.024654865264892578, 0.02557373046875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 14.0, 14.0, 10.0, 13.0, 38.0, 21.0, 35.0, 61.0, 85.0, 131.0, 203.0, 308.0, 603.0, 1085.0, 2011.0, 3816.0, 8029.0, 17812.0, 45088.0, 121683.0, 330365.0, 322748.0, 117817.0, 42983.0, 17442.0, 7820.0, 3734.0, 1995.0, 1068.0, 553.0, 317.0, 193.0, 154.0, 85.0, 50.0, 42.0, 38.0, 30.0, 16.0, 13.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.1579303741455078, -0.15228652954101562, -0.14664268493652344, -0.14099884033203125, -0.13535499572753906, -0.12971115112304688, -0.12406730651855469, -0.1184234619140625, -0.11277961730957031, -0.10713577270507812, -0.10149192810058594, -0.09584808349609375, -0.09020423889160156, -0.08456039428710938, -0.07891654968261719, -0.073272705078125, -0.06762886047363281, -0.061985015869140625, -0.05634117126464844, -0.05069732666015625, -0.04505348205566406, -0.039409637451171875, -0.03376579284667969, -0.0281219482421875, -0.022478103637695312, -0.016834259033203125, -0.011190414428710938, -0.00554656982421875, 9.72747802734375e-05, 0.005741119384765625, 0.011384963989257812, 0.01702880859375, 0.022672653198242188, 0.028316497802734375, 0.03396034240722656, 0.03960418701171875, 0.04524803161621094, 0.050891876220703125, 0.05653572082519531, 0.0621795654296875, 0.06782341003417969, 0.07346725463867188, 0.07911109924316406, 0.08475494384765625, 0.09039878845214844, 0.09604263305664062, 0.10168647766113281, 0.107330322265625, 0.11297416687011719, 0.11861801147460938, 0.12426185607910156, 0.12990570068359375, 0.13554954528808594, 0.14119338989257812, 0.1468372344970703, 0.1524810791015625, 0.1581249237060547, 0.16376876831054688, 0.16941261291503906, 0.17505645751953125, 0.18070030212402344, 0.18634414672851562, 0.1919879913330078, 0.1976318359375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 13.0, 7.0, 11.0, 22.0, 53.0, 63.0, 64.0, 86.0, 113.0, 122.0, 115.0, 90.0, 76.0, 55.0, 32.0, 25.0, 10.0, 9.0, 16.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.08668020367622375, -0.08447448909282684, -0.08226878196001053, -0.08006306737661362, -0.0778573527932167, -0.07565164566040039, -0.07344593107700348, -0.07124021649360657, -0.06903450936079025, -0.06682879477739334, -0.06462308764457703, -0.062417373061180115, -0.0602116622030735, -0.05800595134496689, -0.05580023676156998, -0.053594525903463364, -0.05138881132006645, -0.04918310046195984, -0.04697738587856293, -0.044771675020456314, -0.0425659641623497, -0.04036024957895279, -0.038154538720846176, -0.03594882786273956, -0.03374311327934265, -0.03153740242123604, -0.029331689700484276, -0.027125976979732513, -0.0249202661216259, -0.022714553400874138, -0.020508840680122375, -0.018303129822015762, -0.016097422689199448, -0.01389171089977026, -0.011685999110341072, -0.00948028638958931, -0.007274574600160122, -0.005068862810730934, -0.0028631500899791718, -0.000657438300549984, 0.0015482734888792038, 0.0037539855111390352, 0.005959697533398867, 0.008165409788489342, 0.01037112157791853, 0.012576833367347717, 0.01478254608809948, 0.016988258808851242, 0.019193969666957855, 0.021399682387709618, 0.02360539324581623, 0.025811105966567993, 0.028016816824674606, 0.03022252954542637, 0.03242824226617813, 0.034633953124284744, 0.03683966398239136, 0.03904537484049797, 0.04125108942389488, 0.043456800282001495, 0.04566251114010811, 0.04786822199821472, 0.05007393658161163, 0.052279647439718246, 0.05448536202311516]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 10.0, 12.0, 14.0, 10.0, 16.0, 19.0, 16.0, 20.0, 25.0, 28.0, 29.0, 27.0, 36.0, 46.0, 41.0, 33.0, 30.0, 47.0, 39.0, 59.0, 57.0, 37.0, 34.0, 36.0, 43.0, 32.0, 28.0, 20.0, 22.0, 15.0, 21.0, 18.0, 13.0, 11.0, 10.0, 8.0, 7.0, 9.0, 6.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.02265644073486328, -0.02202192321419716, -0.021387403830885887, -0.020752884447574615, -0.020118366926908493, -0.01948384940624237, -0.0188493300229311, -0.018214810639619827, -0.017580293118953705, -0.016945775598287582, -0.01631125621497631, -0.01567673683166504, -0.015042219310998917, -0.01440770085901022, -0.013773182407021523, -0.013138663955032825, -0.012504145503044128, -0.011869627051055431, -0.011235108599066734, -0.010600590147078037, -0.00996607169508934, -0.009331553243100643, -0.008697034791111946, -0.008062516339123249, -0.007427997887134552, -0.006793479435145855, -0.006158960983157158, -0.005524442531168461, -0.004889924079179764, -0.004255405627191067, -0.0036208871752023697, -0.0029863687232136726, -0.0023518502712249756, -0.0017173318192362785, -0.0010828133672475815, -0.00044829491525888443, 0.00018622353672981262, 0.0008207419887185097, 0.0014552604407072067, 0.0020897788926959038, 0.002724297344684601, 0.003358815796673298, 0.003993334248661995, 0.004627852700650692, 0.005262371152639389, 0.005896889604628086, 0.006531408056616783, 0.00716592650860548, 0.007800444960594177, 0.008434963412582874, 0.009069481864571571, 0.009704000316560268, 0.010338518768548965, 0.010973037220537663, 0.01160755567252636, 0.012242074124515057, 0.012876592576503754, 0.01351111102849245, 0.014145629480481148, 0.014780147932469845, 0.015414666384458542, 0.016049183905124664, 0.016683703288435936, 0.017318222671747208, 0.01795274019241333]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 13.0, 10.0, 20.0, 24.0, 28.0, 33.0, 29.0, 28.0, 33.0, 49.0, 41.0, 51.0, 48.0, 48.0, 45.0, 48.0, 46.0, 50.0, 48.0, 40.0, 38.0, 37.0, 28.0, 34.0, 19.0, 23.0, 20.0, 21.0, 10.0, 13.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.3125, -70.7421875, -68.171875, -65.6015625, -63.03125, -60.4609375, -57.890625, -55.3203125, -52.75, -50.1796875, -47.609375, -45.0390625, -42.46875, -39.8984375, -37.328125, -34.7578125, -32.1875, -29.6171875, -27.046875, -24.4765625, -21.90625, -19.3359375, -16.765625, -14.1953125, -11.625, -9.0546875, -6.484375, -3.9140625, -1.34375, 1.2265625, 3.796875, 6.3671875, 8.9375, 11.5078125, 14.078125, 16.6484375, 19.21875, 21.7890625, 24.359375, 26.9296875, 29.5, 32.0703125, 34.640625, 37.2109375, 39.78125, 42.3515625, 44.921875, 47.4921875, 50.0625, 52.6328125, 55.203125, 57.7734375, 60.34375, 62.9140625, 65.484375, 68.0546875, 70.625, 73.1953125, 75.765625, 78.3359375, 80.90625, 83.4765625, 86.046875, 88.6171875, 91.1875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 19.0, 13.0, 26.0, 37.0, 67.0, 77.0, 142.0, 230.0, 391.0, 680.0, 1378.0, 3771.0, 15009.0, 104295.0, 587060.0, 287742.0, 36329.0, 6846.0, 2161.0, 981.0, 525.0, 286.0, 176.0, 88.0, 86.0, 44.0, 33.0, 16.0, 12.0, 11.0, 6.0, 4.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -11.97412109375, -11.5263671875, -11.07861328125, -10.630859375, -10.18310546875, -9.7353515625, -9.28759765625, -8.83984375, -8.39208984375, -7.9443359375, -7.49658203125, -7.048828125, -6.60107421875, -6.1533203125, -5.70556640625, -5.2578125, -4.81005859375, -4.3623046875, -3.91455078125, -3.466796875, -3.01904296875, -2.5712890625, -2.12353515625, -1.67578125, -1.22802734375, -0.7802734375, -0.33251953125, 0.115234375, 0.56298828125, 1.0107421875, 1.45849609375, 1.90625, 2.35400390625, 2.8017578125, 3.24951171875, 3.697265625, 4.14501953125, 4.5927734375, 5.04052734375, 5.48828125, 5.93603515625, 6.3837890625, 6.83154296875, 7.279296875, 7.72705078125, 8.1748046875, 8.62255859375, 9.0703125, 9.51806640625, 9.9658203125, 10.41357421875, 10.861328125, 11.30908203125, 11.7568359375, 12.20458984375, 12.65234375, 13.10009765625, 13.5478515625, 13.99560546875, 14.443359375, 14.89111328125, 15.3388671875, 15.78662109375, 16.234375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 11.0, 20.0, 42.0, 70.0, 125.0, 138.0, 2205.0, 160.0, 113.0, 75.0, 42.0, 20.0, 12.0, 4.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-337.75, -327.69921875, -317.6484375, -307.59765625, -297.546875, -287.49609375, -277.4453125, -267.39453125, -257.34375, -247.29296875, -237.2421875, -227.19140625, -217.140625, -207.08984375, -197.0390625, -186.98828125, -176.9375, -166.88671875, -156.8359375, -146.78515625, -136.734375, -126.68359375, -116.6328125, -106.58203125, -96.53125, -86.48046875, -76.4296875, -66.37890625, -56.328125, -46.27734375, -36.2265625, -26.17578125, -16.125, -6.07421875, 3.9765625, 14.02734375, 24.078125, 34.12890625, 44.1796875, 54.23046875, 64.28125, 74.33203125, 84.3828125, 94.43359375, 104.484375, 114.53515625, 124.5859375, 134.63671875, 144.6875, 154.73828125, 164.7890625, 174.83984375, 184.890625, 194.94140625, 204.9921875, 215.04296875, 225.09375, 235.14453125, 245.1953125, 255.24609375, 265.296875, 275.34765625, 285.3984375, 295.44921875, 305.5]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 7.0, 7.0, 9.0, 12.0, 19.0, 23.0, 40.0, 49.0, 100.0, 261.0, 648.0, 1910.0, 16043.0, 3075301.0, 47064.0, 2768.0, 800.0, 323.0, 123.0, 78.0, 46.0, 20.0, 17.0, 10.0, 5.0, 8.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.625, -39.2978515625, -37.970703125, -36.6435546875, -35.31640625, -33.9892578125, -32.662109375, -31.3349609375, -30.0078125, -28.6806640625, -27.353515625, -26.0263671875, -24.69921875, -23.3720703125, -22.044921875, -20.7177734375, -19.390625, -18.0634765625, -16.736328125, -15.4091796875, -14.08203125, -12.7548828125, -11.427734375, -10.1005859375, -8.7734375, -7.4462890625, -6.119140625, -4.7919921875, -3.46484375, -2.1376953125, -0.810546875, 0.5166015625, 1.84375, 3.1708984375, 4.498046875, 5.8251953125, 7.15234375, 8.4794921875, 9.806640625, 11.1337890625, 12.4609375, 13.7880859375, 15.115234375, 16.4423828125, 17.76953125, 19.0966796875, 20.423828125, 21.7509765625, 23.078125, 24.4052734375, 25.732421875, 27.0595703125, 28.38671875, 29.7138671875, 31.041015625, 32.3681640625, 33.6953125, 35.0224609375, 36.349609375, 37.6767578125, 39.00390625, 40.3310546875, 41.658203125, 42.9853515625, 44.3125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 13.0, 26.0, 85.0, 212.0, 356.0, 202.0, 58.0, 19.0, 13.0, 5.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-240.0777587890625, -229.2676544189453, -218.4575653076172, -207.6474609375, -196.83737182617188, -186.0272674560547, -175.2171630859375, -164.40707397460938, -153.59698486328125, -142.78688049316406, -131.97679138183594, -121.16668701171875, -110.35659790039062, -99.54649353027344, -88.73639678955078, -77.92630004882812, -67.11619567871094, -56.30609893798828, -45.496002197265625, -34.6859016418457, -23.875804901123047, -13.06570816040039, -2.2556076049804688, 8.554489135742188, 19.364585876464844, 30.1746826171875, 40.984779357910156, 51.79487991333008, 62.604976654052734, 73.41506958007812, 84.22517395019531, 95.03527069091797, 105.84536743164062, 116.65546417236328, 127.46556091308594, 138.27566528320312, 149.08575439453125, 159.89585876464844, 170.70596313476562, 181.51605224609375, 192.32614135742188, 203.13624572753906, 213.9463348388672, 224.75643920898438, 235.5665283203125, 246.3766326904297, 257.1867370605469, 267.996826171875, 278.80694580078125, 289.6170349121094, 300.4271545410156, 311.23724365234375, 322.0473327636719, 332.857421875, 343.66754150390625, 354.4776306152344, 365.2877197265625, 376.0978088378906, 386.9079284667969, 397.718017578125, 408.5281066894531, 419.33819580078125, 430.1483154296875, 440.9584045410156, 451.76849365234375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 5.0, 4.0, 5.0, 7.0, 9.0, 10.0, 18.0, 22.0, 25.0, 17.0, 28.0, 31.0, 34.0, 31.0, 34.0, 41.0, 41.0, 41.0, 52.0, 40.0, 30.0, 35.0, 43.0, 39.0, 41.0, 37.0, 36.0, 30.0, 46.0, 26.0, 21.0, 21.0, 18.0, 14.0, 14.0, 13.0, 13.0, 5.0, 2.0, 8.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-129.8126983642578, -125.88247680664062, -121.95225524902344, -118.02203369140625, -114.09181213378906, -110.16159057617188, -106.23136901855469, -102.3011474609375, -98.37092590332031, -94.44070434570312, -90.51048278808594, -86.58026123046875, -82.65003967285156, -78.71981811523438, -74.78959655761719, -70.859375, -66.92914581298828, -62.998924255371094, -59.068702697753906, -55.13848114013672, -51.20825958251953, -47.278038024902344, -43.34781265258789, -39.4175910949707, -35.487369537353516, -31.557147979736328, -27.62692642211914, -23.69670295715332, -19.766481399536133, -15.836259841918945, -11.906036376953125, -7.9758148193359375, -4.04559326171875, -0.1153712272644043, 3.8148508071899414, 7.745073318481445, 11.675294876098633, 15.60551643371582, 19.53573989868164, 23.465961456298828, 27.396183013916016, 31.326404571533203, 35.25662612915039, 39.186851501464844, 43.11707305908203, 47.04729461669922, 50.977516174316406, 54.907737731933594, 58.83795928955078, 62.76818084716797, 66.69840240478516, 70.62862396240234, 74.55884552001953, 78.48906707763672, 82.41929626464844, 86.34951782226562, 90.27973937988281, 94.2099609375, 98.14018249511719, 102.07040405273438, 106.00062561035156, 109.93084716796875, 113.86106872558594, 117.79129028320312, 121.72151184082031]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 8.0, 9.0, 13.0, 14.0, 21.0, 21.0, 41.0, 55.0, 62.0, 115.0, 148.0, 192.0, 261.0, 436.0, 578.0, 826.0, 1336.0, 1927.0, 2842.0, 4064.0, 5575.0, 1007423.0, 6900.0, 4650.0, 3526.0, 2424.0, 1637.0, 1094.0, 695.0, 462.0, 345.0, 233.0, 179.0, 119.0, 77.0, 66.0, 42.0, 37.0, 21.0, 25.0, 11.0, 9.0, 7.0, 5.0, 10.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.909204483032227, -18.228309631347656, -17.54741668701172, -16.86652183532715, -16.185626983642578, -15.504732131958008, -14.823838233947754, -14.1429443359375, -13.46204948425293, -12.78115463256836, -12.100260734558105, -11.419366836547852, -10.738471984863281, -10.057577133178711, -9.376683235168457, -8.695789337158203, -8.014894485473633, -7.334000110626221, -6.653105735778809, -5.9722113609313965, -5.291316986083984, -4.610422611236572, -3.92952823638916, -3.248633861541748, -2.567739486694336, -1.8868451118469238, -1.2059507369995117, -0.5250563621520996, 0.1558380126953125, 0.8367323875427246, 1.5176267623901367, 2.198521137237549, 2.879413604736328, 3.5603079795837402, 4.241202354431152, 4.9220967292785645, 5.602991104125977, 6.283885478973389, 6.964779853820801, 7.645674228668213, 8.326568603515625, 9.007463455200195, 9.68835735321045, 10.369251251220703, 11.050146102905273, 11.731040954589844, 12.411934852600098, 13.092828750610352, 13.773723602294922, 14.454618453979492, 15.135512351989746, 15.81640625, 16.49730110168457, 17.17819595336914, 17.859088897705078, 18.53998374938965, 19.22087860107422, 19.90177345275879, 20.58266830444336, 21.263561248779297, 21.944456100463867, 22.625350952148438, 23.306243896484375, 23.987138748168945, 24.668033599853516]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 8.0, 5.0, 6.0, 8.0, 16.0, 16.0, 39.0, 63.0, 68.0, 119.0, 157.0, 1346.0, 51460764.0, 322.0, 84.0, 38.0, 27.0, 20.0, 13.0, 11.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2445.1943359375, -2361.688720703125, -2278.18310546875, -2194.677734375, -2111.172119140625, -2027.66650390625, -1944.160888671875, -1860.6552734375, -1777.149658203125, -1693.64404296875, -1610.1385498046875, -1526.6329345703125, -1443.1273193359375, -1359.621826171875, -1276.1162109375, -1192.610595703125, -1109.1051025390625, -1025.5994873046875, -942.0939331054688, -858.58837890625, -775.082763671875, -691.5772094726562, -608.0716552734375, -524.5660400390625, -441.06048583984375, -357.5549011230469, -274.04931640625, -190.54376220703125, -107.03817749023438, -23.5325927734375, 59.97296142578125, 143.47857666015625, 226.984130859375, 310.4897155761719, 393.99530029296875, 477.5008544921875, 561.0064697265625, 644.5120239257812, 728.017578125, 811.523193359375, 895.0287475585938, 978.5343017578125, 1062.0399169921875, 1145.54541015625, 1229.051025390625, 1312.556640625, 1396.062255859375, 1479.56787109375, 1563.0733642578125, 1646.5789794921875, 1730.08447265625, 1813.590087890625, 1897.095703125, 1980.601318359375, 2064.10693359375, 2147.6123046875, 2231.117919921875, 2314.62353515625, 2398.129150390625, 2481.634765625, 2565.14013671875, 2648.645751953125, 2732.1513671875, 2815.656982421875, 2899.16259765625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 9.0, 15.0, 18.0, 29.0, 27.0, 60.0, 91.0, 128.0, 163.0, 287.0, 425.0, 654.0, 920.0, 1339.0, 2146.0, 3209.0, 4882.0, 7397.0, 11532.0, 17614.0, 27573.0, 43233.0, 67334.0, 102979.0, 157755.0, 232117.0, 322172.0, 453428.0, 3509510.0, 400240.0, 301687.0, 213038.0, 144275.0, 94264.0, 59960.0, 39072.0, 25499.0, 16031.0, 10647.0, 6665.0, 4365.0, 2895.0, 1860.0, 1389.0, 842.0, 528.0, 376.0, 241.0, 159.0, 113.0, 79.0, 54.0, 47.0, 20.0, 15.0, 15.0, 7.0, 8.0, 4.0, 3.0, 4.0], "bins": [-0.89208984375, -0.8636703491210938, -0.8352508544921875, -0.8068313598632812, -0.778411865234375, -0.7499923706054688, -0.7215728759765625, -0.6931533813476562, -0.66473388671875, -0.6363143920898438, -0.6078948974609375, -0.5794754028320312, -0.551055908203125, -0.5226364135742188, -0.4942169189453125, -0.46579742431640625, -0.4373779296875, -0.40895843505859375, -0.3805389404296875, -0.35211944580078125, -0.323699951171875, -0.29528045654296875, -0.2668609619140625, -0.23844146728515625, -0.21002197265625, -0.18160247802734375, -0.1531829833984375, -0.12476348876953125, -0.096343994140625, -0.06792449951171875, -0.0395050048828125, -0.01108551025390625, 0.017333984375, 0.04575347900390625, 0.0741729736328125, 0.10259246826171875, 0.131011962890625, 0.15943145751953125, 0.1878509521484375, 0.21627044677734375, 0.24468994140625, 0.27310943603515625, 0.3015289306640625, 0.32994842529296875, 0.358367919921875, 0.38678741455078125, 0.4152069091796875, 0.44362640380859375, 0.4720458984375, 0.5004653930664062, 0.5288848876953125, 0.5573043823242188, 0.585723876953125, 0.6141433715820312, 0.6425628662109375, 0.6709823608398438, 0.69940185546875, 0.7278213500976562, 0.7562408447265625, 0.7846603393554688, 0.813079833984375, 0.8414993286132812, 0.8699188232421875, 0.8983383178710938, 0.9267578125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 13.0, 15.0, 12.0, 9.0, 10.0, 24.0, 23.0, 37.0, 29.0, 33.0, 37.0, 33.0, 39.0, 35.0, 32.0, 39.0, 46.0, 944.0, 149.0, 51.0, 32.0, 35.0, 28.0, 36.0, 24.0, 35.0, 29.0, 34.0, 21.0, 27.0, 16.0, 13.0, 12.0, 6.0, 9.0, 6.0, 5.0, 5.0, 7.0, 2.0, 0.0, 8.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.6484375, -13.2047119140625, -12.760986328125, -12.3172607421875, -11.87353515625, -11.4298095703125, -10.986083984375, -10.5423583984375, -10.0986328125, -9.6549072265625, -9.211181640625, -8.7674560546875, -8.32373046875, -7.8800048828125, -7.436279296875, -6.9925537109375, -6.548828125, -6.1051025390625, -5.661376953125, -5.2176513671875, -4.77392578125, -4.3302001953125, -3.886474609375, -3.4427490234375, -2.9990234375, -2.5552978515625, -2.111572265625, -1.6678466796875, -1.22412109375, -0.7803955078125, -0.336669921875, 0.1070556640625, 0.55078125, 0.9945068359375, 1.438232421875, 1.8819580078125, 2.32568359375, 2.7694091796875, 3.213134765625, 3.6568603515625, 4.1005859375, 4.5443115234375, 4.988037109375, 5.4317626953125, 5.87548828125, 6.3192138671875, 6.762939453125, 7.2066650390625, 7.650390625, 8.0941162109375, 8.537841796875, 8.9815673828125, 9.42529296875, 9.8690185546875, 10.312744140625, 10.7564697265625, 11.2001953125, 11.6439208984375, 12.087646484375, 12.5313720703125, 12.97509765625, 13.4188232421875, 13.862548828125, 14.3062744140625, 14.75]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 13.0, 13.0, 16.0, 29.0, 40.0, 46.0, 88.0, 156.0, 237.0, 436.0, 795.0, 1443.0, 2307.0, 4162.0, 7675.0, 14216.0, 26195.0, 48603.0, 88423.0, 158364.0, 272585.0, 426275.0, 2694252.0, 1541920.0, 411326.0, 258635.0, 150296.0, 83383.0, 45196.0, 24190.0, 13157.0, 7306.0, 4000.0, 2309.0, 1400.0, 765.0, 445.0, 247.0, 178.0, 109.0, 70.0, 43.0, 38.0, 18.0, 15.0, 9.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.1572265625, -1.124114990234375, -1.09100341796875, -1.057891845703125, -1.0247802734375, -0.991668701171875, -0.95855712890625, -0.925445556640625, -0.892333984375, -0.859222412109375, -0.82611083984375, -0.792999267578125, -0.7598876953125, -0.726776123046875, -0.69366455078125, -0.660552978515625, -0.62744140625, -0.594329833984375, -0.56121826171875, -0.528106689453125, -0.4949951171875, -0.461883544921875, -0.42877197265625, -0.395660400390625, -0.362548828125, -0.329437255859375, -0.29632568359375, -0.263214111328125, -0.2301025390625, -0.196990966796875, -0.16387939453125, -0.130767822265625, -0.09765625, -0.064544677734375, -0.03143310546875, 0.001678466796875, 0.0347900390625, 0.067901611328125, 0.10101318359375, 0.134124755859375, 0.167236328125, 0.200347900390625, 0.23345947265625, 0.266571044921875, 0.2996826171875, 0.332794189453125, 0.36590576171875, 0.399017333984375, 0.43212890625, 0.465240478515625, 0.49835205078125, 0.531463623046875, 0.5645751953125, 0.597686767578125, 0.63079833984375, 0.663909912109375, 0.697021484375, 0.730133056640625, 0.76324462890625, 0.796356201171875, 0.8294677734375, 0.862579345703125, 0.89569091796875, 0.928802490234375, 0.9619140625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 6.0, 7.0, 10.0, 11.0, 15.0, 16.0, 18.0, 11.0, 11.0, 18.0, 43.0, 39.0, 35.0, 40.0, 52.0, 34.0, 39.0, 50.0, 996.0, 113.0, 55.0, 42.0, 36.0, 43.0, 31.0, 42.0, 30.0, 29.0, 24.0, 27.0, 16.0, 15.0, 13.0, 9.0, 8.0, 6.0, 4.0, 4.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.078125, -10.705810546875, -10.33349609375, -9.961181640625, -9.5888671875, -9.216552734375, -8.84423828125, -8.471923828125, -8.099609375, -7.727294921875, -7.35498046875, -6.982666015625, -6.6103515625, -6.238037109375, -5.86572265625, -5.493408203125, -5.12109375, -4.748779296875, -4.37646484375, -4.004150390625, -3.6318359375, -3.259521484375, -2.88720703125, -2.514892578125, -2.142578125, -1.770263671875, -1.39794921875, -1.025634765625, -0.6533203125, -0.281005859375, 0.09130859375, 0.463623046875, 0.8359375, 1.208251953125, 1.58056640625, 1.952880859375, 2.3251953125, 2.697509765625, 3.06982421875, 3.442138671875, 3.814453125, 4.186767578125, 4.55908203125, 4.931396484375, 5.3037109375, 5.676025390625, 6.04833984375, 6.420654296875, 6.79296875, 7.165283203125, 7.53759765625, 7.909912109375, 8.2822265625, 8.654541015625, 9.02685546875, 9.399169921875, 9.771484375, 10.143798828125, 10.51611328125, 10.888427734375, 11.2607421875, 11.633056640625, 12.00537109375, 12.377685546875, 12.75]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 9.0, 5.0, 9.0, 10.0, 22.0, 20.0, 40.0, 42.0, 76.0, 101.0, 134.0, 157.0, 223.0, 322.0, 510.0, 692.0, 949.0, 1587.0, 2343.0, 4126.0, 7290.0, 13407.0, 25790.0, 52794.0, 114885.0, 5653950.0, 240882.0, 84559.0, 40380.0, 19985.0, 10314.0, 5898.0, 3446.0, 2159.0, 1342.0, 872.0, 583.0, 407.0, 315.0, 233.0, 171.0, 94.0, 74.0, 67.0, 50.0, 40.0, 17.0, 17.0, 16.0, 2.0, 2.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.060546875, -2.96435546875, -2.8681640625, -2.77197265625, -2.67578125, -2.57958984375, -2.4833984375, -2.38720703125, -2.291015625, -2.19482421875, -2.0986328125, -2.00244140625, -1.90625, -1.81005859375, -1.7138671875, -1.61767578125, -1.521484375, -1.42529296875, -1.3291015625, -1.23291015625, -1.13671875, -1.04052734375, -0.9443359375, -0.84814453125, -0.751953125, -0.65576171875, -0.5595703125, -0.46337890625, -0.3671875, -0.27099609375, -0.1748046875, -0.07861328125, 0.017578125, 0.11376953125, 0.2099609375, 0.30615234375, 0.40234375, 0.49853515625, 0.5947265625, 0.69091796875, 0.787109375, 0.88330078125, 0.9794921875, 1.07568359375, 1.171875, 1.26806640625, 1.3642578125, 1.46044921875, 1.556640625, 1.65283203125, 1.7490234375, 1.84521484375, 1.94140625, 2.03759765625, 2.1337890625, 2.22998046875, 2.326171875, 2.42236328125, 2.5185546875, 2.61474609375, 2.7109375, 2.80712890625, 2.9033203125, 2.99951171875, 3.095703125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 8.0, 7.0, 4.0, 6.0, 8.0, 7.0, 16.0, 11.0, 13.0, 16.0, 25.0, 19.0, 21.0, 26.0, 30.0, 31.0, 27.0, 46.0, 34.0, 38.0, 36.0, 62.0, 883.0, 190.0, 42.0, 37.0, 39.0, 27.0, 38.0, 34.0, 32.0, 28.0, 22.0, 27.0, 27.0, 20.0, 16.0, 13.0, 14.0, 11.0, 10.0, 5.0, 6.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.2177734375, -7.951171875, -7.6845703125, -7.41796875, -7.1513671875, -6.884765625, -6.6181640625, -6.3515625, -6.0849609375, -5.818359375, -5.5517578125, -5.28515625, -5.0185546875, -4.751953125, -4.4853515625, -4.21875, -3.9521484375, -3.685546875, -3.4189453125, -3.15234375, -2.8857421875, -2.619140625, -2.3525390625, -2.0859375, -1.8193359375, -1.552734375, -1.2861328125, -1.01953125, -0.7529296875, -0.486328125, -0.2197265625, 0.046875, 0.3134765625, 0.580078125, 0.8466796875, 1.11328125, 1.3798828125, 1.646484375, 1.9130859375, 2.1796875, 2.4462890625, 2.712890625, 2.9794921875, 3.24609375, 3.5126953125, 3.779296875, 4.0458984375, 4.3125, 4.5791015625, 4.845703125, 5.1123046875, 5.37890625, 5.6455078125, 5.912109375, 6.1787109375, 6.4453125, 6.7119140625, 6.978515625, 7.2451171875, 7.51171875, 7.7783203125, 8.044921875, 8.3115234375, 8.578125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 8.0, 10.0, 15.0, 28.0, 41.0, 67.0, 133.0, 182.0, 178.0, 133.0, 64.0, 49.0, 35.0, 18.0, 18.0, 7.0, 6.0, 4.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.14434051513672, -17.088048934936523, -16.031755447387695, -14.9754638671875, -13.919170379638672, -12.862878799438477, -11.806586265563965, -10.750293731689453, -9.694001197814941, -8.63770866394043, -7.581416130065918, -6.5251240730285645, -5.468831539154053, -4.412539005279541, -3.3562469482421875, -2.299954414367676, -1.243661880493164, -0.1873694658279419, 0.8689229488372803, 1.925215244293213, 2.9815077781677246, 4.037800312042236, 5.09409236907959, 6.150384902954102, 7.206677436828613, 8.262969970703125, 9.319262504577637, 10.375555038452148, 11.431846618652344, 12.488140106201172, 13.544431686401367, 14.600724220275879, 15.65701675415039, 16.713308334350586, 17.769601821899414, 18.82589340209961, 19.882186889648438, 20.938478469848633, 21.994770050048828, 23.051063537597656, 24.107357025146484, 25.16364860534668, 26.219942092895508, 27.276233673095703, 28.33252716064453, 29.388818740844727, 30.445110321044922, 31.50140380859375, 32.55769348144531, 33.61398696899414, 34.6702766418457, 35.72657012939453, 36.78286361694336, 37.83915710449219, 38.89544677734375, 39.95174026489258, 41.008033752441406, 42.064327239990234, 43.1206169128418, 44.176910400390625, 45.23320388793945, 46.28949737548828, 47.345787048339844, 48.40208053588867, 49.4583740234375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 7.0, 5.0, 9.0, 4.0, 20.0, 21.0, 24.0, 32.0, 40.0, 42.0, 35.0, 53.0, 61.0, 55.0, 43.0, 59.0, 48.0, 47.0, 61.0, 47.0, 50.0, 49.0, 42.0, 32.0, 39.0, 29.0, 25.0, 11.0, 7.0, 6.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.16651153564453, -36.938209533691406, -35.70990753173828, -34.48160934448242, -33.2533073425293, -32.02500534057617, -30.796703338623047, -29.568403244018555, -28.340103149414062, -27.111801147460938, -25.883501052856445, -24.65519905090332, -23.426898956298828, -22.198596954345703, -20.970294952392578, -19.741994857788086, -18.51369285583496, -17.285390853881836, -16.057090759277344, -14.828788757324219, -13.600488662719727, -12.372186660766602, -11.143885612487793, -9.915584564208984, -8.687283515930176, -7.458982467651367, -6.230681419372559, -5.002379894256592, -3.774078845977783, -2.5457777976989746, -1.3174762725830078, -0.08917522430419922, 1.1391258239746094, 2.367426872253418, 3.5957281589508057, 4.824029445648193, 6.052330493927002, 7.2806315422058105, 8.508933067321777, 9.737234115600586, 10.965535163879395, 12.193836212158203, 13.422137260437012, 14.65043830871582, 15.878740310668945, 17.107040405273438, 18.335342407226562, 19.563644409179688, 20.79194450378418, 22.020246505737305, 23.248546600341797, 24.476848602294922, 25.705148696899414, 26.93345069885254, 28.16175079345703, 29.390052795410156, 30.61835479736328, 31.846656799316406, 33.07495880126953, 34.30325698852539, 35.531558990478516, 36.75986099243164, 37.988162994384766, 39.216461181640625, 40.44476318359375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 5.0, 5.0, 12.0, 16.0, 20.0, 29.0, 56.0, 62.0, 95.0, 139.0, 221.0, 293.0, 484.0, 765.0, 1215.0, 1957.0, 3767.0, 8885.0, 35454.0, 3987410.0, 128058.0, 14656.0, 4919.0, 2406.0, 1353.0, 758.0, 461.0, 278.0, 154.0, 118.0, 70.0, 57.0, 28.0, 19.0, 15.0, 13.0, 2.0, 9.0, 5.0, 4.0, 1.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.252685546875, -0.24358749389648438, -0.23448944091796875, -0.22539138793945312, -0.2162933349609375, -0.20719528198242188, -0.19809722900390625, -0.18899917602539062, -0.179901123046875, -0.17080307006835938, -0.16170501708984375, -0.15260696411132812, -0.1435089111328125, -0.13441085815429688, -0.12531280517578125, -0.11621475219726562, -0.10711669921875, -0.09801864624023438, -0.08892059326171875, -0.07982254028320312, -0.0707244873046875, -0.061626434326171875, -0.05252838134765625, -0.043430328369140625, -0.034332275390625, -0.025234222412109375, -0.01613616943359375, -0.007038116455078125, 0.0020599365234375, 0.011157989501953125, 0.02025604248046875, 0.029354095458984375, 0.0384521484375, 0.047550201416015625, 0.05664825439453125, 0.06574630737304688, 0.0748443603515625, 0.08394241333007812, 0.09304046630859375, 0.10213851928710938, 0.111236572265625, 0.12033462524414062, 0.12943267822265625, 0.13853073120117188, 0.1476287841796875, 0.15672683715820312, 0.16582489013671875, 0.17492294311523438, 0.18402099609375, 0.19311904907226562, 0.20221710205078125, 0.21131515502929688, 0.2204132080078125, 0.22951126098632812, 0.23860931396484375, 0.24770736694335938, 0.256805419921875, 0.2659034729003906, 0.27500152587890625, 0.2840995788574219, 0.2931976318359375, 0.3022956848144531, 0.31139373779296875, 0.3204917907714844, 0.32958984375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 5.0, 0.0, 7.0, 2.0, 5.0, 6.0, 8.0, 8.0, 9.0, 9.0, 10.0, 12.0, 18.0, 20.0, 767.0, 16.0, 17.0, 8.0, 9.0, 12.0, 9.0, 6.0, 5.0, 9.0, 2.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1102294921875, -0.10700511932373047, -0.10378074645996094, -0.1005563735961914, -0.09733200073242188, -0.09410762786865234, -0.09088325500488281, -0.08765888214111328, -0.08443450927734375, -0.08121013641357422, -0.07798576354980469, -0.07476139068603516, -0.07153701782226562, -0.0683126449584961, -0.06508827209472656, -0.06186389923095703, -0.0586395263671875, -0.05541515350341797, -0.05219078063964844, -0.048966407775878906, -0.045742034912109375, -0.042517662048339844, -0.03929328918457031, -0.03606891632080078, -0.03284454345703125, -0.02962017059326172, -0.026395797729492188, -0.023171424865722656, -0.019947052001953125, -0.016722679138183594, -0.013498306274414062, -0.010273933410644531, -0.007049560546875, -0.0038251876831054688, -0.0006008148193359375, 0.0026235580444335938, 0.005847930908203125, 0.009072303771972656, 0.012296676635742188, 0.015521049499511719, 0.01874542236328125, 0.02196979522705078, 0.025194168090820312, 0.028418540954589844, 0.031642913818359375, 0.034867286682128906, 0.03809165954589844, 0.04131603240966797, 0.0445404052734375, 0.04776477813720703, 0.05098915100097656, 0.054213523864746094, 0.057437896728515625, 0.060662269592285156, 0.06388664245605469, 0.06711101531982422, 0.07033538818359375, 0.07355976104736328, 0.07678413391113281, 0.08000850677490234, 0.08323287963867188, 0.0864572525024414, 0.08968162536621094, 0.09290599822998047, 0.09613037109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 13.0, 15.0, 21.0, 26.0, 44.0, 60.0, 88.0, 141.0, 199.0, 364.0, 627.0, 1117.0, 2317.0, 5158.0, 14209.0, 63027.0, 3532288.0, 518471.0, 36049.0, 10663.0, 4390.0, 2119.0, 1060.0, 697.0, 389.0, 238.0, 150.0, 87.0, 66.0, 44.0, 40.0, 19.0, 23.0, 8.0, 5.0, 12.0, 6.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.248291015625, -0.24048614501953125, -0.2326812744140625, -0.22487640380859375, -0.217071533203125, -0.20926666259765625, -0.2014617919921875, -0.19365692138671875, -0.18585205078125, -0.17804718017578125, -0.1702423095703125, -0.16243743896484375, -0.154632568359375, -0.14682769775390625, -0.1390228271484375, -0.13121795654296875, -0.1234130859375, -0.11560821533203125, -0.1078033447265625, -0.09999847412109375, -0.092193603515625, -0.08438873291015625, -0.0765838623046875, -0.06877899169921875, -0.06097412109375, -0.05316925048828125, -0.0453643798828125, -0.03755950927734375, -0.029754638671875, -0.02194976806640625, -0.0141448974609375, -0.00634002685546875, 0.00146484375, 0.00926971435546875, 0.0170745849609375, 0.02487945556640625, 0.032684326171875, 0.04048919677734375, 0.0482940673828125, 0.05609893798828125, 0.06390380859375, 0.07170867919921875, 0.0795135498046875, 0.08731842041015625, 0.095123291015625, 0.10292816162109375, 0.1107330322265625, 0.11853790283203125, 0.1263427734375, 0.13414764404296875, 0.1419525146484375, 0.14975738525390625, 0.157562255859375, 0.16536712646484375, 0.1731719970703125, 0.18097686767578125, 0.18878173828125, 0.19658660888671875, 0.2043914794921875, 0.21219635009765625, 0.220001220703125, 0.22780609130859375, 0.2356109619140625, 0.24341583251953125, 0.251220703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 8.0, 15.0, 10.0, 17.0, 42.0, 79.0, 292.0, 1713.0, 1318.0, 299.0, 104.0, 48.0, 28.0, 18.0, 9.0, 12.0, 13.0, 8.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.161376953125, -0.15662193298339844, -0.15186691284179688, -0.1471118927001953, -0.14235687255859375, -0.1376018524169922, -0.13284683227539062, -0.12809181213378906, -0.1233367919921875, -0.11858177185058594, -0.11382675170898438, -0.10907173156738281, -0.10431671142578125, -0.09956169128417969, -0.09480667114257812, -0.09005165100097656, -0.085296630859375, -0.08054161071777344, -0.07578659057617188, -0.07103157043457031, -0.06627655029296875, -0.06152153015136719, -0.056766510009765625, -0.05201148986816406, -0.0472564697265625, -0.04250144958496094, -0.037746429443359375, -0.03299140930175781, -0.02823638916015625, -0.023481369018554688, -0.018726348876953125, -0.013971328735351562, -0.00921630859375, -0.0044612884521484375, 0.000293731689453125, 0.0050487518310546875, 0.00980377197265625, 0.014558792114257812, 0.019313812255859375, 0.024068832397460938, 0.0288238525390625, 0.03357887268066406, 0.038333892822265625, 0.04308891296386719, 0.04784393310546875, 0.05259895324707031, 0.057353973388671875, 0.06210899353027344, 0.066864013671875, 0.07161903381347656, 0.07637405395507812, 0.08112907409667969, 0.08588409423828125, 0.09063911437988281, 0.09539413452148438, 0.10014915466308594, 0.1049041748046875, 0.10965919494628906, 0.11441421508789062, 0.11916923522949219, 0.12392425537109375, 0.1286792755126953, 0.13343429565429688, 0.13818931579589844, 0.1429443359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 59.0, 462.0, 385.0, 61.0, 16.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.095311164855957, -2.0515289306640625, -2.007746934890747, -1.963964819908142, -1.920182704925537, -1.8764004707336426, -1.8326184749603271, -1.7888362407684326, -1.7450541257858276, -1.7012720108032227, -1.6574898958206177, -1.6137077808380127, -1.5699256658554077, -1.5261435508728027, -1.4823613166809082, -1.4385792016983032, -1.3947970867156982, -1.3510149717330933, -1.3072328567504883, -1.2634507417678833, -1.2196686267852783, -1.1758863925933838, -1.1321043968200684, -1.0883221626281738, -1.0445401668548584, -1.0007580518722534, -0.9569759368896484, -0.9131938219070435, -0.8694116473197937, -0.8256295323371887, -0.7818474173545837, -0.738065242767334, -0.6942831873893738, -0.6505010724067688, -0.6067189574241638, -0.5629367828369141, -0.5191546678543091, -0.4753725528717041, -0.4315904378890991, -0.38780829310417175, -0.3440261781215668, -0.3002440631389618, -0.2564619183540344, -0.21267980337142944, -0.16889767348766327, -0.1251155436038971, -0.08133342862129211, -0.037551283836364746, 0.006230831146240234, 0.05001295730471611, 0.09379508346319199, 0.13757720589637756, 0.18135933578014374, 0.2251414656639099, 0.2689235806465149, 0.31270572543144226, 0.35648784041404724, 0.4002699553966522, 0.4440521001815796, 0.48783421516418457, 0.5316163301467896, 0.5753984451293945, 0.6191805601119995, 0.6629627346992493, 0.7067448496818542]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 13.0, 6.0, 13.0, 25.0, 35.0, 53.0, 88.0, 114.0, 127.0, 136.0, 121.0, 82.0, 60.0, 50.0, 30.0, 16.0, 10.0, 7.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7515149712562561, -0.7248200178146362, -0.6981250047683716, -0.6714300513267517, -0.6447350978851318, -0.618040144443512, -0.5913451910018921, -0.5646501779556274, -0.5379552245140076, -0.5112602710723877, -0.48456528782844543, -0.4578703045845032, -0.4311753511428833, -0.4044803977012634, -0.37778541445732117, -0.3510904312133789, -0.32439547777175903, -0.29770052433013916, -0.2710055410861969, -0.24431057274341583, -0.21761560440063477, -0.1909206360578537, -0.16422566771507263, -0.13753069937229156, -0.1108357310295105, -0.08414076268672943, -0.057445794343948364, -0.030750826001167297, -0.0040558576583862305, 0.022639110684394836, 0.0493340790271759, 0.07602904736995697, 0.10272401571273804, 0.1294189840555191, 0.15611395239830017, 0.18280892074108124, 0.2095038890838623, 0.23619885742664337, 0.26289382576942444, 0.2895888090133667, 0.3162837624549866, 0.34297871589660645, 0.3696736991405487, 0.39636868238449097, 0.42306363582611084, 0.4497585892677307, 0.476453572511673, 0.5031485557556152, 0.5298435091972351, 0.556538462638855, 0.5832334756851196, 0.6099284291267395, 0.6366233825683594, 0.6633183360099792, 0.6900132894515991, 0.7167083024978638, 0.7434032559394836, 0.7700982093811035, 0.7967932224273682, 0.823488175868988, 0.8501831293106079, 0.8768780827522278, 0.9035730361938477, 0.9302680492401123, 0.9569630026817322]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 9.0, 14.0, 15.0, 14.0, 26.0, 47.0, 46.0, 75.0, 89.0, 150.0, 235.0, 350.0, 505.0, 658.0, 1084.0, 1690.0, 2796.0, 4498.0, 8145.0, 14985.0, 31235.0, 730555.0, 191293.0, 27791.0, 13472.0, 7391.0, 4172.0, 2558.0, 1559.0, 1002.0, 664.0, 443.0, 292.0, 187.0, 131.0, 110.0, 71.0, 59.0, 40.0, 23.0, 23.0, 18.0, 9.0, 9.0, 7.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.410400390625, -0.3971290588378906, -0.38385772705078125, -0.3705863952636719, -0.3573150634765625, -0.3440437316894531, -0.33077239990234375, -0.3175010681152344, -0.304229736328125, -0.2909584045410156, -0.27768707275390625, -0.2644157409667969, -0.2511444091796875, -0.23787307739257812, -0.22460174560546875, -0.21133041381835938, -0.19805908203125, -0.18478775024414062, -0.17151641845703125, -0.15824508666992188, -0.1449737548828125, -0.13170242309570312, -0.11843109130859375, -0.10515975952148438, -0.091888427734375, -0.07861709594726562, -0.06534576416015625, -0.052074432373046875, -0.0388031005859375, -0.025531768798828125, -0.01226043701171875, 0.001010894775390625, 0.0142822265625, 0.027553558349609375, 0.04082489013671875, 0.054096221923828125, 0.0673675537109375, 0.08063888549804688, 0.09391021728515625, 0.10718154907226562, 0.120452880859375, 0.13372421264648438, 0.14699554443359375, 0.16026687622070312, 0.1735382080078125, 0.18680953979492188, 0.20008087158203125, 0.21335220336914062, 0.22662353515625, 0.23989486694335938, 0.25316619873046875, 0.2664375305175781, 0.2797088623046875, 0.2929801940917969, 0.30625152587890625, 0.3195228576660156, 0.332794189453125, 0.3460655212402344, 0.35933685302734375, 0.3726081848144531, 0.3858795166015625, 0.3991508483886719, 0.41242218017578125, 0.4256935119628906, 0.43896484375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 4.0, 2.0, 4.0, 10.0, 10.0, 8.0, 9.0, 8.0, 12.0, 12.0, 32.0, 611.0, 157.0, 16.0, 11.0, 8.0, 9.0, 13.0, 7.0, 9.0, 2.0, 9.0, 5.0, 5.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097900390625, -0.09497642517089844, -0.09205245971679688, -0.08912849426269531, -0.08620452880859375, -0.08328056335449219, -0.08035659790039062, -0.07743263244628906, -0.0745086669921875, -0.07158470153808594, -0.06866073608398438, -0.06573677062988281, -0.06281280517578125, -0.05988883972167969, -0.056964874267578125, -0.05404090881347656, -0.051116943359375, -0.04819297790527344, -0.045269012451171875, -0.04234504699707031, -0.03942108154296875, -0.03649711608886719, -0.033573150634765625, -0.030649185180664062, -0.0277252197265625, -0.024801254272460938, -0.021877288818359375, -0.018953323364257812, -0.01602935791015625, -0.013105392456054688, -0.010181427001953125, -0.0072574615478515625, -0.00433349609375, -0.0014095306396484375, 0.001514434814453125, 0.0044384002685546875, 0.00736236572265625, 0.010286331176757812, 0.013210296630859375, 0.016134262084960938, 0.0190582275390625, 0.021982192993164062, 0.024906158447265625, 0.027830123901367188, 0.03075408935546875, 0.03367805480957031, 0.036602020263671875, 0.03952598571777344, 0.042449951171875, 0.04537391662597656, 0.048297882080078125, 0.05122184753417969, 0.05414581298828125, 0.05706977844238281, 0.059993743896484375, 0.06291770935058594, 0.0658416748046875, 0.06876564025878906, 0.07168960571289062, 0.07461357116699219, 0.07753753662109375, 0.08046150207519531, 0.08338546752929688, 0.08630943298339844, 0.0892333984375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 14.0, 22.0, 27.0, 28.0, 46.0, 58.0, 76.0, 126.0, 149.0, 242.0, 395.0, 751.0, 1473.0, 3334.0, 8874.0, 27633.0, 98914.0, 355719.0, 392259.0, 111056.0, 30454.0, 9710.0, 3623.0, 1489.0, 755.0, 421.0, 268.0, 160.0, 148.0, 89.0, 66.0, 46.0, 33.0, 19.0, 12.0, 15.0, 11.0, 7.0, 5.0, 3.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.27099609375, -0.2625389099121094, -0.25408172607421875, -0.24562454223632812, -0.2371673583984375, -0.22871017456054688, -0.22025299072265625, -0.21179580688476562, -0.203338623046875, -0.19488143920898438, -0.18642425537109375, -0.17796707153320312, -0.1695098876953125, -0.16105270385742188, -0.15259552001953125, -0.14413833618164062, -0.13568115234375, -0.12722396850585938, -0.11876678466796875, -0.11030960083007812, -0.1018524169921875, -0.09339523315429688, -0.08493804931640625, -0.07648086547851562, -0.068023681640625, -0.059566497802734375, -0.05110931396484375, -0.042652130126953125, -0.0341949462890625, -0.025737762451171875, -0.01728057861328125, -0.008823394775390625, -0.0003662109375, 0.008090972900390625, 0.01654815673828125, 0.025005340576171875, 0.0334625244140625, 0.041919708251953125, 0.05037689208984375, 0.058834075927734375, 0.067291259765625, 0.07574844360351562, 0.08420562744140625, 0.09266281127929688, 0.1011199951171875, 0.10957717895507812, 0.11803436279296875, 0.12649154663085938, 0.13494873046875, 0.14340591430664062, 0.15186309814453125, 0.16032028198242188, 0.1687774658203125, 0.17723464965820312, 0.18569183349609375, 0.19414901733398438, 0.202606201171875, 0.21106338500976562, 0.21952056884765625, 0.22797775268554688, 0.2364349365234375, 0.24489212036132812, 0.25334930419921875, 0.2618064880371094, 0.270263671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 4.0, 9.0, 11.0, 10.0, 8.0, 17.0, 24.0, 29.0, 18.0, 25.0, 34.0, 30.0, 31.0, 38.0, 30.0, 33.0, 30.0, 40.0, 39.0, 51.0, 44.0, 43.0, 44.0, 37.0, 36.0, 35.0, 43.0, 33.0, 29.0, 17.0, 19.0, 20.0, 15.0, 7.0, 16.0, 9.0, 8.0, 6.0, 5.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.37060546875, -0.36048126220703125, -0.3503570556640625, -0.34023284912109375, -0.330108642578125, -0.31998443603515625, -0.3098602294921875, -0.29973602294921875, -0.28961181640625, -0.27948760986328125, -0.2693634033203125, -0.25923919677734375, -0.249114990234375, -0.23899078369140625, -0.2288665771484375, -0.21874237060546875, -0.2086181640625, -0.19849395751953125, -0.1883697509765625, -0.17824554443359375, -0.168121337890625, -0.15799713134765625, -0.1478729248046875, -0.13774871826171875, -0.12762451171875, -0.11750030517578125, -0.1073760986328125, -0.09725189208984375, -0.087127685546875, -0.07700347900390625, -0.0668792724609375, -0.05675506591796875, -0.046630859375, -0.03650665283203125, -0.0263824462890625, -0.01625823974609375, -0.006134033203125, 0.00399017333984375, 0.0141143798828125, 0.02423858642578125, 0.03436279296875, 0.04448699951171875, 0.0546112060546875, 0.06473541259765625, 0.074859619140625, 0.08498382568359375, 0.0951080322265625, 0.10523223876953125, 0.1153564453125, 0.12548065185546875, 0.1356048583984375, 0.14572906494140625, 0.155853271484375, 0.16597747802734375, 0.1761016845703125, 0.18622589111328125, 0.19635009765625, 0.20647430419921875, 0.2165985107421875, 0.22672271728515625, 0.236846923828125, 0.24697113037109375, 0.2570953369140625, 0.26721954345703125, 0.27734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 11.0, 9.0, 18.0, 29.0, 37.0, 106.0, 142.0, 264.0, 667.0, 1627.0, 5996.0, 54541.0, 944710.0, 33253.0, 4673.0, 1350.0, 504.0, 264.0, 127.0, 80.0, 43.0, 31.0, 21.0, 10.0, 10.0, 10.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34521484375, -0.331634521484375, -0.31805419921875, -0.304473876953125, -0.2908935546875, -0.277313232421875, -0.26373291015625, -0.250152587890625, -0.236572265625, -0.222991943359375, -0.20941162109375, -0.195831298828125, -0.1822509765625, -0.168670654296875, -0.15509033203125, -0.141510009765625, -0.1279296875, -0.114349365234375, -0.10076904296875, -0.087188720703125, -0.0736083984375, -0.060028076171875, -0.04644775390625, -0.032867431640625, -0.019287109375, -0.005706787109375, 0.00787353515625, 0.021453857421875, 0.0350341796875, 0.048614501953125, 0.06219482421875, 0.075775146484375, 0.08935546875, 0.102935791015625, 0.11651611328125, 0.130096435546875, 0.1436767578125, 0.157257080078125, 0.17083740234375, 0.184417724609375, 0.197998046875, 0.211578369140625, 0.22515869140625, 0.238739013671875, 0.2523193359375, 0.265899658203125, 0.27947998046875, 0.293060302734375, 0.306640625, 0.320220947265625, 0.33380126953125, 0.347381591796875, 0.3609619140625, 0.374542236328125, 0.38812255859375, 0.401702880859375, 0.415283203125, 0.428863525390625, 0.44244384765625, 0.456024169921875, 0.4696044921875, 0.483184814453125, 0.49676513671875, 0.510345458984375, 0.52392578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 8.0, 7.0, 8.0, 9.0, 11.0, 8.0, 15.0, 23.0, 20.0, 14.0, 25.0, 29.0, 46.0, 66.0, 131.0, 145.0, 146.0, 57.0, 44.0, 36.0, 25.0, 22.0, 9.0, 18.0, 15.0, 13.0, 9.0, 8.0, 3.0, 6.0, 6.0, 7.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023126602172851562, -0.00022310763597488403, -0.00021494925022125244, -0.00020679086446762085, -0.00019863247871398926, -0.00019047409296035767, -0.00018231570720672607, -0.00017415732145309448, -0.0001659989356994629, -0.0001578405499458313, -0.0001496821641921997, -0.00014152377843856812, -0.00013336539268493652, -0.00012520700693130493, -0.00011704862117767334, -0.00010889023542404175, -0.00010073184967041016, -9.257346391677856e-05, -8.441507816314697e-05, -7.625669240951538e-05, -6.809830665588379e-05, -5.99399209022522e-05, -5.1781535148620605e-05, -4.3623149394989014e-05, -3.546476364135742e-05, -2.730637788772583e-05, -1.9147992134094238e-05, -1.0989606380462646e-05, -2.8312206268310547e-06, 5.327165126800537e-06, 1.3485550880432129e-05, 2.164393663406372e-05, 2.9802322387695312e-05, 3.7960708141326904e-05, 4.6119093894958496e-05, 5.427747964859009e-05, 6.243586540222168e-05, 7.059425115585327e-05, 7.875263690948486e-05, 8.691102266311646e-05, 9.506940841674805e-05, 0.00010322779417037964, 0.00011138617992401123, 0.00011954456567764282, 0.00012770295143127441, 0.000135861337184906, 0.0001440197229385376, 0.0001521781086921692, 0.00016033649444580078, 0.00016849488019943237, 0.00017665326595306396, 0.00018481165170669556, 0.00019297003746032715, 0.00020112842321395874, 0.00020928680896759033, 0.00021744519472122192, 0.00022560358047485352, 0.0002337619662284851, 0.0002419203519821167, 0.0002500787377357483, 0.0002582371234893799, 0.0002663955092430115, 0.00027455389499664307, 0.00028271228075027466, 0.00029087066650390625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 10.0, 10.0, 14.0, 27.0, 67.0, 121.0, 225.0, 462.0, 1262.0, 4658.0, 30398.0, 715647.0, 274897.0, 15965.0, 3107.0, 960.0, 342.0, 161.0, 75.0, 48.0, 31.0, 23.0, 16.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331298828125, -0.3202018737792969, -0.30910491943359375, -0.2980079650878906, -0.2869110107421875, -0.2758140563964844, -0.26471710205078125, -0.2536201477050781, -0.242523193359375, -0.23142623901367188, -0.22032928466796875, -0.20923233032226562, -0.1981353759765625, -0.18703842163085938, -0.17594146728515625, -0.16484451293945312, -0.15374755859375, -0.14265060424804688, -0.13155364990234375, -0.12045669555664062, -0.1093597412109375, -0.09826278686523438, -0.08716583251953125, -0.07606887817382812, -0.064971923828125, -0.053874969482421875, -0.04277801513671875, -0.031681060791015625, -0.0205841064453125, -0.009487152099609375, 0.00160980224609375, 0.012706756591796875, 0.0238037109375, 0.034900665283203125, 0.04599761962890625, 0.057094573974609375, 0.0681915283203125, 0.07928848266601562, 0.09038543701171875, 0.10148239135742188, 0.112579345703125, 0.12367630004882812, 0.13477325439453125, 0.14587020874023438, 0.1569671630859375, 0.16806411743164062, 0.17916107177734375, 0.19025802612304688, 0.20135498046875, 0.21245193481445312, 0.22354888916015625, 0.23464584350585938, 0.2457427978515625, 0.2568397521972656, 0.26793670654296875, 0.2790336608886719, 0.290130615234375, 0.3012275695800781, 0.31232452392578125, 0.3234214782714844, 0.3345184326171875, 0.3456153869628906, 0.35671234130859375, 0.3678092956542969, 0.37890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 8.0, 7.0, 9.0, 18.0, 23.0, 33.0, 60.0, 78.0, 131.0, 162.0, 181.0, 100.0, 82.0, 49.0, 33.0, 13.0, 10.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5164108276367188, -0.5015716552734375, -0.48673248291015625, -0.471893310546875, -0.45705413818359375, -0.4422149658203125, -0.42737579345703125, -0.41253662109375, -0.39769744873046875, -0.3828582763671875, -0.36801910400390625, -0.353179931640625, -0.33834075927734375, -0.3235015869140625, -0.30866241455078125, -0.2938232421875, -0.27898406982421875, -0.2641448974609375, -0.24930572509765625, -0.234466552734375, -0.21962738037109375, -0.2047882080078125, -0.18994903564453125, -0.17510986328125, -0.16027069091796875, -0.1454315185546875, -0.13059234619140625, -0.115753173828125, -0.10091400146484375, -0.0860748291015625, -0.07123565673828125, -0.056396484375, -0.04155731201171875, -0.0267181396484375, -0.01187896728515625, 0.002960205078125, 0.01779937744140625, 0.0326385498046875, 0.04747772216796875, 0.06231689453125, 0.07715606689453125, 0.0919952392578125, 0.10683441162109375, 0.121673583984375, 0.13651275634765625, 0.1513519287109375, 0.16619110107421875, 0.1810302734375, 0.19586944580078125, 0.2107086181640625, 0.22554779052734375, 0.240386962890625, 0.25522613525390625, 0.2700653076171875, 0.28490447998046875, 0.29974365234375, 0.31458282470703125, 0.3294219970703125, 0.34426116943359375, 0.359100341796875, 0.37393951416015625, 0.3887786865234375, 0.40361785888671875, 0.41845703125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 19.0, 58.0, 257.0, 496.0, 117.0, 23.0, 15.0, 5.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.924313545227051, -6.680110454559326, -6.43590784072876, -6.191704750061035, -5.947502136230469, -5.703299045562744, -5.459096431732178, -5.214893341064453, -4.970690727233887, -4.726487636566162, -4.482285022735596, -4.238081932067871, -3.9938793182373047, -3.74967622756958, -3.5054736137390137, -3.261270523071289, -3.0170676708221436, -2.772864818572998, -2.5286619663238525, -2.284459114074707, -2.0402562618255615, -1.7960532903671265, -1.551850438117981, -1.3076475858688354, -1.06344473361969, -0.8192418813705444, -0.5750390291213989, -0.33083611726760864, -0.08663326501846313, 0.15756964683532715, 0.40177249908447266, 0.6459753513336182, 0.8901782035827637, 1.1343810558319092, 1.3785839080810547, 1.6227867603302002, 1.8669896125793457, 2.1111927032470703, 2.3553953170776367, 2.5995984077453613, 2.8438010215759277, 3.0880038738250732, 3.3322067260742188, 3.5764095783233643, 3.8206124305725098, 4.064815521240234, 4.309018135070801, 4.553221225738525, 4.79742431640625, 5.041627407073975, 5.285830020904541, 5.530033111572266, 5.774235725402832, 6.018438816070557, 6.262641429901123, 6.506844520568848, 6.751047134399414, 6.995250225067139, 7.239452838897705, 7.48365592956543, 7.727858543395996, 7.972061634063721, 8.216264724731445, 8.460467338562012, 8.704669952392578]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 6.0, 6.0, 2.0, 7.0, 14.0, 17.0, 16.0, 29.0, 53.0, 79.0, 112.0, 123.0, 121.0, 109.0, 89.0, 63.0, 35.0, 27.0, 12.0, 8.0, 7.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.305180072784424, -5.129615783691406, -4.9540510177612305, -4.778486251831055, -4.602921962738037, -4.4273576736450195, -4.251792907714844, -4.076228141784668, -3.9006638526916504, -3.7250993251800537, -3.549534797668457, -3.3739702701568604, -3.1984057426452637, -3.022841215133667, -2.8472766876220703, -2.6717121601104736, -2.496147632598877, -2.3205831050872803, -2.1450185775756836, -1.969454050064087, -1.7938895225524902, -1.6183249950408936, -1.4427604675292969, -1.2671959400177002, -1.0916314125061035, -0.9160668849945068, -0.7405023574829102, -0.5649378299713135, -0.3893733024597168, -0.21380877494812012, -0.03824424743652344, 0.13732028007507324, 0.3128852844238281, 0.4884498119354248, 0.6640143394470215, 0.8395788669586182, 1.0151433944702148, 1.1907079219818115, 1.3662724494934082, 1.5418369770050049, 1.7174015045166016, 1.8929660320281982, 2.068530559539795, 2.2440950870513916, 2.4196596145629883, 2.595224142074585, 2.7707886695861816, 2.9463531970977783, 3.121917724609375, 3.2974822521209717, 3.4730467796325684, 3.648611307144165, 3.8241758346557617, 3.9997403621673584, 4.175304889678955, 4.350869178771973, 4.526433944702148, 4.701998710632324, 4.877562999725342, 5.053127288818359, 5.228692054748535, 5.404256820678711, 5.5798211097717285, 5.755385398864746, 5.930950164794922]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 5.0, 6.0, 9.0, 18.0, 12.0, 18.0, 24.0, 48.0, 66.0, 95.0, 156.0, 284.0, 417.0, 790.0, 1428.0, 2890.0, 6111.0, 16141.0, 69851.0, 3955251.0, 113323.0, 17230.0, 5809.0, 2142.0, 994.0, 537.0, 256.0, 151.0, 78.0, 53.0, 40.0, 18.0, 18.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2490234375, -1.2174835205078125, -1.185943603515625, -1.1544036865234375, -1.12286376953125, -1.0913238525390625, -1.059783935546875, -1.0282440185546875, -0.9967041015625, -0.9651641845703125, -0.933624267578125, -0.9020843505859375, -0.87054443359375, -0.8390045166015625, -0.807464599609375, -0.7759246826171875, -0.744384765625, -0.7128448486328125, -0.681304931640625, -0.6497650146484375, -0.61822509765625, -0.5866851806640625, -0.555145263671875, -0.5236053466796875, -0.4920654296875, -0.4605255126953125, -0.428985595703125, -0.3974456787109375, -0.36590576171875, -0.3343658447265625, -0.302825927734375, -0.2712860107421875, -0.23974609375, -0.2082061767578125, -0.176666259765625, -0.1451263427734375, -0.11358642578125, -0.0820465087890625, -0.050506591796875, -0.0189666748046875, 0.0125732421875, 0.0441131591796875, 0.075653076171875, 0.1071929931640625, 0.13873291015625, 0.1702728271484375, 0.201812744140625, 0.2333526611328125, 0.264892578125, 0.2964324951171875, 0.327972412109375, 0.3595123291015625, 0.39105224609375, 0.4225921630859375, 0.454132080078125, 0.4856719970703125, 0.5172119140625, 0.5487518310546875, 0.580291748046875, 0.6118316650390625, 0.64337158203125, 0.6749114990234375, 0.706451416015625, 0.7379913330078125, 0.76953125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 2.0, 7.0, 6.0, 10.0, 11.0, 7.0, 10.0, 17.0, 45.0, 213.0, 386.0, 151.0, 40.0, 8.0, 15.0, 9.0, 18.0, 8.0, 5.0, 2.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10772705078125, -0.10497760772705078, -0.10222816467285156, -0.09947872161865234, -0.09672927856445312, -0.0939798355102539, -0.09123039245605469, -0.08848094940185547, -0.08573150634765625, -0.08298206329345703, -0.08023262023925781, -0.0774831771850586, -0.07473373413085938, -0.07198429107666016, -0.06923484802246094, -0.06648540496826172, -0.0637359619140625, -0.06098651885986328, -0.05823707580566406, -0.055487632751464844, -0.052738189697265625, -0.049988746643066406, -0.04723930358886719, -0.04448986053466797, -0.04174041748046875, -0.03899097442626953, -0.03624153137207031, -0.033492088317871094, -0.030742645263671875, -0.027993202209472656, -0.025243759155273438, -0.02249431610107422, -0.019744873046875, -0.01699542999267578, -0.014245986938476562, -0.011496543884277344, -0.008747100830078125, -0.005997657775878906, -0.0032482147216796875, -0.0004987716674804688, 0.00225067138671875, 0.005000114440917969, 0.0077495574951171875, 0.010499000549316406, 0.013248443603515625, 0.015997886657714844, 0.018747329711914062, 0.02149677276611328, 0.0242462158203125, 0.02699565887451172, 0.029745101928710938, 0.032494544982910156, 0.035243988037109375, 0.037993431091308594, 0.04074287414550781, 0.04349231719970703, 0.04624176025390625, 0.04899120330810547, 0.05174064636230469, 0.054490089416503906, 0.057239532470703125, 0.059988975524902344, 0.06273841857910156, 0.06548786163330078, 0.0682373046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 17.0, 24.0, 25.0, 59.0, 124.0, 245.0, 700.0, 2297.0, 13572.0, 312436.0, 3822608.0, 35759.0, 4472.0, 1093.0, 388.0, 205.0, 105.0, 51.0, 39.0, 18.0, 12.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6576766967773438, -0.6293182373046875, -0.6009597778320312, -0.572601318359375, -0.5442428588867188, -0.5158843994140625, -0.48752593994140625, -0.45916748046875, -0.43080902099609375, -0.4024505615234375, -0.37409210205078125, -0.345733642578125, -0.31737518310546875, -0.2890167236328125, -0.26065826416015625, -0.2322998046875, -0.20394134521484375, -0.1755828857421875, -0.14722442626953125, -0.118865966796875, -0.09050750732421875, -0.0621490478515625, -0.03379058837890625, -0.00543212890625, 0.02292633056640625, 0.0512847900390625, 0.07964324951171875, 0.108001708984375, 0.13636016845703125, 0.1647186279296875, 0.19307708740234375, 0.221435546875, 0.24979400634765625, 0.2781524658203125, 0.30651092529296875, 0.334869384765625, 0.36322784423828125, 0.3915863037109375, 0.41994476318359375, 0.44830322265625, 0.47666168212890625, 0.5050201416015625, 0.5333786010742188, 0.561737060546875, 0.5900955200195312, 0.6184539794921875, 0.6468124389648438, 0.6751708984375, 0.7035293579101562, 0.7318878173828125, 0.7602462768554688, 0.788604736328125, 0.8169631958007812, 0.8453216552734375, 0.8736801147460938, 0.90203857421875, 0.9303970336914062, 0.9587554931640625, 0.9871139526367188, 1.015472412109375, 1.0438308715820312, 1.0721893310546875, 1.1005477905273438, 1.12890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 3.0, 13.0, 7.0, 16.0, 21.0, 42.0, 79.0, 135.0, 532.0, 2212.0, 578.0, 194.0, 93.0, 45.0, 27.0, 23.0, 12.0, 16.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0718994140625, -0.067535400390625, -0.06317138671875, -0.058807373046875, -0.054443359375, -0.050079345703125, -0.04571533203125, -0.041351318359375, -0.0369873046875, -0.032623291015625, -0.02825927734375, -0.023895263671875, -0.01953125, -0.015167236328125, -0.01080322265625, -0.006439208984375, -0.0020751953125, 0.002288818359375, 0.00665283203125, 0.011016845703125, 0.015380859375, 0.019744873046875, 0.02410888671875, 0.028472900390625, 0.0328369140625, 0.037200927734375, 0.04156494140625, 0.045928955078125, 0.05029296875, 0.054656982421875, 0.05902099609375, 0.063385009765625, 0.0677490234375, 0.072113037109375, 0.07647705078125, 0.080841064453125, 0.085205078125, 0.089569091796875, 0.09393310546875, 0.098297119140625, 0.1026611328125, 0.107025146484375, 0.11138916015625, 0.115753173828125, 0.1201171875, 0.124481201171875, 0.12884521484375, 0.133209228515625, 0.1375732421875, 0.141937255859375, 0.14630126953125, 0.150665283203125, 0.155029296875, 0.159393310546875, 0.16375732421875, 0.168121337890625, 0.1724853515625, 0.176849365234375, 0.18121337890625, 0.185577392578125, 0.18994140625, 0.194305419921875, 0.19866943359375, 0.203033447265625, 0.2073974609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 16.0, 207.0, 628.0, 105.0, 17.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7564871311187744, -1.6835155487060547, -1.610543966293335, -1.5375723838806152, -1.4646008014678955, -1.3916292190551758, -1.318657636642456, -1.2456860542297363, -1.1727144718170166, -1.0997428894042969, -1.0267713069915771, -0.9537997245788574, -0.8808281421661377, -0.807856559753418, -0.7348849773406982, -0.6619133949279785, -0.5889418125152588, -0.5159702301025391, -0.44299864768981934, -0.3700270652770996, -0.2970554828643799, -0.22408390045166016, -0.15111231803894043, -0.0781407356262207, -0.0051691532135009766, 0.06780242919921875, 0.14077401161193848, 0.2137455940246582, 0.28671717643737793, 0.35968875885009766, 0.4326603412628174, 0.5056319236755371, 0.5786037445068359, 0.6515753269195557, 0.7245469093322754, 0.7975184917449951, 0.8704900741577148, 0.9434616565704346, 1.0164332389831543, 1.089404821395874, 1.1623764038085938, 1.2353479862213135, 1.3083195686340332, 1.381291151046753, 1.4542627334594727, 1.5272343158721924, 1.600205898284912, 1.6731774806976318, 1.7461490631103516, 1.8191206455230713, 1.892092227935791, 1.9650638103485107, 2.0380353927612305, 2.11100697517395, 2.18397855758667, 2.2569501399993896, 2.3299217224121094, 2.402893304824829, 2.475864887237549, 2.5488364696502686, 2.6218080520629883, 2.694779634475708, 2.7677512168884277, 2.8407227993011475, 2.913694381713867]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 9.0, 12.0, 12.0, 22.0, 31.0, 33.0, 39.0, 54.0, 69.0, 68.0, 84.0, 91.0, 62.0, 63.0, 53.0, 57.0, 58.0, 41.0, 37.0, 22.0, 17.0, 7.0, 14.0, 8.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.8213629722595215, -0.8008663654327393, -0.7803698182106018, -0.7598732709884644, -0.7393766641616821, -0.7188800573348999, -0.6983835101127625, -0.677886962890625, -0.6573903560638428, -0.6368937492370605, -0.6163972020149231, -0.5959006547927856, -0.5754040479660034, -0.5549074411392212, -0.5344108939170837, -0.5139143466949463, -0.49341773986816406, -0.4729211628437042, -0.4524245858192444, -0.43192800879478455, -0.4114314317703247, -0.39093485474586487, -0.37043827772140503, -0.3499417006969452, -0.32944512367248535, -0.3089485466480255, -0.2884519696235657, -0.26795539259910583, -0.247458815574646, -0.22696223855018616, -0.20646566152572632, -0.18596908450126648, -0.16547244787216187, -0.14497587084770203, -0.12447929382324219, -0.10398271679878235, -0.08348613977432251, -0.06298956274986267, -0.04249298572540283, -0.021996408700942993, -0.0014998316764831543, 0.018996745347976685, 0.03949332237243652, 0.05998989939689636, 0.0804864764213562, 0.10098305344581604, 0.12147963047027588, 0.14197620749473572, 0.16247278451919556, 0.1829693615436554, 0.20346593856811523, 0.22396251559257507, 0.2444590926170349, 0.26495566964149475, 0.2854522466659546, 0.30594882369041443, 0.32644540071487427, 0.3469419777393341, 0.36743855476379395, 0.3879351317882538, 0.4084317088127136, 0.42892828583717346, 0.4494248628616333, 0.46992143988609314, 0.490418016910553]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 7.0, 3.0, 7.0, 14.0, 12.0, 19.0, 27.0, 37.0, 59.0, 72.0, 135.0, 214.0, 300.0, 493.0, 935.0, 1651.0, 3170.0, 6848.0, 16051.0, 50493.0, 658021.0, 253937.0, 32672.0, 12101.0, 5301.0, 2567.0, 1457.0, 699.0, 468.0, 249.0, 150.0, 129.0, 88.0, 55.0, 29.0, 23.0, 22.0, 12.0, 9.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.470458984375, -0.4546928405761719, -0.43892669677734375, -0.4231605529785156, -0.4073944091796875, -0.3916282653808594, -0.37586212158203125, -0.3600959777832031, -0.344329833984375, -0.3285636901855469, -0.31279754638671875, -0.2970314025878906, -0.2812652587890625, -0.2654991149902344, -0.24973297119140625, -0.23396682739257812, -0.21820068359375, -0.20243453979492188, -0.18666839599609375, -0.17090225219726562, -0.1551361083984375, -0.13936996459960938, -0.12360382080078125, -0.10783767700195312, -0.092071533203125, -0.07630538940429688, -0.06053924560546875, -0.044773101806640625, -0.0290069580078125, -0.013240814208984375, 0.00252532958984375, 0.018291473388671875, 0.0340576171875, 0.049823760986328125, 0.06558990478515625, 0.08135604858398438, 0.0971221923828125, 0.11288833618164062, 0.12865447998046875, 0.14442062377929688, 0.160186767578125, 0.17595291137695312, 0.19171905517578125, 0.20748519897460938, 0.2232513427734375, 0.23901748657226562, 0.25478363037109375, 0.2705497741699219, 0.28631591796875, 0.3020820617675781, 0.31784820556640625, 0.3336143493652344, 0.3493804931640625, 0.3651466369628906, 0.38091278076171875, 0.3966789245605469, 0.412445068359375, 0.4282112121582031, 0.44397735595703125, 0.4597434997558594, 0.4755096435546875, 0.4912757873535156, 0.5070419311523438, 0.5228080749511719, 0.53857421875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 7.0, 9.0, 6.0, 12.0, 6.0, 25.0, 27.0, 79.0, 169.0, 255.0, 173.0, 92.0, 46.0, 20.0, 19.0, 5.0, 6.0, 13.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.10113525390625, -0.09857177734375, -0.09600830078125, -0.09344482421875, -0.09088134765625, -0.08831787109375, -0.08575439453125, -0.08319091796875, -0.08062744140625, -0.07806396484375, -0.07550048828125, -0.07293701171875, -0.07037353515625, -0.06781005859375, -0.06524658203125, -0.06268310546875, -0.06011962890625, -0.05755615234375, -0.05499267578125, -0.05242919921875, -0.04986572265625, -0.04730224609375, -0.04473876953125, -0.04217529296875, -0.03961181640625, -0.03704833984375, -0.03448486328125, -0.03192138671875, -0.02935791015625, -0.02679443359375, -0.02423095703125, -0.02166748046875, -0.01910400390625, -0.01654052734375, -0.01397705078125, -0.01141357421875, -0.00885009765625, -0.00628662109375, -0.00372314453125, -0.00115966796875, 0.00140380859375, 0.00396728515625, 0.00653076171875, 0.00909423828125, 0.01165771484375, 0.01422119140625, 0.01678466796875, 0.01934814453125, 0.02191162109375, 0.02447509765625, 0.02703857421875, 0.02960205078125, 0.03216552734375, 0.03472900390625, 0.03729248046875, 0.03985595703125, 0.04241943359375, 0.04498291015625, 0.04754638671875, 0.05010986328125, 0.05267333984375, 0.05523681640625, 0.05780029296875, 0.06036376953125, 0.06292724609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 1.0, 6.0, 1.0, 4.0, 2.0, 5.0, 4.0, 15.0, 65.0, 408.0, 4208.0, 887245.0, 154844.0, 1467.0, 190.0, 32.0, 8.0, 10.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.732421875, -1.679656982421875, -1.62689208984375, -1.574127197265625, -1.5213623046875, -1.468597412109375, -1.41583251953125, -1.363067626953125, -1.310302734375, -1.257537841796875, -1.20477294921875, -1.152008056640625, -1.0992431640625, -1.046478271484375, -0.99371337890625, -0.940948486328125, -0.88818359375, -0.835418701171875, -0.78265380859375, -0.729888916015625, -0.6771240234375, -0.624359130859375, -0.57159423828125, -0.518829345703125, -0.466064453125, -0.413299560546875, -0.36053466796875, -0.307769775390625, -0.2550048828125, -0.202239990234375, -0.14947509765625, -0.096710205078125, -0.0439453125, 0.008819580078125, 0.06158447265625, 0.114349365234375, 0.1671142578125, 0.219879150390625, 0.27264404296875, 0.325408935546875, 0.378173828125, 0.430938720703125, 0.48370361328125, 0.536468505859375, 0.5892333984375, 0.641998291015625, 0.69476318359375, 0.747528076171875, 0.80029296875, 0.853057861328125, 0.90582275390625, 0.958587646484375, 1.0113525390625, 1.064117431640625, 1.11688232421875, 1.169647216796875, 1.222412109375, 1.275177001953125, 1.32794189453125, 1.380706787109375, 1.4334716796875, 1.486236572265625, 1.53900146484375, 1.591766357421875, 1.64453125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 3.0, 1.0, 1.0, 2.0, 5.0, 12.0, 5.0, 9.0, 11.0, 9.0, 6.0, 7.0, 16.0, 16.0, 18.0, 13.0, 24.0, 21.0, 25.0, 31.0, 26.0, 28.0, 28.0, 33.0, 28.0, 36.0, 33.0, 39.0, 37.0, 30.0, 35.0, 32.0, 35.0, 27.0, 30.0, 30.0, 33.0, 25.0, 16.0, 30.0, 22.0, 30.0, 12.0, 17.0, 18.0, 17.0, 10.0, 7.0, 5.0, 4.0, 3.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.1727294921875, -0.16731834411621094, -0.16190719604492188, -0.1564960479736328, -0.15108489990234375, -0.1456737518310547, -0.14026260375976562, -0.13485145568847656, -0.1294403076171875, -0.12402915954589844, -0.11861801147460938, -0.11320686340332031, -0.10779571533203125, -0.10238456726074219, -0.09697341918945312, -0.09156227111816406, -0.086151123046875, -0.08073997497558594, -0.07532882690429688, -0.06991767883300781, -0.06450653076171875, -0.05909538269042969, -0.053684234619140625, -0.04827308654785156, -0.0428619384765625, -0.03745079040527344, -0.032039642333984375, -0.026628494262695312, -0.02121734619140625, -0.015806198120117188, -0.010395050048828125, -0.0049839019775390625, 0.00042724609375, 0.0058383941650390625, 0.011249542236328125, 0.016660690307617188, 0.02207183837890625, 0.027482986450195312, 0.032894134521484375, 0.03830528259277344, 0.0437164306640625, 0.04912757873535156, 0.054538726806640625, 0.05994987487792969, 0.06536102294921875, 0.07077217102050781, 0.07618331909179688, 0.08159446716308594, 0.087005615234375, 0.09241676330566406, 0.09782791137695312, 0.10323905944824219, 0.10865020751953125, 0.11406135559082031, 0.11947250366210938, 0.12488365173339844, 0.1302947998046875, 0.13570594787597656, 0.14111709594726562, 0.1465282440185547, 0.15193939208984375, 0.1573505401611328, 0.16276168823242188, 0.16817283630371094, 0.173583984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 6.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 18.0, 34.0, 72.0, 272.0, 1666.0, 85343.0, 957020.0, 3473.0, 400.0, 106.0, 35.0, 19.0, 17.0, 12.0, 7.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.48828125, -1.4389190673828125, -1.389556884765625, -1.3401947021484375, -1.29083251953125, -1.2414703369140625, -1.192108154296875, -1.1427459716796875, -1.0933837890625, -1.0440216064453125, -0.994659423828125, -0.9452972412109375, -0.89593505859375, -0.8465728759765625, -0.797210693359375, -0.7478485107421875, -0.698486328125, -0.6491241455078125, -0.599761962890625, -0.5503997802734375, -0.50103759765625, -0.4516754150390625, -0.402313232421875, -0.3529510498046875, -0.3035888671875, -0.2542266845703125, -0.204864501953125, -0.1555023193359375, -0.10614013671875, -0.0567779541015625, -0.007415771484375, 0.0419464111328125, 0.09130859375, 0.1406707763671875, 0.190032958984375, 0.2393951416015625, 0.28875732421875, 0.3381195068359375, 0.387481689453125, 0.4368438720703125, 0.4862060546875, 0.5355682373046875, 0.584930419921875, 0.6342926025390625, 0.68365478515625, 0.7330169677734375, 0.782379150390625, 0.8317413330078125, 0.881103515625, 0.9304656982421875, 0.979827880859375, 1.0291900634765625, 1.07855224609375, 1.1279144287109375, 1.177276611328125, 1.2266387939453125, 1.2760009765625, 1.3253631591796875, 1.374725341796875, 1.4240875244140625, 1.47344970703125, 1.5228118896484375, 1.572174072265625, 1.6215362548828125, 1.6708984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 8.0, 5.0, 12.0, 6.0, 10.0, 18.0, 23.0, 29.0, 33.0, 67.0, 101.0, 133.0, 177.0, 88.0, 63.0, 64.0, 32.0, 21.0, 18.0, 17.0, 13.0, 11.0, 9.0, 5.0, 1.0, 6.0, 7.0, 4.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0003590583801269531, -0.0003485754132270813, -0.00033809244632720947, -0.00032760947942733765, -0.0003171265125274658, -0.000306643545627594, -0.00029616057872772217, -0.00028567761182785034, -0.0002751946449279785, -0.0002647116780281067, -0.00025422871112823486, -0.00024374574422836304, -0.0002332627773284912, -0.00022277981042861938, -0.00021229684352874756, -0.00020181387662887573, -0.0001913309097290039, -0.00018084794282913208, -0.00017036497592926025, -0.00015988200902938843, -0.0001493990421295166, -0.00013891607522964478, -0.00012843310832977295, -0.00011795014142990112, -0.0001074671745300293, -9.698420763015747e-05, -8.650124073028564e-05, -7.601827383041382e-05, -6.553530693054199e-05, -5.5052340030670166e-05, -4.456937313079834e-05, -3.4086406230926514e-05, -2.3603439331054688e-05, -1.3120472431182861e-05, -2.637505531311035e-06, 7.845461368560791e-06, 1.8328428268432617e-05, 2.8811395168304443e-05, 3.929436206817627e-05, 4.9777328968048096e-05, 6.026029586791992e-05, 7.074326276779175e-05, 8.122622966766357e-05, 9.17091965675354e-05, 0.00010219216346740723, 0.00011267513036727905, 0.00012315809726715088, 0.0001336410641670227, 0.00014412403106689453, 0.00015460699796676636, 0.00016508996486663818, 0.00017557293176651, 0.00018605589866638184, 0.00019653886556625366, 0.0002070218324661255, 0.00021750479936599731, 0.00022798776626586914, 0.00023847073316574097, 0.0002489537000656128, 0.0002594366669654846, 0.00026991963386535645, 0.00028040260076522827, 0.0002908855676651001, 0.0003013685345649719, 0.00031185150146484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 13.0, 15.0, 30.0, 37.0, 74.0, 132.0, 202.0, 472.0, 1236.0, 4872.0, 45387.0, 864864.0, 119671.0, 8466.0, 1827.0, 652.0, 278.0, 133.0, 80.0, 39.0, 22.0, 13.0, 10.0, 7.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54345703125, -0.52777099609375, -0.5120849609375, -0.49639892578125, -0.480712890625, -0.46502685546875, -0.4493408203125, -0.43365478515625, -0.41796875, -0.40228271484375, -0.3865966796875, -0.37091064453125, -0.355224609375, -0.33953857421875, -0.3238525390625, -0.30816650390625, -0.29248046875, -0.27679443359375, -0.2611083984375, -0.24542236328125, -0.229736328125, -0.21405029296875, -0.1983642578125, -0.18267822265625, -0.1669921875, -0.15130615234375, -0.1356201171875, -0.11993408203125, -0.104248046875, -0.08856201171875, -0.0728759765625, -0.05718994140625, -0.04150390625, -0.02581787109375, -0.0101318359375, 0.00555419921875, 0.021240234375, 0.03692626953125, 0.0526123046875, 0.06829833984375, 0.083984375, 0.09967041015625, 0.1153564453125, 0.13104248046875, 0.146728515625, 0.16241455078125, 0.1781005859375, 0.19378662109375, 0.20947265625, 0.22515869140625, 0.2408447265625, 0.25653076171875, 0.272216796875, 0.28790283203125, 0.3035888671875, 0.31927490234375, 0.3349609375, 0.35064697265625, 0.3663330078125, 0.38201904296875, 0.397705078125, 0.41339111328125, 0.4290771484375, 0.44476318359375, 0.46044921875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 11.0, 17.0, 29.0, 34.0, 77.0, 145.0, 161.0, 177.0, 149.0, 94.0, 42.0, 28.0, 18.0, 9.0, 10.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50537109375, -0.4921226501464844, -0.47887420654296875, -0.4656257629394531, -0.4523773193359375, -0.4391288757324219, -0.42588043212890625, -0.4126319885253906, -0.399383544921875, -0.3861351013183594, -0.37288665771484375, -0.3596382141113281, -0.3463897705078125, -0.3331413269042969, -0.31989288330078125, -0.3066444396972656, -0.29339599609375, -0.2801475524902344, -0.26689910888671875, -0.2536506652832031, -0.2404022216796875, -0.22715377807617188, -0.21390533447265625, -0.20065689086914062, -0.187408447265625, -0.17416000366210938, -0.16091156005859375, -0.14766311645507812, -0.1344146728515625, -0.12116622924804688, -0.10791778564453125, -0.09466934204101562, -0.0814208984375, -0.06817245483398438, -0.05492401123046875, -0.041675567626953125, -0.0284271240234375, -0.015178680419921875, -0.00193023681640625, 0.011318206787109375, 0.024566650390625, 0.037815093994140625, 0.05106353759765625, 0.06431198120117188, 0.0775604248046875, 0.09080886840820312, 0.10405731201171875, 0.11730575561523438, 0.13055419921875, 0.14380264282226562, 0.15705108642578125, 0.17029953002929688, 0.1835479736328125, 0.19679641723632812, 0.21004486083984375, 0.22329330444335938, 0.236541748046875, 0.24979019165039062, 0.26303863525390625, 0.2762870788574219, 0.2895355224609375, 0.3027839660644531, 0.31603240966796875, 0.3292808532714844, 0.342529296875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 24.0, 63.0, 167.0, 323.0, 232.0, 102.0, 36.0, 18.0, 3.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.8879098892211914, -3.7847743034362793, -3.681638717651367, -3.578502893447876, -3.475367307662964, -3.3722317218780518, -3.2690958976745605, -3.1659603118896484, -3.0628247261047363, -2.959689140319824, -2.856553554534912, -2.753417730331421, -2.650282144546509, -2.5471465587615967, -2.4440107345581055, -2.3408751487731934, -2.2377395629882812, -2.134603977203369, -2.031468391418457, -1.9283325672149658, -1.8251969814300537, -1.7220613956451416, -1.61892569065094, -1.5157899856567383, -1.4126543998718262, -1.309518814086914, -1.2063831090927124, -1.1032474040985107, -1.0001118183135986, -0.8969761729240417, -0.7938405275344849, -0.690704882144928, -0.5875692367553711, -0.4844335913658142, -0.3812979459762573, -0.27816230058670044, -0.17502665519714355, -0.07189100980758667, 0.031244635581970215, 0.1343802809715271, 0.23751592636108398, 0.34065157175064087, 0.44378721714019775, 0.5469228625297546, 0.6500585079193115, 0.7531941533088684, 0.8563297986984253, 0.9594654440879822, 1.062601089477539, 1.1657366752624512, 1.2688723802566528, 1.3720080852508545, 1.4751436710357666, 1.5782792568206787, 1.6814149618148804, 1.784550666809082, 1.8876862525939941, 1.9908218383789062, 2.0939574241638184, 2.1970932483673096, 2.3002288341522217, 2.403364419937134, 2.506500244140625, 2.609635829925537, 2.712771415710449]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 10.0, 16.0, 19.0, 33.0, 54.0, 70.0, 92.0, 118.0, 141.0, 115.0, 111.0, 70.0, 42.0, 36.0, 24.0, 11.0, 6.0, 4.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6824002265930176, -2.5637271404266357, -2.445053815841675, -2.326380729675293, -2.207707643508911, -2.0890345573425293, -1.9703612327575684, -1.8516881465911865, -1.7330150604248047, -1.6143418550491333, -1.4956687688827515, -1.37699556350708, -1.2583224773406982, -1.1396492719650269, -1.0209760665893555, -0.9023029804229736, -0.7836297750473022, -0.6649566292762756, -0.546283483505249, -0.4276103079319, -0.3089371621608734, -0.19026398658752441, -0.0715908408164978, 0.04708230495452881, 0.16575545072555542, 0.28442859649658203, 0.40310174226760864, 0.5217748880386353, 0.6404480934143066, 0.7591212391853333, 0.8777943849563599, 0.9964675307273865, 1.115140676498413, 1.2338138818740845, 1.3524869680404663, 1.4711601734161377, 1.5898332595825195, 1.708506464958191, 1.8271796703338623, 1.9458527565002441, 2.064525842666626, 2.183198928833008, 2.3018722534179688, 2.4205453395843506, 2.5392184257507324, 2.6578917503356934, 2.776564836502075, 2.895237922668457, 3.013911247253418, 3.1325843334198, 3.2512576580047607, 3.3699307441711426, 3.4886038303375244, 3.6072769165039062, 3.725950241088867, 3.844623327255249, 3.963296413421631, 4.081969738006592, 4.2006425857543945, 4.3193159103393555, 4.437989234924316, 4.556662082672119, 4.67533540725708, 4.794008255004883, 4.912681579589844]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 8.0, 3.0, 11.0, 8.0, 12.0, 12.0, 22.0, 22.0, 38.0, 56.0, 96.0, 155.0, 201.0, 317.0, 515.0, 1002.0, 2458.0, 8704.0, 218655.0, 3944652.0, 12499.0, 2696.0, 1111.0, 491.0, 231.0, 113.0, 63.0, 39.0, 25.0, 15.0, 13.0, 11.0, 9.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849609375, -2.7785491943359375, -2.707489013671875, -2.6364288330078125, -2.56536865234375, -2.4943084716796875, -2.423248291015625, -2.3521881103515625, -2.2811279296875, -2.2100677490234375, -2.139007568359375, -2.0679473876953125, -1.99688720703125, -1.9258270263671875, -1.854766845703125, -1.7837066650390625, -1.712646484375, -1.6415863037109375, -1.570526123046875, -1.4994659423828125, -1.42840576171875, -1.3573455810546875, -1.286285400390625, -1.2152252197265625, -1.1441650390625, -1.0731048583984375, -1.002044677734375, -0.9309844970703125, -0.85992431640625, -0.7888641357421875, -0.717803955078125, -0.6467437744140625, -0.57568359375, -0.5046234130859375, -0.433563232421875, -0.3625030517578125, -0.29144287109375, -0.2203826904296875, -0.149322509765625, -0.0782623291015625, -0.0072021484375, 0.0638580322265625, 0.134918212890625, 0.2059783935546875, 0.27703857421875, 0.3480987548828125, 0.419158935546875, 0.4902191162109375, 0.561279296875, 0.6323394775390625, 0.703399658203125, 0.7744598388671875, 0.84552001953125, 0.9165802001953125, 0.987640380859375, 1.0587005615234375, 1.1297607421875, 1.2008209228515625, 1.271881103515625, 1.3429412841796875, 1.41400146484375, 1.4850616455078125, 1.556121826171875, 1.6271820068359375, 1.6982421875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 11.0, 21.0, 22.0, 29.0, 100.0, 212.0, 243.0, 174.0, 83.0, 37.0, 12.0, 18.0, 14.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11944580078125, -0.11647891998291016, -0.11351203918457031, -0.11054515838623047, -0.10757827758789062, -0.10461139678955078, -0.10164451599121094, -0.0986776351928711, -0.09571075439453125, -0.0927438735961914, -0.08977699279785156, -0.08681011199951172, -0.08384323120117188, -0.08087635040283203, -0.07790946960449219, -0.07494258880615234, -0.0719757080078125, -0.06900882720947266, -0.06604194641113281, -0.06307506561279297, -0.060108184814453125, -0.05714130401611328, -0.05417442321777344, -0.051207542419433594, -0.04824066162109375, -0.045273780822753906, -0.04230690002441406, -0.03934001922607422, -0.036373138427734375, -0.03340625762939453, -0.030439376831054688, -0.027472496032714844, -0.024505615234375, -0.021538734436035156, -0.018571853637695312, -0.015604972839355469, -0.012638092041015625, -0.009671211242675781, -0.0067043304443359375, -0.0037374496459960938, -0.00077056884765625, 0.0021963119506835938, 0.0051631927490234375, 0.008130073547363281, 0.011096954345703125, 0.014063835144042969, 0.017030715942382812, 0.019997596740722656, 0.0229644775390625, 0.025931358337402344, 0.028898239135742188, 0.03186511993408203, 0.034832000732421875, 0.03779888153076172, 0.04076576232910156, 0.043732643127441406, 0.04669952392578125, 0.049666404724121094, 0.05263328552246094, 0.05560016632080078, 0.058567047119140625, 0.06153392791748047, 0.06450080871582031, 0.06746768951416016, 0.0704345703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 9.0, 16.0, 13.0, 28.0, 36.0, 75.0, 170.0, 1212.0, 786609.0, 3404436.0, 1330.0, 172.0, 62.0, 30.0, 24.0, 13.0, 12.0, 9.0, 4.0, 6.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.720703125, -2.61614990234375, -2.5115966796875, -2.40704345703125, -2.302490234375, -2.19793701171875, -2.0933837890625, -1.98883056640625, -1.88427734375, -1.77972412109375, -1.6751708984375, -1.57061767578125, -1.466064453125, -1.36151123046875, -1.2569580078125, -1.15240478515625, -1.0478515625, -0.94329833984375, -0.8387451171875, -0.73419189453125, -0.629638671875, -0.52508544921875, -0.4205322265625, -0.31597900390625, -0.21142578125, -0.10687255859375, -0.0023193359375, 0.10223388671875, 0.206787109375, 0.31134033203125, 0.4158935546875, 0.52044677734375, 0.625, 0.72955322265625, 0.8341064453125, 0.93865966796875, 1.043212890625, 1.14776611328125, 1.2523193359375, 1.35687255859375, 1.46142578125, 1.56597900390625, 1.6705322265625, 1.77508544921875, 1.879638671875, 1.98419189453125, 2.0887451171875, 2.19329833984375, 2.2978515625, 2.40240478515625, 2.5069580078125, 2.61151123046875, 2.716064453125, 2.82061767578125, 2.9251708984375, 3.02972412109375, 3.13427734375, 3.23883056640625, 3.3433837890625, 3.44793701171875, 3.552490234375, 3.65704345703125, 3.7615966796875, 3.86614990234375, 3.970703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 1.0, 4.0, 7.0, 12.0, 9.0, 11.0, 30.0, 43.0, 75.0, 137.0, 363.0, 1864.0, 976.0, 259.0, 112.0, 55.0, 29.0, 38.0, 19.0, 11.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.14306640625, -0.1391744613647461, -0.1352825164794922, -0.13139057159423828, -0.12749862670898438, -0.12360668182373047, -0.11971473693847656, -0.11582279205322266, -0.11193084716796875, -0.10803890228271484, -0.10414695739746094, -0.10025501251220703, -0.09636306762695312, -0.09247112274169922, -0.08857917785644531, -0.0846872329711914, -0.0807952880859375, -0.0769033432006836, -0.07301139831542969, -0.06911945343017578, -0.06522750854492188, -0.06133556365966797, -0.05744361877441406, -0.053551673889160156, -0.04965972900390625, -0.045767784118652344, -0.04187583923339844, -0.03798389434814453, -0.034091949462890625, -0.03020000457763672, -0.026308059692382812, -0.022416114807128906, -0.018524169921875, -0.014632225036621094, -0.010740280151367188, -0.006848335266113281, -0.002956390380859375, 0.0009355545043945312, 0.0048274993896484375, 0.008719444274902344, 0.01261138916015625, 0.016503334045410156, 0.020395278930664062, 0.02428722381591797, 0.028179168701171875, 0.03207111358642578, 0.03596305847167969, 0.039855003356933594, 0.0437469482421875, 0.047638893127441406, 0.05153083801269531, 0.05542278289794922, 0.059314727783203125, 0.06320667266845703, 0.06709861755371094, 0.07099056243896484, 0.07488250732421875, 0.07877445220947266, 0.08266639709472656, 0.08655834197998047, 0.09045028686523438, 0.09434223175048828, 0.09823417663574219, 0.1021261215209961, 0.10601806640625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 16.0, 23.0, 75.0, 347.0, 417.0, 95.0, 16.0, 9.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.921736240386963, -1.8760442733764648, -1.8303521871566772, -1.7846602201461792, -1.7389682531356812, -1.693276286125183, -1.6475841999053955, -1.6018922328948975, -1.5562002658843994, -1.5105082988739014, -1.4648162126541138, -1.4191242456436157, -1.3734322786331177, -1.3277403116226196, -1.282048225402832, -1.236356258392334, -1.190664291381836, -1.144972324371338, -1.0992802381515503, -1.0535882711410522, -1.0078963041305542, -0.9622042775154114, -0.9165122509002686, -0.8708202838897705, -0.8251281976699829, -0.7794361710548401, -0.733744204044342, -0.6880521774291992, -0.6423602104187012, -0.5966681838035583, -0.5509761571884155, -0.5052841901779175, -0.45959222316741943, -0.413900226354599, -0.36820822954177856, -0.32251620292663574, -0.2768242359161377, -0.23113222420215607, -0.18544021248817444, -0.139748215675354, -0.09405621886253357, -0.048364218324422836, -0.0026722177863121033, 0.04301978647708893, 0.08871178328990936, 0.1344037801027298, 0.18009579181671143, 0.22578778862953186, 0.2714797854423523, 0.31717178225517273, 0.36286377906799316, 0.408555805683136, 0.45424777269363403, 0.49993979930877686, 0.5456317663192749, 0.5913237929344177, 0.6370158195495605, 0.6827078461647034, 0.7283998131752014, 0.7740918397903442, 0.8197838068008423, 0.8654758334159851, 0.9111678600311279, 0.956859827041626, 1.002551794052124]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 3.0, 6.0, 6.0, 9.0, 6.0, 8.0, 18.0, 13.0, 20.0, 34.0, 37.0, 45.0, 49.0, 40.0, 77.0, 62.0, 61.0, 67.0, 66.0, 63.0, 48.0, 49.0, 35.0, 37.0, 24.0, 24.0, 18.0, 12.0, 11.0, 9.0, 7.0, 9.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3199346661567688, -0.3076961636543274, -0.295457661151886, -0.2832191586494446, -0.2709806561470032, -0.25874215364456177, -0.24650365114212036, -0.23426514863967896, -0.22202664613723755, -0.20978814363479614, -0.19754964113235474, -0.18531113862991333, -0.17307263612747192, -0.16083413362503052, -0.1485956311225891, -0.1363571286201477, -0.12411864101886749, -0.11188013851642609, -0.09964163601398468, -0.08740313351154327, -0.07516463100910187, -0.06292612850666046, -0.05068763345479965, -0.038449130952358246, -0.02621062844991684, -0.013972126878798008, -0.0017336253076791763, 0.01050487533211708, 0.022743377834558487, 0.03498188033699989, 0.047220379114151, 0.05945888161659241, 0.07169738411903381, 0.08393588662147522, 0.09617438912391663, 0.10841289162635803, 0.12065139412879944, 0.13288989663124084, 0.14512839913368225, 0.15736690163612366, 0.16960540413856506, 0.18184390664100647, 0.19408240914344788, 0.20632091164588928, 0.2185594141483307, 0.2307979166507721, 0.2430364191532135, 0.2552749216556549, 0.2675133943557739, 0.27975189685821533, 0.29199039936065674, 0.30422890186309814, 0.31646740436553955, 0.32870590686798096, 0.34094440937042236, 0.35318291187286377, 0.3654214143753052, 0.3776599168777466, 0.389898419380188, 0.4021369218826294, 0.4143754243850708, 0.4266139268875122, 0.4388524293899536, 0.451090931892395, 0.4633294343948364]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 9.0, 9.0, 18.0, 16.0, 35.0, 58.0, 82.0, 167.0, 271.0, 625.0, 1582.0, 5221.0, 42771.0, 909943.0, 77441.0, 6921.0, 1901.0, 726.0, 336.0, 174.0, 93.0, 42.0, 37.0, 21.0, 14.0, 14.0, 7.0, 4.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80712890625, -0.7767715454101562, -0.7464141845703125, -0.7160568237304688, -0.685699462890625, -0.6553421020507812, -0.6249847412109375, -0.5946273803710938, -0.56427001953125, -0.5339126586914062, -0.5035552978515625, -0.47319793701171875, -0.442840576171875, -0.41248321533203125, -0.3821258544921875, -0.35176849365234375, -0.3214111328125, -0.29105377197265625, -0.2606964111328125, -0.23033905029296875, -0.199981689453125, -0.16962432861328125, -0.1392669677734375, -0.10890960693359375, -0.07855224609375, -0.04819488525390625, -0.0178375244140625, 0.01251983642578125, 0.042877197265625, 0.07323455810546875, 0.1035919189453125, 0.13394927978515625, 0.164306640625, 0.19466400146484375, 0.2250213623046875, 0.25537872314453125, 0.285736083984375, 0.31609344482421875, 0.3464508056640625, 0.37680816650390625, 0.40716552734375, 0.43752288818359375, 0.4678802490234375, 0.49823760986328125, 0.528594970703125, 0.5589523315429688, 0.5893096923828125, 0.6196670532226562, 0.6500244140625, 0.6803817749023438, 0.7107391357421875, 0.7410964965820312, 0.771453857421875, 0.8018112182617188, 0.8321685791015625, 0.8625259399414062, 0.89288330078125, 0.9232406616210938, 0.9535980224609375, 0.9839553833007812, 1.014312744140625, 1.0446701049804688, 1.0750274658203125, 1.1053848266601562, 1.1357421875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 11.0, 13.0, 28.0, 77.0, 155.0, 225.0, 220.0, 150.0, 56.0, 26.0, 12.0, 12.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11663818359375, -0.11363029479980469, -0.11062240600585938, -0.10761451721191406, -0.10460662841796875, -0.10159873962402344, -0.09859085083007812, -0.09558296203613281, -0.0925750732421875, -0.08956718444824219, -0.08655929565429688, -0.08355140686035156, -0.08054351806640625, -0.07753562927246094, -0.07452774047851562, -0.07151985168457031, -0.068511962890625, -0.06550407409667969, -0.062496185302734375, -0.05948829650878906, -0.05648040771484375, -0.05347251892089844, -0.050464630126953125, -0.04745674133300781, -0.0444488525390625, -0.04144096374511719, -0.038433074951171875, -0.03542518615722656, -0.03241729736328125, -0.029409408569335938, -0.026401519775390625, -0.023393630981445312, -0.0203857421875, -0.017377853393554688, -0.014369964599609375, -0.011362075805664062, -0.00835418701171875, -0.0053462982177734375, -0.002338409423828125, 0.0006694793701171875, 0.0036773681640625, 0.0066852569580078125, 0.009693145751953125, 0.012701034545898438, 0.01570892333984375, 0.018716812133789062, 0.021724700927734375, 0.024732589721679688, 0.027740478515625, 0.030748367309570312, 0.033756256103515625, 0.03676414489746094, 0.03977203369140625, 0.04277992248535156, 0.045787811279296875, 0.04879570007324219, 0.0518035888671875, 0.05481147766113281, 0.057819366455078125, 0.06082725524902344, 0.06383514404296875, 0.06684303283691406, 0.06985092163085938, 0.07285881042480469, 0.07586669921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 6.0, 6.0, 13.0, 10.0, 12.0, 41.0, 57.0, 102.0, 221.0, 449.0, 1106.0, 3514.0, 14365.0, 85960.0, 520110.0, 356825.0, 51931.0, 9638.0, 2476.0, 899.0, 353.0, 184.0, 97.0, 57.0, 43.0, 18.0, 19.0, 12.0, 9.0, 4.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.481689453125, -0.4660835266113281, -0.45047760009765625, -0.4348716735839844, -0.4192657470703125, -0.4036598205566406, -0.38805389404296875, -0.3724479675292969, -0.356842041015625, -0.3412361145019531, -0.32563018798828125, -0.3100242614746094, -0.2944183349609375, -0.2788124084472656, -0.26320648193359375, -0.24760055541992188, -0.23199462890625, -0.21638870239257812, -0.20078277587890625, -0.18517684936523438, -0.1695709228515625, -0.15396499633789062, -0.13835906982421875, -0.12275314331054688, -0.107147216796875, -0.09154129028320312, -0.07593536376953125, -0.060329437255859375, -0.0447235107421875, -0.029117584228515625, -0.01351165771484375, 0.002094268798828125, 0.0177001953125, 0.033306121826171875, 0.04891204833984375, 0.06451797485351562, 0.0801239013671875, 0.09572982788085938, 0.11133575439453125, 0.12694168090820312, 0.142547607421875, 0.15815353393554688, 0.17375946044921875, 0.18936538696289062, 0.2049713134765625, 0.22057723999023438, 0.23618316650390625, 0.2517890930175781, 0.26739501953125, 0.2830009460449219, 0.29860687255859375, 0.3142127990722656, 0.3298187255859375, 0.3454246520996094, 0.36103057861328125, 0.3766365051269531, 0.392242431640625, 0.4078483581542969, 0.42345428466796875, 0.4390602111816406, 0.4546661376953125, 0.4702720642089844, 0.48587799072265625, 0.5014839172363281, 0.51708984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 6.0, 7.0, 4.0, 15.0, 13.0, 15.0, 15.0, 19.0, 30.0, 29.0, 35.0, 42.0, 51.0, 38.0, 36.0, 50.0, 57.0, 58.0, 45.0, 42.0, 60.0, 55.0, 45.0, 39.0, 33.0, 26.0, 28.0, 23.0, 14.0, 18.0, 13.0, 9.0, 6.0, 6.0, 5.0, 7.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19287109375, -0.18605804443359375, -0.1792449951171875, -0.17243194580078125, -0.165618896484375, -0.15880584716796875, -0.1519927978515625, -0.14517974853515625, -0.13836669921875, -0.13155364990234375, -0.1247406005859375, -0.11792755126953125, -0.111114501953125, -0.10430145263671875, -0.0974884033203125, -0.09067535400390625, -0.0838623046875, -0.07704925537109375, -0.0702362060546875, -0.06342315673828125, -0.056610107421875, -0.04979705810546875, -0.0429840087890625, -0.03617095947265625, -0.02935791015625, -0.02254486083984375, -0.0157318115234375, -0.00891876220703125, -0.002105712890625, 0.00470733642578125, 0.0115203857421875, 0.01833343505859375, 0.025146484375, 0.03195953369140625, 0.0387725830078125, 0.04558563232421875, 0.052398681640625, 0.05921173095703125, 0.0660247802734375, 0.07283782958984375, 0.07965087890625, 0.08646392822265625, 0.0932769775390625, 0.10009002685546875, 0.106903076171875, 0.11371612548828125, 0.1205291748046875, 0.12734222412109375, 0.1341552734375, 0.14096832275390625, 0.1477813720703125, 0.15459442138671875, 0.161407470703125, 0.16822052001953125, 0.1750335693359375, 0.18184661865234375, 0.18865966796875, 0.19547271728515625, 0.2022857666015625, 0.20909881591796875, 0.215911865234375, 0.22272491455078125, 0.2295379638671875, 0.23635101318359375, 0.2431640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 13.0, 8.0, 11.0, 27.0, 35.0, 68.0, 140.0, 382.0, 1229.0, 7044.0, 530104.0, 500548.0, 7025.0, 1240.0, 359.0, 154.0, 68.0, 48.0, 20.0, 11.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.923828125, -0.8995132446289062, -0.8751983642578125, -0.8508834838867188, -0.826568603515625, -0.8022537231445312, -0.7779388427734375, -0.7536239624023438, -0.72930908203125, -0.7049942016601562, -0.6806793212890625, -0.6563644409179688, -0.632049560546875, -0.6077346801757812, -0.5834197998046875, -0.5591049194335938, -0.5347900390625, -0.5104751586914062, -0.4861602783203125, -0.46184539794921875, -0.437530517578125, -0.41321563720703125, -0.3889007568359375, -0.36458587646484375, -0.34027099609375, -0.31595611572265625, -0.2916412353515625, -0.26732635498046875, -0.243011474609375, -0.21869659423828125, -0.1943817138671875, -0.17006683349609375, -0.145751953125, -0.12143707275390625, -0.0971221923828125, -0.07280731201171875, -0.048492431640625, -0.02417755126953125, 0.0001373291015625, 0.02445220947265625, 0.04876708984375, 0.07308197021484375, 0.0973968505859375, 0.12171173095703125, 0.146026611328125, 0.17034149169921875, 0.1946563720703125, 0.21897125244140625, 0.2432861328125, 0.26760101318359375, 0.2919158935546875, 0.31623077392578125, 0.340545654296875, 0.36486053466796875, 0.3891754150390625, 0.41349029541015625, 0.43780517578125, 0.46212005615234375, 0.4864349365234375, 0.5107498168945312, 0.535064697265625, 0.5593795776367188, 0.5836944580078125, 0.6080093383789062, 0.63232421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 5.0, 11.0, 17.0, 25.0, 20.0, 25.0, 26.0, 41.0, 44.0, 62.0, 66.0, 98.0, 115.0, 92.0, 69.0, 55.0, 50.0, 35.0, 35.0, 25.0, 22.0, 13.0, 13.0, 6.0, 6.0, 10.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024020671844482422, -0.00023213960230350494, -0.00022407248616218567, -0.0002160053700208664, -0.00020793825387954712, -0.00019987113773822784, -0.00019180402159690857, -0.0001837369054555893, -0.00017566978931427002, -0.00016760267317295074, -0.00015953555703163147, -0.0001514684408903122, -0.00014340132474899292, -0.00013533420860767365, -0.00012726709246635437, -0.0001191999763250351, -0.00011113286018371582, -0.00010306574404239655, -9.499862790107727e-05, -8.6931511759758e-05, -7.886439561843872e-05, -7.079727947711945e-05, -6.273016333580017e-05, -5.4663047194480896e-05, -4.659593105316162e-05, -3.8528814911842346e-05, -3.046169877052307e-05, -2.2394582629203796e-05, -1.4327466487884521e-05, -6.260350346565247e-06, 1.8067657947540283e-06, 9.873881936073303e-06, 1.7940998077392578e-05, 2.6008114218711853e-05, 3.407523036003113e-05, 4.21423465013504e-05, 5.020946264266968e-05, 5.827657878398895e-05, 6.634369492530823e-05, 7.44108110666275e-05, 8.247792720794678e-05, 9.054504334926605e-05, 9.861215949058533e-05, 0.0001066792756319046, 0.00011474639177322388, 0.00012281350791454315, 0.00013088062405586243, 0.0001389477401971817, 0.00014701485633850098, 0.00015508197247982025, 0.00016314908862113953, 0.0001712162047624588, 0.00017928332090377808, 0.00018735043704509735, 0.00019541755318641663, 0.0002034846693277359, 0.00021155178546905518, 0.00021961890161037445, 0.00022768601775169373, 0.000235753133893013, 0.00024382025003433228, 0.00025188736617565155, 0.0002599544823169708, 0.0002680215984582901, 0.0002760887145996094]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 5.0, 6.0, 7.0, 25.0, 30.0, 30.0, 68.0, 97.0, 160.0, 234.0, 466.0, 920.0, 2233.0, 9873.0, 158751.0, 837850.0, 30352.0, 4369.0, 1460.0, 651.0, 372.0, 229.0, 133.0, 86.0, 42.0, 40.0, 18.0, 12.0, 13.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.421875, -0.40517425537109375, -0.3884735107421875, -0.37177276611328125, -0.355072021484375, -0.33837127685546875, -0.3216705322265625, -0.30496978759765625, -0.28826904296875, -0.27156829833984375, -0.2548675537109375, -0.23816680908203125, -0.221466064453125, -0.20476531982421875, -0.1880645751953125, -0.17136383056640625, -0.1546630859375, -0.13796234130859375, -0.1212615966796875, -0.10456085205078125, -0.087860107421875, -0.07115936279296875, -0.0544586181640625, -0.03775787353515625, -0.02105712890625, -0.00435638427734375, 0.0123443603515625, 0.02904510498046875, 0.045745849609375, 0.06244659423828125, 0.0791473388671875, 0.09584808349609375, 0.112548828125, 0.12924957275390625, 0.1459503173828125, 0.16265106201171875, 0.179351806640625, 0.19605255126953125, 0.2127532958984375, 0.22945404052734375, 0.24615478515625, 0.26285552978515625, 0.2795562744140625, 0.29625701904296875, 0.312957763671875, 0.32965850830078125, 0.3463592529296875, 0.36305999755859375, 0.3797607421875, 0.39646148681640625, 0.4131622314453125, 0.42986297607421875, 0.446563720703125, 0.46326446533203125, 0.4799652099609375, 0.49666595458984375, 0.51336669921875, 0.5300674438476562, 0.5467681884765625, 0.5634689331054688, 0.580169677734375, 0.5968704223632812, 0.6135711669921875, 0.6302719116210938, 0.64697265625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 7.0, 12.0, 27.0, 32.0, 59.0, 124.0, 186.0, 211.0, 146.0, 88.0, 43.0, 26.0, 22.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2489013671875, -0.2403888702392578, -0.23187637329101562, -0.22336387634277344, -0.21485137939453125, -0.20633888244628906, -0.19782638549804688, -0.1893138885498047, -0.1808013916015625, -0.1722888946533203, -0.16377639770507812, -0.15526390075683594, -0.14675140380859375, -0.13823890686035156, -0.12972640991210938, -0.12121391296386719, -0.112701416015625, -0.10418891906738281, -0.09567642211914062, -0.08716392517089844, -0.07865142822265625, -0.07013893127441406, -0.061626434326171875, -0.05311393737792969, -0.0446014404296875, -0.03608894348144531, -0.027576446533203125, -0.019063949584960938, -0.01055145263671875, -0.0020389556884765625, 0.006473541259765625, 0.014986038208007812, 0.02349853515625, 0.03201103210449219, 0.040523529052734375, 0.04903602600097656, 0.05754852294921875, 0.06606101989746094, 0.07457351684570312, 0.08308601379394531, 0.0915985107421875, 0.10011100769042969, 0.10862350463867188, 0.11713600158691406, 0.12564849853515625, 0.13416099548339844, 0.14267349243164062, 0.1511859893798828, 0.159698486328125, 0.1682109832763672, 0.17672348022460938, 0.18523597717285156, 0.19374847412109375, 0.20226097106933594, 0.21077346801757812, 0.2192859649658203, 0.2277984619140625, 0.2363109588623047, 0.24482345581054688, 0.25333595275878906, 0.26184844970703125, 0.27036094665527344, 0.2788734436035156, 0.2873859405517578, 0.2958984375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 9.0, 14.0, 37.0, 103.0, 270.0, 307.0, 156.0, 63.0, 28.0, 10.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.9216318130493164, -3.7715790271759033, -3.6215262413024902, -3.471473455429077, -3.321420669555664, -3.171367883682251, -3.021315097808838, -2.871262550354004, -2.7212095260620117, -2.5711567401885986, -2.4211039543151855, -2.2710511684417725, -2.1209983825683594, -1.9709455966949463, -1.8208929300308228, -1.6708401441574097, -1.5207874774932861, -1.370734691619873, -1.22068190574646, -1.0706291198730469, -0.9205763936042786, -0.7705236077308655, -0.6204708814620972, -0.4704180955886841, -0.320365309715271, -0.1703125387430191, -0.020259767770767212, 0.1297929883003235, 0.2798457741737366, 0.42989856004714966, 0.579951286315918, 0.730004072189331, 0.8800568580627441, 1.0301096439361572, 1.1801624298095703, 1.3302152156829834, 1.4802680015563965, 1.6303207874298096, 1.780373454093933, 1.9304262399673462, 2.080479145050049, 2.230531930923462, 2.380584716796875, 2.530637502670288, 2.680690288543701, 2.8307430744171143, 2.9807958602905273, 3.1308484077453613, 3.2809011936187744, 3.4309539794921875, 3.5810067653656006, 3.7310595512390137, 3.8811123371124268, 4.03116512298584, 4.181217670440674, 4.331270694732666, 4.4813232421875, 4.631375789642334, 4.781428813934326, 4.93148136138916, 5.081534385681152, 5.231586933135986, 5.3816399574279785, 5.5316925048828125, 5.681745529174805]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 7.0, 10.0, 12.0, 14.0, 13.0, 26.0, 18.0, 27.0, 43.0, 52.0, 55.0, 52.0, 60.0, 60.0, 62.0, 72.0, 62.0, 66.0, 50.0, 49.0, 40.0, 29.0, 24.0, 21.0, 23.0, 12.0, 12.0, 12.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.242246389389038, -2.1774702072143555, -2.112694025039673, -2.0479178428649902, -1.9831416606903076, -1.918365478515625, -1.8535891771316528, -1.7888129949569702, -1.7240368127822876, -1.659260630607605, -1.5944844484329224, -1.5297082662582397, -1.4649319648742676, -1.400155782699585, -1.3353796005249023, -1.2706034183502197, -1.205827236175537, -1.1410510540008545, -1.0762748718261719, -1.0114986896514893, -0.9467224478721619, -0.8819462656974792, -0.8171700239181519, -0.7523938417434692, -0.6876176595687866, -0.622841477394104, -0.5580652952194214, -0.493289053440094, -0.4285128712654114, -0.36373668909072876, -0.29896047711372375, -0.23418426513671875, -0.16940808296203613, -0.10463188588619232, -0.03985568881034851, 0.0249205082654953, 0.08969670534133911, 0.15447288751602173, 0.21924909949302673, 0.28402531147003174, 0.34880149364471436, 0.413577675819397, 0.478353887796402, 0.543130099773407, 0.6079062819480896, 0.6726824641227722, 0.7374587059020996, 0.8022348880767822, 0.8670110702514648, 0.9317872524261475, 0.9965634346008301, 1.0613396167755127, 1.1261157989501953, 1.190891981124878, 1.25566828250885, 1.3204444646835327, 1.3852206468582153, 1.449996829032898, 1.5147730112075806, 1.5795491933822632, 1.6443254947662354, 1.709101676940918, 1.7738778591156006, 1.8386540412902832, 1.9034302234649658]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 10.0, 22.0, 33.0, 71.0, 213.0, 645.0, 6960.0, 4178475.0, 7195.0, 441.0, 116.0, 46.0, 25.0, 13.0, 4.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.234375, -7.06011962890625, -6.8858642578125, -6.71160888671875, -6.537353515625, -6.36309814453125, -6.1888427734375, -6.01458740234375, -5.84033203125, -5.66607666015625, -5.4918212890625, -5.31756591796875, -5.143310546875, -4.96905517578125, -4.7947998046875, -4.62054443359375, -4.4462890625, -4.27203369140625, -4.0977783203125, -3.92352294921875, -3.749267578125, -3.57501220703125, -3.4007568359375, -3.22650146484375, -3.05224609375, -2.87799072265625, -2.7037353515625, -2.52947998046875, -2.355224609375, -2.18096923828125, -2.0067138671875, -1.83245849609375, -1.658203125, -1.48394775390625, -1.3096923828125, -1.13543701171875, -0.961181640625, -0.78692626953125, -0.6126708984375, -0.43841552734375, -0.26416015625, -0.08990478515625, 0.0843505859375, 0.25860595703125, 0.432861328125, 0.60711669921875, 0.7813720703125, 0.95562744140625, 1.1298828125, 1.30413818359375, 1.4783935546875, 1.65264892578125, 1.826904296875, 2.00115966796875, 2.1754150390625, 2.34967041015625, 2.52392578125, 2.69818115234375, 2.8724365234375, 3.04669189453125, 3.220947265625, 3.39520263671875, 3.5694580078125, 3.74371337890625, 3.91796875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 10.0, 16.0, 37.0, 69.0, 102.0, 163.0, 204.0, 147.0, 117.0, 61.0, 33.0, 19.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.15781211853027344, -0.15400314331054688, -0.1501941680908203, -0.14638519287109375, -0.1425762176513672, -0.13876724243164062, -0.13495826721191406, -0.1311492919921875, -0.12734031677246094, -0.12353134155273438, -0.11972236633300781, -0.11591339111328125, -0.11210441589355469, -0.10829544067382812, -0.10448646545410156, -0.100677490234375, -0.09686851501464844, -0.09305953979492188, -0.08925056457519531, -0.08544158935546875, -0.08163261413574219, -0.07782363891601562, -0.07401466369628906, -0.0702056884765625, -0.06639671325683594, -0.06258773803710938, -0.05877876281738281, -0.05496978759765625, -0.05116081237792969, -0.047351837158203125, -0.04354286193847656, -0.03973388671875, -0.03592491149902344, -0.032115936279296875, -0.028306961059570312, -0.02449798583984375, -0.020689010620117188, -0.016880035400390625, -0.013071060180664062, -0.0092620849609375, -0.0054531097412109375, -0.001644134521484375, 0.0021648406982421875, 0.00597381591796875, 0.009782791137695312, 0.013591766357421875, 0.017400741577148438, 0.021209716796875, 0.025018692016601562, 0.028827667236328125, 0.03263664245605469, 0.03644561767578125, 0.04025459289550781, 0.044063568115234375, 0.04787254333496094, 0.0516815185546875, 0.05549049377441406, 0.059299468994140625, 0.06310844421386719, 0.06691741943359375, 0.07072639465332031, 0.07453536987304688, 0.07834434509277344, 0.0821533203125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 13.0, 20.0, 29.0, 49.0, 49.0, 71.0, 91.0, 148.0, 219.0, 425.0, 1144.0, 7715.0, 267395.0, 3894496.0, 19239.0, 1996.0, 539.0, 235.0, 128.0, 84.0, 58.0, 37.0, 34.0, 20.0, 14.0, 10.0, 4.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9033203125, -1.85595703125, -1.80859375, -1.76123046875, -1.7138671875, -1.66650390625, -1.619140625, -1.57177734375, -1.5244140625, -1.47705078125, -1.4296875, -1.38232421875, -1.3349609375, -1.28759765625, -1.240234375, -1.19287109375, -1.1455078125, -1.09814453125, -1.05078125, -1.00341796875, -0.9560546875, -0.90869140625, -0.861328125, -0.81396484375, -0.7666015625, -0.71923828125, -0.671875, -0.62451171875, -0.5771484375, -0.52978515625, -0.482421875, -0.43505859375, -0.3876953125, -0.34033203125, -0.29296875, -0.24560546875, -0.1982421875, -0.15087890625, -0.103515625, -0.05615234375, -0.0087890625, 0.03857421875, 0.0859375, 0.13330078125, 0.1806640625, 0.22802734375, 0.275390625, 0.32275390625, 0.3701171875, 0.41748046875, 0.46484375, 0.51220703125, 0.5595703125, 0.60693359375, 0.654296875, 0.70166015625, 0.7490234375, 0.79638671875, 0.84375, 0.89111328125, 0.9384765625, 0.98583984375, 1.033203125, 1.08056640625, 1.1279296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 4.0, 8.0, 17.0, 24.0, 23.0, 50.0, 104.0, 292.0, 1225.0, 1799.0, 306.0, 105.0, 54.0, 24.0, 10.0, 8.0, 7.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.291259765625, -0.284942626953125, -0.27862548828125, -0.272308349609375, -0.2659912109375, -0.259674072265625, -0.25335693359375, -0.247039794921875, -0.24072265625, -0.234405517578125, -0.22808837890625, -0.221771240234375, -0.2154541015625, -0.209136962890625, -0.20281982421875, -0.196502685546875, -0.190185546875, -0.183868408203125, -0.17755126953125, -0.171234130859375, -0.1649169921875, -0.158599853515625, -0.15228271484375, -0.145965576171875, -0.1396484375, -0.133331298828125, -0.12701416015625, -0.120697021484375, -0.1143798828125, -0.108062744140625, -0.10174560546875, -0.095428466796875, -0.089111328125, -0.082794189453125, -0.07647705078125, -0.070159912109375, -0.0638427734375, -0.057525634765625, -0.05120849609375, -0.044891357421875, -0.03857421875, -0.032257080078125, -0.02593994140625, -0.019622802734375, -0.0133056640625, -0.006988525390625, -0.00067138671875, 0.005645751953125, 0.011962890625, 0.018280029296875, 0.02459716796875, 0.030914306640625, 0.0372314453125, 0.043548583984375, 0.04986572265625, 0.056182861328125, 0.0625, 0.068817138671875, 0.07513427734375, 0.081451416015625, 0.0877685546875, 0.094085693359375, 0.10040283203125, 0.106719970703125, 0.113037109375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 9.0, 15.0, 71.0, 220.0, 421.0, 184.0, 60.0, 16.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5949995517730713, -2.527709722518921, -2.4604198932647705, -2.39313006401062, -2.3258402347564697, -2.2585504055023193, -2.191260576248169, -2.1239709854125977, -2.0566811561584473, -1.9893913269042969, -1.9221014976501465, -1.854811668395996, -1.7875218391418457, -1.7202320098876953, -1.6529422998428345, -1.585652470588684, -1.5183625221252441, -1.4510726928710938, -1.3837828636169434, -1.316493034362793, -1.2492032051086426, -1.1819133758544922, -1.1146236658096313, -1.047333836555481, -0.9800440073013306, -0.9127541780471802, -0.8454643487930298, -0.7781745791435242, -0.7108847498893738, -0.6435949206352234, -0.5763051509857178, -0.5090153217315674, -0.4417257308959961, -0.3744359016418457, -0.3071461021900177, -0.2398562878370285, -0.1725664734840393, -0.10527664422988892, -0.03798684477806091, 0.02930295467376709, 0.09659278392791748, 0.16388259828090668, 0.23117241263389587, 0.2984622120857239, 0.36575204133987427, 0.43304187059402466, 0.5003316402435303, 0.5676214694976807, 0.634911298751831, 0.7022011280059814, 0.7694909572601318, 0.8367807269096375, 0.9040705561637878, 0.9713603854179382, 1.0386501550674438, 1.1059399843215942, 1.1732298135757446, 1.240519642829895, 1.3078094720840454, 1.3750993013381958, 1.4423890113830566, 1.509678840637207, 1.5769686698913574, 1.6442584991455078, 1.7115483283996582]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 7.0, 13.0, 12.0, 20.0, 36.0, 42.0, 45.0, 70.0, 78.0, 88.0, 88.0, 101.0, 77.0, 77.0, 69.0, 49.0, 49.0, 27.0, 19.0, 15.0, 10.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7502862811088562, -0.7251657247543335, -0.7000452280044556, -0.6749246716499329, -0.6498041152954102, -0.6246835589408875, -0.5995630025863647, -0.5744425058364868, -0.5493219494819641, -0.5242013931274414, -0.4990808665752411, -0.47396034002304077, -0.44883978366851807, -0.42371922731399536, -0.39859870076179504, -0.3734781742095947, -0.348357617855072, -0.3232370615005493, -0.298116534948349, -0.2729960083961487, -0.24787545204162598, -0.22275491058826447, -0.19763436913490295, -0.17251382768154144, -0.14739328622817993, -0.12227274477481842, -0.09715220332145691, -0.0720316618680954, -0.04691112041473389, -0.021790578961372375, 0.0033299624919891357, 0.028450503945350647, 0.05357104539871216, 0.07869158685207367, 0.10381212830543518, 0.1289326697587967, 0.1540532112121582, 0.17917375266551971, 0.20429429411888123, 0.22941483557224274, 0.25453537702560425, 0.27965593338012695, 0.30477645993232727, 0.3298969864845276, 0.3550175428390503, 0.380138099193573, 0.4052586257457733, 0.43037915229797363, 0.45549970865249634, 0.48062026500701904, 0.505740761756897, 0.5308613181114197, 0.5559818744659424, 0.5811024308204651, 0.6062229871749878, 0.6313434839248657, 0.6564640402793884, 0.6815845966339111, 0.7067050933837891, 0.7318256497383118, 0.7569462060928345, 0.7820667624473572, 0.8071873188018799, 0.8323078155517578, 0.8574283719062805]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 4.0, 7.0, 11.0, 21.0, 37.0, 66.0, 94.0, 201.0, 379.0, 888.0, 2319.0, 9522.0, 161796.0, 815130.0, 49562.0, 5516.0, 1660.0, 647.0, 296.0, 181.0, 96.0, 44.0, 26.0, 21.0, 8.0, 9.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88330078125, -0.8541793823242188, -0.8250579833984375, -0.7959365844726562, -0.766815185546875, -0.7376937866210938, -0.7085723876953125, -0.6794509887695312, -0.65032958984375, -0.6212081909179688, -0.5920867919921875, -0.5629653930664062, -0.533843994140625, -0.5047225952148438, -0.4756011962890625, -0.44647979736328125, -0.4173583984375, -0.38823699951171875, -0.3591156005859375, -0.32999420166015625, -0.300872802734375, -0.27175140380859375, -0.2426300048828125, -0.21350860595703125, -0.18438720703125, -0.15526580810546875, -0.1261444091796875, -0.09702301025390625, -0.067901611328125, -0.03878021240234375, -0.0096588134765625, 0.01946258544921875, 0.048583984375, 0.07770538330078125, 0.1068267822265625, 0.13594818115234375, 0.165069580078125, 0.19419097900390625, 0.2233123779296875, 0.25243377685546875, 0.28155517578125, 0.31067657470703125, 0.3397979736328125, 0.36891937255859375, 0.398040771484375, 0.42716217041015625, 0.4562835693359375, 0.48540496826171875, 0.5145263671875, 0.5436477661132812, 0.5727691650390625, 0.6018905639648438, 0.631011962890625, 0.6601333618164062, 0.6892547607421875, 0.7183761596679688, 0.74749755859375, 0.7766189575195312, 0.8057403564453125, 0.8348617553710938, 0.863983154296875, 0.8931045532226562, 0.9222259521484375, 0.9513473510742188, 0.98046875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 15.0, 33.0, 59.0, 86.0, 135.0, 170.0, 168.0, 123.0, 94.0, 50.0, 29.0, 17.0, 4.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1514892578125, -0.14795207977294922, -0.14441490173339844, -0.14087772369384766, -0.13734054565429688, -0.1338033676147461, -0.1302661895751953, -0.12672901153564453, -0.12319183349609375, -0.11965465545654297, -0.11611747741699219, -0.1125802993774414, -0.10904312133789062, -0.10550594329833984, -0.10196876525878906, -0.09843158721923828, -0.0948944091796875, -0.09135723114013672, -0.08782005310058594, -0.08428287506103516, -0.08074569702148438, -0.0772085189819336, -0.07367134094238281, -0.07013416290283203, -0.06659698486328125, -0.06305980682373047, -0.05952262878417969, -0.055985450744628906, -0.052448272705078125, -0.048911094665527344, -0.04537391662597656, -0.04183673858642578, -0.038299560546875, -0.03476238250732422, -0.031225204467773438, -0.027688026428222656, -0.024150848388671875, -0.020613670349121094, -0.017076492309570312, -0.013539314270019531, -0.01000213623046875, -0.006464958190917969, -0.0029277801513671875, 0.0006093978881835938, 0.004146575927734375, 0.007683753967285156, 0.011220932006835938, 0.014758110046386719, 0.0182952880859375, 0.02183246612548828, 0.025369644165039062, 0.028906822204589844, 0.032444000244140625, 0.035981178283691406, 0.03951835632324219, 0.04305553436279297, 0.04659271240234375, 0.05012989044189453, 0.05366706848144531, 0.057204246520996094, 0.060741424560546875, 0.06427860260009766, 0.06781578063964844, 0.07135295867919922, 0.07489013671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 8.0, 9.0, 6.0, 17.0, 24.0, 26.0, 47.0, 104.0, 133.0, 298.0, 565.0, 1241.0, 2956.0, 8764.0, 32968.0, 167339.0, 540429.0, 232255.0, 44288.0, 10920.0, 3502.0, 1314.0, 649.0, 282.0, 145.0, 105.0, 52.0, 42.0, 24.0, 17.0, 9.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.383544921875, -0.3696479797363281, -0.35575103759765625, -0.3418540954589844, -0.3279571533203125, -0.3140602111816406, -0.30016326904296875, -0.2862663269042969, -0.272369384765625, -0.2584724426269531, -0.24457550048828125, -0.23067855834960938, -0.2167816162109375, -0.20288467407226562, -0.18898773193359375, -0.17509078979492188, -0.16119384765625, -0.14729690551757812, -0.13339996337890625, -0.11950302124023438, -0.1056060791015625, -0.09170913696289062, -0.07781219482421875, -0.06391525268554688, -0.050018310546875, -0.036121368408203125, -0.02222442626953125, -0.008327484130859375, 0.0055694580078125, 0.019466400146484375, 0.03336334228515625, 0.047260284423828125, 0.0611572265625, 0.07505416870117188, 0.08895111083984375, 0.10284805297851562, 0.1167449951171875, 0.13064193725585938, 0.14453887939453125, 0.15843582153320312, 0.172332763671875, 0.18622970581054688, 0.20012664794921875, 0.21402359008789062, 0.2279205322265625, 0.24181747436523438, 0.25571441650390625, 0.2696113586425781, 0.28350830078125, 0.2974052429199219, 0.31130218505859375, 0.3251991271972656, 0.3390960693359375, 0.3529930114746094, 0.36688995361328125, 0.3807868957519531, 0.394683837890625, 0.4085807800292969, 0.42247772216796875, 0.4363746643066406, 0.4502716064453125, 0.4641685485839844, 0.47806549072265625, 0.4919624328613281, 0.505859375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 1.0, 13.0, 9.0, 15.0, 15.0, 13.0, 18.0, 22.0, 26.0, 41.0, 35.0, 33.0, 62.0, 53.0, 59.0, 56.0, 70.0, 55.0, 59.0, 50.0, 43.0, 41.0, 42.0, 30.0, 22.0, 24.0, 16.0, 11.0, 16.0, 8.0, 7.0, 6.0, 7.0, 5.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.28955078125, -0.2805938720703125, -0.271636962890625, -0.2626800537109375, -0.25372314453125, -0.2447662353515625, -0.235809326171875, -0.2268524169921875, -0.2178955078125, -0.2089385986328125, -0.199981689453125, -0.1910247802734375, -0.18206787109375, -0.1731109619140625, -0.164154052734375, -0.1551971435546875, -0.146240234375, -0.1372833251953125, -0.128326416015625, -0.1193695068359375, -0.11041259765625, -0.1014556884765625, -0.092498779296875, -0.0835418701171875, -0.0745849609375, -0.0656280517578125, -0.056671142578125, -0.0477142333984375, -0.03875732421875, -0.0298004150390625, -0.020843505859375, -0.0118865966796875, -0.0029296875, 0.0060272216796875, 0.014984130859375, 0.0239410400390625, 0.03289794921875, 0.0418548583984375, 0.050811767578125, 0.0597686767578125, 0.0687255859375, 0.0776824951171875, 0.086639404296875, 0.0955963134765625, 0.10455322265625, 0.1135101318359375, 0.122467041015625, 0.1314239501953125, 0.140380859375, 0.1493377685546875, 0.158294677734375, 0.1672515869140625, 0.17620849609375, 0.1851654052734375, 0.194122314453125, 0.2030792236328125, 0.2120361328125, 0.2209930419921875, 0.229949951171875, 0.2389068603515625, 0.24786376953125, 0.2568206787109375, 0.265777587890625, 0.2747344970703125, 0.28369140625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 7.0, 10.0, 25.0, 37.0, 85.0, 236.0, 831.0, 9831.0, 1014510.0, 21395.0, 1127.0, 287.0, 98.0, 37.0, 15.0, 15.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.806640625, -1.7686767578125, -1.730712890625, -1.6927490234375, -1.65478515625, -1.6168212890625, -1.578857421875, -1.5408935546875, -1.5029296875, -1.4649658203125, -1.427001953125, -1.3890380859375, -1.35107421875, -1.3131103515625, -1.275146484375, -1.2371826171875, -1.19921875, -1.1612548828125, -1.123291015625, -1.0853271484375, -1.04736328125, -1.0093994140625, -0.971435546875, -0.9334716796875, -0.8955078125, -0.8575439453125, -0.819580078125, -0.7816162109375, -0.74365234375, -0.7056884765625, -0.667724609375, -0.6297607421875, -0.591796875, -0.5538330078125, -0.515869140625, -0.4779052734375, -0.43994140625, -0.4019775390625, -0.364013671875, -0.3260498046875, -0.2880859375, -0.2501220703125, -0.212158203125, -0.1741943359375, -0.13623046875, -0.0982666015625, -0.060302734375, -0.0223388671875, 0.015625, 0.0535888671875, 0.091552734375, 0.1295166015625, 0.16748046875, 0.2054443359375, 0.243408203125, 0.2813720703125, 0.3193359375, 0.3572998046875, 0.395263671875, 0.4332275390625, 0.47119140625, 0.5091552734375, 0.547119140625, 0.5850830078125, 0.623046875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 12.0, 11.0, 16.0, 21.0, 19.0, 34.0, 36.0, 52.0, 49.0, 54.0, 111.0, 106.0, 95.0, 78.0, 50.0, 36.0, 39.0, 30.0, 23.0, 21.0, 15.0, 15.0, 8.0, 7.0, 9.0, 6.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0001590251922607422, -0.00015250593423843384, -0.0001459866762161255, -0.00013946741819381714, -0.0001329481601715088, -0.00012642890214920044, -0.00011990964412689209, -0.00011339038610458374, -0.00010687112808227539, -0.00010035187005996704, -9.383261203765869e-05, -8.731335401535034e-05, -8.079409599304199e-05, -7.427483797073364e-05, -6.775557994842529e-05, -6.123632192611694e-05, -5.4717063903808594e-05, -4.8197805881500244e-05, -4.1678547859191895e-05, -3.5159289836883545e-05, -2.8640031814575195e-05, -2.2120773792266846e-05, -1.5601515769958496e-05, -9.082257747650146e-06, -2.562999725341797e-06, 3.956258296966553e-06, 1.0475516319274902e-05, 1.6994774341583252e-05, 2.35140323638916e-05, 3.003329038619995e-05, 3.65525484085083e-05, 4.307180643081665e-05, 4.9591064453125e-05, 5.611032247543335e-05, 6.26295804977417e-05, 6.914883852005005e-05, 7.56680965423584e-05, 8.218735456466675e-05, 8.87066125869751e-05, 9.522587060928345e-05, 0.0001017451286315918, 0.00010826438665390015, 0.0001147836446762085, 0.00012130290269851685, 0.0001278221607208252, 0.00013434141874313354, 0.0001408606767654419, 0.00014737993478775024, 0.0001538991928100586, 0.00016041845083236694, 0.0001669377088546753, 0.00017345696687698364, 0.000179976224899292, 0.00018649548292160034, 0.0001930147409439087, 0.00019953399896621704, 0.0002060532569885254, 0.00021257251501083374, 0.0002190917730331421, 0.00022561103105545044, 0.0002321302890777588, 0.00023864954710006714, 0.0002451688051223755, 0.00025168806314468384, 0.0002582073211669922]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 1.0, 4.0, 7.0, 7.0, 8.0, 14.0, 20.0, 32.0, 41.0, 83.0, 144.0, 291.0, 483.0, 1059.0, 2661.0, 8984.0, 58934.0, 811759.0, 143278.0, 14271.0, 3712.0, 1399.0, 588.0, 329.0, 171.0, 91.0, 58.0, 37.0, 33.0, 16.0, 8.0, 9.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.396728515625, -0.38457489013671875, -0.3724212646484375, -0.36026763916015625, -0.348114013671875, -0.33596038818359375, -0.3238067626953125, -0.31165313720703125, -0.29949951171875, -0.28734588623046875, -0.2751922607421875, -0.26303863525390625, -0.250885009765625, -0.23873138427734375, -0.2265777587890625, -0.21442413330078125, -0.2022705078125, -0.19011688232421875, -0.1779632568359375, -0.16580963134765625, -0.153656005859375, -0.14150238037109375, -0.1293487548828125, -0.11719512939453125, -0.10504150390625, -0.09288787841796875, -0.0807342529296875, -0.06858062744140625, -0.056427001953125, -0.04427337646484375, -0.0321197509765625, -0.01996612548828125, -0.0078125, 0.00434112548828125, 0.0164947509765625, 0.02864837646484375, 0.040802001953125, 0.05295562744140625, 0.0651092529296875, 0.07726287841796875, 0.08941650390625, 0.10157012939453125, 0.1137237548828125, 0.12587738037109375, 0.138031005859375, 0.15018463134765625, 0.1623382568359375, 0.17449188232421875, 0.1866455078125, 0.19879913330078125, 0.2109527587890625, 0.22310638427734375, 0.235260009765625, 0.24741363525390625, 0.2595672607421875, 0.27172088623046875, 0.28387451171875, 0.29602813720703125, 0.3081817626953125, 0.32033538818359375, 0.332489013671875, 0.34464263916015625, 0.3567962646484375, 0.36894989013671875, 0.381103515625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 13.0, 17.0, 45.0, 65.0, 95.0, 133.0, 166.0, 159.0, 118.0, 60.0, 60.0, 16.0, 11.0, 12.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2080078125, -0.20122528076171875, -0.1944427490234375, -0.18766021728515625, -0.180877685546875, -0.17409515380859375, -0.1673126220703125, -0.16053009033203125, -0.15374755859375, -0.14696502685546875, -0.1401824951171875, -0.13339996337890625, -0.126617431640625, -0.11983489990234375, -0.1130523681640625, -0.10626983642578125, -0.0994873046875, -0.09270477294921875, -0.0859222412109375, -0.07913970947265625, -0.072357177734375, -0.06557464599609375, -0.0587921142578125, -0.05200958251953125, -0.04522705078125, -0.03844451904296875, -0.0316619873046875, -0.02487945556640625, -0.018096923828125, -0.01131439208984375, -0.0045318603515625, 0.00225067138671875, 0.009033203125, 0.01581573486328125, 0.0225982666015625, 0.02938079833984375, 0.036163330078125, 0.04294586181640625, 0.0497283935546875, 0.05651092529296875, 0.06329345703125, 0.07007598876953125, 0.0768585205078125, 0.08364105224609375, 0.090423583984375, 0.09720611572265625, 0.1039886474609375, 0.11077117919921875, 0.1175537109375, 0.12433624267578125, 0.1311187744140625, 0.13790130615234375, 0.144683837890625, 0.15146636962890625, 0.1582489013671875, 0.16503143310546875, 0.17181396484375, 0.17859649658203125, 0.1853790283203125, 0.19216156005859375, 0.198944091796875, 0.20572662353515625, 0.2125091552734375, 0.21929168701171875, 0.22607421875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 10.0, 25.0, 118.0, 405.0, 347.0, 80.0, 20.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.435122489929199, -7.201960563659668, -6.968798637390137, -6.7356367111206055, -6.502474784851074, -6.269312858581543, -6.03615140914917, -5.802989482879639, -5.569827556610107, -5.336665630340576, -5.103503704071045, -4.870341777801514, -4.637180328369141, -4.404018402099609, -4.170856475830078, -3.937694549560547, -3.7045326232910156, -3.4713706970214844, -3.238208770751953, -3.005047082901001, -2.7718851566314697, -2.5387232303619385, -2.3055615425109863, -2.072399616241455, -1.8392376899719238, -1.6060757637023926, -1.3729139566421509, -1.1397521495819092, -0.9065902233123779, -0.6734282970428467, -0.440266489982605, -0.20710468292236328, 0.02605724334716797, 0.25921911001205444, 0.4923809766769409, 0.7255428433418274, 0.9587047100067139, 1.1918666362762451, 1.4250284433364868, 1.6581902503967285, 1.8913521766662598, 2.124514102935791, 2.3576760292053223, 2.5908377170562744, 2.8239996433258057, 3.057161569595337, 3.290323257446289, 3.5234851837158203, 3.7566471099853516, 3.989809036254883, 4.222970962524414, 4.456132888793945, 4.689294815063477, 4.922456741333008, 5.155618190765381, 5.388780117034912, 5.621942043304443, 5.855103969573975, 6.088265895843506, 6.321427822113037, 6.55458927154541, 6.787751197814941, 7.020913124084473, 7.254075050354004, 7.487236976623535]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 6.0, 6.0, 5.0, 14.0, 11.0, 19.0, 32.0, 18.0, 32.0, 30.0, 40.0, 42.0, 41.0, 40.0, 52.0, 52.0, 41.0, 38.0, 58.0, 57.0, 39.0, 39.0, 50.0, 37.0, 27.0, 31.0, 21.0, 22.0, 23.0, 18.0, 9.0, 5.0, 8.0, 7.0, 5.0, 3.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7985286712646484, -1.7434810400009155, -1.6884334087371826, -1.6333857774734497, -1.5783381462097168, -1.5232905149459839, -1.468242883682251, -1.413195252418518, -1.3581476211547852, -1.3030999898910522, -1.2480523586273193, -1.1930047273635864, -1.1379570960998535, -1.0829094648361206, -1.0278618335723877, -0.9728142023086548, -0.9177665710449219, -0.862718939781189, -0.807671308517456, -0.7526236772537231, -0.6975760459899902, -0.6425284147262573, -0.5874807834625244, -0.5324331521987915, -0.4773855209350586, -0.4223378896713257, -0.3672902584075928, -0.31224262714385986, -0.25719499588012695, -0.20214736461639404, -0.14709973335266113, -0.09205210208892822, -0.03700447082519531, 0.018043160438537598, 0.07309079170227051, 0.12813842296600342, 0.18318605422973633, 0.23823368549346924, 0.29328131675720215, 0.34832894802093506, 0.40337657928466797, 0.4584242105484009, 0.5134718418121338, 0.5685194730758667, 0.6235671043395996, 0.6786147356033325, 0.7336623668670654, 0.7887099981307983, 0.8437576293945312, 0.8988052606582642, 0.9538528919219971, 1.00890052318573, 1.063948154449463, 1.1189957857131958, 1.1740434169769287, 1.2290910482406616, 1.2841386795043945, 1.3391863107681274, 1.3942339420318604, 1.4492815732955933, 1.5043292045593262, 1.559376835823059, 1.614424467086792, 1.669472098350525, 1.7245197296142578]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 11.0, 9.0, 16.0, 16.0, 40.0, 73.0, 120.0, 224.0, 517.0, 1668.0, 13157.0, 3902830.0, 268165.0, 5975.0, 954.0, 264.0, 112.0, 69.0, 30.0, 12.0, 7.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.10546875, -2.0498504638671875, -1.994232177734375, -1.9386138916015625, -1.88299560546875, -1.8273773193359375, -1.771759033203125, -1.7161407470703125, -1.6605224609375, -1.6049041748046875, -1.549285888671875, -1.4936676025390625, -1.43804931640625, -1.3824310302734375, -1.326812744140625, -1.2711944580078125, -1.215576171875, -1.1599578857421875, -1.104339599609375, -1.0487213134765625, -0.99310302734375, -0.9374847412109375, -0.881866455078125, -0.8262481689453125, -0.7706298828125, -0.7150115966796875, -0.659393310546875, -0.6037750244140625, -0.54815673828125, -0.4925384521484375, -0.436920166015625, -0.3813018798828125, -0.32568359375, -0.2700653076171875, -0.214447021484375, -0.1588287353515625, -0.10321044921875, -0.0475921630859375, 0.008026123046875, 0.0636444091796875, 0.1192626953125, 0.1748809814453125, 0.230499267578125, 0.2861175537109375, 0.34173583984375, 0.3973541259765625, 0.452972412109375, 0.5085906982421875, 0.564208984375, 0.6198272705078125, 0.675445556640625, 0.7310638427734375, 0.78668212890625, 0.8423004150390625, 0.897918701171875, 0.9535369873046875, 1.0091552734375, 1.0647735595703125, 1.120391845703125, 1.1760101318359375, 1.23162841796875, 1.2872467041015625, 1.342864990234375, 1.3984832763671875, 1.4541015625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 11.0, 17.0, 26.0, 56.0, 55.0, 102.0, 119.0, 156.0, 113.0, 111.0, 93.0, 62.0, 31.0, 20.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.161376953125, -0.15759658813476562, -0.15381622314453125, -0.15003585815429688, -0.1462554931640625, -0.14247512817382812, -0.13869476318359375, -0.13491439819335938, -0.131134033203125, -0.12735366821289062, -0.12357330322265625, -0.11979293823242188, -0.1160125732421875, -0.11223220825195312, -0.10845184326171875, -0.10467147827148438, -0.10089111328125, -0.09711074829101562, -0.09333038330078125, -0.08955001831054688, -0.0857696533203125, -0.08198928833007812, -0.07820892333984375, -0.07442855834960938, -0.070648193359375, -0.06686782836914062, -0.06308746337890625, -0.059307098388671875, -0.0555267333984375, -0.051746368408203125, -0.04796600341796875, -0.044185638427734375, -0.0404052734375, -0.036624908447265625, -0.03284454345703125, -0.029064178466796875, -0.0252838134765625, -0.021503448486328125, -0.01772308349609375, -0.013942718505859375, -0.010162353515625, -0.006381988525390625, -0.00260162353515625, 0.001178741455078125, 0.0049591064453125, 0.008739471435546875, 0.01251983642578125, 0.016300201416015625, 0.02008056640625, 0.023860931396484375, 0.02764129638671875, 0.031421661376953125, 0.0352020263671875, 0.038982391357421875, 0.04276275634765625, 0.046543121337890625, 0.050323486328125, 0.054103851318359375, 0.05788421630859375, 0.061664581298828125, 0.0654449462890625, 0.06922531127929688, 0.07300567626953125, 0.07678604125976562, 0.08056640625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 11.0, 20.0, 30.0, 64.0, 91.0, 234.0, 512.0, 1347.0, 6510.0, 227596.0, 3935048.0, 19224.0, 2310.0, 706.0, 287.0, 154.0, 75.0, 19.0, 20.0, 7.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.47265625, -1.434112548828125, -1.39556884765625, -1.357025146484375, -1.3184814453125, -1.279937744140625, -1.24139404296875, -1.202850341796875, -1.164306640625, -1.125762939453125, -1.08721923828125, -1.048675537109375, -1.0101318359375, -0.971588134765625, -0.93304443359375, -0.894500732421875, -0.85595703125, -0.817413330078125, -0.77886962890625, -0.740325927734375, -0.7017822265625, -0.663238525390625, -0.62469482421875, -0.586151123046875, -0.547607421875, -0.509063720703125, -0.47052001953125, -0.431976318359375, -0.3934326171875, -0.354888916015625, -0.31634521484375, -0.277801513671875, -0.2392578125, -0.200714111328125, -0.16217041015625, -0.123626708984375, -0.0850830078125, -0.046539306640625, -0.00799560546875, 0.030548095703125, 0.069091796875, 0.107635498046875, 0.14617919921875, 0.184722900390625, 0.2232666015625, 0.261810302734375, 0.30035400390625, 0.338897705078125, 0.37744140625, 0.415985107421875, 0.45452880859375, 0.493072509765625, 0.5316162109375, 0.570159912109375, 0.60870361328125, 0.647247314453125, 0.685791015625, 0.724334716796875, 0.76287841796875, 0.801422119140625, 0.8399658203125, 0.878509521484375, 0.91705322265625, 0.955596923828125, 0.994140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 8.0, 9.0, 14.0, 35.0, 63.0, 126.0, 298.0, 1186.0, 1692.0, 378.0, 124.0, 64.0, 23.0, 15.0, 10.0, 14.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.12624359130859375, -0.1207733154296875, -0.11530303955078125, -0.109832763671875, -0.10436248779296875, -0.0988922119140625, -0.09342193603515625, -0.08795166015625, -0.08248138427734375, -0.0770111083984375, -0.07154083251953125, -0.066070556640625, -0.06060028076171875, -0.0551300048828125, -0.04965972900390625, -0.044189453125, -0.03871917724609375, -0.0332489013671875, -0.02777862548828125, -0.022308349609375, -0.01683807373046875, -0.0113677978515625, -0.00589752197265625, -0.00042724609375, 0.00504302978515625, 0.0105133056640625, 0.01598358154296875, 0.021453857421875, 0.02692413330078125, 0.0323944091796875, 0.03786468505859375, 0.0433349609375, 0.04880523681640625, 0.0542755126953125, 0.05974578857421875, 0.065216064453125, 0.07068634033203125, 0.0761566162109375, 0.08162689208984375, 0.08709716796875, 0.09256744384765625, 0.0980377197265625, 0.10350799560546875, 0.108978271484375, 0.11444854736328125, 0.1199188232421875, 0.12538909912109375, 0.130859375, 0.13632965087890625, 0.1417999267578125, 0.14727020263671875, 0.152740478515625, 0.15821075439453125, 0.1636810302734375, 0.16915130615234375, 0.17462158203125, 0.18009185791015625, 0.1855621337890625, 0.19103240966796875, 0.196502685546875, 0.20197296142578125, 0.2074432373046875, 0.21291351318359375, 0.2183837890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 13.0, 31.0, 68.0, 205.0, 299.0, 230.0, 96.0, 27.0, 18.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7590133547782898, -0.7180695533752441, -0.6771257519721985, -0.6361819505691528, -0.595238208770752, -0.5542943477630615, -0.5133506059646606, -0.472406804561615, -0.43146300315856934, -0.3905192017555237, -0.349575400352478, -0.30863162875175476, -0.2676878273487091, -0.22674402594566345, -0.185800239443779, -0.14485645294189453, -0.10391265153884888, -0.06296885758638382, -0.022025063633918762, 0.018918730318546295, 0.05986252427101135, 0.100806325674057, 0.14175011217594147, 0.18269389867782593, 0.22363770008087158, 0.26458150148391724, 0.3055253028869629, 0.34646907448768616, 0.3874128758907318, 0.42835667729377747, 0.46930044889450073, 0.5102442502975464, 0.5511879920959473, 0.5921317934989929, 0.6330755949020386, 0.6740193963050842, 0.7149631977081299, 0.7559069395065308, 0.7968507409095764, 0.8377945423126221, 0.8787383437156677, 0.9196821451187134, 0.960625946521759, 1.0015697479248047, 1.0425134897232056, 1.083457350730896, 1.1244010925292969, 1.1653449535369873, 1.2062886953353882, 1.247232437133789, 1.2881762981414795, 1.3291200399398804, 1.3700639009475708, 1.4110076427459717, 1.451951503753662, 1.492895245552063, 1.5338389873504639, 1.5747827291488647, 1.6157265901565552, 1.656670331954956, 1.6976141929626465, 1.7385579347610474, 1.7795017957687378, 1.8204455375671387, 1.861389398574829]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 11.0, 10.0, 12.0, 18.0, 22.0, 30.0, 49.0, 42.0, 54.0, 71.0, 64.0, 64.0, 73.0, 85.0, 73.0, 59.0, 58.0, 50.0, 35.0, 27.0, 30.0, 18.0, 13.0, 12.0, 8.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.666449248790741, -0.6496491432189941, -0.6328489780426025, -0.6160488724708557, -0.5992487668991089, -0.5824486613273621, -0.5656485557556152, -0.5488483905792236, -0.5320482850074768, -0.51524817943573, -0.49844804406166077, -0.48164790868759155, -0.4648478031158447, -0.4480476975440979, -0.4312475621700287, -0.4144474267959595, -0.39764732122421265, -0.3808472156524658, -0.3640470802783966, -0.3472469449043274, -0.33044683933258057, -0.31364673376083374, -0.2968465983867645, -0.2800464630126953, -0.2632463574409485, -0.24644623696804047, -0.22964611649513245, -0.21284599602222443, -0.1960458755493164, -0.1792457550764084, -0.16244563460350037, -0.14564551413059235, -0.12884539365768433, -0.1120452731847763, -0.09524515271186829, -0.07844503223896027, -0.061644911766052246, -0.044844791293144226, -0.028044670820236206, -0.011244550347328186, 0.005555570125579834, 0.022355690598487854, 0.039155811071395874, 0.055955931544303894, 0.07275605201721191, 0.08955617249011993, 0.10635629296302795, 0.12315641343593597, 0.139956533908844, 0.15675665438175201, 0.17355677485466003, 0.19035689532756805, 0.20715701580047607, 0.2239571362733841, 0.24075725674629211, 0.25755739212036133, 0.27435749769210815, 0.291157603263855, 0.3079577386379242, 0.3247578740119934, 0.34155797958374023, 0.35835808515548706, 0.3751582205295563, 0.3919583559036255, 0.4087584614753723]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 6.0, 9.0, 14.0, 15.0, 12.0, 29.0, 30.0, 45.0, 61.0, 98.0, 159.0, 210.0, 343.0, 632.0, 1043.0, 1930.0, 3901.0, 10547.0, 40247.0, 199709.0, 520126.0, 208035.0, 41827.0, 10891.0, 3980.0, 1907.0, 993.0, 620.0, 383.0, 222.0, 148.0, 115.0, 96.0, 46.0, 27.0, 25.0, 24.0, 14.0, 10.0, 11.0, 6.0, 6.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3291015625, -0.31668853759765625, -0.3042755126953125, -0.29186248779296875, -0.279449462890625, -0.26703643798828125, -0.2546234130859375, -0.24221038818359375, -0.22979736328125, -0.21738433837890625, -0.2049713134765625, -0.19255828857421875, -0.180145263671875, -0.16773223876953125, -0.1553192138671875, -0.14290618896484375, -0.1304931640625, -0.11808013916015625, -0.1056671142578125, -0.09325408935546875, -0.080841064453125, -0.06842803955078125, -0.0560150146484375, -0.04360198974609375, -0.03118896484375, -0.01877593994140625, -0.0063629150390625, 0.00605010986328125, 0.018463134765625, 0.03087615966796875, 0.0432891845703125, 0.05570220947265625, 0.068115234375, 0.08052825927734375, 0.0929412841796875, 0.10535430908203125, 0.117767333984375, 0.13018035888671875, 0.1425933837890625, 0.15500640869140625, 0.16741943359375, 0.17983245849609375, 0.1922454833984375, 0.20465850830078125, 0.217071533203125, 0.22948455810546875, 0.2418975830078125, 0.25431060791015625, 0.2667236328125, 0.27913665771484375, 0.2915496826171875, 0.30396270751953125, 0.316375732421875, 0.32878875732421875, 0.3412017822265625, 0.35361480712890625, 0.36602783203125, 0.37844085693359375, 0.3908538818359375, 0.40326690673828125, 0.415679931640625, 0.42809295654296875, 0.4405059814453125, 0.45291900634765625, 0.46533203125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 15.0, 18.0, 50.0, 53.0, 75.0, 115.0, 136.0, 128.0, 119.0, 121.0, 62.0, 49.0, 18.0, 10.0, 12.0, 6.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.16165637969970703, -0.15790748596191406, -0.1541585922241211, -0.15040969848632812, -0.14666080474853516, -0.1429119110107422, -0.13916301727294922, -0.13541412353515625, -0.13166522979736328, -0.1279163360595703, -0.12416744232177734, -0.12041854858398438, -0.1166696548461914, -0.11292076110839844, -0.10917186737060547, -0.1054229736328125, -0.10167407989501953, -0.09792518615722656, -0.0941762924194336, -0.09042739868164062, -0.08667850494384766, -0.08292961120605469, -0.07918071746826172, -0.07543182373046875, -0.07168292999267578, -0.06793403625488281, -0.06418514251708984, -0.060436248779296875, -0.056687355041503906, -0.05293846130371094, -0.04918956756591797, -0.045440673828125, -0.04169178009033203, -0.03794288635253906, -0.034193992614746094, -0.030445098876953125, -0.026696205139160156, -0.022947311401367188, -0.01919841766357422, -0.01544952392578125, -0.011700630187988281, -0.007951736450195312, -0.004202842712402344, -0.000453948974609375, 0.0032949447631835938, 0.0070438385009765625, 0.010792732238769531, 0.0145416259765625, 0.01829051971435547, 0.022039413452148438, 0.025788307189941406, 0.029537200927734375, 0.033286094665527344, 0.03703498840332031, 0.04078388214111328, 0.04453277587890625, 0.04828166961669922, 0.05203056335449219, 0.055779457092285156, 0.059528350830078125, 0.0632772445678711, 0.06702613830566406, 0.07077503204345703, 0.07452392578125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 16.0, 19.0, 17.0, 27.0, 52.0, 48.0, 108.0, 156.0, 254.0, 519.0, 828.0, 1727.0, 3266.0, 7296.0, 17375.0, 45056.0, 127405.0, 314724.0, 319485.0, 131384.0, 45941.0, 17982.0, 7663.0, 3416.0, 1681.0, 905.0, 492.0, 284.0, 145.0, 77.0, 72.0, 46.0, 29.0, 24.0, 10.0, 10.0, 7.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25732421875, -0.24902725219726562, -0.24073028564453125, -0.23243331909179688, -0.2241363525390625, -0.21583938598632812, -0.20754241943359375, -0.19924545288085938, -0.190948486328125, -0.18265151977539062, -0.17435455322265625, -0.16605758666992188, -0.1577606201171875, -0.14946365356445312, -0.14116668701171875, -0.13286972045898438, -0.12457275390625, -0.11627578735351562, -0.10797882080078125, -0.09968185424804688, -0.0913848876953125, -0.08308792114257812, -0.07479095458984375, -0.06649398803710938, -0.058197021484375, -0.049900054931640625, -0.04160308837890625, -0.033306121826171875, -0.0250091552734375, -0.016712188720703125, -0.00841522216796875, -0.000118255615234375, 0.0081787109375, 0.016475677490234375, 0.02477264404296875, 0.033069610595703125, 0.0413665771484375, 0.049663543701171875, 0.05796051025390625, 0.06625747680664062, 0.074554443359375, 0.08285140991210938, 0.09114837646484375, 0.09944534301757812, 0.1077423095703125, 0.11603927612304688, 0.12433624267578125, 0.13263320922851562, 0.14093017578125, 0.14922714233398438, 0.15752410888671875, 0.16582107543945312, 0.1741180419921875, 0.18241500854492188, 0.19071197509765625, 0.19900894165039062, 0.207305908203125, 0.21560287475585938, 0.22389984130859375, 0.23219680786132812, 0.2404937744140625, 0.24879074096679688, 0.25708770751953125, 0.2653846740722656, 0.273681640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 3.0, 6.0, 4.0, 6.0, 10.0, 12.0, 20.0, 19.0, 8.0, 29.0, 24.0, 35.0, 26.0, 28.0, 39.0, 39.0, 38.0, 50.0, 49.0, 48.0, 52.0, 45.0, 70.0, 41.0, 33.0, 41.0, 32.0, 33.0, 25.0, 22.0, 19.0, 13.0, 16.0, 15.0, 11.0, 11.0, 4.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305908203125, -0.29734039306640625, -0.2887725830078125, -0.28020477294921875, -0.271636962890625, -0.26306915283203125, -0.2545013427734375, -0.24593353271484375, -0.23736572265625, -0.22879791259765625, -0.2202301025390625, -0.21166229248046875, -0.203094482421875, -0.19452667236328125, -0.1859588623046875, -0.17739105224609375, -0.1688232421875, -0.16025543212890625, -0.1516876220703125, -0.14311981201171875, -0.134552001953125, -0.12598419189453125, -0.1174163818359375, -0.10884857177734375, -0.10028076171875, -0.09171295166015625, -0.0831451416015625, -0.07457733154296875, -0.066009521484375, -0.05744171142578125, -0.0488739013671875, -0.04030609130859375, -0.03173828125, -0.02317047119140625, -0.0146026611328125, -0.00603485107421875, 0.002532958984375, 0.01110076904296875, 0.0196685791015625, 0.02823638916015625, 0.03680419921875, 0.04537200927734375, 0.0539398193359375, 0.06250762939453125, 0.071075439453125, 0.07964324951171875, 0.0882110595703125, 0.09677886962890625, 0.1053466796875, 0.11391448974609375, 0.1224822998046875, 0.13105010986328125, 0.139617919921875, 0.14818572998046875, 0.1567535400390625, 0.16532135009765625, 0.17388916015625, 0.18245697021484375, 0.1910247802734375, 0.19959259033203125, 0.208160400390625, 0.21672821044921875, 0.2252960205078125, 0.23386383056640625, 0.242431640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 3.0, 18.0, 17.0, 15.0, 29.0, 33.0, 58.0, 81.0, 133.0, 225.0, 459.0, 883.0, 2428.0, 7986.0, 37289.0, 309848.0, 591453.0, 77626.0, 13689.0, 3507.0, 1395.0, 593.0, 299.0, 172.0, 110.0, 54.0, 44.0, 34.0, 15.0, 8.0, 14.0, 9.0, 6.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159912109375, -0.15423965454101562, -0.14856719970703125, -0.14289474487304688, -0.1372222900390625, -0.13154983520507812, -0.12587738037109375, -0.12020492553710938, -0.114532470703125, -0.10886001586914062, -0.10318756103515625, -0.09751510620117188, -0.0918426513671875, -0.08617019653320312, -0.08049774169921875, -0.07482528686523438, -0.06915283203125, -0.06348037719726562, -0.05780792236328125, -0.052135467529296875, -0.0464630126953125, -0.040790557861328125, -0.03511810302734375, -0.029445648193359375, -0.023773193359375, -0.018100738525390625, -0.01242828369140625, -0.006755828857421875, -0.0010833740234375, 0.004589080810546875, 0.01026153564453125, 0.015933990478515625, 0.0216064453125, 0.027278900146484375, 0.03295135498046875, 0.038623809814453125, 0.0442962646484375, 0.049968719482421875, 0.05564117431640625, 0.061313629150390625, 0.066986083984375, 0.07265853881835938, 0.07833099365234375, 0.08400344848632812, 0.0896759033203125, 0.09534835815429688, 0.10102081298828125, 0.10669326782226562, 0.11236572265625, 0.11803817749023438, 0.12371063232421875, 0.12938308715820312, 0.1350555419921875, 0.14072799682617188, 0.14640045166015625, 0.15207290649414062, 0.157745361328125, 0.16341781616210938, 0.16909027099609375, 0.17476272583007812, 0.1804351806640625, 0.18610763549804688, 0.19178009033203125, 0.19745254516601562, 0.203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 0.0, 6.0, 4.0, 7.0, 8.0, 15.0, 16.0, 15.0, 28.0, 48.0, 67.0, 64.0, 126.0, 160.0, 137.0, 65.0, 63.0, 44.0, 38.0, 33.0, 15.0, 10.0, 8.0, 7.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024056434631347656, -0.00023270398378372192, -0.00022484362125396729, -0.00021698325872421265, -0.000209122896194458, -0.00020126253366470337, -0.00019340217113494873, -0.0001855418086051941, -0.00017768144607543945, -0.00016982108354568481, -0.00016196072101593018, -0.00015410035848617554, -0.0001462399959564209, -0.00013837963342666626, -0.00013051927089691162, -0.00012265890836715698, -0.00011479854583740234, -0.0001069381833076477, -9.907782077789307e-05, -9.121745824813843e-05, -8.335709571838379e-05, -7.549673318862915e-05, -6.763637065887451e-05, -5.977600812911987e-05, -5.1915645599365234e-05, -4.4055283069610596e-05, -3.619492053985596e-05, -2.833455801010132e-05, -2.047419548034668e-05, -1.2613832950592041e-05, -4.753470420837402e-06, 3.1068921089172363e-06, 1.0967254638671875e-05, 1.8827617168426514e-05, 2.6687979698181152e-05, 3.454834222793579e-05, 4.240870475769043e-05, 5.026906728744507e-05, 5.812942981719971e-05, 6.598979234695435e-05, 7.385015487670898e-05, 8.171051740646362e-05, 8.957087993621826e-05, 9.74312424659729e-05, 0.00010529160499572754, 0.00011315196752548218, 0.00012101233005523682, 0.00012887269258499146, 0.0001367330551147461, 0.00014459341764450073, 0.00015245378017425537, 0.00016031414270401, 0.00016817450523376465, 0.0001760348677635193, 0.00018389523029327393, 0.00019175559282302856, 0.0001996159553527832, 0.00020747631788253784, 0.00021533668041229248, 0.00022319704294204712, 0.00023105740547180176, 0.0002389177680015564, 0.00024677813053131104, 0.0002546384930610657, 0.0002624988555908203]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 9.0, 12.0, 19.0, 25.0, 32.0, 56.0, 92.0, 172.0, 327.0, 634.0, 1472.0, 4094.0, 13976.0, 65347.0, 488514.0, 402532.0, 53065.0, 11907.0, 3594.0, 1316.0, 621.0, 321.0, 172.0, 79.0, 58.0, 40.0, 25.0, 17.0, 10.0, 4.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.19580078125, -0.19019699096679688, -0.18459320068359375, -0.17898941040039062, -0.1733856201171875, -0.16778182983398438, -0.16217803955078125, -0.15657424926757812, -0.150970458984375, -0.14536666870117188, -0.13976287841796875, -0.13415908813476562, -0.1285552978515625, -0.12295150756835938, -0.11734771728515625, -0.11174392700195312, -0.10614013671875, -0.10053634643554688, -0.09493255615234375, -0.08932876586914062, -0.0837249755859375, -0.07812118530273438, -0.07251739501953125, -0.06691360473632812, -0.061309814453125, -0.055706024169921875, -0.05010223388671875, -0.044498443603515625, -0.0388946533203125, -0.033290863037109375, -0.02768707275390625, -0.022083282470703125, -0.0164794921875, -0.010875701904296875, -0.00527191162109375, 0.000331878662109375, 0.0059356689453125, 0.011539459228515625, 0.01714324951171875, 0.022747039794921875, 0.028350830078125, 0.033954620361328125, 0.03955841064453125, 0.045162200927734375, 0.0507659912109375, 0.056369781494140625, 0.06197357177734375, 0.06757736206054688, 0.07318115234375, 0.07878494262695312, 0.08438873291015625, 0.08999252319335938, 0.0955963134765625, 0.10120010375976562, 0.10680389404296875, 0.11240768432617188, 0.118011474609375, 0.12361526489257812, 0.12921905517578125, 0.13482284545898438, 0.1404266357421875, 0.14603042602539062, 0.15163421630859375, 0.15723800659179688, 0.162841796875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 2.0, 2.0, 3.0, 6.0, 9.0, 15.0, 16.0, 21.0, 44.0, 56.0, 83.0, 111.0, 131.0, 139.0, 95.0, 85.0, 45.0, 36.0, 24.0, 22.0, 22.0, 10.0, 6.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.17431640625, -0.169464111328125, -0.16461181640625, -0.159759521484375, -0.1549072265625, -0.150054931640625, -0.14520263671875, -0.140350341796875, -0.135498046875, -0.130645751953125, -0.12579345703125, -0.120941162109375, -0.1160888671875, -0.111236572265625, -0.10638427734375, -0.101531982421875, -0.0966796875, -0.091827392578125, -0.08697509765625, -0.082122802734375, -0.0772705078125, -0.072418212890625, -0.06756591796875, -0.062713623046875, -0.057861328125, -0.053009033203125, -0.04815673828125, -0.043304443359375, -0.0384521484375, -0.033599853515625, -0.02874755859375, -0.023895263671875, -0.01904296875, -0.014190673828125, -0.00933837890625, -0.004486083984375, 0.0003662109375, 0.005218505859375, 0.01007080078125, 0.014923095703125, 0.019775390625, 0.024627685546875, 0.02947998046875, 0.034332275390625, 0.0391845703125, 0.044036865234375, 0.04888916015625, 0.053741455078125, 0.05859375, 0.063446044921875, 0.06829833984375, 0.073150634765625, 0.0780029296875, 0.082855224609375, 0.08770751953125, 0.092559814453125, 0.097412109375, 0.102264404296875, 0.10711669921875, 0.111968994140625, 0.1168212890625, 0.121673583984375, 0.12652587890625, 0.131378173828125, 0.13623046875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 18.0, 42.0, 61.0, 112.0, 171.0, 207.0, 161.0, 92.0, 56.0, 25.0, 17.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.602572202682495, -2.5162413120269775, -2.429910659790039, -2.3435797691345215, -2.257249116897583, -2.1709182262420654, -2.084587574005127, -1.9982566833496094, -1.9119259119033813, -1.8255951404571533, -1.7392643690109253, -1.6529335975646973, -1.5666027069091797, -1.4802720546722412, -1.3939411640167236, -1.3076103925704956, -1.2212796211242676, -1.1349488496780396, -1.0486180782318115, -0.9622872471809387, -0.8759564757347107, -0.7896257042884827, -0.7032948732376099, -0.6169641017913818, -0.5306333303451538, -0.4443025588989258, -0.35797175765037537, -0.27164095640182495, -0.18531018495559692, -0.0989794135093689, -0.012648582458496094, 0.07368218898773193, 0.16001319885253906, 0.24634398519992828, 0.3326747715473175, 0.4190055727958679, 0.505336344242096, 0.591667115688324, 0.6779979467391968, 0.7643287181854248, 0.8506594896316528, 0.9369902610778809, 1.0233210325241089, 1.109651803970337, 1.1959826946258545, 1.282313346862793, 1.3686442375183105, 1.4549750089645386, 1.5413057804107666, 1.6276365518569946, 1.7139673233032227, 1.8002982139587402, 1.8866288661956787, 1.9729597568511963, 2.0592904090881348, 2.1456212997436523, 2.23195219039917, 2.3182830810546875, 2.404613733291626, 2.4909446239471436, 2.577275276184082, 2.6636061668395996, 2.749937057495117, 2.8362677097320557, 2.922598361968994]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 3.0, 8.0, 7.0, 6.0, 8.0, 7.0, 12.0, 25.0, 28.0, 16.0, 25.0, 29.0, 34.0, 38.0, 38.0, 41.0, 57.0, 51.0, 41.0, 53.0, 48.0, 57.0, 41.0, 44.0, 31.0, 48.0, 31.0, 23.0, 32.0, 31.0, 19.0, 16.0, 12.0, 5.0, 3.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.524464726448059, -1.4742419719696045, -1.4240190982818604, -1.3737963438034058, -1.3235735893249512, -1.2733508348464966, -1.223128080368042, -1.1729052066802979, -1.1226824522018433, -1.0724596977233887, -1.0222368240356445, -0.9720140695571899, -0.9217913150787354, -0.8715685606002808, -0.8213457465171814, -0.771122932434082, -0.7209001779556274, -0.6706774234771729, -0.6204546093940735, -0.5702317953109741, -0.5200090408325195, -0.46978625655174255, -0.4195634722709656, -0.3693406879901886, -0.3191179037094116, -0.26889511942863464, -0.21867233514785767, -0.1684495508670807, -0.11822676658630371, -0.06800398230552673, -0.017781198024749756, 0.03244158625602722, 0.08266448974609375, 0.13288727402687073, 0.1831100583076477, 0.23333284258842468, 0.28355562686920166, 0.33377841114997864, 0.3840011954307556, 0.4342239797115326, 0.48444676399230957, 0.5346695184707642, 0.5848923325538635, 0.6351151466369629, 0.6853379011154175, 0.7355606555938721, 0.7857834696769714, 0.8360062837600708, 0.8862290382385254, 0.93645179271698, 0.9866746068000793, 1.0368974208831787, 1.0871201753616333, 1.137342929840088, 1.187565803527832, 1.2377885580062866, 1.2880113124847412, 1.3382340669631958, 1.3884568214416504, 1.4386796951293945, 1.4889024496078491, 1.5391252040863037, 1.5893480777740479, 1.6395708322525024, 1.689793586730957]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 7.0, 3.0, 4.0, 11.0, 9.0, 10.0, 16.0, 30.0, 30.0, 27.0, 52.0, 95.0, 131.0, 232.0, 432.0, 936.0, 2316.0, 7901.0, 52648.0, 3848182.0, 257270.0, 17536.0, 3957.0, 1325.0, 529.0, 276.0, 140.0, 73.0, 40.0, 22.0, 16.0, 7.0, 3.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.75048828125, -0.7294845581054688, -0.7084808349609375, -0.6874771118164062, -0.666473388671875, -0.6454696655273438, -0.6244659423828125, -0.6034622192382812, -0.58245849609375, -0.5614547729492188, -0.5404510498046875, -0.5194473266601562, -0.498443603515625, -0.47743988037109375, -0.4564361572265625, -0.43543243408203125, -0.4144287109375, -0.39342498779296875, -0.3724212646484375, -0.35141754150390625, -0.330413818359375, -0.30941009521484375, -0.2884063720703125, -0.26740264892578125, -0.24639892578125, -0.22539520263671875, -0.2043914794921875, -0.18338775634765625, -0.162384033203125, -0.14138031005859375, -0.1203765869140625, -0.09937286376953125, -0.078369140625, -0.05736541748046875, -0.0363616943359375, -0.01535797119140625, 0.005645751953125, 0.02664947509765625, 0.0476531982421875, 0.06865692138671875, 0.08966064453125, 0.11066436767578125, 0.1316680908203125, 0.15267181396484375, 0.173675537109375, 0.19467926025390625, 0.2156829833984375, 0.23668670654296875, 0.2576904296875, 0.27869415283203125, 0.2996978759765625, 0.32070159912109375, 0.341705322265625, 0.36270904541015625, 0.3837127685546875, 0.40471649169921875, 0.42572021484375, 0.44672393798828125, 0.4677276611328125, 0.48873138427734375, 0.509735107421875, 0.5307388305664062, 0.5517425537109375, 0.5727462768554688, 0.59375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 9.0, 18.0, 20.0, 50.0, 44.0, 64.0, 97.0, 122.0, 133.0, 112.0, 99.0, 76.0, 53.0, 40.0, 22.0, 11.0, 7.0, 9.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1622314453125, -0.15857982635498047, -0.15492820739746094, -0.1512765884399414, -0.14762496948242188, -0.14397335052490234, -0.1403217315673828, -0.13667011260986328, -0.13301849365234375, -0.12936687469482422, -0.1257152557373047, -0.12206363677978516, -0.11841201782226562, -0.1147603988647461, -0.11110877990722656, -0.10745716094970703, -0.1038055419921875, -0.10015392303466797, -0.09650230407714844, -0.0928506851196289, -0.08919906616210938, -0.08554744720458984, -0.08189582824707031, -0.07824420928955078, -0.07459259033203125, -0.07094097137451172, -0.06728935241699219, -0.06363773345947266, -0.059986114501953125, -0.056334495544433594, -0.05268287658691406, -0.04903125762939453, -0.045379638671875, -0.04172801971435547, -0.03807640075683594, -0.034424781799316406, -0.030773162841796875, -0.027121543884277344, -0.023469924926757812, -0.01981830596923828, -0.01616668701171875, -0.012515068054199219, -0.008863449096679688, -0.005211830139160156, -0.001560211181640625, 0.0020914077758789062, 0.0057430267333984375, 0.009394645690917969, 0.0130462646484375, 0.01669788360595703, 0.020349502563476562, 0.024001121520996094, 0.027652740478515625, 0.031304359436035156, 0.03495597839355469, 0.03860759735107422, 0.04225921630859375, 0.04591083526611328, 0.04956245422363281, 0.053214073181152344, 0.056865692138671875, 0.060517311096191406, 0.06416893005371094, 0.06782054901123047, 0.07147216796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 5.0, 12.0, 13.0, 31.0, 43.0, 99.0, 205.0, 428.0, 1036.0, 4303.0, 41038.0, 3953311.0, 183020.0, 8137.0, 1642.0, 500.0, 228.0, 116.0, 47.0, 29.0, 18.0, 15.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8515625, -0.8277053833007812, -0.8038482666015625, -0.7799911499023438, -0.756134033203125, -0.7322769165039062, -0.7084197998046875, -0.6845626831054688, -0.66070556640625, -0.6368484497070312, -0.6129913330078125, -0.5891342163085938, -0.565277099609375, -0.5414199829101562, -0.5175628662109375, -0.49370574951171875, -0.4698486328125, -0.44599151611328125, -0.4221343994140625, -0.39827728271484375, -0.374420166015625, -0.35056304931640625, -0.3267059326171875, -0.30284881591796875, -0.27899169921875, -0.25513458251953125, -0.2312774658203125, -0.20742034912109375, -0.183563232421875, -0.15970611572265625, -0.1358489990234375, -0.11199188232421875, -0.088134765625, -0.06427764892578125, -0.0404205322265625, -0.01656341552734375, 0.007293701171875, 0.03115081787109375, 0.0550079345703125, 0.07886505126953125, 0.10272216796875, 0.12657928466796875, 0.1504364013671875, 0.17429351806640625, 0.198150634765625, 0.22200775146484375, 0.2458648681640625, 0.26972198486328125, 0.2935791015625, 0.31743621826171875, 0.3412933349609375, 0.36515045166015625, 0.389007568359375, 0.41286468505859375, 0.4367218017578125, 0.46057891845703125, 0.48443603515625, 0.5082931518554688, 0.5321502685546875, 0.5560073852539062, 0.579864501953125, 0.6037216186523438, 0.6275787353515625, 0.6514358520507812, 0.67529296875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 6.0, 7.0, 12.0, 24.0, 22.0, 39.0, 50.0, 55.0, 122.0, 221.0, 442.0, 1077.0, 1027.0, 407.0, 232.0, 99.0, 71.0, 49.0, 28.0, 17.0, 11.0, 8.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.09417724609375, -0.0916290283203125, -0.089080810546875, -0.0865325927734375, -0.083984375, -0.0814361572265625, -0.078887939453125, -0.0763397216796875, -0.07379150390625, -0.0712432861328125, -0.068695068359375, -0.0661468505859375, -0.0635986328125, -0.0610504150390625, -0.058502197265625, -0.0559539794921875, -0.05340576171875, -0.0508575439453125, -0.048309326171875, -0.0457611083984375, -0.043212890625, -0.0406646728515625, -0.038116455078125, -0.0355682373046875, -0.03302001953125, -0.0304718017578125, -0.027923583984375, -0.0253753662109375, -0.0228271484375, -0.0202789306640625, -0.017730712890625, -0.0151824951171875, -0.01263427734375, -0.0100860595703125, -0.007537841796875, -0.0049896240234375, -0.00244140625, 0.0001068115234375, 0.002655029296875, 0.0052032470703125, 0.00775146484375, 0.0102996826171875, 0.012847900390625, 0.0153961181640625, 0.0179443359375, 0.0204925537109375, 0.023040771484375, 0.0255889892578125, 0.02813720703125, 0.0306854248046875, 0.033233642578125, 0.0357818603515625, 0.038330078125, 0.0408782958984375, 0.043426513671875, 0.0459747314453125, 0.04852294921875, 0.0510711669921875, 0.053619384765625, 0.0561676025390625, 0.0587158203125, 0.0612640380859375, 0.063812255859375, 0.0663604736328125, 0.06890869140625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 13.0, 38.0, 66.0, 175.0, 256.0, 221.0, 130.0, 46.0, 26.0, 13.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.571729302406311, -0.5414240956306458, -0.5111188888549805, -0.4808137118816376, -0.4505085051059723, -0.420203298330307, -0.3898981213569641, -0.35959291458129883, -0.32928770780563354, -0.29898250102996826, -0.268677294254303, -0.23837211728096008, -0.2080669105052948, -0.17776170372962952, -0.14745651185512543, -0.11715131998062134, -0.08684611320495605, -0.05654091387987137, -0.026235714554786682, 0.004069484770298004, 0.03437468409538269, 0.06467989087104797, 0.09498508274555206, 0.12529027462005615, 0.15559548139572144, 0.18590068817138672, 0.2162058800458908, 0.2465110719203949, 0.2768162786960602, 0.30712148547172546, 0.33742666244506836, 0.36773186922073364, 0.3980370759963989, 0.4283422827720642, 0.4586474895477295, 0.4889526665210724, 0.5192579030990601, 0.5495630502700806, 0.5798682570457458, 0.6101734638214111, 0.6404786705970764, 0.6707838773727417, 0.701089084148407, 0.7313942909240723, 0.7616994380950928, 0.7920047044754028, 0.8223098516464233, 0.8526150584220886, 0.8829202651977539, 0.9132254719734192, 0.9435306787490845, 0.9738358855247498, 1.004141092300415, 1.0344462394714355, 1.0647515058517456, 1.0950566530227661, 1.1253619194030762, 1.1556670665740967, 1.1859723329544067, 1.2162774801254272, 1.2465827465057373, 1.2768878936767578, 1.3071931600570679, 1.3374983072280884, 1.3678034543991089]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 9.0, 4.0, 8.0, 12.0, 13.0, 12.0, 29.0, 28.0, 27.0, 27.0, 42.0, 46.0, 47.0, 56.0, 47.0, 56.0, 61.0, 63.0, 39.0, 47.0, 47.0, 46.0, 39.0, 29.0, 35.0, 34.0, 18.0, 18.0, 16.0, 11.0, 9.0, 10.0, 7.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2684744596481323, -0.2583796977996826, -0.2482849657535553, -0.23819021880626678, -0.22809547185897827, -0.21800072491168976, -0.20790597796440125, -0.19781121611595154, -0.18771648406982422, -0.1776217371225357, -0.1675269901752472, -0.15743224322795868, -0.14733749628067017, -0.13724274933338165, -0.12714800238609314, -0.11705324798822403, -0.10695849359035492, -0.0968637466430664, -0.0867689996957779, -0.07667425274848938, -0.06657950580120087, -0.056484755128622055, -0.04639000445604324, -0.03629525750875473, -0.026200510561466217, -0.016105763614177704, -0.0060110148042440414, 0.004083734005689621, 0.014178480952978134, 0.024273227900266647, 0.03436797857284546, 0.04446272552013397, 0.054557472467422485, 0.064652219414711, 0.07474696636199951, 0.08484171330928802, 0.09493646025657654, 0.10503120720386505, 0.11512596160173416, 0.12522071599960327, 0.1353154480457306, 0.1454101949930191, 0.15550494194030762, 0.16559968888759613, 0.17569443583488464, 0.18578918278217316, 0.19588392972946167, 0.20597869157791138, 0.2160734385251999, 0.2261681854724884, 0.23626293241977692, 0.24635767936706543, 0.25645244121551514, 0.26654717326164246, 0.27664193511009216, 0.2867366671562195, 0.2968314290046692, 0.3069261908531189, 0.3170209228992462, 0.3271156847476959, 0.33721041679382324, 0.34730517864227295, 0.35739991068840027, 0.36749467253685, 0.3775894045829773]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 9.0, 9.0, 19.0, 19.0, 28.0, 40.0, 59.0, 121.0, 203.0, 335.0, 584.0, 1075.0, 2136.0, 4981.0, 17027.0, 96249.0, 494325.0, 355162.0, 56831.0, 11720.0, 3924.0, 1733.0, 921.0, 422.0, 239.0, 142.0, 82.0, 59.0, 39.0, 25.0, 10.0, 6.0, 7.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3896484375, -0.37458038330078125, -0.3595123291015625, -0.34444427490234375, -0.329376220703125, -0.31430816650390625, -0.2992401123046875, -0.28417205810546875, -0.26910400390625, -0.25403594970703125, -0.2389678955078125, -0.22389984130859375, -0.208831787109375, -0.19376373291015625, -0.1786956787109375, -0.16362762451171875, -0.1485595703125, -0.13349151611328125, -0.1184234619140625, -0.10335540771484375, -0.088287353515625, -0.07321929931640625, -0.0581512451171875, -0.04308319091796875, -0.02801513671875, -0.01294708251953125, 0.0021209716796875, 0.01718902587890625, 0.032257080078125, 0.04732513427734375, 0.0623931884765625, 0.07746124267578125, 0.092529296875, 0.10759735107421875, 0.1226654052734375, 0.13773345947265625, 0.152801513671875, 0.16786956787109375, 0.1829376220703125, 0.19800567626953125, 0.21307373046875, 0.22814178466796875, 0.2432098388671875, 0.25827789306640625, 0.273345947265625, 0.28841400146484375, 0.3034820556640625, 0.31855010986328125, 0.3336181640625, 0.34868621826171875, 0.3637542724609375, 0.37882232666015625, 0.393890380859375, 0.40895843505859375, 0.4240264892578125, 0.43909454345703125, 0.45416259765625, 0.46923065185546875, 0.4842987060546875, 0.49936676025390625, 0.514434814453125, 0.5295028686523438, 0.5445709228515625, 0.5596389770507812, 0.57470703125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 14.0, 10.0, 24.0, 40.0, 56.0, 54.0, 99.0, 112.0, 138.0, 119.0, 103.0, 74.0, 56.0, 42.0, 23.0, 7.0, 10.0, 9.0, 6.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1612548828125, -0.15755748748779297, -0.15386009216308594, -0.1501626968383789, -0.14646530151367188, -0.14276790618896484, -0.1390705108642578, -0.13537311553955078, -0.13167572021484375, -0.12797832489013672, -0.12428092956542969, -0.12058353424072266, -0.11688613891601562, -0.1131887435913086, -0.10949134826660156, -0.10579395294189453, -0.1020965576171875, -0.09839916229248047, -0.09470176696777344, -0.0910043716430664, -0.08730697631835938, -0.08360958099365234, -0.07991218566894531, -0.07621479034423828, -0.07251739501953125, -0.06881999969482422, -0.06512260437011719, -0.061425209045410156, -0.057727813720703125, -0.054030418395996094, -0.05033302307128906, -0.04663562774658203, -0.042938232421875, -0.03924083709716797, -0.03554344177246094, -0.031846046447753906, -0.028148651123046875, -0.024451255798339844, -0.020753860473632812, -0.01705646514892578, -0.01335906982421875, -0.009661674499511719, -0.0059642791748046875, -0.0022668838500976562, 0.001430511474609375, 0.005127906799316406, 0.008825302124023438, 0.012522697448730469, 0.0162200927734375, 0.01991748809814453, 0.023614883422851562, 0.027312278747558594, 0.031009674072265625, 0.034707069396972656, 0.03840446472167969, 0.04210186004638672, 0.04579925537109375, 0.04949665069580078, 0.05319404602050781, 0.056891441345214844, 0.060588836669921875, 0.0642862319946289, 0.06798362731933594, 0.07168102264404297, 0.07537841796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 4.0, 5.0, 10.0, 21.0, 19.0, 33.0, 44.0, 74.0, 108.0, 188.0, 252.0, 402.0, 672.0, 1265.0, 2233.0, 4424.0, 9170.0, 21359.0, 55071.0, 151276.0, 329622.0, 283549.0, 114082.0, 42052.0, 16574.0, 7586.0, 3667.0, 1987.0, 1125.0, 618.0, 355.0, 249.0, 125.0, 94.0, 75.0, 53.0, 35.0, 18.0, 17.0, 9.0, 9.0, 7.0, 3.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.293701171875, -0.2855110168457031, -0.27732086181640625, -0.2691307067871094, -0.2609405517578125, -0.2527503967285156, -0.24456024169921875, -0.23637008666992188, -0.228179931640625, -0.21998977661132812, -0.21179962158203125, -0.20360946655273438, -0.1954193115234375, -0.18722915649414062, -0.17903900146484375, -0.17084884643554688, -0.16265869140625, -0.15446853637695312, -0.14627838134765625, -0.13808822631835938, -0.1298980712890625, -0.12170791625976562, -0.11351776123046875, -0.10532760620117188, -0.097137451171875, -0.08894729614257812, -0.08075714111328125, -0.07256698608398438, -0.0643768310546875, -0.056186676025390625, -0.04799652099609375, -0.039806365966796875, -0.0316162109375, -0.023426055908203125, -0.01523590087890625, -0.007045745849609375, 0.0011444091796875, 0.009334564208984375, 0.01752471923828125, 0.025714874267578125, 0.033905029296875, 0.042095184326171875, 0.05028533935546875, 0.058475494384765625, 0.0666656494140625, 0.07485580444335938, 0.08304595947265625, 0.09123611450195312, 0.09942626953125, 0.10761642456054688, 0.11580657958984375, 0.12399673461914062, 0.1321868896484375, 0.14037704467773438, 0.14856719970703125, 0.15675735473632812, 0.164947509765625, 0.17313766479492188, 0.18132781982421875, 0.18951797485351562, 0.1977081298828125, 0.20589828491210938, 0.21408843994140625, 0.22227859497070312, 0.23046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 6.0, 4.0, 8.0, 13.0, 11.0, 10.0, 23.0, 21.0, 17.0, 32.0, 34.0, 48.0, 36.0, 32.0, 50.0, 44.0, 52.0, 58.0, 51.0, 64.0, 47.0, 30.0, 52.0, 38.0, 32.0, 25.0, 22.0, 28.0, 15.0, 14.0, 19.0, 13.0, 12.0, 9.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.328125, -0.31884002685546875, -0.3095550537109375, -0.30027008056640625, -0.290985107421875, -0.28170013427734375, -0.2724151611328125, -0.26313018798828125, -0.25384521484375, -0.24456024169921875, -0.2352752685546875, -0.22599029541015625, -0.216705322265625, -0.20742034912109375, -0.1981353759765625, -0.18885040283203125, -0.1795654296875, -0.17028045654296875, -0.1609954833984375, -0.15171051025390625, -0.142425537109375, -0.13314056396484375, -0.1238555908203125, -0.11457061767578125, -0.10528564453125, -0.09600067138671875, -0.0867156982421875, -0.07743072509765625, -0.068145751953125, -0.05886077880859375, -0.0495758056640625, -0.04029083251953125, -0.031005859375, -0.02172088623046875, -0.0124359130859375, -0.00315093994140625, 0.006134033203125, 0.01541900634765625, 0.0247039794921875, 0.03398895263671875, 0.04327392578125, 0.05255889892578125, 0.0618438720703125, 0.07112884521484375, 0.080413818359375, 0.08969879150390625, 0.0989837646484375, 0.10826873779296875, 0.1175537109375, 0.12683868408203125, 0.1361236572265625, 0.14540863037109375, 0.154693603515625, 0.16397857666015625, 0.1732635498046875, 0.18254852294921875, 0.19183349609375, 0.20111846923828125, 0.2104034423828125, 0.21968841552734375, 0.228973388671875, 0.23825836181640625, 0.2475433349609375, 0.25682830810546875, 0.26611328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 6.0, 10.0, 3.0, 8.0, 19.0, 22.0, 35.0, 62.0, 89.0, 148.0, 253.0, 428.0, 799.0, 1544.0, 3312.0, 7824.0, 23844.0, 131292.0, 649907.0, 183152.0, 29129.0, 9078.0, 3731.0, 1756.0, 872.0, 511.0, 285.0, 146.0, 94.0, 55.0, 38.0, 29.0, 14.0, 13.0, 9.0, 4.0, 6.0, 4.0, 2.0, 0.0, 3.0, 4.0, 7.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.2235107421875, -0.21722793579101562, -0.21094512939453125, -0.20466232299804688, -0.1983795166015625, -0.19209671020507812, -0.18581390380859375, -0.17953109741210938, -0.173248291015625, -0.16696548461914062, -0.16068267822265625, -0.15439987182617188, -0.1481170654296875, -0.14183425903320312, -0.13555145263671875, -0.12926864624023438, -0.12298583984375, -0.11670303344726562, -0.11042022705078125, -0.10413742065429688, -0.0978546142578125, -0.09157180786132812, -0.08528900146484375, -0.07900619506835938, -0.072723388671875, -0.06644058227539062, -0.06015777587890625, -0.053874969482421875, -0.0475921630859375, -0.041309356689453125, -0.03502655029296875, -0.028743743896484375, -0.0224609375, -0.016178131103515625, -0.00989532470703125, -0.003612518310546875, 0.0026702880859375, 0.008953094482421875, 0.01523590087890625, 0.021518707275390625, 0.027801513671875, 0.034084320068359375, 0.04036712646484375, 0.046649932861328125, 0.0529327392578125, 0.059215545654296875, 0.06549835205078125, 0.07178115844726562, 0.07806396484375, 0.08434677124023438, 0.09062957763671875, 0.09691238403320312, 0.1031951904296875, 0.10947799682617188, 0.11576080322265625, 0.12204360961914062, 0.128326416015625, 0.13460922241210938, 0.14089202880859375, 0.14717483520507812, 0.1534576416015625, 0.15974044799804688, 0.16602325439453125, 0.17230606079101562, 0.1785888671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 3.0, 8.0, 2.0, 9.0, 10.0, 9.0, 8.0, 6.0, 19.0, 24.0, 29.0, 28.0, 35.0, 55.0, 62.0, 77.0, 76.0, 96.0, 80.0, 65.0, 54.0, 55.0, 37.0, 22.0, 24.0, 16.0, 14.0, 13.0, 12.0, 8.0, 7.0, 5.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0001423358917236328, -0.0001380518078804016, -0.0001337677240371704, -0.0001294836401939392, -0.000125199556350708, -0.0001209154725074768, -0.0001166313886642456, -0.0001123473048210144, -0.0001080632209777832, -0.000103779137134552, -9.94950532913208e-05, -9.52109694480896e-05, -9.09268856048584e-05, -8.66428017616272e-05, -8.2358717918396e-05, -7.80746340751648e-05, -7.37905502319336e-05, -6.950646638870239e-05, -6.522238254547119e-05, -6.093829870223999e-05, -5.665421485900879e-05, -5.237013101577759e-05, -4.808604717254639e-05, -4.3801963329315186e-05, -3.9517879486083984e-05, -3.523379564285278e-05, -3.094971179962158e-05, -2.666562795639038e-05, -2.238154411315918e-05, -1.809746026992798e-05, -1.3813376426696777e-05, -9.529292583465576e-06, -5.245208740234375e-06, -9.611248970031738e-07, 3.3229589462280273e-06, 7.6070427894592285e-06, 1.189112663269043e-05, 1.617521047592163e-05, 2.0459294319152832e-05, 2.4743378162384033e-05, 2.9027462005615234e-05, 3.3311545848846436e-05, 3.759562969207764e-05, 4.187971353530884e-05, 4.616379737854004e-05, 5.044788122177124e-05, 5.473196506500244e-05, 5.901604890823364e-05, 6.330013275146484e-05, 6.758421659469604e-05, 7.186830043792725e-05, 7.615238428115845e-05, 8.043646812438965e-05, 8.472055196762085e-05, 8.900463581085205e-05, 9.328871965408325e-05, 9.757280349731445e-05, 0.00010185688734054565, 0.00010614097118377686, 0.00011042505502700806, 0.00011470913887023926, 0.00011899322271347046, 0.00012327730655670166, 0.00012756139039993286, 0.00013184547424316406]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 13.0, 17.0, 4.0, 17.0, 24.0, 33.0, 53.0, 99.0, 144.0, 292.0, 519.0, 1017.0, 2351.0, 5801.0, 18017.0, 123646.0, 738199.0, 129638.0, 18034.0, 6019.0, 2352.0, 1095.0, 502.0, 232.0, 145.0, 96.0, 59.0, 39.0, 26.0, 14.0, 12.0, 7.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2247314453125, -0.2171154022216797, -0.20949935913085938, -0.20188331604003906, -0.19426727294921875, -0.18665122985839844, -0.17903518676757812, -0.1714191436767578, -0.1638031005859375, -0.1561870574951172, -0.14857101440429688, -0.14095497131347656, -0.13333892822265625, -0.12572288513183594, -0.11810684204101562, -0.11049079895019531, -0.102874755859375, -0.09525871276855469, -0.08764266967773438, -0.08002662658691406, -0.07241058349609375, -0.06479454040527344, -0.057178497314453125, -0.04956245422363281, -0.0419464111328125, -0.03433036804199219, -0.026714324951171875, -0.019098281860351562, -0.01148223876953125, -0.0038661956787109375, 0.003749847412109375, 0.011365890502929688, 0.01898193359375, 0.026597976684570312, 0.034214019775390625, 0.04183006286621094, 0.04944610595703125, 0.05706214904785156, 0.06467819213867188, 0.07229423522949219, 0.0799102783203125, 0.08752632141113281, 0.09514236450195312, 0.10275840759277344, 0.11037445068359375, 0.11799049377441406, 0.12560653686523438, 0.1332225799560547, 0.140838623046875, 0.1484546661376953, 0.15607070922851562, 0.16368675231933594, 0.17130279541015625, 0.17891883850097656, 0.18653488159179688, 0.1941509246826172, 0.2017669677734375, 0.2093830108642578, 0.21699905395507812, 0.22461509704589844, 0.23223114013671875, 0.23984718322753906, 0.24746322631835938, 0.2550792694091797, 0.2626953125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 5.0, 8.0, 10.0, 13.0, 26.0, 27.0, 41.0, 50.0, 56.0, 66.0, 93.0, 102.0, 91.0, 77.0, 76.0, 58.0, 54.0, 36.0, 26.0, 15.0, 16.0, 8.0, 10.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11285400390625, -0.10867595672607422, -0.10449790954589844, -0.10031986236572266, -0.09614181518554688, -0.0919637680053711, -0.08778572082519531, -0.08360767364501953, -0.07942962646484375, -0.07525157928466797, -0.07107353210449219, -0.0668954849243164, -0.06271743774414062, -0.058539390563964844, -0.05436134338378906, -0.05018329620361328, -0.0460052490234375, -0.04182720184326172, -0.03764915466308594, -0.033471107482910156, -0.029293060302734375, -0.025115013122558594, -0.020936965942382812, -0.01675891876220703, -0.01258087158203125, -0.008402824401855469, -0.0042247772216796875, -4.673004150390625e-05, 0.004131317138671875, 0.008309364318847656, 0.012487411499023438, 0.01666545867919922, 0.020843505859375, 0.02502155303955078, 0.029199600219726562, 0.033377647399902344, 0.037555694580078125, 0.041733741760253906, 0.04591178894042969, 0.05008983612060547, 0.05426788330078125, 0.05844593048095703, 0.06262397766113281, 0.0668020248413086, 0.07098007202148438, 0.07515811920166016, 0.07933616638183594, 0.08351421356201172, 0.0876922607421875, 0.09187030792236328, 0.09604835510253906, 0.10022640228271484, 0.10440444946289062, 0.1085824966430664, 0.11276054382324219, 0.11693859100341797, 0.12111663818359375, 0.12529468536376953, 0.1294727325439453, 0.1336507797241211, 0.13782882690429688, 0.14200687408447266, 0.14618492126464844, 0.15036296844482422, 0.154541015625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 11.0, 13.0, 35.0, 47.0, 61.0, 123.0, 160.0, 165.0, 158.0, 103.0, 50.0, 28.0, 20.0, 10.0, 7.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.9370779991149902, -3.846107244491577, -3.755136489868164, -3.664165735244751, -3.573194980621338, -3.4822239875793457, -3.3912532329559326, -3.3002824783325195, -3.2093117237091064, -3.1183409690856934, -3.0273702144622803, -2.936399459838867, -2.845428466796875, -2.754457712173462, -2.663486957550049, -2.5725162029266357, -2.4815454483032227, -2.3905746936798096, -2.2996039390563965, -2.2086331844329834, -2.1176624298095703, -2.026691436767578, -1.935720682144165, -1.844749927520752, -1.7537791728973389, -1.6628084182739258, -1.5718376636505127, -1.48086678981781, -1.389896035194397, -1.2989252805709839, -1.2079544067382812, -1.1169836521148682, -1.026012897491455, -0.935042142868042, -0.8440713286399841, -0.7531005144119263, -0.6621297597885132, -0.5711590051651001, -0.48018819093704224, -0.3892173767089844, -0.2982466220855713, -0.20727583765983582, -0.11630505323410034, -0.025334268808364868, 0.0656365156173706, 0.15660730004310608, 0.24757808446884155, 0.3385488986968994, 0.4295196533203125, 0.5204904079437256, 0.6114612221717834, 0.7024320363998413, 0.7934027910232544, 0.8843735456466675, 0.9753443598747253, 1.0663151741027832, 1.1572859287261963, 1.2482566833496094, 1.3392274379730225, 1.430198311805725, 1.5211690664291382, 1.6121398210525513, 1.703110694885254, 1.794081449508667, 1.88505220413208]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 5.0, 11.0, 9.0, 12.0, 26.0, 24.0, 31.0, 41.0, 54.0, 74.0, 61.0, 84.0, 65.0, 59.0, 58.0, 98.0, 49.0, 53.0, 44.0, 27.0, 29.0, 24.0, 14.0, 15.0, 12.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9354915618896484, -1.8664132356643677, -1.7973347902297974, -1.7282564640045166, -1.6591780185699463, -1.5900996923446655, -1.5210213661193848, -1.4519429206848145, -1.3828645944595337, -1.313786268234253, -1.2447078227996826, -1.1756294965744019, -1.106551170349121, -1.0374727249145508, -0.96839439868927, -0.8993160128593445, -0.830237627029419, -0.7611592411994934, -0.6920808553695679, -0.6230025291442871, -0.5539241433143616, -0.48484575748443604, -0.4157674014568329, -0.34668904542922974, -0.2776106595993042, -0.20853228867053986, -0.1394539177417755, -0.07037554681301117, -0.0012971758842468262, 0.06778120994567871, 0.13685956597328186, 0.205937922000885, 0.27501654624938965, 0.3440949320793152, 0.41317328810691833, 0.4822516441345215, 0.551330029964447, 0.6204084157943726, 0.6894867420196533, 0.7585651278495789, 0.8276435136795044, 0.8967218995094299, 0.9658002853393555, 1.0348786115646362, 1.103956937789917, 1.1730353832244873, 1.242113709449768, 1.3111920356750488, 1.3802704811096191, 1.4493488073349, 1.5184272527694702, 1.587505578994751, 1.6565840244293213, 1.725662350654602, 1.7947406768798828, 1.8638191223144531, 1.9328974485397339, 2.0019757747650146, 2.071054220199585, 2.1401326656341553, 2.2092108726501465, 2.278289318084717, 2.347367763519287, 2.4164459705352783, 2.4855244159698486]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 6.0, 17.0, 22.0, 27.0, 50.0, 60.0, 112.0, 177.0, 297.0, 562.0, 1131.0, 3010.0, 13173.0, 148357.0, 3888851.0, 119991.0, 13068.0, 3140.0, 1143.0, 494.0, 253.0, 129.0, 84.0, 45.0, 21.0, 20.0, 12.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82421875, -0.799591064453125, -0.77496337890625, -0.750335693359375, -0.7257080078125, -0.701080322265625, -0.67645263671875, -0.651824951171875, -0.627197265625, -0.602569580078125, -0.57794189453125, -0.553314208984375, -0.5286865234375, -0.504058837890625, -0.47943115234375, -0.454803466796875, -0.43017578125, -0.405548095703125, -0.38092041015625, -0.356292724609375, -0.3316650390625, -0.307037353515625, -0.28240966796875, -0.257781982421875, -0.233154296875, -0.208526611328125, -0.18389892578125, -0.159271240234375, -0.1346435546875, -0.110015869140625, -0.08538818359375, -0.060760498046875, -0.0361328125, -0.011505126953125, 0.01312255859375, 0.037750244140625, 0.0623779296875, 0.087005615234375, 0.11163330078125, 0.136260986328125, 0.160888671875, 0.185516357421875, 0.21014404296875, 0.234771728515625, 0.2593994140625, 0.284027099609375, 0.30865478515625, 0.333282470703125, 0.35791015625, 0.382537841796875, 0.40716552734375, 0.431793212890625, 0.4564208984375, 0.481048583984375, 0.50567626953125, 0.530303955078125, 0.554931640625, 0.579559326171875, 0.60418701171875, 0.628814697265625, 0.6534423828125, 0.678070068359375, 0.70269775390625, 0.727325439453125, 0.751953125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 10.0, 10.0, 32.0, 64.0, 106.0, 140.0, 150.0, 141.0, 138.0, 83.0, 48.0, 38.0, 14.0, 9.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1688232421875, -0.16385459899902344, -0.15888595581054688, -0.1539173126220703, -0.14894866943359375, -0.1439800262451172, -0.13901138305664062, -0.13404273986816406, -0.1290740966796875, -0.12410545349121094, -0.11913681030273438, -0.11416816711425781, -0.10919952392578125, -0.10423088073730469, -0.09926223754882812, -0.09429359436035156, -0.089324951171875, -0.08435630798339844, -0.07938766479492188, -0.07441902160644531, -0.06945037841796875, -0.06448173522949219, -0.059513092041015625, -0.05454444885253906, -0.0495758056640625, -0.04460716247558594, -0.039638519287109375, -0.03466987609863281, -0.02970123291015625, -0.024732589721679688, -0.019763946533203125, -0.014795303344726562, -0.00982666015625, -0.0048580169677734375, 0.000110626220703125, 0.0050792694091796875, 0.01004791259765625, 0.015016555786132812, 0.019985198974609375, 0.024953842163085938, 0.0299224853515625, 0.03489112854003906, 0.039859771728515625, 0.04482841491699219, 0.04979705810546875, 0.05476570129394531, 0.059734344482421875, 0.06470298767089844, 0.069671630859375, 0.07464027404785156, 0.07960891723632812, 0.08457756042480469, 0.08954620361328125, 0.09451484680175781, 0.09948348999023438, 0.10445213317871094, 0.1094207763671875, 0.11438941955566406, 0.11935806274414062, 0.12432670593261719, 0.12929534912109375, 0.1342639923095703, 0.13923263549804688, 0.14420127868652344, 0.149169921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 6.0, 5.0, 9.0, 19.0, 24.0, 43.0, 64.0, 159.0, 245.0, 509.0, 1098.0, 3186.0, 14164.0, 459957.0, 3680055.0, 27720.0, 4477.0, 1333.0, 546.0, 265.0, 155.0, 79.0, 78.0, 33.0, 16.0, 14.0, 4.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9404296875, -0.908172607421875, -0.87591552734375, -0.843658447265625, -0.8114013671875, -0.779144287109375, -0.74688720703125, -0.714630126953125, -0.682373046875, -0.650115966796875, -0.61785888671875, -0.585601806640625, -0.5533447265625, -0.521087646484375, -0.48883056640625, -0.456573486328125, -0.42431640625, -0.392059326171875, -0.35980224609375, -0.327545166015625, -0.2952880859375, -0.263031005859375, -0.23077392578125, -0.198516845703125, -0.166259765625, -0.134002685546875, -0.10174560546875, -0.069488525390625, -0.0372314453125, -0.004974365234375, 0.02728271484375, 0.059539794921875, 0.091796875, 0.124053955078125, 0.15631103515625, 0.188568115234375, 0.2208251953125, 0.253082275390625, 0.28533935546875, 0.317596435546875, 0.349853515625, 0.382110595703125, 0.41436767578125, 0.446624755859375, 0.4788818359375, 0.511138916015625, 0.54339599609375, 0.575653076171875, 0.60791015625, 0.640167236328125, 0.67242431640625, 0.704681396484375, 0.7369384765625, 0.769195556640625, 0.80145263671875, 0.833709716796875, 0.865966796875, 0.898223876953125, 0.93048095703125, 0.962738037109375, 0.9949951171875, 1.027252197265625, 1.05950927734375, 1.091766357421875, 1.1240234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 7.0, 14.0, 16.0, 23.0, 50.0, 110.0, 233.0, 757.0, 1792.0, 625.0, 223.0, 96.0, 45.0, 27.0, 12.0, 16.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.25439453125, -0.246307373046875, -0.23822021484375, -0.230133056640625, -0.2220458984375, -0.213958740234375, -0.20587158203125, -0.197784423828125, -0.189697265625, -0.181610107421875, -0.17352294921875, -0.165435791015625, -0.1573486328125, -0.149261474609375, -0.14117431640625, -0.133087158203125, -0.125, -0.116912841796875, -0.10882568359375, -0.100738525390625, -0.0926513671875, -0.084564208984375, -0.07647705078125, -0.068389892578125, -0.060302734375, -0.052215576171875, -0.04412841796875, -0.036041259765625, -0.0279541015625, -0.019866943359375, -0.01177978515625, -0.003692626953125, 0.00439453125, 0.012481689453125, 0.02056884765625, 0.028656005859375, 0.0367431640625, 0.044830322265625, 0.05291748046875, 0.061004638671875, 0.069091796875, 0.077178955078125, 0.08526611328125, 0.093353271484375, 0.1014404296875, 0.109527587890625, 0.11761474609375, 0.125701904296875, 0.1337890625, 0.141876220703125, 0.14996337890625, 0.158050537109375, 0.1661376953125, 0.174224853515625, 0.18231201171875, 0.190399169921875, 0.198486328125, 0.206573486328125, 0.21466064453125, 0.222747802734375, 0.2308349609375, 0.238922119140625, 0.24700927734375, 0.255096435546875, 0.26318359375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 14.0, 18.0, 56.0, 103.0, 234.0, 257.0, 174.0, 82.0, 27.0, 16.0, 7.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2767488956451416, -2.2123172283172607, -2.147885799407959, -2.083454132080078, -2.0190224647521973, -1.954590916633606, -1.8901593685150146, -1.8257277011871338, -1.761296033859253, -1.6968644857406616, -1.6324328184127808, -1.5680012702941895, -1.5035696029663086, -1.4391380548477173, -1.374706506729126, -1.3102748394012451, -1.2458432912826538, -1.1814117431640625, -1.1169800758361816, -1.0525485277175903, -0.9881168603897095, -0.9236853122711182, -0.8592537045478821, -0.794822096824646, -0.7303904891014099, -0.6659588813781738, -0.6015272736549377, -0.5370956659317017, -0.47266408801078796, -0.4082324802875519, -0.3438009023666382, -0.2793692946434021, -0.21493756771087646, -0.15050595998764038, -0.08607436716556549, -0.0216427743434906, 0.04278883337974548, 0.10722044110298157, 0.17165201902389526, 0.23608362674713135, 0.30051523447036743, 0.3649468421936035, 0.4293784499168396, 0.4938100278377533, 0.558241605758667, 0.6226732730865479, 0.6871048212051392, 0.7515364289283752, 0.8159680366516113, 0.8803996443748474, 0.9448312520980835, 1.0092628002166748, 1.0736944675445557, 1.138126015663147, 1.2025575637817383, 1.2669892311096191, 1.3314208984375, 1.3958524465560913, 1.4602841138839722, 1.5247156620025635, 1.5891473293304443, 1.6535788774490356, 1.718010425567627, 1.7824420928955078, 1.8468736410140991]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 7.0, 10.0, 9.0, 25.0, 27.0, 41.0, 62.0, 87.0, 92.0, 115.0, 109.0, 91.0, 80.0, 78.0, 54.0, 47.0, 31.0, 19.0, 11.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1883189678192139, -1.1507377624511719, -1.1131565570831299, -1.0755754709243774, -1.0379942655563354, -1.0004130601882935, -0.9628318548202515, -0.9252506494522095, -0.8876695036888123, -0.8500882983207703, -0.812507152557373, -0.774925947189331, -0.7373447418212891, -0.6997635960578918, -0.6621823906898499, -0.6246012449264526, -0.5870200395584106, -0.5494388341903687, -0.5118576884269714, -0.47427648305892944, -0.43669530749320984, -0.39911413192749023, -0.36153292655944824, -0.32395175099372864, -0.28637057542800903, -0.24878939986228943, -0.21120820939540863, -0.17362701892852783, -0.13604584336280823, -0.09846466779708862, -0.060883477330207825, -0.023302286863327026, 0.014278888702392578, 0.05186007171869278, 0.08944125473499298, 0.12702244520187378, 0.16460362076759338, 0.202184796333313, 0.2397659868001938, 0.2773471772670746, 0.3149283528327942, 0.3525095283985138, 0.3900907039642334, 0.4276719093322754, 0.465253084897995, 0.5028342604637146, 0.5404154658317566, 0.5779966115951538, 0.6155778169631958, 0.6531590223312378, 0.690740168094635, 0.728321373462677, 0.7659025192260742, 0.8034837245941162, 0.8410649299621582, 0.8786461353302002, 0.9162272810935974, 0.9538084864616394, 0.9913896322250366, 1.0289708375930786, 1.0665520429611206, 1.104133129119873, 1.141714334487915, 1.179295539855957, 1.216876745223999]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 4.0, 3.0, 7.0, 9.0, 17.0, 17.0, 27.0, 43.0, 46.0, 77.0, 124.0, 174.0, 267.0, 416.0, 706.0, 1075.0, 1977.0, 3734.0, 9273.0, 39604.0, 258004.0, 557540.0, 138747.0, 22790.0, 6711.0, 2963.0, 1597.0, 914.0, 574.0, 386.0, 230.0, 156.0, 112.0, 68.0, 61.0, 30.0, 27.0, 14.0, 13.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.476806640625, -0.4605522155761719, -0.44429779052734375, -0.4280433654785156, -0.4117889404296875, -0.3955345153808594, -0.37928009033203125, -0.3630256652832031, -0.346771240234375, -0.3305168151855469, -0.31426239013671875, -0.2980079650878906, -0.2817535400390625, -0.2654991149902344, -0.24924468994140625, -0.23299026489257812, -0.21673583984375, -0.20048141479492188, -0.18422698974609375, -0.16797256469726562, -0.1517181396484375, -0.13546371459960938, -0.11920928955078125, -0.10295486450195312, -0.086700439453125, -0.07044601440429688, -0.05419158935546875, -0.037937164306640625, -0.0216827392578125, -0.005428314208984375, 0.01082611083984375, 0.027080535888671875, 0.0433349609375, 0.059589385986328125, 0.07584381103515625, 0.09209823608398438, 0.1083526611328125, 0.12460708618164062, 0.14086151123046875, 0.15711593627929688, 0.173370361328125, 0.18962478637695312, 0.20587921142578125, 0.22213363647460938, 0.2383880615234375, 0.2546424865722656, 0.27089691162109375, 0.2871513366699219, 0.30340576171875, 0.3196601867675781, 0.33591461181640625, 0.3521690368652344, 0.3684234619140625, 0.3846778869628906, 0.40093231201171875, 0.4171867370605469, 0.433441162109375, 0.4496955871582031, 0.46595001220703125, 0.4822044372558594, 0.4984588623046875, 0.5147132873535156, 0.5309677124023438, 0.5472221374511719, 0.5634765625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 12.0, 14.0, 37.0, 63.0, 141.0, 156.0, 182.0, 143.0, 100.0, 64.0, 46.0, 19.0, 8.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1695556640625, -0.16399574279785156, -0.15843582153320312, -0.1528759002685547, -0.14731597900390625, -0.1417560577392578, -0.13619613647460938, -0.13063621520996094, -0.1250762939453125, -0.11951637268066406, -0.11395645141601562, -0.10839653015136719, -0.10283660888671875, -0.09727668762207031, -0.09171676635742188, -0.08615684509277344, -0.080596923828125, -0.07503700256347656, -0.06947708129882812, -0.06391716003417969, -0.05835723876953125, -0.05279731750488281, -0.047237396240234375, -0.04167747497558594, -0.0361175537109375, -0.030557632446289062, -0.024997711181640625, -0.019437789916992188, -0.01387786865234375, -0.008317947387695312, -0.002758026123046875, 0.0028018951416015625, 0.00836181640625, 0.013921737670898438, 0.019481658935546875, 0.025041580200195312, 0.03060150146484375, 0.03616142272949219, 0.041721343994140625, 0.04728126525878906, 0.0528411865234375, 0.05840110778808594, 0.06396102905273438, 0.06952095031738281, 0.07508087158203125, 0.08064079284667969, 0.08620071411132812, 0.09176063537597656, 0.097320556640625, 0.10288047790527344, 0.10844039916992188, 0.11400032043457031, 0.11956024169921875, 0.1251201629638672, 0.13068008422851562, 0.13624000549316406, 0.1417999267578125, 0.14735984802246094, 0.15291976928710938, 0.1584796905517578, 0.16403961181640625, 0.1695995330810547, 0.17515945434570312, 0.18071937561035156, 0.186279296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 6.0, 10.0, 4.0, 9.0, 12.0, 22.0, 29.0, 38.0, 64.0, 86.0, 142.0, 200.0, 328.0, 586.0, 1258.0, 2566.0, 6184.0, 15527.0, 41713.0, 113204.0, 260662.0, 323149.0, 174397.0, 67310.0, 24340.0, 9284.0, 3768.0, 1674.0, 796.0, 430.0, 269.0, 170.0, 96.0, 61.0, 36.0, 35.0, 33.0, 22.0, 15.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23876953125, -0.2311248779296875, -0.223480224609375, -0.2158355712890625, -0.20819091796875, -0.2005462646484375, -0.192901611328125, -0.1852569580078125, -0.1776123046875, -0.1699676513671875, -0.162322998046875, -0.1546783447265625, -0.14703369140625, -0.1393890380859375, -0.131744384765625, -0.1240997314453125, -0.116455078125, -0.1088104248046875, -0.101165771484375, -0.0935211181640625, -0.08587646484375, -0.0782318115234375, -0.070587158203125, -0.0629425048828125, -0.0552978515625, -0.0476531982421875, -0.040008544921875, -0.0323638916015625, -0.02471923828125, -0.0170745849609375, -0.009429931640625, -0.0017852783203125, 0.005859375, 0.0135040283203125, 0.021148681640625, 0.0287933349609375, 0.03643798828125, 0.0440826416015625, 0.051727294921875, 0.0593719482421875, 0.0670166015625, 0.0746612548828125, 0.082305908203125, 0.0899505615234375, 0.09759521484375, 0.1052398681640625, 0.112884521484375, 0.1205291748046875, 0.128173828125, 0.1358184814453125, 0.143463134765625, 0.1511077880859375, 0.15875244140625, 0.1663970947265625, 0.174041748046875, 0.1816864013671875, 0.1893310546875, 0.1969757080078125, 0.204620361328125, 0.2122650146484375, 0.21990966796875, 0.2275543212890625, 0.235198974609375, 0.2428436279296875, 0.25048828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 5.0, 12.0, 9.0, 9.0, 15.0, 20.0, 31.0, 30.0, 34.0, 27.0, 34.0, 48.0, 36.0, 48.0, 41.0, 54.0, 52.0, 63.0, 50.0, 37.0, 33.0, 38.0, 35.0, 34.0, 30.0, 27.0, 24.0, 27.0, 23.0, 19.0, 9.0, 12.0, 7.0, 11.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2705078125, -0.2620391845703125, -0.253570556640625, -0.2451019287109375, -0.23663330078125, -0.2281646728515625, -0.219696044921875, -0.2112274169921875, -0.2027587890625, -0.1942901611328125, -0.185821533203125, -0.1773529052734375, -0.16888427734375, -0.1604156494140625, -0.151947021484375, -0.1434783935546875, -0.135009765625, -0.1265411376953125, -0.118072509765625, -0.1096038818359375, -0.10113525390625, -0.0926666259765625, -0.084197998046875, -0.0757293701171875, -0.0672607421875, -0.0587921142578125, -0.050323486328125, -0.0418548583984375, -0.03338623046875, -0.0249176025390625, -0.016448974609375, -0.0079803466796875, 0.00048828125, 0.0089569091796875, 0.017425537109375, 0.0258941650390625, 0.03436279296875, 0.0428314208984375, 0.051300048828125, 0.0597686767578125, 0.0682373046875, 0.0767059326171875, 0.085174560546875, 0.0936431884765625, 0.10211181640625, 0.1105804443359375, 0.119049072265625, 0.1275177001953125, 0.135986328125, 0.1444549560546875, 0.152923583984375, 0.1613922119140625, 0.16986083984375, 0.1783294677734375, 0.186798095703125, 0.1952667236328125, 0.2037353515625, 0.2122039794921875, 0.220672607421875, 0.2291412353515625, 0.23760986328125, 0.2460784912109375, 0.254547119140625, 0.2630157470703125, 0.271484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 9.0, 30.0, 48.0, 91.0, 160.0, 377.0, 941.0, 3014.0, 17009.0, 199610.0, 743008.0, 72529.0, 8673.0, 1826.0, 642.0, 304.0, 123.0, 63.0, 39.0, 26.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29931640625, -0.29084205627441406, -0.2823677062988281, -0.2738933563232422, -0.26541900634765625, -0.2569446563720703, -0.24847030639648438, -0.23999595642089844, -0.2315216064453125, -0.22304725646972656, -0.21457290649414062, -0.2060985565185547, -0.19762420654296875, -0.1891498565673828, -0.18067550659179688, -0.17220115661621094, -0.163726806640625, -0.15525245666503906, -0.14677810668945312, -0.1383037567138672, -0.12982940673828125, -0.12135505676269531, -0.11288070678710938, -0.10440635681152344, -0.0959320068359375, -0.08745765686035156, -0.07898330688476562, -0.07050895690917969, -0.06203460693359375, -0.05356025695800781, -0.045085906982421875, -0.03661155700683594, -0.02813720703125, -0.019662857055664062, -0.011188507080078125, -0.0027141571044921875, 0.00576019287109375, 0.014234542846679688, 0.022708892822265625, 0.031183242797851562, 0.0396575927734375, 0.04813194274902344, 0.056606292724609375, 0.06508064270019531, 0.07355499267578125, 0.08202934265136719, 0.09050369262695312, 0.09897804260253906, 0.107452392578125, 0.11592674255371094, 0.12440109252929688, 0.1328754425048828, 0.14134979248046875, 0.1498241424560547, 0.15829849243164062, 0.16677284240722656, 0.1752471923828125, 0.18372154235839844, 0.19219589233398438, 0.2006702423095703, 0.20914459228515625, 0.2176189422607422, 0.22609329223632812, 0.23456764221191406, 0.2430419921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 0.0, 6.0, 3.0, 5.0, 12.0, 15.0, 15.0, 15.0, 22.0, 31.0, 36.0, 39.0, 71.0, 77.0, 121.0, 91.0, 90.0, 74.0, 45.0, 61.0, 34.0, 30.0, 21.0, 20.0, 17.0, 12.0, 8.0, 10.0, 9.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.00019252300262451172, -0.00018721632659435272, -0.00018190965056419373, -0.00017660297453403473, -0.00017129629850387573, -0.00016598962247371674, -0.00016068294644355774, -0.00015537627041339874, -0.00015006959438323975, -0.00014476291835308075, -0.00013945624232292175, -0.00013414956629276276, -0.00012884289026260376, -0.00012353621423244476, -0.00011822953820228577, -0.00011292286217212677, -0.00010761618614196777, -0.00010230951011180878, -9.700283408164978e-05, -9.169615805149078e-05, -8.638948202133179e-05, -8.108280599117279e-05, -7.57761299610138e-05, -7.04694539308548e-05, -6.51627779006958e-05, -5.9856101870536804e-05, -5.454942584037781e-05, -4.924274981021881e-05, -4.3936073780059814e-05, -3.862939774990082e-05, -3.332272171974182e-05, -2.8016045689582825e-05, -2.2709369659423828e-05, -1.740269362926483e-05, -1.2096017599105835e-05, -6.789341568946838e-06, -1.4826655387878418e-06, 3.824010491371155e-06, 9.130686521530151e-06, 1.4437362551689148e-05, 1.9744038581848145e-05, 2.505071461200714e-05, 3.0357390642166138e-05, 3.5664066672325134e-05, 4.097074270248413e-05, 4.627741873264313e-05, 5.1584094762802124e-05, 5.689077079296112e-05, 6.219744682312012e-05, 6.750412285327911e-05, 7.281079888343811e-05, 7.811747491359711e-05, 8.34241509437561e-05, 8.87308269739151e-05, 9.40375030040741e-05, 9.93441790342331e-05, 0.00010465085506439209, 0.00010995753109455109, 0.00011526420712471008, 0.00012057088315486908, 0.00012587755918502808, 0.00013118423521518707, 0.00013649091124534607, 0.00014179758727550507, 0.00014710426330566406]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 5.0, 9.0, 10.0, 9.0, 18.0, 28.0, 28.0, 51.0, 75.0, 115.0, 212.0, 475.0, 969.0, 2424.0, 6487.0, 22147.0, 113709.0, 573240.0, 267960.0, 43195.0, 10759.0, 3656.0, 1454.0, 670.0, 343.0, 179.0, 95.0, 67.0, 36.0, 28.0, 19.0, 22.0, 11.0, 14.0, 6.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.203125, -0.19759368896484375, -0.1920623779296875, -0.18653106689453125, -0.180999755859375, -0.17546844482421875, -0.1699371337890625, -0.16440582275390625, -0.15887451171875, -0.15334320068359375, -0.1478118896484375, -0.14228057861328125, -0.136749267578125, -0.13121795654296875, -0.1256866455078125, -0.12015533447265625, -0.1146240234375, -0.10909271240234375, -0.1035614013671875, -0.09803009033203125, -0.092498779296875, -0.08696746826171875, -0.0814361572265625, -0.07590484619140625, -0.07037353515625, -0.06484222412109375, -0.0593109130859375, -0.05377960205078125, -0.048248291015625, -0.04271697998046875, -0.0371856689453125, -0.03165435791015625, -0.026123046875, -0.02059173583984375, -0.0150604248046875, -0.00952911376953125, -0.003997802734375, 0.00153350830078125, 0.0070648193359375, 0.01259613037109375, 0.01812744140625, 0.02365875244140625, 0.0291900634765625, 0.03472137451171875, 0.040252685546875, 0.04578399658203125, 0.0513153076171875, 0.05684661865234375, 0.0623779296875, 0.06790924072265625, 0.0734405517578125, 0.07897186279296875, 0.084503173828125, 0.09003448486328125, 0.0955657958984375, 0.10109710693359375, 0.10662841796875, 0.11215972900390625, 0.1176910400390625, 0.12322235107421875, 0.128753662109375, 0.13428497314453125, 0.1398162841796875, 0.14534759521484375, 0.15087890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 5.0, 9.0, 11.0, 14.0, 22.0, 29.0, 29.0, 50.0, 45.0, 50.0, 80.0, 81.0, 83.0, 82.0, 82.0, 68.0, 50.0, 38.0, 31.0, 30.0, 19.0, 15.0, 12.0, 13.0, 7.0, 10.0, 4.0, 6.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10626220703125, -0.1024026870727539, -0.09854316711425781, -0.09468364715576172, -0.09082412719726562, -0.08696460723876953, -0.08310508728027344, -0.07924556732177734, -0.07538604736328125, -0.07152652740478516, -0.06766700744628906, -0.06380748748779297, -0.059947967529296875, -0.05608844757080078, -0.05222892761230469, -0.048369407653808594, -0.0445098876953125, -0.040650367736816406, -0.03679084777832031, -0.03293132781982422, -0.029071807861328125, -0.02521228790283203, -0.021352767944335938, -0.017493247985839844, -0.01363372802734375, -0.009774208068847656, -0.0059146881103515625, -0.0020551681518554688, 0.001804351806640625, 0.005663871765136719, 0.009523391723632812, 0.013382911682128906, 0.017242431640625, 0.021101951599121094, 0.024961471557617188, 0.02882099151611328, 0.032680511474609375, 0.03654003143310547, 0.04039955139160156, 0.044259071350097656, 0.04811859130859375, 0.051978111267089844, 0.05583763122558594, 0.05969715118408203, 0.06355667114257812, 0.06741619110107422, 0.07127571105957031, 0.0751352310180664, 0.0789947509765625, 0.0828542709350586, 0.08671379089355469, 0.09057331085205078, 0.09443283081054688, 0.09829235076904297, 0.10215187072753906, 0.10601139068603516, 0.10987091064453125, 0.11373043060302734, 0.11758995056152344, 0.12144947052001953, 0.12530899047851562, 0.12916851043701172, 0.1330280303955078, 0.1368875503540039, 0.1407470703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 32.0, 43.0, 119.0, 192.0, 222.0, 176.0, 109.0, 59.0, 26.0, 11.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.015063285827637, -5.893158912658691, -5.771254539489746, -5.649350166320801, -5.5274457931518555, -5.40554141998291, -5.283637046813965, -5.161733150482178, -5.039828777313232, -4.917924404144287, -4.796020030975342, -4.6741156578063965, -4.552211284637451, -4.430307388305664, -4.308403015136719, -4.186498641967773, -4.064594268798828, -3.942689895629883, -3.8207855224609375, -3.698881149291992, -3.576977014541626, -3.4550726413726807, -3.3331682682037354, -3.21126389503479, -3.0893592834472656, -2.9674549102783203, -2.845550537109375, -2.7236461639404297, -2.6017420291900635, -2.479837656021118, -2.357933282852173, -2.2360289096832275, -2.1141250133514404, -1.9922206401824951, -1.8703163862228394, -1.748412013053894, -1.6265077590942383, -1.504603385925293, -1.3826990127563477, -1.2607946395874023, -1.1388903856277466, -1.0169860124588013, -0.8950817584991455, -0.7731773853302002, -0.6512730717658997, -0.5293687582015991, -0.4074643850326538, -0.28556007146835327, -0.16365575790405273, -0.041751429438591, 0.08015289902687073, 0.20205724239349365, 0.3239615559577942, 0.4458658695220947, 0.56777024269104, 0.6896745562553406, 0.8115788698196411, 0.9334831833839417, 1.0553874969482422, 1.1772918701171875, 1.2991962432861328, 1.4211004972457886, 1.5430048704147339, 1.6649091243743896, 1.786813497543335]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 9.0, 4.0, 14.0, 9.0, 14.0, 13.0, 22.0, 17.0, 18.0, 33.0, 38.0, 33.0, 47.0, 44.0, 40.0, 51.0, 49.0, 42.0, 50.0, 45.0, 61.0, 51.0, 53.0, 34.0, 31.0, 26.0, 34.0, 24.0, 20.0, 14.0, 18.0, 10.0, 8.0, 7.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.8470747470855713, -1.7968776226043701, -1.746680498123169, -1.6964833736419678, -1.6462862491607666, -1.5960891246795654, -1.5458920001983643, -1.495694875717163, -1.445497751235962, -1.3953006267547607, -1.3451035022735596, -1.2949063777923584, -1.2447092533111572, -1.194512128829956, -1.1443150043487549, -1.0941178798675537, -1.0439207553863525, -0.9937236309051514, -0.9435265064239502, -0.893329381942749, -0.8431322574615479, -0.7929351329803467, -0.7427380084991455, -0.6925408840179443, -0.6423436403274536, -0.5921465158462524, -0.5419493913650513, -0.4917522668838501, -0.4415551424026489, -0.39135798811912537, -0.3411608636379242, -0.290963739156723, -0.24076664447784424, -0.19056951999664307, -0.1403723955154419, -0.09017525613307953, -0.03997813165187836, 0.010219007730484009, 0.06041613221168518, 0.11061325669288635, 0.16081038117408752, 0.2110075056552887, 0.26120463013648987, 0.3114017844200134, 0.3615989089012146, 0.41179603338241577, 0.46199315786361694, 0.5121902823448181, 0.5623874068260193, 0.6125845313072205, 0.6627816557884216, 0.7129787802696228, 0.763175904750824, 0.8133730888366699, 0.8635702133178711, 0.9137673377990723, 0.9639644622802734, 1.0141615867614746, 1.0643587112426758, 1.114555835723877, 1.1647529602050781, 1.2149500846862793, 1.2651472091674805, 1.3153443336486816, 1.3655414581298828]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 7.0, 9.0, 17.0, 22.0, 26.0, 43.0, 44.0, 85.0, 107.0, 164.0, 256.0, 495.0, 901.0, 2141.0, 6961.0, 43977.0, 3695548.0, 413808.0, 21723.0, 4623.0, 1568.0, 700.0, 383.0, 245.0, 145.0, 88.0, 54.0, 49.0, 34.0, 22.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62841796875, -0.608673095703125, -0.58892822265625, -0.569183349609375, -0.5494384765625, -0.529693603515625, -0.50994873046875, -0.490203857421875, -0.470458984375, -0.450714111328125, -0.43096923828125, -0.411224365234375, -0.3914794921875, -0.371734619140625, -0.35198974609375, -0.332244873046875, -0.3125, -0.292755126953125, -0.27301025390625, -0.253265380859375, -0.2335205078125, -0.213775634765625, -0.19403076171875, -0.174285888671875, -0.154541015625, -0.134796142578125, -0.11505126953125, -0.095306396484375, -0.0755615234375, -0.055816650390625, -0.03607177734375, -0.016326904296875, 0.00341796875, 0.023162841796875, 0.04290771484375, 0.062652587890625, 0.0823974609375, 0.102142333984375, 0.12188720703125, 0.141632080078125, 0.161376953125, 0.181121826171875, 0.20086669921875, 0.220611572265625, 0.2403564453125, 0.260101318359375, 0.27984619140625, 0.299591064453125, 0.3193359375, 0.339080810546875, 0.35882568359375, 0.378570556640625, 0.3983154296875, 0.418060302734375, 0.43780517578125, 0.457550048828125, 0.477294921875, 0.497039794921875, 0.51678466796875, 0.536529541015625, 0.5562744140625, 0.576019287109375, 0.59576416015625, 0.615509033203125, 0.63525390625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 4.0, 13.0, 21.0, 37.0, 85.0, 130.0, 152.0, 154.0, 127.0, 109.0, 72.0, 39.0, 22.0, 13.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1810302734375, -0.17525672912597656, -0.16948318481445312, -0.1637096405029297, -0.15793609619140625, -0.1521625518798828, -0.14638900756835938, -0.14061546325683594, -0.1348419189453125, -0.12906837463378906, -0.12329483032226562, -0.11752128601074219, -0.11174774169921875, -0.10597419738769531, -0.10020065307617188, -0.09442710876464844, -0.088653564453125, -0.08288002014160156, -0.07710647583007812, -0.07133293151855469, -0.06555938720703125, -0.05978584289550781, -0.054012298583984375, -0.04823875427246094, -0.0424652099609375, -0.03669166564941406, -0.030918121337890625, -0.025144577026367188, -0.01937103271484375, -0.013597488403320312, -0.007823944091796875, -0.0020503997802734375, 0.00372314453125, 0.009496688842773438, 0.015270233154296875, 0.021043777465820312, 0.02681732177734375, 0.03259086608886719, 0.038364410400390625, 0.04413795471191406, 0.0499114990234375, 0.05568504333496094, 0.061458587646484375, 0.06723213195800781, 0.07300567626953125, 0.07877922058105469, 0.08455276489257812, 0.09032630920410156, 0.096099853515625, 0.10187339782714844, 0.10764694213867188, 0.11342048645019531, 0.11919403076171875, 0.12496757507324219, 0.13074111938476562, 0.13651466369628906, 0.1422882080078125, 0.14806175231933594, 0.15383529663085938, 0.1596088409423828, 0.16538238525390625, 0.1711559295654297, 0.17692947387695312, 0.18270301818847656, 0.1884765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 10.0, 10.0, 9.0, 19.0, 25.0, 35.0, 43.0, 61.0, 75.0, 114.0, 151.0, 248.0, 358.0, 536.0, 847.0, 1632.0, 3737.0, 9599.0, 31719.0, 150967.0, 2844896.0, 1022017.0, 91255.0, 21975.0, 7133.0, 2954.0, 1489.0, 820.0, 437.0, 338.0, 221.0, 171.0, 108.0, 77.0, 50.0, 44.0, 27.0, 17.0, 17.0, 7.0, 6.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.250244140625, -0.24186325073242188, -0.23348236083984375, -0.22510147094726562, -0.2167205810546875, -0.20833969116210938, -0.19995880126953125, -0.19157791137695312, -0.183197021484375, -0.17481613159179688, -0.16643524169921875, -0.15805435180664062, -0.1496734619140625, -0.14129257202148438, -0.13291168212890625, -0.12453079223632812, -0.11614990234375, -0.10776901245117188, -0.09938812255859375, -0.09100723266601562, -0.0826263427734375, -0.07424545288085938, -0.06586456298828125, -0.057483673095703125, -0.049102783203125, -0.040721893310546875, -0.03234100341796875, -0.023960113525390625, -0.0155792236328125, -0.007198333740234375, 0.00118255615234375, 0.009563446044921875, 0.0179443359375, 0.026325225830078125, 0.03470611572265625, 0.043087005615234375, 0.0514678955078125, 0.059848785400390625, 0.06822967529296875, 0.07661056518554688, 0.084991455078125, 0.09337234497070312, 0.10175323486328125, 0.11013412475585938, 0.1185150146484375, 0.12689590454101562, 0.13527679443359375, 0.14365768432617188, 0.15203857421875, 0.16041946411132812, 0.16880035400390625, 0.17718124389648438, 0.1855621337890625, 0.19394302368164062, 0.20232391357421875, 0.21070480346679688, 0.219085693359375, 0.22746658325195312, 0.23584747314453125, 0.24422836303710938, 0.2526092529296875, 0.2609901428222656, 0.26937103271484375, 0.2777519226074219, 0.2861328125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 10.0, 19.0, 32.0, 44.0, 72.0, 152.0, 405.0, 1441.0, 1204.0, 331.0, 165.0, 82.0, 40.0, 26.0, 16.0, 7.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.154296875, -0.1493091583251953, -0.14432144165039062, -0.13933372497558594, -0.13434600830078125, -0.12935829162597656, -0.12437057495117188, -0.11938285827636719, -0.1143951416015625, -0.10940742492675781, -0.10441970825195312, -0.09943199157714844, -0.09444427490234375, -0.08945655822753906, -0.08446884155273438, -0.07948112487792969, -0.074493408203125, -0.06950569152832031, -0.06451797485351562, -0.05953025817871094, -0.05454254150390625, -0.04955482482910156, -0.044567108154296875, -0.03957939147949219, -0.0345916748046875, -0.029603958129882812, -0.024616241455078125, -0.019628524780273438, -0.01464080810546875, -0.009653091430664062, -0.004665374755859375, 0.0003223419189453125, 0.00531005859375, 0.010297775268554688, 0.015285491943359375, 0.020273208618164062, 0.02526092529296875, 0.030248641967773438, 0.035236358642578125, 0.04022407531738281, 0.0452117919921875, 0.05019950866699219, 0.055187225341796875, 0.06017494201660156, 0.06516265869140625, 0.07015037536621094, 0.07513809204101562, 0.08012580871582031, 0.085113525390625, 0.09010124206542969, 0.09508895874023438, 0.10007667541503906, 0.10506439208984375, 0.11005210876464844, 0.11503982543945312, 0.12002754211425781, 0.1250152587890625, 0.1300029754638672, 0.13499069213867188, 0.13997840881347656, 0.14496612548828125, 0.14995384216308594, 0.15494155883789062, 0.1599292755126953, 0.1649169921875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 18.0, 35.0, 70.0, 115.0, 217.0, 236.0, 131.0, 90.0, 44.0, 17.0, 8.0, 7.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9648955464363098, -0.9337611794471741, -0.9026267528533936, -0.8714923858642578, -0.8403580188751221, -0.8092235922813416, -0.7780892252922058, -0.7469547986984253, -0.7158204317092896, -0.6846860647201538, -0.6535516381263733, -0.6224172711372375, -0.591282844543457, -0.5601484775543213, -0.5290141105651855, -0.4978797137737274, -0.4667453169822693, -0.43561092019081116, -0.404476523399353, -0.3733421564102173, -0.34220775961875916, -0.311073362827301, -0.2799389958381653, -0.24880459904670715, -0.21767020225524902, -0.1865358054637909, -0.15540142357349396, -0.12426703423261642, -0.09313264489173889, -0.06199824810028076, -0.030863866209983826, 0.00027051568031311035, 0.031404972076416016, 0.06253936141729355, 0.09367375075817108, 0.12480814009904861, 0.15594252943992615, 0.18707692623138428, 0.2182113081216812, 0.24934569001197815, 0.2804800868034363, 0.3116144835948944, 0.34274888038635254, 0.3738832473754883, 0.4050176441669464, 0.43615204095840454, 0.4672864079475403, 0.4984208047389984, 0.5295552015304565, 0.5606895685195923, 0.5918239951133728, 0.6229583621025085, 0.6540927886962891, 0.6852271556854248, 0.7163615226745605, 0.7474958896636963, 0.7786303162574768, 0.8097646832466125, 0.8408991098403931, 0.8720334768295288, 0.9031678438186646, 0.9343022704124451, 0.9654366374015808, 0.9965710639953613, 1.027705430984497]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 2.0, 9.0, 6.0, 13.0, 11.0, 16.0, 25.0, 23.0, 34.0, 34.0, 37.0, 38.0, 46.0, 52.0, 53.0, 60.0, 50.0, 53.0, 51.0, 54.0, 51.0, 42.0, 39.0, 40.0, 32.0, 23.0, 25.0, 19.0, 14.0, 13.0, 15.0, 3.0, 5.0, 4.0, 5.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3352075219154358, -0.321824848651886, -0.3084421753883362, -0.2950595021247864, -0.28167685866355896, -0.26829418540000916, -0.25491151213645935, -0.24152883887290955, -0.22814618051052094, -0.21476350724697113, -0.20138084888458252, -0.18799817562103271, -0.1746155023574829, -0.1612328439950943, -0.1478501707315445, -0.13446751236915588, -0.12108483910560608, -0.10770217329263687, -0.09431950747966766, -0.08093683421611786, -0.06755416840314865, -0.05417150259017944, -0.04078882932662964, -0.02740616351366043, -0.014023497700691223, -0.0006408300250768661, 0.01274183765053749, 0.026124507188796997, 0.039507173001766205, 0.05288983881473541, 0.06627251207828522, 0.07965517789125443, 0.09303784370422363, 0.10642050951719284, 0.11980317533016205, 0.13318584859371185, 0.14656850695610046, 0.15995118021965027, 0.17333385348320007, 0.18671652674674988, 0.2000991851091385, 0.2134818583726883, 0.2268645167350769, 0.2402471899986267, 0.2536298632621765, 0.2670125365257263, 0.2803952097892761, 0.29377785325050354, 0.30716052651405334, 0.32054319977760315, 0.33392587304115295, 0.34730851650238037, 0.3606911897659302, 0.37407386302948, 0.3874565362930298, 0.4008392095565796, 0.4142218828201294, 0.4276045560836792, 0.440987229347229, 0.4543699026107788, 0.4677525460720062, 0.48113521933555603, 0.49451789259910583, 0.5079005360603333, 0.5212832093238831]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 10.0, 9.0, 14.0, 28.0, 37.0, 55.0, 82.0, 122.0, 187.0, 266.0, 389.0, 640.0, 1075.0, 1883.0, 3900.0, 10214.0, 39248.0, 227427.0, 553411.0, 163899.0, 29613.0, 8269.0, 3462.0, 1656.0, 1013.0, 566.0, 341.0, 221.0, 146.0, 99.0, 76.0, 44.0, 49.0, 25.0, 17.0, 15.0, 11.0, 9.0, 8.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.51708984375, -0.5006256103515625, -0.484161376953125, -0.4676971435546875, -0.45123291015625, -0.4347686767578125, -0.418304443359375, -0.4018402099609375, -0.3853759765625, -0.3689117431640625, -0.352447509765625, -0.3359832763671875, -0.31951904296875, -0.3030548095703125, -0.286590576171875, -0.2701263427734375, -0.253662109375, -0.2371978759765625, -0.220733642578125, -0.2042694091796875, -0.18780517578125, -0.1713409423828125, -0.154876708984375, -0.1384124755859375, -0.1219482421875, -0.1054840087890625, -0.089019775390625, -0.0725555419921875, -0.05609130859375, -0.0396270751953125, -0.023162841796875, -0.0066986083984375, 0.009765625, 0.0262298583984375, 0.042694091796875, 0.0591583251953125, 0.07562255859375, 0.0920867919921875, 0.108551025390625, 0.1250152587890625, 0.1414794921875, 0.1579437255859375, 0.174407958984375, 0.1908721923828125, 0.20733642578125, 0.2238006591796875, 0.240264892578125, 0.2567291259765625, 0.273193359375, 0.2896575927734375, 0.306121826171875, 0.3225860595703125, 0.33905029296875, 0.3555145263671875, 0.371978759765625, 0.3884429931640625, 0.4049072265625, 0.4213714599609375, 0.437835693359375, 0.4542999267578125, 0.47076416015625, 0.4872283935546875, 0.503692626953125, 0.5201568603515625, 0.53662109375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 7.0, 12.0, 24.0, 38.0, 75.0, 123.0, 151.0, 162.0, 146.0, 96.0, 70.0, 38.0, 28.0, 16.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1845703125, -0.17869949340820312, -0.17282867431640625, -0.16695785522460938, -0.1610870361328125, -0.15521621704101562, -0.14934539794921875, -0.14347457885742188, -0.137603759765625, -0.13173294067382812, -0.12586212158203125, -0.11999130249023438, -0.1141204833984375, -0.10824966430664062, -0.10237884521484375, -0.09650802612304688, -0.09063720703125, -0.08476638793945312, -0.07889556884765625, -0.07302474975585938, -0.0671539306640625, -0.061283111572265625, -0.05541229248046875, -0.049541473388671875, -0.043670654296875, -0.037799835205078125, -0.03192901611328125, -0.026058197021484375, -0.0201873779296875, -0.014316558837890625, -0.00844573974609375, -0.002574920654296875, 0.0032958984375, 0.009166717529296875, 0.01503753662109375, 0.020908355712890625, 0.0267791748046875, 0.032649993896484375, 0.03852081298828125, 0.044391632080078125, 0.050262451171875, 0.056133270263671875, 0.06200408935546875, 0.06787490844726562, 0.0737457275390625, 0.07961654663085938, 0.08548736572265625, 0.09135818481445312, 0.09722900390625, 0.10309982299804688, 0.10897064208984375, 0.11484146118164062, 0.1207122802734375, 0.12658309936523438, 0.13245391845703125, 0.13832473754882812, 0.144195556640625, 0.15006637573242188, 0.15593719482421875, 0.16180801391601562, 0.1676788330078125, 0.17354965209960938, 0.17942047119140625, 0.18529129028320312, 0.191162109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 1.0, 7.0, 7.0, 9.0, 18.0, 27.0, 30.0, 30.0, 49.0, 59.0, 77.0, 116.0, 184.0, 257.0, 447.0, 715.0, 1344.0, 2809.0, 6233.0, 14073.0, 33113.0, 79818.0, 179161.0, 290369.0, 237390.0, 115940.0, 48725.0, 20349.0, 8896.0, 3843.0, 1863.0, 1035.0, 540.0, 307.0, 187.0, 148.0, 109.0, 63.0, 64.0, 36.0, 23.0, 25.0, 14.0, 15.0, 6.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.204833984375, -0.1981658935546875, -0.191497802734375, -0.1848297119140625, -0.17816162109375, -0.1714935302734375, -0.164825439453125, -0.1581573486328125, -0.1514892578125, -0.1448211669921875, -0.138153076171875, -0.1314849853515625, -0.12481689453125, -0.1181488037109375, -0.111480712890625, -0.1048126220703125, -0.09814453125, -0.0914764404296875, -0.084808349609375, -0.0781402587890625, -0.07147216796875, -0.0648040771484375, -0.058135986328125, -0.0514678955078125, -0.0447998046875, -0.0381317138671875, -0.031463623046875, -0.0247955322265625, -0.01812744140625, -0.0114593505859375, -0.004791259765625, 0.0018768310546875, 0.008544921875, 0.0152130126953125, 0.021881103515625, 0.0285491943359375, 0.03521728515625, 0.0418853759765625, 0.048553466796875, 0.0552215576171875, 0.0618896484375, 0.0685577392578125, 0.075225830078125, 0.0818939208984375, 0.08856201171875, 0.0952301025390625, 0.101898193359375, 0.1085662841796875, 0.115234375, 0.1219024658203125, 0.128570556640625, 0.1352386474609375, 0.14190673828125, 0.1485748291015625, 0.155242919921875, 0.1619110107421875, 0.1685791015625, 0.1752471923828125, 0.181915283203125, 0.1885833740234375, 0.19525146484375, 0.2019195556640625, 0.208587646484375, 0.2152557373046875, 0.221923828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 9.0, 8.0, 12.0, 10.0, 4.0, 16.0, 12.0, 14.0, 15.0, 11.0, 23.0, 30.0, 21.0, 21.0, 38.0, 32.0, 35.0, 44.0, 20.0, 40.0, 31.0, 37.0, 53.0, 48.0, 40.0, 45.0, 35.0, 32.0, 35.0, 33.0, 21.0, 30.0, 18.0, 23.0, 15.0, 18.0, 15.0, 21.0, 5.0, 10.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.270263671875, -0.26224708557128906, -0.2542304992675781, -0.2462139129638672, -0.23819732666015625, -0.2301807403564453, -0.22216415405273438, -0.21414756774902344, -0.2061309814453125, -0.19811439514160156, -0.19009780883789062, -0.1820812225341797, -0.17406463623046875, -0.1660480499267578, -0.15803146362304688, -0.15001487731933594, -0.141998291015625, -0.13398170471191406, -0.12596511840820312, -0.11794853210449219, -0.10993194580078125, -0.10191535949707031, -0.09389877319335938, -0.08588218688964844, -0.0778656005859375, -0.06984901428222656, -0.061832427978515625, -0.05381584167480469, -0.04579925537109375, -0.03778266906738281, -0.029766082763671875, -0.021749496459960938, -0.01373291015625, -0.0057163238525390625, 0.002300262451171875, 0.010316848754882812, 0.01833343505859375, 0.026350021362304688, 0.034366607666015625, 0.04238319396972656, 0.0503997802734375, 0.05841636657714844, 0.06643295288085938, 0.07444953918457031, 0.08246612548828125, 0.09048271179199219, 0.09849929809570312, 0.10651588439941406, 0.114532470703125, 0.12254905700683594, 0.13056564331054688, 0.1385822296142578, 0.14659881591796875, 0.1546154022216797, 0.16263198852539062, 0.17064857482910156, 0.1786651611328125, 0.18668174743652344, 0.19469833374023438, 0.2027149200439453, 0.21073150634765625, 0.2187480926513672, 0.22676467895507812, 0.23478126525878906, 0.2427978515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 10.0, 12.0, 19.0, 24.0, 58.0, 105.0, 165.0, 416.0, 1016.0, 3122.0, 11667.0, 63763.0, 439215.0, 446483.0, 65424.0, 12011.0, 3137.0, 1004.0, 453.0, 197.0, 104.0, 63.0, 25.0, 15.0, 16.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1702880859375, -0.16441726684570312, -0.15854644775390625, -0.15267562866210938, -0.1468048095703125, -0.14093399047851562, -0.13506317138671875, -0.12919235229492188, -0.123321533203125, -0.11745071411132812, -0.11157989501953125, -0.10570907592773438, -0.0998382568359375, -0.09396743774414062, -0.08809661865234375, -0.08222579956054688, -0.07635498046875, -0.07048416137695312, -0.06461334228515625, -0.058742523193359375, -0.0528717041015625, -0.047000885009765625, -0.04113006591796875, -0.035259246826171875, -0.029388427734375, -0.023517608642578125, -0.01764678955078125, -0.011775970458984375, -0.0059051513671875, -3.4332275390625e-05, 0.00583648681640625, 0.011707305908203125, 0.017578125, 0.023448944091796875, 0.02931976318359375, 0.035190582275390625, 0.0410614013671875, 0.046932220458984375, 0.05280303955078125, 0.058673858642578125, 0.064544677734375, 0.07041549682617188, 0.07628631591796875, 0.08215713500976562, 0.0880279541015625, 0.09389877319335938, 0.09976959228515625, 0.10564041137695312, 0.11151123046875, 0.11738204956054688, 0.12325286865234375, 0.12912368774414062, 0.1349945068359375, 0.14086532592773438, 0.14673614501953125, 0.15260696411132812, 0.158477783203125, 0.16434860229492188, 0.17021942138671875, 0.17609024047851562, 0.1819610595703125, 0.18783187866210938, 0.19370269775390625, 0.19957351684570312, 0.2054443359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 10.0, 7.0, 8.0, 14.0, 19.0, 26.0, 24.0, 37.0, 37.0, 45.0, 42.0, 50.0, 78.0, 92.0, 76.0, 73.0, 51.0, 44.0, 42.0, 46.0, 32.0, 32.0, 26.0, 18.0, 10.0, 13.0, 9.0, 6.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0], "bins": [-0.00014710426330566406, -0.00014321133494377136, -0.00013931840658187866, -0.00013542547821998596, -0.00013153254985809326, -0.00012763962149620056, -0.00012374669313430786, -0.00011985376477241516, -0.00011596083641052246, -0.00011206790804862976, -0.00010817497968673706, -0.00010428205132484436, -0.00010038912296295166, -9.649619460105896e-05, -9.260326623916626e-05, -8.871033787727356e-05, -8.481740951538086e-05, -8.092448115348816e-05, -7.703155279159546e-05, -7.313862442970276e-05, -6.924569606781006e-05, -6.535276770591736e-05, -6.145983934402466e-05, -5.756691098213196e-05, -5.367398262023926e-05, -4.978105425834656e-05, -4.588812589645386e-05, -4.199519753456116e-05, -3.810226917266846e-05, -3.420934081077576e-05, -3.0316412448883057e-05, -2.6423484086990356e-05, -2.2530555725097656e-05, -1.8637627363204956e-05, -1.4744699001312256e-05, -1.0851770639419556e-05, -6.9588422775268555e-06, -3.0659139156341553e-06, 8.270144462585449e-07, 4.719942808151245e-06, 8.612871170043945e-06, 1.2505799531936646e-05, 1.6398727893829346e-05, 2.0291656255722046e-05, 2.4184584617614746e-05, 2.8077512979507446e-05, 3.1970441341400146e-05, 3.586336970329285e-05, 3.975629806518555e-05, 4.364922642707825e-05, 4.754215478897095e-05, 5.143508315086365e-05, 5.532801151275635e-05, 5.922093987464905e-05, 6.311386823654175e-05, 6.700679659843445e-05, 7.089972496032715e-05, 7.479265332221985e-05, 7.868558168411255e-05, 8.257851004600525e-05, 8.647143840789795e-05, 9.036436676979065e-05, 9.425729513168335e-05, 9.815022349357605e-05, 0.00010204315185546875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 5.0, 12.0, 21.0, 34.0, 62.0, 110.0, 236.0, 632.0, 2151.0, 11465.0, 102045.0, 746082.0, 165002.0, 16465.0, 2867.0, 793.0, 272.0, 128.0, 68.0, 33.0, 21.0, 15.0, 15.0, 6.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.208740234375, -0.20058441162109375, -0.1924285888671875, -0.18427276611328125, -0.176116943359375, -0.16796112060546875, -0.1598052978515625, -0.15164947509765625, -0.14349365234375, -0.13533782958984375, -0.1271820068359375, -0.11902618408203125, -0.110870361328125, -0.10271453857421875, -0.0945587158203125, -0.08640289306640625, -0.0782470703125, -0.07009124755859375, -0.0619354248046875, -0.05377960205078125, -0.045623779296875, -0.03746795654296875, -0.0293121337890625, -0.02115631103515625, -0.01300048828125, -0.00484466552734375, 0.0033111572265625, 0.01146697998046875, 0.019622802734375, 0.02777862548828125, 0.0359344482421875, 0.04409027099609375, 0.05224609375, 0.06040191650390625, 0.0685577392578125, 0.07671356201171875, 0.084869384765625, 0.09302520751953125, 0.1011810302734375, 0.10933685302734375, 0.11749267578125, 0.12564849853515625, 0.1338043212890625, 0.14196014404296875, 0.150115966796875, 0.15827178955078125, 0.1664276123046875, 0.17458343505859375, 0.1827392578125, 0.19089508056640625, 0.1990509033203125, 0.20720672607421875, 0.215362548828125, 0.22351837158203125, 0.2316741943359375, 0.23983001708984375, 0.24798583984375, 0.25614166259765625, 0.2642974853515625, 0.27245330810546875, 0.280609130859375, 0.28876495361328125, 0.2969207763671875, 0.30507659912109375, 0.313232421875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 9.0, 4.0, 10.0, 7.0, 7.0, 9.0, 14.0, 10.0, 14.0, 28.0, 23.0, 43.0, 33.0, 41.0, 53.0, 64.0, 67.0, 67.0, 54.0, 50.0, 58.0, 64.0, 41.0, 40.0, 30.0, 28.0, 28.0, 19.0, 10.0, 11.0, 11.0, 10.0, 10.0, 6.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.08319091796875, -0.0801401138305664, -0.07708930969238281, -0.07403850555419922, -0.07098770141601562, -0.06793689727783203, -0.06488609313964844, -0.061835289001464844, -0.05878448486328125, -0.055733680725097656, -0.05268287658691406, -0.04963207244873047, -0.046581268310546875, -0.04353046417236328, -0.04047966003417969, -0.037428855895996094, -0.0343780517578125, -0.031327247619628906, -0.028276443481445312, -0.02522563934326172, -0.022174835205078125, -0.01912403106689453, -0.016073226928710938, -0.013022422790527344, -0.00997161865234375, -0.006920814514160156, -0.0038700103759765625, -0.0008192062377929688, 0.002231597900390625, 0.005282402038574219, 0.008333206176757812, 0.011384010314941406, 0.014434814453125, 0.017485618591308594, 0.020536422729492188, 0.02358722686767578, 0.026638031005859375, 0.02968883514404297, 0.03273963928222656, 0.035790443420410156, 0.03884124755859375, 0.041892051696777344, 0.04494285583496094, 0.04799365997314453, 0.051044464111328125, 0.05409526824951172, 0.05714607238769531, 0.060196876525878906, 0.0632476806640625, 0.0662984848022461, 0.06934928894042969, 0.07240009307861328, 0.07545089721679688, 0.07850170135498047, 0.08155250549316406, 0.08460330963134766, 0.08765411376953125, 0.09070491790771484, 0.09375572204589844, 0.09680652618408203, 0.09985733032226562, 0.10290813446044922, 0.10595893859863281, 0.1090097427368164, 0.112060546875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 17.0, 36.0, 108.0, 316.0, 329.0, 129.0, 47.0, 13.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.66799545288086, -8.487131118774414, -8.306265830993652, -8.125401496887207, -7.9445366859436035, -7.763671875, -7.5828070640563965, -7.401942253112793, -7.221077919006348, -7.040213108062744, -6.859348297119141, -6.678483963012695, -6.497619152069092, -6.316754341125488, -6.135889530181885, -5.955024719238281, -5.774159908294678, -5.593295097351074, -5.412430286407471, -5.231565475463867, -5.050701141357422, -4.869836330413818, -4.688971519470215, -4.508106708526611, -4.327241897583008, -4.146377086639404, -3.96551251411438, -3.7846477031707764, -3.603783130645752, -3.4229183197021484, -3.242053508758545, -3.0611886978149414, -2.8803248405456543, -2.699460029602051, -2.5185954570770264, -2.337730646133423, -2.1568660736083984, -1.976001262664795, -1.7951364517211914, -1.6142717599868774, -1.4334070682525635, -1.2525423765182495, -1.0716776847839355, -0.890812873840332, -0.7099481821060181, -0.5290834903717041, -0.3482186794281006, -0.16735398769378662, 0.013510704040527344, 0.1943754255771637, 0.37524014711380005, 0.5561048984527588, 0.7369695901870728, 0.9178342819213867, 1.0986990928649902, 1.2795637845993042, 1.4604284763336182, 1.6412931680679321, 1.822157859802246, 2.0030226707458496, 2.183887481689453, 2.3647520542144775, 2.545616865158081, 2.7264814376831055, 2.907346248626709]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 10.0, 7.0, 6.0, 10.0, 18.0, 15.0, 15.0, 17.0, 28.0, 35.0, 34.0, 34.0, 25.0, 45.0, 34.0, 44.0, 56.0, 43.0, 43.0, 50.0, 39.0, 41.0, 39.0, 40.0, 32.0, 37.0, 30.0, 24.0, 35.0, 18.0, 14.0, 19.0, 10.0, 8.0, 8.0, 3.0, 4.0, 7.0, 3.0, 4.0, 7.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0], "bins": [-1.8163119554519653, -1.7647607326507568, -1.7132095098495483, -1.6616582870483398, -1.6101070642471313, -1.5585558414459229, -1.507004737854004, -1.4554533958435059, -1.403902292251587, -1.3523510694503784, -1.30079984664917, -1.2492486238479614, -1.197697401046753, -1.1461461782455444, -1.094594955444336, -1.043043851852417, -0.991492509841919, -0.9399412870407104, -0.888390064239502, -0.8368388414382935, -0.785287618637085, -0.7337363958358765, -0.6821852326393127, -0.6306340098381042, -0.5790827870368958, -0.5275315642356873, -0.47598034143447876, -0.42442914843559265, -0.37287792563438416, -0.32132670283317566, -0.26977550983428955, -0.21822428703308105, -0.1666731834411621, -0.11512196809053421, -0.06357075273990631, -0.012019544839859009, 0.03953167796134949, 0.09108290076255798, 0.1426340937614441, 0.1941853165626526, 0.24573653936386108, 0.2972877621650696, 0.3488389849662781, 0.4003901779651642, 0.4519414007663727, 0.5034925937652588, 0.5550438165664673, 0.6065950393676758, 0.6581462621688843, 0.7096974849700928, 0.7612487077713013, 0.8127999305725098, 0.8643511533737183, 0.9159023761749268, 0.9674535393714905, 1.0190048217773438, 1.0705559253692627, 1.1221071481704712, 1.1736583709716797, 1.2252095937728882, 1.2767608165740967, 1.3283120393753052, 1.3798632621765137, 1.4314143657684326, 1.4829657077789307]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 5.0, 7.0, 8.0, 23.0, 40.0, 63.0, 89.0, 206.0, 370.0, 808.0, 2435.0, 14435.0, 1829623.0, 2326201.0, 15542.0, 2661.0, 931.0, 420.0, 175.0, 88.0, 62.0, 34.0, 13.0, 12.0, 9.0, 2.0, 4.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.810546875, -0.7805328369140625, -0.750518798828125, -0.7205047607421875, -0.69049072265625, -0.6604766845703125, -0.630462646484375, -0.6004486083984375, -0.5704345703125, -0.5404205322265625, -0.510406494140625, -0.4803924560546875, -0.45037841796875, -0.4203643798828125, -0.390350341796875, -0.3603363037109375, -0.330322265625, -0.3003082275390625, -0.270294189453125, -0.2402801513671875, -0.21026611328125, -0.1802520751953125, -0.150238037109375, -0.1202239990234375, -0.0902099609375, -0.0601959228515625, -0.030181884765625, -0.0001678466796875, 0.02984619140625, 0.0598602294921875, 0.089874267578125, 0.1198883056640625, 0.14990234375, 0.1799163818359375, 0.209930419921875, 0.2399444580078125, 0.26995849609375, 0.2999725341796875, 0.329986572265625, 0.3600006103515625, 0.3900146484375, 0.4200286865234375, 0.450042724609375, 0.4800567626953125, 0.51007080078125, 0.5400848388671875, 0.570098876953125, 0.6001129150390625, 0.630126953125, 0.6601409912109375, 0.690155029296875, 0.7201690673828125, 0.75018310546875, 0.7801971435546875, 0.810211181640625, 0.8402252197265625, 0.8702392578125, 0.9002532958984375, 0.930267333984375, 0.9602813720703125, 0.99029541015625, 1.0203094482421875, 1.050323486328125, 1.0803375244140625, 1.1103515625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 10.0, 15.0, 23.0, 47.0, 85.0, 114.0, 144.0, 148.0, 140.0, 89.0, 65.0, 42.0, 37.0, 23.0, 4.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1929931640625, -0.1868610382080078, -0.18072891235351562, -0.17459678649902344, -0.16846466064453125, -0.16233253479003906, -0.15620040893554688, -0.1500682830810547, -0.1439361572265625, -0.1378040313720703, -0.13167190551757812, -0.12553977966308594, -0.11940765380859375, -0.11327552795410156, -0.10714340209960938, -0.10101127624511719, -0.094879150390625, -0.08874702453613281, -0.08261489868164062, -0.07648277282714844, -0.07035064697265625, -0.06421852111816406, -0.058086395263671875, -0.05195426940917969, -0.0458221435546875, -0.03969001770019531, -0.033557891845703125, -0.027425765991210938, -0.02129364013671875, -0.015161514282226562, -0.009029388427734375, -0.0028972625732421875, 0.00323486328125, 0.009366989135742188, 0.015499114990234375, 0.021631240844726562, 0.02776336669921875, 0.03389549255371094, 0.040027618408203125, 0.04615974426269531, 0.0522918701171875, 0.05842399597167969, 0.06455612182617188, 0.07068824768066406, 0.07682037353515625, 0.08295249938964844, 0.08908462524414062, 0.09521675109863281, 0.101348876953125, 0.10748100280761719, 0.11361312866210938, 0.11974525451660156, 0.12587738037109375, 0.13200950622558594, 0.13814163208007812, 0.1442737579345703, 0.1504058837890625, 0.1565380096435547, 0.16267013549804688, 0.16880226135253906, 0.17493438720703125, 0.18106651306152344, 0.18719863891601562, 0.1933307647705078, 0.199462890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 7.0, 1.0, 10.0, 17.0, 48.0, 98.0, 138.0, 277.0, 515.0, 1181.0, 2754.0, 7313.0, 26449.0, 171597.0, 3543986.0, 381241.0, 41760.0, 10384.0, 3576.0, 1457.0, 675.0, 337.0, 187.0, 110.0, 70.0, 35.0, 19.0, 19.0, 8.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.352783203125, -0.34088134765625, -0.3289794921875, -0.31707763671875, -0.30517578125, -0.29327392578125, -0.2813720703125, -0.26947021484375, -0.257568359375, -0.24566650390625, -0.2337646484375, -0.22186279296875, -0.2099609375, -0.19805908203125, -0.1861572265625, -0.17425537109375, -0.162353515625, -0.15045166015625, -0.1385498046875, -0.12664794921875, -0.11474609375, -0.10284423828125, -0.0909423828125, -0.07904052734375, -0.067138671875, -0.05523681640625, -0.0433349609375, -0.03143310546875, -0.01953125, -0.00762939453125, 0.0042724609375, 0.01617431640625, 0.028076171875, 0.03997802734375, 0.0518798828125, 0.06378173828125, 0.07568359375, 0.08758544921875, 0.0994873046875, 0.11138916015625, 0.123291015625, 0.13519287109375, 0.1470947265625, 0.15899658203125, 0.1708984375, 0.18280029296875, 0.1947021484375, 0.20660400390625, 0.218505859375, 0.23040771484375, 0.2423095703125, 0.25421142578125, 0.26611328125, 0.27801513671875, 0.2899169921875, 0.30181884765625, 0.313720703125, 0.32562255859375, 0.3375244140625, 0.34942626953125, 0.361328125, 0.37322998046875, 0.3851318359375, 0.39703369140625, 0.408935546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 5.0, 15.0, 14.0, 36.0, 34.0, 75.0, 155.0, 311.0, 887.0, 1537.0, 494.0, 199.0, 104.0, 50.0, 38.0, 41.0, 19.0, 15.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136474609375, -0.13083839416503906, -0.12520217895507812, -0.11956596374511719, -0.11392974853515625, -0.10829353332519531, -0.10265731811523438, -0.09702110290527344, -0.0913848876953125, -0.08574867248535156, -0.08011245727539062, -0.07447624206542969, -0.06884002685546875, -0.06320381164550781, -0.057567596435546875, -0.05193138122558594, -0.046295166015625, -0.04065895080566406, -0.035022735595703125, -0.029386520385742188, -0.02375030517578125, -0.018114089965820312, -0.012477874755859375, -0.0068416595458984375, -0.0012054443359375, 0.0044307708740234375, 0.010066986083984375, 0.015703201293945312, 0.02133941650390625, 0.026975631713867188, 0.032611846923828125, 0.03824806213378906, 0.04388427734375, 0.04952049255371094, 0.055156707763671875, 0.06079292297363281, 0.06642913818359375, 0.07206535339355469, 0.07770156860351562, 0.08333778381347656, 0.0889739990234375, 0.09461021423339844, 0.10024642944335938, 0.10588264465332031, 0.11151885986328125, 0.11715507507324219, 0.12279129028320312, 0.12842750549316406, 0.134063720703125, 0.13969993591308594, 0.14533615112304688, 0.1509723663330078, 0.15660858154296875, 0.1622447967529297, 0.16788101196289062, 0.17351722717285156, 0.1791534423828125, 0.18478965759277344, 0.19042587280273438, 0.1960620880126953, 0.20169830322265625, 0.2073345184326172, 0.21297073364257812, 0.21860694885253906, 0.2242431640625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 28.0, 56.0, 147.0, 249.0, 244.0, 167.0, 68.0, 19.0, 14.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9786741733551025, -0.9270185232162476, -0.8753628730773926, -0.8237072229385376, -0.7720515727996826, -0.7203959226608276, -0.6687402725219727, -0.6170846223831177, -0.5654289722442627, -0.5137733221054077, -0.46211767196655273, -0.41046202182769775, -0.3588063716888428, -0.3071507513523102, -0.2554951012134552, -0.20383945107460022, -0.15218383073806763, -0.10052818059921265, -0.04887253791093826, 0.0027831047773361206, 0.0544387549161911, 0.10609439015388489, 0.15775004029273987, 0.20940569043159485, 0.26106134057044983, 0.3127169907093048, 0.3643726408481598, 0.4160282611846924, 0.46768391132354736, 0.5193395614624023, 0.5709952116012573, 0.6226508617401123, 0.6743065118789673, 0.7259621620178223, 0.7776178121566772, 0.8292734622955322, 0.8809291124343872, 0.9325847625732422, 0.9842404127120972, 1.0358960628509521, 1.0875517129898071, 1.139207363128662, 1.190863013267517, 1.242518663406372, 1.294174313545227, 1.345829963684082, 1.397485613822937, 1.449141263961792, 1.5007967948913574, 1.5524524450302124, 1.6041080951690674, 1.6557637453079224, 1.7074193954467773, 1.7590750455856323, 1.8107306957244873, 1.8623863458633423, 1.9140419960021973, 1.9656976461410522, 2.0173532962799072, 2.0690088272094727, 2.120664596557617, 2.1723201274871826, 2.223975896835327, 2.2756314277648926, 2.327287197113037]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 9.0, 11.0, 24.0, 24.0, 34.0, 34.0, 34.0, 49.0, 64.0, 72.0, 65.0, 78.0, 59.0, 62.0, 61.0, 73.0, 49.0, 45.0, 33.0, 26.0, 32.0, 13.0, 11.0, 8.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.8303853869438171, -0.8079603314399719, -0.7855352759361267, -0.7631101608276367, -0.7406851053237915, -0.7182600498199463, -0.6958349943161011, -0.6734099388122559, -0.6509848833084106, -0.6285598278045654, -0.6061347723007202, -0.583709716796875, -0.561284601688385, -0.5388595461845398, -0.5164344906806946, -0.49400943517684937, -0.4715843200683594, -0.44915926456451416, -0.42673417925834656, -0.40430912375450134, -0.38188403844833374, -0.3594589829444885, -0.3370339274406433, -0.3146088719367981, -0.2921837866306305, -0.2697587311267853, -0.24733364582061768, -0.22490859031677246, -0.20248351991176605, -0.18005844950675964, -0.15763339400291443, -0.13520832359790802, -0.11278319358825684, -0.09035812318325043, -0.06793306022882462, -0.045507997274398804, -0.023082926869392395, -0.0006578564643859863, 0.02176719903945923, 0.04419226944446564, 0.06661733984947205, 0.08904241025447845, 0.11146747320890427, 0.13389253616333008, 0.1563176065683365, 0.1787426769733429, 0.2011677324771881, 0.22359280288219452, 0.24601787328720093, 0.26844292879104614, 0.29086801409721375, 0.31329306960105896, 0.33571815490722656, 0.3581432104110718, 0.380568265914917, 0.4029933214187622, 0.4254184067249298, 0.447843462228775, 0.4702685475349426, 0.49269360303878784, 0.5151186585426331, 0.537543773651123, 0.5599688291549683, 0.5823938846588135, 0.6048189401626587]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 7.0, 8.0, 17.0, 25.0, 43.0, 50.0, 65.0, 118.0, 169.0, 231.0, 460.0, 792.0, 1561.0, 3323.0, 8983.0, 37737.0, 256102.0, 593411.0, 114300.0, 20015.0, 6049.0, 2376.0, 1141.0, 602.0, 317.0, 216.0, 130.0, 91.0, 64.0, 37.0, 42.0, 21.0, 15.0, 8.0, 2.0, 2.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.60546875, -0.5867233276367188, -0.5679779052734375, -0.5492324829101562, -0.530487060546875, -0.5117416381835938, -0.4929962158203125, -0.47425079345703125, -0.45550537109375, -0.43675994873046875, -0.4180145263671875, -0.39926910400390625, -0.380523681640625, -0.36177825927734375, -0.3430328369140625, -0.32428741455078125, -0.3055419921875, -0.28679656982421875, -0.2680511474609375, -0.24930572509765625, -0.230560302734375, -0.21181488037109375, -0.1930694580078125, -0.17432403564453125, -0.15557861328125, -0.13683319091796875, -0.1180877685546875, -0.09934234619140625, -0.080596923828125, -0.06185150146484375, -0.0431060791015625, -0.02436065673828125, -0.005615234375, 0.01313018798828125, 0.0318756103515625, 0.05062103271484375, 0.069366455078125, 0.08811187744140625, 0.1068572998046875, 0.12560272216796875, 0.14434814453125, 0.16309356689453125, 0.1818389892578125, 0.20058441162109375, 0.219329833984375, 0.23807525634765625, 0.2568206787109375, 0.27556610107421875, 0.2943115234375, 0.31305694580078125, 0.3318023681640625, 0.35054779052734375, 0.369293212890625, 0.38803863525390625, 0.4067840576171875, 0.42552947998046875, 0.44427490234375, 0.46302032470703125, 0.4817657470703125, 0.5005111694335938, 0.519256591796875, 0.5380020141601562, 0.5567474365234375, 0.5754928588867188, 0.59423828125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 14.0, 25.0, 39.0, 82.0, 125.0, 126.0, 147.0, 132.0, 117.0, 70.0, 45.0, 33.0, 17.0, 11.0, 5.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.195556640625, -0.1891632080078125, -0.182769775390625, -0.1763763427734375, -0.16998291015625, -0.1635894775390625, -0.157196044921875, -0.1508026123046875, -0.1444091796875, -0.1380157470703125, -0.131622314453125, -0.1252288818359375, -0.11883544921875, -0.1124420166015625, -0.106048583984375, -0.0996551513671875, -0.09326171875, -0.0868682861328125, -0.080474853515625, -0.0740814208984375, -0.06768798828125, -0.0612945556640625, -0.054901123046875, -0.0485076904296875, -0.0421142578125, -0.0357208251953125, -0.029327392578125, -0.0229339599609375, -0.01654052734375, -0.0101470947265625, -0.003753662109375, 0.0026397705078125, 0.009033203125, 0.0154266357421875, 0.021820068359375, 0.0282135009765625, 0.03460693359375, 0.0410003662109375, 0.047393798828125, 0.0537872314453125, 0.0601806640625, 0.0665740966796875, 0.072967529296875, 0.0793609619140625, 0.08575439453125, 0.0921478271484375, 0.098541259765625, 0.1049346923828125, 0.111328125, 0.1177215576171875, 0.124114990234375, 0.1305084228515625, 0.13690185546875, 0.1432952880859375, 0.149688720703125, 0.1560821533203125, 0.1624755859375, 0.1688690185546875, 0.175262451171875, 0.1816558837890625, 0.18804931640625, 0.1944427490234375, 0.200836181640625, 0.2072296142578125, 0.213623046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 9.0, 15.0, 14.0, 14.0, 22.0, 20.0, 42.0, 59.0, 69.0, 150.0, 229.0, 469.0, 1054.0, 3147.0, 11605.0, 57202.0, 317503.0, 511239.0, 115845.0, 21520.0, 5178.0, 1599.0, 674.0, 315.0, 150.0, 111.0, 81.0, 43.0, 46.0, 24.0, 23.0, 21.0, 9.0, 19.0, 8.0, 8.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.46875, -0.454193115234375, -0.43963623046875, -0.425079345703125, -0.4105224609375, -0.395965576171875, -0.38140869140625, -0.366851806640625, -0.352294921875, -0.337738037109375, -0.32318115234375, -0.308624267578125, -0.2940673828125, -0.279510498046875, -0.26495361328125, -0.250396728515625, -0.23583984375, -0.221282958984375, -0.20672607421875, -0.192169189453125, -0.1776123046875, -0.163055419921875, -0.14849853515625, -0.133941650390625, -0.119384765625, -0.104827880859375, -0.09027099609375, -0.075714111328125, -0.0611572265625, -0.046600341796875, -0.03204345703125, -0.017486572265625, -0.0029296875, 0.011627197265625, 0.02618408203125, 0.040740966796875, 0.0552978515625, 0.069854736328125, 0.08441162109375, 0.098968505859375, 0.113525390625, 0.128082275390625, 0.14263916015625, 0.157196044921875, 0.1717529296875, 0.186309814453125, 0.20086669921875, 0.215423583984375, 0.22998046875, 0.244537353515625, 0.25909423828125, 0.273651123046875, 0.2882080078125, 0.302764892578125, 0.31732177734375, 0.331878662109375, 0.346435546875, 0.360992431640625, 0.37554931640625, 0.390106201171875, 0.4046630859375, 0.419219970703125, 0.43377685546875, 0.448333740234375, 0.462890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 11.0, 6.0, 10.0, 10.0, 18.0, 24.0, 22.0, 30.0, 14.0, 35.0, 40.0, 50.0, 45.0, 48.0, 46.0, 57.0, 48.0, 51.0, 54.0, 53.0, 35.0, 34.0, 35.0, 36.0, 27.0, 23.0, 21.0, 18.0, 18.0, 9.0, 13.0, 14.0, 10.0, 6.0, 3.0, 5.0, 3.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.37451171875, -0.36356353759765625, -0.3526153564453125, -0.34166717529296875, -0.330718994140625, -0.31977081298828125, -0.3088226318359375, -0.29787445068359375, -0.28692626953125, -0.27597808837890625, -0.2650299072265625, -0.25408172607421875, -0.243133544921875, -0.23218536376953125, -0.2212371826171875, -0.21028900146484375, -0.1993408203125, -0.18839263916015625, -0.1774444580078125, -0.16649627685546875, -0.155548095703125, -0.14459991455078125, -0.1336517333984375, -0.12270355224609375, -0.11175537109375, -0.10080718994140625, -0.0898590087890625, -0.07891082763671875, -0.067962646484375, -0.05701446533203125, -0.0460662841796875, -0.03511810302734375, -0.024169921875, -0.01322174072265625, -0.0022735595703125, 0.00867462158203125, 0.019622802734375, 0.03057098388671875, 0.0415191650390625, 0.05246734619140625, 0.06341552734375, 0.07436370849609375, 0.0853118896484375, 0.09626007080078125, 0.107208251953125, 0.11815643310546875, 0.1291046142578125, 0.14005279541015625, 0.1510009765625, 0.16194915771484375, 0.1728973388671875, 0.18384552001953125, 0.194793701171875, 0.20574188232421875, 0.2166900634765625, 0.22763824462890625, 0.23858642578125, 0.24953460693359375, 0.2604827880859375, 0.27143096923828125, 0.282379150390625, 0.29332733154296875, 0.3042755126953125, 0.31522369384765625, 0.326171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 25.0, 68.0, 161.0, 700.0, 10872.0, 1032106.0, 4003.0, 424.0, 115.0, 41.0, 14.0, 13.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.55859375, -1.50164794921875, -1.4447021484375, -1.38775634765625, -1.330810546875, -1.27386474609375, -1.2169189453125, -1.15997314453125, -1.10302734375, -1.04608154296875, -0.9891357421875, -0.93218994140625, -0.875244140625, -0.81829833984375, -0.7613525390625, -0.70440673828125, -0.6474609375, -0.59051513671875, -0.5335693359375, -0.47662353515625, -0.419677734375, -0.36273193359375, -0.3057861328125, -0.24884033203125, -0.19189453125, -0.13494873046875, -0.0780029296875, -0.02105712890625, 0.035888671875, 0.09283447265625, 0.1497802734375, 0.20672607421875, 0.263671875, 0.32061767578125, 0.3775634765625, 0.43450927734375, 0.491455078125, 0.54840087890625, 0.6053466796875, 0.66229248046875, 0.71923828125, 0.77618408203125, 0.8331298828125, 0.89007568359375, 0.947021484375, 1.00396728515625, 1.0609130859375, 1.11785888671875, 1.1748046875, 1.23175048828125, 1.2886962890625, 1.34564208984375, 1.402587890625, 1.45953369140625, 1.5164794921875, 1.57342529296875, 1.63037109375, 1.68731689453125, 1.7442626953125, 1.80120849609375, 1.858154296875, 1.91510009765625, 1.9720458984375, 2.02899169921875, 2.0859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 11.0, 15.0, 17.0, 43.0, 69.0, 141.0, 263.0, 222.0, 94.0, 52.0, 28.0, 19.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000244140625, -0.00023428350687026978, -0.00022442638874053955, -0.00021456927061080933, -0.0002047121524810791, -0.00019485503435134888, -0.00018499791622161865, -0.00017514079809188843, -0.0001652836799621582, -0.00015542656183242798, -0.00014556944370269775, -0.00013571232557296753, -0.0001258552074432373, -0.00011599808931350708, -0.00010614097118377686, -9.628385305404663e-05, -8.64267349243164e-05, -7.656961679458618e-05, -6.671249866485596e-05, -5.685538053512573e-05, -4.699826240539551e-05, -3.714114427566528e-05, -2.728402614593506e-05, -1.7426908016204834e-05, -7.569789886474609e-06, 2.2873282432556152e-06, 1.214444637298584e-05, 2.2001564502716064e-05, 3.185868263244629e-05, 4.1715800762176514e-05, 5.157291889190674e-05, 6.143003702163696e-05, 7.128715515136719e-05, 8.114427328109741e-05, 9.100139141082764e-05, 0.00010085850954055786, 0.00011071562767028809, 0.00012057274580001831, 0.00013042986392974854, 0.00014028698205947876, 0.00015014410018920898, 0.0001600012183189392, 0.00016985833644866943, 0.00017971545457839966, 0.00018957257270812988, 0.0001994296908378601, 0.00020928680896759033, 0.00021914392709732056, 0.00022900104522705078, 0.000238858163356781, 0.00024871528148651123, 0.00025857239961624146, 0.0002684295177459717, 0.0002782866358757019, 0.00028814375400543213, 0.00029800087213516235, 0.0003078579902648926, 0.0003177151083946228, 0.00032757222652435303, 0.00033742934465408325, 0.0003472864627838135, 0.0003571435809135437, 0.0003670006990432739, 0.00037685781717300415, 0.0003867149353027344]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 10.0, 22.0, 30.0, 61.0, 121.0, 216.0, 480.0, 2249.0, 106633.0, 933783.0, 3766.0, 654.0, 243.0, 129.0, 71.0, 39.0, 25.0, 12.0, 8.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.28125, -1.241363525390625, -1.20147705078125, -1.161590576171875, -1.1217041015625, -1.081817626953125, -1.04193115234375, -1.002044677734375, -0.962158203125, -0.922271728515625, -0.88238525390625, -0.842498779296875, -0.8026123046875, -0.762725830078125, -0.72283935546875, -0.682952880859375, -0.64306640625, -0.603179931640625, -0.56329345703125, -0.523406982421875, -0.4835205078125, -0.443634033203125, -0.40374755859375, -0.363861083984375, -0.323974609375, -0.284088134765625, -0.24420166015625, -0.204315185546875, -0.1644287109375, -0.124542236328125, -0.08465576171875, -0.044769287109375, -0.0048828125, 0.035003662109375, 0.07489013671875, 0.114776611328125, 0.1546630859375, 0.194549560546875, 0.23443603515625, 0.274322509765625, 0.314208984375, 0.354095458984375, 0.39398193359375, 0.433868408203125, 0.4737548828125, 0.513641357421875, 0.55352783203125, 0.593414306640625, 0.63330078125, 0.673187255859375, 0.71307373046875, 0.752960205078125, 0.7928466796875, 0.832733154296875, 0.87261962890625, 0.912506103515625, 0.952392578125, 0.992279052734375, 1.03216552734375, 1.072052001953125, 1.1119384765625, 1.151824951171875, 1.19171142578125, 1.231597900390625, 1.271484375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 15.0, 63.0, 374.0, 424.0, 99.0, 18.0, 9.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1015625, -1.068267822265625, -1.03497314453125, -1.001678466796875, -0.9683837890625, -0.935089111328125, -0.90179443359375, -0.868499755859375, -0.835205078125, -0.801910400390625, -0.76861572265625, -0.735321044921875, -0.7020263671875, -0.668731689453125, -0.63543701171875, -0.602142333984375, -0.56884765625, -0.535552978515625, -0.50225830078125, -0.468963623046875, -0.4356689453125, -0.402374267578125, -0.36907958984375, -0.335784912109375, -0.302490234375, -0.269195556640625, -0.23590087890625, -0.202606201171875, -0.1693115234375, -0.136016845703125, -0.10272216796875, -0.069427490234375, -0.0361328125, -0.002838134765625, 0.03045654296875, 0.063751220703125, 0.0970458984375, 0.130340576171875, 0.16363525390625, 0.196929931640625, 0.230224609375, 0.263519287109375, 0.29681396484375, 0.330108642578125, 0.3634033203125, 0.396697998046875, 0.42999267578125, 0.463287353515625, 0.49658203125, 0.529876708984375, 0.56317138671875, 0.596466064453125, 0.6297607421875, 0.663055419921875, 0.69635009765625, 0.729644775390625, 0.762939453125, 0.796234130859375, 0.82952880859375, 0.862823486328125, 0.8961181640625, 0.929412841796875, 0.96270751953125, 0.996002197265625, 1.029296875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 43.0, 314.0, 498.0, 121.0, 20.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-22.58203125, -22.140111923217773, -21.698190689086914, -21.256271362304688, -20.814350128173828, -20.3724308013916, -19.930509567260742, -19.488590240478516, -19.046669006347656, -18.60474967956543, -18.16282844543457, -17.720909118652344, -17.278987884521484, -16.837068557739258, -16.3951473236084, -15.953227996826172, -15.511308670043945, -15.069388389587402, -14.62746810913086, -14.185547828674316, -13.743627548217773, -13.301708221435547, -12.859786987304688, -12.417867660522461, -11.975946426391602, -11.534026145935059, -11.092105865478516, -10.650185585021973, -10.20826530456543, -9.766345977783203, -9.324424743652344, -8.882505416870117, -8.440584182739258, -7.998663902282715, -7.556743621826172, -7.114823341369629, -6.672903537750244, -6.230983257293701, -5.789062976837158, -5.347143173217773, -4.9052228927612305, -4.4633026123046875, -4.0213823318481445, -3.5794622898101807, -3.137542247772217, -2.695621967315674, -2.253701686859131, -1.811781644821167, -1.3698616027832031, -0.9279414415359497, -0.4860212206840515, -0.04410099983215332, 0.3978191614151001, 0.8397393226623535, 1.2816596031188965, 1.7235796451568604, 2.1654999256134033, 2.6074202060699463, 3.04934024810791, 3.491260528564453, 3.933180809020996, 4.375101089477539, 4.817021369934082, 5.258941173553467, 5.70086145401001]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 4.0, 4.0, 12.0, 3.0, 7.0, 14.0, 22.0, 18.0, 29.0, 19.0, 31.0, 31.0, 47.0, 37.0, 47.0, 48.0, 37.0, 49.0, 48.0, 61.0, 53.0, 47.0, 44.0, 52.0, 31.0, 32.0, 26.0, 26.0, 23.0, 32.0, 12.0, 11.0, 11.0, 3.0, 7.0, 11.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.638761520385742, -2.5725622177124023, -2.5063629150390625, -2.4401638507843018, -2.373964548110962, -2.307765245437622, -2.2415659427642822, -2.1753666400909424, -2.1091675758361816, -2.042968273162842, -1.9767690896987915, -1.9105697870254517, -1.8443706035614014, -1.7781713008880615, -1.7119719982147217, -1.6457726955413818, -1.579573392868042, -1.5133740901947021, -1.4471749067306519, -1.380975604057312, -1.3147764205932617, -1.2485771179199219, -1.182377815246582, -1.1161785125732422, -1.049979329109192, -0.9837800860404968, -0.9175808429718018, -0.8513815402984619, -0.7851822972297668, -0.7189830541610718, -0.6527837514877319, -0.5865845084190369, -0.5203855037689209, -0.45418626070022583, -0.3879869878292084, -0.3217877149581909, -0.25558847188949585, -0.18938922882080078, -0.12318995594978333, -0.05699068307876587, 0.0092085599899292, 0.07540781795978546, 0.14160707592964172, 0.20780633389949799, 0.27400559186935425, 0.3402048349380493, 0.4064041078090668, 0.47260338068008423, 0.5388026237487793, 0.6050018668174744, 0.6712011098861694, 0.7374004125595093, 0.8035996556282043, 0.8697988986968994, 0.9359982013702393, 1.002197504043579, 1.0683966875076294, 1.1345959901809692, 1.2007951736450195, 1.2669944763183594, 1.3331937789916992, 1.3993929624557495, 1.4655922651290894, 1.5317914485931396, 1.5979907512664795]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 3.0, 7.0, 5.0, 12.0, 13.0, 21.0, 18.0, 28.0, 28.0, 39.0, 73.0, 80.0, 128.0, 173.0, 313.0, 514.0, 1040.0, 2297.0, 5985.0, 19137.0, 107879.0, 3781946.0, 230589.0, 29212.0, 8202.0, 3195.0, 1428.0, 692.0, 398.0, 220.0, 171.0, 117.0, 83.0, 61.0, 42.0, 37.0, 28.0, 27.0, 9.0, 9.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.52685546875, -0.5116462707519531, -0.49643707275390625, -0.4812278747558594, -0.4660186767578125, -0.4508094787597656, -0.43560028076171875, -0.4203910827636719, -0.405181884765625, -0.3899726867675781, -0.37476348876953125, -0.3595542907714844, -0.3443450927734375, -0.3291358947753906, -0.31392669677734375, -0.2987174987792969, -0.28350830078125, -0.2682991027832031, -0.25308990478515625, -0.23788070678710938, -0.2226715087890625, -0.20746231079101562, -0.19225311279296875, -0.17704391479492188, -0.161834716796875, -0.14662551879882812, -0.13141632080078125, -0.11620712280273438, -0.1009979248046875, -0.08578872680664062, -0.07057952880859375, -0.055370330810546875, -0.0401611328125, -0.024951934814453125, -0.00974273681640625, 0.005466461181640625, 0.0206756591796875, 0.035884857177734375, 0.05109405517578125, 0.06630325317382812, 0.081512451171875, 0.09672164916992188, 0.11193084716796875, 0.12714004516601562, 0.1423492431640625, 0.15755844116210938, 0.17276763916015625, 0.18797683715820312, 0.20318603515625, 0.21839523315429688, 0.23360443115234375, 0.24881362915039062, 0.2640228271484375, 0.2792320251464844, 0.29444122314453125, 0.3096504211425781, 0.324859619140625, 0.3400688171386719, 0.35527801513671875, 0.3704872131347656, 0.3856964111328125, 0.4009056091308594, 0.41611480712890625, 0.4313240051269531, 0.446533203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 10.0, 6.0, 18.0, 42.0, 47.0, 87.0, 127.0, 132.0, 132.0, 112.0, 87.0, 72.0, 53.0, 30.0, 24.0, 12.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.20914649963378906, -0.20247268676757812, -0.1957988739013672, -0.18912506103515625, -0.1824512481689453, -0.17577743530273438, -0.16910362243652344, -0.1624298095703125, -0.15575599670410156, -0.14908218383789062, -0.1424083709716797, -0.13573455810546875, -0.1290607452392578, -0.12238693237304688, -0.11571311950683594, -0.109039306640625, -0.10236549377441406, -0.09569168090820312, -0.08901786804199219, -0.08234405517578125, -0.07567024230957031, -0.06899642944335938, -0.06232261657714844, -0.0556488037109375, -0.04897499084472656, -0.042301177978515625, -0.03562736511230469, -0.02895355224609375, -0.022279739379882812, -0.015605926513671875, -0.008932113647460938, -0.00225830078125, 0.0044155120849609375, 0.011089324951171875, 0.017763137817382812, 0.02443695068359375, 0.031110763549804688, 0.037784576416015625, 0.04445838928222656, 0.0511322021484375, 0.05780601501464844, 0.06447982788085938, 0.07115364074707031, 0.07782745361328125, 0.08450126647949219, 0.09117507934570312, 0.09784889221191406, 0.104522705078125, 0.11119651794433594, 0.11787033081054688, 0.12454414367675781, 0.13121795654296875, 0.1378917694091797, 0.14456558227539062, 0.15123939514160156, 0.1579132080078125, 0.16458702087402344, 0.17126083374023438, 0.1779346466064453, 0.18460845947265625, 0.1912822723388672, 0.19795608520507812, 0.20462989807128906, 0.2113037109375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 8.0, 16.0, 43.0, 58.0, 123.0, 252.0, 558.0, 1309.0, 3456.0, 11712.0, 65389.0, 3668535.0, 403704.0, 28658.0, 6591.0, 2176.0, 933.0, 407.0, 185.0, 70.0, 51.0, 21.0, 13.0, 8.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.349365234375, -0.3307762145996094, -0.31218719482421875, -0.2935981750488281, -0.2750091552734375, -0.2564201354980469, -0.23783111572265625, -0.21924209594726562, -0.200653076171875, -0.18206405639648438, -0.16347503662109375, -0.14488601684570312, -0.1262969970703125, -0.10770797729492188, -0.08911895751953125, -0.07052993774414062, -0.05194091796875, -0.033351898193359375, -0.01476287841796875, 0.003826141357421875, 0.0224151611328125, 0.041004180908203125, 0.05959320068359375, 0.07818222045898438, 0.096771240234375, 0.11536026000976562, 0.13394927978515625, 0.15253829956054688, 0.1711273193359375, 0.18971633911132812, 0.20830535888671875, 0.22689437866210938, 0.2454833984375, 0.2640724182128906, 0.28266143798828125, 0.3012504577636719, 0.3198394775390625, 0.3384284973144531, 0.35701751708984375, 0.3756065368652344, 0.394195556640625, 0.4127845764160156, 0.43137359619140625, 0.4499626159667969, 0.4685516357421875, 0.4871406555175781, 0.5057296752929688, 0.5243186950683594, 0.54290771484375, 0.5614967346191406, 0.5800857543945312, 0.5986747741699219, 0.6172637939453125, 0.6358528137207031, 0.6544418334960938, 0.6730308532714844, 0.691619873046875, 0.7102088928222656, 0.7287979125976562, 0.7473869323730469, 0.7659759521484375, 0.7845649719238281, 0.8031539916992188, 0.8217430114746094, 0.84033203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 4.0, 12.0, 8.0, 11.0, 16.0, 19.0, 29.0, 66.0, 76.0, 146.0, 317.0, 1304.0, 1388.0, 303.0, 142.0, 63.0, 55.0, 25.0, 17.0, 14.0, 12.0, 11.0, 5.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.158447265625, -0.15333938598632812, -0.14823150634765625, -0.14312362670898438, -0.1380157470703125, -0.13290786743164062, -0.12779998779296875, -0.12269210815429688, -0.117584228515625, -0.11247634887695312, -0.10736846923828125, -0.10226058959960938, -0.0971527099609375, -0.09204483032226562, -0.08693695068359375, -0.08182907104492188, -0.07672119140625, -0.07161331176757812, -0.06650543212890625, -0.061397552490234375, -0.0562896728515625, -0.051181793212890625, -0.04607391357421875, -0.040966033935546875, -0.035858154296875, -0.030750274658203125, -0.02564239501953125, -0.020534515380859375, -0.0154266357421875, -0.010318756103515625, -0.00521087646484375, -0.000102996826171875, 0.0050048828125, 0.010112762451171875, 0.01522064208984375, 0.020328521728515625, 0.0254364013671875, 0.030544281005859375, 0.03565216064453125, 0.040760040283203125, 0.045867919921875, 0.050975799560546875, 0.05608367919921875, 0.061191558837890625, 0.0662994384765625, 0.07140731811523438, 0.07651519775390625, 0.08162307739257812, 0.08673095703125, 0.09183883666992188, 0.09694671630859375, 0.10205459594726562, 0.1071624755859375, 0.11227035522460938, 0.11737823486328125, 0.12248611450195312, 0.127593994140625, 0.13270187377929688, 0.13780975341796875, 0.14291763305664062, 0.1480255126953125, 0.15313339233398438, 0.15824127197265625, 0.16334915161132812, 0.16845703125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 10.0, 35.0, 128.0, 288.0, 326.0, 153.0, 39.0, 19.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8991286754608154, -2.823695659637451, -2.748262882232666, -2.6728298664093018, -2.5973970890045166, -2.5219640731811523, -2.446531295776367, -2.371098279953003, -2.2956652641296387, -2.2202322483062744, -2.1447994709014893, -2.069366455078125, -1.9939335584640503, -1.9185006618499756, -1.8430677652359009, -1.7676348686218262, -1.6922019720077515, -1.6167690753936768, -1.541336178779602, -1.4659032821655273, -1.390470266342163, -1.3150373697280884, -1.2396044731140137, -1.1641714572906494, -1.0887386798858643, -1.0133057832717896, -0.9378728270530701, -0.8624399304389954, -0.7870069742202759, -0.7115740776062012, -0.6361411809921265, -0.560708224773407, -0.4852752685546875, -0.4098423421382904, -0.3344094157218933, -0.2589765191078186, -0.1835435926914215, -0.10811066627502441, -0.03267776966094971, 0.042755186557769775, 0.11818808317184448, 0.19362100958824158, 0.26905393600463867, 0.3444868326187134, 0.4199197590351105, 0.49535268545150757, 0.5707855820655823, 0.6462185382843018, 0.7216514348983765, 0.7970843315124512, 0.8725172877311707, 0.9479501843452454, 1.0233831405639648, 1.0988160371780396, 1.1742489337921143, 1.2496819496154785, 1.3251147270202637, 1.4005476236343384, 1.475980520248413, 1.5514135360717773, 1.626846432685852, 1.7022793292999268, 1.7777122259140015, 1.8531451225280762, 1.9285781383514404]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 11.0, 14.0, 7.0, 18.0, 14.0, 24.0, 24.0, 18.0, 46.0, 40.0, 54.0, 43.0, 59.0, 68.0, 62.0, 62.0, 60.0, 49.0, 51.0, 50.0, 33.0, 35.0, 23.0, 20.0, 22.0, 24.0, 22.0, 10.0, 14.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4988066554069519, -0.47856348752975464, -0.4583203196525574, -0.4380771517753601, -0.41783398389816284, -0.3975908160209656, -0.3773476183414459, -0.35710445046424866, -0.3368612825870514, -0.3166181147098541, -0.29637494683265686, -0.2761317789554596, -0.25588858127593994, -0.23564542829990387, -0.2154022455215454, -0.19515907764434814, -0.17491590976715088, -0.1546727418899536, -0.13442957401275635, -0.11418639123439789, -0.09394322335720062, -0.07370005548000336, -0.053456880152225494, -0.03321370482444763, -0.012970536947250366, 0.007272634655237198, 0.027515806257724762, 0.047758977860212326, 0.06800214946269989, 0.08824531733989716, 0.10848849266767502, 0.12873166799545288, 0.14897489547729492, 0.1692180633544922, 0.18946123123168945, 0.2097044140100479, 0.22994758188724518, 0.25019073486328125, 0.2704339325428009, 0.29067710041999817, 0.31092026829719543, 0.3311634361743927, 0.35140660405158997, 0.37164977192878723, 0.3918929696083069, 0.41213613748550415, 0.4323793053627014, 0.4526224732398987, 0.47286564111709595, 0.4931088089942932, 0.5133519768714905, 0.5335951447486877, 0.553838312625885, 0.5740814805030823, 0.5943246483802795, 0.6145678758621216, 0.6348110437393188, 0.6550542116165161, 0.6752973794937134, 0.6955405473709106, 0.7157837152481079, 0.7360268831253052, 0.7562700510025024, 0.7765132188796997, 0.796756386756897]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 13.0, 30.0, 51.0, 96.0, 164.0, 355.0, 694.0, 1662.0, 5166.0, 35752.0, 470136.0, 488842.0, 37080.0, 5377.0, 1653.0, 783.0, 336.0, 171.0, 85.0, 41.0, 24.0, 17.0, 15.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8505859375, -0.8240127563476562, -0.7974395751953125, -0.7708663940429688, -0.744293212890625, -0.7177200317382812, -0.6911468505859375, -0.6645736694335938, -0.63800048828125, -0.6114273071289062, -0.5848541259765625, -0.5582809448242188, -0.531707763671875, -0.5051345825195312, -0.4785614013671875, -0.45198822021484375, -0.4254150390625, -0.39884185791015625, -0.3722686767578125, -0.34569549560546875, -0.319122314453125, -0.29254913330078125, -0.2659759521484375, -0.23940277099609375, -0.21282958984375, -0.18625640869140625, -0.1596832275390625, -0.13311004638671875, -0.106536865234375, -0.07996368408203125, -0.0533905029296875, -0.02681732177734375, -0.000244140625, 0.02632904052734375, 0.0529022216796875, 0.07947540283203125, 0.106048583984375, 0.13262176513671875, 0.1591949462890625, 0.18576812744140625, 0.21234130859375, 0.23891448974609375, 0.2654876708984375, 0.29206085205078125, 0.318634033203125, 0.34520721435546875, 0.3717803955078125, 0.39835357666015625, 0.4249267578125, 0.45149993896484375, 0.4780731201171875, 0.5046463012695312, 0.531219482421875, 0.5577926635742188, 0.5843658447265625, 0.6109390258789062, 0.63751220703125, 0.6640853881835938, 0.6906585693359375, 0.7172317504882812, 0.743804931640625, 0.7703781127929688, 0.7969512939453125, 0.8235244750976562, 0.85009765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 16.0, 19.0, 61.0, 64.0, 91.0, 131.0, 131.0, 124.0, 118.0, 79.0, 61.0, 39.0, 27.0, 17.0, 10.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.213623046875, -0.2069263458251953, -0.20022964477539062, -0.19353294372558594, -0.18683624267578125, -0.18013954162597656, -0.17344284057617188, -0.1667461395263672, -0.1600494384765625, -0.1533527374267578, -0.14665603637695312, -0.13995933532714844, -0.13326263427734375, -0.12656593322753906, -0.11986923217773438, -0.11317253112792969, -0.106475830078125, -0.09977912902832031, -0.09308242797851562, -0.08638572692871094, -0.07968902587890625, -0.07299232482910156, -0.06629562377929688, -0.05959892272949219, -0.0529022216796875, -0.04620552062988281, -0.039508819580078125, -0.03281211853027344, -0.02611541748046875, -0.019418716430664062, -0.012722015380859375, -0.0060253143310546875, 0.00067138671875, 0.0073680877685546875, 0.014064788818359375, 0.020761489868164062, 0.02745819091796875, 0.03415489196777344, 0.040851593017578125, 0.04754829406738281, 0.0542449951171875, 0.06094169616699219, 0.06763839721679688, 0.07433509826660156, 0.08103179931640625, 0.08772850036621094, 0.09442520141601562, 0.10112190246582031, 0.107818603515625, 0.11451530456542969, 0.12121200561523438, 0.12790870666503906, 0.13460540771484375, 0.14130210876464844, 0.14799880981445312, 0.1546955108642578, 0.1613922119140625, 0.1680889129638672, 0.17478561401367188, 0.18148231506347656, 0.18817901611328125, 0.19487571716308594, 0.20157241821289062, 0.2082691192626953, 0.2149658203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 8.0, 17.0, 31.0, 33.0, 37.0, 56.0, 74.0, 119.0, 166.0, 381.0, 848.0, 2325.0, 8376.0, 34832.0, 162134.0, 508647.0, 256540.0, 55361.0, 12910.0, 3409.0, 1113.0, 442.0, 224.0, 129.0, 77.0, 55.0, 45.0, 29.0, 23.0, 36.0, 19.0, 9.0, 4.0, 8.0, 5.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3720703125, -0.3590850830078125, -0.346099853515625, -0.3331146240234375, -0.32012939453125, -0.3071441650390625, -0.294158935546875, -0.2811737060546875, -0.2681884765625, -0.2552032470703125, -0.242218017578125, -0.2292327880859375, -0.21624755859375, -0.2032623291015625, -0.190277099609375, -0.1772918701171875, -0.164306640625, -0.1513214111328125, -0.138336181640625, -0.1253509521484375, -0.11236572265625, -0.0993804931640625, -0.086395263671875, -0.0734100341796875, -0.0604248046875, -0.0474395751953125, -0.034454345703125, -0.0214691162109375, -0.00848388671875, 0.0045013427734375, 0.017486572265625, 0.0304718017578125, 0.04345703125, 0.0564422607421875, 0.069427490234375, 0.0824127197265625, 0.09539794921875, 0.1083831787109375, 0.121368408203125, 0.1343536376953125, 0.1473388671875, 0.1603240966796875, 0.173309326171875, 0.1862945556640625, 0.19927978515625, 0.2122650146484375, 0.225250244140625, 0.2382354736328125, 0.251220703125, 0.2642059326171875, 0.277191162109375, 0.2901763916015625, 0.30316162109375, 0.3161468505859375, 0.329132080078125, 0.3421173095703125, 0.3551025390625, 0.3680877685546875, 0.381072998046875, 0.3940582275390625, 0.40704345703125, 0.4200286865234375, 0.433013916015625, 0.4459991455078125, 0.458984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 7.0, 4.0, 7.0, 4.0, 8.0, 8.0, 17.0, 21.0, 26.0, 23.0, 35.0, 25.0, 34.0, 34.0, 37.0, 39.0, 49.0, 35.0, 47.0, 35.0, 58.0, 37.0, 36.0, 36.0, 40.0, 28.0, 30.0, 27.0, 27.0, 35.0, 18.0, 17.0, 15.0, 17.0, 17.0, 8.0, 7.0, 5.0, 5.0, 6.0, 4.0, 6.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.3271484375, -0.3177528381347656, -0.30835723876953125, -0.2989616394042969, -0.2895660400390625, -0.2801704406738281, -0.27077484130859375, -0.2613792419433594, -0.251983642578125, -0.24258804321289062, -0.23319244384765625, -0.22379684448242188, -0.2144012451171875, -0.20500564575195312, -0.19561004638671875, -0.18621444702148438, -0.17681884765625, -0.16742324829101562, -0.15802764892578125, -0.14863204956054688, -0.1392364501953125, -0.12984085083007812, -0.12044525146484375, -0.11104965209960938, -0.101654052734375, -0.09225845336914062, -0.08286285400390625, -0.07346725463867188, -0.0640716552734375, -0.054676055908203125, -0.04528045654296875, -0.035884857177734375, -0.0264892578125, -0.017093658447265625, -0.00769805908203125, 0.001697540283203125, 0.0110931396484375, 0.020488739013671875, 0.02988433837890625, 0.039279937744140625, 0.048675537109375, 0.058071136474609375, 0.06746673583984375, 0.07686233520507812, 0.0862579345703125, 0.09565353393554688, 0.10504913330078125, 0.11444473266601562, 0.12384033203125, 0.13323593139648438, 0.14263153076171875, 0.15202713012695312, 0.1614227294921875, 0.17081832885742188, 0.18021392822265625, 0.18960952758789062, 0.199005126953125, 0.20840072631835938, 0.21779632568359375, 0.22719192504882812, 0.2365875244140625, 0.24598312377929688, 0.25537872314453125, 0.2647743225097656, 0.274169921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 2.0, 2.0, 8.0, 16.0, 14.0, 15.0, 35.0, 64.0, 128.0, 229.0, 514.0, 1166.0, 2940.0, 7705.0, 22952.0, 83436.0, 496849.0, 341062.0, 62661.0, 18326.0, 6147.0, 2404.0, 1029.0, 405.0, 209.0, 100.0, 43.0, 26.0, 15.0, 20.0, 10.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1800537109375, -0.17530250549316406, -0.17055130004882812, -0.1658000946044922, -0.16104888916015625, -0.1562976837158203, -0.15154647827148438, -0.14679527282714844, -0.1420440673828125, -0.13729286193847656, -0.13254165649414062, -0.1277904510498047, -0.12303924560546875, -0.11828804016113281, -0.11353683471679688, -0.10878562927246094, -0.104034423828125, -0.09928321838378906, -0.09453201293945312, -0.08978080749511719, -0.08502960205078125, -0.08027839660644531, -0.07552719116210938, -0.07077598571777344, -0.0660247802734375, -0.06127357482910156, -0.056522369384765625, -0.05177116394042969, -0.04701995849609375, -0.04226875305175781, -0.037517547607421875, -0.03276634216308594, -0.02801513671875, -0.023263931274414062, -0.018512725830078125, -0.013761520385742188, -0.00901031494140625, -0.0042591094970703125, 0.000492095947265625, 0.0052433013916015625, 0.0099945068359375, 0.014745712280273438, 0.019496917724609375, 0.024248123168945312, 0.02899932861328125, 0.03375053405761719, 0.038501739501953125, 0.04325294494628906, 0.048004150390625, 0.05275535583496094, 0.057506561279296875, 0.06225776672363281, 0.06700897216796875, 0.07176017761230469, 0.07651138305664062, 0.08126258850097656, 0.0860137939453125, 0.09076499938964844, 0.09551620483398438, 0.10026741027832031, 0.10501861572265625, 0.10976982116699219, 0.11452102661132812, 0.11927223205566406, 0.1240234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 9.0, 11.0, 9.0, 9.0, 14.0, 11.0, 13.0, 20.0, 32.0, 37.0, 36.0, 39.0, 57.0, 89.0, 107.0, 120.0, 73.0, 54.0, 51.0, 34.0, 27.0, 25.0, 12.0, 13.0, 9.0, 15.0, 19.0, 7.0, 10.0, 9.0, 3.0, 4.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00016450881958007812, -0.00015978701412677765, -0.00015506520867347717, -0.0001503434032201767, -0.00014562159776687622, -0.00014089979231357574, -0.00013617798686027527, -0.0001314561814069748, -0.00012673437595367432, -0.00012201257050037384, -0.00011729076504707336, -0.00011256895959377289, -0.00010784715414047241, -0.00010312534868717194, -9.840354323387146e-05, -9.368173778057098e-05, -8.895993232727051e-05, -8.423812687397003e-05, -7.951632142066956e-05, -7.479451596736908e-05, -7.00727105140686e-05, -6.535090506076813e-05, -6.062909960746765e-05, -5.5907294154167175e-05, -5.11854887008667e-05, -4.646368324756622e-05, -4.174187779426575e-05, -3.702007234096527e-05, -3.2298266887664795e-05, -2.757646143436432e-05, -2.2854655981063843e-05, -1.8132850527763367e-05, -1.341104507446289e-05, -8.689239621162415e-06, -3.9674341678619385e-06, 7.543712854385376e-07, 5.476176738739014e-06, 1.019798219203949e-05, 1.4919787645339966e-05, 1.9641593098640442e-05, 2.4363398551940918e-05, 2.9085204005241394e-05, 3.380700945854187e-05, 3.8528814911842346e-05, 4.325062036514282e-05, 4.79724258184433e-05, 5.2694231271743774e-05, 5.741603672504425e-05, 6.213784217834473e-05, 6.68596476316452e-05, 7.158145308494568e-05, 7.630325853824615e-05, 8.102506399154663e-05, 8.574686944484711e-05, 9.046867489814758e-05, 9.519048035144806e-05, 9.991228580474854e-05, 0.00010463409125804901, 0.00010935589671134949, 0.00011407770216464996, 0.00011879950761795044, 0.00012352131307125092, 0.0001282431185245514, 0.00013296492397785187, 0.00013768672943115234]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 11.0, 9.0, 15.0, 17.0, 26.0, 46.0, 78.0, 125.0, 235.0, 433.0, 1039.0, 2738.0, 8811.0, 37405.0, 318717.0, 605406.0, 55273.0, 12177.0, 3556.0, 1279.0, 550.0, 238.0, 124.0, 73.0, 38.0, 35.0, 29.0, 13.0, 14.0, 9.0, 10.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1861572265625, -0.1797637939453125, -0.173370361328125, -0.1669769287109375, -0.16058349609375, -0.1541900634765625, -0.147796630859375, -0.1414031982421875, -0.135009765625, -0.1286163330078125, -0.122222900390625, -0.1158294677734375, -0.10943603515625, -0.1030426025390625, -0.096649169921875, -0.0902557373046875, -0.0838623046875, -0.0774688720703125, -0.071075439453125, -0.0646820068359375, -0.05828857421875, -0.0518951416015625, -0.045501708984375, -0.0391082763671875, -0.03271484375, -0.0263214111328125, -0.019927978515625, -0.0135345458984375, -0.00714111328125, -0.0007476806640625, 0.005645751953125, 0.0120391845703125, 0.0184326171875, 0.0248260498046875, 0.031219482421875, 0.0376129150390625, 0.04400634765625, 0.0503997802734375, 0.056793212890625, 0.0631866455078125, 0.069580078125, 0.0759735107421875, 0.082366943359375, 0.0887603759765625, 0.09515380859375, 0.1015472412109375, 0.107940673828125, 0.1143341064453125, 0.1207275390625, 0.1271209716796875, 0.133514404296875, 0.1399078369140625, 0.14630126953125, 0.1526947021484375, 0.159088134765625, 0.1654815673828125, 0.171875, 0.1782684326171875, 0.184661865234375, 0.1910552978515625, 0.19744873046875, 0.2038421630859375, 0.210235595703125, 0.2166290283203125, 0.2230224609375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 9.0, 7.0, 5.0, 8.0, 13.0, 17.0, 27.0, 22.0, 34.0, 53.0, 50.0, 112.0, 159.0, 128.0, 97.0, 63.0, 40.0, 28.0, 24.0, 22.0, 14.0, 8.0, 11.0, 8.0, 3.0, 10.0, 2.0, 2.0, 6.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1153564453125, -0.11072349548339844, -0.10609054565429688, -0.10145759582519531, -0.09682464599609375, -0.09219169616699219, -0.08755874633789062, -0.08292579650878906, -0.0782928466796875, -0.07365989685058594, -0.06902694702148438, -0.06439399719238281, -0.05976104736328125, -0.05512809753417969, -0.050495147705078125, -0.04586219787597656, -0.041229248046875, -0.03659629821777344, -0.031963348388671875, -0.027330398559570312, -0.02269744873046875, -0.018064498901367188, -0.013431549072265625, -0.008798599243164062, -0.0041656494140625, 0.0004673004150390625, 0.005100250244140625, 0.009733200073242188, 0.01436614990234375, 0.018999099731445312, 0.023632049560546875, 0.028264999389648438, 0.03289794921875, 0.03753089904785156, 0.042163848876953125, 0.04679679870605469, 0.05142974853515625, 0.05606269836425781, 0.060695648193359375, 0.06532859802246094, 0.0699615478515625, 0.07459449768066406, 0.07922744750976562, 0.08386039733886719, 0.08849334716796875, 0.09312629699707031, 0.09775924682617188, 0.10239219665527344, 0.107025146484375, 0.11165809631347656, 0.11629104614257812, 0.12092399597167969, 0.12555694580078125, 0.1301898956298828, 0.13482284545898438, 0.13945579528808594, 0.1440887451171875, 0.14872169494628906, 0.15335464477539062, 0.1579875946044922, 0.16262054443359375, 0.1672534942626953, 0.17188644409179688, 0.17651939392089844, 0.18115234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 14.0, 10.0, 24.0, 53.0, 97.0, 146.0, 164.0, 164.0, 131.0, 78.0, 52.0, 30.0, 25.0, 8.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0489306449890137, -0.9510831236839294, -0.8532356023788452, -0.7553880214691162, -0.6575405597686768, -0.5596929788589478, -0.4618454575538635, -0.3639979362487793, -0.26615041494369507, -0.16830289363861084, -0.07045535743236542, 0.027392178773880005, 0.12523970007896423, 0.22308722138404846, 0.3209347724914551, 0.4187822937965393, 0.5166298151016235, 0.6144773364067078, 0.712324857711792, 0.810172438621521, 0.9080199003219604, 1.0058674812316895, 1.103714942932129, 1.201562523841858, 1.299410104751587, 1.397257685661316, 1.4951051473617554, 1.5929527282714844, 1.6908001899719238, 1.7886477708816528, 1.8864953517913818, 1.9843428134918213, 2.0821902751922607, 2.1800377368927, 2.2778854370117188, 2.375732898712158, 2.4735803604125977, 2.571427822113037, 2.6692755222320557, 2.767122983932495, 2.8649704456329346, 2.962817907333374, 3.0606656074523926, 3.158513069152832, 3.2563605308532715, 3.354207992553711, 3.4520556926727295, 3.549903154373169, 3.6477508544921875, 3.745598316192627, 3.8434460163116455, 3.941293478012085, 4.0391411781311035, 4.136988639831543, 4.234836101531982, 4.332683563232422, 4.430531024932861, 4.528378486633301, 4.62622594833374, 4.72407341003418, 4.821921348571777, 4.919768810272217, 5.017616271972656, 5.115463733673096, 5.213311195373535]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 6.0, 9.0, 8.0, 9.0, 14.0, 16.0, 15.0, 14.0, 21.0, 12.0, 20.0, 21.0, 26.0, 27.0, 41.0, 29.0, 30.0, 26.0, 29.0, 31.0, 36.0, 29.0, 45.0, 39.0, 39.0, 49.0, 29.0, 32.0, 35.0, 26.0, 26.0, 28.0, 22.0, 24.0, 20.0, 25.0, 17.0, 14.0, 3.0, 10.0, 7.0, 9.0, 4.0, 2.0, 6.0, 3.0, 6.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0], "bins": [-1.4185442924499512, -1.375292420387268, -1.332040548324585, -1.2887885570526123, -1.2455366849899292, -1.202284812927246, -1.159032940864563, -1.1157810688018799, -1.0725290775299072, -1.0292772054672241, -0.9860252737998962, -0.9427734017372131, -0.8995214700698853, -0.8562695980072021, -0.813017725944519, -0.7697658538818359, -0.7265139818191528, -0.6832621097564697, -0.6400101780891418, -0.5967583060264587, -0.5535063743591309, -0.5102545022964478, -0.46700263023376465, -0.42375072836875916, -0.38049882650375366, -0.33724692463874817, -0.2939950227737427, -0.25074315071105957, -0.20749124884605408, -0.16423934698104858, -0.12098747491836548, -0.07773557305335999, -0.03448367118835449, 0.008768223226070404, 0.0520201176404953, 0.0952720046043396, 0.1385239064693451, 0.18177580833435059, 0.2250276803970337, 0.2682795822620392, 0.3115314841270447, 0.35478338599205017, 0.39803528785705566, 0.44128715991973877, 0.48453906178474426, 0.5277909636497498, 0.5710428357124329, 0.6142947673797607, 0.6575466394424438, 0.700798511505127, 0.7440504431724548, 0.7873023152351379, 0.8305542469024658, 0.8738061189651489, 0.917057991027832, 0.9603098630905151, 1.0035617351531982, 1.0468136072158813, 1.0900654792785645, 1.133317470550537, 1.1765693426132202, 1.2198212146759033, 1.2630730867385864, 1.3063249588012695, 1.3495769500732422]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 4.0, 13.0, 8.0, 12.0, 35.0, 49.0, 68.0, 137.0, 214.0, 462.0, 1155.0, 3329.0, 13327.0, 115172.0, 3987153.0, 59368.0, 9199.0, 2586.0, 921.0, 462.0, 237.0, 112.0, 91.0, 40.0, 42.0, 32.0, 7.0, 12.0, 9.0, 10.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92626953125, -0.8897781372070312, -0.8532867431640625, -0.8167953491210938, -0.780303955078125, -0.7438125610351562, -0.7073211669921875, -0.6708297729492188, -0.63433837890625, -0.5978469848632812, -0.5613555908203125, -0.5248641967773438, -0.488372802734375, -0.45188140869140625, -0.4153900146484375, -0.37889862060546875, -0.3424072265625, -0.30591583251953125, -0.2694244384765625, -0.23293304443359375, -0.196441650390625, -0.15995025634765625, -0.1234588623046875, -0.08696746826171875, -0.05047607421875, -0.01398468017578125, 0.0225067138671875, 0.05899810791015625, 0.095489501953125, 0.13198089599609375, 0.1684722900390625, 0.20496368408203125, 0.241455078125, 0.27794647216796875, 0.3144378662109375, 0.35092926025390625, 0.387420654296875, 0.42391204833984375, 0.4604034423828125, 0.49689483642578125, 0.53338623046875, 0.5698776245117188, 0.6063690185546875, 0.6428604125976562, 0.679351806640625, 0.7158432006835938, 0.7523345947265625, 0.7888259887695312, 0.8253173828125, 0.8618087768554688, 0.8983001708984375, 0.9347915649414062, 0.971282958984375, 1.0077743530273438, 1.0442657470703125, 1.0807571411132812, 1.11724853515625, 1.1537399291992188, 1.1902313232421875, 1.2267227172851562, 1.263214111328125, 1.2997055053710938, 1.3361968994140625, 1.3726882934570312, 1.4091796875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 12.0, 11.0, 22.0, 50.0, 60.0, 84.0, 113.0, 105.0, 123.0, 108.0, 97.0, 76.0, 60.0, 32.0, 20.0, 13.0, 10.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2115478515625, -0.20479202270507812, -0.19803619384765625, -0.19128036499023438, -0.1845245361328125, -0.17776870727539062, -0.17101287841796875, -0.16425704956054688, -0.157501220703125, -0.15074539184570312, -0.14398956298828125, -0.13723373413085938, -0.1304779052734375, -0.12372207641601562, -0.11696624755859375, -0.11021041870117188, -0.10345458984375, -0.09669876098632812, -0.08994293212890625, -0.08318710327148438, -0.0764312744140625, -0.06967544555664062, -0.06291961669921875, -0.056163787841796875, -0.049407958984375, -0.042652130126953125, -0.03589630126953125, -0.029140472412109375, -0.0223846435546875, -0.015628814697265625, -0.00887298583984375, -0.002117156982421875, 0.004638671875, 0.011394500732421875, 0.01815032958984375, 0.024906158447265625, 0.0316619873046875, 0.038417816162109375, 0.04517364501953125, 0.051929473876953125, 0.058685302734375, 0.06544113159179688, 0.07219696044921875, 0.07895278930664062, 0.0857086181640625, 0.09246444702148438, 0.09922027587890625, 0.10597610473632812, 0.11273193359375, 0.11948776245117188, 0.12624359130859375, 0.13299942016601562, 0.1397552490234375, 0.14651107788085938, 0.15326690673828125, 0.16002273559570312, 0.166778564453125, 0.17353439331054688, 0.18029022216796875, 0.18704605102539062, 0.1938018798828125, 0.20055770874023438, 0.20731353759765625, 0.21406936645507812, 0.2208251953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 15.0, 29.0, 49.0, 149.0, 314.0, 899.0, 2592.0, 8713.0, 49779.0, 3769192.0, 331935.0, 22727.0, 5182.0, 1699.0, 576.0, 259.0, 101.0, 43.0, 18.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.7800521850585938, -0.7519989013671875, -0.7239456176757812, -0.695892333984375, -0.6678390502929688, -0.6397857666015625, -0.6117324829101562, -0.58367919921875, -0.5556259155273438, -0.5275726318359375, -0.49951934814453125, -0.471466064453125, -0.44341278076171875, -0.4153594970703125, -0.38730621337890625, -0.3592529296875, -0.33119964599609375, -0.3031463623046875, -0.27509307861328125, -0.247039794921875, -0.21898651123046875, -0.1909332275390625, -0.16287994384765625, -0.13482666015625, -0.10677337646484375, -0.0787200927734375, -0.05066680908203125, -0.022613525390625, 0.00543975830078125, 0.0334930419921875, 0.06154632568359375, 0.089599609375, 0.11765289306640625, 0.1457061767578125, 0.17375946044921875, 0.201812744140625, 0.22986602783203125, 0.2579193115234375, 0.28597259521484375, 0.31402587890625, 0.34207916259765625, 0.3701324462890625, 0.39818572998046875, 0.426239013671875, 0.45429229736328125, 0.4823455810546875, 0.5103988647460938, 0.5384521484375, 0.5665054321289062, 0.5945587158203125, 0.6226119995117188, 0.650665283203125, 0.6787185668945312, 0.7067718505859375, 0.7348251342773438, 0.76287841796875, 0.7909317016601562, 0.8189849853515625, 0.8470382690429688, 0.875091552734375, 0.9031448364257812, 0.9311981201171875, 0.9592514038085938, 0.9873046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 5.0, 3.0, 4.0, 10.0, 10.0, 9.0, 12.0, 24.0, 45.0, 57.0, 103.0, 254.0, 2067.0, 945.0, 226.0, 104.0, 63.0, 41.0, 23.0, 20.0, 16.0, 2.0, 10.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218017578125, -0.21072006225585938, -0.20342254638671875, -0.19612503051757812, -0.1888275146484375, -0.18152999877929688, -0.17423248291015625, -0.16693496704101562, -0.159637451171875, -0.15233993530273438, -0.14504241943359375, -0.13774490356445312, -0.1304473876953125, -0.12314987182617188, -0.11585235595703125, -0.10855484008789062, -0.10125732421875, -0.09395980834960938, -0.08666229248046875, -0.07936477661132812, -0.0720672607421875, -0.06476974487304688, -0.05747222900390625, -0.050174713134765625, -0.042877197265625, -0.035579681396484375, -0.02828216552734375, -0.020984649658203125, -0.0136871337890625, -0.006389617919921875, 0.00090789794921875, 0.008205413818359375, 0.0155029296875, 0.022800445556640625, 0.03009796142578125, 0.037395477294921875, 0.0446929931640625, 0.051990509033203125, 0.05928802490234375, 0.06658554077148438, 0.073883056640625, 0.08118057250976562, 0.08847808837890625, 0.09577560424804688, 0.1030731201171875, 0.11037063598632812, 0.11766815185546875, 0.12496566772460938, 0.13226318359375, 0.13956069946289062, 0.14685821533203125, 0.15415573120117188, 0.1614532470703125, 0.16875076293945312, 0.17604827880859375, 0.18334579467773438, 0.190643310546875, 0.19794082641601562, 0.20523834228515625, 0.21253585815429688, 0.2198333740234375, 0.22713088989257812, 0.23442840576171875, 0.24172592163085938, 0.2490234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 10.0, 47.0, 223.0, 443.0, 224.0, 41.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.302762508392334, -4.188028335571289, -4.073294162750244, -3.958559989929199, -3.8438258171081543, -3.7290916442871094, -3.6143572330474854, -3.4996230602264404, -3.3848888874053955, -3.2701547145843506, -3.1554205417633057, -3.0406863689422607, -2.9259519577026367, -2.811217784881592, -2.696483612060547, -2.581749439239502, -2.467015266418457, -2.352281093597412, -2.237546920776367, -2.1228127479553223, -2.0080785751342773, -1.8933442831039429, -1.7786099910736084, -1.6638758182525635, -1.5491416454315186, -1.4344074726104736, -1.3196732997894287, -1.2049390077590942, -1.0902048349380493, -0.9754706621170044, -0.8607364296913147, -0.746002197265625, -0.6312682628631592, -0.5165340900421143, -0.40179985761642456, -0.28706565499305725, -0.17233145236968994, -0.05759727954864502, 0.05713695287704468, 0.17187118530273438, 0.2866053581237793, 0.4013395607471466, 0.5160737633705139, 0.6308079957962036, 0.7455421686172485, 0.8602763414382935, 0.9750105738639832, 1.0897448062896729, 1.2044789791107178, 1.3192131519317627, 1.4339473247528076, 1.548681616783142, 1.663415789604187, 1.778149962425232, 1.8928842544555664, 2.0076184272766113, 2.1223526000976562, 2.237086772918701, 2.351820945739746, 2.466555118560791, 2.581289291381836, 2.696023464202881, 2.810757875442505, 2.92549204826355, 3.0402262210845947]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 2.0, 9.0, 18.0, 27.0, 31.0, 45.0, 49.0, 57.0, 77.0, 79.0, 89.0, 67.0, 58.0, 61.0, 74.0, 75.0, 55.0, 41.0, 33.0, 18.0, 19.0, 9.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.2582192420959473, -1.2260786294937134, -1.1939380168914795, -1.161797285079956, -1.1296566724777222, -1.0975160598754883, -1.0653754472732544, -1.0332348346710205, -1.001094102859497, -0.9689534902572632, -0.9368128180503845, -0.9046722054481506, -0.872531533241272, -0.8403909206390381, -0.8082503080368042, -0.7761096954345703, -0.7439690828323364, -0.7118284702301025, -0.6796877980232239, -0.64754718542099, -0.6154065132141113, -0.5832659006118774, -0.5511252880096436, -0.5189846754074097, -0.486844003200531, -0.45470336079597473, -0.42256271839141846, -0.39042210578918457, -0.3582814633846283, -0.326140820980072, -0.29400020837783813, -0.26185956597328186, -0.22971880435943604, -0.19757816195487976, -0.16543753445148468, -0.1332969069480896, -0.10115626454353333, -0.06901562213897705, -0.03687499463558197, -0.00473436713218689, 0.027406275272369385, 0.05954691022634506, 0.09168754518032074, 0.12382818013429642, 0.1559688150882721, 0.18810945749282837, 0.22025008499622345, 0.25239071249961853, 0.2845313549041748, 0.3166719973087311, 0.34881263971328735, 0.38095325231552124, 0.4130938947200775, 0.4452345371246338, 0.4773751497268677, 0.5095157623291016, 0.5416564345359802, 0.5737970471382141, 0.6059377193450928, 0.6380783319473267, 0.6702189445495605, 0.7023596167564392, 0.7345002293586731, 0.7666409015655518, 0.7987815141677856]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 12.0, 19.0, 27.0, 48.0, 91.0, 138.0, 256.0, 514.0, 1115.0, 2530.0, 7928.0, 40237.0, 316502.0, 569118.0, 89176.0, 14120.0, 3804.0, 1433.0, 683.0, 340.0, 167.0, 109.0, 57.0, 36.0, 32.0, 19.0, 7.0, 6.0, 12.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82666015625, -0.8017578125, -0.77685546875, -0.751953125, -0.72705078125, -0.7021484375, -0.67724609375, -0.65234375, -0.62744140625, -0.6025390625, -0.57763671875, -0.552734375, -0.52783203125, -0.5029296875, -0.47802734375, -0.453125, -0.42822265625, -0.4033203125, -0.37841796875, -0.353515625, -0.32861328125, -0.3037109375, -0.27880859375, -0.25390625, -0.22900390625, -0.2041015625, -0.17919921875, -0.154296875, -0.12939453125, -0.1044921875, -0.07958984375, -0.0546875, -0.02978515625, -0.0048828125, 0.02001953125, 0.044921875, 0.06982421875, 0.0947265625, 0.11962890625, 0.14453125, 0.16943359375, 0.1943359375, 0.21923828125, 0.244140625, 0.26904296875, 0.2939453125, 0.31884765625, 0.34375, 0.36865234375, 0.3935546875, 0.41845703125, 0.443359375, 0.46826171875, 0.4931640625, 0.51806640625, 0.54296875, 0.56787109375, 0.5927734375, 0.61767578125, 0.642578125, 0.66748046875, 0.6923828125, 0.71728515625, 0.7421875, 0.76708984375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 11.0, 21.0, 27.0, 66.0, 69.0, 124.0, 103.0, 122.0, 110.0, 98.0, 96.0, 59.0, 33.0, 25.0, 19.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2183837890625, -0.21126556396484375, -0.2041473388671875, -0.19702911376953125, -0.189910888671875, -0.18279266357421875, -0.1756744384765625, -0.16855621337890625, -0.16143798828125, -0.15431976318359375, -0.1472015380859375, -0.14008331298828125, -0.132965087890625, -0.12584686279296875, -0.1187286376953125, -0.11161041259765625, -0.1044921875, -0.09737396240234375, -0.0902557373046875, -0.08313751220703125, -0.076019287109375, -0.06890106201171875, -0.0617828369140625, -0.05466461181640625, -0.04754638671875, -0.04042816162109375, -0.0333099365234375, -0.02619171142578125, -0.019073486328125, -0.01195526123046875, -0.0048370361328125, 0.00228118896484375, 0.0093994140625, 0.01651763916015625, 0.0236358642578125, 0.03075408935546875, 0.037872314453125, 0.04499053955078125, 0.0521087646484375, 0.05922698974609375, 0.06634521484375, 0.07346343994140625, 0.0805816650390625, 0.08769989013671875, 0.094818115234375, 0.10193634033203125, 0.1090545654296875, 0.11617279052734375, 0.123291015625, 0.13040924072265625, 0.1375274658203125, 0.14464569091796875, 0.151763916015625, 0.15888214111328125, 0.1660003662109375, 0.17311859130859375, 0.18023681640625, 0.18735504150390625, 0.1944732666015625, 0.20159149169921875, 0.208709716796875, 0.21582794189453125, 0.2229461669921875, 0.23006439208984375, 0.2371826171875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 2.0, 2.0, 11.0, 16.0, 21.0, 30.0, 26.0, 62.0, 94.0, 172.0, 284.0, 538.0, 1069.0, 2526.0, 6962.0, 24666.0, 111126.0, 442495.0, 351861.0, 78630.0, 18546.0, 5367.0, 2085.0, 906.0, 427.0, 241.0, 142.0, 78.0, 54.0, 38.0, 26.0, 14.0, 14.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.59375, -0.5788650512695312, -0.5639801025390625, -0.5490951538085938, -0.534210205078125, -0.5193252563476562, -0.5044403076171875, -0.48955535888671875, -0.47467041015625, -0.45978546142578125, -0.4449005126953125, -0.43001556396484375, -0.415130615234375, -0.40024566650390625, -0.3853607177734375, -0.37047576904296875, -0.3555908203125, -0.34070587158203125, -0.3258209228515625, -0.31093597412109375, -0.296051025390625, -0.28116607666015625, -0.2662811279296875, -0.25139617919921875, -0.23651123046875, -0.22162628173828125, -0.2067413330078125, -0.19185638427734375, -0.176971435546875, -0.16208648681640625, -0.1472015380859375, -0.13231658935546875, -0.117431640625, -0.10254669189453125, -0.0876617431640625, -0.07277679443359375, -0.057891845703125, -0.04300689697265625, -0.0281219482421875, -0.01323699951171875, 0.00164794921875, 0.01653289794921875, 0.0314178466796875, 0.04630279541015625, 0.061187744140625, 0.07607269287109375, 0.0909576416015625, 0.10584259033203125, 0.1207275390625, 0.13561248779296875, 0.1504974365234375, 0.16538238525390625, 0.180267333984375, 0.19515228271484375, 0.2100372314453125, 0.22492218017578125, 0.23980712890625, 0.25469207763671875, 0.2695770263671875, 0.28446197509765625, 0.299346923828125, 0.31423187255859375, 0.3291168212890625, 0.34400177001953125, 0.35888671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 12.0, 11.0, 15.0, 14.0, 16.0, 19.0, 24.0, 20.0, 24.0, 29.0, 39.0, 38.0, 61.0, 58.0, 50.0, 50.0, 54.0, 44.0, 42.0, 50.0, 53.0, 46.0, 30.0, 39.0, 29.0, 18.0, 25.0, 16.0, 14.0, 7.0, 5.0, 9.0, 6.0, 5.0, 7.0, 3.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.5322265625, -0.5175857543945312, -0.5029449462890625, -0.48830413818359375, -0.473663330078125, -0.45902252197265625, -0.4443817138671875, -0.42974090576171875, -0.41510009765625, -0.40045928955078125, -0.3858184814453125, -0.37117767333984375, -0.356536865234375, -0.34189605712890625, -0.3272552490234375, -0.31261444091796875, -0.2979736328125, -0.28333282470703125, -0.2686920166015625, -0.25405120849609375, -0.239410400390625, -0.22476959228515625, -0.2101287841796875, -0.19548797607421875, -0.18084716796875, -0.16620635986328125, -0.1515655517578125, -0.13692474365234375, -0.122283935546875, -0.10764312744140625, -0.0930023193359375, -0.07836151123046875, -0.063720703125, -0.04907989501953125, -0.0344390869140625, -0.01979827880859375, -0.005157470703125, 0.00948333740234375, 0.0241241455078125, 0.03876495361328125, 0.05340576171875, 0.06804656982421875, 0.0826873779296875, 0.09732818603515625, 0.111968994140625, 0.12660980224609375, 0.1412506103515625, 0.15589141845703125, 0.1705322265625, 0.18517303466796875, 0.1998138427734375, 0.21445465087890625, 0.229095458984375, 0.24373626708984375, 0.2583770751953125, 0.27301788330078125, 0.28765869140625, 0.30229949951171875, 0.3169403076171875, 0.33158111572265625, 0.346221923828125, 0.36086273193359375, 0.3755035400390625, 0.39014434814453125, 0.40478515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 9.0, 16.0, 20.0, 34.0, 67.0, 93.0, 190.0, 321.0, 600.0, 1100.0, 2270.0, 5515.0, 21053.0, 226973.0, 731310.0, 44129.0, 8691.0, 3044.0, 1433.0, 713.0, 383.0, 249.0, 142.0, 80.0, 41.0, 26.0, 22.0, 11.0, 4.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51611328125, -0.5005645751953125, -0.485015869140625, -0.4694671630859375, -0.45391845703125, -0.4383697509765625, -0.422821044921875, -0.4072723388671875, -0.3917236328125, -0.3761749267578125, -0.360626220703125, -0.3450775146484375, -0.32952880859375, -0.3139801025390625, -0.298431396484375, -0.2828826904296875, -0.267333984375, -0.2517852783203125, -0.236236572265625, -0.2206878662109375, -0.20513916015625, -0.1895904541015625, -0.174041748046875, -0.1584930419921875, -0.1429443359375, -0.1273956298828125, -0.111846923828125, -0.0962982177734375, -0.08074951171875, -0.0652008056640625, -0.049652099609375, -0.0341033935546875, -0.0185546875, -0.0030059814453125, 0.012542724609375, 0.0280914306640625, 0.04364013671875, 0.0591888427734375, 0.074737548828125, 0.0902862548828125, 0.1058349609375, 0.1213836669921875, 0.136932373046875, 0.1524810791015625, 0.16802978515625, 0.1835784912109375, 0.199127197265625, 0.2146759033203125, 0.230224609375, 0.2457733154296875, 0.261322021484375, 0.2768707275390625, 0.29241943359375, 0.3079681396484375, 0.323516845703125, 0.3390655517578125, 0.3546142578125, 0.3701629638671875, 0.385711669921875, 0.4012603759765625, 0.41680908203125, 0.4323577880859375, 0.447906494140625, 0.4634552001953125, 0.47900390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 6.0, 8.0, 12.0, 14.0, 22.0, 29.0, 37.0, 37.0, 38.0, 60.0, 95.0, 128.0, 125.0, 82.0, 59.0, 47.0, 40.0, 26.0, 21.0, 20.0, 14.0, 18.0, 14.0, 6.0, 3.0, 3.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018084049224853516, -0.00017577968537807465, -0.00017071887850761414, -0.00016565807163715363, -0.00016059726476669312, -0.0001555364578962326, -0.0001504756510257721, -0.00014541484415531158, -0.00014035403728485107, -0.00013529323041439056, -0.00013023242354393005, -0.00012517161667346954, -0.00012011080980300903, -0.00011505000293254852, -0.00010998919606208801, -0.0001049283891916275, -9.986758232116699e-05, -9.480677545070648e-05, -8.974596858024597e-05, -8.468516170978546e-05, -7.962435483932495e-05, -7.456354796886444e-05, -6.950274109840393e-05, -6.444193422794342e-05, -5.938112735748291e-05, -5.43203204870224e-05, -4.925951361656189e-05, -4.419870674610138e-05, -3.913789987564087e-05, -3.407709300518036e-05, -2.901628613471985e-05, -2.395547926425934e-05, -1.8894672393798828e-05, -1.3833865523338318e-05, -8.773058652877808e-06, -3.7122517824172974e-06, 1.3485550880432129e-06, 6.409361958503723e-06, 1.1470168828964233e-05, 1.6530975699424744e-05, 2.1591782569885254e-05, 2.6652589440345764e-05, 3.1713396310806274e-05, 3.6774203181266785e-05, 4.1835010051727295e-05, 4.6895816922187805e-05, 5.1956623792648315e-05, 5.7017430663108826e-05, 6.207823753356934e-05, 6.713904440402985e-05, 7.219985127449036e-05, 7.726065814495087e-05, 8.232146501541138e-05, 8.738227188587189e-05, 9.24430787563324e-05, 9.750388562679291e-05, 0.00010256469249725342, 0.00010762549936771393, 0.00011268630623817444, 0.00011774711310863495, 0.00012280791997909546, 0.00012786872684955597, 0.00013292953372001648, 0.000137990340590477, 0.0001430511474609375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 4.0, 6.0, 12.0, 39.0, 78.0, 294.0, 1586.0, 22131.0, 997571.0, 24661.0, 1675.0, 312.0, 101.0, 22.0, 18.0, 12.0, 5.0, 6.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.0687103271484375, -1.025115966796875, -0.9815216064453125, -0.93792724609375, -0.8943328857421875, -0.850738525390625, -0.8071441650390625, -0.7635498046875, -0.7199554443359375, -0.676361083984375, -0.6327667236328125, -0.58917236328125, -0.5455780029296875, -0.501983642578125, -0.4583892822265625, -0.414794921875, -0.3712005615234375, -0.327606201171875, -0.2840118408203125, -0.24041748046875, -0.1968231201171875, -0.153228759765625, -0.1096343994140625, -0.0660400390625, -0.0224456787109375, 0.021148681640625, 0.0647430419921875, 0.10833740234375, 0.1519317626953125, 0.195526123046875, 0.2391204833984375, 0.28271484375, 0.3263092041015625, 0.369903564453125, 0.4134979248046875, 0.45709228515625, 0.5006866455078125, 0.544281005859375, 0.5878753662109375, 0.6314697265625, 0.6750640869140625, 0.718658447265625, 0.7622528076171875, 0.80584716796875, 0.8494415283203125, 0.893035888671875, 0.9366302490234375, 0.980224609375, 1.0238189697265625, 1.067413330078125, 1.1110076904296875, 1.15460205078125, 1.1981964111328125, 1.241790771484375, 1.2853851318359375, 1.3289794921875, 1.3725738525390625, 1.416168212890625, 1.4597625732421875, 1.50335693359375, 1.5469512939453125, 1.590545654296875, 1.6341400146484375, 1.677734375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 8.0, 18.0, 21.0, 43.0, 92.0, 130.0, 224.0, 216.0, 93.0, 51.0, 32.0, 13.0, 13.0, 7.0, 9.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67578125, -0.6563034057617188, -0.6368255615234375, -0.6173477172851562, -0.597869873046875, -0.5783920288085938, -0.5589141845703125, -0.5394363403320312, -0.51995849609375, -0.5004806518554688, -0.4810028076171875, -0.46152496337890625, -0.442047119140625, -0.42256927490234375, -0.4030914306640625, -0.38361358642578125, -0.3641357421875, -0.34465789794921875, -0.3251800537109375, -0.30570220947265625, -0.286224365234375, -0.26674652099609375, -0.2472686767578125, -0.22779083251953125, -0.20831298828125, -0.18883514404296875, -0.1693572998046875, -0.14987945556640625, -0.130401611328125, -0.11092376708984375, -0.0914459228515625, -0.07196807861328125, -0.052490234375, -0.03301239013671875, -0.0135345458984375, 0.00594329833984375, 0.025421142578125, 0.04489898681640625, 0.0643768310546875, 0.08385467529296875, 0.10333251953125, 0.12281036376953125, 0.1422882080078125, 0.16176605224609375, 0.181243896484375, 0.20072174072265625, 0.2201995849609375, 0.23967742919921875, 0.2591552734375, 0.27863311767578125, 0.2981109619140625, 0.31758880615234375, 0.337066650390625, 0.35654449462890625, 0.3760223388671875, 0.39550018310546875, 0.41497802734375, 0.43445587158203125, 0.4539337158203125, 0.47341156005859375, 0.492889404296875, 0.5123672485351562, 0.5318450927734375, 0.5513229370117188, 0.57080078125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 18.0, 64.0, 170.0, 339.0, 263.0, 110.0, 28.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.45939826965332, -9.105244636535645, -8.751090049743652, -8.396936416625977, -8.0427827835083, -7.688628673553467, -7.334474563598633, -6.980320930480957, -6.626167297363281, -6.272013187408447, -5.9178595542907715, -5.5637054443359375, -5.209551811218262, -4.855397701263428, -4.501243591308594, -4.147089958190918, -3.792935848236084, -3.438781976699829, -3.084628105163574, -2.7304739952087402, -2.3763203620910645, -2.0221662521362305, -1.6680123805999756, -1.3138585090637207, -0.9597046375274658, -0.6055507659912109, -0.2513968348503113, 0.10275709629058838, 0.45691096782684326, 0.8110648393630981, 1.1652188301086426, 1.5193727016448975, 1.8735265731811523, 2.2276804447174072, 2.581834316253662, 2.935988426208496, 3.290142059326172, 3.644296169281006, 3.9984500408172607, 4.352603912353516, 4.706757545471191, 5.060911655426025, 5.415065288543701, 5.769219398498535, 6.123373031616211, 6.477527141571045, 6.831681251525879, 7.185834884643555, 7.539988994598389, 7.894143104553223, 8.248296737670898, 8.602450370788574, 8.956604957580566, 9.310758590698242, 9.664912223815918, 10.019065856933594, 10.373220443725586, 10.727374076843262, 11.081528663635254, 11.43568229675293, 11.789835929870605, 12.143989562988281, 12.498144149780273, 12.85229778289795, 13.206451416015625]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 6.0, 5.0, 11.0, 10.0, 14.0, 17.0, 20.0, 21.0, 24.0, 25.0, 34.0, 25.0, 36.0, 55.0, 31.0, 47.0, 53.0, 44.0, 48.0, 57.0, 50.0, 32.0, 37.0, 34.0, 38.0, 29.0, 25.0, 29.0, 16.0, 27.0, 22.0, 16.0, 11.0, 7.0, 10.0, 9.0, 8.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.656383514404297, -2.5737974643707275, -2.491211414337158, -2.408625364303589, -2.3260393142700195, -2.24345326423645, -2.160867214202881, -2.0782811641693115, -1.9956951141357422, -1.9131090641021729, -1.8305230140686035, -1.7479369640350342, -1.6653509140014648, -1.5827648639678955, -1.5001788139343262, -1.4175927639007568, -1.335006833076477, -1.2524207830429077, -1.1698347330093384, -1.087248682975769, -1.0046626329421997, -0.9220765829086304, -0.8394905924797058, -0.7569045424461365, -0.6743184924125671, -0.5917324423789978, -0.5091463923454285, -0.4265603721141815, -0.3439743220806122, -0.26138827204704285, -0.1788022518157959, -0.09621620178222656, -0.013630151748657227, 0.06895589083433151, 0.15154193341732025, 0.2341279685497284, 0.31671401858329773, 0.39930006861686707, 0.481886088848114, 0.5644721388816833, 0.6470581889152527, 0.729644238948822, 0.8122302889823914, 0.8948162794113159, 0.9774023294448853, 1.0599883794784546, 1.142574429512024, 1.2251604795455933, 1.3077465295791626, 1.390332579612732, 1.4729186296463013, 1.5555046796798706, 1.63809072971344, 1.7206767797470093, 1.803262710571289, 1.8858487606048584, 1.9684348106384277, 2.051020860671997, 2.1336069107055664, 2.2161929607391357, 2.298779010772705, 2.3813650608062744, 2.4639511108398438, 2.546537160873413, 2.6291232109069824]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 5.0, 5.0, 4.0, 10.0, 12.0, 11.0, 14.0, 21.0, 30.0, 43.0, 62.0, 82.0, 158.0, 228.0, 453.0, 743.0, 1506.0, 3103.0, 6959.0, 18541.0, 67397.0, 972181.0, 3001107.0, 84466.0, 21808.0, 7904.0, 3448.0, 1697.0, 869.0, 504.0, 309.0, 193.0, 111.0, 79.0, 64.0, 51.0, 32.0, 18.0, 13.0, 6.0, 7.0, 8.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.64501953125, -0.6242599487304688, -0.6035003662109375, -0.5827407836914062, -0.561981201171875, -0.5412216186523438, -0.5204620361328125, -0.49970245361328125, -0.47894287109375, -0.45818328857421875, -0.4374237060546875, -0.41666412353515625, -0.395904541015625, -0.37514495849609375, -0.3543853759765625, -0.33362579345703125, -0.3128662109375, -0.29210662841796875, -0.2713470458984375, -0.25058746337890625, -0.229827880859375, -0.20906829833984375, -0.1883087158203125, -0.16754913330078125, -0.14678955078125, -0.12602996826171875, -0.1052703857421875, -0.08451080322265625, -0.063751220703125, -0.04299163818359375, -0.0222320556640625, -0.00147247314453125, 0.019287109375, 0.04004669189453125, 0.0608062744140625, 0.08156585693359375, 0.102325439453125, 0.12308502197265625, 0.1438446044921875, 0.16460418701171875, 0.18536376953125, 0.20612335205078125, 0.2268829345703125, 0.24764251708984375, 0.268402099609375, 0.28916168212890625, 0.3099212646484375, 0.33068084716796875, 0.3514404296875, 0.37220001220703125, 0.3929595947265625, 0.41371917724609375, 0.434478759765625, 0.45523834228515625, 0.4759979248046875, 0.49675750732421875, 0.51751708984375, 0.5382766723632812, 0.5590362548828125, 0.5797958374023438, 0.600555419921875, 0.6213150024414062, 0.6420745849609375, 0.6628341674804688, 0.68359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 8.0, 11.0, 20.0, 27.0, 39.0, 67.0, 92.0, 90.0, 105.0, 97.0, 110.0, 97.0, 71.0, 59.0, 47.0, 22.0, 21.0, 10.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243408203125, -0.23590469360351562, -0.22840118408203125, -0.22089767456054688, -0.2133941650390625, -0.20589065551757812, -0.19838714599609375, -0.19088363647460938, -0.183380126953125, -0.17587661743164062, -0.16837310791015625, -0.16086959838867188, -0.1533660888671875, -0.14586257934570312, -0.13835906982421875, -0.13085556030273438, -0.12335205078125, -0.11584854125976562, -0.10834503173828125, -0.10084152221679688, -0.0933380126953125, -0.08583450317382812, -0.07833099365234375, -0.07082748413085938, -0.063323974609375, -0.055820465087890625, -0.04831695556640625, -0.040813446044921875, -0.0333099365234375, -0.025806427001953125, -0.01830291748046875, -0.010799407958984375, -0.0032958984375, 0.004207611083984375, 0.01171112060546875, 0.019214630126953125, 0.0267181396484375, 0.034221649169921875, 0.04172515869140625, 0.049228668212890625, 0.056732177734375, 0.06423568725585938, 0.07173919677734375, 0.07924270629882812, 0.0867462158203125, 0.09424972534179688, 0.10175323486328125, 0.10925674438476562, 0.11676025390625, 0.12426376342773438, 0.13176727294921875, 0.13927078247070312, 0.1467742919921875, 0.15427780151367188, 0.16178131103515625, 0.16928482055664062, 0.176788330078125, 0.18429183959960938, 0.19179534912109375, 0.19929885864257812, 0.2068023681640625, 0.21430587768554688, 0.22180938720703125, 0.22931289672851562, 0.23681640625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 12.0, 13.0, 33.0, 72.0, 199.0, 504.0, 1481.0, 6229.0, 37971.0, 3392088.0, 722060.0, 27021.0, 4654.0, 1265.0, 413.0, 154.0, 65.0, 18.0, 17.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21484375, -1.1742401123046875, -1.133636474609375, -1.0930328369140625, -1.05242919921875, -1.0118255615234375, -0.971221923828125, -0.9306182861328125, -0.8900146484375, -0.8494110107421875, -0.808807373046875, -0.7682037353515625, -0.72760009765625, -0.6869964599609375, -0.646392822265625, -0.6057891845703125, -0.565185546875, -0.5245819091796875, -0.483978271484375, -0.4433746337890625, -0.40277099609375, -0.3621673583984375, -0.321563720703125, -0.2809600830078125, -0.2403564453125, -0.1997528076171875, -0.159149169921875, -0.1185455322265625, -0.07794189453125, -0.0373382568359375, 0.003265380859375, 0.0438690185546875, 0.08447265625, 0.1250762939453125, 0.165679931640625, 0.2062835693359375, 0.24688720703125, 0.2874908447265625, 0.328094482421875, 0.3686981201171875, 0.4093017578125, 0.4499053955078125, 0.490509033203125, 0.5311126708984375, 0.57171630859375, 0.6123199462890625, 0.652923583984375, 0.6935272216796875, 0.734130859375, 0.7747344970703125, 0.815338134765625, 0.8559417724609375, 0.89654541015625, 0.9371490478515625, 0.977752685546875, 1.0183563232421875, 1.0589599609375, 1.0995635986328125, 1.140167236328125, 1.1807708740234375, 1.22137451171875, 1.2619781494140625, 1.302581787109375, 1.3431854248046875, 1.3837890625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 5.0, 4.0, 4.0, 7.0, 5.0, 13.0, 24.0, 31.0, 53.0, 65.0, 102.0, 221.0, 1093.0, 1825.0, 283.0, 107.0, 75.0, 40.0, 35.0, 16.0, 13.0, 16.0, 5.0, 4.0, 5.0, 5.0, 7.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33984375, -0.3272895812988281, -0.31473541259765625, -0.3021812438964844, -0.2896270751953125, -0.2770729064941406, -0.26451873779296875, -0.2519645690917969, -0.239410400390625, -0.22685623168945312, -0.21430206298828125, -0.20174789428710938, -0.1891937255859375, -0.17663955688476562, -0.16408538818359375, -0.15153121948242188, -0.13897705078125, -0.12642288208007812, -0.11386871337890625, -0.10131454467773438, -0.0887603759765625, -0.07620620727539062, -0.06365203857421875, -0.051097869873046875, -0.038543701171875, -0.025989532470703125, -0.01343536376953125, -0.000881195068359375, 0.0116729736328125, 0.024227142333984375, 0.03678131103515625, 0.049335479736328125, 0.0618896484375, 0.07444381713867188, 0.08699798583984375, 0.09955215454101562, 0.1121063232421875, 0.12466049194335938, 0.13721466064453125, 0.14976882934570312, 0.162322998046875, 0.17487716674804688, 0.18743133544921875, 0.19998550415039062, 0.2125396728515625, 0.22509384155273438, 0.23764801025390625, 0.2502021789550781, 0.26275634765625, 0.2753105163574219, 0.28786468505859375, 0.3004188537597656, 0.3129730224609375, 0.3255271911621094, 0.33808135986328125, 0.3506355285644531, 0.363189697265625, 0.3757438659667969, 0.38829803466796875, 0.4008522033691406, 0.4134063720703125, 0.4259605407714844, 0.43851470947265625, 0.4510688781738281, 0.463623046875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 19.0, 34.0, 86.0, 191.0, 224.0, 225.0, 115.0, 51.0, 34.0, 19.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3231747150421143, -3.218048572540283, -3.112922191619873, -3.007796049118042, -2.902669668197632, -2.797543525695801, -2.6924171447753906, -2.5872910022735596, -2.4821648597717285, -2.3770387172698975, -2.2719123363494873, -2.1667861938476562, -2.061659812927246, -1.956533670425415, -1.8514074087142944, -1.7462811470031738, -1.6411547660827637, -1.536028504371643, -1.4309022426605225, -1.3257761001586914, -1.2206497192382812, -1.1155235767364502, -1.0103973150253296, -0.905271053314209, -0.8001447916030884, -0.6950185298919678, -0.5898922681808472, -0.48476606607437134, -0.37963980436325073, -0.2745135426521301, -0.1693873405456543, -0.06426107883453369, 0.040865421295166016, 0.14599166810512543, 0.25111791491508484, 0.35624414682388306, 0.46137040853500366, 0.5664966702461243, 0.6716228723526001, 0.7767491340637207, 0.8818753957748413, 0.9870016574859619, 1.0921279191970825, 1.1972541809082031, 1.3023803234100342, 1.4075067043304443, 1.5126328468322754, 1.617759108543396, 1.7228853702545166, 1.8280116319656372, 1.9331378936767578, 2.038264036178589, 2.143390417098999, 2.24851655960083, 2.3536429405212402, 2.4587690830230713, 2.5638952255249023, 2.6690213680267334, 2.7741477489471436, 2.8792738914489746, 2.9844002723693848, 3.089526414871216, 3.194652557373047, 3.299778938293457, 3.404905319213867]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 10.0, 7.0, 6.0, 22.0, 30.0, 40.0, 39.0, 47.0, 67.0, 66.0, 71.0, 64.0, 73.0, 83.0, 62.0, 55.0, 48.0, 48.0, 42.0, 29.0, 28.0, 18.0, 20.0, 13.0, 8.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.770959734916687, -1.7147836685180664, -1.6586076021194458, -1.6024315357208252, -1.5462554693222046, -1.490079402923584, -1.4339032173156738, -1.3777271509170532, -1.3215510845184326, -1.265375018119812, -1.2091989517211914, -1.1530228853225708, -1.0968468189239502, -1.04067063331604, -0.9844946265220642, -0.9283185005187988, -0.872142493724823, -0.8159664273262024, -0.7597903609275818, -0.7036142349243164, -0.6474381685256958, -0.5912621021270752, -0.5350860357284546, -0.4789099395275116, -0.422733873128891, -0.3665578067302704, -0.3103817105293274, -0.2542056441307068, -0.198029562830925, -0.1418534815311432, -0.08567741513252258, -0.02950131893157959, 0.026674747467041016, 0.08285082876682281, 0.13902691006660461, 0.19520297646522522, 0.2513790726661682, 0.3075551390647888, 0.3637312054634094, 0.4199073016643524, 0.476083368062973, 0.532259464263916, 0.5884355306625366, 0.6446115970611572, 0.7007876634597778, 0.7569637298583984, 0.813139796257019, 0.8693159222602844, 0.925491988658905, 0.9816680550575256, 1.037844181060791, 1.0940202474594116, 1.1501963138580322, 1.2063723802566528, 1.2625484466552734, 1.318724513053894, 1.3749005794525146, 1.4310766458511353, 1.4872527122497559, 1.5434287786483765, 1.599604845046997, 1.6557810306549072, 1.7119569778442383, 1.7681331634521484, 1.824309229850769]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 8.0, 14.0, 14.0, 40.0, 55.0, 78.0, 150.0, 240.0, 443.0, 839.0, 1832.0, 4399.0, 11926.0, 36931.0, 121726.0, 325676.0, 344572.0, 136771.0, 40782.0, 13277.0, 4790.0, 1928.0, 942.0, 465.0, 249.0, 149.0, 94.0, 53.0, 34.0, 28.0, 20.0, 6.0, 6.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.523590087890625, -0.50616455078125, -0.488739013671875, -0.4713134765625, -0.453887939453125, -0.43646240234375, -0.419036865234375, -0.401611328125, -0.384185791015625, -0.36676025390625, -0.349334716796875, -0.3319091796875, -0.314483642578125, -0.29705810546875, -0.279632568359375, -0.26220703125, -0.244781494140625, -0.22735595703125, -0.209930419921875, -0.1925048828125, -0.175079345703125, -0.15765380859375, -0.140228271484375, -0.122802734375, -0.105377197265625, -0.08795166015625, -0.070526123046875, -0.0531005859375, -0.035675048828125, -0.01824951171875, -0.000823974609375, 0.0166015625, 0.034027099609375, 0.05145263671875, 0.068878173828125, 0.0863037109375, 0.103729248046875, 0.12115478515625, 0.138580322265625, 0.156005859375, 0.173431396484375, 0.19085693359375, 0.208282470703125, 0.2257080078125, 0.243133544921875, 0.26055908203125, 0.277984619140625, 0.29541015625, 0.312835693359375, 0.33026123046875, 0.347686767578125, 0.3651123046875, 0.382537841796875, 0.39996337890625, 0.417388916015625, 0.434814453125, 0.452239990234375, 0.46966552734375, 0.487091064453125, 0.5045166015625, 0.521942138671875, 0.53936767578125, 0.556793212890625, 0.57421875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 4.0, 8.0, 19.0, 24.0, 36.0, 47.0, 66.0, 73.0, 82.0, 89.0, 105.0, 97.0, 88.0, 73.0, 53.0, 44.0, 35.0, 28.0, 13.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2445068359375, -0.23673439025878906, -0.22896194458007812, -0.2211894989013672, -0.21341705322265625, -0.2056446075439453, -0.19787216186523438, -0.19009971618652344, -0.1823272705078125, -0.17455482482910156, -0.16678237915039062, -0.1590099334716797, -0.15123748779296875, -0.1434650421142578, -0.13569259643554688, -0.12792015075683594, -0.120147705078125, -0.11237525939941406, -0.10460281372070312, -0.09683036804199219, -0.08905792236328125, -0.08128547668457031, -0.07351303100585938, -0.06574058532714844, -0.0579681396484375, -0.05019569396972656, -0.042423248291015625, -0.03465080261230469, -0.02687835693359375, -0.019105911254882812, -0.011333465576171875, -0.0035610198974609375, 0.00421142578125, 0.011983871459960938, 0.019756317138671875, 0.027528762817382812, 0.03530120849609375, 0.04307365417480469, 0.050846099853515625, 0.05861854553222656, 0.0663909912109375, 0.07416343688964844, 0.08193588256835938, 0.08970832824707031, 0.09748077392578125, 0.10525321960449219, 0.11302566528320312, 0.12079811096191406, 0.128570556640625, 0.13634300231933594, 0.14411544799804688, 0.1518878936767578, 0.15966033935546875, 0.1674327850341797, 0.17520523071289062, 0.18297767639160156, 0.1907501220703125, 0.19852256774902344, 0.20629501342773438, 0.2140674591064453, 0.22183990478515625, 0.2296123504638672, 0.23738479614257812, 0.24515724182128906, 0.2529296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 15.0, 31.0, 16.0, 28.0, 40.0, 93.0, 152.0, 238.0, 520.0, 1152.0, 3193.0, 10409.0, 39899.0, 185991.0, 512596.0, 226883.0, 48624.0, 12278.0, 3815.0, 1338.0, 581.0, 272.0, 142.0, 87.0, 33.0, 50.0, 32.0, 15.0, 9.0, 5.0, 8.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.822265625, -0.8003768920898438, -0.7784881591796875, -0.7565994262695312, -0.734710693359375, -0.7128219604492188, -0.6909332275390625, -0.6690444946289062, -0.64715576171875, -0.6252670288085938, -0.6033782958984375, -0.5814895629882812, -0.559600830078125, -0.5377120971679688, -0.5158233642578125, -0.49393463134765625, -0.4720458984375, -0.45015716552734375, -0.4282684326171875, -0.40637969970703125, -0.384490966796875, -0.36260223388671875, -0.3407135009765625, -0.31882476806640625, -0.29693603515625, -0.27504730224609375, -0.2531585693359375, -0.23126983642578125, -0.209381103515625, -0.18749237060546875, -0.1656036376953125, -0.14371490478515625, -0.121826171875, -0.09993743896484375, -0.0780487060546875, -0.05615997314453125, -0.034271240234375, -0.01238250732421875, 0.0095062255859375, 0.03139495849609375, 0.05328369140625, 0.07517242431640625, 0.0970611572265625, 0.11894989013671875, 0.140838623046875, 0.16272735595703125, 0.1846160888671875, 0.20650482177734375, 0.2283935546875, 0.25028228759765625, 0.2721710205078125, 0.29405975341796875, 0.315948486328125, 0.33783721923828125, 0.3597259521484375, 0.38161468505859375, 0.40350341796875, 0.42539215087890625, 0.4472808837890625, 0.46916961669921875, 0.491058349609375, 0.5129470825195312, 0.5348358154296875, 0.5567245483398438, 0.57861328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 9.0, 3.0, 7.0, 3.0, 5.0, 10.0, 8.0, 12.0, 11.0, 14.0, 18.0, 18.0, 33.0, 43.0, 37.0, 32.0, 28.0, 36.0, 42.0, 51.0, 57.0, 46.0, 54.0, 36.0, 48.0, 34.0, 38.0, 32.0, 39.0, 28.0, 32.0, 21.0, 21.0, 19.0, 20.0, 15.0, 5.0, 9.0, 10.0, 4.0, 4.0, 5.0, 6.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.7353515625, -0.7147979736328125, -0.694244384765625, -0.6736907958984375, -0.65313720703125, -0.6325836181640625, -0.612030029296875, -0.5914764404296875, -0.5709228515625, -0.5503692626953125, -0.529815673828125, -0.5092620849609375, -0.48870849609375, -0.4681549072265625, -0.447601318359375, -0.4270477294921875, -0.406494140625, -0.3859405517578125, -0.365386962890625, -0.3448333740234375, -0.32427978515625, -0.3037261962890625, -0.283172607421875, -0.2626190185546875, -0.2420654296875, -0.2215118408203125, -0.200958251953125, -0.1804046630859375, -0.15985107421875, -0.1392974853515625, -0.118743896484375, -0.0981903076171875, -0.07763671875, -0.0570831298828125, -0.036529541015625, -0.0159759521484375, 0.00457763671875, 0.0251312255859375, 0.045684814453125, 0.0662384033203125, 0.0867919921875, 0.1073455810546875, 0.127899169921875, 0.1484527587890625, 0.16900634765625, 0.1895599365234375, 0.210113525390625, 0.2306671142578125, 0.251220703125, 0.2717742919921875, 0.292327880859375, 0.3128814697265625, 0.33343505859375, 0.3539886474609375, 0.374542236328125, 0.3950958251953125, 0.4156494140625, 0.4362030029296875, 0.456756591796875, 0.4773101806640625, 0.49786376953125, 0.5184173583984375, 0.538970947265625, 0.5595245361328125, 0.580078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 8.0, 15.0, 15.0, 15.0, 17.0, 37.0, 31.0, 80.0, 111.0, 198.0, 373.0, 809.0, 1866.0, 6098.0, 31591.0, 427606.0, 532380.0, 36644.0, 6859.0, 2015.0, 819.0, 416.0, 196.0, 140.0, 67.0, 52.0, 44.0, 20.0, 14.0, 10.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7412109375, -0.7147750854492188, -0.6883392333984375, -0.6619033813476562, -0.635467529296875, -0.6090316772460938, -0.5825958251953125, -0.5561599731445312, -0.52972412109375, -0.5032882690429688, -0.4768524169921875, -0.45041656494140625, -0.423980712890625, -0.39754486083984375, -0.3711090087890625, -0.34467315673828125, -0.3182373046875, -0.29180145263671875, -0.2653656005859375, -0.23892974853515625, -0.212493896484375, -0.18605804443359375, -0.1596221923828125, -0.13318634033203125, -0.10675048828125, -0.08031463623046875, -0.0538787841796875, -0.02744293212890625, -0.001007080078125, 0.02542877197265625, 0.0518646240234375, 0.07830047607421875, 0.104736328125, 0.13117218017578125, 0.1576080322265625, 0.18404388427734375, 0.210479736328125, 0.23691558837890625, 0.2633514404296875, 0.28978729248046875, 0.31622314453125, 0.34265899658203125, 0.3690948486328125, 0.39553070068359375, 0.421966552734375, 0.44840240478515625, 0.4748382568359375, 0.5012741088867188, 0.5277099609375, 0.5541458129882812, 0.5805816650390625, 0.6070175170898438, 0.633453369140625, 0.6598892211914062, 0.6863250732421875, 0.7127609252929688, 0.73919677734375, 0.7656326293945312, 0.7920684814453125, 0.8185043334960938, 0.844940185546875, 0.8713760375976562, 0.8978118896484375, 0.9242477416992188, 0.95068359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 9.0, 15.0, 33.0, 49.0, 73.0, 92.0, 147.0, 143.0, 142.0, 106.0, 59.0, 42.0, 34.0, 14.0, 8.0, 7.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020682811737060547, -0.00019803829491138458, -0.0001892484724521637, -0.0001804586499929428, -0.00017166882753372192, -0.00016287900507450104, -0.00015408918261528015, -0.00014529936015605927, -0.00013650953769683838, -0.0001277197152376175, -0.0001189298927783966, -0.00011014007031917572, -0.00010135024785995483, -9.256042540073395e-05, -8.377060294151306e-05, -7.498078048229218e-05, -6.619095802307129e-05, -5.74011355638504e-05, -4.8611313104629517e-05, -3.982149064540863e-05, -3.1031668186187744e-05, -2.2241845726966858e-05, -1.3452023267745972e-05, -4.6622008085250854e-06, 4.127621650695801e-06, 1.2917444109916687e-05, 2.1707266569137573e-05, 3.049708902835846e-05, 3.9286911487579346e-05, 4.807673394680023e-05, 5.686655640602112e-05, 6.5656378865242e-05, 7.444620132446289e-05, 8.323602378368378e-05, 9.202584624290466e-05, 0.00010081566870212555, 0.00010960549116134644, 0.00011839531362056732, 0.0001271851360797882, 0.0001359749585390091, 0.00014476478099822998, 0.00015355460345745087, 0.00016234442591667175, 0.00017113424837589264, 0.00017992407083511353, 0.0001887138932943344, 0.0001975037157535553, 0.00020629353821277618, 0.00021508336067199707, 0.00022387318313121796, 0.00023266300559043884, 0.00024145282804965973, 0.0002502426505088806, 0.0002590324729681015, 0.0002678222954273224, 0.0002766121178865433, 0.00028540194034576416, 0.00029419176280498505, 0.00030298158526420593, 0.0003117714077234268, 0.0003205612301826477, 0.0003293510526418686, 0.0003381408751010895, 0.00034693069756031036, 0.00035572052001953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 11.0, 13.0, 31.0, 62.0, 82.0, 238.0, 656.0, 2895.0, 41978.0, 927433.0, 70110.0, 3779.0, 778.0, 252.0, 97.0, 50.0, 30.0, 14.0, 13.0, 9.0, 3.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1533203125, -1.112945556640625, -1.07257080078125, -1.032196044921875, -0.9918212890625, -0.951446533203125, -0.91107177734375, -0.870697021484375, -0.830322265625, -0.789947509765625, -0.74957275390625, -0.709197998046875, -0.6688232421875, -0.628448486328125, -0.58807373046875, -0.547698974609375, -0.50732421875, -0.466949462890625, -0.42657470703125, -0.386199951171875, -0.3458251953125, -0.305450439453125, -0.26507568359375, -0.224700927734375, -0.184326171875, -0.143951416015625, -0.10357666015625, -0.063201904296875, -0.0228271484375, 0.017547607421875, 0.05792236328125, 0.098297119140625, 0.138671875, 0.179046630859375, 0.21942138671875, 0.259796142578125, 0.3001708984375, 0.340545654296875, 0.38092041015625, 0.421295166015625, 0.461669921875, 0.502044677734375, 0.54241943359375, 0.582794189453125, 0.6231689453125, 0.663543701171875, 0.70391845703125, 0.744293212890625, 0.78466796875, 0.825042724609375, 0.86541748046875, 0.905792236328125, 0.9461669921875, 0.986541748046875, 1.02691650390625, 1.067291259765625, 1.107666015625, 1.148040771484375, 1.18841552734375, 1.228790283203125, 1.2691650390625, 1.309539794921875, 1.34991455078125, 1.390289306640625, 1.4306640625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 4.0, 11.0, 11.0, 20.0, 16.0, 31.0, 69.0, 131.0, 164.0, 209.0, 118.0, 73.0, 55.0, 31.0, 16.0, 19.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97119140625, -0.9379806518554688, -0.9047698974609375, -0.8715591430664062, -0.838348388671875, -0.8051376342773438, -0.7719268798828125, -0.7387161254882812, -0.70550537109375, -0.6722946166992188, -0.6390838623046875, -0.6058731079101562, -0.572662353515625, -0.5394515991210938, -0.5062408447265625, -0.47303009033203125, -0.4398193359375, -0.40660858154296875, -0.3733978271484375, -0.34018707275390625, -0.306976318359375, -0.27376556396484375, -0.2405548095703125, -0.20734405517578125, -0.17413330078125, -0.14092254638671875, -0.1077117919921875, -0.07450103759765625, -0.041290283203125, -0.00807952880859375, 0.0251312255859375, 0.05834197998046875, 0.091552734375, 0.12476348876953125, 0.1579742431640625, 0.19118499755859375, 0.224395751953125, 0.25760650634765625, 0.2908172607421875, 0.32402801513671875, 0.35723876953125, 0.39044952392578125, 0.4236602783203125, 0.45687103271484375, 0.490081787109375, 0.5232925415039062, 0.5565032958984375, 0.5897140502929688, 0.6229248046875, 0.6561355590820312, 0.6893463134765625, 0.7225570678710938, 0.755767822265625, 0.7889785766601562, 0.8221893310546875, 0.8554000854492188, 0.88861083984375, 0.9218215942382812, 0.9550323486328125, 0.9882431030273438, 1.021453857421875, 1.0546646118164062, 1.0878753662109375, 1.1210861206054688, 1.154296875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 12.0, 90.0, 344.0, 413.0, 116.0, 24.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.767391204833984, -22.011369705200195, -21.255348205566406, -20.499326705932617, -19.743305206298828, -18.98728370666504, -18.23126220703125, -17.475242614746094, -16.719219207763672, -15.963197708129883, -15.207176208496094, -14.451154708862305, -13.695133209228516, -12.939111709594727, -12.183091163635254, -11.427069664001465, -10.671049118041992, -9.915027618408203, -9.159006118774414, -8.402984619140625, -7.646963596343994, -6.890942096710205, -6.134921073913574, -5.378899574279785, -4.622878074645996, -3.866856575012207, -3.110835313796997, -2.354814052581787, -1.598792552947998, -0.842771053314209, -0.08675003051757812, 0.6692714691162109, 1.4252910614013672, 2.1813125610351562, 2.937333822250366, 3.693355083465576, 4.449376583099365, 5.205398082733154, 5.961419105529785, 6.717440605163574, 7.473462104797363, 8.229483604431152, 8.985505104064941, 9.741525650024414, 10.497547149658203, 11.253568649291992, 12.009590148925781, 12.76561164855957, 13.52163314819336, 14.277654647827148, 15.033676147460938, 15.789697647094727, 16.545719146728516, 17.301740646362305, 18.057762145996094, 18.81378173828125, 19.569805145263672, 20.32582664489746, 21.08184814453125, 21.83786964416504, 22.593891143798828, 23.349912643432617, 24.105934143066406, 24.861953735351562, 25.61797523498535]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 5.0, 14.0, 10.0, 17.0, 18.0, 25.0, 19.0, 35.0, 45.0, 49.0, 59.0, 50.0, 58.0, 62.0, 38.0, 54.0, 56.0, 74.0, 64.0, 50.0, 36.0, 32.0, 24.0, 23.0, 24.0, 20.0, 7.0, 7.0, 4.0, 8.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.075491905212402, -4.907909870147705, -4.740327835083008, -4.5727458000183105, -4.405163764953613, -4.237581729888916, -4.069999694824219, -3.9024174213409424, -3.734835386276245, -3.567253351211548, -3.3996713161468506, -3.232089042663574, -3.064507007598877, -2.8969249725341797, -2.7293429374694824, -2.561760902404785, -2.394178867340088, -2.2265968322753906, -2.0590147972106934, -1.8914326429367065, -1.7238506078720093, -1.556268572807312, -1.3886864185333252, -1.221104383468628, -1.0535223484039307, -0.8859403133392334, -0.7183582186698914, -0.5507761240005493, -0.38319408893585205, -0.21561205387115479, -0.04802989959716797, 0.1195521354675293, 0.28713417053222656, 0.4547162353992462, 0.6222983002662659, 0.7898803949356079, 0.9574624300003052, 1.1250444650650024, 1.2926266193389893, 1.4602086544036865, 1.6277906894683838, 1.795372724533081, 1.9629547595977783, 2.1305370330810547, 2.298119068145752, 2.465701103210449, 2.6332831382751465, 2.8008651733398438, 2.968447208404541, 3.1360292434692383, 3.3036112785339355, 3.471193313598633, 3.63877534866333, 3.8063573837280273, 3.9739396572113037, 4.141521453857422, 4.309103965759277, 4.476686000823975, 4.644268035888672, 4.811850070953369, 4.979432106018066, 5.147014141082764, 5.314596176147461, 5.482178688049316, 5.6497602462768555]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 4.0, 3.0, 6.0, 8.0, 11.0, 11.0, 30.0, 43.0, 54.0, 91.0, 142.0, 244.0, 388.0, 649.0, 1335.0, 2518.0, 5431.0, 13695.0, 50699.0, 3624151.0, 436531.0, 37200.0, 11031.0, 4836.0, 2312.0, 1188.0, 628.0, 392.0, 227.0, 146.0, 93.0, 68.0, 46.0, 20.0, 11.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8095703125, -0.786376953125, -0.76318359375, -0.739990234375, -0.716796875, -0.693603515625, -0.67041015625, -0.647216796875, -0.6240234375, -0.600830078125, -0.57763671875, -0.554443359375, -0.53125, -0.508056640625, -0.48486328125, -0.461669921875, -0.4384765625, -0.415283203125, -0.39208984375, -0.368896484375, -0.345703125, -0.322509765625, -0.29931640625, -0.276123046875, -0.2529296875, -0.229736328125, -0.20654296875, -0.183349609375, -0.16015625, -0.136962890625, -0.11376953125, -0.090576171875, -0.0673828125, -0.044189453125, -0.02099609375, 0.002197265625, 0.025390625, 0.048583984375, 0.07177734375, 0.094970703125, 0.1181640625, 0.141357421875, 0.16455078125, 0.187744140625, 0.2109375, 0.234130859375, 0.25732421875, 0.280517578125, 0.3037109375, 0.326904296875, 0.35009765625, 0.373291015625, 0.396484375, 0.419677734375, 0.44287109375, 0.466064453125, 0.4892578125, 0.512451171875, 0.53564453125, 0.558837890625, 0.58203125, 0.605224609375, 0.62841796875, 0.651611328125, 0.6748046875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 9.0, 16.0, 11.0, 28.0, 33.0, 36.0, 53.0, 69.0, 83.0, 73.0, 72.0, 88.0, 74.0, 71.0, 63.0, 51.0, 36.0, 43.0, 32.0, 17.0, 11.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26904296875, -0.2606468200683594, -0.25225067138671875, -0.24385452270507812, -0.2354583740234375, -0.22706222534179688, -0.21866607666015625, -0.21026992797851562, -0.201873779296875, -0.19347763061523438, -0.18508148193359375, -0.17668533325195312, -0.1682891845703125, -0.15989303588867188, -0.15149688720703125, -0.14310073852539062, -0.13470458984375, -0.12630844116210938, -0.11791229248046875, -0.10951614379882812, -0.1011199951171875, -0.09272384643554688, -0.08432769775390625, -0.07593154907226562, -0.067535400390625, -0.059139251708984375, -0.05074310302734375, -0.042346954345703125, -0.0339508056640625, -0.025554656982421875, -0.01715850830078125, -0.008762359619140625, -0.0003662109375, 0.008029937744140625, 0.01642608642578125, 0.024822235107421875, 0.0332183837890625, 0.041614532470703125, 0.05001068115234375, 0.058406829833984375, 0.066802978515625, 0.07519912719726562, 0.08359527587890625, 0.09199142456054688, 0.1003875732421875, 0.10878372192382812, 0.11717987060546875, 0.12557601928710938, 0.13397216796875, 0.14236831665039062, 0.15076446533203125, 0.15916061401367188, 0.1675567626953125, 0.17595291137695312, 0.18434906005859375, 0.19274520874023438, 0.201141357421875, 0.20953750610351562, 0.21793365478515625, 0.22632980346679688, 0.2347259521484375, 0.24312210083007812, 0.25151824951171875, 0.2599143981933594, 0.268310546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 13.0, 17.0, 18.0, 29.0, 42.0, 59.0, 99.0, 147.0, 255.0, 462.0, 671.0, 1218.0, 2302.0, 5021.0, 13952.0, 63936.0, 3916653.0, 154351.0, 21495.0, 6880.0, 2967.0, 1492.0, 854.0, 508.0, 286.0, 188.0, 98.0, 70.0, 38.0, 31.0, 24.0, 18.0, 14.0, 12.0, 13.0, 5.0, 4.0, 5.0, 3.0, 5.0, 1.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.86279296875, -0.8337173461914062, -0.8046417236328125, -0.7755661010742188, -0.746490478515625, -0.7174148559570312, -0.6883392333984375, -0.6592636108398438, -0.63018798828125, -0.6011123657226562, -0.5720367431640625, -0.5429611206054688, -0.513885498046875, -0.48480987548828125, -0.4557342529296875, -0.42665863037109375, -0.3975830078125, -0.36850738525390625, -0.3394317626953125, -0.31035614013671875, -0.281280517578125, -0.25220489501953125, -0.2231292724609375, -0.19405364990234375, -0.16497802734375, -0.13590240478515625, -0.1068267822265625, -0.07775115966796875, -0.048675537109375, -0.01959991455078125, 0.0094757080078125, 0.03855133056640625, 0.067626953125, 0.09670257568359375, 0.1257781982421875, 0.15485382080078125, 0.183929443359375, 0.21300506591796875, 0.2420806884765625, 0.27115631103515625, 0.30023193359375, 0.32930755615234375, 0.3583831787109375, 0.38745880126953125, 0.416534423828125, 0.44561004638671875, 0.4746856689453125, 0.5037612915039062, 0.5328369140625, 0.5619125366210938, 0.5909881591796875, 0.6200637817382812, 0.649139404296875, 0.6782150268554688, 0.7072906494140625, 0.7363662719726562, 0.76544189453125, 0.7945175170898438, 0.8235931396484375, 0.8526687622070312, 0.881744384765625, 0.9108200073242188, 0.9398956298828125, 0.9689712524414062, 0.998046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 15.0, 22.0, 40.0, 97.0, 2787.0, 917.0, 96.0, 38.0, 20.0, 15.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1929931640625, -0.1828136444091797, -0.17263412475585938, -0.16245460510253906, -0.15227508544921875, -0.14209556579589844, -0.13191604614257812, -0.12173652648925781, -0.1115570068359375, -0.10137748718261719, -0.09119796752929688, -0.08101844787597656, -0.07083892822265625, -0.06065940856933594, -0.050479888916015625, -0.04030036926269531, -0.030120849609375, -0.019941329956054688, -0.009761810302734375, 0.0004177093505859375, 0.01059722900390625, 0.020776748657226562, 0.030956268310546875, 0.04113578796386719, 0.0513153076171875, 0.06149482727050781, 0.07167434692382812, 0.08185386657714844, 0.09203338623046875, 0.10221290588378906, 0.11239242553710938, 0.12257194519042969, 0.13275146484375, 0.1429309844970703, 0.15311050415039062, 0.16329002380371094, 0.17346954345703125, 0.18364906311035156, 0.19382858276367188, 0.2040081024169922, 0.2141876220703125, 0.2243671417236328, 0.23454666137695312, 0.24472618103027344, 0.25490570068359375, 0.26508522033691406, 0.2752647399902344, 0.2854442596435547, 0.295623779296875, 0.3058032989501953, 0.3159828186035156, 0.32616233825683594, 0.33634185791015625, 0.34652137756347656, 0.3567008972167969, 0.3668804168701172, 0.3770599365234375, 0.3872394561767578, 0.3974189758300781, 0.40759849548339844, 0.41777801513671875, 0.42795753479003906, 0.4381370544433594, 0.4483165740966797, 0.45849609375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 18.0, 33.0, 61.0, 138.0, 207.0, 236.0, 155.0, 97.0, 30.0, 11.0, 12.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.230276107788086, -2.186631441116333, -2.142986536026001, -2.099341869354248, -2.055697202682495, -2.012052297592163, -1.9684076309204102, -1.9247629642486572, -1.8811181783676147, -1.8374733924865723, -1.7938287258148193, -1.7501839399337769, -1.7065391540527344, -1.6628944873809814, -1.619249701499939, -1.5756049156188965, -1.5319602489471436, -1.488315463066101, -1.4446707963943481, -1.4010260105133057, -1.3573813438415527, -1.3137365579605103, -1.2700917720794678, -1.2264471054077148, -1.1828023195266724, -1.1391575336456299, -1.095512866973877, -1.0518680810928345, -1.008223295211792, -0.9645786285400391, -0.9209338426589966, -0.8772891163825989, -0.8336445093154907, -0.789999783039093, -0.7463550567626953, -0.7027102708816528, -0.6590655446052551, -0.6154208183288574, -0.5717760324478149, -0.5281313061714172, -0.48448657989501953, -0.4408418536186218, -0.39719709753990173, -0.35355234146118164, -0.30990761518478394, -0.26626288890838623, -0.22261813282966614, -0.17897337675094604, -0.13532865047454834, -0.09168390929698944, -0.04803916811943054, -0.004394426941871643, 0.039250314235687256, 0.08289505541324615, 0.12653979659080505, 0.17018455266952515, 0.21382927894592285, 0.25747400522232056, 0.30111876130104065, 0.34476351737976074, 0.38840824365615845, 0.43205296993255615, 0.47569772601127625, 0.5193424820899963, 0.562987208366394]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 2.0, 8.0, 11.0, 7.0, 18.0, 11.0, 9.0, 25.0, 19.0, 27.0, 27.0, 31.0, 38.0, 38.0, 35.0, 45.0, 35.0, 54.0, 47.0, 41.0, 43.0, 48.0, 37.0, 49.0, 31.0, 32.0, 45.0, 35.0, 14.0, 24.0, 18.0, 20.0, 14.0, 7.0, 9.0, 10.0, 5.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3721722960472107, -0.3590085208415985, -0.34584471583366394, -0.33268094062805176, -0.3195171356201172, -0.306353360414505, -0.2931895852088928, -0.28002578020095825, -0.2668619751930237, -0.2536981999874115, -0.24053439497947693, -0.22737061977386475, -0.21420681476593018, -0.201043039560318, -0.18787924945354462, -0.17471545934677124, -0.16155168414115906, -0.14838789403438568, -0.1352241039276123, -0.12206032127141953, -0.10889653116464615, -0.09573274105787277, -0.08256895840167999, -0.06940516829490662, -0.05624137818813324, -0.04307758808135986, -0.029913801699876785, -0.016750015318393707, -0.003586225211620331, 0.009577564895153046, 0.022741347551345825, 0.0359051376581192, 0.04906892776489258, 0.062232717871665955, 0.07539650797843933, 0.08856029063463211, 0.10172408074140549, 0.11488787084817886, 0.12805165350437164, 0.14121544361114502, 0.1543792337179184, 0.16754302382469177, 0.18070681393146515, 0.19387060403823853, 0.2070343792438507, 0.22019818425178528, 0.23336195945739746, 0.24652574956417084, 0.2596895396709442, 0.2728533148765564, 0.28601711988449097, 0.29918089509010315, 0.3123447000980377, 0.3255084753036499, 0.3386722803115845, 0.35183605551719666, 0.36499983072280884, 0.378163605928421, 0.3913274109363556, 0.4044911861419678, 0.41765499114990234, 0.4308187663555145, 0.4439825415611267, 0.4571463465690613, 0.47031015157699585]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 0.0, 2.0, 10.0, 11.0, 13.0, 21.0, 37.0, 42.0, 76.0, 123.0, 215.0, 354.0, 707.0, 1599.0, 3896.0, 11599.0, 37594.0, 125948.0, 327696.0, 340876.0, 136551.0, 41020.0, 12400.0, 4305.0, 1731.0, 756.0, 386.0, 213.0, 128.0, 85.0, 50.0, 31.0, 28.0, 9.0, 13.0, 10.0, 8.0, 4.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6611328125, -0.6404953002929688, -0.6198577880859375, -0.5992202758789062, -0.578582763671875, -0.5579452514648438, -0.5373077392578125, -0.5166702270507812, -0.49603271484375, -0.47539520263671875, -0.4547576904296875, -0.43412017822265625, -0.413482666015625, -0.39284515380859375, -0.3722076416015625, -0.35157012939453125, -0.3309326171875, -0.31029510498046875, -0.2896575927734375, -0.26902008056640625, -0.248382568359375, -0.22774505615234375, -0.2071075439453125, -0.18647003173828125, -0.16583251953125, -0.14519500732421875, -0.1245574951171875, -0.10391998291015625, -0.083282470703125, -0.06264495849609375, -0.0420074462890625, -0.02136993408203125, -0.000732421875, 0.01990509033203125, 0.0405426025390625, 0.06118011474609375, 0.081817626953125, 0.10245513916015625, 0.1230926513671875, 0.14373016357421875, 0.16436767578125, 0.18500518798828125, 0.2056427001953125, 0.22628021240234375, 0.246917724609375, 0.26755523681640625, 0.2881927490234375, 0.30883026123046875, 0.3294677734375, 0.35010528564453125, 0.3707427978515625, 0.39138031005859375, 0.412017822265625, 0.43265533447265625, 0.4532928466796875, 0.47393035888671875, 0.49456787109375, 0.5152053833007812, 0.5358428955078125, 0.5564804077148438, 0.577117919921875, 0.5977554321289062, 0.6183929443359375, 0.6390304565429688, 0.65966796875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 7.0, 13.0, 20.0, 17.0, 28.0, 44.0, 37.0, 52.0, 43.0, 71.0, 73.0, 81.0, 69.0, 86.0, 58.0, 61.0, 53.0, 50.0, 20.0, 34.0, 28.0, 13.0, 14.0, 10.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27197265625, -0.2635307312011719, -0.25508880615234375, -0.24664688110351562, -0.2382049560546875, -0.22976303100585938, -0.22132110595703125, -0.21287918090820312, -0.204437255859375, -0.19599533081054688, -0.18755340576171875, -0.17911148071289062, -0.1706695556640625, -0.16222763061523438, -0.15378570556640625, -0.14534378051757812, -0.13690185546875, -0.12845993041992188, -0.12001800537109375, -0.11157608032226562, -0.1031341552734375, -0.09469223022460938, -0.08625030517578125, -0.07780838012695312, -0.069366455078125, -0.060924530029296875, -0.05248260498046875, -0.044040679931640625, -0.0355987548828125, -0.027156829833984375, -0.01871490478515625, -0.010272979736328125, -0.0018310546875, 0.006610870361328125, 0.01505279541015625, 0.023494720458984375, 0.0319366455078125, 0.040378570556640625, 0.04882049560546875, 0.057262420654296875, 0.065704345703125, 0.07414627075195312, 0.08258819580078125, 0.09103012084960938, 0.0994720458984375, 0.10791397094726562, 0.11635589599609375, 0.12479782104492188, 0.13323974609375, 0.14168167114257812, 0.15012359619140625, 0.15856552124023438, 0.1670074462890625, 0.17544937133789062, 0.18389129638671875, 0.19233322143554688, 0.200775146484375, 0.20921707153320312, 0.21765899658203125, 0.22610092163085938, 0.2345428466796875, 0.24298477172851562, 0.25142669677734375, 0.2598686218261719, 0.268310546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 9.0, 5.0, 10.0, 17.0, 38.0, 31.0, 50.0, 78.0, 163.0, 305.0, 633.0, 1581.0, 5011.0, 21695.0, 133127.0, 591421.0, 244889.0, 37935.0, 7670.0, 2174.0, 836.0, 363.0, 204.0, 118.0, 64.0, 44.0, 28.0, 11.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8779296875, -0.845001220703125, -0.81207275390625, -0.779144287109375, -0.7462158203125, -0.713287353515625, -0.68035888671875, -0.647430419921875, -0.614501953125, -0.581573486328125, -0.54864501953125, -0.515716552734375, -0.4827880859375, -0.449859619140625, -0.41693115234375, -0.384002685546875, -0.35107421875, -0.318145751953125, -0.28521728515625, -0.252288818359375, -0.2193603515625, -0.186431884765625, -0.15350341796875, -0.120574951171875, -0.087646484375, -0.054718017578125, -0.02178955078125, 0.011138916015625, 0.0440673828125, 0.076995849609375, 0.10992431640625, 0.142852783203125, 0.17578125, 0.208709716796875, 0.24163818359375, 0.274566650390625, 0.3074951171875, 0.340423583984375, 0.37335205078125, 0.406280517578125, 0.439208984375, 0.472137451171875, 0.50506591796875, 0.537994384765625, 0.5709228515625, 0.603851318359375, 0.63677978515625, 0.669708251953125, 0.70263671875, 0.735565185546875, 0.76849365234375, 0.801422119140625, 0.8343505859375, 0.867279052734375, 0.90020751953125, 0.933135986328125, 0.966064453125, 0.998992919921875, 1.03192138671875, 1.064849853515625, 1.0977783203125, 1.130706787109375, 1.16363525390625, 1.196563720703125, 1.2294921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 6.0, 9.0, 12.0, 4.0, 7.0, 9.0, 18.0, 33.0, 17.0, 37.0, 21.0, 33.0, 34.0, 44.0, 36.0, 31.0, 58.0, 36.0, 54.0, 47.0, 37.0, 55.0, 50.0, 32.0, 45.0, 32.0, 41.0, 30.0, 32.0, 21.0, 15.0, 15.0, 16.0, 9.0, 6.0, 4.0, 6.0, 6.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0048828125, -0.971282958984375, -0.93768310546875, -0.904083251953125, -0.8704833984375, -0.836883544921875, -0.80328369140625, -0.769683837890625, -0.736083984375, -0.702484130859375, -0.66888427734375, -0.635284423828125, -0.6016845703125, -0.568084716796875, -0.53448486328125, -0.500885009765625, -0.46728515625, -0.433685302734375, -0.40008544921875, -0.366485595703125, -0.3328857421875, -0.299285888671875, -0.26568603515625, -0.232086181640625, -0.198486328125, -0.164886474609375, -0.13128662109375, -0.097686767578125, -0.0640869140625, -0.030487060546875, 0.00311279296875, 0.036712646484375, 0.0703125, 0.103912353515625, 0.13751220703125, 0.171112060546875, 0.2047119140625, 0.238311767578125, 0.27191162109375, 0.305511474609375, 0.339111328125, 0.372711181640625, 0.40631103515625, 0.439910888671875, 0.4735107421875, 0.507110595703125, 0.54071044921875, 0.574310302734375, 0.60791015625, 0.641510009765625, 0.67510986328125, 0.708709716796875, 0.7423095703125, 0.775909423828125, 0.80950927734375, 0.843109130859375, 0.876708984375, 0.910308837890625, 0.94390869140625, 0.977508544921875, 1.0111083984375, 1.044708251953125, 1.07830810546875, 1.111907958984375, 1.1455078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 16.0, 24.0, 38.0, 92.0, 229.0, 504.0, 1921.0, 21454.0, 968124.0, 52081.0, 2914.0, 680.0, 247.0, 96.0, 58.0, 32.0, 15.0, 9.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.83203125, -2.76397705078125, -2.6959228515625, -2.62786865234375, -2.559814453125, -2.49176025390625, -2.4237060546875, -2.35565185546875, -2.28759765625, -2.21954345703125, -2.1514892578125, -2.08343505859375, -2.015380859375, -1.94732666015625, -1.8792724609375, -1.81121826171875, -1.7431640625, -1.67510986328125, -1.6070556640625, -1.53900146484375, -1.470947265625, -1.40289306640625, -1.3348388671875, -1.26678466796875, -1.19873046875, -1.13067626953125, -1.0626220703125, -0.99456787109375, -0.926513671875, -0.85845947265625, -0.7904052734375, -0.72235107421875, -0.654296875, -0.58624267578125, -0.5181884765625, -0.45013427734375, -0.382080078125, -0.31402587890625, -0.2459716796875, -0.17791748046875, -0.10986328125, -0.04180908203125, 0.0262451171875, 0.09429931640625, 0.162353515625, 0.23040771484375, 0.2984619140625, 0.36651611328125, 0.4345703125, 0.50262451171875, 0.5706787109375, 0.63873291015625, 0.706787109375, 0.77484130859375, 0.8428955078125, 0.91094970703125, 0.97900390625, 1.04705810546875, 1.1151123046875, 1.18316650390625, 1.251220703125, 1.31927490234375, 1.3873291015625, 1.45538330078125, 1.5234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 18.0, 11.0, 21.0, 31.0, 51.0, 64.0, 92.0, 134.0, 137.0, 139.0, 98.0, 72.0, 46.0, 33.0, 17.0, 22.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019347667694091797, -0.0001862887293100357, -0.00017910078167915344, -0.00017191283404827118, -0.00016472488641738892, -0.00015753693878650665, -0.0001503489911556244, -0.00014316104352474213, -0.00013597309589385986, -0.0001287851482629776, -0.00012159720063209534, -0.00011440925300121307, -0.00010722130537033081, -0.00010003335773944855, -9.284541010856628e-05, -8.565746247768402e-05, -7.846951484680176e-05, -7.12815672159195e-05, -6.409361958503723e-05, -5.690567195415497e-05, -4.9717724323272705e-05, -4.252977669239044e-05, -3.534182906150818e-05, -2.8153881430625916e-05, -2.0965933799743652e-05, -1.377798616886139e-05, -6.590038537979126e-06, 5.979090929031372e-07, 7.7858567237854e-06, 1.4973804354667664e-05, 2.2161751985549927e-05, 2.934969961643219e-05, 3.653764724731445e-05, 4.3725594878196716e-05, 5.091354250907898e-05, 5.810149013996124e-05, 6.52894377708435e-05, 7.247738540172577e-05, 7.966533303260803e-05, 8.68532806634903e-05, 9.404122829437256e-05, 0.00010122917592525482, 0.00010841712355613708, 0.00011560507118701935, 0.0001227930188179016, 0.00012998096644878387, 0.00013716891407966614, 0.0001443568617105484, 0.00015154480934143066, 0.00015873275697231293, 0.0001659207046031952, 0.00017310865223407745, 0.00018029659986495972, 0.00018748454749584198, 0.00019467249512672424, 0.0002018604427576065, 0.00020904839038848877, 0.00021623633801937103, 0.0002234242856502533, 0.00023061223328113556, 0.00023780018091201782, 0.0002449881285429001, 0.00025217607617378235, 0.0002593640238046646, 0.0002665519714355469]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 17.0, 26.0, 28.0, 52.0, 120.0, 221.0, 621.0, 2740.0, 33137.0, 916818.0, 88921.0, 4406.0, 877.0, 291.0, 117.0, 51.0, 34.0, 19.0, 15.0, 11.0, 12.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0625, -1.0175323486328125, -0.972564697265625, -0.9275970458984375, -0.88262939453125, -0.8376617431640625, -0.792694091796875, -0.7477264404296875, -0.7027587890625, -0.6577911376953125, -0.612823486328125, -0.5678558349609375, -0.52288818359375, -0.4779205322265625, -0.432952880859375, -0.3879852294921875, -0.343017578125, -0.2980499267578125, -0.253082275390625, -0.2081146240234375, -0.16314697265625, -0.1181793212890625, -0.073211669921875, -0.0282440185546875, 0.0167236328125, 0.0616912841796875, 0.106658935546875, 0.1516265869140625, 0.19659423828125, 0.2415618896484375, 0.286529541015625, 0.3314971923828125, 0.37646484375, 0.4214324951171875, 0.466400146484375, 0.5113677978515625, 0.55633544921875, 0.6013031005859375, 0.646270751953125, 0.6912384033203125, 0.7362060546875, 0.7811737060546875, 0.826141357421875, 0.8711090087890625, 0.91607666015625, 0.9610443115234375, 1.006011962890625, 1.0509796142578125, 1.095947265625, 1.1409149169921875, 1.185882568359375, 1.2308502197265625, 1.27581787109375, 1.3207855224609375, 1.365753173828125, 1.4107208251953125, 1.4556884765625, 1.5006561279296875, 1.545623779296875, 1.5905914306640625, 1.63555908203125, 1.6805267333984375, 1.725494384765625, 1.7704620361328125, 1.8154296875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 8.0, 9.0, 21.0, 34.0, 66.0, 107.0, 149.0, 171.0, 164.0, 103.0, 65.0, 37.0, 18.0, 14.0, 12.0, 8.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4638671875, -1.4173736572265625, -1.370880126953125, -1.3243865966796875, -1.27789306640625, -1.2313995361328125, -1.184906005859375, -1.1384124755859375, -1.0919189453125, -1.0454254150390625, -0.998931884765625, -0.9524383544921875, -0.90594482421875, -0.8594512939453125, -0.812957763671875, -0.7664642333984375, -0.719970703125, -0.6734771728515625, -0.626983642578125, -0.5804901123046875, -0.53399658203125, -0.4875030517578125, -0.441009521484375, -0.3945159912109375, -0.3480224609375, -0.3015289306640625, -0.255035400390625, -0.2085418701171875, -0.16204833984375, -0.1155548095703125, -0.069061279296875, -0.0225677490234375, 0.02392578125, 0.0704193115234375, 0.116912841796875, 0.1634063720703125, 0.20989990234375, 0.2563934326171875, 0.302886962890625, 0.3493804931640625, 0.3958740234375, 0.4423675537109375, 0.488861083984375, 0.5353546142578125, 0.58184814453125, 0.6283416748046875, 0.674835205078125, 0.7213287353515625, 0.767822265625, 0.8143157958984375, 0.860809326171875, 0.9073028564453125, 0.95379638671875, 1.0002899169921875, 1.046783447265625, 1.0932769775390625, 1.1397705078125, 1.1862640380859375, 1.232757568359375, 1.2792510986328125, 1.32574462890625, 1.3722381591796875, 1.418731689453125, 1.4652252197265625, 1.51171875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 13.0, 25.0, 37.0, 102.0, 119.0, 185.0, 190.0, 137.0, 89.0, 46.0, 25.0, 12.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.667972564697266, -12.285761833190918, -11.903550148010254, -11.521339416503906, -11.139127731323242, -10.756916999816895, -10.374706268310547, -9.992494583129883, -9.610283851623535, -9.228073120117188, -8.845861434936523, -8.463650703430176, -8.081439971923828, -7.699228286743164, -7.317017555236816, -6.9348063468933105, -6.552595138549805, -6.170383930206299, -5.788172721862793, -5.405961990356445, -5.0237507820129395, -4.641539573669434, -4.259328842163086, -3.87711763381958, -3.494906425476074, -3.1126952171325684, -2.7304842472076416, -2.348273277282715, -1.966062068939209, -1.5838509798049927, -1.2016398906707764, -0.8194289207458496, -0.43721771240234375, -0.05500662326812744, 0.32720446586608887, 0.7094155550003052, 1.0916266441345215, 1.4738377332687378, 1.856048822402954, 2.238259792327881, 2.6204710006713867, 3.0026822090148926, 3.3848931789398193, 3.767104148864746, 4.149315357208252, 4.531526565551758, 4.9137372970581055, 5.295948505401611, 5.678159713745117, 6.060370922088623, 6.442582130432129, 6.824792861938477, 7.207004070281982, 7.589215278625488, 7.971426010131836, 8.3536376953125, 8.735848426818848, 9.118059158325195, 9.50027084350586, 9.882481575012207, 10.264692306518555, 10.646903991699219, 11.029114723205566, 11.411325454711914, 11.793537139892578]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 8.0, 8.0, 14.0, 16.0, 19.0, 21.0, 20.0, 37.0, 22.0, 28.0, 30.0, 47.0, 56.0, 55.0, 53.0, 39.0, 48.0, 54.0, 42.0, 53.0, 37.0, 24.0, 34.0, 30.0, 29.0, 24.0, 18.0, 22.0, 17.0, 12.0, 11.0, 15.0, 9.0, 8.0, 7.0, 4.0, 6.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.865495204925537, -4.699230194091797, -4.532965660095215, -4.366700649261475, -4.200435638427734, -4.034171104431152, -3.867906093597412, -3.701641321182251, -3.53537654876709, -3.3691117763519287, -3.2028470039367676, -3.0365819931030273, -2.870317220687866, -2.704052448272705, -2.537787437438965, -2.3715226650238037, -2.2052578926086426, -2.0389931201934814, -1.8727282285690308, -1.70646333694458, -1.540198564529419, -1.3739337921142578, -1.2076689004898071, -1.0414040088653564, -0.8751392364501953, -0.7088744044303894, -0.5426095724105835, -0.3763447403907776, -0.21007990837097168, -0.04381507635116577, 0.12244975566864014, 0.2887146472930908, 0.45497989654541016, 0.6212447285652161, 0.787509560585022, 0.9537743926048279, 1.1200392246246338, 1.286303997039795, 1.4525688886642456, 1.6188337802886963, 1.7850985527038574, 1.9513633251190186, 2.1176280975341797, 2.28389310836792, 2.450157880783081, 2.616422653198242, 2.7826876640319824, 2.9489524364471436, 3.1152172088623047, 3.281481981277466, 3.447746753692627, 3.614011764526367, 3.7802765369415283, 3.9465413093566895, 4.11280632019043, 4.279070854187012, 4.445335865020752, 4.611600875854492, 4.777865409851074, 4.9441304206848145, 5.110395431518555, 5.276659965515137, 5.442924976348877, 5.609189987182617, 5.775454521179199]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 5.0, 12.0, 12.0, 27.0, 46.0, 87.0, 236.0, 526.0, 1580.0, 5741.0, 37047.0, 3994146.0, 138902.0, 11619.0, 2716.0, 872.0, 351.0, 169.0, 62.0, 41.0, 28.0, 24.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2255859375, -1.1739044189453125, -1.122222900390625, -1.0705413818359375, -1.01885986328125, -0.9671783447265625, -0.915496826171875, -0.8638153076171875, -0.8121337890625, -0.7604522705078125, -0.708770751953125, -0.6570892333984375, -0.60540771484375, -0.5537261962890625, -0.502044677734375, -0.4503631591796875, -0.398681640625, -0.3470001220703125, -0.295318603515625, -0.2436370849609375, -0.19195556640625, -0.1402740478515625, -0.088592529296875, -0.0369110107421875, 0.0147705078125, 0.0664520263671875, 0.118133544921875, 0.1698150634765625, 0.22149658203125, 0.2731781005859375, 0.324859619140625, 0.3765411376953125, 0.42822265625, 0.4799041748046875, 0.531585693359375, 0.5832672119140625, 0.63494873046875, 0.6866302490234375, 0.738311767578125, 0.7899932861328125, 0.8416748046875, 0.8933563232421875, 0.945037841796875, 0.9967193603515625, 1.04840087890625, 1.1000823974609375, 1.151763916015625, 1.2034454345703125, 1.255126953125, 1.3068084716796875, 1.358489990234375, 1.4101715087890625, 1.46185302734375, 1.5135345458984375, 1.565216064453125, 1.6168975830078125, 1.6685791015625, 1.7202606201171875, 1.771942138671875, 1.8236236572265625, 1.87530517578125, 1.9269866943359375, 1.978668212890625, 2.0303497314453125, 2.08203125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 14.0, 13.0, 25.0, 32.0, 31.0, 47.0, 32.0, 48.0, 46.0, 72.0, 68.0, 82.0, 62.0, 57.0, 64.0, 46.0, 47.0, 47.0, 26.0, 27.0, 20.0, 23.0, 13.0, 11.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.286865234375, -0.2781219482421875, -0.269378662109375, -0.2606353759765625, -0.25189208984375, -0.2431488037109375, -0.234405517578125, -0.2256622314453125, -0.2169189453125, -0.2081756591796875, -0.199432373046875, -0.1906890869140625, -0.18194580078125, -0.1732025146484375, -0.164459228515625, -0.1557159423828125, -0.14697265625, -0.1382293701171875, -0.129486083984375, -0.1207427978515625, -0.11199951171875, -0.1032562255859375, -0.094512939453125, -0.0857696533203125, -0.0770263671875, -0.0682830810546875, -0.059539794921875, -0.0507965087890625, -0.04205322265625, -0.0333099365234375, -0.024566650390625, -0.0158233642578125, -0.007080078125, 0.0016632080078125, 0.010406494140625, 0.0191497802734375, 0.02789306640625, 0.0366363525390625, 0.045379638671875, 0.0541229248046875, 0.0628662109375, 0.0716094970703125, 0.080352783203125, 0.0890960693359375, 0.09783935546875, 0.1065826416015625, 0.115325927734375, 0.1240692138671875, 0.1328125, 0.1415557861328125, 0.150299072265625, 0.1590423583984375, 0.16778564453125, 0.1765289306640625, 0.185272216796875, 0.1940155029296875, 0.2027587890625, 0.2115020751953125, 0.220245361328125, 0.2289886474609375, 0.23773193359375, 0.2464752197265625, 0.255218505859375, 0.2639617919921875, 0.272705078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 9.0, 10.0, 17.0, 17.0, 25.0, 39.0, 49.0, 76.0, 115.0, 145.0, 208.0, 304.0, 444.0, 598.0, 925.0, 1383.0, 2270.0, 3587.0, 6167.0, 11823.0, 25267.0, 68059.0, 314410.0, 3466621.0, 194881.0, 51919.0, 20764.0, 10018.0, 5279.0, 3014.0, 1991.0, 1247.0, 839.0, 548.0, 357.0, 246.0, 177.0, 112.0, 85.0, 63.0, 56.0, 30.0, 25.0, 20.0, 12.0, 14.0, 5.0, 6.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.53857421875, -0.520843505859375, -0.50311279296875, -0.485382080078125, -0.4676513671875, -0.449920654296875, -0.43218994140625, -0.414459228515625, -0.396728515625, -0.378997802734375, -0.36126708984375, -0.343536376953125, -0.3258056640625, -0.308074951171875, -0.29034423828125, -0.272613525390625, -0.2548828125, -0.237152099609375, -0.21942138671875, -0.201690673828125, -0.1839599609375, -0.166229248046875, -0.14849853515625, -0.130767822265625, -0.113037109375, -0.095306396484375, -0.07757568359375, -0.059844970703125, -0.0421142578125, -0.024383544921875, -0.00665283203125, 0.011077880859375, 0.02880859375, 0.046539306640625, 0.06427001953125, 0.082000732421875, 0.0997314453125, 0.117462158203125, 0.13519287109375, 0.152923583984375, 0.170654296875, 0.188385009765625, 0.20611572265625, 0.223846435546875, 0.2415771484375, 0.259307861328125, 0.27703857421875, 0.294769287109375, 0.3125, 0.330230712890625, 0.34796142578125, 0.365692138671875, 0.3834228515625, 0.401153564453125, 0.41888427734375, 0.436614990234375, 0.454345703125, 0.472076416015625, 0.48980712890625, 0.507537841796875, 0.5252685546875, 0.542999267578125, 0.56072998046875, 0.578460693359375, 0.59619140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 10.0, 12.0, 10.0, 30.0, 27.0, 44.0, 65.0, 161.0, 391.0, 2691.0, 332.0, 132.0, 66.0, 29.0, 20.0, 10.0, 8.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258056640625, -0.24957656860351562, -0.24109649658203125, -0.23261642456054688, -0.2241363525390625, -0.21565628051757812, -0.20717620849609375, -0.19869613647460938, -0.190216064453125, -0.18173599243164062, -0.17325592041015625, -0.16477584838867188, -0.1562957763671875, -0.14781570434570312, -0.13933563232421875, -0.13085556030273438, -0.12237548828125, -0.11389541625976562, -0.10541534423828125, -0.09693527221679688, -0.0884552001953125, -0.07997512817382812, -0.07149505615234375, -0.06301498413085938, -0.054534912109375, -0.046054840087890625, -0.03757476806640625, -0.029094696044921875, -0.0206146240234375, -0.012134552001953125, -0.00365447998046875, 0.004825592041015625, 0.0133056640625, 0.021785736083984375, 0.03026580810546875, 0.038745880126953125, 0.0472259521484375, 0.055706024169921875, 0.06418609619140625, 0.07266616821289062, 0.081146240234375, 0.08962631225585938, 0.09810638427734375, 0.10658645629882812, 0.1150665283203125, 0.12354660034179688, 0.13202667236328125, 0.14050674438476562, 0.14898681640625, 0.15746688842773438, 0.16594696044921875, 0.17442703247070312, 0.1829071044921875, 0.19138717651367188, 0.19986724853515625, 0.20834732055664062, 0.216827392578125, 0.22530746459960938, 0.23378753662109375, 0.24226760864257812, 0.2507476806640625, 0.2592277526855469, 0.26770782470703125, 0.2761878967285156, 0.28466796875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 13.0, 62.0, 437.0, 433.0, 54.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.496169924736023, -1.3140807151794434, -1.1319915056228638, -0.949902355670929, -0.7678131461143494, -0.5857239365577698, -0.40363478660583496, -0.22154557704925537, -0.03945636749267578, 0.14263282716274261, 0.324722021818161, 0.5068112015724182, 0.6889004111289978, 0.8709896206855774, 1.0530787706375122, 1.2351679801940918, 1.4172571897506714, 1.599346399307251, 1.7814356088638306, 1.9635248184204102, 2.1456139087677, 2.3277032375335693, 2.5097923278808594, 2.6918816566467285, 2.8739707469940186, 3.0560598373413086, 3.2381491661071777, 3.4202382564544678, 3.602327585220337, 3.784416675567627, 3.966506004333496, 4.148594856262207, 4.330684185028076, 4.512773513793945, 4.694862365722656, 4.876951694488525, 5.0590410232543945, 5.241130352020264, 5.423219203948975, 5.605308532714844, 5.787397861480713, 5.969487190246582, 6.151576042175293, 6.333665370941162, 6.515754699707031, 6.6978440284729, 6.879932880401611, 7.0620222091674805, 7.244111061096191, 7.4262003898620605, 7.6082892417907715, 7.790378570556641, 7.97246789932251, 8.154557228088379, 8.33664608001709, 8.518735885620117, 8.700824737548828, 8.882913589477539, 9.065003395080566, 9.247092247009277, 9.429181098937988, 9.611270904541016, 9.793359756469727, 9.975448608398438, 10.157538414001465]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 9.0, 3.0, 11.0, 8.0, 9.0, 12.0, 10.0, 18.0, 21.0, 35.0, 24.0, 37.0, 29.0, 29.0, 39.0, 32.0, 42.0, 37.0, 40.0, 30.0, 42.0, 30.0, 37.0, 36.0, 35.0, 27.0, 26.0, 34.0, 34.0, 25.0, 16.0, 22.0, 18.0, 15.0, 13.0, 12.0, 17.0, 9.0, 11.0, 11.0, 7.0, 3.0, 6.0, 8.0, 4.0, 3.0, 2.0, 5.0, 5.0, 0.0, 3.0, 2.0], "bins": [-0.6169381737709045, -0.5983559489250183, -0.5797737836837769, -0.5611915588378906, -0.5426093339920044, -0.5240271091461182, -0.5054449439048767, -0.4868627190589905, -0.46828052401542664, -0.4496983289718628, -0.43111610412597656, -0.4125339090824127, -0.3939517140388489, -0.37536948919296265, -0.3567872941493988, -0.33820509910583496, -0.31962287425994873, -0.3010406792163849, -0.28245845437049866, -0.2638762593269348, -0.24529404938220978, -0.22671183943748474, -0.2081296443939209, -0.18954743444919586, -0.17096522450447083, -0.1523830145597458, -0.13380080461502075, -0.11521860957145691, -0.09663639962673187, -0.07805418968200684, -0.059471987187862396, -0.04088978469371796, -0.022307515144348145, -0.0037253089249134064, 0.014856897294521332, 0.03343910351395607, 0.05202130973339081, 0.07060351967811584, 0.08918572217226028, 0.10776792466640472, 0.12635013461112976, 0.1449323445558548, 0.16351455450057983, 0.18209674954414368, 0.2006789594888687, 0.21926116943359375, 0.2378433644771576, 0.25642555952072144, 0.27500778436660767, 0.2935899794101715, 0.31217220425605774, 0.3307543992996216, 0.3493366241455078, 0.36791881918907166, 0.3865010142326355, 0.40508323907852173, 0.42366543412208557, 0.4422476291656494, 0.46082985401153564, 0.4794120490550995, 0.49799424409866333, 0.5165764689445496, 0.5351586937904358, 0.5537408590316772, 0.5723230838775635]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 24.0, 21.0, 38.0, 52.0, 88.0, 145.0, 226.0, 391.0, 728.0, 1449.0, 2899.0, 6961.0, 17046.0, 45485.0, 121144.0, 264252.0, 310132.0, 169206.0, 65818.0, 24735.0, 9658.0, 4007.0, 1915.0, 945.0, 484.0, 290.0, 145.0, 79.0, 57.0, 44.0, 20.0, 16.0, 14.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.55517578125, -0.5389366149902344, -0.5226974487304688, -0.5064582824707031, -0.4902191162109375, -0.4739799499511719, -0.45774078369140625, -0.4415016174316406, -0.425262451171875, -0.4090232849121094, -0.39278411865234375, -0.3765449523925781, -0.3603057861328125, -0.3440666198730469, -0.32782745361328125, -0.3115882873535156, -0.29534912109375, -0.2791099548339844, -0.26287078857421875, -0.24663162231445312, -0.2303924560546875, -0.21415328979492188, -0.19791412353515625, -0.18167495727539062, -0.165435791015625, -0.14919662475585938, -0.13295745849609375, -0.11671829223632812, -0.1004791259765625, -0.08423995971679688, -0.06800079345703125, -0.051761627197265625, -0.0355224609375, -0.019283294677734375, -0.00304412841796875, 0.013195037841796875, 0.0294342041015625, 0.045673370361328125, 0.06191253662109375, 0.07815170288085938, 0.094390869140625, 0.11063003540039062, 0.12686920166015625, 0.14310836791992188, 0.1593475341796875, 0.17558670043945312, 0.19182586669921875, 0.20806503295898438, 0.22430419921875, 0.24054336547851562, 0.25678253173828125, 0.2730216979980469, 0.2892608642578125, 0.3055000305175781, 0.32173919677734375, 0.3379783630371094, 0.354217529296875, 0.3704566955566406, 0.38669586181640625, 0.4029350280761719, 0.4191741943359375, 0.4354133605957031, 0.45165252685546875, 0.4678916931152344, 0.484130859375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 10.0, 10.0, 9.0, 20.0, 24.0, 20.0, 20.0, 32.0, 51.0, 54.0, 48.0, 57.0, 65.0, 55.0, 69.0, 71.0, 57.0, 53.0, 48.0, 41.0, 34.0, 22.0, 22.0, 21.0, 25.0, 18.0, 9.0, 12.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28515625, -0.2760581970214844, -0.26696014404296875, -0.2578620910644531, -0.2487640380859375, -0.23966598510742188, -0.23056793212890625, -0.22146987915039062, -0.212371826171875, -0.20327377319335938, -0.19417572021484375, -0.18507766723632812, -0.1759796142578125, -0.16688156127929688, -0.15778350830078125, -0.14868545532226562, -0.13958740234375, -0.13048934936523438, -0.12139129638671875, -0.11229324340820312, -0.1031951904296875, -0.09409713745117188, -0.08499908447265625, -0.07590103149414062, -0.066802978515625, -0.057704925537109375, -0.04860687255859375, -0.039508819580078125, -0.0304107666015625, -0.021312713623046875, -0.01221466064453125, -0.003116607666015625, 0.0059814453125, 0.015079498291015625, 0.02417755126953125, 0.033275604248046875, 0.0423736572265625, 0.051471710205078125, 0.06056976318359375, 0.06966781616210938, 0.078765869140625, 0.08786392211914062, 0.09696197509765625, 0.10606002807617188, 0.1151580810546875, 0.12425613403320312, 0.13335418701171875, 0.14245223999023438, 0.15155029296875, 0.16064834594726562, 0.16974639892578125, 0.17884445190429688, 0.1879425048828125, 0.19704055786132812, 0.20613861083984375, 0.21523666381835938, 0.224334716796875, 0.23343276977539062, 0.24253082275390625, 0.2516288757324219, 0.2607269287109375, 0.2698249816894531, 0.27892303466796875, 0.2880210876464844, 0.297119140625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 9.0, 6.0, 8.0, 19.0, 16.0, 26.0, 42.0, 55.0, 109.0, 159.0, 349.0, 689.0, 1799.0, 6395.0, 41874.0, 495114.0, 454202.0, 38321.0, 6078.0, 1792.0, 697.0, 333.0, 174.0, 116.0, 61.0, 33.0, 27.0, 15.0, 9.0, 7.0, 8.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.123046875, -1.0798187255859375, -1.036590576171875, -0.9933624267578125, -0.95013427734375, -0.9069061279296875, -0.863677978515625, -0.8204498291015625, -0.7772216796875, -0.7339935302734375, -0.690765380859375, -0.6475372314453125, -0.60430908203125, -0.5610809326171875, -0.517852783203125, -0.4746246337890625, -0.431396484375, -0.3881683349609375, -0.344940185546875, -0.3017120361328125, -0.25848388671875, -0.2152557373046875, -0.172027587890625, -0.1287994384765625, -0.0855712890625, -0.0423431396484375, 0.000885009765625, 0.0441131591796875, 0.08734130859375, 0.1305694580078125, 0.173797607421875, 0.2170257568359375, 0.26025390625, 0.3034820556640625, 0.346710205078125, 0.3899383544921875, 0.43316650390625, 0.4763946533203125, 0.519622802734375, 0.5628509521484375, 0.6060791015625, 0.6493072509765625, 0.692535400390625, 0.7357635498046875, 0.77899169921875, 0.8222198486328125, 0.865447998046875, 0.9086761474609375, 0.951904296875, 0.9951324462890625, 1.038360595703125, 1.0815887451171875, 1.12481689453125, 1.1680450439453125, 1.211273193359375, 1.2545013427734375, 1.2977294921875, 1.3409576416015625, 1.384185791015625, 1.4274139404296875, 1.47064208984375, 1.5138702392578125, 1.557098388671875, 1.6003265380859375, 1.6435546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 3.0, 5.0, 3.0, 6.0, 8.0, 8.0, 16.0, 19.0, 14.0, 28.0, 33.0, 34.0, 40.0, 59.0, 48.0, 45.0, 41.0, 45.0, 49.0, 49.0, 44.0, 47.0, 41.0, 33.0, 44.0, 40.0, 28.0, 27.0, 28.0, 28.0, 13.0, 14.0, 14.0, 6.0, 12.0, 6.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.072265625, -1.03314208984375, -0.9940185546875, -0.95489501953125, -0.915771484375, -0.87664794921875, -0.8375244140625, -0.79840087890625, -0.75927734375, -0.72015380859375, -0.6810302734375, -0.64190673828125, -0.602783203125, -0.56365966796875, -0.5245361328125, -0.48541259765625, -0.4462890625, -0.40716552734375, -0.3680419921875, -0.32891845703125, -0.289794921875, -0.25067138671875, -0.2115478515625, -0.17242431640625, -0.13330078125, -0.09417724609375, -0.0550537109375, -0.01593017578125, 0.023193359375, 0.06231689453125, 0.1014404296875, 0.14056396484375, 0.1796875, 0.21881103515625, 0.2579345703125, 0.29705810546875, 0.336181640625, 0.37530517578125, 0.4144287109375, 0.45355224609375, 0.49267578125, 0.53179931640625, 0.5709228515625, 0.61004638671875, 0.649169921875, 0.68829345703125, 0.7274169921875, 0.76654052734375, 0.8056640625, 0.84478759765625, 0.8839111328125, 0.92303466796875, 0.962158203125, 1.00128173828125, 1.0404052734375, 1.07952880859375, 1.11865234375, 1.15777587890625, 1.1968994140625, 1.23602294921875, 1.275146484375, 1.31427001953125, 1.3533935546875, 1.39251708984375, 1.431640625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 9.0, 19.0, 26.0, 56.0, 90.0, 160.0, 322.0, 901.0, 3154.0, 37849.0, 921936.0, 77569.0, 4518.0, 1113.0, 410.0, 198.0, 82.0, 48.0, 31.0, 23.0, 14.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9423828125, -1.8933258056640625, -1.844268798828125, -1.7952117919921875, -1.74615478515625, -1.6970977783203125, -1.648040771484375, -1.5989837646484375, -1.5499267578125, -1.5008697509765625, -1.451812744140625, -1.4027557373046875, -1.35369873046875, -1.3046417236328125, -1.255584716796875, -1.2065277099609375, -1.157470703125, -1.1084136962890625, -1.059356689453125, -1.0102996826171875, -0.96124267578125, -0.9121856689453125, -0.863128662109375, -0.8140716552734375, -0.7650146484375, -0.7159576416015625, -0.666900634765625, -0.6178436279296875, -0.56878662109375, -0.5197296142578125, -0.470672607421875, -0.4216156005859375, -0.37255859375, -0.3235015869140625, -0.274444580078125, -0.2253875732421875, -0.17633056640625, -0.1272735595703125, -0.078216552734375, -0.0291595458984375, 0.0198974609375, 0.0689544677734375, 0.118011474609375, 0.1670684814453125, 0.21612548828125, 0.2651824951171875, 0.314239501953125, 0.3632965087890625, 0.412353515625, 0.4614105224609375, 0.510467529296875, 0.5595245361328125, 0.60858154296875, 0.6576385498046875, 0.706695556640625, 0.7557525634765625, 0.8048095703125, 0.8538665771484375, 0.902923583984375, 0.9519805908203125, 1.00103759765625, 1.0500946044921875, 1.099151611328125, 1.1482086181640625, 1.197265625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 13.0, 21.0, 52.0, 60.0, 99.0, 136.0, 154.0, 137.0, 136.0, 60.0, 47.0, 30.0, 20.0, 12.0, 10.0, 3.0, 5.0, 4.0, 2.0, 1.0], "bins": [-0.0002639293670654297, -0.00025871768593788147, -0.00025350600481033325, -0.00024829432368278503, -0.00024308264255523682, -0.0002378709614276886, -0.00023265928030014038, -0.00022744759917259216, -0.00022223591804504395, -0.00021702423691749573, -0.0002118125557899475, -0.0002066008746623993, -0.00020138919353485107, -0.00019617751240730286, -0.00019096583127975464, -0.00018575415015220642, -0.0001805424690246582, -0.00017533078789710999, -0.00017011910676956177, -0.00016490742564201355, -0.00015969574451446533, -0.00015448406338691711, -0.0001492723822593689, -0.00014406070113182068, -0.00013884902000427246, -0.00013363733887672424, -0.00012842565774917603, -0.0001232139766216278, -0.00011800229549407959, -0.00011279061436653137, -0.00010757893323898315, -0.00010236725211143494, -9.715557098388672e-05, -9.19438898563385e-05, -8.673220872879028e-05, -8.152052760124207e-05, -7.630884647369385e-05, -7.109716534614563e-05, -6.588548421859741e-05, -6.0673803091049194e-05, -5.5462121963500977e-05, -5.025044083595276e-05, -4.503875970840454e-05, -3.982707858085632e-05, -3.4615397453308105e-05, -2.9403716325759888e-05, -2.419203519821167e-05, -1.8980354070663452e-05, -1.3768672943115234e-05, -8.556991815567017e-06, -3.345310688018799e-06, 1.866370439529419e-06, 7.078051567077637e-06, 1.2289732694625854e-05, 1.7501413822174072e-05, 2.271309494972229e-05, 2.7924776077270508e-05, 3.3136457204818726e-05, 3.834813833236694e-05, 4.355981945991516e-05, 4.877150058746338e-05, 5.39831817150116e-05, 5.9194862842559814e-05, 6.440654397010803e-05, 6.961822509765625e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 7.0, 6.0, 17.0, 14.0, 31.0, 43.0, 84.0, 137.0, 272.0, 575.0, 1511.0, 5738.0, 52369.0, 803248.0, 169575.0, 11046.0, 2264.0, 797.0, 346.0, 174.0, 101.0, 71.0, 34.0, 25.0, 12.0, 13.0, 10.0, 10.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.125, -1.0915985107421875, -1.058197021484375, -1.0247955322265625, -0.99139404296875, -0.9579925537109375, -0.924591064453125, -0.8911895751953125, -0.8577880859375, -0.8243865966796875, -0.790985107421875, -0.7575836181640625, -0.72418212890625, -0.6907806396484375, -0.657379150390625, -0.6239776611328125, -0.590576171875, -0.5571746826171875, -0.523773193359375, -0.4903717041015625, -0.45697021484375, -0.4235687255859375, -0.390167236328125, -0.3567657470703125, -0.3233642578125, -0.2899627685546875, -0.256561279296875, -0.2231597900390625, -0.18975830078125, -0.1563568115234375, -0.122955322265625, -0.0895538330078125, -0.05615234375, -0.0227508544921875, 0.010650634765625, 0.0440521240234375, 0.07745361328125, 0.1108551025390625, 0.144256591796875, 0.1776580810546875, 0.2110595703125, 0.2444610595703125, 0.277862548828125, 0.3112640380859375, 0.34466552734375, 0.3780670166015625, 0.411468505859375, 0.4448699951171875, 0.478271484375, 0.5116729736328125, 0.545074462890625, 0.5784759521484375, 0.61187744140625, 0.6452789306640625, 0.678680419921875, 0.7120819091796875, 0.7454833984375, 0.7788848876953125, 0.812286376953125, 0.8456878662109375, 0.87908935546875, 0.9124908447265625, 0.945892333984375, 0.9792938232421875, 1.0126953125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 16.0, 55.0, 96.0, 182.0, 189.0, 204.0, 111.0, 72.0, 37.0, 18.0, 7.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8857421875, -0.8294525146484375, -0.773162841796875, -0.7168731689453125, -0.66058349609375, -0.6042938232421875, -0.548004150390625, -0.4917144775390625, -0.4354248046875, -0.3791351318359375, -0.322845458984375, -0.2665557861328125, -0.21026611328125, -0.1539764404296875, -0.097686767578125, -0.0413970947265625, 0.014892578125, 0.0711822509765625, 0.127471923828125, 0.1837615966796875, 0.24005126953125, 0.2963409423828125, 0.352630615234375, 0.4089202880859375, 0.4652099609375, 0.5214996337890625, 0.577789306640625, 0.6340789794921875, 0.69036865234375, 0.7466583251953125, 0.802947998046875, 0.8592376708984375, 0.91552734375, 0.9718170166015625, 1.028106689453125, 1.0843963623046875, 1.14068603515625, 1.1969757080078125, 1.253265380859375, 1.3095550537109375, 1.3658447265625, 1.4221343994140625, 1.478424072265625, 1.5347137451171875, 1.59100341796875, 1.6472930908203125, 1.703582763671875, 1.7598724365234375, 1.816162109375, 1.8724517822265625, 1.928741455078125, 1.9850311279296875, 2.04132080078125, 2.0976104736328125, 2.153900146484375, 2.2101898193359375, 2.2664794921875, 2.3227691650390625, 2.379058837890625, 2.4353485107421875, 2.49163818359375, 2.5479278564453125, 2.604217529296875, 2.6605072021484375, 2.716796875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 20.0, 71.0, 213.0, 363.0, 240.0, 62.0, 26.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.64280700683594, -39.80159378051758, -38.96038055419922, -38.119171142578125, -37.277957916259766, -36.436744689941406, -35.59553527832031, -34.75432205200195, -33.913108825683594, -33.071895599365234, -32.230682373046875, -31.38947296142578, -30.548259735107422, -29.707046508789062, -28.865835189819336, -28.02462387084961, -27.18341064453125, -26.34219741821289, -25.500986099243164, -24.659774780273438, -23.818561553955078, -22.97734832763672, -22.136137008666992, -21.294925689697266, -20.453712463378906, -19.612499237060547, -18.77128791809082, -17.930076599121094, -17.088863372802734, -16.247650146484375, -15.406438827514648, -14.565226554870605, -13.724013328552246, -12.882801055908203, -12.04158878326416, -11.200376510620117, -10.359164237976074, -9.517951965332031, -8.676739692687988, -7.835527420043945, -6.994315147399902, -6.153102874755859, -5.311890602111816, -4.470678329467773, -3.6294660568237305, -2.7882537841796875, -1.9470415115356445, -1.1058292388916016, -0.2646169662475586, 0.5765953063964844, 1.4178075790405273, 2.2590198516845703, 3.1002321243286133, 3.9414443969726562, 4.782656669616699, 5.623868942260742, 6.465081214904785, 7.306293487548828, 8.147505760192871, 8.988718032836914, 9.829930305480957, 10.671142578125, 11.512354850769043, 12.353567123413086, 13.194779396057129]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 8.0, 7.0, 9.0, 9.0, 13.0, 11.0, 17.0, 25.0, 30.0, 33.0, 37.0, 34.0, 35.0, 51.0, 53.0, 62.0, 54.0, 50.0, 55.0, 53.0, 63.0, 42.0, 51.0, 32.0, 25.0, 31.0, 21.0, 25.0, 17.0, 11.0, 11.0, 10.0, 3.0, 5.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.026670455932617, -5.824587821960449, -5.6225056648254395, -5.42042350769043, -5.218340873718262, -5.016258239746094, -4.814176082611084, -4.612093925476074, -4.410011291503906, -4.207928657531738, -4.0058465003967285, -3.8037641048431396, -3.601681709289551, -3.399599313735962, -3.197516918182373, -2.995434522628784, -2.7933521270751953, -2.5912697315216064, -2.3891873359680176, -2.1871049404144287, -1.9850225448608398, -1.782940149307251, -1.580857753753662, -1.3787753582000732, -1.1766929626464844, -0.9746105670928955, -0.7725281715393066, -0.5704457759857178, -0.3683633804321289, -0.16628098487854004, 0.03580141067504883, 0.2378838062286377, 0.43996667861938477, 0.6420490741729736, 0.8441314697265625, 1.0462138652801514, 1.2482962608337402, 1.450378656387329, 1.652461051940918, 1.8545434474945068, 2.0566258430480957, 2.2587082386016846, 2.4607906341552734, 2.6628730297088623, 2.864955425262451, 3.06703782081604, 3.269120216369629, 3.4712026119232178, 3.6732850074768066, 3.8753674030303955, 4.077449798583984, 4.279532432556152, 4.481614589691162, 4.683696746826172, 4.88577938079834, 5.087862014770508, 5.289944171905518, 5.492026329040527, 5.694108963012695, 5.896191596984863, 6.098273754119873, 6.300355911254883, 6.502438545227051, 6.704521179199219, 6.9066033363342285]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 10.0, 12.0, 18.0, 21.0, 37.0, 85.0, 123.0, 221.0, 473.0, 1112.0, 3041.0, 11142.0, 86111.0, 4035176.0, 44899.0, 7723.0, 2255.0, 868.0, 428.0, 210.0, 109.0, 72.0, 51.0, 37.0, 15.0, 7.0, 11.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8130722045898438, -0.7662811279296875, -0.7194900512695312, -0.672698974609375, -0.6259078979492188, -0.5791168212890625, -0.5323257446289062, -0.48553466796875, -0.43874359130859375, -0.3919525146484375, -0.34516143798828125, -0.298370361328125, -0.25157928466796875, -0.2047882080078125, -0.15799713134765625, -0.1112060546875, -0.06441497802734375, -0.0176239013671875, 0.02916717529296875, 0.075958251953125, 0.12274932861328125, 0.1695404052734375, 0.21633148193359375, 0.26312255859375, 0.30991363525390625, 0.3567047119140625, 0.40349578857421875, 0.450286865234375, 0.49707794189453125, 0.5438690185546875, 0.5906600952148438, 0.637451171875, 0.6842422485351562, 0.7310333251953125, 0.7778244018554688, 0.824615478515625, 0.8714065551757812, 0.9181976318359375, 0.9649887084960938, 1.01177978515625, 1.0585708618164062, 1.1053619384765625, 1.1521530151367188, 1.198944091796875, 1.2457351684570312, 1.2925262451171875, 1.3393173217773438, 1.3861083984375, 1.4328994750976562, 1.4796905517578125, 1.5264816284179688, 1.573272705078125, 1.6200637817382812, 1.6668548583984375, 1.7136459350585938, 1.76043701171875, 1.8072280883789062, 1.8540191650390625, 1.9008102416992188, 1.947601318359375, 1.9943923950195312, 2.0411834716796875, 2.0879745483398438, 2.134765625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 6.0, 4.0, 9.0, 11.0, 17.0, 17.0, 37.0, 42.0, 40.0, 63.0, 75.0, 86.0, 80.0, 71.0, 77.0, 72.0, 58.0, 62.0, 47.0, 27.0, 25.0, 18.0, 11.0, 14.0, 6.0, 7.0, 9.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.2942619323730469, -0.28163909912109375, -0.2690162658691406, -0.2563934326171875, -0.24377059936523438, -0.23114776611328125, -0.21852493286132812, -0.205902099609375, -0.19327926635742188, -0.18065643310546875, -0.16803359985351562, -0.1554107666015625, -0.14278793334960938, -0.13016510009765625, -0.11754226684570312, -0.10491943359375, -0.09229660034179688, -0.07967376708984375, -0.06705093383789062, -0.0544281005859375, -0.041805267333984375, -0.02918243408203125, -0.016559600830078125, -0.003936767578125, 0.008686065673828125, 0.02130889892578125, 0.033931732177734375, 0.0465545654296875, 0.059177398681640625, 0.07180023193359375, 0.08442306518554688, 0.0970458984375, 0.10966873168945312, 0.12229156494140625, 0.13491439819335938, 0.1475372314453125, 0.16016006469726562, 0.17278289794921875, 0.18540573120117188, 0.198028564453125, 0.21065139770507812, 0.22327423095703125, 0.23589706420898438, 0.2485198974609375, 0.2611427307128906, 0.27376556396484375, 0.2863883972167969, 0.29901123046875, 0.3116340637207031, 0.32425689697265625, 0.3368797302246094, 0.3495025634765625, 0.3621253967285156, 0.37474822998046875, 0.3873710632324219, 0.399993896484375, 0.4126167297363281, 0.42523956298828125, 0.4378623962402344, 0.4504852294921875, 0.4631080627441406, 0.47573089599609375, 0.4883537292480469, 0.5009765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 4.0, 5.0, 11.0, 14.0, 19.0, 34.0, 43.0, 43.0, 76.0, 98.0, 194.0, 274.0, 465.0, 714.0, 1412.0, 3083.0, 8039.0, 28261.0, 222537.0, 3847756.0, 58605.0, 13417.0, 4611.0, 2041.0, 1048.0, 511.0, 317.0, 214.0, 160.0, 93.0, 50.0, 37.0, 18.0, 27.0, 15.0, 9.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90869140625, -0.8753128051757812, -0.8419342041015625, -0.8085556030273438, -0.775177001953125, -0.7417984008789062, -0.7084197998046875, -0.6750411987304688, -0.64166259765625, -0.6082839965820312, -0.5749053955078125, -0.5415267944335938, -0.508148193359375, -0.47476959228515625, -0.4413909912109375, -0.40801239013671875, -0.3746337890625, -0.34125518798828125, -0.3078765869140625, -0.27449798583984375, -0.241119384765625, -0.20774078369140625, -0.1743621826171875, -0.14098358154296875, -0.10760498046875, -0.07422637939453125, -0.0408477783203125, -0.00746917724609375, 0.025909423828125, 0.05928802490234375, 0.0926666259765625, 0.12604522705078125, 0.159423828125, 0.19280242919921875, 0.2261810302734375, 0.25955963134765625, 0.292938232421875, 0.32631683349609375, 0.3596954345703125, 0.39307403564453125, 0.42645263671875, 0.45983123779296875, 0.4932098388671875, 0.5265884399414062, 0.559967041015625, 0.5933456420898438, 0.6267242431640625, 0.6601028442382812, 0.6934814453125, 0.7268600463867188, 0.7602386474609375, 0.7936172485351562, 0.826995849609375, 0.8603744506835938, 0.8937530517578125, 0.9271316528320312, 0.96051025390625, 0.9938888549804688, 1.0272674560546875, 1.0606460571289062, 1.094024658203125, 1.1274032592773438, 1.1607818603515625, 1.1941604614257812, 1.2275390625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 12.0, 23.0, 26.0, 59.0, 125.0, 2823.0, 771.0, 125.0, 43.0, 25.0, 9.0, 8.0, 8.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389404296875, -0.3779449462890625, -0.366485595703125, -0.3550262451171875, -0.34356689453125, -0.3321075439453125, -0.320648193359375, -0.3091888427734375, -0.2977294921875, -0.2862701416015625, -0.274810791015625, -0.2633514404296875, -0.25189208984375, -0.2404327392578125, -0.228973388671875, -0.2175140380859375, -0.2060546875, -0.1945953369140625, -0.183135986328125, -0.1716766357421875, -0.16021728515625, -0.1487579345703125, -0.137298583984375, -0.1258392333984375, -0.1143798828125, -0.1029205322265625, -0.091461181640625, -0.0800018310546875, -0.06854248046875, -0.0570831298828125, -0.045623779296875, -0.0341644287109375, -0.022705078125, -0.0112457275390625, 0.000213623046875, 0.0116729736328125, 0.02313232421875, 0.0345916748046875, 0.046051025390625, 0.0575103759765625, 0.0689697265625, 0.0804290771484375, 0.091888427734375, 0.1033477783203125, 0.11480712890625, 0.1262664794921875, 0.137725830078125, 0.1491851806640625, 0.16064453125, 0.1721038818359375, 0.183563232421875, 0.1950225830078125, 0.20648193359375, 0.2179412841796875, 0.229400634765625, 0.2408599853515625, 0.2523193359375, 0.2637786865234375, 0.275238037109375, 0.2866973876953125, 0.29815673828125, 0.3096160888671875, 0.321075439453125, 0.3325347900390625, 0.343994140625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 11.0, 10.0, 13.0, 39.0, 105.0, 141.0, 168.0, 180.0, 145.0, 79.0, 56.0, 29.0, 14.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0764315128326416, -1.0300545692443848, -0.9836775064468384, -0.9373005628585815, -0.8909235596656799, -0.8445465564727783, -0.7981696128845215, -0.7517926096916199, -0.7054156064987183, -0.6590386033058167, -0.612661600112915, -0.5662846565246582, -0.5199076533317566, -0.473530650138855, -0.42715367674827576, -0.38077670335769653, -0.3343997001647949, -0.2880226969718933, -0.2416457235813141, -0.19526873528957367, -0.14889174699783325, -0.10251475870609283, -0.05613777041435242, -0.009760797023773193, 0.03661620616912842, 0.08299319446086884, 0.12937018275260925, 0.17574717104434967, 0.2221241593360901, 0.2685011625289917, 0.3148781359195709, 0.36125510931015015, 0.4076322317123413, 0.4540092349052429, 0.5003862380981445, 0.5467631816864014, 0.593140184879303, 0.6395171880722046, 0.6858941316604614, 0.732271134853363, 0.7786481380462646, 0.8250251412391663, 0.8714021444320679, 0.9177790880203247, 0.9641560912132263, 1.010533094406128, 1.0569100379943848, 1.1032869815826416, 1.149664044380188, 1.1960409879684448, 1.2424180507659912, 1.288794994354248, 1.3351719379425049, 1.3815490007400513, 1.427925944328308, 1.4743030071258545, 1.5206799507141113, 1.5670568943023682, 1.6134339570999146, 1.6598109006881714, 1.7061879634857178, 1.7525649070739746, 1.7989418506622314, 1.8453187942504883, 1.8916958570480347]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 5.0, 8.0, 11.0, 9.0, 17.0, 21.0, 27.0, 28.0, 34.0, 45.0, 57.0, 48.0, 57.0, 54.0, 41.0, 53.0, 55.0, 62.0, 61.0, 46.0, 51.0, 40.0, 38.0, 23.0, 25.0, 18.0, 17.0, 12.0, 15.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6839041709899902, -0.6615318655967712, -0.6391595005989075, -0.6167871952056885, -0.5944148302078247, -0.5720425248146057, -0.5496701598167419, -0.527297854423523, -0.5049254894256592, -0.4825531542301178, -0.4601808190345764, -0.43780848383903503, -0.41543614864349365, -0.39306381344795227, -0.3706914782524109, -0.3483191728591919, -0.3259468376636505, -0.30357450246810913, -0.28120216727256775, -0.25882983207702637, -0.23645749688148499, -0.2140851616859436, -0.19171284139156342, -0.16934050619602203, -0.14696817100048065, -0.12459583580493927, -0.10222350060939789, -0.0798511728644371, -0.05747883766889572, -0.03510650247335434, -0.012734174728393555, 0.009638160467147827, 0.03201049566268921, 0.05438283085823059, 0.07675516605377197, 0.09912749379873276, 0.12149982899427414, 0.14387217164039612, 0.1662444919347763, 0.1886168271303177, 0.21098916232585907, 0.23336149752140045, 0.25573381781578064, 0.278106153011322, 0.3004784882068634, 0.3228508234024048, 0.34522315859794617, 0.36759549379348755, 0.38996782898902893, 0.4123401641845703, 0.4347124993801117, 0.4570848345756531, 0.47945716977119446, 0.5018295049667358, 0.5242018103599548, 0.5465741753578186, 0.5689464807510376, 0.5913187861442566, 0.6136911511421204, 0.6360634565353394, 0.6584358215332031, 0.6808081269264221, 0.7031804919242859, 0.7255527973175049, 0.7479251623153687]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 10.0, 8.0, 9.0, 22.0, 23.0, 26.0, 56.0, 57.0, 112.0, 190.0, 275.0, 455.0, 800.0, 1498.0, 2942.0, 6742.0, 16695.0, 47506.0, 146472.0, 355567.0, 301881.0, 108231.0, 35520.0, 12816.0, 5217.0, 2448.0, 1227.0, 665.0, 397.0, 227.0, 134.0, 88.0, 65.0, 58.0, 35.0, 23.0, 19.0, 12.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.58447265625, -0.5655364990234375, -0.546600341796875, -0.5276641845703125, -0.50872802734375, -0.4897918701171875, -0.470855712890625, -0.4519195556640625, -0.4329833984375, -0.4140472412109375, -0.395111083984375, -0.3761749267578125, -0.35723876953125, -0.3383026123046875, -0.319366455078125, -0.3004302978515625, -0.281494140625, -0.2625579833984375, -0.243621826171875, -0.2246856689453125, -0.20574951171875, -0.1868133544921875, -0.167877197265625, -0.1489410400390625, -0.1300048828125, -0.1110687255859375, -0.092132568359375, -0.0731964111328125, -0.05426025390625, -0.0353240966796875, -0.016387939453125, 0.0025482177734375, 0.021484375, 0.0404205322265625, 0.059356689453125, 0.0782928466796875, 0.09722900390625, 0.1161651611328125, 0.135101318359375, 0.1540374755859375, 0.1729736328125, 0.1919097900390625, 0.210845947265625, 0.2297821044921875, 0.24871826171875, 0.2676544189453125, 0.286590576171875, 0.3055267333984375, 0.324462890625, 0.3433990478515625, 0.362335205078125, 0.3812713623046875, 0.40020751953125, 0.4191436767578125, 0.438079833984375, 0.4570159912109375, 0.4759521484375, 0.4948883056640625, 0.513824462890625, 0.5327606201171875, 0.55169677734375, 0.5706329345703125, 0.589569091796875, 0.6085052490234375, 0.62744140625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 14.0, 15.0, 18.0, 17.0, 22.0, 32.0, 40.0, 49.0, 57.0, 72.0, 66.0, 74.0, 69.0, 57.0, 62.0, 51.0, 57.0, 34.0, 43.0, 27.0, 22.0, 23.0, 20.0, 12.0, 9.0, 4.0, 6.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28564453125, -0.27442169189453125, -0.2631988525390625, -0.25197601318359375, -0.240753173828125, -0.22953033447265625, -0.2183074951171875, -0.20708465576171875, -0.19586181640625, -0.18463897705078125, -0.1734161376953125, -0.16219329833984375, -0.150970458984375, -0.13974761962890625, -0.1285247802734375, -0.11730194091796875, -0.1060791015625, -0.09485626220703125, -0.0836334228515625, -0.07241058349609375, -0.061187744140625, -0.04996490478515625, -0.0387420654296875, -0.02751922607421875, -0.01629638671875, -0.00507354736328125, 0.0061492919921875, 0.01737213134765625, 0.028594970703125, 0.03981781005859375, 0.0510406494140625, 0.06226348876953125, 0.073486328125, 0.08470916748046875, 0.0959320068359375, 0.10715484619140625, 0.118377685546875, 0.12960052490234375, 0.1408233642578125, 0.15204620361328125, 0.16326904296875, 0.17449188232421875, 0.1857147216796875, 0.19693756103515625, 0.208160400390625, 0.21938323974609375, 0.2306060791015625, 0.24182891845703125, 0.2530517578125, 0.26427459716796875, 0.2754974365234375, 0.28672027587890625, 0.297943115234375, 0.30916595458984375, 0.3203887939453125, 0.33161163330078125, 0.34283447265625, 0.35405731201171875, 0.3652801513671875, 0.37650299072265625, 0.387725830078125, 0.39894866943359375, 0.4101715087890625, 0.42139434814453125, 0.4326171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 10.0, 7.0, 11.0, 19.0, 15.0, 31.0, 52.0, 61.0, 104.0, 164.0, 248.0, 398.0, 864.0, 2175.0, 8246.0, 64091.0, 608164.0, 326135.0, 29689.0, 4822.0, 1541.0, 686.0, 320.0, 214.0, 159.0, 107.0, 65.0, 37.0, 27.0, 23.0, 15.0, 12.0, 11.0, 6.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.32421875, -1.287261962890625, -1.25030517578125, -1.213348388671875, -1.1763916015625, -1.139434814453125, -1.10247802734375, -1.065521240234375, -1.028564453125, -0.991607666015625, -0.95465087890625, -0.917694091796875, -0.8807373046875, -0.843780517578125, -0.80682373046875, -0.769866943359375, -0.73291015625, -0.695953369140625, -0.65899658203125, -0.622039794921875, -0.5850830078125, -0.548126220703125, -0.51116943359375, -0.474212646484375, -0.437255859375, -0.400299072265625, -0.36334228515625, -0.326385498046875, -0.2894287109375, -0.252471923828125, -0.21551513671875, -0.178558349609375, -0.1416015625, -0.104644775390625, -0.06768798828125, -0.030731201171875, 0.0062255859375, 0.043182373046875, 0.08013916015625, 0.117095947265625, 0.154052734375, 0.191009521484375, 0.22796630859375, 0.264923095703125, 0.3018798828125, 0.338836669921875, 0.37579345703125, 0.412750244140625, 0.44970703125, 0.486663818359375, 0.52362060546875, 0.560577392578125, 0.5975341796875, 0.634490966796875, 0.67144775390625, 0.708404541015625, 0.745361328125, 0.782318115234375, 0.81927490234375, 0.856231689453125, 0.8931884765625, 0.930145263671875, 0.96710205078125, 1.004058837890625, 1.041015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 4.0, 4.0, 5.0, 9.0, 6.0, 10.0, 13.0, 19.0, 17.0, 21.0, 21.0, 19.0, 30.0, 37.0, 29.0, 39.0, 36.0, 37.0, 52.0, 38.0, 42.0, 47.0, 46.0, 35.0, 36.0, 33.0, 33.0, 29.0, 31.0, 23.0, 30.0, 27.0, 24.0, 24.0, 18.0, 10.0, 21.0, 10.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 6.0, 0.0, 3.0], "bins": [-1.2255859375, -1.1900177001953125, -1.154449462890625, -1.1188812255859375, -1.08331298828125, -1.0477447509765625, -1.012176513671875, -0.9766082763671875, -0.9410400390625, -0.9054718017578125, -0.869903564453125, -0.8343353271484375, -0.79876708984375, -0.7631988525390625, -0.727630615234375, -0.6920623779296875, -0.656494140625, -0.6209259033203125, -0.585357666015625, -0.5497894287109375, -0.51422119140625, -0.4786529541015625, -0.443084716796875, -0.4075164794921875, -0.3719482421875, -0.3363800048828125, -0.300811767578125, -0.2652435302734375, -0.22967529296875, -0.1941070556640625, -0.158538818359375, -0.1229705810546875, -0.08740234375, -0.0518341064453125, -0.016265869140625, 0.0193023681640625, 0.05487060546875, 0.0904388427734375, 0.126007080078125, 0.1615753173828125, 0.1971435546875, 0.2327117919921875, 0.268280029296875, 0.3038482666015625, 0.33941650390625, 0.3749847412109375, 0.410552978515625, 0.4461212158203125, 0.481689453125, 0.5172576904296875, 0.552825927734375, 0.5883941650390625, 0.62396240234375, 0.6595306396484375, 0.695098876953125, 0.7306671142578125, 0.7662353515625, 0.8018035888671875, 0.837371826171875, 0.8729400634765625, 0.90850830078125, 0.9440765380859375, 0.979644775390625, 1.0152130126953125, 1.05078125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 8.0, 15.0, 27.0, 41.0, 61.0, 134.0, 296.0, 1079.0, 6821.0, 604075.0, 428641.0, 5875.0, 923.0, 282.0, 101.0, 54.0, 40.0, 19.0, 20.0, 15.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6904296875, -1.64208984375, -1.59375, -1.54541015625, -1.4970703125, -1.44873046875, -1.400390625, -1.35205078125, -1.3037109375, -1.25537109375, -1.20703125, -1.15869140625, -1.1103515625, -1.06201171875, -1.013671875, -0.96533203125, -0.9169921875, -0.86865234375, -0.8203125, -0.77197265625, -0.7236328125, -0.67529296875, -0.626953125, -0.57861328125, -0.5302734375, -0.48193359375, -0.43359375, -0.38525390625, -0.3369140625, -0.28857421875, -0.240234375, -0.19189453125, -0.1435546875, -0.09521484375, -0.046875, 0.00146484375, 0.0498046875, 0.09814453125, 0.146484375, 0.19482421875, 0.2431640625, 0.29150390625, 0.33984375, 0.38818359375, 0.4365234375, 0.48486328125, 0.533203125, 0.58154296875, 0.6298828125, 0.67822265625, 0.7265625, 0.77490234375, 0.8232421875, 0.87158203125, 0.919921875, 0.96826171875, 1.0166015625, 1.06494140625, 1.11328125, 1.16162109375, 1.2099609375, 1.25830078125, 1.306640625, 1.35498046875, 1.4033203125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 9.0, 15.0, 15.0, 22.0, 34.0, 44.0, 44.0, 57.0, 103.0, 98.0, 108.0, 109.0, 76.0, 77.0, 53.0, 39.0, 25.0, 15.0, 12.0, 11.0, 10.0, 3.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.580352783203125e-05, -6.271898746490479e-05, -5.963444709777832e-05, -5.6549906730651855e-05, -5.346536636352539e-05, -5.0380825996398926e-05, -4.729628562927246e-05, -4.4211745262145996e-05, -4.112720489501953e-05, -3.8042664527893066e-05, -3.49581241607666e-05, -3.187358379364014e-05, -2.8789043426513672e-05, -2.5704503059387207e-05, -2.2619962692260742e-05, -1.9535422325134277e-05, -1.6450881958007812e-05, -1.3366341590881348e-05, -1.0281801223754883e-05, -7.197260856628418e-06, -4.112720489501953e-06, -1.0281801223754883e-06, 2.0563602447509766e-06, 5.140900611877441e-06, 8.225440979003906e-06, 1.1309981346130371e-05, 1.4394521713256836e-05, 1.74790620803833e-05, 2.0563602447509766e-05, 2.364814281463623e-05, 2.6732683181762695e-05, 2.981722354888916e-05, 3.2901763916015625e-05, 3.598630428314209e-05, 3.9070844650268555e-05, 4.215538501739502e-05, 4.5239925384521484e-05, 4.832446575164795e-05, 5.1409006118774414e-05, 5.449354648590088e-05, 5.7578086853027344e-05, 6.066262722015381e-05, 6.374716758728027e-05, 6.683170795440674e-05, 6.99162483215332e-05, 7.300078868865967e-05, 7.608532905578613e-05, 7.91698694229126e-05, 8.225440979003906e-05, 8.533895015716553e-05, 8.842349052429199e-05, 9.150803089141846e-05, 9.459257125854492e-05, 9.767711162567139e-05, 0.00010076165199279785, 0.00010384619235992432, 0.00010693073272705078, 0.00011001527309417725, 0.00011309981346130371, 0.00011618435382843018, 0.00011926889419555664, 0.0001223534345626831, 0.00012543797492980957, 0.00012852251529693604, 0.0001316070556640625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 15.0, 18.0, 27.0, 53.0, 104.0, 171.0, 377.0, 1086.0, 4070.0, 40275.0, 864895.0, 127688.0, 7259.0, 1503.0, 497.0, 215.0, 109.0, 58.0, 35.0, 30.0, 18.0, 12.0, 6.0, 10.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.041015625, -1.0109786987304688, -0.9809417724609375, -0.9509048461914062, -0.920867919921875, -0.8908309936523438, -0.8607940673828125, -0.8307571411132812, -0.80072021484375, -0.7706832885742188, -0.7406463623046875, -0.7106094360351562, -0.680572509765625, -0.6505355834960938, -0.6204986572265625, -0.5904617309570312, -0.5604248046875, -0.5303878784179688, -0.5003509521484375, -0.47031402587890625, -0.440277099609375, -0.41024017333984375, -0.3802032470703125, -0.35016632080078125, -0.32012939453125, -0.29009246826171875, -0.2600555419921875, -0.23001861572265625, -0.199981689453125, -0.16994476318359375, -0.1399078369140625, -0.10987091064453125, -0.079833984375, -0.04979705810546875, -0.0197601318359375, 0.01027679443359375, 0.040313720703125, 0.07035064697265625, 0.1003875732421875, 0.13042449951171875, 0.16046142578125, 0.19049835205078125, 0.2205352783203125, 0.25057220458984375, 0.280609130859375, 0.31064605712890625, 0.3406829833984375, 0.37071990966796875, 0.4007568359375, 0.43079376220703125, 0.4608306884765625, 0.49086761474609375, 0.520904541015625, 0.5509414672851562, 0.5809783935546875, 0.6110153198242188, 0.64105224609375, 0.6710891723632812, 0.7011260986328125, 0.7311630249023438, 0.761199951171875, 0.7912368774414062, 0.8212738037109375, 0.8513107299804688, 0.88134765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 17.0, 16.0, 21.0, 35.0, 30.0, 59.0, 57.0, 67.0, 82.0, 107.0, 84.0, 79.0, 69.0, 53.0, 46.0, 49.0, 32.0, 19.0, 8.0, 16.0, 9.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40673828125, -0.3888702392578125, -0.371002197265625, -0.3531341552734375, -0.33526611328125, -0.3173980712890625, -0.299530029296875, -0.2816619873046875, -0.2637939453125, -0.2459259033203125, -0.228057861328125, -0.2101898193359375, -0.19232177734375, -0.1744537353515625, -0.156585693359375, -0.1387176513671875, -0.120849609375, -0.1029815673828125, -0.085113525390625, -0.0672454833984375, -0.04937744140625, -0.0315093994140625, -0.013641357421875, 0.0042266845703125, 0.0220947265625, 0.0399627685546875, 0.057830810546875, 0.0756988525390625, 0.09356689453125, 0.1114349365234375, 0.129302978515625, 0.1471710205078125, 0.1650390625, 0.1829071044921875, 0.200775146484375, 0.2186431884765625, 0.23651123046875, 0.2543792724609375, 0.272247314453125, 0.2901153564453125, 0.3079833984375, 0.3258514404296875, 0.343719482421875, 0.3615875244140625, 0.37945556640625, 0.3973236083984375, 0.415191650390625, 0.4330596923828125, 0.450927734375, 0.4687957763671875, 0.486663818359375, 0.5045318603515625, 0.52239990234375, 0.5402679443359375, 0.558135986328125, 0.5760040283203125, 0.5938720703125, 0.6117401123046875, 0.629608154296875, 0.6474761962890625, 0.66534423828125, 0.6832122802734375, 0.701080322265625, 0.7189483642578125, 0.73681640625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 8.0, 36.0, 50.0, 119.0, 159.0, 197.0, 164.0, 114.0, 79.0, 39.0, 18.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.68136978149414, -13.344270706176758, -13.007170677185059, -12.67007064819336, -12.332971572875977, -11.995872497558594, -11.658772468566895, -11.321672439575195, -10.984573364257812, -10.64747428894043, -10.31037425994873, -9.973274230957031, -9.636175155639648, -9.299076080322266, -8.961976051330566, -8.624876022338867, -8.287776947021484, -7.950677394866943, -7.613577842712402, -7.276478290557861, -6.93937873840332, -6.602279186248779, -6.265179634094238, -5.928080081939697, -5.590980529785156, -5.253880977630615, -4.916781425476074, -4.579681873321533, -4.242582321166992, -3.905482769012451, -3.56838321685791, -3.231283664703369, -2.8941831588745117, -2.5570836067199707, -2.2199840545654297, -1.8828845024108887, -1.5457849502563477, -1.2086853981018066, -0.8715858459472656, -0.5344862937927246, -0.1973867416381836, 0.13971281051635742, 0.47681236267089844, 0.8139119148254395, 1.1510114669799805, 1.4881110191345215, 1.8252105712890625, 2.1623101234436035, 2.4994096755981445, 2.8365092277526855, 3.1736087799072266, 3.5107083320617676, 3.8478078842163086, 4.18490743637085, 4.522006988525391, 4.859106540679932, 5.196206092834473, 5.533305644989014, 5.870405197143555, 6.207504749298096, 6.544604301452637, 6.881703853607178, 7.218803405761719, 7.55590295791626, 7.893002510070801]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 13.0, 14.0, 14.0, 27.0, 26.0, 26.0, 26.0, 41.0, 33.0, 38.0, 52.0, 57.0, 55.0, 43.0, 58.0, 66.0, 52.0, 49.0, 49.0, 39.0, 36.0, 31.0, 26.0, 17.0, 13.0, 24.0, 12.0, 7.0, 11.0, 6.0, 6.0, 6.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.996451377868652, -6.802894592285156, -6.60933780670166, -6.415781021118164, -6.222224235534668, -6.028667449951172, -5.835110664367676, -5.64155387878418, -5.447997093200684, -5.2544403076171875, -5.060883522033691, -4.867326736450195, -4.673769950866699, -4.480213165283203, -4.286656379699707, -4.093099594116211, -3.899543285369873, -3.705986499786377, -3.512429714202881, -3.3188729286193848, -3.1253161430358887, -2.9317593574523926, -2.7382028102874756, -2.5446460247039795, -2.3510892391204834, -2.1575324535369873, -1.9639756679534912, -1.7704190015792847, -1.5768622159957886, -1.3833054304122925, -1.189748764038086, -0.9961919784545898, -0.802635669708252, -0.6090788841247559, -0.41552215814590454, -0.22196543216705322, -0.02840864658355713, 0.16514813899993896, 0.3587048053741455, 0.5522615909576416, 0.7458183765411377, 0.9393751621246338, 1.1329319477081299, 1.3264886140823364, 1.5200453996658325, 1.7136021852493286, 1.9071588516235352, 2.1007156372070312, 2.2942724227905273, 2.4878292083740234, 2.6813859939575195, 2.8749427795410156, 3.0684995651245117, 3.262056350708008, 3.455612897872925, 3.649169683456421, 3.842726469039917, 4.036283016204834, 4.22983980178833, 4.423396587371826, 4.616953372955322, 4.810510158538818, 5.0040669441223145, 5.1976237297058105, 5.391180515289307]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 8.0, 18.0, 27.0, 41.0, 75.0, 117.0, 217.0, 343.0, 661.0, 1340.0, 2996.0, 7882.0, 25669.0, 150951.0, 3824361.0, 141725.0, 24570.0, 7401.0, 2975.0, 1287.0, 687.0, 366.0, 185.0, 118.0, 68.0, 53.0, 36.0, 34.0, 26.0, 10.0, 9.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.85205078125, -0.8266067504882812, -0.8011627197265625, -0.7757186889648438, -0.750274658203125, -0.7248306274414062, -0.6993865966796875, -0.6739425659179688, -0.64849853515625, -0.6230545043945312, -0.5976104736328125, -0.5721664428710938, -0.546722412109375, -0.5212783813476562, -0.4958343505859375, -0.47039031982421875, -0.4449462890625, -0.41950225830078125, -0.3940582275390625, -0.36861419677734375, -0.343170166015625, -0.31772613525390625, -0.2922821044921875, -0.26683807373046875, -0.24139404296875, -0.21595001220703125, -0.1905059814453125, -0.16506195068359375, -0.139617919921875, -0.11417388916015625, -0.0887298583984375, -0.06328582763671875, -0.037841796875, -0.01239776611328125, 0.0130462646484375, 0.03849029541015625, 0.063934326171875, 0.08937835693359375, 0.1148223876953125, 0.14026641845703125, 0.16571044921875, 0.19115447998046875, 0.2165985107421875, 0.24204254150390625, 0.267486572265625, 0.29293060302734375, 0.3183746337890625, 0.34381866455078125, 0.3692626953125, 0.39470672607421875, 0.4201507568359375, 0.44559478759765625, 0.471038818359375, 0.49648284912109375, 0.5219268798828125, 0.5473709106445312, 0.57281494140625, 0.5982589721679688, 0.6237030029296875, 0.6491470336914062, 0.674591064453125, 0.7000350952148438, 0.7254791259765625, 0.7509231567382812, 0.7763671875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 11.0, 12.0, 21.0, 15.0, 32.0, 33.0, 58.0, 68.0, 77.0, 75.0, 88.0, 87.0, 70.0, 65.0, 54.0, 46.0, 36.0, 39.0, 35.0, 17.0, 6.0, 12.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.385986328125, -0.37351226806640625, -0.3610382080078125, -0.34856414794921875, -0.336090087890625, -0.32361602783203125, -0.3111419677734375, -0.29866790771484375, -0.28619384765625, -0.27371978759765625, -0.2612457275390625, -0.24877166748046875, -0.236297607421875, -0.22382354736328125, -0.2113494873046875, -0.19887542724609375, -0.1864013671875, -0.17392730712890625, -0.1614532470703125, -0.14897918701171875, -0.136505126953125, -0.12403106689453125, -0.1115570068359375, -0.09908294677734375, -0.08660888671875, -0.07413482666015625, -0.0616607666015625, -0.04918670654296875, -0.036712646484375, -0.02423858642578125, -0.0117645263671875, 0.00070953369140625, 0.01318359375, 0.02565765380859375, 0.0381317138671875, 0.05060577392578125, 0.063079833984375, 0.07555389404296875, 0.0880279541015625, 0.10050201416015625, 0.11297607421875, 0.12545013427734375, 0.1379241943359375, 0.15039825439453125, 0.162872314453125, 0.17534637451171875, 0.1878204345703125, 0.20029449462890625, 0.2127685546875, 0.22524261474609375, 0.2377166748046875, 0.25019073486328125, 0.262664794921875, 0.27513885498046875, 0.2876129150390625, 0.30008697509765625, 0.31256103515625, 0.32503509521484375, 0.3375091552734375, 0.34998321533203125, 0.362457275390625, 0.37493133544921875, 0.3874053955078125, 0.39987945556640625, 0.412353515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 11.0, 23.0, 18.0, 39.0, 61.0, 111.0, 179.0, 342.0, 606.0, 1019.0, 2118.0, 4533.0, 10827.0, 30115.0, 108972.0, 3136119.0, 773247.0, 83628.0, 25076.0, 9302.0, 3899.0, 1855.0, 946.0, 492.0, 273.0, 167.0, 117.0, 61.0, 44.0, 29.0, 19.0, 13.0, 9.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6015625, -0.5838241577148438, -0.5660858154296875, -0.5483474731445312, -0.530609130859375, -0.5128707885742188, -0.4951324462890625, -0.47739410400390625, -0.45965576171875, -0.44191741943359375, -0.4241790771484375, -0.40644073486328125, -0.388702392578125, -0.37096405029296875, -0.3532257080078125, -0.33548736572265625, -0.3177490234375, -0.30001068115234375, -0.2822723388671875, -0.26453399658203125, -0.246795654296875, -0.22905731201171875, -0.2113189697265625, -0.19358062744140625, -0.17584228515625, -0.15810394287109375, -0.1403656005859375, -0.12262725830078125, -0.104888916015625, -0.08715057373046875, -0.0694122314453125, -0.05167388916015625, -0.033935546875, -0.01619720458984375, 0.0015411376953125, 0.01927947998046875, 0.037017822265625, 0.05475616455078125, 0.0724945068359375, 0.09023284912109375, 0.10797119140625, 0.12570953369140625, 0.1434478759765625, 0.16118621826171875, 0.178924560546875, 0.19666290283203125, 0.2144012451171875, 0.23213958740234375, 0.2498779296875, 0.26761627197265625, 0.2853546142578125, 0.30309295654296875, 0.320831298828125, 0.33856964111328125, 0.3563079833984375, 0.37404632568359375, 0.39178466796875, 0.40952301025390625, 0.4272613525390625, 0.44499969482421875, 0.462738037109375, 0.48047637939453125, 0.4982147216796875, 0.5159530639648438, 0.53369140625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 9.0, 13.0, 19.0, 18.0, 23.0, 40.0, 63.0, 83.0, 191.0, 365.0, 2428.0, 413.0, 147.0, 83.0, 62.0, 33.0, 17.0, 23.0, 11.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31298828125, -0.3023872375488281, -0.29178619384765625, -0.2811851501464844, -0.2705841064453125, -0.2599830627441406, -0.24938201904296875, -0.23878097534179688, -0.228179931640625, -0.21757888793945312, -0.20697784423828125, -0.19637680053710938, -0.1857757568359375, -0.17517471313476562, -0.16457366943359375, -0.15397262573242188, -0.14337158203125, -0.13277053833007812, -0.12216949462890625, -0.11156845092773438, -0.1009674072265625, -0.09036636352539062, -0.07976531982421875, -0.06916427612304688, -0.058563232421875, -0.047962188720703125, -0.03736114501953125, -0.026760101318359375, -0.0161590576171875, -0.005558013916015625, 0.00504302978515625, 0.015644073486328125, 0.0262451171875, 0.036846160888671875, 0.04744720458984375, 0.058048248291015625, 0.0686492919921875, 0.07925033569335938, 0.08985137939453125, 0.10045242309570312, 0.111053466796875, 0.12165451049804688, 0.13225555419921875, 0.14285659790039062, 0.1534576416015625, 0.16405868530273438, 0.17465972900390625, 0.18526077270507812, 0.19586181640625, 0.20646286010742188, 0.21706390380859375, 0.22766494750976562, 0.2382659912109375, 0.24886703491210938, 0.25946807861328125, 0.2700691223144531, 0.280670166015625, 0.2912712097167969, 0.30187225341796875, 0.3124732971191406, 0.3230743408203125, 0.3336753845214844, 0.34427642822265625, 0.3548774719238281, 0.365478515625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 12.0, 31.0, 66.0, 135.0, 241.0, 230.0, 144.0, 82.0, 37.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-4.896330833435059, -4.804879188537598, -4.713428020477295, -4.621976375579834, -4.530524730682373, -4.43907356262207, -4.347621917724609, -4.256170272827148, -4.164719104766846, -4.073267459869385, -3.981816053390503, -3.890364646911621, -3.7989132404327393, -3.7074618339538574, -3.6160101890563965, -3.5245587825775146, -3.433107376098633, -3.341655969619751, -3.25020432472229, -3.158752918243408, -3.0673015117645264, -2.9758501052856445, -2.8843984603881836, -2.7929470539093018, -2.701495409011841, -2.610044002532959, -2.518592357635498, -2.427140951156616, -2.3356895446777344, -2.2442381381988525, -2.1527864933013916, -2.0613350868225098, -1.969883680343628, -1.8784321546554565, -1.7869807481765747, -1.6955292224884033, -1.6040778160095215, -1.51262629032135, -1.4211747646331787, -1.3297233581542969, -1.2382718324661255, -1.146820306777954, -1.0553689002990723, -0.9639173746109009, -0.872465968132019, -0.7810144424438477, -0.689562976360321, -0.5981115102767944, -0.5066600441932678, -0.4152085781097412, -0.3237571120262146, -0.2323056161403656, -0.140854150056839, -0.04940268397331238, 0.04204881191253662, 0.13350027799606323, 0.22495174407958984, 0.31640321016311646, 0.40785467624664307, 0.49930617213249207, 0.5907576084136963, 0.6822091341018677, 0.7736606001853943, 0.8651120662689209, 0.9565635323524475]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 4.0, 6.0, 10.0, 9.0, 17.0, 23.0, 15.0, 19.0, 23.0, 26.0, 32.0, 43.0, 41.0, 44.0, 36.0, 42.0, 42.0, 41.0, 38.0, 29.0, 33.0, 48.0, 31.0, 29.0, 45.0, 34.0, 25.0, 30.0, 30.0, 21.0, 22.0, 21.0, 12.0, 13.0, 12.0, 11.0, 9.0, 3.0, 3.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8800595998764038, -0.851436972618103, -0.8228143453598022, -0.7941917181015015, -0.7655691504478455, -0.7369465231895447, -0.7083238959312439, -0.6797012686729431, -0.6510787010192871, -0.6224560737609863, -0.5938334465026855, -0.5652108192443848, -0.5365882515907288, -0.507965624332428, -0.4793429970741272, -0.4507203698158264, -0.42209774255752563, -0.39347511529922485, -0.36485251784324646, -0.3362298905849457, -0.3076072931289673, -0.2789846658706665, -0.2503620386123657, -0.22173942625522614, -0.19311681389808655, -0.16449420154094696, -0.13587158918380737, -0.10724896192550659, -0.078626349568367, -0.05000373721122742, -0.021381109952926636, 0.007241502404212952, 0.035864055156707764, 0.06448666751384735, 0.09310928732156754, 0.12173190712928772, 0.1503545194864273, 0.1789771318435669, 0.20759975910186768, 0.23622237145900726, 0.26484498381614685, 0.29346761107444763, 0.322090208530426, 0.3507128357887268, 0.3793354630470276, 0.407958060503006, 0.43658068776130676, 0.46520328521728516, 0.49382591247558594, 0.5224485397338867, 0.5510711669921875, 0.5796937942504883, 0.6083163619041443, 0.6369389891624451, 0.6655616164207458, 0.6941842436790466, 0.7228068113327026, 0.7514294385910034, 0.7800520658493042, 0.808674693107605, 0.837297260761261, 0.8659198880195618, 0.8945425152778625, 0.9231651425361633, 0.9517877697944641]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 15.0, 9.0, 21.0, 35.0, 45.0, 73.0, 135.0, 287.0, 657.0, 1853.0, 7058.0, 41327.0, 353408.0, 552926.0, 75124.0, 11293.0, 2670.0, 882.0, 345.0, 149.0, 97.0, 57.0, 22.0, 17.0, 10.0, 9.0, 2.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.3232421875, -1.2885513305664062, -1.2538604736328125, -1.2191696166992188, -1.184478759765625, -1.1497879028320312, -1.1150970458984375, -1.0804061889648438, -1.04571533203125, -1.0110244750976562, -0.9763336181640625, -0.9416427612304688, -0.906951904296875, -0.8722610473632812, -0.8375701904296875, -0.8028793334960938, -0.7681884765625, -0.7334976196289062, -0.6988067626953125, -0.6641159057617188, -0.629425048828125, -0.5947341918945312, -0.5600433349609375, -0.5253524780273438, -0.49066162109375, -0.45597076416015625, -0.4212799072265625, -0.38658905029296875, -0.351898193359375, -0.31720733642578125, -0.2825164794921875, -0.24782562255859375, -0.213134765625, -0.17844390869140625, -0.1437530517578125, -0.10906219482421875, -0.074371337890625, -0.03968048095703125, -0.0049896240234375, 0.02970123291015625, 0.06439208984375, 0.09908294677734375, 0.1337738037109375, 0.16846466064453125, 0.203155517578125, 0.23784637451171875, 0.2725372314453125, 0.30722808837890625, 0.3419189453125, 0.37660980224609375, 0.4113006591796875, 0.44599151611328125, 0.480682373046875, 0.5153732299804688, 0.5500640869140625, 0.5847549438476562, 0.61944580078125, 0.6541366577148438, 0.6888275146484375, 0.7235183715820312, 0.758209228515625, 0.7929000854492188, 0.8275909423828125, 0.8622817993164062, 0.89697265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 5.0, 13.0, 11.0, 15.0, 15.0, 34.0, 41.0, 33.0, 49.0, 64.0, 71.0, 85.0, 101.0, 84.0, 74.0, 65.0, 59.0, 40.0, 30.0, 24.0, 22.0, 13.0, 16.0, 9.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.40283203125, -0.39003753662109375, -0.3772430419921875, -0.36444854736328125, -0.351654052734375, -0.33885955810546875, -0.3260650634765625, -0.31327056884765625, -0.30047607421875, -0.28768157958984375, -0.2748870849609375, -0.26209259033203125, -0.249298095703125, -0.23650360107421875, -0.2237091064453125, -0.21091461181640625, -0.1981201171875, -0.18532562255859375, -0.1725311279296875, -0.15973663330078125, -0.146942138671875, -0.13414764404296875, -0.1213531494140625, -0.10855865478515625, -0.09576416015625, -0.08296966552734375, -0.0701751708984375, -0.05738067626953125, -0.044586181640625, -0.03179168701171875, -0.0189971923828125, -0.00620269775390625, 0.006591796875, 0.01938629150390625, 0.0321807861328125, 0.04497528076171875, 0.057769775390625, 0.07056427001953125, 0.0833587646484375, 0.09615325927734375, 0.10894775390625, 0.12174224853515625, 0.1345367431640625, 0.14733123779296875, 0.160125732421875, 0.17292022705078125, 0.1857147216796875, 0.19850921630859375, 0.2113037109375, 0.22409820556640625, 0.2368927001953125, 0.24968719482421875, 0.262481689453125, 0.27527618408203125, 0.2880706787109375, 0.30086517333984375, 0.31365966796875, 0.32645416259765625, 0.3392486572265625, 0.35204315185546875, 0.364837646484375, 0.37763214111328125, 0.3904266357421875, 0.40322113037109375, 0.416015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 3.0, 4.0, 6.0, 3.0, 12.0, 14.0, 19.0, 26.0, 43.0, 56.0, 83.0, 117.0, 206.0, 337.0, 618.0, 1305.0, 3867.0, 20112.0, 237737.0, 696834.0, 74010.0, 8721.0, 2235.0, 941.0, 480.0, 241.0, 159.0, 120.0, 67.0, 55.0, 32.0, 20.0, 12.0, 14.0, 19.0, 6.0, 7.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.390625, -1.352294921875, -1.31396484375, -1.275634765625, -1.2373046875, -1.198974609375, -1.16064453125, -1.122314453125, -1.083984375, -1.045654296875, -1.00732421875, -0.968994140625, -0.9306640625, -0.892333984375, -0.85400390625, -0.815673828125, -0.77734375, -0.739013671875, -0.70068359375, -0.662353515625, -0.6240234375, -0.585693359375, -0.54736328125, -0.509033203125, -0.470703125, -0.432373046875, -0.39404296875, -0.355712890625, -0.3173828125, -0.279052734375, -0.24072265625, -0.202392578125, -0.1640625, -0.125732421875, -0.08740234375, -0.049072265625, -0.0107421875, 0.027587890625, 0.06591796875, 0.104248046875, 0.142578125, 0.180908203125, 0.21923828125, 0.257568359375, 0.2958984375, 0.334228515625, 0.37255859375, 0.410888671875, 0.44921875, 0.487548828125, 0.52587890625, 0.564208984375, 0.6025390625, 0.640869140625, 0.67919921875, 0.717529296875, 0.755859375, 0.794189453125, 0.83251953125, 0.870849609375, 0.9091796875, 0.947509765625, 0.98583984375, 1.024169921875, 1.0625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 1.0, 9.0, 9.0, 8.0, 12.0, 19.0, 22.0, 26.0, 25.0, 31.0, 32.0, 35.0, 30.0, 41.0, 44.0, 45.0, 53.0, 54.0, 55.0, 57.0, 44.0, 37.0, 36.0, 39.0, 35.0, 25.0, 27.0, 22.0, 19.0, 24.0, 17.0, 19.0, 7.0, 6.0, 11.0, 7.0, 3.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3759765625, -1.33538818359375, -1.2947998046875, -1.25421142578125, -1.213623046875, -1.17303466796875, -1.1324462890625, -1.09185791015625, -1.05126953125, -1.01068115234375, -0.9700927734375, -0.92950439453125, -0.888916015625, -0.84832763671875, -0.8077392578125, -0.76715087890625, -0.7265625, -0.68597412109375, -0.6453857421875, -0.60479736328125, -0.564208984375, -0.52362060546875, -0.4830322265625, -0.44244384765625, -0.40185546875, -0.36126708984375, -0.3206787109375, -0.28009033203125, -0.239501953125, -0.19891357421875, -0.1583251953125, -0.11773681640625, -0.0771484375, -0.03656005859375, 0.0040283203125, 0.04461669921875, 0.085205078125, 0.12579345703125, 0.1663818359375, 0.20697021484375, 0.24755859375, 0.28814697265625, 0.3287353515625, 0.36932373046875, 0.409912109375, 0.45050048828125, 0.4910888671875, 0.53167724609375, 0.572265625, 0.61285400390625, 0.6534423828125, 0.69403076171875, 0.734619140625, 0.77520751953125, 0.8157958984375, 0.85638427734375, 0.89697265625, 0.93756103515625, 0.9781494140625, 1.01873779296875, 1.059326171875, 1.09991455078125, 1.1405029296875, 1.18109130859375, 1.2216796875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 6.0, 4.0, 6.0, 14.0, 16.0, 53.0, 57.0, 98.0, 164.0, 339.0, 811.0, 2367.0, 12241.0, 191496.0, 783181.0, 49622.0, 5513.0, 1411.0, 540.0, 235.0, 152.0, 65.0, 55.0, 32.0, 21.0, 14.0, 8.0, 4.0, 2.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.48575592041015625, -0.4685821533203125, -0.45140838623046875, -0.434234619140625, -0.41706085205078125, -0.3998870849609375, -0.38271331787109375, -0.36553955078125, -0.34836578369140625, -0.3311920166015625, -0.31401824951171875, -0.296844482421875, -0.27967071533203125, -0.2624969482421875, -0.24532318115234375, -0.2281494140625, -0.21097564697265625, -0.1938018798828125, -0.17662811279296875, -0.159454345703125, -0.14228057861328125, -0.1251068115234375, -0.10793304443359375, -0.09075927734375, -0.07358551025390625, -0.0564117431640625, -0.03923797607421875, -0.022064208984375, -0.00489044189453125, 0.0122833251953125, 0.02945709228515625, 0.046630859375, 0.06380462646484375, 0.0809783935546875, 0.09815216064453125, 0.115325927734375, 0.13249969482421875, 0.1496734619140625, 0.16684722900390625, 0.18402099609375, 0.20119476318359375, 0.2183685302734375, 0.23554229736328125, 0.252716064453125, 0.26988983154296875, 0.2870635986328125, 0.30423736572265625, 0.3214111328125, 0.33858489990234375, 0.3557586669921875, 0.37293243408203125, 0.390106201171875, 0.40727996826171875, 0.4244537353515625, 0.44162750244140625, 0.45880126953125, 0.47597503662109375, 0.4931488037109375, 0.5103225708007812, 0.527496337890625, 0.5446701049804688, 0.5618438720703125, 0.5790176391601562, 0.59619140625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 12.0, 8.0, 7.0, 19.0, 25.0, 38.0, 45.0, 62.0, 63.0, 110.0, 115.0, 133.0, 80.0, 62.0, 59.0, 35.0, 24.0, 28.0, 19.0, 19.0, 12.0, 9.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.606910705566406e-05, -8.32732766866684e-05, -8.047744631767273e-05, -7.768161594867706e-05, -7.48857855796814e-05, -7.208995521068573e-05, -6.929412484169006e-05, -6.64982944726944e-05, -6.370246410369873e-05, -6.0906633734703064e-05, -5.81108033657074e-05, -5.531497299671173e-05, -5.2519142627716064e-05, -4.97233122587204e-05, -4.692748188972473e-05, -4.4131651520729065e-05, -4.13358211517334e-05, -3.853999078273773e-05, -3.5744160413742065e-05, -3.29483300447464e-05, -3.0152499675750732e-05, -2.7356669306755066e-05, -2.45608389377594e-05, -2.1765008568763733e-05, -1.8969178199768066e-05, -1.61733478307724e-05, -1.3377517461776733e-05, -1.0581687092781067e-05, -7.7858567237854e-06, -4.990026354789734e-06, -2.1941959857940674e-06, 6.016343832015991e-07, 3.3974647521972656e-06, 6.193295121192932e-06, 8.989125490188599e-06, 1.1784955859184265e-05, 1.4580786228179932e-05, 1.7376616597175598e-05, 2.0172446966171265e-05, 2.296827733516693e-05, 2.5764107704162598e-05, 2.8559938073158264e-05, 3.135576844215393e-05, 3.41515988111496e-05, 3.6947429180145264e-05, 3.974325954914093e-05, 4.25390899181366e-05, 4.533492028713226e-05, 4.813075065612793e-05, 5.0926581025123596e-05, 5.372241139411926e-05, 5.651824176311493e-05, 5.9314072132110596e-05, 6.210990250110626e-05, 6.490573287010193e-05, 6.77015632390976e-05, 7.049739360809326e-05, 7.329322397708893e-05, 7.60890543460846e-05, 7.888488471508026e-05, 8.168071508407593e-05, 8.44765454530716e-05, 8.727237582206726e-05, 9.006820619106293e-05, 9.28640365600586e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 9.0, 18.0, 24.0, 51.0, 110.0, 297.0, 1002.0, 5397.0, 275253.0, 754245.0, 10063.0, 1409.0, 407.0, 133.0, 77.0, 29.0, 15.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0908203125, -1.0622024536132812, -1.0335845947265625, -1.0049667358398438, -0.976348876953125, -0.9477310180664062, -0.9191131591796875, -0.8904953002929688, -0.86187744140625, -0.8332595825195312, -0.8046417236328125, -0.7760238647460938, -0.747406005859375, -0.7187881469726562, -0.6901702880859375, -0.6615524291992188, -0.6329345703125, -0.6043167114257812, -0.5756988525390625, -0.5470809936523438, -0.518463134765625, -0.48984527587890625, -0.4612274169921875, -0.43260955810546875, -0.40399169921875, -0.37537384033203125, -0.3467559814453125, -0.31813812255859375, -0.289520263671875, -0.26090240478515625, -0.2322845458984375, -0.20366668701171875, -0.175048828125, -0.14643096923828125, -0.1178131103515625, -0.08919525146484375, -0.060577392578125, -0.03195953369140625, -0.0033416748046875, 0.02527618408203125, 0.05389404296875, 0.08251190185546875, 0.1111297607421875, 0.13974761962890625, 0.168365478515625, 0.19698333740234375, 0.2256011962890625, 0.25421905517578125, 0.2828369140625, 0.31145477294921875, 0.3400726318359375, 0.36869049072265625, 0.397308349609375, 0.42592620849609375, 0.4545440673828125, 0.48316192626953125, 0.51177978515625, 0.5403976440429688, 0.5690155029296875, 0.5976333618164062, 0.626251220703125, 0.6548690795898438, 0.6834869384765625, 0.7121047973632812, 0.74072265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 8.0, 3.0, 10.0, 16.0, 15.0, 34.0, 35.0, 42.0, 74.0, 64.0, 86.0, 109.0, 125.0, 90.0, 59.0, 63.0, 43.0, 36.0, 25.0, 16.0, 12.0, 10.0, 10.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4189453125, -0.40431976318359375, -0.3896942138671875, -0.37506866455078125, -0.360443115234375, -0.34581756591796875, -0.3311920166015625, -0.31656646728515625, -0.30194091796875, -0.28731536865234375, -0.2726898193359375, -0.25806427001953125, -0.243438720703125, -0.22881317138671875, -0.2141876220703125, -0.19956207275390625, -0.1849365234375, -0.17031097412109375, -0.1556854248046875, -0.14105987548828125, -0.126434326171875, -0.11180877685546875, -0.0971832275390625, -0.08255767822265625, -0.06793212890625, -0.05330657958984375, -0.0386810302734375, -0.02405548095703125, -0.009429931640625, 0.00519561767578125, 0.0198211669921875, 0.03444671630859375, 0.049072265625, 0.06369781494140625, 0.0783233642578125, 0.09294891357421875, 0.107574462890625, 0.12220001220703125, 0.1368255615234375, 0.15145111083984375, 0.16607666015625, 0.18070220947265625, 0.1953277587890625, 0.20995330810546875, 0.224578857421875, 0.23920440673828125, 0.2538299560546875, 0.26845550537109375, 0.2830810546875, 0.29770660400390625, 0.3123321533203125, 0.32695770263671875, 0.341583251953125, 0.35620880126953125, 0.3708343505859375, 0.38545989990234375, 0.40008544921875, 0.41471099853515625, 0.4293365478515625, 0.44396209716796875, 0.458587646484375, 0.47321319580078125, 0.4878387451171875, 0.5024642944335938, 0.51708984375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 11.0, 53.0, 114.0, 248.0, 274.0, 167.0, 84.0, 25.0, 13.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.16891860961914, -15.74285888671875, -15.316798210144043, -14.890738487243652, -14.464678764343262, -14.038618087768555, -13.612558364868164, -13.186498641967773, -12.760438919067383, -12.334379196166992, -11.908318519592285, -11.482258796691895, -11.056199073791504, -10.630138397216797, -10.204078674316406, -9.778018951416016, -9.351958274841309, -8.925898551940918, -8.499837875366211, -8.07377815246582, -7.64771842956543, -7.221658229827881, -6.795598030090332, -6.369538307189941, -5.943478107452393, -5.517417907714844, -5.091358184814453, -4.665297985076904, -4.2392377853393555, -3.813178062438965, -3.387117862701416, -2.9610579013824463, -2.534998893737793, -2.1089389324188232, -1.682878851890564, -1.2568187713623047, -0.830758810043335, -0.40469884872436523, 0.021361351013183594, 0.4474213123321533, 0.873481273651123, 1.2995412349700928, 1.725601315498352, 2.1516613960266113, 2.577721357345581, 3.003781318664551, 3.4298415184020996, 3.8559014797210693, 4.281961441040039, 4.708021640777588, 5.1340813636779785, 5.560141563415527, 5.986201286315918, 6.412261486053467, 6.838321685791016, 7.264381408691406, 7.690441608428955, 8.116501808166504, 8.542561531066895, 8.968622207641602, 9.394681930541992, 9.820741653442383, 10.246801376342773, 10.67286205291748, 11.098921775817871]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 7.0, 10.0, 6.0, 7.0, 7.0, 22.0, 22.0, 21.0, 24.0, 38.0, 27.0, 29.0, 44.0, 49.0, 32.0, 50.0, 57.0, 55.0, 62.0, 55.0, 51.0, 46.0, 34.0, 45.0, 33.0, 23.0, 30.0, 22.0, 21.0, 19.0, 7.0, 7.0, 8.0, 4.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.240418434143066, -5.056118011474609, -4.8718180656433105, -4.687518119812012, -4.503217697143555, -4.318917274475098, -4.134617328643799, -3.950317144393921, -3.766016960144043, -3.581716775894165, -3.397416591644287, -3.213116407394409, -3.0288162231445312, -2.8445160388946533, -2.6602158546447754, -2.4759156703948975, -2.2916154861450195, -2.1073153018951416, -1.9230151176452637, -1.7387149333953857, -1.5544147491455078, -1.3701145648956299, -1.185814380645752, -1.001514196395874, -0.8172140121459961, -0.6329138278961182, -0.44861364364624023, -0.2643134593963623, -0.08001327514648438, 0.10428690910339355, 0.2885870933532715, 0.4728872776031494, 0.6571869850158691, 0.8414871692657471, 1.025787353515625, 1.210087537765503, 1.3943877220153809, 1.5786879062652588, 1.7629880905151367, 1.9472882747650146, 2.1315884590148926, 2.3158886432647705, 2.5001888275146484, 2.6844890117645264, 2.8687891960144043, 3.0530893802642822, 3.23738956451416, 3.421689748764038, 3.605989933013916, 3.790290117263794, 3.974590301513672, 4.158890724182129, 4.343190670013428, 4.527490615844727, 4.711791038513184, 4.896091461181641, 5.0803914070129395, 5.264691352844238, 5.448991775512695, 5.633292198181152, 5.817592144012451, 6.00189208984375, 6.186192512512207, 6.370492935180664, 6.554792881011963]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 7.0, 4.0, 16.0, 10.0, 19.0, 21.0, 31.0, 64.0, 89.0, 187.0, 380.0, 893.0, 3178.0, 17053.0, 313648.0, 3768992.0, 78342.0, 8243.0, 1822.0, 601.0, 269.0, 153.0, 81.0, 57.0, 33.0, 26.0, 17.0, 12.0, 14.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.130859375, -1.097900390625, -1.06494140625, -1.031982421875, -0.9990234375, -0.966064453125, -0.93310546875, -0.900146484375, -0.8671875, -0.834228515625, -0.80126953125, -0.768310546875, -0.7353515625, -0.702392578125, -0.66943359375, -0.636474609375, -0.603515625, -0.570556640625, -0.53759765625, -0.504638671875, -0.4716796875, -0.438720703125, -0.40576171875, -0.372802734375, -0.33984375, -0.306884765625, -0.27392578125, -0.240966796875, -0.2080078125, -0.175048828125, -0.14208984375, -0.109130859375, -0.076171875, -0.043212890625, -0.01025390625, 0.022705078125, 0.0556640625, 0.088623046875, 0.12158203125, 0.154541015625, 0.1875, 0.220458984375, 0.25341796875, 0.286376953125, 0.3193359375, 0.352294921875, 0.38525390625, 0.418212890625, 0.451171875, 0.484130859375, 0.51708984375, 0.550048828125, 0.5830078125, 0.615966796875, 0.64892578125, 0.681884765625, 0.71484375, 0.747802734375, 0.78076171875, 0.813720703125, 0.8466796875, 0.879638671875, 0.91259765625, 0.945556640625, 0.978515625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 10.0, 12.0, 16.0, 26.0, 27.0, 41.0, 52.0, 63.0, 77.0, 75.0, 73.0, 95.0, 83.0, 81.0, 62.0, 51.0, 43.0, 27.0, 28.0, 15.0, 16.0, 11.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.339111328125, -0.3261260986328125, -0.313140869140625, -0.3001556396484375, -0.28717041015625, -0.2741851806640625, -0.261199951171875, -0.2482147216796875, -0.2352294921875, -0.2222442626953125, -0.209259033203125, -0.1962738037109375, -0.18328857421875, -0.1703033447265625, -0.157318115234375, -0.1443328857421875, -0.13134765625, -0.1183624267578125, -0.105377197265625, -0.0923919677734375, -0.07940673828125, -0.0664215087890625, -0.053436279296875, -0.0404510498046875, -0.0274658203125, -0.0144805908203125, -0.001495361328125, 0.0114898681640625, 0.02447509765625, 0.0374603271484375, 0.050445556640625, 0.0634307861328125, 0.076416015625, 0.0894012451171875, 0.102386474609375, 0.1153717041015625, 0.12835693359375, 0.1413421630859375, 0.154327392578125, 0.1673126220703125, 0.1802978515625, 0.1932830810546875, 0.206268310546875, 0.2192535400390625, 0.23223876953125, 0.2452239990234375, 0.258209228515625, 0.2711944580078125, 0.2841796875, 0.2971649169921875, 0.310150146484375, 0.3231353759765625, 0.33612060546875, 0.3491058349609375, 0.362091064453125, 0.3750762939453125, 0.3880615234375, 0.4010467529296875, 0.414031982421875, 0.4270172119140625, 0.44000244140625, 0.4529876708984375, 0.465972900390625, 0.4789581298828125, 0.491943359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 3.0, 10.0, 5.0, 13.0, 13.0, 21.0, 21.0, 38.0, 77.0, 107.0, 179.0, 333.0, 828.0, 2679.0, 12223.0, 95268.0, 3615477.0, 431747.0, 28249.0, 4844.0, 1223.0, 427.0, 189.0, 105.0, 67.0, 29.0, 18.0, 15.0, 15.0, 11.0, 10.0, 8.0, 3.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77392578125, -0.7438430786132812, -0.7137603759765625, -0.6836776733398438, -0.653594970703125, -0.6235122680664062, -0.5934295654296875, -0.5633468627929688, -0.53326416015625, -0.5031814575195312, -0.4730987548828125, -0.44301605224609375, -0.412933349609375, -0.38285064697265625, -0.3527679443359375, -0.32268524169921875, -0.2926025390625, -0.26251983642578125, -0.2324371337890625, -0.20235443115234375, -0.172271728515625, -0.14218902587890625, -0.1121063232421875, -0.08202362060546875, -0.05194091796875, -0.02185821533203125, 0.0082244873046875, 0.03830718994140625, 0.068389892578125, 0.09847259521484375, 0.1285552978515625, 0.15863800048828125, 0.188720703125, 0.21880340576171875, 0.2488861083984375, 0.27896881103515625, 0.309051513671875, 0.33913421630859375, 0.3692169189453125, 0.39929962158203125, 0.42938232421875, 0.45946502685546875, 0.4895477294921875, 0.5196304321289062, 0.549713134765625, 0.5797958374023438, 0.6098785400390625, 0.6399612426757812, 0.6700439453125, 0.7001266479492188, 0.7302093505859375, 0.7602920532226562, 0.790374755859375, 0.8204574584960938, 0.8505401611328125, 0.8806228637695312, 0.91070556640625, 0.9407882690429688, 0.9708709716796875, 1.0009536743164062, 1.031036376953125, 1.0611190795898438, 1.0912017822265625, 1.1212844848632812, 1.1513671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 4.0, 8.0, 13.0, 11.0, 17.0, 23.0, 45.0, 65.0, 138.0, 285.0, 649.0, 1361.0, 766.0, 331.0, 146.0, 77.0, 38.0, 25.0, 15.0, 15.0, 17.0, 7.0, 6.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2529296875, -1.222808837890625, -1.19268798828125, -1.162567138671875, -1.1324462890625, -1.102325439453125, -1.07220458984375, -1.042083740234375, -1.011962890625, -0.981842041015625, -0.95172119140625, -0.921600341796875, -0.8914794921875, -0.861358642578125, -0.83123779296875, -0.801116943359375, -0.77099609375, -0.740875244140625, -0.71075439453125, -0.680633544921875, -0.6505126953125, -0.620391845703125, -0.59027099609375, -0.560150146484375, -0.530029296875, -0.499908447265625, -0.46978759765625, -0.439666748046875, -0.4095458984375, -0.379425048828125, -0.34930419921875, -0.319183349609375, -0.2890625, -0.258941650390625, -0.22882080078125, -0.198699951171875, -0.1685791015625, -0.138458251953125, -0.10833740234375, -0.078216552734375, -0.048095703125, -0.017974853515625, 0.01214599609375, 0.042266845703125, 0.0723876953125, 0.102508544921875, 0.13262939453125, 0.162750244140625, 0.19287109375, 0.222991943359375, 0.25311279296875, 0.283233642578125, 0.3133544921875, 0.343475341796875, 0.37359619140625, 0.403717041015625, 0.433837890625, 0.463958740234375, 0.49407958984375, 0.524200439453125, 0.5543212890625, 0.584442138671875, 0.61456298828125, 0.644683837890625, 0.6748046875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 6.0, 8.0, 14.0, 32.0, 69.0, 172.0, 209.0, 217.0, 138.0, 64.0, 30.0, 14.0, 6.0, 2.0, 7.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.639715194702148, -8.412349700927734, -8.184985160827637, -7.957619667053223, -7.730254173278809, -7.502889156341553, -7.275524139404297, -7.048158645629883, -6.820793628692627, -6.593428611755371, -6.366063117980957, -6.138698101043701, -5.911333084106445, -5.683967590332031, -5.456602573394775, -5.2292375564575195, -5.0018720626831055, -4.77450704574585, -4.5471415519714355, -4.31977653503418, -4.092411041259766, -3.8650460243225098, -3.637681007385254, -3.410315752029419, -3.182950496673584, -2.955585241317749, -2.728219985961914, -2.500854969024658, -2.2734897136688232, -2.0461244583129883, -1.8187593221664429, -1.5913941860198975, -1.3640289306640625, -1.1366636753082275, -0.9092985391616821, -0.6819333434104919, -0.45456814765930176, -0.2272028923034668, 0.00016224384307861328, 0.22752737998962402, 0.454892635345459, 0.6822578310966492, 0.9096230268478394, 1.1369881629943848, 1.3643534183502197, 1.5917186737060547, 1.8190838098526, 2.0464489459991455, 2.2738142013549805, 2.5011794567108154, 2.7285447120666504, 2.9559097290039062, 3.183274984359741, 3.410640239715576, 3.638005256652832, 3.865370512008667, 4.092735767364502, 4.320100784301758, 4.547466278076172, 4.774831295013428, 5.002196311950684, 5.229561805725098, 5.4569268226623535, 5.684291839599609, 5.911657333374023]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 7.0, 9.0, 4.0, 21.0, 24.0, 25.0, 26.0, 36.0, 50.0, 66.0, 55.0, 66.0, 70.0, 60.0, 65.0, 75.0, 55.0, 64.0, 54.0, 25.0, 24.0, 29.0, 22.0, 15.0, 17.0, 8.0, 7.0, 5.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.453827857971191, -4.315446376800537, -4.177064895629883, -4.0386834144592285, -3.900301933288574, -3.76192045211792, -3.6235389709472656, -3.4851574897766113, -3.346776008605957, -3.2083945274353027, -3.0700130462646484, -2.931631565093994, -2.79325008392334, -2.6548686027526855, -2.5164871215820312, -2.378105640411377, -2.2397241592407227, -2.1013426780700684, -1.962961196899414, -1.8245797157287598, -1.6861982345581055, -1.5478167533874512, -1.4094352722167969, -1.2710537910461426, -1.1326723098754883, -0.994290828704834, -0.8559093475341797, -0.7175278663635254, -0.5791463851928711, -0.4407649040222168, -0.3023834228515625, -0.1640019416809082, -0.025620460510253906, 0.11276102066040039, 0.2511425018310547, 0.389523983001709, 0.5279054641723633, 0.6662869453430176, 0.8046684265136719, 0.9430499076843262, 1.0814313888549805, 1.2198128700256348, 1.358194351196289, 1.4965758323669434, 1.6349573135375977, 1.773338794708252, 1.9117202758789062, 2.0501017570495605, 2.188483238220215, 2.326864719390869, 2.4652462005615234, 2.6036276817321777, 2.742009162902832, 2.8803906440734863, 3.0187721252441406, 3.157153606414795, 3.295535087585449, 3.4339165687561035, 3.572298049926758, 3.710679531097412, 3.8490610122680664, 3.9874424934387207, 4.125823974609375, 4.264205455780029, 4.402586936950684]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 11.0, 8.0, 13.0, 15.0, 28.0, 45.0, 72.0, 135.0, 228.0, 433.0, 790.0, 1660.0, 3467.0, 8098.0, 21052.0, 62056.0, 196013.0, 421623.0, 222423.0, 70072.0, 23789.0, 9002.0, 3823.0, 1765.0, 874.0, 414.0, 253.0, 152.0, 97.0, 51.0, 34.0, 18.0, 20.0, 11.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45166015625, -0.43637847900390625, -0.4210968017578125, -0.40581512451171875, -0.390533447265625, -0.37525177001953125, -0.3599700927734375, -0.34468841552734375, -0.32940673828125, -0.31412506103515625, -0.2988433837890625, -0.28356170654296875, -0.268280029296875, -0.25299835205078125, -0.2377166748046875, -0.22243499755859375, -0.2071533203125, -0.19187164306640625, -0.1765899658203125, -0.16130828857421875, -0.146026611328125, -0.13074493408203125, -0.1154632568359375, -0.10018157958984375, -0.08489990234375, -0.06961822509765625, -0.0543365478515625, -0.03905487060546875, -0.023773193359375, -0.00849151611328125, 0.0067901611328125, 0.02207183837890625, 0.037353515625, 0.05263519287109375, 0.0679168701171875, 0.08319854736328125, 0.098480224609375, 0.11376190185546875, 0.1290435791015625, 0.14432525634765625, 0.15960693359375, 0.17488861083984375, 0.1901702880859375, 0.20545196533203125, 0.220733642578125, 0.23601531982421875, 0.2512969970703125, 0.26657867431640625, 0.2818603515625, 0.29714202880859375, 0.3124237060546875, 0.32770538330078125, 0.342987060546875, 0.35826873779296875, 0.3735504150390625, 0.38883209228515625, 0.40411376953125, 0.41939544677734375, 0.4346771240234375, 0.44995880126953125, 0.465240478515625, 0.48052215576171875, 0.4958038330078125, 0.5110855102539062, 0.5263671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 7.0, 6.0, 9.0, 10.0, 11.0, 24.0, 33.0, 35.0, 32.0, 49.0, 45.0, 51.0, 56.0, 67.0, 57.0, 68.0, 57.0, 56.0, 50.0, 49.0, 37.0, 42.0, 31.0, 31.0, 20.0, 11.0, 8.0, 11.0, 9.0, 8.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.331298828125, -0.32183074951171875, -0.3123626708984375, -0.30289459228515625, -0.293426513671875, -0.28395843505859375, -0.2744903564453125, -0.26502227783203125, -0.25555419921875, -0.24608612060546875, -0.2366180419921875, -0.22714996337890625, -0.217681884765625, -0.20821380615234375, -0.1987457275390625, -0.18927764892578125, -0.1798095703125, -0.17034149169921875, -0.1608734130859375, -0.15140533447265625, -0.141937255859375, -0.13246917724609375, -0.1230010986328125, -0.11353302001953125, -0.10406494140625, -0.09459686279296875, -0.0851287841796875, -0.07566070556640625, -0.066192626953125, -0.05672454833984375, -0.0472564697265625, -0.03778839111328125, -0.0283203125, -0.01885223388671875, -0.0093841552734375, 8.392333984375e-05, 0.009552001953125, 0.01902008056640625, 0.0284881591796875, 0.03795623779296875, 0.04742431640625, 0.05689239501953125, 0.0663604736328125, 0.07582855224609375, 0.085296630859375, 0.09476470947265625, 0.1042327880859375, 0.11370086669921875, 0.1231689453125, 0.13263702392578125, 0.1421051025390625, 0.15157318115234375, 0.161041259765625, 0.17050933837890625, 0.1799774169921875, 0.18944549560546875, 0.19891357421875, 0.20838165283203125, 0.2178497314453125, 0.22731781005859375, 0.236785888671875, 0.24625396728515625, 0.2557220458984375, 0.26519012451171875, 0.274658203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 9.0, 14.0, 15.0, 18.0, 38.0, 50.0, 87.0, 103.0, 209.0, 408.0, 838.0, 1896.0, 6923.0, 76940.0, 850735.0, 98240.0, 8041.0, 2073.0, 904.0, 415.0, 203.0, 134.0, 95.0, 56.0, 37.0, 21.0, 20.0, 17.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0248565673828125, -0.986236572265625, -0.9476165771484375, -0.90899658203125, -0.8703765869140625, -0.831756591796875, -0.7931365966796875, -0.7545166015625, -0.7158966064453125, -0.677276611328125, -0.6386566162109375, -0.60003662109375, -0.5614166259765625, -0.522796630859375, -0.4841766357421875, -0.445556640625, -0.4069366455078125, -0.368316650390625, -0.3296966552734375, -0.29107666015625, -0.2524566650390625, -0.213836669921875, -0.1752166748046875, -0.1365966796875, -0.0979766845703125, -0.059356689453125, -0.0207366943359375, 0.01788330078125, 0.0565032958984375, 0.095123291015625, 0.1337432861328125, 0.17236328125, 0.2109832763671875, 0.249603271484375, 0.2882232666015625, 0.32684326171875, 0.3654632568359375, 0.404083251953125, 0.4427032470703125, 0.4813232421875, 0.5199432373046875, 0.558563232421875, 0.5971832275390625, 0.63580322265625, 0.6744232177734375, 0.713043212890625, 0.7516632080078125, 0.790283203125, 0.8289031982421875, 0.867523193359375, 0.9061431884765625, 0.94476318359375, 0.9833831787109375, 1.022003173828125, 1.0606231689453125, 1.0992431640625, 1.1378631591796875, 1.176483154296875, 1.2151031494140625, 1.25372314453125, 1.2923431396484375, 1.330963134765625, 1.3695831298828125, 1.408203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 3.0, 3.0, 13.0, 21.0, 13.0, 19.0, 26.0, 29.0, 36.0, 39.0, 53.0, 44.0, 47.0, 76.0, 59.0, 59.0, 62.0, 63.0, 50.0, 51.0, 36.0, 47.0, 41.0, 24.0, 28.0, 19.0, 13.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3857421875, -1.3437042236328125, -1.301666259765625, -1.2596282958984375, -1.21759033203125, -1.1755523681640625, -1.133514404296875, -1.0914764404296875, -1.0494384765625, -1.0074005126953125, -0.965362548828125, -0.9233245849609375, -0.88128662109375, -0.8392486572265625, -0.797210693359375, -0.7551727294921875, -0.713134765625, -0.6710968017578125, -0.629058837890625, -0.5870208740234375, -0.54498291015625, -0.5029449462890625, -0.460906982421875, -0.4188690185546875, -0.3768310546875, -0.3347930908203125, -0.292755126953125, -0.2507171630859375, -0.20867919921875, -0.1666412353515625, -0.124603271484375, -0.0825653076171875, -0.04052734375, 0.0015106201171875, 0.043548583984375, 0.0855865478515625, 0.12762451171875, 0.1696624755859375, 0.211700439453125, 0.2537384033203125, 0.2957763671875, 0.3378143310546875, 0.379852294921875, 0.4218902587890625, 0.46392822265625, 0.5059661865234375, 0.548004150390625, 0.5900421142578125, 0.632080078125, 0.6741180419921875, 0.716156005859375, 0.7581939697265625, 0.80023193359375, 0.8422698974609375, 0.884307861328125, 0.9263458251953125, 0.9683837890625, 1.0104217529296875, 1.052459716796875, 1.0944976806640625, 1.13653564453125, 1.1785736083984375, 1.220611572265625, 1.2626495361328125, 1.3046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 8.0, 8.0, 17.0, 22.0, 29.0, 50.0, 72.0, 181.0, 422.0, 1565.0, 10596.0, 732056.0, 294460.0, 7188.0, 1169.0, 376.0, 160.0, 68.0, 45.0, 26.0, 9.0, 6.0, 11.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80224609375, -0.7762985229492188, -0.7503509521484375, -0.7244033813476562, -0.698455810546875, -0.6725082397460938, -0.6465606689453125, -0.6206130981445312, -0.59466552734375, -0.5687179565429688, -0.5427703857421875, -0.5168228149414062, -0.490875244140625, -0.46492767333984375, -0.4389801025390625, -0.41303253173828125, -0.3870849609375, -0.36113739013671875, -0.3351898193359375, -0.30924224853515625, -0.283294677734375, -0.25734710693359375, -0.2313995361328125, -0.20545196533203125, -0.17950439453125, -0.15355682373046875, -0.1276092529296875, -0.10166168212890625, -0.075714111328125, -0.04976654052734375, -0.0238189697265625, 0.00212860107421875, 0.028076171875, 0.05402374267578125, 0.0799713134765625, 0.10591888427734375, 0.131866455078125, 0.15781402587890625, 0.1837615966796875, 0.20970916748046875, 0.23565673828125, 0.26160430908203125, 0.2875518798828125, 0.31349945068359375, 0.339447021484375, 0.36539459228515625, 0.3913421630859375, 0.41728973388671875, 0.4432373046875, 0.46918487548828125, 0.4951324462890625, 0.5210800170898438, 0.547027587890625, 0.5729751586914062, 0.5989227294921875, 0.6248703002929688, 0.65081787109375, 0.6767654418945312, 0.7027130126953125, 0.7286605834960938, 0.754608154296875, 0.7805557250976562, 0.8065032958984375, 0.8324508666992188, 0.8583984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 5.0, 3.0, 11.0, 15.0, 13.0, 18.0, 20.0, 41.0, 42.0, 51.0, 86.0, 137.0, 138.0, 107.0, 71.0, 54.0, 37.0, 32.0, 24.0, 18.0, 14.0, 12.0, 7.0, 9.0, 7.0, 6.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.600950241088867e-05, -8.296500891447067e-05, -7.992051541805267e-05, -7.687602192163467e-05, -7.383152842521667e-05, -7.078703492879868e-05, -6.774254143238068e-05, -6.469804793596268e-05, -6.165355443954468e-05, -5.860906094312668e-05, -5.556456744670868e-05, -5.252007395029068e-05, -4.947558045387268e-05, -4.643108695745468e-05, -4.338659346103668e-05, -4.034209996461868e-05, -3.7297606468200684e-05, -3.4253112971782684e-05, -3.1208619475364685e-05, -2.8164125978946686e-05, -2.5119632482528687e-05, -2.2075138986110687e-05, -1.9030645489692688e-05, -1.598615199327469e-05, -1.294165849685669e-05, -9.89716500043869e-06, -6.852671504020691e-06, -3.8081780076026917e-06, -7.636845111846924e-07, 2.280808985233307e-06, 5.325302481651306e-06, 8.369795978069305e-06, 1.1414289474487305e-05, 1.4458782970905304e-05, 1.7503276467323303e-05, 2.0547769963741302e-05, 2.3592263460159302e-05, 2.66367569565773e-05, 2.96812504529953e-05, 3.27257439494133e-05, 3.57702374458313e-05, 3.88147309422493e-05, 4.18592244386673e-05, 4.49037179350853e-05, 4.7948211431503296e-05, 5.0992704927921295e-05, 5.4037198424339294e-05, 5.7081691920757294e-05, 6.012618541717529e-05, 6.317067891359329e-05, 6.621517241001129e-05, 6.925966590642929e-05, 7.230415940284729e-05, 7.534865289926529e-05, 7.839314639568329e-05, 8.143763989210129e-05, 8.448213338851929e-05, 8.752662688493729e-05, 9.057112038135529e-05, 9.361561387777328e-05, 9.666010737419128e-05, 9.970460087060928e-05, 0.00010274909436702728, 0.00010579358786344528, 0.00010883808135986328]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 6.0, 1.0, 7.0, 5.0, 10.0, 11.0, 24.0, 24.0, 63.0, 111.0, 213.0, 479.0, 1143.0, 3869.0, 27808.0, 786863.0, 212717.0, 11258.0, 2365.0, 836.0, 324.0, 172.0, 84.0, 56.0, 28.0, 27.0, 17.0, 6.0, 10.0, 7.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.63427734375, -0.6149444580078125, -0.595611572265625, -0.5762786865234375, -0.55694580078125, -0.5376129150390625, -0.518280029296875, -0.4989471435546875, -0.4796142578125, -0.4602813720703125, -0.440948486328125, -0.4216156005859375, -0.40228271484375, -0.3829498291015625, -0.363616943359375, -0.3442840576171875, -0.324951171875, -0.3056182861328125, -0.286285400390625, -0.2669525146484375, -0.24761962890625, -0.2282867431640625, -0.208953857421875, -0.1896209716796875, -0.1702880859375, -0.1509552001953125, -0.131622314453125, -0.1122894287109375, -0.09295654296875, -0.0736236572265625, -0.054290771484375, -0.0349578857421875, -0.015625, 0.0037078857421875, 0.023040771484375, 0.0423736572265625, 0.06170654296875, 0.0810394287109375, 0.100372314453125, 0.1197052001953125, 0.1390380859375, 0.1583709716796875, 0.177703857421875, 0.1970367431640625, 0.21636962890625, 0.2357025146484375, 0.255035400390625, 0.2743682861328125, 0.293701171875, 0.3130340576171875, 0.332366943359375, 0.3516998291015625, 0.37103271484375, 0.3903656005859375, 0.409698486328125, 0.4290313720703125, 0.4483642578125, 0.4676971435546875, 0.487030029296875, 0.5063629150390625, 0.52569580078125, 0.5450286865234375, 0.564361572265625, 0.5836944580078125, 0.60302734375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 6.0, 9.0, 10.0, 15.0, 16.0, 33.0, 46.0, 48.0, 102.0, 119.0, 122.0, 129.0, 91.0, 71.0, 57.0, 31.0, 29.0, 17.0, 18.0, 16.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5712890625, -0.553314208984375, -0.53533935546875, -0.517364501953125, -0.4993896484375, -0.481414794921875, -0.46343994140625, -0.445465087890625, -0.427490234375, -0.409515380859375, -0.39154052734375, -0.373565673828125, -0.3555908203125, -0.337615966796875, -0.31964111328125, -0.301666259765625, -0.28369140625, -0.265716552734375, -0.24774169921875, -0.229766845703125, -0.2117919921875, -0.193817138671875, -0.17584228515625, -0.157867431640625, -0.139892578125, -0.121917724609375, -0.10394287109375, -0.085968017578125, -0.0679931640625, -0.050018310546875, -0.03204345703125, -0.014068603515625, 0.00390625, 0.021881103515625, 0.03985595703125, 0.057830810546875, 0.0758056640625, 0.093780517578125, 0.11175537109375, 0.129730224609375, 0.147705078125, 0.165679931640625, 0.18365478515625, 0.201629638671875, 0.2196044921875, 0.237579345703125, 0.25555419921875, 0.273529052734375, 0.29150390625, 0.309478759765625, 0.32745361328125, 0.345428466796875, 0.3634033203125, 0.381378173828125, 0.39935302734375, 0.417327880859375, 0.435302734375, 0.453277587890625, 0.47125244140625, 0.489227294921875, 0.5072021484375, 0.525177001953125, 0.54315185546875, 0.561126708984375, 0.5791015625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 40.0, 63.0, 106.0, 206.0, 227.0, 151.0, 100.0, 38.0, 26.0, 9.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.062172889709473, -3.8374850749969482, -3.612797260284424, -3.3881092071533203, -3.163421392440796, -2.9387335777282715, -2.714045763015747, -2.4893579483032227, -2.264669895172119, -2.0399820804595947, -1.8152941465377808, -1.5906063318252563, -1.3659183979034424, -1.141230583190918, -0.9165427684783936, -0.6918548345565796, -0.4671671390533447, -0.24247927963733673, -0.017791420221328735, 0.20689642429351807, 0.43158429861068726, 0.6562721729278564, 0.8809599876403809, 1.1056479215621948, 1.3303357362747192, 1.5550235509872437, 1.7797114849090576, 2.004399299621582, 2.2290871143341064, 2.453774929046631, 2.6784629821777344, 2.903150796890259, 3.127838611602783, 3.3525264263153076, 3.577214241027832, 3.8019022941589355, 4.026589870452881, 4.251277923583984, 4.47596549987793, 4.700653553009033, 4.925341606140137, 5.15002965927124, 5.3747172355651855, 5.599405288696289, 5.824092864990234, 6.048780918121338, 6.273468971252441, 6.498156547546387, 6.722844123840332, 6.9475321769714355, 7.172219753265381, 7.396907806396484, 7.62159538269043, 7.846283435821533, 8.070971488952637, 8.295659065246582, 8.520347595214844, 8.745035171508789, 8.96972370147705, 9.194411277770996, 9.419098854064941, 9.643787384033203, 9.868474960327148, 10.093162536621094, 10.317850112915039]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 11.0, 15.0, 14.0, 25.0, 27.0, 63.0, 45.0, 60.0, 96.0, 121.0, 94.0, 94.0, 63.0, 84.0, 55.0, 36.0, 28.0, 26.0, 16.0, 13.0, 6.0, 7.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.118273735046387, -7.866584300994873, -7.614894866943359, -7.3632049560546875, -7.111515522003174, -6.85982608795166, -6.608136177062988, -6.356446743011475, -6.104757308959961, -5.853067874908447, -5.601378440856934, -5.349688529968262, -5.097999095916748, -4.846309661865234, -4.5946197509765625, -4.342930316925049, -4.091240882873535, -3.8395514488220215, -3.5878617763519287, -3.336172103881836, -3.0844826698303223, -2.8327932357788086, -2.581103563308716, -2.329413890838623, -2.0777244567871094, -1.8260349035263062, -1.574345350265503, -1.3226557970046997, -1.0709662437438965, -0.8192766904830933, -0.56758713722229, -0.3158975839614868, -0.0642085075378418, 0.18748104572296143, 0.43917059898376465, 0.6908601522445679, 0.9425497055053711, 1.1942392587661743, 1.4459288120269775, 1.6976183652877808, 1.949307918548584, 2.2009973526000977, 2.4526870250701904, 2.704376697540283, 2.956066131591797, 3.2077555656433105, 3.4594452381134033, 3.711134910583496, 3.9628243446350098, 4.214513778686523, 4.466203689575195, 4.717893123626709, 4.969582557678223, 5.221271991729736, 5.47296142578125, 5.724651336669922, 5.9763407707214355, 6.228030204772949, 6.479720115661621, 6.731409549713135, 6.983098983764648, 7.234788417816162, 7.486477851867676, 7.738167762756348, 7.989857196807861]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 7.0, 12.0, 19.0, 25.0, 40.0, 71.0, 102.0, 281.0, 680.0, 2043.0, 9548.0, 105822.0, 3836436.0, 220713.0, 14139.0, 2868.0, 852.0, 315.0, 146.0, 57.0, 34.0, 24.0, 12.0, 7.0, 6.0, 11.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.091796875, -1.0649032592773438, -1.0380096435546875, -1.0111160278320312, -0.984222412109375, -0.9573287963867188, -0.9304351806640625, -0.9035415649414062, -0.87664794921875, -0.8497543334960938, -0.8228607177734375, -0.7959671020507812, -0.769073486328125, -0.7421798706054688, -0.7152862548828125, -0.6883926391601562, -0.6614990234375, -0.6346054077148438, -0.6077117919921875, -0.5808181762695312, -0.553924560546875, -0.5270309448242188, -0.5001373291015625, -0.47324371337890625, -0.44635009765625, -0.41945648193359375, -0.3925628662109375, -0.36566925048828125, -0.338775634765625, -0.31188201904296875, -0.2849884033203125, -0.25809478759765625, -0.231201171875, -0.20430755615234375, -0.1774139404296875, -0.15052032470703125, -0.123626708984375, -0.09673309326171875, -0.0698394775390625, -0.04294586181640625, -0.01605224609375, 0.01084136962890625, 0.0377349853515625, 0.06462860107421875, 0.091522216796875, 0.11841583251953125, 0.1453094482421875, 0.17220306396484375, 0.1990966796875, 0.22599029541015625, 0.2528839111328125, 0.27977752685546875, 0.306671142578125, 0.33356475830078125, 0.3604583740234375, 0.38735198974609375, 0.41424560546875, 0.44113922119140625, 0.4680328369140625, 0.49492645263671875, 0.521820068359375, 0.5487136840820312, 0.5756072998046875, 0.6025009155273438, 0.62939453125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 13.0, 14.0, 36.0, 68.0, 98.0, 121.0, 139.0, 155.0, 128.0, 85.0, 75.0, 36.0, 23.0, 10.0, 11.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77587890625, -0.7543792724609375, -0.732879638671875, -0.7113800048828125, -0.68988037109375, -0.6683807373046875, -0.646881103515625, -0.6253814697265625, -0.6038818359375, -0.5823822021484375, -0.560882568359375, -0.5393829345703125, -0.51788330078125, -0.4963836669921875, -0.474884033203125, -0.4533843994140625, -0.431884765625, -0.4103851318359375, -0.388885498046875, -0.3673858642578125, -0.34588623046875, -0.3243865966796875, -0.302886962890625, -0.2813873291015625, -0.2598876953125, -0.2383880615234375, -0.216888427734375, -0.1953887939453125, -0.17388916015625, -0.1523895263671875, -0.130889892578125, -0.1093902587890625, -0.087890625, -0.0663909912109375, -0.044891357421875, -0.0233917236328125, -0.00189208984375, 0.0196075439453125, 0.041107177734375, 0.0626068115234375, 0.0841064453125, 0.1056060791015625, 0.127105712890625, 0.1486053466796875, 0.17010498046875, 0.1916046142578125, 0.213104248046875, 0.2346038818359375, 0.256103515625, 0.2776031494140625, 0.299102783203125, 0.3206024169921875, 0.34210205078125, 0.3636016845703125, 0.385101318359375, 0.4066009521484375, 0.4281005859375, 0.4496002197265625, 0.471099853515625, 0.4925994873046875, 0.51409912109375, 0.5355987548828125, 0.557098388671875, 0.5785980224609375, 0.60009765625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 3.0, 6.0, 9.0, 26.0, 44.0, 70.0, 160.0, 438.0, 1198.0, 4702.0, 27905.0, 557137.0, 3515552.0, 74160.0, 9540.0, 2199.0, 689.0, 261.0, 93.0, 36.0, 23.0, 15.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59521484375, -0.5684280395507812, -0.5416412353515625, -0.5148544311523438, -0.488067626953125, -0.46128082275390625, -0.4344940185546875, -0.40770721435546875, -0.38092041015625, -0.35413360595703125, -0.3273468017578125, -0.30055999755859375, -0.273773193359375, -0.24698638916015625, -0.2201995849609375, -0.19341278076171875, -0.1666259765625, -0.13983917236328125, -0.1130523681640625, -0.08626556396484375, -0.059478759765625, -0.03269195556640625, -0.0059051513671875, 0.02088165283203125, 0.04766845703125, 0.07445526123046875, 0.1012420654296875, 0.12802886962890625, 0.154815673828125, 0.18160247802734375, 0.2083892822265625, 0.23517608642578125, 0.261962890625, 0.28874969482421875, 0.3155364990234375, 0.34232330322265625, 0.369110107421875, 0.39589691162109375, 0.4226837158203125, 0.44947052001953125, 0.47625732421875, 0.5030441284179688, 0.5298309326171875, 0.5566177368164062, 0.583404541015625, 0.6101913452148438, 0.6369781494140625, 0.6637649536132812, 0.6905517578125, 0.7173385620117188, 0.7441253662109375, 0.7709121704101562, 0.797698974609375, 0.8244857788085938, 0.8512725830078125, 0.8780593872070312, 0.90484619140625, 0.9316329956054688, 0.9584197998046875, 0.9852066040039062, 1.011993408203125, 1.0387802124023438, 1.0655670166015625, 1.0923538208007812, 1.119140625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 8.0, 13.0, 15.0, 19.0, 32.0, 33.0, 77.0, 132.0, 261.0, 569.0, 1195.0, 928.0, 383.0, 182.0, 79.0, 42.0, 30.0, 15.0, 26.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.81201171875, -0.7892913818359375, -0.766571044921875, -0.7438507080078125, -0.72113037109375, -0.6984100341796875, -0.675689697265625, -0.6529693603515625, -0.6302490234375, -0.6075286865234375, -0.584808349609375, -0.5620880126953125, -0.53936767578125, -0.5166473388671875, -0.493927001953125, -0.4712066650390625, -0.448486328125, -0.4257659912109375, -0.403045654296875, -0.3803253173828125, -0.35760498046875, -0.3348846435546875, -0.312164306640625, -0.2894439697265625, -0.2667236328125, -0.2440032958984375, -0.221282958984375, -0.1985626220703125, -0.17584228515625, -0.1531219482421875, -0.130401611328125, -0.1076812744140625, -0.0849609375, -0.0622406005859375, -0.039520263671875, -0.0167999267578125, 0.00592041015625, 0.0286407470703125, 0.051361083984375, 0.0740814208984375, 0.0968017578125, 0.1195220947265625, 0.142242431640625, 0.1649627685546875, 0.18768310546875, 0.2104034423828125, 0.233123779296875, 0.2558441162109375, 0.278564453125, 0.3012847900390625, 0.324005126953125, 0.3467254638671875, 0.36944580078125, 0.3921661376953125, 0.414886474609375, 0.4376068115234375, 0.4603271484375, 0.4830474853515625, 0.505767822265625, 0.5284881591796875, 0.55120849609375, 0.5739288330078125, 0.596649169921875, 0.6193695068359375, 0.64208984375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 5.0, 11.0, 52.0, 131.0, 336.0, 321.0, 97.0, 24.0, 3.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.753754615783691, -10.455516815185547, -10.157278060913086, -9.859040260314941, -9.560802459716797, -9.262564659118652, -8.964326858520508, -8.666088104248047, -8.367850303649902, -8.069612503051758, -7.771374225616455, -7.473135948181152, -7.174898147583008, -6.876660346984863, -6.5784220695495605, -6.280183792114258, -5.981945991516113, -5.683708190917969, -5.385469913482666, -5.087231636047363, -4.788993835449219, -4.490756034851074, -4.1925177574157715, -3.894279718399048, -3.596041679382324, -3.2978036403656006, -2.999565601348877, -2.7013275623321533, -2.4030895233154297, -2.104851484298706, -1.8066134452819824, -1.5083754062652588, -1.2101364135742188, -0.9118983745574951, -0.6136603355407715, -0.31542229652404785, -0.01718425750732422, 0.2810537815093994, 0.579291820526123, 0.8775298595428467, 1.1757678985595703, 1.474005937576294, 1.7722439765930176, 2.070482015609741, 2.368720054626465, 2.6669580936431885, 2.965196132659912, 3.2634341716766357, 3.5616722106933594, 3.859910249710083, 4.158148288726807, 4.456386566162109, 4.754624366760254, 5.052862167358398, 5.351100444793701, 5.649338722229004, 5.947576522827148, 6.245814323425293, 6.544052600860596, 6.842290878295898, 7.140528678894043, 7.4387664794921875, 7.73700475692749, 8.035243034362793, 8.333480834960938]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 11.0, 17.0, 11.0, 14.0, 24.0, 31.0, 40.0, 48.0, 58.0, 61.0, 71.0, 66.0, 65.0, 72.0, 69.0, 60.0, 51.0, 59.0, 37.0, 31.0, 22.0, 21.0, 15.0, 8.0, 11.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5510036945343018, -3.4221067428588867, -3.2932097911834717, -3.1643128395080566, -3.0354161262512207, -2.9065191745758057, -2.7776222229003906, -2.6487252712249756, -2.5198283195495605, -2.3909313678741455, -2.2620344161987305, -2.1331377029418945, -2.0042407512664795, -1.8753437995910645, -1.7464468479156494, -1.6175498962402344, -1.4886531829833984, -1.3597562313079834, -1.230859398841858, -1.1019624471664429, -0.9730655550956726, -0.8441686630249023, -0.7152717113494873, -0.586374819278717, -0.4574779272079468, -0.3285810351371765, -0.19968411326408386, -0.07078719139099121, 0.05810970067977905, 0.18700659275054932, 0.31590354442596436, 0.4448004364967346, 0.573697566986084, 0.7025944590568542, 0.8314913511276245, 0.9603883028030396, 1.089285135269165, 1.21818208694458, 1.3470790386199951, 1.4759759902954102, 1.6048728227615356, 1.7337697744369507, 1.8626666069030762, 1.9915635585784912, 2.1204605102539062, 2.249357223510742, 2.3782544136047363, 2.5071511268615723, 2.6360480785369873, 2.7649450302124023, 2.8938419818878174, 3.0227389335632324, 3.1516356468200684, 3.2805325984954834, 3.4094295501708984, 3.5383265018463135, 3.6672234535217285, 3.7961204051971436, 3.9250173568725586, 4.0539140701293945, 4.182811260223389, 4.311707973480225, 4.440605163574219, 4.569501876831055, 4.698398590087891]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 8.0, 15.0, 17.0, 18.0, 33.0, 55.0, 70.0, 118.0, 195.0, 325.0, 570.0, 1031.0, 1995.0, 4132.0, 8867.0, 21742.0, 61317.0, 196840.0, 425841.0, 216274.0, 66683.0, 23658.0, 9586.0, 4473.0, 2084.0, 1141.0, 577.0, 359.0, 190.0, 117.0, 78.0, 49.0, 25.0, 16.0, 12.0, 10.0, 9.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.50732421875, -0.49304962158203125, -0.4787750244140625, -0.46450042724609375, -0.450225830078125, -0.43595123291015625, -0.4216766357421875, -0.40740203857421875, -0.39312744140625, -0.37885284423828125, -0.3645782470703125, -0.35030364990234375, -0.336029052734375, -0.32175445556640625, -0.3074798583984375, -0.29320526123046875, -0.2789306640625, -0.26465606689453125, -0.2503814697265625, -0.23610687255859375, -0.221832275390625, -0.20755767822265625, -0.1932830810546875, -0.17900848388671875, -0.16473388671875, -0.15045928955078125, -0.1361846923828125, -0.12191009521484375, -0.107635498046875, -0.09336090087890625, -0.0790863037109375, -0.06481170654296875, -0.050537109375, -0.03626251220703125, -0.0219879150390625, -0.00771331787109375, 0.006561279296875, 0.02083587646484375, 0.0351104736328125, 0.04938507080078125, 0.06365966796875, 0.07793426513671875, 0.0922088623046875, 0.10648345947265625, 0.120758056640625, 0.13503265380859375, 0.1493072509765625, 0.16358184814453125, 0.1778564453125, 0.19213104248046875, 0.2064056396484375, 0.22068023681640625, 0.234954833984375, 0.24922943115234375, 0.2635040283203125, 0.27777862548828125, 0.29205322265625, 0.30632781982421875, 0.3206024169921875, 0.33487701416015625, 0.349151611328125, 0.36342620849609375, 0.3777008056640625, 0.39197540283203125, 0.40625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 12.0, 15.0, 24.0, 31.0, 44.0, 46.0, 68.0, 64.0, 60.0, 79.0, 85.0, 86.0, 79.0, 59.0, 53.0, 51.0, 39.0, 23.0, 24.0, 18.0, 12.0, 5.0, 7.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.48388671875, -0.4719276428222656, -0.45996856689453125, -0.4480094909667969, -0.4360504150390625, -0.4240913391113281, -0.41213226318359375, -0.4001731872558594, -0.388214111328125, -0.3762550354003906, -0.36429595947265625, -0.3523368835449219, -0.3403778076171875, -0.3284187316894531, -0.31645965576171875, -0.3045005798339844, -0.29254150390625, -0.2805824279785156, -0.26862335205078125, -0.2566642761230469, -0.2447052001953125, -0.23274612426757812, -0.22078704833984375, -0.20882797241210938, -0.196868896484375, -0.18490982055664062, -0.17295074462890625, -0.16099166870117188, -0.1490325927734375, -0.13707351684570312, -0.12511444091796875, -0.11315536499023438, -0.1011962890625, -0.08923721313476562, -0.07727813720703125, -0.06531906127929688, -0.0533599853515625, -0.041400909423828125, -0.02944183349609375, -0.017482757568359375, -0.005523681640625, 0.006435394287109375, 0.01839447021484375, 0.030353546142578125, 0.0423126220703125, 0.054271697998046875, 0.06623077392578125, 0.07818984985351562, 0.09014892578125, 0.10210800170898438, 0.11406707763671875, 0.12602615356445312, 0.1379852294921875, 0.14994430541992188, 0.16190338134765625, 0.17386245727539062, 0.185821533203125, 0.19778060913085938, 0.20973968505859375, 0.22169876098632812, 0.2336578369140625, 0.24561691284179688, 0.25757598876953125, 0.2695350646972656, 0.281494140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 9.0, 2.0, 8.0, 18.0, 18.0, 25.0, 40.0, 75.0, 108.0, 258.0, 519.0, 1325.0, 5005.0, 45453.0, 784854.0, 194458.0, 12450.0, 2441.0, 744.0, 345.0, 170.0, 85.0, 51.0, 30.0, 20.0, 11.0, 11.0, 6.0, 2.0, 2.0, 4.0, 7.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.619140625, -1.5812530517578125, -1.543365478515625, -1.5054779052734375, -1.46759033203125, -1.4297027587890625, -1.391815185546875, -1.3539276123046875, -1.3160400390625, -1.2781524658203125, -1.240264892578125, -1.2023773193359375, -1.16448974609375, -1.1266021728515625, -1.088714599609375, -1.0508270263671875, -1.012939453125, -0.9750518798828125, -0.937164306640625, -0.8992767333984375, -0.86138916015625, -0.8235015869140625, -0.785614013671875, -0.7477264404296875, -0.7098388671875, -0.6719512939453125, -0.634063720703125, -0.5961761474609375, -0.55828857421875, -0.5204010009765625, -0.482513427734375, -0.4446258544921875, -0.40673828125, -0.3688507080078125, -0.330963134765625, -0.2930755615234375, -0.25518798828125, -0.2173004150390625, -0.179412841796875, -0.1415252685546875, -0.1036376953125, -0.0657501220703125, -0.027862548828125, 0.0100250244140625, 0.04791259765625, 0.0858001708984375, 0.123687744140625, 0.1615753173828125, 0.199462890625, 0.2373504638671875, 0.275238037109375, 0.3131256103515625, 0.35101318359375, 0.3889007568359375, 0.426788330078125, 0.4646759033203125, 0.5025634765625, 0.5404510498046875, 0.578338623046875, 0.6162261962890625, 0.65411376953125, 0.6920013427734375, 0.729888916015625, 0.7677764892578125, 0.8056640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 11.0, 10.0, 10.0, 12.0, 26.0, 28.0, 34.0, 35.0, 46.0, 39.0, 52.0, 61.0, 61.0, 62.0, 55.0, 66.0, 61.0, 49.0, 53.0, 47.0, 35.0, 27.0, 31.0, 24.0, 20.0, 11.0, 10.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1182403564453125, -1.082183837890625, -1.0461273193359375, -1.01007080078125, -0.9740142822265625, -0.937957763671875, -0.9019012451171875, -0.8658447265625, -0.8297882080078125, -0.793731689453125, -0.7576751708984375, -0.72161865234375, -0.6855621337890625, -0.649505615234375, -0.6134490966796875, -0.577392578125, -0.5413360595703125, -0.505279541015625, -0.4692230224609375, -0.43316650390625, -0.3971099853515625, -0.361053466796875, -0.3249969482421875, -0.2889404296875, -0.2528839111328125, -0.216827392578125, -0.1807708740234375, -0.14471435546875, -0.1086578369140625, -0.072601318359375, -0.0365447998046875, -0.00048828125, 0.0355682373046875, 0.071624755859375, 0.1076812744140625, 0.14373779296875, 0.1797943115234375, 0.215850830078125, 0.2519073486328125, 0.2879638671875, 0.3240203857421875, 0.360076904296875, 0.3961334228515625, 0.43218994140625, 0.4682464599609375, 0.504302978515625, 0.5403594970703125, 0.576416015625, 0.6124725341796875, 0.648529052734375, 0.6845855712890625, 0.72064208984375, 0.7566986083984375, 0.792755126953125, 0.8288116455078125, 0.8648681640625, 0.9009246826171875, 0.936981201171875, 0.9730377197265625, 1.00909423828125, 1.0451507568359375, 1.081207275390625, 1.1172637939453125, 1.1533203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 11.0, 11.0, 37.0, 82.0, 173.0, 692.0, 5337.0, 895511.0, 143496.0, 2469.0, 422.0, 152.0, 58.0, 30.0, 21.0, 7.0, 9.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0234375, -0.991302490234375, -0.95916748046875, -0.927032470703125, -0.8948974609375, -0.862762451171875, -0.83062744140625, -0.798492431640625, -0.766357421875, -0.734222412109375, -0.70208740234375, -0.669952392578125, -0.6378173828125, -0.605682373046875, -0.57354736328125, -0.541412353515625, -0.50927734375, -0.477142333984375, -0.44500732421875, -0.412872314453125, -0.3807373046875, -0.348602294921875, -0.31646728515625, -0.284332275390625, -0.252197265625, -0.220062255859375, -0.18792724609375, -0.155792236328125, -0.1236572265625, -0.091522216796875, -0.05938720703125, -0.027252197265625, 0.0048828125, 0.037017822265625, 0.06915283203125, 0.101287841796875, 0.1334228515625, 0.165557861328125, 0.19769287109375, 0.229827880859375, 0.261962890625, 0.294097900390625, 0.32623291015625, 0.358367919921875, 0.3905029296875, 0.422637939453125, 0.45477294921875, 0.486907958984375, 0.51904296875, 0.551177978515625, 0.58331298828125, 0.615447998046875, 0.6475830078125, 0.679718017578125, 0.71185302734375, 0.743988037109375, 0.776123046875, 0.808258056640625, 0.84039306640625, 0.872528076171875, 0.9046630859375, 0.936798095703125, 0.96893310546875, 1.001068115234375, 1.033203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 7.0, 8.0, 3.0, 5.0, 11.0, 14.0, 14.0, 24.0, 29.0, 38.0, 44.0, 49.0, 62.0, 89.0, 99.0, 84.0, 84.0, 82.0, 46.0, 47.0, 34.0, 18.0, 17.0, 20.0, 12.0, 14.0, 4.0, 11.0, 6.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.18832015991211e-05, -6.989296525716782e-05, -6.790272891521454e-05, -6.591249257326126e-05, -6.392225623130798e-05, -6.19320198893547e-05, -5.994178354740143e-05, -5.795154720544815e-05, -5.596131086349487e-05, -5.3971074521541595e-05, -5.198083817958832e-05, -4.999060183763504e-05, -4.800036549568176e-05, -4.6010129153728485e-05, -4.401989281177521e-05, -4.202965646982193e-05, -4.003942012786865e-05, -3.8049183785915375e-05, -3.60589474439621e-05, -3.406871110200882e-05, -3.207847476005554e-05, -3.0088238418102264e-05, -2.8098002076148987e-05, -2.610776573419571e-05, -2.411752939224243e-05, -2.2127293050289154e-05, -2.0137056708335876e-05, -1.81468203663826e-05, -1.615658402442932e-05, -1.4166347682476044e-05, -1.2176111340522766e-05, -1.0185874998569489e-05, -8.195638656616211e-06, -6.205402314662933e-06, -4.215165972709656e-06, -2.224929630756378e-06, -2.3469328880310059e-07, 1.755543053150177e-06, 3.7457793951034546e-06, 5.736015737056732e-06, 7.72625207901001e-06, 9.716488420963287e-06, 1.1706724762916565e-05, 1.3696961104869843e-05, 1.568719744682312e-05, 1.7677433788776398e-05, 1.9667670130729675e-05, 2.1657906472682953e-05, 2.364814281463623e-05, 2.5638379156589508e-05, 2.7628615498542786e-05, 2.9618851840496063e-05, 3.160908818244934e-05, 3.359932452440262e-05, 3.5589560866355896e-05, 3.7579797208309174e-05, 3.957003355026245e-05, 4.156026989221573e-05, 4.3550506234169006e-05, 4.5540742576122284e-05, 4.753097891807556e-05, 4.952121526002884e-05, 5.151145160198212e-05, 5.3501687943935394e-05, 5.549192428588867e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 9.0, 15.0, 20.0, 47.0, 77.0, 109.0, 270.0, 644.0, 2156.0, 12432.0, 345578.0, 665005.0, 18082.0, 2715.0, 778.0, 282.0, 137.0, 63.0, 41.0, 29.0, 14.0, 12.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40576171875, -0.38890838623046875, -0.3720550537109375, -0.35520172119140625, -0.338348388671875, -0.32149505615234375, -0.3046417236328125, -0.28778839111328125, -0.27093505859375, -0.25408172607421875, -0.2372283935546875, -0.22037506103515625, -0.203521728515625, -0.18666839599609375, -0.1698150634765625, -0.15296173095703125, -0.1361083984375, -0.11925506591796875, -0.1024017333984375, -0.08554840087890625, -0.068695068359375, -0.05184173583984375, -0.0349884033203125, -0.01813507080078125, -0.00128173828125, 0.01557159423828125, 0.0324249267578125, 0.04927825927734375, 0.066131591796875, 0.08298492431640625, 0.0998382568359375, 0.11669158935546875, 0.133544921875, 0.15039825439453125, 0.1672515869140625, 0.18410491943359375, 0.200958251953125, 0.21781158447265625, 0.2346649169921875, 0.25151824951171875, 0.26837158203125, 0.28522491455078125, 0.3020782470703125, 0.31893157958984375, 0.335784912109375, 0.35263824462890625, 0.3694915771484375, 0.38634490966796875, 0.4031982421875, 0.42005157470703125, 0.4369049072265625, 0.45375823974609375, 0.470611572265625, 0.48746490478515625, 0.5043182373046875, 0.5211715698242188, 0.53802490234375, 0.5548782348632812, 0.5717315673828125, 0.5885848999023438, 0.605438232421875, 0.6222915649414062, 0.6391448974609375, 0.6559982299804688, 0.6728515625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 12.0, 10.0, 12.0, 17.0, 20.0, 31.0, 27.0, 38.0, 47.0, 71.0, 64.0, 65.0, 70.0, 76.0, 66.0, 69.0, 62.0, 54.0, 33.0, 30.0, 31.0, 17.0, 15.0, 8.0, 12.0, 12.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.283203125, -0.2750988006591797, -0.2669944763183594, -0.25889015197753906, -0.25078582763671875, -0.24268150329589844, -0.23457717895507812, -0.2264728546142578, -0.2183685302734375, -0.2102642059326172, -0.20215988159179688, -0.19405555725097656, -0.18595123291015625, -0.17784690856933594, -0.16974258422851562, -0.1616382598876953, -0.153533935546875, -0.1454296112060547, -0.13732528686523438, -0.12922096252441406, -0.12111663818359375, -0.11301231384277344, -0.10490798950195312, -0.09680366516113281, -0.0886993408203125, -0.08059501647949219, -0.07249069213867188, -0.06438636779785156, -0.05628204345703125, -0.04817771911621094, -0.040073394775390625, -0.03196907043457031, -0.02386474609375, -0.015760421752929688, -0.007656097412109375, 0.0004482269287109375, 0.00855255126953125, 0.016656875610351562, 0.024761199951171875, 0.03286552429199219, 0.0409698486328125, 0.04907417297363281, 0.057178497314453125, 0.06528282165527344, 0.07338714599609375, 0.08149147033691406, 0.08959579467773438, 0.09770011901855469, 0.105804443359375, 0.11390876770019531, 0.12201309204101562, 0.13011741638183594, 0.13822174072265625, 0.14632606506347656, 0.15443038940429688, 0.1625347137451172, 0.1706390380859375, 0.1787433624267578, 0.18684768676757812, 0.19495201110839844, 0.20305633544921875, 0.21116065979003906, 0.21926498413085938, 0.2273693084716797, 0.2354736328125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 1.0, 21.0, 147.0, 463.0, 282.0, 59.0, 13.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.77346420288086, -20.297883987426758, -19.822303771972656, -19.346725463867188, -18.871145248413086, -18.395565032958984, -17.919984817504883, -17.444406509399414, -16.968826293945312, -16.49324607849121, -16.01766586303711, -15.542086601257324, -15.066507339477539, -14.590927124023438, -14.115347862243652, -13.63976764678955, -13.164188385009766, -12.688608169555664, -12.213028907775879, -11.737448692321777, -11.261869430541992, -10.78628921508789, -10.310709953308105, -9.835129737854004, -9.359549522399902, -8.8839693069458, -8.408390045166016, -7.932810306549072, -7.457230567932129, -6.981650352478027, -6.506071090698242, -6.030490875244141, -5.5549116134643555, -5.079331874847412, -4.603752136230469, -4.128172397613525, -3.652592658996582, -3.1770126819610596, -2.701432943344116, -2.225853204727173, -1.7502734661102295, -1.2746937274932861, -0.799113929271698, -0.32353413105010986, 0.1520456075668335, 0.6276254653930664, 1.1032052040100098, 1.5787849426269531, 2.0543646812438965, 2.52994441986084, 3.005524158477783, 3.4811038970947266, 3.95668363571167, 4.432263374328613, 4.907843589782715, 5.3834228515625, 5.859003067016602, 6.334582805633545, 6.810162544250488, 7.285742282867432, 7.761322021484375, 8.236902236938477, 8.712481498718262, 9.188061714172363, 9.663640975952148]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 2.0, 5.0, 8.0, 12.0, 16.0, 23.0, 19.0, 19.0, 22.0, 26.0, 32.0, 40.0, 42.0, 45.0, 45.0, 57.0, 54.0, 63.0, 58.0, 64.0, 41.0, 43.0, 37.0, 42.0, 38.0, 26.0, 19.0, 18.0, 17.0, 8.0, 17.0, 16.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.266371726989746, -5.125722885131836, -4.985073566436768, -4.844424724578857, -4.703775405883789, -4.563126564025879, -4.422477722167969, -4.2818284034729, -4.14117956161499, -4.00053071975708, -3.8598814010620117, -3.7192325592041016, -3.5785834789276123, -3.437934398651123, -3.297285318374634, -3.1566362380981445, -3.0159871578216553, -2.875338077545166, -2.7346889972686768, -2.5940399169921875, -2.4533910751342773, -2.312741994857788, -2.172092914581299, -2.0314438343048096, -1.8907948732376099, -1.7501457929611206, -1.609496831893921, -1.4688477516174316, -1.3281986713409424, -1.1875497102737427, -1.0469006299972534, -0.9062516093254089, -0.7656025886535645, -0.62495356798172, -0.4843045175075531, -0.34365546703338623, -0.20300644636154175, -0.062357425689697266, 0.07829165458679199, 0.21894067525863647, 0.35958969593048096, 0.5002387166023254, 0.6408877372741699, 0.7815368175506592, 0.9221858382225037, 1.0628348588943481, 1.2034839391708374, 1.344132900238037, 1.4847819805145264, 1.6254310607910156, 1.7660800218582153, 1.9067291021347046, 2.0473780632019043, 2.1880271434783936, 2.328676223754883, 2.469325304031372, 2.6099743843078613, 2.7506234645843506, 2.89127254486084, 3.03192138671875, 3.1725704669952393, 3.3132195472717285, 3.4538686275482178, 3.594517707824707, 3.735166549682617]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 14.0, 15.0, 25.0, 31.0, 62.0, 102.0, 157.0, 289.0, 534.0, 1178.0, 3078.0, 9942.0, 41256.0, 326890.0, 2927550.0, 787342.0, 72424.0, 15550.0, 4613.0, 1674.0, 694.0, 381.0, 208.0, 101.0, 57.0, 29.0, 28.0, 16.0, 10.0, 10.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42236328125, -0.40943145751953125, -0.3964996337890625, -0.38356781005859375, -0.370635986328125, -0.35770416259765625, -0.3447723388671875, -0.33184051513671875, -0.31890869140625, -0.30597686767578125, -0.2930450439453125, -0.28011322021484375, -0.267181396484375, -0.25424957275390625, -0.2413177490234375, -0.22838592529296875, -0.2154541015625, -0.20252227783203125, -0.1895904541015625, -0.17665863037109375, -0.163726806640625, -0.15079498291015625, -0.1378631591796875, -0.12493133544921875, -0.11199951171875, -0.09906768798828125, -0.0861358642578125, -0.07320404052734375, -0.060272216796875, -0.04734039306640625, -0.0344085693359375, -0.02147674560546875, -0.008544921875, 0.00438690185546875, 0.0173187255859375, 0.03025054931640625, 0.043182373046875, 0.05611419677734375, 0.0690460205078125, 0.08197784423828125, 0.09490966796875, 0.10784149169921875, 0.1207733154296875, 0.13370513916015625, 0.146636962890625, 0.15956878662109375, 0.1725006103515625, 0.18543243408203125, 0.1983642578125, 0.21129608154296875, 0.2242279052734375, 0.23715972900390625, 0.250091552734375, 0.26302337646484375, 0.2759552001953125, 0.28888702392578125, 0.30181884765625, 0.31475067138671875, 0.3276824951171875, 0.34061431884765625, 0.353546142578125, 0.36647796630859375, 0.3794097900390625, 0.39234161376953125, 0.4052734375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 6.0, 10.0, 13.0, 16.0, 27.0, 32.0, 42.0, 36.0, 61.0, 67.0, 75.0, 81.0, 73.0, 89.0, 69.0, 56.0, 46.0, 41.0, 39.0, 34.0, 28.0, 18.0, 8.0, 11.0, 11.0, 9.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.3710136413574219, -0.36141204833984375, -0.3518104553222656, -0.3422088623046875, -0.3326072692871094, -0.32300567626953125, -0.3134040832519531, -0.303802490234375, -0.2942008972167969, -0.28459930419921875, -0.2749977111816406, -0.2653961181640625, -0.2557945251464844, -0.24619293212890625, -0.23659133911132812, -0.22698974609375, -0.21738815307617188, -0.20778656005859375, -0.19818496704101562, -0.1885833740234375, -0.17898178100585938, -0.16938018798828125, -0.15977859497070312, -0.150177001953125, -0.14057540893554688, -0.13097381591796875, -0.12137222290039062, -0.1117706298828125, -0.10216903686523438, -0.09256744384765625, -0.08296585083007812, -0.0733642578125, -0.06376266479492188, -0.05416107177734375, -0.044559478759765625, -0.0349578857421875, -0.025356292724609375, -0.01575469970703125, -0.006153106689453125, 0.003448486328125, 0.013050079345703125, 0.02265167236328125, 0.032253265380859375, 0.0418548583984375, 0.051456451416015625, 0.06105804443359375, 0.07065963745117188, 0.08026123046875, 0.08986282348632812, 0.09946441650390625, 0.10906600952148438, 0.1186676025390625, 0.12826919555664062, 0.13787078857421875, 0.14747238159179688, 0.157073974609375, 0.16667556762695312, 0.17627716064453125, 0.18587875366210938, 0.1954803466796875, 0.20508193969726562, 0.21468353271484375, 0.22428512573242188, 0.23388671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 16.0, 22.0, 33.0, 33.0, 73.0, 81.0, 148.0, 342.0, 1127.0, 9970.0, 477526.0, 3667697.0, 34132.0, 2268.0, 460.0, 167.0, 83.0, 44.0, 23.0, 13.0, 15.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0888671875, -1.0528106689453125, -1.016754150390625, -0.9806976318359375, -0.94464111328125, -0.9085845947265625, -0.872528076171875, -0.8364715576171875, -0.8004150390625, -0.7643585205078125, -0.728302001953125, -0.6922454833984375, -0.65618896484375, -0.6201324462890625, -0.584075927734375, -0.5480194091796875, -0.511962890625, -0.4759063720703125, -0.439849853515625, -0.4037933349609375, -0.36773681640625, -0.3316802978515625, -0.295623779296875, -0.2595672607421875, -0.2235107421875, -0.1874542236328125, -0.151397705078125, -0.1153411865234375, -0.07928466796875, -0.0432281494140625, -0.007171630859375, 0.0288848876953125, 0.06494140625, 0.1009979248046875, 0.137054443359375, 0.1731109619140625, 0.20916748046875, 0.2452239990234375, 0.281280517578125, 0.3173370361328125, 0.3533935546875, 0.3894500732421875, 0.425506591796875, 0.4615631103515625, 0.49761962890625, 0.5336761474609375, 0.569732666015625, 0.6057891845703125, 0.641845703125, 0.6779022216796875, 0.713958740234375, 0.7500152587890625, 0.78607177734375, 0.8221282958984375, 0.858184814453125, 0.8942413330078125, 0.9302978515625, 0.9663543701171875, 1.002410888671875, 1.0384674072265625, 1.07452392578125, 1.1105804443359375, 1.146636962890625, 1.1826934814453125, 1.21875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 13.0, 10.0, 24.0, 27.0, 68.0, 87.0, 135.0, 301.0, 580.0, 939.0, 824.0, 493.0, 216.0, 129.0, 63.0, 57.0, 30.0, 19.0, 12.0, 10.0, 9.0, 7.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0], "bins": [-1.0576171875, -1.0345573425292969, -1.0114974975585938, -0.9884376525878906, -0.9653778076171875, -0.9423179626464844, -0.9192581176757812, -0.8961982727050781, -0.873138427734375, -0.8500785827636719, -0.8270187377929688, -0.8039588928222656, -0.7808990478515625, -0.7578392028808594, -0.7347793579101562, -0.7117195129394531, -0.68865966796875, -0.6655998229980469, -0.6425399780273438, -0.6194801330566406, -0.5964202880859375, -0.5733604431152344, -0.5503005981445312, -0.5272407531738281, -0.504180908203125, -0.4811210632324219, -0.45806121826171875, -0.4350013732910156, -0.4119415283203125, -0.3888816833496094, -0.36582183837890625, -0.3427619934082031, -0.3197021484375, -0.2966423034667969, -0.27358245849609375, -0.2505226135253906, -0.2274627685546875, -0.20440292358398438, -0.18134307861328125, -0.15828323364257812, -0.135223388671875, -0.11216354370117188, -0.08910369873046875, -0.06604385375976562, -0.0429840087890625, -0.019924163818359375, 0.00313568115234375, 0.026195526123046875, 0.04925537109375, 0.07231521606445312, 0.09537506103515625, 0.11843490600585938, 0.1414947509765625, 0.16455459594726562, 0.18761444091796875, 0.21067428588867188, 0.233734130859375, 0.2567939758300781, 0.27985382080078125, 0.3029136657714844, 0.3259735107421875, 0.3490333557128906, 0.37209320068359375, 0.3951530456542969, 0.418212890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 16.0, 40.0, 158.0, 385.0, 281.0, 88.0, 20.0, 8.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.395563125610352, -10.035148620605469, -9.674735069274902, -9.31432056427002, -8.953906059265137, -8.59349250793457, -8.233078002929688, -7.872663497924805, -7.51224946975708, -7.1518354415893555, -6.791420936584473, -6.431006908416748, -6.070592880249023, -5.710178375244141, -5.349764347076416, -4.989350318908691, -4.628935813903809, -4.268521785736084, -3.908107280731201, -3.5476932525634766, -3.187278985977173, -2.826864719390869, -2.4664506912231445, -2.106036424636841, -1.745622158050537, -1.3852078914642334, -1.0247937440872192, -0.6643795967102051, -0.30396533012390137, 0.056448936462402344, 0.41686296463012695, 0.7772772312164307, 1.137690544128418, 1.4981048107147217, 1.8585189580917358, 2.21893310546875, 2.5793473720550537, 2.9397616386413574, 3.300175666809082, 3.6605899333953857, 4.0210041999816895, 4.381418228149414, 4.741832733154297, 5.1022467613220215, 5.462660789489746, 5.823075294494629, 6.1834893226623535, 6.543903350830078, 6.904317855834961, 7.2647318840026855, 7.625146389007568, 7.985560417175293, 8.345974922180176, 8.706388473510742, 9.066802978515625, 9.427217483520508, 9.78763198852539, 10.148046493530273, 10.50846004486084, 10.868874549865723, 11.229289054870605, 11.589702606201172, 11.950117111206055, 12.310531616210938, 12.670945167541504]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 10.0, 12.0, 18.0, 19.0, 27.0, 24.0, 45.0, 38.0, 61.0, 45.0, 55.0, 57.0, 69.0, 70.0, 77.0, 72.0, 47.0, 52.0, 52.0, 38.0, 20.0, 16.0, 22.0, 18.0, 7.0, 12.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8141088485717773, -2.705805778503418, -2.5975029468536377, -2.4891998767852783, -2.380897045135498, -2.2725939750671387, -2.1642911434173584, -2.055988073348999, -1.9476852416992188, -1.839382290840149, -1.731079339981079, -1.6227763891220093, -1.5144734382629395, -1.40617036819458, -1.2978675365447998, -1.1895644664764404, -1.0812615156173706, -0.9729585647583008, -0.864655613899231, -0.7563526630401611, -0.6480497121810913, -0.5397467017173767, -0.4314437508583069, -0.32314079999923706, -0.21483784914016724, -0.10653489083051682, 0.001768067479133606, 0.11007103323936462, 0.21837398409843445, 0.32667696475982666, 0.4349799156188965, 0.5432828664779663, 0.6515858173370361, 0.759888768196106, 0.8681917190551758, 0.9764946699142456, 1.0847976207733154, 1.1931006908416748, 1.301403522491455, 1.4097065925598145, 1.5180094242095947, 1.6263123750686646, 1.7346153259277344, 1.8429182767868042, 1.951221227645874, 2.0595242977142334, 2.1678271293640137, 2.276130199432373, 2.3844332695007324, 2.492736339569092, 2.601039171218872, 2.7093422412872314, 2.8176450729370117, 2.925948143005371, 3.0342509746551514, 3.1425540447235107, 3.250856876373291, 3.3591599464416504, 3.4674627780914307, 3.57576584815979, 3.6840686798095703, 3.7923717498779297, 3.90067458152771, 4.00897741317749, 4.11728048324585]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 13.0, 23.0, 24.0, 42.0, 85.0, 111.0, 186.0, 289.0, 533.0, 1167.0, 2444.0, 5955.0, 15085.0, 43016.0, 126343.0, 331182.0, 328722.0, 125116.0, 42330.0, 15234.0, 5932.0, 2339.0, 1067.0, 533.0, 310.0, 178.0, 108.0, 64.0, 53.0, 24.0, 10.0, 16.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.434814453125, -0.4220237731933594, -0.40923309326171875, -0.3964424133300781, -0.3836517333984375, -0.3708610534667969, -0.35807037353515625, -0.3452796936035156, -0.332489013671875, -0.3196983337402344, -0.30690765380859375, -0.2941169738769531, -0.2813262939453125, -0.2685356140136719, -0.25574493408203125, -0.24295425415039062, -0.23016357421875, -0.21737289428710938, -0.20458221435546875, -0.19179153442382812, -0.1790008544921875, -0.16621017456054688, -0.15341949462890625, -0.14062881469726562, -0.127838134765625, -0.11504745483398438, -0.10225677490234375, -0.08946609497070312, -0.0766754150390625, -0.06388473510742188, -0.05109405517578125, -0.038303375244140625, -0.0255126953125, -0.012722015380859375, 6.866455078125e-05, 0.012859344482421875, 0.0256500244140625, 0.038440704345703125, 0.05123138427734375, 0.06402206420898438, 0.076812744140625, 0.08960342407226562, 0.10239410400390625, 0.11518478393554688, 0.1279754638671875, 0.14076614379882812, 0.15355682373046875, 0.16634750366210938, 0.17913818359375, 0.19192886352539062, 0.20471954345703125, 0.21751022338867188, 0.2303009033203125, 0.24309158325195312, 0.25588226318359375, 0.2686729431152344, 0.281463623046875, 0.2942543029785156, 0.30704498291015625, 0.3198356628417969, 0.3326263427734375, 0.3454170227050781, 0.35820770263671875, 0.3709983825683594, 0.3837890625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 9.0, 11.0, 11.0, 18.0, 17.0, 18.0, 24.0, 31.0, 37.0, 30.0, 34.0, 43.0, 48.0, 54.0, 52.0, 69.0, 57.0, 44.0, 45.0, 53.0, 45.0, 44.0, 23.0, 34.0, 20.0, 25.0, 18.0, 17.0, 12.0, 9.0, 12.0, 7.0, 4.0, 7.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1953125, -0.18858718872070312, -0.18186187744140625, -0.17513656616210938, -0.1684112548828125, -0.16168594360351562, -0.15496063232421875, -0.14823532104492188, -0.141510009765625, -0.13478469848632812, -0.12805938720703125, -0.12133407592773438, -0.1146087646484375, -0.10788345336914062, -0.10115814208984375, -0.09443283081054688, -0.08770751953125, -0.08098220825195312, -0.07425689697265625, -0.06753158569335938, -0.0608062744140625, -0.054080963134765625, -0.04735565185546875, -0.040630340576171875, -0.033905029296875, -0.027179718017578125, -0.02045440673828125, -0.013729095458984375, -0.0070037841796875, -0.000278472900390625, 0.00644683837890625, 0.013172149658203125, 0.0198974609375, 0.026622772216796875, 0.03334808349609375, 0.040073394775390625, 0.0467987060546875, 0.053524017333984375, 0.06024932861328125, 0.06697463989257812, 0.073699951171875, 0.08042526245117188, 0.08715057373046875, 0.09387588500976562, 0.1006011962890625, 0.10732650756835938, 0.11405181884765625, 0.12077713012695312, 0.12750244140625, 0.13422775268554688, 0.14095306396484375, 0.14767837524414062, 0.1544036865234375, 0.16112899780273438, 0.16785430908203125, 0.17457962036132812, 0.181304931640625, 0.18803024291992188, 0.19475555419921875, 0.20148086547851562, 0.2082061767578125, 0.21493148803710938, 0.22165679931640625, 0.22838211059570312, 0.235107421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 6.0, 8.0, 11.0, 14.0, 15.0, 24.0, 32.0, 54.0, 73.0, 107.0, 189.0, 250.0, 407.0, 680.0, 1163.0, 2266.0, 5906.0, 29706.0, 318977.0, 624739.0, 49663.0, 8013.0, 2752.0, 1369.0, 753.0, 501.0, 298.0, 188.0, 116.0, 93.0, 55.0, 40.0, 27.0, 17.0, 13.0, 4.0, 10.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6513671875, -0.6264266967773438, -0.6014862060546875, -0.5765457153320312, -0.551605224609375, -0.5266647338867188, -0.5017242431640625, -0.47678375244140625, -0.45184326171875, -0.42690277099609375, -0.4019622802734375, -0.37702178955078125, -0.352081298828125, -0.32714080810546875, -0.3022003173828125, -0.27725982666015625, -0.2523193359375, -0.22737884521484375, -0.2024383544921875, -0.17749786376953125, -0.152557373046875, -0.12761688232421875, -0.1026763916015625, -0.07773590087890625, -0.05279541015625, -0.02785491943359375, -0.0029144287109375, 0.02202606201171875, 0.046966552734375, 0.07190704345703125, 0.0968475341796875, 0.12178802490234375, 0.146728515625, 0.17166900634765625, 0.1966094970703125, 0.22154998779296875, 0.246490478515625, 0.27143096923828125, 0.2963714599609375, 0.32131195068359375, 0.34625244140625, 0.37119293212890625, 0.3961334228515625, 0.42107391357421875, 0.446014404296875, 0.47095489501953125, 0.4958953857421875, 0.5208358764648438, 0.5457763671875, 0.5707168579101562, 0.5956573486328125, 0.6205978393554688, 0.645538330078125, 0.6704788208007812, 0.6954193115234375, 0.7203598022460938, 0.74530029296875, 0.7702407836914062, 0.7951812744140625, 0.8201217651367188, 0.845062255859375, 0.8700027465820312, 0.8949432373046875, 0.9198837280273438, 0.94482421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 4.0, 12.0, 11.0, 6.0, 14.0, 17.0, 25.0, 23.0, 35.0, 36.0, 47.0, 30.0, 42.0, 40.0, 60.0, 56.0, 50.0, 68.0, 45.0, 48.0, 46.0, 52.0, 38.0, 26.0, 32.0, 24.0, 16.0, 18.0, 20.0, 12.0, 12.0, 3.0, 6.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.91162109375, -0.88262939453125, -0.8536376953125, -0.82464599609375, -0.795654296875, -0.76666259765625, -0.7376708984375, -0.70867919921875, -0.6796875, -0.65069580078125, -0.6217041015625, -0.59271240234375, -0.563720703125, -0.53472900390625, -0.5057373046875, -0.47674560546875, -0.44775390625, -0.41876220703125, -0.3897705078125, -0.36077880859375, -0.331787109375, -0.30279541015625, -0.2738037109375, -0.24481201171875, -0.2158203125, -0.18682861328125, -0.1578369140625, -0.12884521484375, -0.099853515625, -0.07086181640625, -0.0418701171875, -0.01287841796875, 0.01611328125, 0.04510498046875, 0.0740966796875, 0.10308837890625, 0.132080078125, 0.16107177734375, 0.1900634765625, 0.21905517578125, 0.248046875, 0.27703857421875, 0.3060302734375, 0.33502197265625, 0.364013671875, 0.39300537109375, 0.4219970703125, 0.45098876953125, 0.47998046875, 0.50897216796875, 0.5379638671875, 0.56695556640625, 0.595947265625, 0.62493896484375, 0.6539306640625, 0.68292236328125, 0.7119140625, 0.74090576171875, 0.7698974609375, 0.79888916015625, 0.827880859375, 0.85687255859375, 0.8858642578125, 0.91485595703125, 0.94384765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 8.0, 9.0, 12.0, 18.0, 31.0, 45.0, 59.0, 90.0, 157.0, 263.0, 517.0, 1306.0, 4858.0, 36763.0, 693387.0, 285819.0, 19924.0, 3196.0, 1049.0, 431.0, 223.0, 107.0, 70.0, 45.0, 51.0, 32.0, 22.0, 19.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30908203125, -0.2996788024902344, -0.29027557373046875, -0.2808723449707031, -0.2714691162109375, -0.2620658874511719, -0.25266265869140625, -0.24325942993164062, -0.233856201171875, -0.22445297241210938, -0.21504974365234375, -0.20564651489257812, -0.1962432861328125, -0.18684005737304688, -0.17743682861328125, -0.16803359985351562, -0.15863037109375, -0.14922714233398438, -0.13982391357421875, -0.13042068481445312, -0.1210174560546875, -0.11161422729492188, -0.10221099853515625, -0.09280776977539062, -0.083404541015625, -0.07400131225585938, -0.06459808349609375, -0.055194854736328125, -0.0457916259765625, -0.036388397216796875, -0.02698516845703125, -0.017581939697265625, -0.0081787109375, 0.001224517822265625, 0.01062774658203125, 0.020030975341796875, 0.0294342041015625, 0.038837432861328125, 0.04824066162109375, 0.057643890380859375, 0.067047119140625, 0.07645034790039062, 0.08585357666015625, 0.09525680541992188, 0.1046600341796875, 0.11406326293945312, 0.12346649169921875, 0.13286972045898438, 0.14227294921875, 0.15167617797851562, 0.16107940673828125, 0.17048263549804688, 0.1798858642578125, 0.18928909301757812, 0.19869232177734375, 0.20809555053710938, 0.217498779296875, 0.22690200805664062, 0.23630523681640625, 0.24570846557617188, 0.2551116943359375, 0.2645149230957031, 0.27391815185546875, 0.2833213806152344, 0.292724609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 14.0, 11.0, 15.0, 15.0, 22.0, 22.0, 25.0, 34.0, 48.0, 70.0, 70.0, 99.0, 83.0, 79.0, 77.0, 55.0, 58.0, 33.0, 26.0, 23.0, 21.0, 13.0, 15.0, 12.0, 8.0, 6.0, 10.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.604194641113281e-05, -6.37182965874672e-05, -6.139464676380157e-05, -5.9070996940135956e-05, -5.674734711647034e-05, -5.442369729280472e-05, -5.21000474691391e-05, -4.977639764547348e-05, -4.745274782180786e-05, -4.512909799814224e-05, -4.2805448174476624e-05, -4.0481798350811005e-05, -3.8158148527145386e-05, -3.583449870347977e-05, -3.351084887981415e-05, -3.118719905614853e-05, -2.886354923248291e-05, -2.653989940881729e-05, -2.4216249585151672e-05, -2.1892599761486053e-05, -1.9568949937820435e-05, -1.7245300114154816e-05, -1.4921650290489197e-05, -1.2598000466823578e-05, -1.0274350643157959e-05, -7.95070081949234e-06, -5.627050995826721e-06, -3.3034011721611023e-06, -9.797513484954834e-07, 1.3438984751701355e-06, 3.6675482988357544e-06, 5.991198122501373e-06, 8.314847946166992e-06, 1.0638497769832611e-05, 1.296214759349823e-05, 1.528579741716385e-05, 1.7609447240829468e-05, 1.9933097064495087e-05, 2.2256746888160706e-05, 2.4580396711826324e-05, 2.6904046535491943e-05, 2.9227696359157562e-05, 3.155134618282318e-05, 3.38749960064888e-05, 3.619864583015442e-05, 3.852229565382004e-05, 4.084594547748566e-05, 4.3169595301151276e-05, 4.5493245124816895e-05, 4.7816894948482513e-05, 5.014054477214813e-05, 5.246419459581375e-05, 5.478784441947937e-05, 5.711149424314499e-05, 5.943514406681061e-05, 6.175879389047623e-05, 6.408244371414185e-05, 6.640609353780746e-05, 6.872974336147308e-05, 7.10533931851387e-05, 7.337704300880432e-05, 7.570069283246994e-05, 7.802434265613556e-05, 8.034799247980118e-05, 8.26716423034668e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 15.0, 11.0, 10.0, 20.0, 27.0, 29.0, 49.0, 76.0, 98.0, 128.0, 200.0, 307.0, 564.0, 982.0, 1916.0, 4571.0, 13771.0, 67545.0, 650384.0, 257735.0, 34546.0, 8911.0, 3072.0, 1398.0, 784.0, 448.0, 303.0, 187.0, 113.0, 103.0, 65.0, 51.0, 41.0, 20.0, 18.0, 11.0, 14.0, 5.0, 6.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.2322998046875, -0.22542953491210938, -0.21855926513671875, -0.21168899536132812, -0.2048187255859375, -0.19794845581054688, -0.19107818603515625, -0.18420791625976562, -0.177337646484375, -0.17046737670898438, -0.16359710693359375, -0.15672683715820312, -0.1498565673828125, -0.14298629760742188, -0.13611602783203125, -0.12924575805664062, -0.12237548828125, -0.11550521850585938, -0.10863494873046875, -0.10176467895507812, -0.0948944091796875, -0.08802413940429688, -0.08115386962890625, -0.07428359985351562, -0.067413330078125, -0.060543060302734375, -0.05367279052734375, -0.046802520751953125, -0.0399322509765625, -0.033061981201171875, -0.02619171142578125, -0.019321441650390625, -0.012451171875, -0.005580902099609375, 0.00128936767578125, 0.008159637451171875, 0.0150299072265625, 0.021900177001953125, 0.02877044677734375, 0.035640716552734375, 0.042510986328125, 0.049381256103515625, 0.05625152587890625, 0.06312179565429688, 0.0699920654296875, 0.07686233520507812, 0.08373260498046875, 0.09060287475585938, 0.09747314453125, 0.10434341430664062, 0.11121368408203125, 0.11808395385742188, 0.1249542236328125, 0.13182449340820312, 0.13869476318359375, 0.14556503295898438, 0.152435302734375, 0.15930557250976562, 0.16617584228515625, 0.17304611206054688, 0.1799163818359375, 0.18678665161132812, 0.19365692138671875, 0.20052719116210938, 0.2073974609375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 8.0, 5.0, 6.0, 10.0, 7.0, 14.0, 20.0, 28.0, 28.0, 37.0, 48.0, 46.0, 64.0, 72.0, 75.0, 75.0, 74.0, 63.0, 59.0, 52.0, 46.0, 28.0, 27.0, 23.0, 16.0, 16.0, 15.0, 6.0, 6.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2313232421875, -0.22442626953125, -0.217529296875, -0.21063232421875, -0.2037353515625, -0.19683837890625, -0.18994140625, -0.18304443359375, -0.1761474609375, -0.16925048828125, -0.162353515625, -0.15545654296875, -0.1485595703125, -0.14166259765625, -0.134765625, -0.12786865234375, -0.1209716796875, -0.11407470703125, -0.107177734375, -0.10028076171875, -0.0933837890625, -0.08648681640625, -0.07958984375, -0.07269287109375, -0.0657958984375, -0.05889892578125, -0.052001953125, -0.04510498046875, -0.0382080078125, -0.03131103515625, -0.0244140625, -0.01751708984375, -0.0106201171875, -0.00372314453125, 0.003173828125, 0.01007080078125, 0.0169677734375, 0.02386474609375, 0.03076171875, 0.03765869140625, 0.0445556640625, 0.05145263671875, 0.058349609375, 0.06524658203125, 0.0721435546875, 0.07904052734375, 0.0859375, 0.09283447265625, 0.0997314453125, 0.10662841796875, 0.113525390625, 0.12042236328125, 0.1273193359375, 0.13421630859375, 0.14111328125, 0.14801025390625, 0.1549072265625, 0.16180419921875, 0.168701171875, 0.17559814453125, 0.1824951171875, 0.18939208984375, 0.1962890625, 0.20318603515625, 0.2100830078125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 17.0, 29.0, 93.0, 230.0, 316.0, 193.0, 60.0, 30.0, 10.0, 8.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.631749153137207, -6.396434307098389, -6.16111946105957, -5.92580509185791, -5.690490245819092, -5.455175399780273, -5.219860553741455, -4.984545707702637, -4.749230861663818, -4.513916015625, -4.278601169586182, -4.043286323547363, -3.807971715927124, -3.5726571083068848, -3.3373422622680664, -3.102027416229248, -2.866712808609009, -2.6313979625701904, -2.396083354949951, -2.160768508911133, -1.9254536628723145, -1.6901389360427856, -1.4548242092132568, -1.2195093631744385, -0.9841946363449097, -0.7488798499107361, -0.5135650634765625, -0.2782503366470337, -0.04293555021286011, 0.19237923622131348, 0.4276939630508423, 0.6630088090896606, 0.8983235359191895, 1.1336382627487183, 1.3689531087875366, 1.6042678356170654, 1.8395826816558838, 2.074897289276123, 2.3102121353149414, 2.5455269813537598, 2.780841827392578, 3.0161566734313965, 3.2514712810516357, 3.486786127090454, 3.7221009731292725, 3.9574155807495117, 4.19273042678833, 4.428045272827148, 4.663359642028809, 4.898674488067627, 5.133989334106445, 5.3693037033081055, 5.604618549346924, 5.839933395385742, 6.0752482414245605, 6.310563087463379, 6.545877933502197, 6.781192779541016, 7.016507625579834, 7.251822471618652, 7.4871368408203125, 7.722451686859131, 7.957766532897949, 8.19308090209961, 8.428396224975586]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 6.0, 3.0, 6.0, 8.0, 4.0, 15.0, 16.0, 17.0, 12.0, 15.0, 19.0, 24.0, 21.0, 44.0, 38.0, 41.0, 44.0, 61.0, 65.0, 72.0, 73.0, 46.0, 27.0, 48.0, 29.0, 24.0, 34.0, 32.0, 21.0, 16.0, 24.0, 27.0, 17.0, 10.0, 10.0, 7.0, 11.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.701176643371582, -2.6003732681274414, -2.4995696544647217, -2.398766279220581, -2.2979626655578613, -2.1971592903137207, -2.09635591506958, -1.99555242061615, -1.8947489261627197, -1.7939454317092896, -1.6931419372558594, -1.5923385620117188, -1.4915350675582886, -1.3907315731048584, -1.2899281978607178, -1.1891247034072876, -1.0883212089538574, -0.9875177145004272, -0.8867142796516418, -0.7859108448028564, -0.6851073503494263, -0.5843038558959961, -0.4835004210472107, -0.3826969861984253, -0.2818934917449951, -0.18109002709388733, -0.08028656244277954, 0.020516902208328247, 0.12132036685943604, 0.2221238613128662, 0.3229272961616516, 0.423730731010437, 0.5245342254638672, 0.6253377199172974, 0.7261411547660828, 0.8269445896148682, 0.9277480840682983, 1.0285515785217285, 1.1293549537658691, 1.2301584482192993, 1.3309619426727295, 1.4317654371261597, 1.5325689315795898, 1.6333723068237305, 1.7341758012771606, 1.8349792957305908, 1.9357826709747314, 2.036586284637451, 2.137389659881592, 2.2381930351257324, 2.338996648788452, 2.4398000240325928, 2.5406036376953125, 2.641407012939453, 2.7422103881835938, 2.8430137634277344, 2.943817377090454, 3.0446207523345947, 3.1454243659973145, 3.246227741241455, 3.3470311164855957, 3.4478347301483154, 3.548638105392456, 3.649441719055176, 3.7502450942993164]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 27.0, 18.0, 34.0, 86.0, 160.0, 308.0, 624.0, 1425.0, 3611.0, 11059.0, 41428.0, 259560.0, 2376539.0, 1336972.0, 125466.0, 24991.0, 7160.0, 2611.0, 1114.0, 494.0, 242.0, 138.0, 80.0, 43.0, 22.0, 17.0, 13.0, 13.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0], "bins": [-0.42236328125, -0.4120197296142578, -0.4016761779785156, -0.39133262634277344, -0.38098907470703125, -0.37064552307128906, -0.3603019714355469, -0.3499584197998047, -0.3396148681640625, -0.3292713165283203, -0.3189277648925781, -0.30858421325683594, -0.29824066162109375, -0.28789710998535156, -0.2775535583496094, -0.2672100067138672, -0.256866455078125, -0.2465229034423828, -0.23617935180664062, -0.22583580017089844, -0.21549224853515625, -0.20514869689941406, -0.19480514526367188, -0.1844615936279297, -0.1741180419921875, -0.1637744903564453, -0.15343093872070312, -0.14308738708496094, -0.13274383544921875, -0.12240028381347656, -0.11205673217773438, -0.10171318054199219, -0.09136962890625, -0.08102607727050781, -0.07068252563476562, -0.06033897399902344, -0.04999542236328125, -0.03965187072753906, -0.029308319091796875, -0.018964767456054688, -0.0086212158203125, 0.0017223358154296875, 0.012065887451171875, 0.022409439086914062, 0.03275299072265625, 0.04309654235839844, 0.053440093994140625, 0.06378364562988281, 0.074127197265625, 0.08447074890136719, 0.09481430053710938, 0.10515785217285156, 0.11550140380859375, 0.12584495544433594, 0.13618850708007812, 0.1465320587158203, 0.1568756103515625, 0.1672191619873047, 0.17756271362304688, 0.18790626525878906, 0.19824981689453125, 0.20859336853027344, 0.21893692016601562, 0.2292804718017578, 0.2396240234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 13.0, 8.0, 6.0, 13.0, 23.0, 22.0, 25.0, 25.0, 39.0, 28.0, 45.0, 49.0, 53.0, 54.0, 52.0, 37.0, 55.0, 35.0, 49.0, 38.0, 41.0, 51.0, 32.0, 35.0, 34.0, 24.0, 20.0, 20.0, 11.0, 11.0, 9.0, 11.0, 7.0, 2.0, 4.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1822509765625, -0.17580413818359375, -0.1693572998046875, -0.16291046142578125, -0.156463623046875, -0.15001678466796875, -0.1435699462890625, -0.13712310791015625, -0.13067626953125, -0.12422943115234375, -0.1177825927734375, -0.11133575439453125, -0.104888916015625, -0.09844207763671875, -0.0919952392578125, -0.08554840087890625, -0.0791015625, -0.07265472412109375, -0.0662078857421875, -0.05976104736328125, -0.053314208984375, -0.04686737060546875, -0.0404205322265625, -0.03397369384765625, -0.02752685546875, -0.02108001708984375, -0.0146331787109375, -0.00818634033203125, -0.001739501953125, 0.00470733642578125, 0.0111541748046875, 0.01760101318359375, 0.0240478515625, 0.03049468994140625, 0.0369415283203125, 0.04338836669921875, 0.049835205078125, 0.05628204345703125, 0.0627288818359375, 0.06917572021484375, 0.07562255859375, 0.08206939697265625, 0.0885162353515625, 0.09496307373046875, 0.101409912109375, 0.10785675048828125, 0.1143035888671875, 0.12075042724609375, 0.127197265625, 0.13364410400390625, 0.1400909423828125, 0.14653778076171875, 0.152984619140625, 0.15943145751953125, 0.1658782958984375, 0.17232513427734375, 0.17877197265625, 0.18521881103515625, 0.1916656494140625, 0.19811248779296875, 0.204559326171875, 0.21100616455078125, 0.2174530029296875, 0.22389984130859375, 0.2303466796875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 6.0, 2.0, 8.0, 23.0, 22.0, 40.0, 44.0, 88.0, 159.0, 295.0, 618.0, 1547.0, 4347.0, 15948.0, 82112.0, 1180197.0, 2719138.0, 153564.0, 25637.0, 6447.0, 2175.0, 892.0, 405.0, 225.0, 122.0, 82.0, 50.0, 29.0, 20.0, 12.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.344482421875, -0.3307838439941406, -0.31708526611328125, -0.3033866882324219, -0.2896881103515625, -0.2759895324707031, -0.26229095458984375, -0.24859237670898438, -0.234893798828125, -0.22119522094726562, -0.20749664306640625, -0.19379806518554688, -0.1800994873046875, -0.16640090942382812, -0.15270233154296875, -0.13900375366210938, -0.12530517578125, -0.11160659790039062, -0.09790802001953125, -0.08420944213867188, -0.0705108642578125, -0.056812286376953125, -0.04311370849609375, -0.029415130615234375, -0.015716552734375, -0.002017974853515625, 0.01168060302734375, 0.025379180908203125, 0.0390777587890625, 0.052776336669921875, 0.06647491455078125, 0.08017349243164062, 0.0938720703125, 0.10757064819335938, 0.12126922607421875, 0.13496780395507812, 0.1486663818359375, 0.16236495971679688, 0.17606353759765625, 0.18976211547851562, 0.203460693359375, 0.21715927124023438, 0.23085784912109375, 0.24455642700195312, 0.2582550048828125, 0.2719535827636719, 0.28565216064453125, 0.2993507385253906, 0.31304931640625, 0.3267478942871094, 0.34044647216796875, 0.3541450500488281, 0.3678436279296875, 0.3815422058105469, 0.39524078369140625, 0.4089393615722656, 0.422637939453125, 0.4363365173339844, 0.45003509521484375, 0.4637336730957031, 0.4774322509765625, 0.4911308288574219, 0.5048294067382812, 0.5185279846191406, 0.5322265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 10.0, 12.0, 13.0, 16.0, 22.0, 37.0, 61.0, 82.0, 161.0, 239.0, 407.0, 717.0, 838.0, 571.0, 366.0, 171.0, 110.0, 79.0, 40.0, 31.0, 22.0, 12.0, 18.0, 12.0, 5.0, 9.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3916015625, -0.375457763671875, -0.35931396484375, -0.343170166015625, -0.3270263671875, -0.310882568359375, -0.29473876953125, -0.278594970703125, -0.262451171875, -0.246307373046875, -0.23016357421875, -0.214019775390625, -0.1978759765625, -0.181732177734375, -0.16558837890625, -0.149444580078125, -0.13330078125, -0.117156982421875, -0.10101318359375, -0.084869384765625, -0.0687255859375, -0.052581787109375, -0.03643798828125, -0.020294189453125, -0.004150390625, 0.011993408203125, 0.02813720703125, 0.044281005859375, 0.0604248046875, 0.076568603515625, 0.09271240234375, 0.108856201171875, 0.125, 0.141143798828125, 0.15728759765625, 0.173431396484375, 0.1895751953125, 0.205718994140625, 0.22186279296875, 0.238006591796875, 0.254150390625, 0.270294189453125, 0.28643798828125, 0.302581787109375, 0.3187255859375, 0.334869384765625, 0.35101318359375, 0.367156982421875, 0.38330078125, 0.399444580078125, 0.41558837890625, 0.431732177734375, 0.4478759765625, 0.464019775390625, 0.48016357421875, 0.496307373046875, 0.512451171875, 0.528594970703125, 0.54473876953125, 0.560882568359375, 0.5770263671875, 0.593170166015625, 0.60931396484375, 0.625457763671875, 0.6416015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 27.0, 62.0, 159.0, 346.0, 247.0, 116.0, 18.0, 7.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.518516540527344, -8.265787124633789, -8.013056755065918, -7.760326862335205, -7.507596969604492, -7.254867076873779, -7.002137184143066, -6.749407768249512, -6.496677398681641, -6.243947505950928, -5.991217613220215, -5.738487720489502, -5.485757827758789, -5.233027935028076, -4.980298042297363, -4.727568626403809, -4.474838733673096, -4.222108840942383, -3.96937894821167, -3.716649055480957, -3.463919162750244, -3.2111892700195312, -2.9584596157073975, -2.7057297229766846, -2.4529998302459717, -2.200269937515259, -1.947540044784546, -1.6948102712631226, -1.4420803785324097, -1.1893504858016968, -0.9366207122802734, -0.6838908195495605, -0.43116092681884766, -0.17843106389045715, 0.07429879903793335, 0.32702863216400146, 0.5797585248947144, 0.8324884176254272, 1.0852181911468506, 1.3379480838775635, 1.5906779766082764, 1.8434078693389893, 2.096137762069702, 2.348867416381836, 2.601597309112549, 2.8543272018432617, 3.1070570945739746, 3.3597869873046875, 3.6125168800354004, 3.8652467727661133, 4.117976665496826, 4.370706558227539, 4.623436450958252, 4.876166343688965, 5.1288957595825195, 5.381626129150391, 5.634355545043945, 5.887085437774658, 6.139815330505371, 6.392545223236084, 6.645275115966797, 6.89800500869751, 7.150734901428223, 7.403464317321777, 7.656194686889648]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 11.0, 15.0, 13.0, 21.0, 22.0, 28.0, 26.0, 39.0, 52.0, 61.0, 46.0, 46.0, 57.0, 56.0, 69.0, 50.0, 62.0, 41.0, 54.0, 34.0, 25.0, 33.0, 26.0, 15.0, 24.0, 16.0, 16.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.970703125, -1.888615369796753, -1.8065276145935059, -1.7244398593902588, -1.6423521041870117, -1.5602643489837646, -1.4781767129898071, -1.39608895778656, -1.314001202583313, -1.231913447380066, -1.1498256921768188, -1.0677379369735718, -0.9856502413749695, -0.9035624861717224, -0.8214747905731201, -0.739387035369873, -0.657299280166626, -0.5752115249633789, -0.4931237995624542, -0.41103607416152954, -0.32894831895828247, -0.2468605637550354, -0.16477283835411072, -0.08268511295318604, -0.0005973577499389648, 0.08149038255214691, 0.1635781228542328, 0.24566586315631866, 0.32775360345840454, 0.4098413586616516, 0.4919290840625763, 0.574016809463501, 0.656104326248169, 0.738192081451416, 0.8202798366546631, 0.9023675322532654, 0.9844552874565125, 1.0665431022644043, 1.1486307382583618, 1.2307184934616089, 1.312806248664856, 1.394894003868103, 1.47698175907135, 1.5590695142745972, 1.6411571502685547, 1.7232449054718018, 1.8053326606750488, 1.887420415878296, 1.969508171081543, 2.05159592628479, 2.133683681488037, 2.215771436691284, 2.2978591918945312, 2.3799469470977783, 2.4620347023010254, 2.5441222190856934, 2.6262102127075195, 2.7082979679107666, 2.7903857231140137, 2.8724734783172607, 2.954561233520508, 3.036648988723755, 3.118736743927002, 3.20082426071167, 3.282912015914917]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 15.0, 10.0, 15.0, 20.0, 47.0, 44.0, 65.0, 150.0, 256.0, 421.0, 865.0, 1564.0, 3130.0, 7145.0, 18222.0, 51281.0, 155912.0, 374972.0, 282270.0, 97298.0, 32671.0, 12029.0, 5084.0, 2300.0, 1195.0, 674.0, 352.0, 207.0, 111.0, 72.0, 48.0, 26.0, 22.0, 15.0, 11.0, 3.0, 4.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.3449516296386719, -0.33296966552734375, -0.3209877014160156, -0.3090057373046875, -0.2970237731933594, -0.28504180908203125, -0.2730598449707031, -0.261077880859375, -0.24909591674804688, -0.23711395263671875, -0.22513198852539062, -0.2131500244140625, -0.20116806030273438, -0.18918609619140625, -0.17720413208007812, -0.16522216796875, -0.15324020385742188, -0.14125823974609375, -0.12927627563476562, -0.1172943115234375, -0.10531234741210938, -0.09333038330078125, -0.08134841918945312, -0.069366455078125, -0.057384490966796875, -0.04540252685546875, -0.033420562744140625, -0.0214385986328125, -0.009456634521484375, 0.00252532958984375, 0.014507293701171875, 0.0264892578125, 0.038471221923828125, 0.05045318603515625, 0.062435150146484375, 0.0744171142578125, 0.08639907836914062, 0.09838104248046875, 0.11036300659179688, 0.122344970703125, 0.13432693481445312, 0.14630889892578125, 0.15829086303710938, 0.1702728271484375, 0.18225479125976562, 0.19423675537109375, 0.20621871948242188, 0.21820068359375, 0.23018264770507812, 0.24216461181640625, 0.2541465759277344, 0.2661285400390625, 0.2781105041503906, 0.29009246826171875, 0.3020744323730469, 0.314056396484375, 0.3260383605957031, 0.33802032470703125, 0.3500022888183594, 0.3619842529296875, 0.3739662170410156, 0.38594818115234375, 0.3979301452636719, 0.409912109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 4.0, 14.0, 12.0, 9.0, 13.0, 14.0, 21.0, 22.0, 28.0, 22.0, 38.0, 37.0, 31.0, 46.0, 56.0, 62.0, 58.0, 35.0, 54.0, 45.0, 54.0, 45.0, 29.0, 33.0, 44.0, 21.0, 22.0, 20.0, 25.0, 15.0, 11.0, 10.0, 15.0, 5.0, 7.0, 6.0, 4.0, 2.0, 6.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.17333984375, -0.16707801818847656, -0.16081619262695312, -0.1545543670654297, -0.14829254150390625, -0.1420307159423828, -0.13576889038085938, -0.12950706481933594, -0.1232452392578125, -0.11698341369628906, -0.11072158813476562, -0.10445976257324219, -0.09819793701171875, -0.09193611145019531, -0.08567428588867188, -0.07941246032714844, -0.073150634765625, -0.06688880920410156, -0.060626983642578125, -0.05436515808105469, -0.04810333251953125, -0.04184150695800781, -0.035579681396484375, -0.029317855834960938, -0.0230560302734375, -0.016794204711914062, -0.010532379150390625, -0.0042705535888671875, 0.00199127197265625, 0.008253097534179688, 0.014514923095703125, 0.020776748657226562, 0.02703857421875, 0.03330039978027344, 0.039562225341796875, 0.04582405090332031, 0.05208587646484375, 0.05834770202636719, 0.06460952758789062, 0.07087135314941406, 0.0771331787109375, 0.08339500427246094, 0.08965682983398438, 0.09591865539550781, 0.10218048095703125, 0.10844230651855469, 0.11470413208007812, 0.12096595764160156, 0.127227783203125, 0.13348960876464844, 0.13975143432617188, 0.1460132598876953, 0.15227508544921875, 0.1585369110107422, 0.16479873657226562, 0.17106056213378906, 0.1773223876953125, 0.18358421325683594, 0.18984603881835938, 0.1961078643798828, 0.20236968994140625, 0.2086315155029297, 0.21489334106445312, 0.22115516662597656, 0.2274169921875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 8.0, 6.0, 18.0, 25.0, 27.0, 64.0, 78.0, 109.0, 207.0, 440.0, 823.0, 1715.0, 5589.0, 44368.0, 808156.0, 169996.0, 11675.0, 2815.0, 1099.0, 538.0, 307.0, 190.0, 111.0, 61.0, 48.0, 26.0, 16.0, 8.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96337890625, -0.9309616088867188, -0.8985443115234375, -0.8661270141601562, -0.833709716796875, -0.8012924194335938, -0.7688751220703125, -0.7364578247070312, -0.70404052734375, -0.6716232299804688, -0.6392059326171875, -0.6067886352539062, -0.574371337890625, -0.5419540405273438, -0.5095367431640625, -0.47711944580078125, -0.4447021484375, -0.41228485107421875, -0.3798675537109375, -0.34745025634765625, -0.315032958984375, -0.28261566162109375, -0.2501983642578125, -0.21778106689453125, -0.18536376953125, -0.15294647216796875, -0.1205291748046875, -0.08811187744140625, -0.055694580078125, -0.02327728271484375, 0.0091400146484375, 0.04155731201171875, 0.073974609375, 0.10639190673828125, 0.1388092041015625, 0.17122650146484375, 0.203643798828125, 0.23606109619140625, 0.2684783935546875, 0.30089569091796875, 0.33331298828125, 0.36573028564453125, 0.3981475830078125, 0.43056488037109375, 0.462982177734375, 0.49539947509765625, 0.5278167724609375, 0.5602340698242188, 0.5926513671875, 0.6250686645507812, 0.6574859619140625, 0.6899032592773438, 0.722320556640625, 0.7547378540039062, 0.7871551513671875, 0.8195724487304688, 0.85198974609375, 0.8844070434570312, 0.9168243408203125, 0.9492416381835938, 0.981658935546875, 1.0140762329101562, 1.0464935302734375, 1.0789108276367188, 1.111328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 9.0, 5.0, 6.0, 14.0, 25.0, 25.0, 29.0, 39.0, 40.0, 60.0, 49.0, 67.0, 65.0, 78.0, 66.0, 73.0, 66.0, 51.0, 49.0, 34.0, 39.0, 25.0, 20.0, 14.0, 15.0, 10.0, 8.0, 5.0, 6.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.251953125, -1.2189559936523438, -1.1859588623046875, -1.1529617309570312, -1.119964599609375, -1.0869674682617188, -1.0539703369140625, -1.0209732055664062, -0.98797607421875, -0.9549789428710938, -0.9219818115234375, -0.8889846801757812, -0.855987548828125, -0.8229904174804688, -0.7899932861328125, -0.7569961547851562, -0.7239990234375, -0.6910018920898438, -0.6580047607421875, -0.6250076293945312, -0.592010498046875, -0.5590133666992188, -0.5260162353515625, -0.49301910400390625, -0.46002197265625, -0.42702484130859375, -0.3940277099609375, -0.36103057861328125, -0.328033447265625, -0.29503631591796875, -0.2620391845703125, -0.22904205322265625, -0.196044921875, -0.16304779052734375, -0.1300506591796875, -0.09705352783203125, -0.064056396484375, -0.03105926513671875, 0.0019378662109375, 0.03493499755859375, 0.06793212890625, 0.10092926025390625, 0.1339263916015625, 0.16692352294921875, 0.199920654296875, 0.23291778564453125, 0.2659149169921875, 0.29891204833984375, 0.3319091796875, 0.36490631103515625, 0.3979034423828125, 0.43090057373046875, 0.463897705078125, 0.49689483642578125, 0.5298919677734375, 0.5628890991210938, 0.59588623046875, 0.6288833618164062, 0.6618804931640625, 0.6948776245117188, 0.727874755859375, 0.7608718872070312, 0.7938690185546875, 0.8268661499023438, 0.85986328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 7.0, 3.0, 8.0, 16.0, 11.0, 22.0, 31.0, 44.0, 73.0, 83.0, 132.0, 270.0, 714.0, 2641.0, 20919.0, 704131.0, 303041.0, 13282.0, 1881.0, 621.0, 247.0, 135.0, 54.0, 59.0, 37.0, 30.0, 19.0, 14.0, 10.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.376708984375, -0.3649024963378906, -0.35309600830078125, -0.3412895202636719, -0.3294830322265625, -0.3176765441894531, -0.30587005615234375, -0.2940635681152344, -0.282257080078125, -0.2704505920410156, -0.25864410400390625, -0.24683761596679688, -0.2350311279296875, -0.22322463989257812, -0.21141815185546875, -0.19961166381835938, -0.18780517578125, -0.17599868774414062, -0.16419219970703125, -0.15238571166992188, -0.1405792236328125, -0.12877273559570312, -0.11696624755859375, -0.10515975952148438, -0.093353271484375, -0.08154678344726562, -0.06974029541015625, -0.057933807373046875, -0.0461273193359375, -0.034320831298828125, -0.02251434326171875, -0.010707855224609375, 0.0010986328125, 0.012905120849609375, 0.02471160888671875, 0.036518096923828125, 0.0483245849609375, 0.060131072998046875, 0.07193756103515625, 0.08374404907226562, 0.095550537109375, 0.10735702514648438, 0.11916351318359375, 0.13097000122070312, 0.1427764892578125, 0.15458297729492188, 0.16638946533203125, 0.17819595336914062, 0.19000244140625, 0.20180892944335938, 0.21361541748046875, 0.22542190551757812, 0.2372283935546875, 0.24903488159179688, 0.26084136962890625, 0.2726478576660156, 0.284454345703125, 0.2962608337402344, 0.30806732177734375, 0.3198738098144531, 0.3316802978515625, 0.3434867858886719, 0.35529327392578125, 0.3670997619628906, 0.37890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 2.0, 4.0, 6.0, 8.0, 8.0, 17.0, 16.0, 20.0, 26.0, 47.0, 60.0, 73.0, 102.0, 117.0, 105.0, 98.0, 90.0, 54.0, 34.0, 27.0, 27.0, 14.0, 10.0, 8.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.863210678100586e-05, -8.602812886238098e-05, -8.34241509437561e-05, -8.082017302513123e-05, -7.821619510650635e-05, -7.561221718788147e-05, -7.300823926925659e-05, -7.040426135063171e-05, -6.780028343200684e-05, -6.519630551338196e-05, -6.259232759475708e-05, -5.99883496761322e-05, -5.7384371757507324e-05, -5.4780393838882446e-05, -5.217641592025757e-05, -4.957243800163269e-05, -4.696846008300781e-05, -4.4364482164382935e-05, -4.176050424575806e-05, -3.915652632713318e-05, -3.65525484085083e-05, -3.394857048988342e-05, -3.1344592571258545e-05, -2.8740614652633667e-05, -2.613663673400879e-05, -2.353265881538391e-05, -2.0928680896759033e-05, -1.8324702978134155e-05, -1.5720725059509277e-05, -1.31167471408844e-05, -1.0512769222259521e-05, -7.908791303634644e-06, -5.304813385009766e-06, -2.7008354663848877e-06, -9.685754776000977e-08, 2.507120370864868e-06, 5.111098289489746e-06, 7.715076208114624e-06, 1.0319054126739502e-05, 1.292303204536438e-05, 1.5527009963989258e-05, 1.8130987882614136e-05, 2.0734965801239014e-05, 2.333894371986389e-05, 2.594292163848877e-05, 2.8546899557113647e-05, 3.1150877475738525e-05, 3.37548553943634e-05, 3.635883331298828e-05, 3.896281123161316e-05, 4.156678915023804e-05, 4.4170767068862915e-05, 4.677474498748779e-05, 4.937872290611267e-05, 5.198270082473755e-05, 5.458667874336243e-05, 5.7190656661987305e-05, 5.979463458061218e-05, 6.239861249923706e-05, 6.500259041786194e-05, 6.760656833648682e-05, 7.02105462551117e-05, 7.281452417373657e-05, 7.541850209236145e-05, 7.802248001098633e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 8.0, 7.0, 13.0, 10.0, 23.0, 34.0, 45.0, 76.0, 95.0, 184.0, 302.0, 533.0, 1133.0, 2919.0, 11169.0, 72517.0, 777542.0, 156713.0, 18038.0, 4161.0, 1461.0, 633.0, 341.0, 221.0, 120.0, 82.0, 49.0, 42.0, 34.0, 14.0, 13.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.238037109375, -0.2302703857421875, -0.222503662109375, -0.2147369384765625, -0.20697021484375, -0.1992034912109375, -0.191436767578125, -0.1836700439453125, -0.1759033203125, -0.1681365966796875, -0.160369873046875, -0.1526031494140625, -0.14483642578125, -0.1370697021484375, -0.129302978515625, -0.1215362548828125, -0.11376953125, -0.1060028076171875, -0.098236083984375, -0.0904693603515625, -0.08270263671875, -0.0749359130859375, -0.067169189453125, -0.0594024658203125, -0.0516357421875, -0.0438690185546875, -0.036102294921875, -0.0283355712890625, -0.02056884765625, -0.0128021240234375, -0.005035400390625, 0.0027313232421875, 0.010498046875, 0.0182647705078125, 0.026031494140625, 0.0337982177734375, 0.04156494140625, 0.0493316650390625, 0.057098388671875, 0.0648651123046875, 0.0726318359375, 0.0803985595703125, 0.088165283203125, 0.0959320068359375, 0.10369873046875, 0.1114654541015625, 0.119232177734375, 0.1269989013671875, 0.134765625, 0.1425323486328125, 0.150299072265625, 0.1580657958984375, 0.16583251953125, 0.1735992431640625, 0.181365966796875, 0.1891326904296875, 0.1968994140625, 0.2046661376953125, 0.212432861328125, 0.2201995849609375, 0.22796630859375, 0.2357330322265625, 0.243499755859375, 0.2512664794921875, 0.259033203125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 6.0, 2.0, 5.0, 3.0, 6.0, 10.0, 7.0, 9.0, 17.0, 21.0, 24.0, 50.0, 59.0, 88.0, 104.0, 140.0, 129.0, 100.0, 79.0, 38.0, 30.0, 21.0, 13.0, 9.0, 5.0, 7.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1881103515625, -0.1801013946533203, -0.17209243774414062, -0.16408348083496094, -0.15607452392578125, -0.14806556701660156, -0.14005661010742188, -0.1320476531982422, -0.1240386962890625, -0.11602973937988281, -0.10802078247070312, -0.10001182556152344, -0.09200286865234375, -0.08399391174316406, -0.07598495483398438, -0.06797599792480469, -0.059967041015625, -0.05195808410644531, -0.043949127197265625, -0.03594017028808594, -0.02793121337890625, -0.019922256469726562, -0.011913299560546875, -0.0039043426513671875, 0.0041046142578125, 0.012113571166992188, 0.020122528076171875, 0.028131484985351562, 0.03614044189453125, 0.04414939880371094, 0.052158355712890625, 0.06016731262207031, 0.06817626953125, 0.07618522644042969, 0.08419418334960938, 0.09220314025878906, 0.10021209716796875, 0.10822105407714844, 0.11623001098632812, 0.12423896789550781, 0.1322479248046875, 0.1402568817138672, 0.14826583862304688, 0.15627479553222656, 0.16428375244140625, 0.17229270935058594, 0.18030166625976562, 0.1883106231689453, 0.196319580078125, 0.2043285369873047, 0.21233749389648438, 0.22034645080566406, 0.22835540771484375, 0.23636436462402344, 0.24437332153320312, 0.2523822784423828, 0.2603912353515625, 0.2684001922607422, 0.2764091491699219, 0.28441810607910156, 0.29242706298828125, 0.30043601989746094, 0.3084449768066406, 0.3164539337158203, 0.324462890625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 7.0, 10.0, 7.0, 24.0, 47.0, 73.0, 119.0, 197.0, 218.0, 118.0, 69.0, 45.0, 22.0, 8.0, 10.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.646583080291748, -3.521165609359741, -3.3957483768463135, -3.2703309059143066, -3.1449134349823, -3.019495964050293, -2.8940787315368652, -2.7686612606048584, -2.6432437896728516, -2.5178263187408447, -2.392409086227417, -2.26699161529541, -2.1415741443634033, -2.0161566734313965, -1.8907394409179688, -1.765321969985962, -1.6399047374725342, -1.514487385749817, -1.38906991481781, -1.2636525630950928, -1.138235092163086, -1.0128177404403687, -0.8874003887176514, -0.7619829773902893, -0.6365655660629272, -0.5111481547355652, -0.3857307732105255, -0.26031339168548584, -0.13489598035812378, -0.009478569030761719, 0.11593878269195557, 0.24135619401931763, 0.3667736053466797, 0.49219101667404175, 0.6176084280014038, 0.7430257797241211, 0.8684431910514832, 0.9938606023788452, 1.1192779541015625, 1.2446954250335693, 1.3701127767562866, 1.495530128479004, 1.6209475994110107, 1.746364951133728, 1.8717823028564453, 1.9971997737884521, 2.122617244720459, 2.2480344772338867, 2.3734519481658936, 2.4988694190979004, 2.624286651611328, 2.749704122543335, 2.875121593475342, 3.0005388259887695, 3.1259562969207764, 3.251373767852783, 3.376791000366211, 3.5022084712982178, 3.6276257038116455, 3.7530431747436523, 3.878460645675659, 4.003878116607666, 4.129295349121094, 4.2547125816345215, 4.380130290985107]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 3.0, 5.0, 11.0, 12.0, 15.0, 10.0, 17.0, 13.0, 15.0, 20.0, 41.0, 30.0, 37.0, 30.0, 46.0, 56.0, 68.0, 65.0, 66.0, 60.0, 41.0, 41.0, 41.0, 30.0, 25.0, 35.0, 22.0, 18.0, 23.0, 16.0, 13.0, 13.0, 17.0, 11.0, 6.0, 7.0, 12.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5675745010375977, -2.4754998683929443, -2.383425235748291, -2.2913506031036377, -2.1992759704589844, -2.10720157623291, -2.0151267051696777, -1.9230523109436035, -1.8309776782989502, -1.7389030456542969, -1.6468284130096436, -1.5547537803649902, -1.4626792669296265, -1.3706046342849731, -1.2785300016403198, -1.186455488204956, -1.0943807363510132, -1.0023061037063599, -0.9102315306663513, -0.818156898021698, -0.7260823249816895, -0.6340076923370361, -0.5419330596923828, -0.44985848665237427, -0.35778385400772095, -0.26570925116539, -0.1736346334218979, -0.08156001567840576, 0.010514587163925171, 0.1025891900062561, 0.19466382265090942, 0.28673839569091797, 0.3788130283355713, 0.4708876311779022, 0.5629622340202332, 0.6550368666648865, 0.747111439704895, 0.8391860723495483, 0.9312607049942017, 1.0233352184295654, 1.1154098510742188, 1.207484483718872, 1.2995591163635254, 1.3916337490081787, 1.4837082624435425, 1.5757828950881958, 1.6678575277328491, 1.759932041168213, 1.8520067930221558, 1.944081425666809, 2.036155939102173, 2.128230571746826, 2.2203052043914795, 2.312379837036133, 2.404454469680786, 2.4965291023254395, 2.5886037349700928, 2.680678367614746, 2.7727530002593994, 2.8648276329040527, 2.956902265548706, 3.0489768981933594, 3.1410512924194336, 3.233125925064087, 3.3252005577087402]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 7.0, 8.0, 14.0, 21.0, 33.0, 62.0, 121.0, 204.0, 371.0, 756.0, 1862.0, 5478.0, 23259.0, 240094.0, 3166117.0, 702509.0, 41566.0, 7669.0, 2309.0, 870.0, 390.0, 228.0, 124.0, 77.0, 51.0, 25.0, 18.0, 16.0, 12.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3115234375, -0.29938507080078125, -0.2872467041015625, -0.27510833740234375, -0.262969970703125, -0.25083160400390625, -0.2386932373046875, -0.22655487060546875, -0.21441650390625, -0.20227813720703125, -0.1901397705078125, -0.17800140380859375, -0.165863037109375, -0.15372467041015625, -0.1415863037109375, -0.12944793701171875, -0.1173095703125, -0.10517120361328125, -0.0930328369140625, -0.08089447021484375, -0.068756103515625, -0.05661773681640625, -0.0444793701171875, -0.03234100341796875, -0.02020263671875, -0.00806427001953125, 0.0040740966796875, 0.01621246337890625, 0.028350830078125, 0.04048919677734375, 0.0526275634765625, 0.06476593017578125, 0.076904296875, 0.08904266357421875, 0.1011810302734375, 0.11331939697265625, 0.125457763671875, 0.13759613037109375, 0.1497344970703125, 0.16187286376953125, 0.17401123046875, 0.18614959716796875, 0.1982879638671875, 0.21042633056640625, 0.222564697265625, 0.23470306396484375, 0.2468414306640625, 0.25897979736328125, 0.2711181640625, 0.28325653076171875, 0.2953948974609375, 0.30753326416015625, 0.319671630859375, 0.33180999755859375, 0.3439483642578125, 0.35608673095703125, 0.36822509765625, 0.38036346435546875, 0.3925018310546875, 0.40464019775390625, 0.416778564453125, 0.42891693115234375, 0.4410552978515625, 0.45319366455078125, 0.46533203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 9.0, 10.0, 8.0, 9.0, 12.0, 23.0, 18.0, 29.0, 30.0, 28.0, 41.0, 43.0, 46.0, 58.0, 49.0, 57.0, 53.0, 53.0, 50.0, 46.0, 55.0, 38.0, 61.0, 23.0, 24.0, 27.0, 19.0, 15.0, 18.0, 9.0, 9.0, 3.0, 13.0, 6.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155517578125, -0.14900588989257812, -0.14249420166015625, -0.13598251342773438, -0.1294708251953125, -0.12295913696289062, -0.11644744873046875, -0.10993576049804688, -0.103424072265625, -0.09691238403320312, -0.09040069580078125, -0.08388900756835938, -0.0773773193359375, -0.07086563110351562, -0.06435394287109375, -0.057842254638671875, -0.05133056640625, -0.044818878173828125, -0.03830718994140625, -0.031795501708984375, -0.0252838134765625, -0.018772125244140625, -0.01226043701171875, -0.005748748779296875, 0.000762939453125, 0.007274627685546875, 0.01378631591796875, 0.020298004150390625, 0.0268096923828125, 0.033321380615234375, 0.03983306884765625, 0.046344757080078125, 0.0528564453125, 0.059368133544921875, 0.06587982177734375, 0.07239151000976562, 0.0789031982421875, 0.08541488647460938, 0.09192657470703125, 0.09843826293945312, 0.104949951171875, 0.11146163940429688, 0.11797332763671875, 0.12448501586914062, 0.1309967041015625, 0.13750839233398438, 0.14402008056640625, 0.15053176879882812, 0.15704345703125, 0.16355514526367188, 0.17006683349609375, 0.17657852172851562, 0.1830902099609375, 0.18960189819335938, 0.19611358642578125, 0.20262527465820312, 0.209136962890625, 0.21564865112304688, 0.22216033935546875, 0.22867202758789062, 0.2351837158203125, 0.24169540405273438, 0.24820709228515625, 0.2547187805175781, 0.26123046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 6.0, 4.0, 9.0, 19.0, 20.0, 31.0, 41.0, 85.0, 153.0, 308.0, 531.0, 1345.0, 4520.0, 23105.0, 312748.0, 3648657.0, 177909.0, 18173.0, 4066.0, 1318.0, 563.0, 249.0, 171.0, 89.0, 56.0, 37.0, 27.0, 16.0, 7.0, 8.0, 6.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.490478515625, -0.4743537902832031, -0.45822906494140625, -0.4421043395996094, -0.4259796142578125, -0.4098548889160156, -0.39373016357421875, -0.3776054382324219, -0.361480712890625, -0.3453559875488281, -0.32923126220703125, -0.3131065368652344, -0.2969818115234375, -0.2808570861816406, -0.26473236083984375, -0.24860763549804688, -0.23248291015625, -0.21635818481445312, -0.20023345947265625, -0.18410873413085938, -0.1679840087890625, -0.15185928344726562, -0.13573455810546875, -0.11960983276367188, -0.103485107421875, -0.08736038208007812, -0.07123565673828125, -0.055110931396484375, -0.0389862060546875, -0.022861480712890625, -0.00673675537109375, 0.009387969970703125, 0.0255126953125, 0.041637420654296875, 0.05776214599609375, 0.07388687133789062, 0.0900115966796875, 0.10613632202148438, 0.12226104736328125, 0.13838577270507812, 0.154510498046875, 0.17063522338867188, 0.18675994873046875, 0.20288467407226562, 0.2190093994140625, 0.23513412475585938, 0.25125885009765625, 0.2673835754394531, 0.28350830078125, 0.2996330261230469, 0.31575775146484375, 0.3318824768066406, 0.3480072021484375, 0.3641319274902344, 0.38025665283203125, 0.3963813781738281, 0.412506103515625, 0.4286308288574219, 0.44475555419921875, 0.4608802795410156, 0.4770050048828125, 0.4931297302246094, 0.5092544555664062, 0.5253791809082031, 0.54150390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 2.0, 10.0, 7.0, 15.0, 17.0, 31.0, 46.0, 74.0, 101.0, 165.0, 282.0, 506.0, 734.0, 708.0, 523.0, 305.0, 175.0, 104.0, 92.0, 53.0, 27.0, 18.0, 13.0, 13.0, 12.0, 9.0, 6.0, 10.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.318359375, -0.3056449890136719, -0.29293060302734375, -0.2802162170410156, -0.2675018310546875, -0.2547874450683594, -0.24207305908203125, -0.22935867309570312, -0.216644287109375, -0.20392990112304688, -0.19121551513671875, -0.17850112915039062, -0.1657867431640625, -0.15307235717773438, -0.14035797119140625, -0.12764358520507812, -0.11492919921875, -0.10221481323242188, -0.08950042724609375, -0.07678604125976562, -0.0640716552734375, -0.051357269287109375, -0.03864288330078125, -0.025928497314453125, -0.013214111328125, -0.000499725341796875, 0.01221466064453125, 0.024929046630859375, 0.0376434326171875, 0.050357818603515625, 0.06307220458984375, 0.07578659057617188, 0.0885009765625, 0.10121536254882812, 0.11392974853515625, 0.12664413452148438, 0.1393585205078125, 0.15207290649414062, 0.16478729248046875, 0.17750167846679688, 0.190216064453125, 0.20293045043945312, 0.21564483642578125, 0.22835922241210938, 0.2410736083984375, 0.2537879943847656, 0.26650238037109375, 0.2792167663574219, 0.29193115234375, 0.3046455383300781, 0.31735992431640625, 0.3300743103027344, 0.3427886962890625, 0.3555030822753906, 0.36821746826171875, 0.3809318542480469, 0.393646240234375, 0.4063606262207031, 0.41907501220703125, 0.4317893981933594, 0.4445037841796875, 0.4572181701660156, 0.46993255615234375, 0.4826469421386719, 0.495361328125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 15.0, 23.0, 65.0, 214.0, 319.0, 211.0, 87.0, 29.0, 9.0, 5.0, 9.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.889784812927246, -7.703793525695801, -7.517802715301514, -7.331811428070068, -7.145820140838623, -6.959829330444336, -6.773838043212891, -6.587846755981445, -6.40185546875, -6.215864181518555, -6.029873371124268, -5.843882083892822, -5.657890796661377, -5.47189998626709, -5.2859086990356445, -5.099917411804199, -4.913926601409912, -4.727935314178467, -4.54194450378418, -4.355953216552734, -4.169961929321289, -3.983970880508423, -3.7979798316955566, -3.6119885444641113, -3.425997495651245, -3.240006446838379, -3.0540151596069336, -2.8680241107940674, -2.682033061981201, -2.496041774749756, -2.3100507259368896, -2.1240596771240234, -1.93806791305542, -1.7520767450332642, -1.5660855770111084, -1.3800945281982422, -1.1941033601760864, -1.0081121921539307, -0.8221211433410645, -0.6361299753189087, -0.45013880729675293, -0.26414766907691956, -0.07815653085708618, 0.1078345775604248, 0.29382574558258057, 0.47981691360473633, 0.6658079624176025, 0.8517991304397583, 1.037790298461914, 1.2237814664840698, 1.4097726345062256, 1.5957636833190918, 1.7817548513412476, 1.9677460193634033, 2.1537370681762695, 2.339728355407715, 2.525719404220581, 2.7117104530334473, 2.8977017402648926, 3.083692789077759, 3.269683837890625, 3.4556751251220703, 3.6416661739349365, 3.8276572227478027, 4.013648509979248]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 8.0, 11.0, 17.0, 13.0, 16.0, 23.0, 26.0, 28.0, 41.0, 43.0, 44.0, 59.0, 45.0, 58.0, 65.0, 42.0, 52.0, 54.0, 54.0, 39.0, 55.0, 24.0, 26.0, 32.0, 16.0, 23.0, 17.0, 17.0, 13.0, 6.0, 7.0, 4.0, 1.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9379534721374512, -1.8723942041397095, -1.8068349361419678, -1.741275668144226, -1.6757164001464844, -1.6101572513580322, -1.5445979833602905, -1.4790387153625488, -1.4134794473648071, -1.3479201793670654, -1.2823609113693237, -1.216801643371582, -1.1512424945831299, -1.0856831073760986, -1.0201239585876465, -0.9545646905899048, -0.8890054225921631, -0.8234461545944214, -0.7578868865966797, -0.6923276782035828, -0.6267684102058411, -0.5612091422080994, -0.49564990401268005, -0.43009066581726074, -0.36453139781951904, -0.29897212982177734, -0.23341289162635803, -0.16785363852977753, -0.10229438543319702, -0.03673511743545532, 0.02882412075996399, 0.0943833589553833, 0.1599423885345459, 0.2255016416311264, 0.2910608947277069, 0.3566201329231262, 0.4221794009208679, 0.4877386689186096, 0.5532978773117065, 0.6188571453094482, 0.6844164133071899, 0.7499756813049316, 0.8155349493026733, 0.8810941576957703, 0.946653425693512, 1.0122127532958984, 1.0777719020843506, 1.1433311700820923, 1.208890438079834, 1.2744497060775757, 1.3400089740753174, 1.405568242073059, 1.4711275100708008, 1.536686658859253, 1.6022459268569946, 1.6678051948547363, 1.733364462852478, 1.7989237308502197, 1.8644829988479614, 1.9300422668457031, 1.9956014156341553, 2.0611608028411865, 2.1267199516296387, 2.19227933883667, 2.257838487625122]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 7.0, 4.0, 7.0, 3.0, 19.0, 20.0, 30.0, 37.0, 70.0, 108.0, 188.0, 391.0, 885.0, 2115.0, 6216.0, 23633.0, 110082.0, 446751.0, 356541.0, 76301.0, 16998.0, 4987.0, 1709.0, 695.0, 342.0, 154.0, 98.0, 49.0, 33.0, 23.0, 17.0, 6.0, 8.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.50244140625, -0.4871635437011719, -0.47188568115234375, -0.4566078186035156, -0.4413299560546875, -0.4260520935058594, -0.41077423095703125, -0.3954963684082031, -0.380218505859375, -0.3649406433105469, -0.34966278076171875, -0.3343849182128906, -0.3191070556640625, -0.3038291931152344, -0.28855133056640625, -0.2732734680175781, -0.25799560546875, -0.24271774291992188, -0.22743988037109375, -0.21216201782226562, -0.1968841552734375, -0.18160629272460938, -0.16632843017578125, -0.15105056762695312, -0.135772705078125, -0.12049484252929688, -0.10521697998046875, -0.08993911743164062, -0.0746612548828125, -0.059383392333984375, -0.04410552978515625, -0.028827667236328125, -0.0135498046875, 0.001728057861328125, 0.01700592041015625, 0.032283782958984375, 0.0475616455078125, 0.06283950805664062, 0.07811737060546875, 0.09339523315429688, 0.108673095703125, 0.12395095825195312, 0.13922882080078125, 0.15450668334960938, 0.1697845458984375, 0.18506240844726562, 0.20034027099609375, 0.21561813354492188, 0.23089599609375, 0.24617385864257812, 0.26145172119140625, 0.2767295837402344, 0.2920074462890625, 0.3072853088378906, 0.32256317138671875, 0.3378410339355469, 0.353118896484375, 0.3683967590332031, 0.38367462158203125, 0.3989524841308594, 0.4142303466796875, 0.4295082092285156, 0.44478607177734375, 0.4600639343261719, 0.475341796875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 8.0, 11.0, 11.0, 13.0, 15.0, 21.0, 16.0, 28.0, 26.0, 37.0, 32.0, 48.0, 59.0, 63.0, 53.0, 46.0, 51.0, 59.0, 50.0, 50.0, 51.0, 47.0, 42.0, 25.0, 28.0, 24.0, 21.0, 20.0, 7.0, 12.0, 5.0, 7.0, 7.0, 9.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1572265625, -0.15021896362304688, -0.14321136474609375, -0.13620376586914062, -0.1291961669921875, -0.12218856811523438, -0.11518096923828125, -0.10817337036132812, -0.101165771484375, -0.09415817260742188, -0.08715057373046875, -0.08014297485351562, -0.0731353759765625, -0.06612777709960938, -0.05912017822265625, -0.052112579345703125, -0.04510498046875, -0.038097381591796875, -0.03108978271484375, -0.024082183837890625, -0.0170745849609375, -0.010066986083984375, -0.00305938720703125, 0.003948211669921875, 0.010955810546875, 0.017963409423828125, 0.02497100830078125, 0.031978607177734375, 0.0389862060546875, 0.045993804931640625, 0.05300140380859375, 0.060009002685546875, 0.0670166015625, 0.07402420043945312, 0.08103179931640625, 0.08803939819335938, 0.0950469970703125, 0.10205459594726562, 0.10906219482421875, 0.11606979370117188, 0.123077392578125, 0.13008499145507812, 0.13709259033203125, 0.14410018920898438, 0.1511077880859375, 0.15811538696289062, 0.16512298583984375, 0.17213058471679688, 0.17913818359375, 0.18614578247070312, 0.19315338134765625, 0.20016098022460938, 0.2071685791015625, 0.21417617797851562, 0.22118377685546875, 0.22819137573242188, 0.235198974609375, 0.24220657348632812, 0.24921417236328125, 0.2562217712402344, 0.2632293701171875, 0.2702369689941406, 0.27724456787109375, 0.2842521667480469, 0.291259765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 11.0, 13.0, 19.0, 19.0, 30.0, 59.0, 64.0, 110.0, 190.0, 372.0, 815.0, 2305.0, 8158.0, 41149.0, 281695.0, 616222.0, 78070.0, 13457.0, 3577.0, 1104.0, 447.0, 227.0, 150.0, 97.0, 58.0, 40.0, 24.0, 16.0, 12.0, 12.0, 4.0, 6.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5711593627929688, -0.5539398193359375, -0.5367202758789062, -0.519500732421875, -0.5022811889648438, -0.4850616455078125, -0.46784210205078125, -0.45062255859375, -0.43340301513671875, -0.4161834716796875, -0.39896392822265625, -0.381744384765625, -0.36452484130859375, -0.3473052978515625, -0.33008575439453125, -0.3128662109375, -0.29564666748046875, -0.2784271240234375, -0.26120758056640625, -0.243988037109375, -0.22676849365234375, -0.2095489501953125, -0.19232940673828125, -0.17510986328125, -0.15789031982421875, -0.1406707763671875, -0.12345123291015625, -0.106231689453125, -0.08901214599609375, -0.0717926025390625, -0.05457305908203125, -0.037353515625, -0.02013397216796875, -0.0029144287109375, 0.01430511474609375, 0.031524658203125, 0.04874420166015625, 0.0659637451171875, 0.08318328857421875, 0.10040283203125, 0.11762237548828125, 0.1348419189453125, 0.15206146240234375, 0.169281005859375, 0.18650054931640625, 0.2037200927734375, 0.22093963623046875, 0.2381591796875, 0.25537872314453125, 0.2725982666015625, 0.28981781005859375, 0.307037353515625, 0.32425689697265625, 0.3414764404296875, 0.35869598388671875, 0.37591552734375, 0.39313507080078125, 0.4103546142578125, 0.42757415771484375, 0.444793701171875, 0.46201324462890625, 0.4792327880859375, 0.49645233154296875, 0.513671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 11.0, 7.0, 14.0, 9.0, 16.0, 30.0, 37.0, 28.0, 42.0, 42.0, 56.0, 59.0, 60.0, 62.0, 62.0, 62.0, 61.0, 61.0, 47.0, 40.0, 38.0, 32.0, 20.0, 21.0, 15.0, 17.0, 14.0, 10.0, 1.0, 7.0, 7.0, 2.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.90234375, -0.8760910034179688, -0.8498382568359375, -0.8235855102539062, -0.797332763671875, -0.7710800170898438, -0.7448272705078125, -0.7185745239257812, -0.69232177734375, -0.6660690307617188, -0.6398162841796875, -0.6135635375976562, -0.587310791015625, -0.5610580444335938, -0.5348052978515625, -0.5085525512695312, -0.4822998046875, -0.45604705810546875, -0.4297943115234375, -0.40354156494140625, -0.377288818359375, -0.35103607177734375, -0.3247833251953125, -0.29853057861328125, -0.27227783203125, -0.24602508544921875, -0.2197723388671875, -0.19351959228515625, -0.167266845703125, -0.14101409912109375, -0.1147613525390625, -0.08850860595703125, -0.062255859375, -0.03600311279296875, -0.0097503662109375, 0.01650238037109375, 0.042755126953125, 0.06900787353515625, 0.0952606201171875, 0.12151336669921875, 0.14776611328125, 0.17401885986328125, 0.2002716064453125, 0.22652435302734375, 0.252777099609375, 0.27902984619140625, 0.3052825927734375, 0.33153533935546875, 0.3577880859375, 0.38404083251953125, 0.4102935791015625, 0.43654632568359375, 0.462799072265625, 0.48905181884765625, 0.5153045654296875, 0.5415573120117188, 0.56781005859375, 0.5940628051757812, 0.6203155517578125, 0.6465682983398438, 0.672821044921875, 0.6990737915039062, 0.7253265380859375, 0.7515792846679688, 0.77783203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 9.0, 15.0, 9.0, 11.0, 35.0, 46.0, 88.0, 142.0, 238.0, 636.0, 1704.0, 6870.0, 39260.0, 380875.0, 565805.0, 42429.0, 7180.0, 1884.0, 678.0, 272.0, 133.0, 86.0, 41.0, 27.0, 17.0, 13.0, 12.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.195556640625, -0.1896343231201172, -0.18371200561523438, -0.17778968811035156, -0.17186737060546875, -0.16594505310058594, -0.16002273559570312, -0.1541004180908203, -0.1481781005859375, -0.1422557830810547, -0.13633346557617188, -0.13041114807128906, -0.12448883056640625, -0.11856651306152344, -0.11264419555664062, -0.10672187805175781, -0.100799560546875, -0.09487724304199219, -0.08895492553710938, -0.08303260803222656, -0.07711029052734375, -0.07118797302246094, -0.06526565551757812, -0.05934333801269531, -0.0534210205078125, -0.04749870300292969, -0.041576385498046875, -0.03565406799316406, -0.02973175048828125, -0.023809432983398438, -0.017887115478515625, -0.011964797973632812, -0.00604248046875, -0.0001201629638671875, 0.005802154541015625, 0.011724472045898438, 0.01764678955078125, 0.023569107055664062, 0.029491424560546875, 0.03541374206542969, 0.0413360595703125, 0.04725837707519531, 0.053180694580078125, 0.05910301208496094, 0.06502532958984375, 0.07094764709472656, 0.07686996459960938, 0.08279228210449219, 0.088714599609375, 0.09463691711425781, 0.10055923461914062, 0.10648155212402344, 0.11240386962890625, 0.11832618713378906, 0.12424850463867188, 0.1301708221435547, 0.1360931396484375, 0.1420154571533203, 0.14793777465820312, 0.15386009216308594, 0.15978240966796875, 0.16570472717285156, 0.17162704467773438, 0.1775493621826172, 0.1834716796875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 9.0, 9.0, 12.0, 17.0, 21.0, 38.0, 44.0, 49.0, 65.0, 95.0, 89.0, 98.0, 96.0, 83.0, 74.0, 40.0, 38.0, 33.0, 25.0, 8.0, 15.0, 5.0, 7.0, 5.0, 3.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.607439041137695e-05, -4.4452957808971405e-05, -4.283152520656586e-05, -4.121009260416031e-05, -3.958866000175476e-05, -3.796722739934921e-05, -3.6345794796943665e-05, -3.4724362194538116e-05, -3.310292959213257e-05, -3.148149698972702e-05, -2.9860064387321472e-05, -2.8238631784915924e-05, -2.6617199182510376e-05, -2.4995766580104828e-05, -2.337433397769928e-05, -2.175290137529373e-05, -2.0131468772888184e-05, -1.8510036170482635e-05, -1.6888603568077087e-05, -1.526717096567154e-05, -1.3645738363265991e-05, -1.2024305760860443e-05, -1.0402873158454895e-05, -8.781440556049347e-06, -7.160007953643799e-06, -5.538575351238251e-06, -3.917142748832703e-06, -2.2957101464271545e-06, -6.742775440216064e-07, 9.471550583839417e-07, 2.5685876607894897e-06, 4.190020263195038e-06, 5.811452865600586e-06, 7.432885468006134e-06, 9.054318070411682e-06, 1.067575067281723e-05, 1.2297183275222778e-05, 1.3918615877628326e-05, 1.5540048480033875e-05, 1.7161481082439423e-05, 1.878291368484497e-05, 2.040434628725052e-05, 2.2025778889656067e-05, 2.3647211492061615e-05, 2.5268644094467163e-05, 2.689007669687271e-05, 2.851150929927826e-05, 3.0132941901683807e-05, 3.1754374504089355e-05, 3.3375807106494904e-05, 3.499723970890045e-05, 3.6618672311306e-05, 3.824010491371155e-05, 3.9861537516117096e-05, 4.1482970118522644e-05, 4.310440272092819e-05, 4.472583532333374e-05, 4.634726792573929e-05, 4.7968700528144836e-05, 4.9590133130550385e-05, 5.121156573295593e-05, 5.283299833536148e-05, 5.445443093776703e-05, 5.607586354017258e-05, 5.7697296142578125e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 10.0, 4.0, 13.0, 8.0, 23.0, 48.0, 89.0, 234.0, 713.0, 3887.0, 50881.0, 906619.0, 79655.0, 5028.0, 853.0, 267.0, 92.0, 54.0, 33.0, 25.0, 9.0, 10.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28271484375, -0.27207183837890625, -0.2614288330078125, -0.25078582763671875, -0.240142822265625, -0.22949981689453125, -0.2188568115234375, -0.20821380615234375, -0.19757080078125, -0.18692779541015625, -0.1762847900390625, -0.16564178466796875, -0.154998779296875, -0.14435577392578125, -0.1337127685546875, -0.12306976318359375, -0.1124267578125, -0.10178375244140625, -0.0911407470703125, -0.08049774169921875, -0.069854736328125, -0.05921173095703125, -0.0485687255859375, -0.03792572021484375, -0.02728271484375, -0.01663970947265625, -0.0059967041015625, 0.00464630126953125, 0.015289306640625, 0.02593231201171875, 0.0365753173828125, 0.04721832275390625, 0.057861328125, 0.06850433349609375, 0.0791473388671875, 0.08979034423828125, 0.100433349609375, 0.11107635498046875, 0.1217193603515625, 0.13236236572265625, 0.14300537109375, 0.15364837646484375, 0.1642913818359375, 0.17493438720703125, 0.185577392578125, 0.19622039794921875, 0.2068634033203125, 0.21750640869140625, 0.2281494140625, 0.23879241943359375, 0.2494354248046875, 0.26007843017578125, 0.270721435546875, 0.28136444091796875, 0.2920074462890625, 0.30265045166015625, 0.31329345703125, 0.32393646240234375, 0.3345794677734375, 0.34522247314453125, 0.355865478515625, 0.36650848388671875, 0.3771514892578125, 0.38779449462890625, 0.3984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 8.0, 4.0, 12.0, 19.0, 21.0, 36.0, 49.0, 69.0, 83.0, 105.0, 104.0, 115.0, 89.0, 91.0, 44.0, 34.0, 25.0, 27.0, 20.0, 10.0, 9.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1514892578125, -0.14542007446289062, -0.13935089111328125, -0.13328170776367188, -0.1272125244140625, -0.12114334106445312, -0.11507415771484375, -0.10900497436523438, -0.102935791015625, -0.09686660766601562, -0.09079742431640625, -0.08472824096679688, -0.0786590576171875, -0.07258987426757812, -0.06652069091796875, -0.060451507568359375, -0.05438232421875, -0.048313140869140625, -0.04224395751953125, -0.036174774169921875, -0.0301055908203125, -0.024036407470703125, -0.01796722412109375, -0.011898040771484375, -0.005828857421875, 0.000240325927734375, 0.00630950927734375, 0.012378692626953125, 0.0184478759765625, 0.024517059326171875, 0.03058624267578125, 0.036655426025390625, 0.042724609375, 0.048793792724609375, 0.05486297607421875, 0.060932159423828125, 0.0670013427734375, 0.07307052612304688, 0.07913970947265625, 0.08520889282226562, 0.091278076171875, 0.09734725952148438, 0.10341644287109375, 0.10948562622070312, 0.1155548095703125, 0.12162399291992188, 0.12769317626953125, 0.13376235961914062, 0.13983154296875, 0.14590072631835938, 0.15196990966796875, 0.15803909301757812, 0.1641082763671875, 0.17017745971679688, 0.17624664306640625, 0.18231582641601562, 0.188385009765625, 0.19445419311523438, 0.20052337646484375, 0.20659255981445312, 0.2126617431640625, 0.21873092651367188, 0.22480010986328125, 0.23086929321289062, 0.2369384765625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 14.0, 18.0, 46.0, 88.0, 151.0, 271.0, 199.0, 97.0, 46.0, 29.0, 7.0, 8.0, 4.0, 5.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4549970626831055, -4.326457500457764, -4.19791841506958, -4.069378852844238, -3.9408395290374756, -3.812300205230713, -3.683760643005371, -3.5552213191986084, -3.4266819953918457, -3.298142671585083, -3.169603109359741, -3.0410637855529785, -2.912524461746216, -2.783985137939453, -2.6554455757141113, -2.5269062519073486, -2.398366689682007, -2.269827365875244, -2.1412878036499023, -2.0127484798431396, -1.884209156036377, -1.7556697130203247, -1.6271302700042725, -1.4985909461975098, -1.3700515031814575, -1.2415120601654053, -1.1129727363586426, -0.9844332933425903, -0.8558939099311829, -0.7273545265197754, -0.5988150835037231, -0.4702757000923157, -0.3417363166809082, -0.21319691836833954, -0.08465752005577087, 0.043881893157958984, 0.17242127656936646, 0.3009606599807739, 0.42950010299682617, 0.5580394864082336, 0.6865788698196411, 0.8151182532310486, 0.943657636642456, 1.0721970796585083, 1.2007365226745605, 1.3292758464813232, 1.4578152894973755, 1.5863547325134277, 1.7148940563201904, 1.8434334993362427, 1.9719728231430054, 2.1005122661590576, 2.2290515899658203, 2.357591152191162, 2.486130475997925, 2.6146697998046875, 2.7432093620300293, 2.871748685836792, 3.000288248062134, 3.1288275718688965, 3.257366895675659, 3.385906219482422, 3.5144457817077637, 3.6429851055145264, 3.771524429321289]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 8.0, 2.0, 14.0, 18.0, 17.0, 23.0, 21.0, 34.0, 32.0, 43.0, 60.0, 59.0, 80.0, 104.0, 115.0, 71.0, 70.0, 36.0, 43.0, 40.0, 29.0, 20.0, 16.0, 15.0, 11.0, 9.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6192779541015625, -4.4971842765808105, -4.375090599060059, -4.252996444702148, -4.1309027671813965, -4.0088090896606445, -3.8867154121398926, -3.7646217346191406, -3.6425278186798096, -3.5204341411590576, -3.3983402252197266, -3.2762465476989746, -3.1541528701782227, -3.0320589542388916, -2.9099652767181396, -2.7878713607788086, -2.6657776832580566, -2.5436840057373047, -2.4215900897979736, -2.2994964122772217, -2.1774024963378906, -2.0553088188171387, -1.9332151412963867, -1.8111213445663452, -1.6890275478363037, -1.5669337511062622, -1.4448399543762207, -1.3227462768554688, -1.2006524801254272, -1.0785586833953857, -0.956464946269989, -0.8343712091445923, -0.7122771739959717, -0.5901833772659302, -0.46808964014053345, -0.34599587321281433, -0.22390210628509521, -0.10180830955505371, 0.020285427570343018, 0.14237916469573975, 0.26447296142578125, 0.38656672835350037, 0.5086604952812195, 0.6307542324066162, 0.7528480291366577, 0.8749418258666992, 0.997035562992096, 1.1191293001174927, 1.2412230968475342, 1.3633168935775757, 1.4854106903076172, 1.6075043678283691, 1.7295981645584106, 1.8516919612884521, 1.973785638809204, 2.095879554748535, 2.217973232269287, 2.340066909790039, 2.46216082572937, 2.584254503250122, 2.706348419189453, 2.828442096710205, 2.950535774230957, 3.072629451751709, 3.19472336769104]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 1.0, 4.0, 2.0, 5.0, 10.0, 10.0, 15.0, 32.0, 56.0, 68.0, 125.0, 192.0, 316.0, 601.0, 984.0, 1821.0, 4340.0, 12114.0, 51170.0, 322979.0, 2020976.0, 1511338.0, 215208.0, 35854.0, 9134.0, 3465.0, 1569.0, 790.0, 394.0, 277.0, 142.0, 87.0, 61.0, 53.0, 22.0, 17.0, 14.0, 9.0, 11.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.2261962890625, -0.21910476684570312, -0.21201324462890625, -0.20492172241210938, -0.1978302001953125, -0.19073867797851562, -0.18364715576171875, -0.17655563354492188, -0.169464111328125, -0.16237258911132812, -0.15528106689453125, -0.14818954467773438, -0.1410980224609375, -0.13400650024414062, -0.12691497802734375, -0.11982345581054688, -0.11273193359375, -0.10564041137695312, -0.09854888916015625, -0.09145736694335938, -0.0843658447265625, -0.07727432250976562, -0.07018280029296875, -0.06309127807617188, -0.055999755859375, -0.048908233642578125, -0.04181671142578125, -0.034725189208984375, -0.0276336669921875, -0.020542144775390625, -0.01345062255859375, -0.006359100341796875, 0.000732421875, 0.007823944091796875, 0.01491546630859375, 0.022006988525390625, 0.0290985107421875, 0.036190032958984375, 0.04328155517578125, 0.050373077392578125, 0.057464599609375, 0.06455612182617188, 0.07164764404296875, 0.07873916625976562, 0.0858306884765625, 0.09292221069335938, 0.10001373291015625, 0.10710525512695312, 0.11419677734375, 0.12128829956054688, 0.12837982177734375, 0.13547134399414062, 0.1425628662109375, 0.14965438842773438, 0.15674591064453125, 0.16383743286132812, 0.170928955078125, 0.17802047729492188, 0.18511199951171875, 0.19220352172851562, 0.1992950439453125, 0.20638656616210938, 0.21347808837890625, 0.22056961059570312, 0.2276611328125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 5.0, 14.0, 12.0, 11.0, 8.0, 16.0, 13.0, 19.0, 23.0, 40.0, 30.0, 56.0, 40.0, 45.0, 49.0, 41.0, 53.0, 51.0, 49.0, 49.0, 42.0, 51.0, 26.0, 43.0, 33.0, 33.0, 17.0, 16.0, 21.0, 16.0, 13.0, 13.0, 11.0, 6.0, 3.0, 10.0, 2.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1588134765625, -0.15280532836914062, -0.14679718017578125, -0.14078903198242188, -0.1347808837890625, -0.12877273559570312, -0.12276458740234375, -0.11675643920898438, -0.110748291015625, -0.10474014282226562, -0.09873199462890625, -0.09272384643554688, -0.0867156982421875, -0.08070755004882812, -0.07469940185546875, -0.06869125366210938, -0.06268310546875, -0.056674957275390625, -0.05066680908203125, -0.044658660888671875, -0.0386505126953125, -0.032642364501953125, -0.02663421630859375, -0.020626068115234375, -0.014617919921875, -0.008609771728515625, -0.00260162353515625, 0.003406524658203125, 0.0094146728515625, 0.015422821044921875, 0.02143096923828125, 0.027439117431640625, 0.033447265625, 0.039455413818359375, 0.04546356201171875, 0.051471710205078125, 0.0574798583984375, 0.06348800659179688, 0.06949615478515625, 0.07550430297851562, 0.081512451171875, 0.08752059936523438, 0.09352874755859375, 0.09953689575195312, 0.1055450439453125, 0.11155319213867188, 0.11756134033203125, 0.12356948852539062, 0.12957763671875, 0.13558578491210938, 0.14159393310546875, 0.14760208129882812, 0.1536102294921875, 0.15961837768554688, 0.16562652587890625, 0.17163467407226562, 0.177642822265625, 0.18365097045898438, 0.18965911865234375, 0.19566726684570312, 0.2016754150390625, 0.20768356323242188, 0.21369171142578125, 0.21969985961914062, 0.2257080078125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 12.0, 12.0, 14.0, 25.0, 39.0, 69.0, 125.0, 278.0, 616.0, 1696.0, 7777.0, 80966.0, 3441166.0, 632076.0, 23806.0, 3694.0, 996.0, 398.0, 193.0, 129.0, 61.0, 43.0, 26.0, 13.0, 12.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59130859375, -0.5747756958007812, -0.5582427978515625, -0.5417098999023438, -0.525177001953125, -0.5086441040039062, -0.4921112060546875, -0.47557830810546875, -0.45904541015625, -0.44251251220703125, -0.4259796142578125, -0.40944671630859375, -0.392913818359375, -0.37638092041015625, -0.3598480224609375, -0.34331512451171875, -0.3267822265625, -0.31024932861328125, -0.2937164306640625, -0.27718353271484375, -0.260650634765625, -0.24411773681640625, -0.2275848388671875, -0.21105194091796875, -0.19451904296875, -0.17798614501953125, -0.1614532470703125, -0.14492034912109375, -0.128387451171875, -0.11185455322265625, -0.0953216552734375, -0.07878875732421875, -0.062255859375, -0.04572296142578125, -0.0291900634765625, -0.01265716552734375, 0.003875732421875, 0.02040863037109375, 0.0369415283203125, 0.05347442626953125, 0.07000732421875, 0.08654022216796875, 0.1030731201171875, 0.11960601806640625, 0.136138916015625, 0.15267181396484375, 0.1692047119140625, 0.18573760986328125, 0.2022705078125, 0.21880340576171875, 0.2353363037109375, 0.25186920166015625, 0.268402099609375, 0.28493499755859375, 0.3014678955078125, 0.31800079345703125, 0.33453369140625, 0.35106658935546875, 0.3675994873046875, 0.38413238525390625, 0.400665283203125, 0.41719818115234375, 0.4337310791015625, 0.45026397705078125, 0.466796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 7.0, 8.0, 22.0, 24.0, 39.0, 64.0, 141.0, 288.0, 503.0, 861.0, 940.0, 557.0, 255.0, 145.0, 79.0, 42.0, 45.0, 19.0, 16.0, 4.0, 4.0, 9.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400146484375, -0.3841590881347656, -0.36817169189453125, -0.3521842956542969, -0.3361968994140625, -0.3202095031738281, -0.30422210693359375, -0.2882347106933594, -0.272247314453125, -0.2562599182128906, -0.24027252197265625, -0.22428512573242188, -0.2082977294921875, -0.19231033325195312, -0.17632293701171875, -0.16033554077148438, -0.14434814453125, -0.12836074829101562, -0.11237335205078125, -0.09638595581054688, -0.0803985595703125, -0.06441116333007812, -0.04842376708984375, -0.032436370849609375, -0.016448974609375, -0.000461578369140625, 0.01552581787109375, 0.031513214111328125, 0.0475006103515625, 0.06348800659179688, 0.07947540283203125, 0.09546279907226562, 0.1114501953125, 0.12743759155273438, 0.14342498779296875, 0.15941238403320312, 0.1753997802734375, 0.19138717651367188, 0.20737457275390625, 0.22336196899414062, 0.239349365234375, 0.2553367614746094, 0.27132415771484375, 0.2873115539550781, 0.3032989501953125, 0.3192863464355469, 0.33527374267578125, 0.3512611389160156, 0.36724853515625, 0.3832359313964844, 0.39922332763671875, 0.4152107238769531, 0.4311981201171875, 0.4471855163574219, 0.46317291259765625, 0.4791603088378906, 0.495147705078125, 0.5111351013183594, 0.5271224975585938, 0.5431098937988281, 0.5590972900390625, 0.5750846862792969, 0.5910720825195312, 0.6070594787597656, 0.623046875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 11.0, 18.0, 69.0, 147.0, 260.0, 263.0, 114.0, 64.0, 32.0, 15.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.004892349243164, -5.853524684906006, -5.702157497406006, -5.550789833068848, -5.399422645568848, -5.2480549812316895, -5.096687316894531, -4.945320129394531, -4.793952465057373, -4.642584800720215, -4.491217613220215, -4.339849948883057, -4.188482761383057, -4.037115097045898, -3.8857476711273193, -3.7343802452087402, -3.583012819290161, -3.431645393371582, -3.280277967453003, -3.128910541534424, -2.9775428771972656, -2.8261754512786865, -2.6748080253601074, -2.523440361022949, -2.372073173522949, -2.22070574760437, -2.069338321685791, -1.9179707765579224, -1.7666032314300537, -1.6152358055114746, -1.4638683795928955, -1.3125008344650269, -1.1611332893371582, -1.009765863418579, -0.8583983182907104, -0.7070308923721313, -0.5556634068489075, -0.4042959213256836, -0.2529284954071045, -0.10156095027923584, 0.04980647563934326, 0.20117394626140594, 0.35254141688346863, 0.5039088726043701, 0.655276358127594, 0.8066438436508179, 0.958011269569397, 1.1093788146972656, 1.2607462406158447, 1.4121136665344238, 1.5634812116622925, 1.7148486375808716, 1.8662161827087402, 2.0175836086273193, 2.1689510345458984, 2.3203186988830566, 2.4716858863830566, 2.6230533123016357, 2.774420738220215, 2.925788402557373, 3.077155828475952, 3.2285232543945312, 3.3798906803131104, 3.5312581062316895, 3.6826257705688477]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 11.0, 13.0, 14.0, 18.0, 20.0, 34.0, 37.0, 29.0, 46.0, 50.0, 41.0, 64.0, 49.0, 50.0, 65.0, 60.0, 60.0, 48.0, 48.0, 40.0, 40.0, 30.0, 23.0, 19.0, 13.0, 13.0, 9.0, 12.0, 5.0, 9.0, 4.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5020151138305664, -1.4444628953933716, -1.3869106769561768, -1.3293583393096924, -1.2718061208724976, -1.2142539024353027, -1.156701683998108, -1.099149465560913, -1.0415971279144287, -0.9840449094772339, -0.9264926314353943, -0.8689404129981995, -0.8113881349563599, -0.753835916519165, -0.6962836980819702, -0.6387314200401306, -0.5811792016029358, -0.523626983165741, -0.46607470512390137, -0.40852248668670654, -0.35097020864486694, -0.2934179902076721, -0.2358657419681549, -0.1783134937286377, -0.12076124548912048, -0.06320899724960327, -0.0056567564606666565, 0.05189548432826996, 0.10944773256778717, 0.1669999659061432, 0.2245522141456604, 0.2821044623851776, 0.3396567106246948, 0.39720895886421204, 0.45476120710372925, 0.5123134255409241, 0.5698657035827637, 0.6274179220199585, 0.6849701404571533, 0.7425224184989929, 0.8000746965408325, 0.8576269149780273, 0.9151791930198669, 0.9727314114570618, 1.0302836894989014, 1.0878359079360962, 1.145388126373291, 1.2029404640197754, 1.2604925632476807, 1.3180447816848755, 1.3755970001220703, 1.4331493377685547, 1.4907015562057495, 1.5482537746429443, 1.6058059930801392, 1.663358211517334, 1.7209105491638184, 1.7784627676010132, 1.836014986038208, 1.8935673236846924, 1.9511195421218872, 2.008671760559082, 2.0662240982055664, 2.1237761974334717, 2.181328535079956]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 11.0, 25.0, 44.0, 88.0, 168.0, 433.0, 1176.0, 4394.0, 22638.0, 166375.0, 652224.0, 171126.0, 23301.0, 4535.0, 1201.0, 448.0, 176.0, 80.0, 61.0, 17.0, 12.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3798828125, -0.361358642578125, -0.34283447265625, -0.324310302734375, -0.3057861328125, -0.287261962890625, -0.26873779296875, -0.250213623046875, -0.231689453125, -0.213165283203125, -0.19464111328125, -0.176116943359375, -0.1575927734375, -0.139068603515625, -0.12054443359375, -0.102020263671875, -0.08349609375, -0.064971923828125, -0.04644775390625, -0.027923583984375, -0.0093994140625, 0.009124755859375, 0.02764892578125, 0.046173095703125, 0.064697265625, 0.083221435546875, 0.10174560546875, 0.120269775390625, 0.1387939453125, 0.157318115234375, 0.17584228515625, 0.194366455078125, 0.212890625, 0.231414794921875, 0.24993896484375, 0.268463134765625, 0.2869873046875, 0.305511474609375, 0.32403564453125, 0.342559814453125, 0.361083984375, 0.379608154296875, 0.39813232421875, 0.416656494140625, 0.4351806640625, 0.453704833984375, 0.47222900390625, 0.490753173828125, 0.50927734375, 0.527801513671875, 0.54632568359375, 0.564849853515625, 0.5833740234375, 0.601898193359375, 0.62042236328125, 0.638946533203125, 0.657470703125, 0.675994873046875, 0.69451904296875, 0.713043212890625, 0.7315673828125, 0.750091552734375, 0.76861572265625, 0.787139892578125, 0.8056640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 5.0, 13.0, 11.0, 17.0, 11.0, 18.0, 20.0, 24.0, 40.0, 61.0, 46.0, 49.0, 43.0, 35.0, 55.0, 39.0, 61.0, 38.0, 51.0, 51.0, 38.0, 35.0, 38.0, 28.0, 30.0, 22.0, 19.0, 17.0, 15.0, 10.0, 10.0, 11.0, 8.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.196044921875, -0.1895313262939453, -0.18301773071289062, -0.17650413513183594, -0.16999053955078125, -0.16347694396972656, -0.15696334838867188, -0.1504497528076172, -0.1439361572265625, -0.1374225616455078, -0.13090896606445312, -0.12439537048339844, -0.11788177490234375, -0.11136817932128906, -0.10485458374023438, -0.09834098815917969, -0.091827392578125, -0.08531379699707031, -0.07880020141601562, -0.07228660583496094, -0.06577301025390625, -0.05925941467285156, -0.052745819091796875, -0.04623222351074219, -0.0397186279296875, -0.03320503234863281, -0.026691436767578125, -0.020177841186523438, -0.01366424560546875, -0.0071506500244140625, -0.000637054443359375, 0.0058765411376953125, 0.01239013671875, 0.018903732299804688, 0.025417327880859375, 0.03193092346191406, 0.03844451904296875, 0.04495811462402344, 0.051471710205078125, 0.05798530578613281, 0.0644989013671875, 0.07101249694824219, 0.07752609252929688, 0.08403968811035156, 0.09055328369140625, 0.09706687927246094, 0.10358047485351562, 0.11009407043457031, 0.116607666015625, 0.12312126159667969, 0.12963485717773438, 0.13614845275878906, 0.14266204833984375, 0.14917564392089844, 0.15568923950195312, 0.1622028350830078, 0.1687164306640625, 0.1752300262451172, 0.18174362182617188, 0.18825721740722656, 0.19477081298828125, 0.20128440856933594, 0.20779800415039062, 0.2143115997314453, 0.2208251953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 8.0, 9.0, 10.0, 11.0, 16.0, 22.0, 25.0, 38.0, 67.0, 76.0, 100.0, 125.0, 211.0, 300.0, 443.0, 734.0, 1265.0, 3076.0, 9974.0, 45894.0, 287425.0, 607616.0, 69895.0, 13635.0, 3777.0, 1546.0, 753.0, 440.0, 313.0, 202.0, 161.0, 111.0, 70.0, 49.0, 38.0, 27.0, 23.0, 18.0, 17.0, 3.0, 4.0, 5.0, 3.0, 5.0, 6.0, 2.0, 5.0, 0.0, 0.0, 3.0, 1.0, 3.0], "bins": [-0.492431640625, -0.47756195068359375, -0.4626922607421875, -0.44782257080078125, -0.432952880859375, -0.41808319091796875, -0.4032135009765625, -0.38834381103515625, -0.37347412109375, -0.35860443115234375, -0.3437347412109375, -0.32886505126953125, -0.313995361328125, -0.29912567138671875, -0.2842559814453125, -0.26938629150390625, -0.2545166015625, -0.23964691162109375, -0.2247772216796875, -0.20990753173828125, -0.195037841796875, -0.18016815185546875, -0.1652984619140625, -0.15042877197265625, -0.13555908203125, -0.12068939208984375, -0.1058197021484375, -0.09095001220703125, -0.076080322265625, -0.06121063232421875, -0.0463409423828125, -0.03147125244140625, -0.0166015625, -0.00173187255859375, 0.0131378173828125, 0.02800750732421875, 0.042877197265625, 0.05774688720703125, 0.0726165771484375, 0.08748626708984375, 0.10235595703125, 0.11722564697265625, 0.1320953369140625, 0.14696502685546875, 0.161834716796875, 0.17670440673828125, 0.1915740966796875, 0.20644378662109375, 0.2213134765625, 0.23618316650390625, 0.2510528564453125, 0.26592254638671875, 0.280792236328125, 0.29566192626953125, 0.3105316162109375, 0.32540130615234375, 0.34027099609375, 0.35514068603515625, 0.3700103759765625, 0.38488006591796875, 0.399749755859375, 0.41461944580078125, 0.4294891357421875, 0.44435882568359375, 0.459228515625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 9.0, 12.0, 13.0, 14.0, 20.0, 34.0, 27.0, 25.0, 36.0, 44.0, 36.0, 41.0, 59.0, 55.0, 61.0, 56.0, 57.0, 45.0, 58.0, 54.0, 47.0, 29.0, 27.0, 20.0, 24.0, 22.0, 10.0, 9.0, 12.0, 10.0, 8.0, 5.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.9697265625, -0.9449844360351562, -0.9202423095703125, -0.8955001831054688, -0.870758056640625, -0.8460159301757812, -0.8212738037109375, -0.7965316772460938, -0.77178955078125, -0.7470474243164062, -0.7223052978515625, -0.6975631713867188, -0.672821044921875, -0.6480789184570312, -0.6233367919921875, -0.5985946655273438, -0.5738525390625, -0.5491104125976562, -0.5243682861328125, -0.49962615966796875, -0.474884033203125, -0.45014190673828125, -0.4253997802734375, -0.40065765380859375, -0.37591552734375, -0.35117340087890625, -0.3264312744140625, -0.30168914794921875, -0.276947021484375, -0.25220489501953125, -0.2274627685546875, -0.20272064208984375, -0.177978515625, -0.15323638916015625, -0.1284942626953125, -0.10375213623046875, -0.079010009765625, -0.05426788330078125, -0.0295257568359375, -0.00478363037109375, 0.01995849609375, 0.04470062255859375, 0.0694427490234375, 0.09418487548828125, 0.118927001953125, 0.14366912841796875, 0.1684112548828125, 0.19315338134765625, 0.2178955078125, 0.24263763427734375, 0.2673797607421875, 0.29212188720703125, 0.316864013671875, 0.34160614013671875, 0.3663482666015625, 0.39109039306640625, 0.41583251953125, 0.44057464599609375, 0.4653167724609375, 0.49005889892578125, 0.514801025390625, 0.5395431518554688, 0.5642852783203125, 0.5890274047851562, 0.61376953125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 7.0, 5.0, 17.0, 19.0, 25.0, 30.0, 54.0, 101.0, 175.0, 383.0, 698.0, 1858.0, 5313.0, 19472.0, 97365.0, 755584.0, 133170.0, 23898.0, 6396.0, 2199.0, 874.0, 395.0, 190.0, 127.0, 55.0, 43.0, 21.0, 20.0, 12.0, 7.0, 10.0, 6.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1561279296875, -0.15102195739746094, -0.14591598510742188, -0.1408100128173828, -0.13570404052734375, -0.1305980682373047, -0.12549209594726562, -0.12038612365722656, -0.1152801513671875, -0.11017417907714844, -0.10506820678710938, -0.09996223449707031, -0.09485626220703125, -0.08975028991699219, -0.08464431762695312, -0.07953834533691406, -0.074432373046875, -0.06932640075683594, -0.06422042846679688, -0.05911445617675781, -0.05400848388671875, -0.04890251159667969, -0.043796539306640625, -0.03869056701660156, -0.0335845947265625, -0.028478622436523438, -0.023372650146484375, -0.018266677856445312, -0.01316070556640625, -0.008054733276367188, -0.002948760986328125, 0.0021572113037109375, 0.00726318359375, 0.012369155883789062, 0.017475128173828125, 0.022581100463867188, 0.02768707275390625, 0.03279304504394531, 0.037899017333984375, 0.04300498962402344, 0.0481109619140625, 0.05321693420410156, 0.058322906494140625, 0.06342887878417969, 0.06853485107421875, 0.07364082336425781, 0.07874679565429688, 0.08385276794433594, 0.088958740234375, 0.09406471252441406, 0.09917068481445312, 0.10427665710449219, 0.10938262939453125, 0.11448860168457031, 0.11959457397460938, 0.12470054626464844, 0.1298065185546875, 0.13491249084472656, 0.14001846313476562, 0.1451244354248047, 0.15023040771484375, 0.1553363800048828, 0.16044235229492188, 0.16554832458496094, 0.170654296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 2.0, 5.0, 6.0, 7.0, 9.0, 18.0, 9.0, 15.0, 21.0, 31.0, 30.0, 27.0, 46.0, 59.0, 78.0, 79.0, 104.0, 97.0, 62.0, 59.0, 49.0, 41.0, 22.0, 30.0, 13.0, 16.0, 13.0, 12.0, 10.0, 6.0, 7.0, 9.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.790855407714844e-05, -3.657303750514984e-05, -3.5237520933151245e-05, -3.390200436115265e-05, -3.256648778915405e-05, -3.1230971217155457e-05, -2.989545464515686e-05, -2.8559938073158264e-05, -2.7224421501159668e-05, -2.5888904929161072e-05, -2.4553388357162476e-05, -2.321787178516388e-05, -2.1882355213165283e-05, -2.0546838641166687e-05, -1.921132206916809e-05, -1.7875805497169495e-05, -1.65402889251709e-05, -1.5204772353172302e-05, -1.3869255781173706e-05, -1.253373920917511e-05, -1.1198222637176514e-05, -9.862706065177917e-06, -8.527189493179321e-06, -7.191672921180725e-06, -5.856156349182129e-06, -4.520639777183533e-06, -3.1851232051849365e-06, -1.8496066331863403e-06, -5.140900611877441e-07, 8.21426510810852e-07, 2.1569430828094482e-06, 3.4924596548080444e-06, 4.827976226806641e-06, 6.163492798805237e-06, 7.499009370803833e-06, 8.83452594280243e-06, 1.0170042514801025e-05, 1.1505559086799622e-05, 1.2841075658798218e-05, 1.4176592230796814e-05, 1.551210880279541e-05, 1.6847625374794006e-05, 1.8183141946792603e-05, 1.95186585187912e-05, 2.0854175090789795e-05, 2.218969166278839e-05, 2.3525208234786987e-05, 2.4860724806785583e-05, 2.619624137878418e-05, 2.7531757950782776e-05, 2.8867274522781372e-05, 3.0202791094779968e-05, 3.1538307666778564e-05, 3.287382423877716e-05, 3.420934081077576e-05, 3.554485738277435e-05, 3.688037395477295e-05, 3.8215890526771545e-05, 3.955140709877014e-05, 4.088692367076874e-05, 4.2222440242767334e-05, 4.355795681476593e-05, 4.4893473386764526e-05, 4.622898995876312e-05, 4.756450653076172e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 9.0, 5.0, 8.0, 25.0, 34.0, 43.0, 58.0, 131.0, 220.0, 466.0, 746.0, 1775.0, 4897.0, 16905.0, 77418.0, 684306.0, 210685.0, 36188.0, 8986.0, 3062.0, 1212.0, 587.0, 310.0, 174.0, 105.0, 66.0, 41.0, 21.0, 23.0, 17.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.141357421875, -0.1367626190185547, -0.13216781616210938, -0.12757301330566406, -0.12297821044921875, -0.11838340759277344, -0.11378860473632812, -0.10919380187988281, -0.1045989990234375, -0.10000419616699219, -0.09540939331054688, -0.09081459045410156, -0.08621978759765625, -0.08162498474121094, -0.07703018188476562, -0.07243537902832031, -0.067840576171875, -0.06324577331542969, -0.058650970458984375, -0.05405616760253906, -0.04946136474609375, -0.04486656188964844, -0.040271759033203125, -0.03567695617675781, -0.0310821533203125, -0.026487350463867188, -0.021892547607421875, -0.017297744750976562, -0.01270294189453125, -0.008108139038085938, -0.003513336181640625, 0.0010814666748046875, 0.00567626953125, 0.010271072387695312, 0.014865875244140625, 0.019460678100585938, 0.02405548095703125, 0.028650283813476562, 0.033245086669921875, 0.03783988952636719, 0.0424346923828125, 0.04702949523925781, 0.051624298095703125, 0.05621910095214844, 0.06081390380859375, 0.06540870666503906, 0.07000350952148438, 0.07459831237792969, 0.079193115234375, 0.08378791809082031, 0.08838272094726562, 0.09297752380371094, 0.09757232666015625, 0.10216712951660156, 0.10676193237304688, 0.11135673522949219, 0.1159515380859375, 0.12054634094238281, 0.12514114379882812, 0.12973594665527344, 0.13433074951171875, 0.13892555236816406, 0.14352035522460938, 0.1481151580810547, 0.1527099609375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 7.0, 6.0, 11.0, 12.0, 17.0, 25.0, 26.0, 36.0, 43.0, 57.0, 81.0, 97.0, 103.0, 93.0, 67.0, 84.0, 51.0, 29.0, 43.0, 16.0, 14.0, 15.0, 11.0, 11.0, 5.0, 5.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.142578125, -0.13804054260253906, -0.13350296020507812, -0.1289653778076172, -0.12442779541015625, -0.11989021301269531, -0.11535263061523438, -0.11081504821777344, -0.1062774658203125, -0.10173988342285156, -0.09720230102539062, -0.09266471862792969, -0.08812713623046875, -0.08358955383300781, -0.07905197143554688, -0.07451438903808594, -0.069976806640625, -0.06543922424316406, -0.060901641845703125, -0.05636405944824219, -0.05182647705078125, -0.04728889465332031, -0.042751312255859375, -0.03821372985839844, -0.0336761474609375, -0.029138565063476562, -0.024600982666015625, -0.020063400268554688, -0.01552581787109375, -0.010988235473632812, -0.006450653076171875, -0.0019130706787109375, 0.00262451171875, 0.0071620941162109375, 0.011699676513671875, 0.016237258911132812, 0.02077484130859375, 0.025312423706054688, 0.029850006103515625, 0.03438758850097656, 0.0389251708984375, 0.04346275329589844, 0.048000335693359375, 0.05253791809082031, 0.05707550048828125, 0.06161308288574219, 0.06615066528320312, 0.07068824768066406, 0.075225830078125, 0.07976341247558594, 0.08430099487304688, 0.08883857727050781, 0.09337615966796875, 0.09791374206542969, 0.10245132446289062, 0.10698890686035156, 0.1115264892578125, 0.11606407165527344, 0.12060165405273438, 0.1251392364501953, 0.12967681884765625, 0.1342144012451172, 0.13875198364257812, 0.14328956604003906, 0.1478271484375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 9.0, 17.0, 36.0, 53.0, 80.0, 135.0, 299.0, 134.0, 79.0, 55.0, 34.0, 21.0, 9.0, 9.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.667967677116394, -1.5528870820999146, -1.437806487083435, -1.322725772857666, -1.2076451778411865, -1.092564582824707, -0.9774839878082275, -0.862403392791748, -0.7473227977752686, -0.6322422027587891, -0.5171616077423096, -0.4020809531211853, -0.2870003581047058, -0.17191976308822632, -0.05683910846710205, 0.05824148654937744, 0.17332208156585693, 0.2884026765823364, 0.4034833014011383, 0.5185639262199402, 0.6336445212364197, 0.7487251162528992, 0.8638057708740234, 0.9788863658905029, 1.0939669609069824, 1.209047555923462, 1.3241281509399414, 1.439208745956421, 1.5542893409729004, 1.6693699359893799, 1.784450650215149, 1.8995312452316284, 2.0146117210388184, 2.129692316055298, 2.2447729110717773, 2.359853506088257, 2.4749341011047363, 2.590014696121216, 2.7050952911376953, 2.820176124572754, 2.9352564811706543, 3.050337076187134, 3.1654176712036133, 3.2804982662200928, 3.3955788612365723, 3.5106594562530518, 3.6257400512695312, 3.74082088470459, 3.8559014797210693, 3.970982074737549, 4.086062908172607, 4.201143264770508, 4.316224098205566, 4.431304454803467, 4.546385288238525, 4.661465644836426, 4.776546478271484, 4.891627311706543, 5.006707668304443, 5.121788501739502, 5.236868858337402, 5.351949691772461, 5.467030048370361, 5.58211088180542, 5.69719123840332]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 6.0, 9.0, 15.0, 11.0, 17.0, 20.0, 22.0, 21.0, 33.0, 30.0, 28.0, 36.0, 55.0, 71.0, 117.0, 100.0, 75.0, 55.0, 38.0, 39.0, 26.0, 23.0, 28.0, 18.0, 18.0, 12.0, 19.0, 18.0, 8.0, 4.0, 6.0, 3.0, 8.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.255918502807617, -3.162818670272827, -3.069719076156616, -2.976619243621826, -2.8835196495056152, -2.790419816970825, -2.697319984436035, -2.604220390319824, -2.5111207962036133, -2.4180209636688232, -2.3249213695526123, -2.2318215370178223, -2.1387219429016113, -2.0456221103668213, -1.9525223970413208, -1.8594226837158203, -1.7663228511810303, -1.6732231378555298, -1.5801234245300293, -1.4870235919952393, -1.3939239978790283, -1.3008241653442383, -1.2077244520187378, -1.1146247386932373, -1.0215250253677368, -0.9284253120422363, -0.8353255987167358, -0.7422258257865906, -0.6491261124610901, -0.5560263991355896, -0.46292662620544434, -0.36982691287994385, -0.27672719955444336, -0.18362747132778168, -0.09052774310112, 0.002572000026702881, 0.09567171335220337, 0.18877142667770386, 0.2818711996078491, 0.3749709129333496, 0.4680706262588501, 0.5611703395843506, 0.6542700529098511, 0.7473698258399963, 0.8404695391654968, 0.9335692524909973, 1.0266690254211426, 1.119768738746643, 1.2128684520721436, 1.305968165397644, 1.3990678787231445, 1.4921677112579346, 1.5852673053741455, 1.6783671379089355, 1.771466851234436, 1.8645665645599365, 1.957666277885437, 2.0507659912109375, 2.1438658237457275, 2.2369654178619385, 2.3300652503967285, 2.4231648445129395, 2.5162646770477295, 2.6093645095825195, 2.7024641036987305]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 20.0, 27.0, 63.0, 100.0, 199.0, 404.0, 905.0, 2325.0, 7695.0, 46829.0, 582114.0, 2893537.0, 600060.0, 48367.0, 7695.0, 2201.0, 863.0, 406.0, 174.0, 114.0, 69.0, 33.0, 22.0, 18.0, 7.0, 5.0, 7.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.43359375, -0.42314720153808594, -0.4127006530761719, -0.4022541046142578, -0.39180755615234375, -0.3813610076904297, -0.3709144592285156, -0.36046791076660156, -0.3500213623046875, -0.33957481384277344, -0.3291282653808594, -0.3186817169189453, -0.30823516845703125, -0.2977886199951172, -0.2873420715332031, -0.27689552307128906, -0.266448974609375, -0.25600242614746094, -0.24555587768554688, -0.2351093292236328, -0.22466278076171875, -0.2142162322998047, -0.20376968383789062, -0.19332313537597656, -0.1828765869140625, -0.17243003845214844, -0.16198348999023438, -0.1515369415283203, -0.14109039306640625, -0.1306438446044922, -0.12019729614257812, -0.10975074768066406, -0.09930419921875, -0.08885765075683594, -0.07841110229492188, -0.06796455383300781, -0.05751800537109375, -0.04707145690917969, -0.036624908447265625, -0.026178359985351562, -0.0157318115234375, -0.0052852630615234375, 0.005161285400390625, 0.015607833862304688, 0.02605438232421875, 0.03650093078613281, 0.046947479248046875, 0.05739402770996094, 0.067840576171875, 0.07828712463378906, 0.08873367309570312, 0.09918022155761719, 0.10962677001953125, 0.12007331848144531, 0.13051986694335938, 0.14096641540527344, 0.1514129638671875, 0.16185951232910156, 0.17230606079101562, 0.1827526092529297, 0.19319915771484375, 0.2036457061767578, 0.21409225463867188, 0.22453880310058594, 0.2349853515625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 11.0, 13.0, 11.0, 13.0, 18.0, 23.0, 37.0, 38.0, 51.0, 45.0, 53.0, 39.0, 41.0, 49.0, 54.0, 37.0, 49.0, 44.0, 56.0, 53.0, 42.0, 33.0, 39.0, 27.0, 25.0, 13.0, 21.0, 14.0, 10.0, 10.0, 10.0, 1.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.208984375, -0.20225143432617188, -0.19551849365234375, -0.18878555297851562, -0.1820526123046875, -0.17531967163085938, -0.16858673095703125, -0.16185379028320312, -0.155120849609375, -0.14838790893554688, -0.14165496826171875, -0.13492202758789062, -0.1281890869140625, -0.12145614624023438, -0.11472320556640625, -0.10799026489257812, -0.10125732421875, -0.09452438354492188, -0.08779144287109375, -0.08105850219726562, -0.0743255615234375, -0.06759262084960938, -0.06085968017578125, -0.054126739501953125, -0.047393798828125, -0.040660858154296875, -0.03392791748046875, -0.027194976806640625, -0.0204620361328125, -0.013729095458984375, -0.00699615478515625, -0.000263214111328125, 0.0064697265625, 0.013202667236328125, 0.01993560791015625, 0.026668548583984375, 0.0334014892578125, 0.040134429931640625, 0.04686737060546875, 0.053600311279296875, 0.060333251953125, 0.06706619262695312, 0.07379913330078125, 0.08053207397460938, 0.0872650146484375, 0.09399795532226562, 0.10073089599609375, 0.10746383666992188, 0.11419677734375, 0.12092971801757812, 0.12766265869140625, 0.13439559936523438, 0.1411285400390625, 0.14786148071289062, 0.15459442138671875, 0.16132736206054688, 0.168060302734375, 0.17479324340820312, 0.18152618408203125, 0.18825912475585938, 0.1949920654296875, 0.20172500610351562, 0.20845794677734375, 0.21519088745117188, 0.221923828125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 13.0, 11.0, 14.0, 16.0, 47.0, 82.0, 176.0, 360.0, 1252.0, 8411.0, 384872.0, 3760117.0, 35130.0, 2681.0, 585.0, 250.0, 125.0, 58.0, 36.0, 13.0, 14.0, 9.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0207595825195312, -0.9965972900390625, -0.9724349975585938, -0.948272705078125, -0.9241104125976562, -0.8999481201171875, -0.8757858276367188, -0.85162353515625, -0.8274612426757812, -0.8032989501953125, -0.7791366577148438, -0.754974365234375, -0.7308120727539062, -0.7066497802734375, -0.6824874877929688, -0.6583251953125, -0.6341629028320312, -0.6100006103515625, -0.5858383178710938, -0.561676025390625, -0.5375137329101562, -0.5133514404296875, -0.48918914794921875, -0.46502685546875, -0.44086456298828125, -0.4167022705078125, -0.39253997802734375, -0.368377685546875, -0.34421539306640625, -0.3200531005859375, -0.29589080810546875, -0.271728515625, -0.24756622314453125, -0.2234039306640625, -0.19924163818359375, -0.175079345703125, -0.15091705322265625, -0.1267547607421875, -0.10259246826171875, -0.07843017578125, -0.05426788330078125, -0.0301055908203125, -0.00594329833984375, 0.018218994140625, 0.04238128662109375, 0.0665435791015625, 0.09070587158203125, 0.1148681640625, 0.13903045654296875, 0.1631927490234375, 0.18735504150390625, 0.211517333984375, 0.23567962646484375, 0.2598419189453125, 0.28400421142578125, 0.30816650390625, 0.33232879638671875, 0.3564910888671875, 0.38065338134765625, 0.404815673828125, 0.42897796630859375, 0.4531402587890625, 0.47730255126953125, 0.50146484375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 9.0, 4.0, 6.0, 19.0, 18.0, 25.0, 39.0, 96.0, 150.0, 275.0, 495.0, 788.0, 812.0, 603.0, 328.0, 196.0, 84.0, 55.0, 24.0, 17.0, 14.0, 12.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.751953125, -0.7349205017089844, -0.7178878784179688, -0.7008552551269531, -0.6838226318359375, -0.6667900085449219, -0.6497573852539062, -0.6327247619628906, -0.615692138671875, -0.5986595153808594, -0.5816268920898438, -0.5645942687988281, -0.5475616455078125, -0.5305290222167969, -0.5134963989257812, -0.4964637756347656, -0.47943115234375, -0.4623985290527344, -0.44536590576171875, -0.4283332824707031, -0.4113006591796875, -0.3942680358886719, -0.37723541259765625, -0.3602027893066406, -0.343170166015625, -0.3261375427246094, -0.30910491943359375, -0.2920722961425781, -0.2750396728515625, -0.2580070495605469, -0.24097442626953125, -0.22394180297851562, -0.2069091796875, -0.18987655639648438, -0.17284393310546875, -0.15581130981445312, -0.1387786865234375, -0.12174606323242188, -0.10471343994140625, -0.08768081665039062, -0.070648193359375, -0.053615570068359375, -0.03658294677734375, -0.019550323486328125, -0.0025177001953125, 0.014514923095703125, 0.03154754638671875, 0.048580169677734375, 0.06561279296875, 0.08264541625976562, 0.09967803955078125, 0.11671066284179688, 0.1337432861328125, 0.15077590942382812, 0.16780853271484375, 0.18484115600585938, 0.201873779296875, 0.21890640258789062, 0.23593902587890625, 0.2529716491699219, 0.2700042724609375, 0.2870368957519531, 0.30406951904296875, 0.3211021423339844, 0.338134765625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 16.0, 32.0, 99.0, 271.0, 339.0, 158.0, 50.0, 18.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.036361694335938, -7.841573238372803, -7.646785259246826, -7.451996803283691, -7.257208824157715, -7.06242036819458, -6.867631912231445, -6.672843933105469, -6.478055953979492, -6.283267498016357, -6.088479518890381, -5.893691062927246, -5.6989030838012695, -5.504114627838135, -5.309326171875, -5.114538192749023, -4.919749736785889, -4.724961280822754, -4.530173301696777, -4.335384845733643, -4.140596866607666, -3.9458084106445312, -3.7510201930999756, -3.55623197555542, -3.3614437580108643, -3.1666555404663086, -2.971867322921753, -2.7770791053771973, -2.5822906494140625, -2.387502670288086, -2.192714214324951, -1.9979259967803955, -1.8031377792358398, -1.6083495616912842, -1.4135613441467285, -1.2187730073928833, -1.0239847898483276, -0.829196572303772, -0.6344082355499268, -0.4396200180053711, -0.24483180046081543, -0.05004355311393738, 0.14474469423294067, 0.3395329713821411, 0.5343211889266968, 0.7291094064712524, 0.9238977432250977, 1.1186859607696533, 1.313474178314209, 1.5082623958587646, 1.7030506134033203, 1.8978389501571655, 2.0926270484924316, 2.2874155044555664, 2.482203722000122, 2.6769919395446777, 2.8717801570892334, 3.066568374633789, 3.2613565921783447, 3.4561448097229004, 3.650933265686035, 3.8457212448120117, 4.0405097007751465, 4.235298156738281, 4.430086135864258]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 8.0, 6.0, 5.0, 7.0, 10.0, 7.0, 12.0, 17.0, 24.0, 19.0, 23.0, 41.0, 24.0, 32.0, 51.0, 49.0, 56.0, 66.0, 49.0, 48.0, 68.0, 66.0, 42.0, 31.0, 35.0, 30.0, 35.0, 27.0, 27.0, 23.0, 19.0, 15.0, 9.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.259957790374756, -2.196604013442993, -2.1332499980926514, -2.0698962211608887, -2.006542205810547, -1.9431883096694946, -1.8798344135284424, -1.8164806365966797, -1.753126621246338, -1.6897727251052856, -1.6264188289642334, -1.5630649328231812, -1.499711036682129, -1.4363571405410767, -1.3730032444000244, -1.3096494674682617, -1.2462955713272095, -1.1829416751861572, -1.119587779045105, -1.0562338829040527, -0.9928799867630005, -0.9295260906219482, -0.8661722540855408, -0.8028183579444885, -0.7394644618034363, -0.676110565662384, -0.6127566695213318, -0.5494028329849243, -0.4860489070415497, -0.42269501090049744, -0.3593411445617676, -0.29598724842071533, -0.23263335227966309, -0.16927945613861084, -0.10592557489871979, -0.042571693658828735, 0.02078220248222351, 0.08413609862327576, 0.14748996496200562, 0.21084386110305786, 0.2741977572441101, 0.33755165338516235, 0.4009055495262146, 0.46425941586494446, 0.5276132822036743, 0.5909671783447266, 0.6543210744857788, 0.717674970626831, 0.7810288667678833, 0.8443827629089355, 0.9077366590499878, 0.97109055519104, 1.0344444513320923, 1.0977983474731445, 1.1611521244049072, 1.224506139755249, 1.2878599166870117, 1.351213812828064, 1.4145677089691162, 1.4779216051101685, 1.5412755012512207, 1.604629397392273, 1.6679832935333252, 1.731337070465088, 1.7946910858154297]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 3.0, 6.0, 17.0, 38.0, 83.0, 255.0, 749.0, 3044.0, 17307.0, 171678.0, 744108.0, 96776.0, 11402.0, 2175.0, 596.0, 199.0, 69.0, 31.0, 10.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68017578125, -0.6553421020507812, -0.6305084228515625, -0.6056747436523438, -0.580841064453125, -0.5560073852539062, -0.5311737060546875, -0.5063400268554688, -0.48150634765625, -0.45667266845703125, -0.4318389892578125, -0.40700531005859375, -0.382171630859375, -0.35733795166015625, -0.3325042724609375, -0.30767059326171875, -0.2828369140625, -0.25800323486328125, -0.2331695556640625, -0.20833587646484375, -0.183502197265625, -0.15866851806640625, -0.1338348388671875, -0.10900115966796875, -0.08416748046875, -0.05933380126953125, -0.0345001220703125, -0.00966644287109375, 0.015167236328125, 0.04000091552734375, 0.0648345947265625, 0.08966827392578125, 0.114501953125, 0.13933563232421875, 0.1641693115234375, 0.18900299072265625, 0.213836669921875, 0.23867034912109375, 0.2635040283203125, 0.28833770751953125, 0.31317138671875, 0.33800506591796875, 0.3628387451171875, 0.38767242431640625, 0.412506103515625, 0.43733978271484375, 0.4621734619140625, 0.48700714111328125, 0.5118408203125, 0.5366744995117188, 0.5615081787109375, 0.5863418579101562, 0.611175537109375, 0.6360092163085938, 0.6608428955078125, 0.6856765747070312, 0.71051025390625, 0.7353439331054688, 0.7601776123046875, 0.7850112915039062, 0.809844970703125, 0.8346786499023438, 0.8595123291015625, 0.8843460083007812, 0.9091796875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 6.0, 6.0, 10.0, 8.0, 14.0, 13.0, 23.0, 35.0, 36.0, 38.0, 49.0, 36.0, 48.0, 51.0, 54.0, 68.0, 47.0, 44.0, 44.0, 46.0, 54.0, 43.0, 39.0, 31.0, 34.0, 20.0, 18.0, 23.0, 20.0, 11.0, 4.0, 10.0, 5.0, 4.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23046875, -0.2235698699951172, -0.21667098999023438, -0.20977210998535156, -0.20287322998046875, -0.19597434997558594, -0.18907546997070312, -0.1821765899658203, -0.1752777099609375, -0.1683788299560547, -0.16147994995117188, -0.15458106994628906, -0.14768218994140625, -0.14078330993652344, -0.13388442993164062, -0.1269855499267578, -0.120086669921875, -0.11318778991699219, -0.10628890991210938, -0.09939002990722656, -0.09249114990234375, -0.08559226989746094, -0.07869338989257812, -0.07179450988769531, -0.0648956298828125, -0.05799674987792969, -0.051097869873046875, -0.04419898986816406, -0.03730010986328125, -0.030401229858398438, -0.023502349853515625, -0.016603469848632812, -0.00970458984375, -0.0028057098388671875, 0.004093170166015625, 0.010992050170898438, 0.01789093017578125, 0.024789810180664062, 0.031688690185546875, 0.03858757019042969, 0.0454864501953125, 0.05238533020019531, 0.059284210205078125, 0.06618309020996094, 0.07308197021484375, 0.07998085021972656, 0.08687973022460938, 0.09377861022949219, 0.100677490234375, 0.10757637023925781, 0.11447525024414062, 0.12137413024902344, 0.12827301025390625, 0.13517189025878906, 0.14207077026367188, 0.1489696502685547, 0.1558685302734375, 0.1627674102783203, 0.16966629028320312, 0.17656517028808594, 0.18346405029296875, 0.19036293029785156, 0.19726181030273438, 0.2041606903076172, 0.2110595703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 9.0, 5.0, 14.0, 14.0, 15.0, 23.0, 26.0, 49.0, 60.0, 87.0, 108.0, 192.0, 251.0, 416.0, 659.0, 1210.0, 2752.0, 10571.0, 115692.0, 847735.0, 56743.0, 7091.0, 2122.0, 1026.0, 581.0, 317.0, 209.0, 153.0, 126.0, 87.0, 50.0, 40.0, 33.0, 17.0, 20.0, 10.0, 8.0, 7.0, 2.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6660614013671875, -0.644134521484375, -0.6222076416015625, -0.60028076171875, -0.5783538818359375, -0.556427001953125, -0.5345001220703125, -0.5125732421875, -0.4906463623046875, -0.468719482421875, -0.4467926025390625, -0.42486572265625, -0.4029388427734375, -0.381011962890625, -0.3590850830078125, -0.337158203125, -0.3152313232421875, -0.293304443359375, -0.2713775634765625, -0.24945068359375, -0.2275238037109375, -0.205596923828125, -0.1836700439453125, -0.1617431640625, -0.1398162841796875, -0.117889404296875, -0.0959625244140625, -0.07403564453125, -0.0521087646484375, -0.030181884765625, -0.0082550048828125, 0.013671875, 0.0355987548828125, 0.057525634765625, 0.0794525146484375, 0.10137939453125, 0.1233062744140625, 0.145233154296875, 0.1671600341796875, 0.1890869140625, 0.2110137939453125, 0.232940673828125, 0.2548675537109375, 0.27679443359375, 0.2987213134765625, 0.320648193359375, 0.3425750732421875, 0.364501953125, 0.3864288330078125, 0.408355712890625, 0.4302825927734375, 0.45220947265625, 0.4741363525390625, 0.496063232421875, 0.5179901123046875, 0.5399169921875, 0.5618438720703125, 0.583770751953125, 0.6056976318359375, 0.62762451171875, 0.6495513916015625, 0.671478271484375, 0.6934051513671875, 0.71533203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 6.0, 7.0, 10.0, 13.0, 19.0, 26.0, 17.0, 25.0, 38.0, 46.0, 63.0, 66.0, 60.0, 67.0, 56.0, 66.0, 64.0, 55.0, 51.0, 43.0, 36.0, 46.0, 24.0, 18.0, 13.0, 11.0, 8.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.88671875, -0.8603744506835938, -0.8340301513671875, -0.8076858520507812, -0.781341552734375, -0.7549972534179688, -0.7286529541015625, -0.7023086547851562, -0.67596435546875, -0.6496200561523438, -0.6232757568359375, -0.5969314575195312, -0.570587158203125, -0.5442428588867188, -0.5178985595703125, -0.49155426025390625, -0.4652099609375, -0.43886566162109375, -0.4125213623046875, -0.38617706298828125, -0.359832763671875, -0.33348846435546875, -0.3071441650390625, -0.28079986572265625, -0.25445556640625, -0.22811126708984375, -0.2017669677734375, -0.17542266845703125, -0.149078369140625, -0.12273406982421875, -0.0963897705078125, -0.07004547119140625, -0.043701171875, -0.01735687255859375, 0.0089874267578125, 0.03533172607421875, 0.061676025390625, 0.08802032470703125, 0.1143646240234375, 0.14070892333984375, 0.16705322265625, 0.19339752197265625, 0.2197418212890625, 0.24608612060546875, 0.272430419921875, 0.29877471923828125, 0.3251190185546875, 0.35146331787109375, 0.3778076171875, 0.40415191650390625, 0.4304962158203125, 0.45684051513671875, 0.483184814453125, 0.5095291137695312, 0.5358734130859375, 0.5622177124023438, 0.58856201171875, 0.6149063110351562, 0.6412506103515625, 0.6675949096679688, 0.693939208984375, 0.7202835083007812, 0.7466278076171875, 0.7729721069335938, 0.79931640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 10.0, 6.0, 21.0, 15.0, 14.0, 27.0, 32.0, 58.0, 70.0, 153.0, 303.0, 691.0, 2270.0, 14764.0, 825589.0, 193110.0, 8715.0, 1606.0, 502.0, 219.0, 116.0, 74.0, 46.0, 48.0, 18.0, 19.0, 11.0, 13.0, 7.0, 5.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283447265625, -0.2739601135253906, -0.26447296142578125, -0.2549858093261719, -0.2454986572265625, -0.23601150512695312, -0.22652435302734375, -0.21703720092773438, -0.207550048828125, -0.19806289672851562, -0.18857574462890625, -0.17908859252929688, -0.1696014404296875, -0.16011428833007812, -0.15062713623046875, -0.14113998413085938, -0.13165283203125, -0.12216567993164062, -0.11267852783203125, -0.10319137573242188, -0.0937042236328125, -0.08421707153320312, -0.07472991943359375, -0.06524276733398438, -0.055755615234375, -0.046268463134765625, -0.03678131103515625, -0.027294158935546875, -0.0178070068359375, -0.008319854736328125, 0.00116729736328125, 0.010654449462890625, 0.0201416015625, 0.029628753662109375, 0.03911590576171875, 0.048603057861328125, 0.0580902099609375, 0.06757736206054688, 0.07706451416015625, 0.08655166625976562, 0.096038818359375, 0.10552597045898438, 0.11501312255859375, 0.12450027465820312, 0.1339874267578125, 0.14347457885742188, 0.15296173095703125, 0.16244888305664062, 0.17193603515625, 0.18142318725585938, 0.19091033935546875, 0.20039749145507812, 0.2098846435546875, 0.21937179565429688, 0.22885894775390625, 0.23834609985351562, 0.247833251953125, 0.2573204040527344, 0.26680755615234375, 0.2762947082519531, 0.2857818603515625, 0.2952690124511719, 0.30475616455078125, 0.3142433166503906, 0.32373046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 5.0, 8.0, 8.0, 12.0, 12.0, 18.0, 10.0, 19.0, 46.0, 51.0, 62.0, 91.0, 87.0, 122.0, 99.0, 93.0, 65.0, 39.0, 36.0, 16.0, 15.0, 15.0, 14.0, 18.0, 4.0, 5.0, 7.0, 7.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.257129669189453e-05, -5.0951726734638214e-05, -4.93321567773819e-05, -4.771258682012558e-05, -4.609301686286926e-05, -4.4473446905612946e-05, -4.285387694835663e-05, -4.123430699110031e-05, -3.9614737033843994e-05, -3.799516707658768e-05, -3.637559711933136e-05, -3.475602716207504e-05, -3.3136457204818726e-05, -3.151688724756241e-05, -2.989731729030609e-05, -2.8277747333049774e-05, -2.6658177375793457e-05, -2.503860741853714e-05, -2.3419037461280823e-05, -2.1799467504024506e-05, -2.017989754676819e-05, -1.856032758951187e-05, -1.6940757632255554e-05, -1.5321187674999237e-05, -1.370161771774292e-05, -1.2082047760486603e-05, -1.0462477803230286e-05, -8.842907845973969e-06, -7.223337888717651e-06, -5.603767931461334e-06, -3.984197974205017e-06, -2.3646280169487e-06, -7.450580596923828e-07, 8.745118975639343e-07, 2.4940818548202515e-06, 4.113651812076569e-06, 5.733221769332886e-06, 7.352791726589203e-06, 8.97236168384552e-06, 1.0591931641101837e-05, 1.2211501598358154e-05, 1.3831071555614471e-05, 1.545064151287079e-05, 1.7070211470127106e-05, 1.8689781427383423e-05, 2.030935138463974e-05, 2.1928921341896057e-05, 2.3548491299152374e-05, 2.516806125640869e-05, 2.678763121366501e-05, 2.8407201170921326e-05, 3.0026771128177643e-05, 3.164634108543396e-05, 3.326591104269028e-05, 3.4885480999946594e-05, 3.650505095720291e-05, 3.812462091445923e-05, 3.9744190871715546e-05, 4.136376082897186e-05, 4.298333078622818e-05, 4.46029007434845e-05, 4.6222470700740814e-05, 4.784204065799713e-05, 4.946161061525345e-05, 5.1081180572509766e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 5.0, 6.0, 7.0, 3.0, 11.0, 4.0, 17.0, 14.0, 16.0, 20.0, 31.0, 34.0, 54.0, 91.0, 97.0, 137.0, 241.0, 292.0, 530.0, 913.0, 1650.0, 3594.0, 9150.0, 32668.0, 219903.0, 695584.0, 59824.0, 13508.0, 4910.0, 2295.0, 1143.0, 616.0, 357.0, 228.0, 158.0, 111.0, 80.0, 56.0, 51.0, 36.0, 22.0, 18.0, 19.0, 15.0, 11.0, 5.0, 7.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1221923828125, -0.11850929260253906, -0.11482620239257812, -0.11114311218261719, -0.10746002197265625, -0.10377693176269531, -0.10009384155273438, -0.09641075134277344, -0.0927276611328125, -0.08904457092285156, -0.08536148071289062, -0.08167839050292969, -0.07799530029296875, -0.07431221008300781, -0.07062911987304688, -0.06694602966308594, -0.063262939453125, -0.05957984924316406, -0.055896759033203125, -0.05221366882324219, -0.04853057861328125, -0.04484748840332031, -0.041164398193359375, -0.03748130798339844, -0.0337982177734375, -0.030115127563476562, -0.026432037353515625, -0.022748947143554688, -0.01906585693359375, -0.015382766723632812, -0.011699676513671875, -0.008016586303710938, -0.00433349609375, -0.0006504058837890625, 0.003032684326171875, 0.0067157745361328125, 0.01039886474609375, 0.014081954956054688, 0.017765045166015625, 0.021448135375976562, 0.0251312255859375, 0.028814315795898438, 0.032497406005859375, 0.03618049621582031, 0.03986358642578125, 0.04354667663574219, 0.047229766845703125, 0.05091285705566406, 0.054595947265625, 0.05827903747558594, 0.061962127685546875, 0.06564521789550781, 0.06932830810546875, 0.07301139831542969, 0.07669448852539062, 0.08037757873535156, 0.0840606689453125, 0.08774375915527344, 0.09142684936523438, 0.09510993957519531, 0.09879302978515625, 0.10247611999511719, 0.10615921020507812, 0.10984230041503906, 0.113525390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 1.0, 4.0, 6.0, 3.0, 4.0, 3.0, 7.0, 3.0, 12.0, 15.0, 24.0, 36.0, 36.0, 39.0, 56.0, 88.0, 114.0, 119.0, 110.0, 74.0, 41.0, 45.0, 38.0, 22.0, 17.0, 20.0, 14.0, 8.0, 5.0, 4.0, 6.0, 7.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.1317138671875, -0.12735557556152344, -0.12299728393554688, -0.11863899230957031, -0.11428070068359375, -0.10992240905761719, -0.10556411743164062, -0.10120582580566406, -0.0968475341796875, -0.09248924255371094, -0.08813095092773438, -0.08377265930175781, -0.07941436767578125, -0.07505607604980469, -0.07069778442382812, -0.06633949279785156, -0.061981201171875, -0.05762290954589844, -0.053264617919921875, -0.04890632629394531, -0.04454803466796875, -0.04018974304199219, -0.035831451416015625, -0.03147315979003906, -0.0271148681640625, -0.022756576538085938, -0.018398284912109375, -0.014039993286132812, -0.00968170166015625, -0.0053234100341796875, -0.000965118408203125, 0.0033931732177734375, 0.00775146484375, 0.012109756469726562, 0.016468048095703125, 0.020826339721679688, 0.02518463134765625, 0.029542922973632812, 0.033901214599609375, 0.03825950622558594, 0.0426177978515625, 0.04697608947753906, 0.051334381103515625, 0.05569267272949219, 0.06005096435546875, 0.06440925598144531, 0.06876754760742188, 0.07312583923339844, 0.077484130859375, 0.08184242248535156, 0.08620071411132812, 0.09055900573730469, 0.09491729736328125, 0.09927558898925781, 0.10363388061523438, 0.10799217224121094, 0.1123504638671875, 0.11670875549316406, 0.12106704711914062, 0.1254253387451172, 0.12978363037109375, 0.1341419219970703, 0.13850021362304688, 0.14285850524902344, 0.147216796875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 5.0, 9.0, 20.0, 74.0, 328.0, 375.0, 122.0, 39.0, 13.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.278661727905273, -8.05510425567627, -7.831547260284424, -7.607990264892578, -7.384432792663574, -7.1608757972717285, -6.937318801879883, -6.713761329650879, -6.490203857421875, -6.266646862030029, -6.043089389801025, -5.81953239440918, -5.595974922180176, -5.37241792678833, -5.148860931396484, -4.9253034591674805, -4.701746463775635, -4.478189468383789, -4.254631996154785, -4.0310750007629395, -3.8075175285339355, -3.58396053314209, -3.360403299331665, -3.1368460655212402, -2.9132888317108154, -2.6897315979003906, -2.466174364089966, -2.242617130279541, -2.0190601348876953, -1.795502781867981, -1.5719456672668457, -1.348388433456421, -1.124830722808838, -0.9012734889984131, -0.6777163147926331, -0.454159140586853, -0.23060190677642822, -0.007044672966003418, 0.21651244163513184, 0.44006967544555664, 0.6636269092559814, 0.8871841430664062, 1.110741376876831, 1.3342984914779663, 1.5578557252883911, 1.781412959098816, 2.004970073699951, 2.228527307510376, 2.452084541320801, 2.6756417751312256, 2.8991990089416504, 3.122756004333496, 3.3463134765625, 3.5698704719543457, 3.7934277057647705, 4.016984939575195, 4.240542411804199, 4.464099407196045, 4.687656879425049, 4.9112138748168945, 5.134771347045898, 5.358328342437744, 5.58188533782959, 5.805442810058594, 6.0289998054504395]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 4.0, 7.0, 8.0, 9.0, 12.0, 12.0, 13.0, 19.0, 8.0, 15.0, 19.0, 20.0, 12.0, 27.0, 29.0, 24.0, 32.0, 45.0, 95.0, 126.0, 94.0, 38.0, 49.0, 30.0, 22.0, 23.0, 26.0, 23.0, 22.0, 22.0, 21.0, 14.0, 17.0, 5.0, 15.0, 5.0, 4.0, 6.0, 3.0, 7.0, 2.0, 1.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.2721033096313477, -2.2023508548736572, -2.132598400115967, -2.0628459453582764, -1.9930933713912964, -1.923340916633606, -1.853588342666626, -1.7838358879089355, -1.7140834331512451, -1.6443309783935547, -1.5745785236358643, -1.5048259496688843, -1.4350734949111938, -1.3653210401535034, -1.2955684661865234, -1.225816011428833, -1.1560635566711426, -1.0863111019134521, -1.0165586471557617, -0.9468060731887817, -0.8770536184310913, -0.8073011636734009, -0.7375486493110657, -0.6677961349487305, -0.59804368019104, -0.5282912254333496, -0.4585387110710144, -0.3887862265110016, -0.31903374195098877, -0.24928125739097595, -0.17952877283096313, -0.10977628827095032, -0.0400238037109375, 0.029728680849075317, 0.09948116540908813, 0.16923364996910095, 0.23898613452911377, 0.3087386190891266, 0.3784911036491394, 0.4482435882091522, 0.517996072769165, 0.5877485275268555, 0.6575010418891907, 0.7272535562515259, 0.7970060110092163, 0.8667584657669067, 0.9365109801292419, 1.0062634944915771, 1.0760159492492676, 1.145768404006958, 1.2155208587646484, 1.2852734327316284, 1.3550258874893188, 1.4247783422470093, 1.4945309162139893, 1.5642833709716797, 1.6340358257293701, 1.7037882804870605, 1.773540735244751, 1.843293309211731, 1.9130457639694214, 1.9827982187271118, 2.052550792694092, 2.1223032474517822, 2.1920557022094727]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 10.0, 11.0, 12.0, 14.0, 21.0, 21.0, 41.0, 63.0, 99.0, 156.0, 251.0, 422.0, 616.0, 1141.0, 2124.0, 4101.0, 8998.0, 23922.0, 86803.0, 390340.0, 1334910.0, 1636801.0, 531639.0, 119144.0, 31300.0, 10724.0, 4825.0, 2394.0, 1314.0, 795.0, 435.0, 300.0, 189.0, 121.0, 72.0, 35.0, 34.0, 27.0, 21.0, 14.0, 4.0, 6.0, 1.0, 6.0, 7.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.223388671875, -0.21544265747070312, -0.20749664306640625, -0.19955062866210938, -0.1916046142578125, -0.18365859985351562, -0.17571258544921875, -0.16776657104492188, -0.159820556640625, -0.15187454223632812, -0.14392852783203125, -0.13598251342773438, -0.1280364990234375, -0.12009048461914062, -0.11214447021484375, -0.10419845581054688, -0.09625244140625, -0.08830642700195312, -0.08036041259765625, -0.07241439819335938, -0.0644683837890625, -0.056522369384765625, -0.04857635498046875, -0.040630340576171875, -0.032684326171875, -0.024738311767578125, -0.01679229736328125, -0.008846282958984375, -0.0009002685546875, 0.007045745849609375, 0.01499176025390625, 0.022937774658203125, 0.0308837890625, 0.038829803466796875, 0.04677581787109375, 0.054721832275390625, 0.0626678466796875, 0.07061386108398438, 0.07855987548828125, 0.08650588989257812, 0.094451904296875, 0.10239791870117188, 0.11034393310546875, 0.11828994750976562, 0.1262359619140625, 0.13418197631835938, 0.14212799072265625, 0.15007400512695312, 0.15802001953125, 0.16596603393554688, 0.17391204833984375, 0.18185806274414062, 0.1898040771484375, 0.19775009155273438, 0.20569610595703125, 0.21364212036132812, 0.221588134765625, 0.22953414916992188, 0.23748016357421875, 0.24542617797851562, 0.2533721923828125, 0.2613182067871094, 0.26926422119140625, 0.2772102355957031, 0.28515625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 8.0, 4.0, 11.0, 10.0, 18.0, 28.0, 21.0, 26.0, 43.0, 35.0, 47.0, 46.0, 51.0, 56.0, 63.0, 53.0, 55.0, 49.0, 43.0, 41.0, 46.0, 31.0, 40.0, 23.0, 25.0, 26.0, 12.0, 21.0, 14.0, 12.0, 10.0, 9.0, 8.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2012939453125, -0.1949748992919922, -0.18865585327148438, -0.18233680725097656, -0.17601776123046875, -0.16969871520996094, -0.16337966918945312, -0.1570606231689453, -0.1507415771484375, -0.1444225311279297, -0.13810348510742188, -0.13178443908691406, -0.12546539306640625, -0.11914634704589844, -0.11282730102539062, -0.10650825500488281, -0.100189208984375, -0.09387016296386719, -0.08755111694335938, -0.08123207092285156, -0.07491302490234375, -0.06859397888183594, -0.062274932861328125, -0.05595588684082031, -0.0496368408203125, -0.04331779479980469, -0.036998748779296875, -0.030679702758789062, -0.02436065673828125, -0.018041610717773438, -0.011722564697265625, -0.0054035186767578125, 0.00091552734375, 0.0072345733642578125, 0.013553619384765625, 0.019872665405273438, 0.02619171142578125, 0.03251075744628906, 0.038829803466796875, 0.04514884948730469, 0.0514678955078125, 0.05778694152832031, 0.06410598754882812, 0.07042503356933594, 0.07674407958984375, 0.08306312561035156, 0.08938217163085938, 0.09570121765136719, 0.102020263671875, 0.10833930969238281, 0.11465835571289062, 0.12097740173339844, 0.12729644775390625, 0.13361549377441406, 0.13993453979492188, 0.1462535858154297, 0.1525726318359375, 0.1588916778564453, 0.16521072387695312, 0.17152976989746094, 0.17784881591796875, 0.18416786193847656, 0.19048690795898438, 0.1968059539794922, 0.203125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 5.0, 7.0, 5.0, 8.0, 15.0, 16.0, 23.0, 34.0, 45.0, 79.0, 124.0, 223.0, 350.0, 674.0, 1594.0, 5063.0, 45674.0, 3830812.0, 293565.0, 11207.0, 2566.0, 984.0, 464.0, 264.0, 162.0, 90.0, 74.0, 39.0, 36.0, 22.0, 18.0, 10.0, 6.0, 6.0, 6.0, 2.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95703125, -0.925872802734375, -0.89471435546875, -0.863555908203125, -0.8323974609375, -0.801239013671875, -0.77008056640625, -0.738922119140625, -0.707763671875, -0.676605224609375, -0.64544677734375, -0.614288330078125, -0.5831298828125, -0.551971435546875, -0.52081298828125, -0.489654541015625, -0.45849609375, -0.427337646484375, -0.39617919921875, -0.365020751953125, -0.3338623046875, -0.302703857421875, -0.27154541015625, -0.240386962890625, -0.209228515625, -0.178070068359375, -0.14691162109375, -0.115753173828125, -0.0845947265625, -0.053436279296875, -0.02227783203125, 0.008880615234375, 0.0400390625, 0.071197509765625, 0.10235595703125, 0.133514404296875, 0.1646728515625, 0.195831298828125, 0.22698974609375, 0.258148193359375, 0.289306640625, 0.320465087890625, 0.35162353515625, 0.382781982421875, 0.4139404296875, 0.445098876953125, 0.47625732421875, 0.507415771484375, 0.53857421875, 0.569732666015625, 0.60089111328125, 0.632049560546875, 0.6632080078125, 0.694366455078125, 0.72552490234375, 0.756683349609375, 0.787841796875, 0.819000244140625, 0.85015869140625, 0.881317138671875, 0.9124755859375, 0.943634033203125, 0.97479248046875, 1.005950927734375, 1.037109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 9.0, 10.0, 12.0, 19.0, 26.0, 40.0, 42.0, 58.0, 72.0, 119.0, 147.0, 220.0, 306.0, 405.0, 512.0, 514.0, 432.0, 319.0, 219.0, 163.0, 116.0, 78.0, 64.0, 49.0, 37.0, 19.0, 16.0, 14.0, 6.0, 0.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52294921875, -0.5060043334960938, -0.4890594482421875, -0.47211456298828125, -0.455169677734375, -0.43822479248046875, -0.4212799072265625, -0.40433502197265625, -0.38739013671875, -0.37044525146484375, -0.3535003662109375, -0.33655548095703125, -0.319610595703125, -0.30266571044921875, -0.2857208251953125, -0.26877593994140625, -0.2518310546875, -0.23488616943359375, -0.2179412841796875, -0.20099639892578125, -0.184051513671875, -0.16710662841796875, -0.1501617431640625, -0.13321685791015625, -0.11627197265625, -0.09932708740234375, -0.0823822021484375, -0.06543731689453125, -0.048492431640625, -0.03154754638671875, -0.0146026611328125, 0.00234222412109375, 0.019287109375, 0.03623199462890625, 0.0531768798828125, 0.07012176513671875, 0.087066650390625, 0.10401153564453125, 0.1209564208984375, 0.13790130615234375, 0.15484619140625, 0.17179107666015625, 0.1887359619140625, 0.20568084716796875, 0.222625732421875, 0.23957061767578125, 0.2565155029296875, 0.27346038818359375, 0.2904052734375, 0.30735015869140625, 0.3242950439453125, 0.34123992919921875, 0.358184814453125, 0.37512969970703125, 0.3920745849609375, 0.40901947021484375, 0.42596435546875, 0.44290924072265625, 0.4598541259765625, 0.47679901123046875, 0.493743896484375, 0.5106887817382812, 0.5276336669921875, 0.5445785522460938, 0.5615234375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 11.0, 21.0, 39.0, 68.0, 109.0, 172.0, 196.0, 133.0, 81.0, 54.0, 36.0, 21.0, 11.0, 11.0, 2.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.19105339050293, -4.985244274139404, -4.779434680938721, -4.573625564575195, -4.367815971374512, -4.162006855010986, -3.956197500228882, -3.7503881454467773, -3.544578790664673, -3.3387694358825684, -3.132960081100464, -2.9271507263183594, -2.721341609954834, -2.5155320167541504, -2.309722900390625, -2.1039135456085205, -1.898104190826416, -1.6922948360443115, -1.486485481262207, -1.280676245689392, -1.0748668909072876, -0.8690575361251831, -0.6632483005523682, -0.45743894577026367, -0.2516295909881592, -0.045820266008377075, 0.15998905897140503, 0.36579835414886475, 0.5716077089309692, 0.7774170637130737, 0.9832262992858887, 1.1890356540679932, 1.3948450088500977, 1.6006543636322021, 1.8064637184143066, 2.012272834777832, 2.2180824279785156, 2.423891544342041, 2.6297008991241455, 2.83551025390625, 3.0413196086883545, 3.247128963470459, 3.4529383182525635, 3.658747673034668, 3.8645567893981934, 4.070366382598877, 4.276175498962402, 4.481985092163086, 4.687794208526611, 4.893603324890137, 5.09941291809082, 5.305222034454346, 5.511031627655029, 5.716840744018555, 5.922650337219238, 6.128459453582764, 6.334268569946289, 6.5400776863098145, 6.745887279510498, 6.951696395874023, 7.157505989074707, 7.363315105438232, 7.569124221801758, 7.774933815002441, 7.980743408203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 4.0, 5.0, 9.0, 6.0, 8.0, 9.0, 14.0, 13.0, 16.0, 18.0, 17.0, 31.0, 29.0, 39.0, 44.0, 29.0, 53.0, 52.0, 54.0, 64.0, 77.0, 70.0, 48.0, 46.0, 41.0, 43.0, 28.0, 30.0, 24.0, 19.0, 16.0, 18.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9535839557647705, -3.8372952938079834, -3.7210066318511963, -3.604717969894409, -3.488429546356201, -3.372140884399414, -3.255852222442627, -3.13956356048584, -3.0232748985290527, -2.9069862365722656, -2.7906975746154785, -2.6744089126586914, -2.5581202507019043, -2.441831588745117, -2.325543165206909, -2.209254503250122, -2.092965841293335, -1.9766771793365479, -1.8603885173797607, -1.7440999746322632, -1.627811312675476, -1.511522650718689, -1.3952341079711914, -1.2789454460144043, -1.1626567840576172, -1.04636812210083, -0.9300795197486877, -0.8137909173965454, -0.6975022554397583, -0.5812135934829712, -0.46492499113082886, -0.3486363887786865, -0.2323474884033203, -0.11605885624885559, 0.00022977590560913086, 0.11651840806007385, 0.23280704021453857, 0.3490957021713257, 0.465384304523468, 0.5816729068756104, 0.6979615688323975, 0.8142502307891846, 0.9305388331413269, 1.0468274354934692, 1.1631160974502563, 1.2794047594070435, 1.395693302154541, 1.5119819641113281, 1.6282706260681152, 1.7445592880249023, 1.8608479499816895, 1.977136492729187, 2.0934252738952637, 2.209713935852051, 2.326002359390259, 2.442291021347046, 2.558579683303833, 2.67486834526062, 2.7911570072174072, 2.9074456691741943, 3.0237340927124023, 3.1400227546691895, 3.2563114166259766, 3.3726000785827637, 3.488888740539551]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 12.0, 15.0, 18.0, 17.0, 17.0, 61.0, 82.0, 118.0, 285.0, 516.0, 1019.0, 2313.0, 5802.0, 17493.0, 75563.0, 600815.0, 279186.0, 45369.0, 12030.0, 4226.0, 1812.0, 829.0, 392.0, 221.0, 133.0, 59.0, 42.0, 32.0, 17.0, 15.0, 13.0, 8.0, 0.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.44873046875, -0.4354705810546875, -0.422210693359375, -0.4089508056640625, -0.39569091796875, -0.3824310302734375, -0.369171142578125, -0.3559112548828125, -0.3426513671875, -0.3293914794921875, -0.316131591796875, -0.3028717041015625, -0.28961181640625, -0.2763519287109375, -0.263092041015625, -0.2498321533203125, -0.236572265625, -0.2233123779296875, -0.210052490234375, -0.1967926025390625, -0.18353271484375, -0.1702728271484375, -0.157012939453125, -0.1437530517578125, -0.1304931640625, -0.1172332763671875, -0.103973388671875, -0.0907135009765625, -0.07745361328125, -0.0641937255859375, -0.050933837890625, -0.0376739501953125, -0.0244140625, -0.0111541748046875, 0.002105712890625, 0.0153656005859375, 0.02862548828125, 0.0418853759765625, 0.055145263671875, 0.0684051513671875, 0.0816650390625, 0.0949249267578125, 0.108184814453125, 0.1214447021484375, 0.13470458984375, 0.1479644775390625, 0.161224365234375, 0.1744842529296875, 0.187744140625, 0.2010040283203125, 0.214263916015625, 0.2275238037109375, 0.24078369140625, 0.2540435791015625, 0.267303466796875, 0.2805633544921875, 0.2938232421875, 0.3070831298828125, 0.320343017578125, 0.3336029052734375, 0.34686279296875, 0.3601226806640625, 0.373382568359375, 0.3866424560546875, 0.39990234375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 18.0, 8.0, 18.0, 27.0, 35.0, 61.0, 69.0, 78.0, 60.0, 79.0, 74.0, 75.0, 80.0, 66.0, 57.0, 43.0, 39.0, 22.0, 29.0, 16.0, 7.0, 11.0, 11.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.357666015625, -0.3466835021972656, -0.33570098876953125, -0.3247184753417969, -0.3137359619140625, -0.3027534484863281, -0.29177093505859375, -0.2807884216308594, -0.269805908203125, -0.2588233947753906, -0.24784088134765625, -0.23685836791992188, -0.2258758544921875, -0.21489334106445312, -0.20391082763671875, -0.19292831420898438, -0.18194580078125, -0.17096328735351562, -0.15998077392578125, -0.14899826049804688, -0.1380157470703125, -0.12703323364257812, -0.11605072021484375, -0.10506820678710938, -0.094085693359375, -0.08310317993164062, -0.07212066650390625, -0.061138153076171875, -0.0501556396484375, -0.039173126220703125, -0.02819061279296875, -0.017208099365234375, -0.0062255859375, 0.004756927490234375, 0.01573944091796875, 0.026721954345703125, 0.0377044677734375, 0.048686981201171875, 0.05966949462890625, 0.07065200805664062, 0.081634521484375, 0.09261703491210938, 0.10359954833984375, 0.11458206176757812, 0.1255645751953125, 0.13654708862304688, 0.14752960205078125, 0.15851211547851562, 0.16949462890625, 0.18047714233398438, 0.19145965576171875, 0.20244216918945312, 0.2134246826171875, 0.22440719604492188, 0.23538970947265625, 0.24637222290039062, 0.257354736328125, 0.2683372497558594, 0.27931976318359375, 0.2903022766113281, 0.3012847900390625, 0.3122673034667969, 0.32324981689453125, 0.3342323303222656, 0.34521484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 2.0, 6.0, 5.0, 10.0, 7.0, 11.0, 17.0, 25.0, 28.0, 38.0, 58.0, 77.0, 103.0, 178.0, 298.0, 518.0, 1064.0, 2798.0, 12085.0, 103665.0, 875529.0, 41615.0, 6480.0, 1905.0, 758.0, 422.0, 280.0, 179.0, 118.0, 79.0, 57.0, 33.0, 13.0, 24.0, 12.0, 9.0, 9.0, 10.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.44677734375, -0.432037353515625, -0.41729736328125, -0.402557373046875, -0.3878173828125, -0.373077392578125, -0.35833740234375, -0.343597412109375, -0.328857421875, -0.314117431640625, -0.29937744140625, -0.284637451171875, -0.2698974609375, -0.255157470703125, -0.24041748046875, -0.225677490234375, -0.2109375, -0.196197509765625, -0.18145751953125, -0.166717529296875, -0.1519775390625, -0.137237548828125, -0.12249755859375, -0.107757568359375, -0.093017578125, -0.078277587890625, -0.06353759765625, -0.048797607421875, -0.0340576171875, -0.019317626953125, -0.00457763671875, 0.010162353515625, 0.02490234375, 0.039642333984375, 0.05438232421875, 0.069122314453125, 0.0838623046875, 0.098602294921875, 0.11334228515625, 0.128082275390625, 0.142822265625, 0.157562255859375, 0.17230224609375, 0.187042236328125, 0.2017822265625, 0.216522216796875, 0.23126220703125, 0.246002197265625, 0.2607421875, 0.275482177734375, 0.29022216796875, 0.304962158203125, 0.3197021484375, 0.334442138671875, 0.34918212890625, 0.363922119140625, 0.378662109375, 0.393402099609375, 0.40814208984375, 0.422882080078125, 0.4376220703125, 0.452362060546875, 0.46710205078125, 0.481842041015625, 0.49658203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 1.0, 2.0, 5.0, 8.0, 9.0, 6.0, 8.0, 13.0, 8.0, 20.0, 20.0, 18.0, 21.0, 35.0, 35.0, 40.0, 76.0, 86.0, 99.0, 94.0, 74.0, 61.0, 50.0, 32.0, 30.0, 27.0, 21.0, 17.0, 14.0, 14.0, 13.0, 8.0, 5.0, 9.0, 9.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.94775390625, -0.9168624877929688, -0.8859710693359375, -0.8550796508789062, -0.824188232421875, -0.7932968139648438, -0.7624053955078125, -0.7315139770507812, -0.70062255859375, -0.6697311401367188, -0.6388397216796875, -0.6079483032226562, -0.577056884765625, -0.5461654663085938, -0.5152740478515625, -0.48438262939453125, -0.4534912109375, -0.42259979248046875, -0.3917083740234375, -0.36081695556640625, -0.329925537109375, -0.29903411865234375, -0.2681427001953125, -0.23725128173828125, -0.20635986328125, -0.17546844482421875, -0.1445770263671875, -0.11368560791015625, -0.082794189453125, -0.05190277099609375, -0.0210113525390625, 0.00988006591796875, 0.040771484375, 0.07166290283203125, 0.1025543212890625, 0.13344573974609375, 0.164337158203125, 0.19522857666015625, 0.2261199951171875, 0.25701141357421875, 0.28790283203125, 0.31879425048828125, 0.3496856689453125, 0.38057708740234375, 0.411468505859375, 0.44235992431640625, 0.4732513427734375, 0.5041427612304688, 0.5350341796875, 0.5659255981445312, 0.5968170166015625, 0.6277084350585938, 0.658599853515625, 0.6894912719726562, 0.7203826904296875, 0.7512741088867188, 0.78216552734375, 0.8130569458007812, 0.8439483642578125, 0.8748397827148438, 0.905731201171875, 0.9366226196289062, 0.9675140380859375, 0.9984054565429688, 1.029296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 7.0, 3.0, 3.0, 5.0, 10.0, 16.0, 21.0, 21.0, 41.0, 45.0, 95.0, 127.0, 213.0, 301.0, 529.0, 1025.0, 2245.0, 5719.0, 18097.0, 80383.0, 830374.0, 80882.0, 17847.0, 5730.0, 2287.0, 1078.0, 574.0, 336.0, 179.0, 97.0, 75.0, 36.0, 47.0, 33.0, 17.0, 11.0, 12.0, 5.0, 6.0, 5.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.058685302734375, -0.05682229995727539, -0.05495929718017578, -0.05309629440307617, -0.05123329162597656, -0.04937028884887695, -0.047507286071777344, -0.045644283294677734, -0.043781280517578125, -0.041918277740478516, -0.040055274963378906, -0.0381922721862793, -0.03632926940917969, -0.03446626663208008, -0.03260326385498047, -0.03074026107788086, -0.02887725830078125, -0.02701425552368164, -0.02515125274658203, -0.023288249969482422, -0.021425247192382812, -0.019562244415283203, -0.017699241638183594, -0.015836238861083984, -0.013973236083984375, -0.012110233306884766, -0.010247230529785156, -0.008384227752685547, -0.0065212249755859375, -0.004658222198486328, -0.0027952194213867188, -0.0009322166442871094, 0.0009307861328125, 0.0027937889099121094, 0.004656791687011719, 0.006519794464111328, 0.008382797241210938, 0.010245800018310547, 0.012108802795410156, 0.013971805572509766, 0.015834808349609375, 0.017697811126708984, 0.019560813903808594, 0.021423816680908203, 0.023286819458007812, 0.025149822235107422, 0.02701282501220703, 0.02887582778930664, 0.03073883056640625, 0.03260183334350586, 0.03446483612060547, 0.03632783889770508, 0.03819084167480469, 0.0400538444519043, 0.041916847229003906, 0.043779850006103516, 0.045642852783203125, 0.047505855560302734, 0.049368858337402344, 0.05123186111450195, 0.05309486389160156, 0.05495786666870117, 0.05682086944580078, 0.05868387222290039, 0.060546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 10.0, 3.0, 8.0, 5.0, 9.0, 8.0, 16.0, 12.0, 9.0, 17.0, 19.0, 22.0, 44.0, 35.0, 44.0, 52.0, 61.0, 88.0, 98.0, 73.0, 61.0, 47.0, 46.0, 43.0, 24.0, 28.0, 16.0, 14.0, 14.0, 12.0, 7.0, 8.0, 8.0, 7.0, 6.0, 2.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.777576446533203e-05, -2.6756897568702698e-05, -2.5738030672073364e-05, -2.471916377544403e-05, -2.3700296878814697e-05, -2.2681429982185364e-05, -2.166256308555603e-05, -2.0643696188926697e-05, -1.9624829292297363e-05, -1.860596239566803e-05, -1.7587095499038696e-05, -1.6568228602409363e-05, -1.554936170578003e-05, -1.4530494809150696e-05, -1.3511627912521362e-05, -1.2492761015892029e-05, -1.1473894119262695e-05, -1.0455027222633362e-05, -9.436160326004028e-06, -8.417293429374695e-06, -7.398426532745361e-06, -6.379559636116028e-06, -5.360692739486694e-06, -4.341825842857361e-06, -3.3229589462280273e-06, -2.304092049598694e-06, -1.2852251529693604e-06, -2.6635825634002686e-07, 7.525086402893066e-07, 1.7713755369186401e-06, 2.7902424335479736e-06, 3.809109330177307e-06, 4.827976226806641e-06, 5.846843123435974e-06, 6.865710020065308e-06, 7.884576916694641e-06, 8.903443813323975e-06, 9.922310709953308e-06, 1.0941177606582642e-05, 1.1960044503211975e-05, 1.2978911399841309e-05, 1.3997778296470642e-05, 1.5016645193099976e-05, 1.603551208972931e-05, 1.7054378986358643e-05, 1.8073245882987976e-05, 1.909211277961731e-05, 2.0110979676246643e-05, 2.1129846572875977e-05, 2.214871346950531e-05, 2.3167580366134644e-05, 2.4186447262763977e-05, 2.520531415939331e-05, 2.6224181056022644e-05, 2.7243047952651978e-05, 2.826191484928131e-05, 2.9280781745910645e-05, 3.0299648642539978e-05, 3.131851553916931e-05, 3.2337382435798645e-05, 3.335624933242798e-05, 3.437511622905731e-05, 3.5393983125686646e-05, 3.641285002231598e-05, 3.743171691894531e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 8.0, 6.0, 4.0, 5.0, 15.0, 15.0, 20.0, 38.0, 38.0, 49.0, 76.0, 122.0, 160.0, 274.0, 429.0, 657.0, 1168.0, 2083.0, 3902.0, 8168.0, 19381.0, 58434.0, 701748.0, 180560.0, 41538.0, 15091.0, 6753.0, 3246.0, 1772.0, 1002.0, 649.0, 377.0, 236.0, 156.0, 100.0, 76.0, 50.0, 26.0, 31.0, 19.0, 15.0, 8.0, 9.0, 9.0, 9.0, 5.0, 1.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.03924560546875, -0.03801393508911133, -0.036782264709472656, -0.035550594329833984, -0.03431892395019531, -0.03308725357055664, -0.03185558319091797, -0.030623912811279297, -0.029392242431640625, -0.028160572052001953, -0.02692890167236328, -0.02569723129272461, -0.024465560913085938, -0.023233890533447266, -0.022002220153808594, -0.020770549774169922, -0.01953887939453125, -0.018307209014892578, -0.017075538635253906, -0.015843868255615234, -0.014612197875976562, -0.01338052749633789, -0.012148857116699219, -0.010917186737060547, -0.009685516357421875, -0.008453845977783203, -0.007222175598144531, -0.005990505218505859, -0.0047588348388671875, -0.0035271644592285156, -0.0022954940795898438, -0.0010638236999511719, 0.0001678466796875, 0.0013995170593261719, 0.0026311874389648438, 0.0038628578186035156, 0.0050945281982421875, 0.006326198577880859, 0.007557868957519531, 0.008789539337158203, 0.010021209716796875, 0.011252880096435547, 0.012484550476074219, 0.01371622085571289, 0.014947891235351562, 0.016179561614990234, 0.017411231994628906, 0.018642902374267578, 0.01987457275390625, 0.021106243133544922, 0.022337913513183594, 0.023569583892822266, 0.024801254272460938, 0.02603292465209961, 0.02726459503173828, 0.028496265411376953, 0.029727935791015625, 0.030959606170654297, 0.03219127655029297, 0.03342294692993164, 0.03465461730957031, 0.035886287689208984, 0.037117958068847656, 0.03834962844848633, 0.039581298828125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 8.0, 4.0, 9.0, 18.0, 21.0, 21.0, 21.0, 31.0, 53.0, 52.0, 80.0, 95.0, 121.0, 83.0, 76.0, 67.0, 55.0, 42.0, 27.0, 29.0, 19.0, 18.0, 15.0, 5.0, 5.0, 2.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.096435546875, -0.0938119888305664, -0.09118843078613281, -0.08856487274169922, -0.08594131469726562, -0.08331775665283203, -0.08069419860839844, -0.07807064056396484, -0.07544708251953125, -0.07282352447509766, -0.07019996643066406, -0.06757640838623047, -0.06495285034179688, -0.06232929229736328, -0.05970573425292969, -0.057082176208496094, -0.0544586181640625, -0.051835060119628906, -0.04921150207519531, -0.04658794403076172, -0.043964385986328125, -0.04134082794189453, -0.03871726989746094, -0.036093711853027344, -0.03347015380859375, -0.030846595764160156, -0.028223037719726562, -0.02559947967529297, -0.022975921630859375, -0.02035236358642578, -0.017728805541992188, -0.015105247497558594, -0.012481689453125, -0.009858131408691406, -0.0072345733642578125, -0.004611015319824219, -0.001987457275390625, 0.0006361007690429688, 0.0032596588134765625, 0.005883216857910156, 0.00850677490234375, 0.011130332946777344, 0.013753890991210938, 0.01637744903564453, 0.019001007080078125, 0.02162456512451172, 0.024248123168945312, 0.026871681213378906, 0.0294952392578125, 0.032118797302246094, 0.03474235534667969, 0.03736591339111328, 0.039989471435546875, 0.04261302947998047, 0.04523658752441406, 0.047860145568847656, 0.05048370361328125, 0.053107261657714844, 0.05573081970214844, 0.05835437774658203, 0.060977935791015625, 0.06360149383544922, 0.06622505187988281, 0.0688486099243164, 0.07147216796875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 18.0, 45.0, 83.0, 407.0, 280.0, 95.0, 29.0, 22.0, 4.0, 3.0, 2.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.082947731018066, -3.925687789916992, -3.768427848815918, -3.6111679077148438, -3.4539079666137695, -3.2966480255126953, -3.1393883228302, -2.982128381729126, -2.8248684406280518, -2.6676084995269775, -2.5103485584259033, -2.353088617324829, -2.195828914642334, -2.0385689735412598, -1.8813090324401855, -1.7240490913391113, -1.566789150238037, -1.409529209136963, -1.2522692680358887, -1.095009446144104, -0.9377495050430298, -0.7804895639419556, -0.6232296824455261, -0.4659698009490967, -0.30870985984802246, -0.15144994854927063, 0.005809962749481201, 0.16306987404823303, 0.32032978534698486, 0.4775897264480591, 0.6348496079444885, 0.792109489440918, 0.949368953704834, 1.1066288948059082, 1.2638888359069824, 1.421148657798767, 1.5784085988998413, 1.7356685400009155, 1.8929283618927002, 2.0501883029937744, 2.2074482440948486, 2.364708185195923, 2.521968126296997, 2.6792280673980713, 2.8364877700805664, 2.9937477111816406, 3.151007652282715, 3.308267593383789, 3.4655275344848633, 3.6227874755859375, 3.7800474166870117, 3.937307357788086, 4.09456729888916, 4.251827239990234, 4.409087181091309, 4.566347122192383, 4.723607063293457, 4.880867004394531, 5.0381269454956055, 5.19538688659668, 5.352646827697754, 5.509906768798828, 5.667166709899902, 5.824426651000977, 5.981686115264893]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 7.0, 13.0, 7.0, 9.0, 13.0, 16.0, 11.0, 15.0, 9.0, 16.0, 12.0, 20.0, 21.0, 21.0, 46.0, 135.0, 199.0, 149.0, 32.0, 30.0, 16.0, 24.0, 22.0, 18.0, 24.0, 12.0, 12.0, 14.0, 10.0, 15.0, 9.0, 9.0, 4.0, 4.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-2.3717689514160156, -2.303168773651123, -2.2345685958862305, -2.165968179702759, -2.097368001937866, -2.0287678241729736, -1.960167646408081, -1.8915674686431885, -1.8229671716690063, -1.7543669939041138, -1.6857666969299316, -1.617166519165039, -1.5485663414001465, -1.4799660444259644, -1.4113658666610718, -1.3427655696868896, -1.274165391921997, -1.2055652141571045, -1.1369649171829224, -1.0683647394180298, -0.9997645020484924, -0.9311642646789551, -0.8625640869140625, -0.7939638495445251, -0.7253636121749878, -0.6567633748054504, -0.5881631374359131, -0.5195629596710205, -0.45096272230148315, -0.3823624849319458, -0.31376227736473083, -0.24516206979751587, -0.17656159400939941, -0.10796137154102325, -0.039361149072647095, 0.029239073395729065, 0.09783929586410522, 0.16643953323364258, 0.23503974080085754, 0.3036399483680725, 0.37224018573760986, 0.4408404231071472, 0.5094406604766846, 0.5780408382415771, 0.6466410756111145, 0.7152413129806519, 0.7838414907455444, 0.8524417281150818, 0.9210419654846191, 0.9896422028541565, 1.0582424402236938, 1.1268426179885864, 1.1954429149627686, 1.2640430927276611, 1.3326432704925537, 1.4012434482574463, 1.4698437452316284, 1.538443922996521, 1.6070442199707031, 1.6756443977355957, 1.7442445755004883, 1.8128448724746704, 1.881445050239563, 1.9500453472137451, 2.0186455249786377]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 5.0, 6.0, 10.0, 9.0, 15.0, 12.0, 15.0, 16.0, 22.0, 27.0, 40.0, 38.0, 34.0, 47.0, 125.0, 253.0, 61.0, 25.0, 38.0, 38.0, 25.0, 23.0, 24.0, 15.0, 11.0, 11.0, 8.0, 7.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1572265625, -0.15047836303710938, -0.14373016357421875, -0.13698196411132812, -0.1302337646484375, -0.12348556518554688, -0.11673736572265625, -0.10998916625976562, -0.103240966796875, -0.09649276733398438, -0.08974456787109375, -0.08299636840820312, -0.0762481689453125, -0.06949996948242188, -0.06275177001953125, -0.056003570556640625, -0.04925537109375, -0.042507171630859375, -0.03575897216796875, -0.029010772705078125, -0.0222625732421875, -0.015514373779296875, -0.00876617431640625, -0.002017974853515625, 0.004730224609375, 0.011478424072265625, 0.01822662353515625, 0.024974822998046875, 0.0317230224609375, 0.038471221923828125, 0.04521942138671875, 0.051967620849609375, 0.0587158203125, 0.06546401977539062, 0.07221221923828125, 0.07896041870117188, 0.0857086181640625, 0.09245681762695312, 0.09920501708984375, 0.10595321655273438, 0.112701416015625, 0.11944961547851562, 0.12619781494140625, 0.13294601440429688, 0.1396942138671875, 0.14644241333007812, 0.15319061279296875, 0.15993881225585938, 0.16668701171875, 0.17343521118164062, 0.18018341064453125, 0.18693161010742188, 0.1936798095703125, 0.20042800903320312, 0.20717620849609375, 0.21392440795898438, 0.220672607421875, 0.22742080688476562, 0.23416900634765625, 0.24091720581054688, 0.2476654052734375, 0.2544136047363281, 0.26116180419921875, 0.2679100036621094, 0.274658203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 8.0, 17.0, 16.0, 25.0, 56.0, 86.0, 264.0, 750.0, 4065.0, 8262953.0, 116026.0, 3163.0, 665.0, 240.0, 105.0, 53.0, 25.0, 14.0, 15.0, 9.0, 10.0, 10.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.584643602371216, -2.4921183586120605, -2.399592876434326, -2.307067632675171, -2.2145423889160156, -2.1220169067382812, -2.029491662979126, -1.9369663000106812, -1.8444409370422363, -1.7519155740737915, -1.6593903303146362, -1.5668649673461914, -1.4743396043777466, -1.3818142414093018, -1.2892889976501465, -1.1967636346817017, -1.1042383909225464, -1.0117130279541016, -0.9191877245903015, -0.8266624212265015, -0.7341370582580566, -0.6416117548942566, -0.5490864515304565, -0.4565610885620117, -0.36403578519821167, -0.27151045203208923, -0.178985133767128, -0.08645981550216675, 0.0060655176639556885, 0.09859085083007812, 0.19111615419387817, 0.283641517162323, 0.37616682052612305, 0.4686921536922455, 0.5612174868583679, 0.653742790222168, 0.7462681531906128, 0.8387934565544128, 0.9313187599182129, 1.0238441228866577, 1.1163694858551025, 1.2088948488235474, 1.3014200925827026, 1.3939454555511475, 1.4864708185195923, 1.578996181488037, 1.6715214252471924, 1.7640467882156372, 1.8565720319747925, 1.9490973949432373, 2.0416226387023926, 2.134148120880127, 2.2266733646392822, 2.3191986083984375, 2.411724090576172, 2.504249334335327, 2.5967745780944824, 2.6892998218536377, 2.781825304031372, 2.8743505477905273, 2.9668757915496826, 3.059401273727417, 3.1519265174865723, 3.2444519996643066, 3.336977243423462]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 5.0, 10.0, 2.0, 6.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 3.0, 5.0, 5.0, 5.0, 7.0, 6.0, 1.0, 0.0, 1.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.9421043395996094, -3.840648651123047, -3.7391929626464844, -3.637737274169922, -3.5362815856933594, -3.434825897216797, -3.3333702087402344, -3.231914520263672, -3.1304588317871094, -3.029003143310547, -2.9275474548339844, -2.826091766357422, -2.7246360778808594, -2.623180389404297, -2.5217247009277344, -2.420269012451172, -2.3188135623931885, -2.217357873916626, -2.1159021854400635, -2.014446496963501, -1.9129908084869385, -1.811535120010376, -1.710079550743103, -1.6086238622665405, -1.507168173789978, -1.4057124853134155, -1.304256796836853, -1.20280122756958, -1.1013455390930176, -0.9998897910118103, -0.8984341621398926, -0.7969784736633301, -0.6955227851867676, -0.5940670967102051, -0.49261143803596497, -0.39115577936172485, -0.28970009088516235, -0.18824440240859985, -0.08678877353668213, 0.014666914939880371, 0.11612260341644287, 0.21757827699184418, 0.3190339505672455, 0.4204896092414856, 0.5219452977180481, 0.6234009861946106, 0.7248566150665283, 0.8263123035430908, 0.9277679920196533, 1.0292236804962158, 1.1306793689727783, 1.2321350574493408, 1.3335907459259033, 1.4350464344024658, 1.5365020036697388, 1.6379576921463013, 1.7394133806228638, 1.8408690690994263, 1.9423247575759888, 2.0437803268432617, 2.145236015319824, 2.2466917037963867, 2.348147392272949, 2.4496030807495117, 2.551058769226074]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 9.0, 11.0, 14.0, 20.0, 25.0, 28.0, 41.0, 46.0, 79.0, 107.0, 211.0, 288.0, 506.0, 1206.0, 3217.0, 9794.0, 33183.0, 120212.0, 227162.0, 90185.0, 25357.0, 7633.0, 2618.0, 1037.0, 489.0, 254.0, 175.0, 98.0, 68.0, 49.0, 32.0, 24.0, 20.0, 21.0, 6.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9892578125, -1.93304443359375, -1.8768310546875, -1.82061767578125, -1.764404296875, -1.70819091796875, -1.6519775390625, -1.59576416015625, -1.53955078125, -1.48333740234375, -1.4271240234375, -1.37091064453125, -1.314697265625, -1.25848388671875, -1.2022705078125, -1.14605712890625, -1.08984375, -1.03363037109375, -0.9774169921875, -0.92120361328125, -0.864990234375, -0.80877685546875, -0.7525634765625, -0.69635009765625, -0.64013671875, -0.58392333984375, -0.5277099609375, -0.47149658203125, -0.415283203125, -0.35906982421875, -0.3028564453125, -0.24664306640625, -0.1904296875, -0.13421630859375, -0.0780029296875, -0.02178955078125, 0.034423828125, 0.09063720703125, 0.1468505859375, 0.20306396484375, 0.25927734375, 0.31549072265625, 0.3717041015625, 0.42791748046875, 0.484130859375, 0.54034423828125, 0.5965576171875, 0.65277099609375, 0.708984375, 0.76519775390625, 0.8214111328125, 0.87762451171875, 0.933837890625, 0.99005126953125, 1.0462646484375, 1.10247802734375, 1.15869140625, 1.21490478515625, 1.2711181640625, 1.32733154296875, 1.383544921875, 1.43975830078125, 1.4959716796875, 1.55218505859375, 1.6083984375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 6.0, 3.0, 10.0, 5.0, 12.0, 16.0, 30.0, 40.0, 54.0, 59.0, 55.0, 72.0, 76.0, 76.0, 101.0, 81.0, 66.0, 50.0, 53.0, 31.0, 27.0, 14.0, 18.0, 6.0, 9.0, 9.0, 8.0, 4.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.3583984375, -0.348358154296875, -0.33831787109375, -0.328277587890625, -0.3182373046875, -0.308197021484375, -0.29815673828125, -0.288116455078125, -0.278076171875, -0.268035888671875, -0.25799560546875, -0.247955322265625, -0.2379150390625, -0.227874755859375, -0.21783447265625, -0.207794189453125, -0.19775390625, -0.187713623046875, -0.17767333984375, -0.167633056640625, -0.1575927734375, -0.147552490234375, -0.13751220703125, -0.127471923828125, -0.117431640625, -0.107391357421875, -0.09735107421875, -0.087310791015625, -0.0772705078125, -0.067230224609375, -0.05718994140625, -0.047149658203125, -0.037109375, -0.027069091796875, -0.01702880859375, -0.006988525390625, 0.0030517578125, 0.013092041015625, 0.02313232421875, 0.033172607421875, 0.043212890625, 0.053253173828125, 0.06329345703125, 0.073333740234375, 0.0833740234375, 0.093414306640625, 0.10345458984375, 0.113494873046875, 0.12353515625, 0.133575439453125, 0.14361572265625, 0.153656005859375, 0.1636962890625, 0.173736572265625, 0.18377685546875, 0.193817138671875, 0.203857421875, 0.213897705078125, 0.22393798828125, 0.233978271484375, 0.2440185546875, 0.254058837890625, 0.26409912109375, 0.274139404296875, 0.2841796875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 10.0, 19.0, 33.0, 81.0, 96.0, 93.0, 67.0, 35.0, 9.0, 12.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.1596553325653076, -3.085617780685425, -3.011580228805542, -2.937542676925659, -2.8635051250457764, -2.7894675731658936, -2.7154300212860107, -2.641392707824707, -2.567355155944824, -2.4933176040649414, -2.4192800521850586, -2.345242500305176, -2.271204948425293, -2.19716739654541, -2.1231298446655273, -2.0490922927856445, -1.9750547409057617, -1.901017189025879, -1.826979637145996, -1.7529420852661133, -1.6789045333862305, -1.6048669815063477, -1.5308295488357544, -1.4567919969558716, -1.3827544450759888, -1.308716893196106, -1.2346793413162231, -1.1606417894363403, -1.086604356765747, -1.0125668048858643, -0.9385292530059814, -0.8644917011260986, -0.7904542684555054, -0.7164167165756226, -0.6423791646957397, -0.5683416724205017, -0.4943041205406189, -0.4202665686607361, -0.34622904658317566, -0.27219152450561523, -0.19815397262573242, -0.1241164356470108, -0.050078898668289185, 0.023958638310432434, 0.09799617528915405, 0.17203372716903687, 0.2460712492465973, 0.3201087713241577, 0.3941463232040405, 0.46818387508392334, 0.5422214269638062, 0.6162589192390442, 0.690296471118927, 0.7643340229988098, 0.8383715152740479, 0.9124090671539307, 0.9864466190338135, 1.0604841709136963, 1.134521722793579, 1.208559274673462, 1.2825968265533447, 1.3566343784332275, 1.4306718111038208, 1.5047093629837036, 1.5787469148635864]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 10.0, 15.0, 14.0, 35.0, 55.0, 116.0, 98.0, 50.0, 26.0, 14.0, 11.0, 7.0, 6.0, 1.0, 1.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.063533067703247, -2.007631301879883, -1.951729416847229, -1.8958276510238647, -1.839925765991211, -1.7840240001678467, -1.7281222343444824, -1.6722203493118286, -1.6163185834884644, -1.5604168176651, -1.5045149326324463, -1.448613166809082, -1.3927112817764282, -1.336809515953064, -1.2809076309204102, -1.225005865097046, -1.1691040992736816, -1.1132023334503174, -1.0573004484176636, -1.0013986825942993, -0.9454968571662903, -0.8895950317382812, -0.8336932063102722, -0.7777913808822632, -0.7218894958496094, -0.6659876704216003, -0.6100858449935913, -0.554184079170227, -0.498282253742218, -0.442380428314209, -0.38647860288619995, -0.3305768072605133, -0.27467501163482666, -0.21877320110797882, -0.16287139058113098, -0.10696956515312195, -0.05106775462627411, 0.0048340559005737305, 0.060735881328582764, 0.11663767695426941, 0.17253950238227844, 0.22844131290912628, 0.2843431234359741, 0.34024494886398315, 0.3961467742919922, 0.45204856991767883, 0.5079504251480103, 0.5638521909713745, 0.6197540163993835, 0.6756558418273926, 0.7315576672554016, 0.7874594926834106, 0.8433612585067749, 0.8992630839347839, 0.955164909362793, 1.0110666751861572, 1.066968560218811, 1.1228703260421753, 1.178772211074829, 1.2346739768981934, 1.2905758619308472, 1.3464776277542114, 1.4023795127868652, 1.4582812786102295, 1.5141830444335938]}, "eval/loss": 4.216550350189209, "eval/wer": 2.3908964696548987, "eval/runtime": 932.3753, "eval/samples_per_second": 2.834, "eval/steps_per_second": 0.237, "train/train_runtime": 5668.958, "train/train_samples_per_second": 5.034, "train/train_steps_per_second": 0.105, "train/total_flos": 0.0, "train/train_loss": 4.277455122382553, "_wandb": {"runtime": 6942}} \ No newline at end of file